260 lines
6.5 KiB
C#
260 lines
6.5 KiB
C#
/// Copyright (c) 2023 Xiaomi Corporation (authors: Fangjun Kuang)
|
|
/// Copyright (c) 2023 by manyeyes
|
|
|
|
using System.Linq;
|
|
using System.Collections.Generic;
|
|
using System.Runtime.InteropServices;
|
|
using System;
|
|
|
|
namespace SherpaOnnx
|
|
{
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
public struct OfflineTransducerModelConfig
|
|
{
|
|
public OfflineTransducerModelConfig()
|
|
{
|
|
Encoder = "";
|
|
Decoder = "";
|
|
Joiner = "";
|
|
}
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Encoder;
|
|
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Decoder;
|
|
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Joiner;
|
|
}
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
public struct OfflineParaformerModelConfig
|
|
{
|
|
public OfflineParaformerModelConfig()
|
|
{
|
|
Model = "";
|
|
}
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Model;
|
|
}
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
public struct OfflineNemoEncDecCtcModelConfig
|
|
{
|
|
public OfflineNemoEncDecCtcModelConfig()
|
|
{
|
|
Model = "";
|
|
}
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Model;
|
|
}
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
public struct OfflineLMConfig
|
|
{
|
|
public OfflineLMConfig()
|
|
{
|
|
Model = "";
|
|
Scale = 0.5F;
|
|
}
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Model;
|
|
|
|
public float Scale;
|
|
}
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
public struct OfflineModelConfig
|
|
{
|
|
public OfflineModelConfig()
|
|
{
|
|
Transducer = new OfflineTransducerModelConfig();
|
|
Paraformer = new OfflineParaformerModelConfig();
|
|
NeMoCtc = new OfflineNemoEncDecCtcModelConfig();
|
|
Tokens = "";
|
|
NumThreads = 1;
|
|
Debug = 0;
|
|
}
|
|
public OfflineTransducerModelConfig Transducer;
|
|
public OfflineParaformerModelConfig Paraformer;
|
|
public OfflineNemoEncDecCtcModelConfig NeMoCtc;
|
|
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string Tokens;
|
|
|
|
public int NumThreads;
|
|
|
|
public int Debug;
|
|
}
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
public struct OfflineRecognizerConfig
|
|
{
|
|
public OfflineRecognizerConfig()
|
|
{
|
|
FeatConfig = new FeatureConfig();
|
|
ModelConfig = new OfflineModelConfig();
|
|
LmConfig = new OfflineLMConfig();
|
|
|
|
DecodingMethod = "greedy_search";
|
|
MaxActivePaths = 4;
|
|
|
|
}
|
|
public FeatureConfig FeatConfig;
|
|
public OfflineModelConfig ModelConfig;
|
|
public OfflineLMConfig LmConfig;
|
|
|
|
[MarshalAs(UnmanagedType.LPStr)]
|
|
public string DecodingMethod;
|
|
|
|
public int MaxActivePaths;
|
|
}
|
|
|
|
public class OfflineRecognizerResult
|
|
{
|
|
public OfflineRecognizerResult(IntPtr handle)
|
|
{
|
|
Impl impl = (Impl)Marshal.PtrToStructure(handle, typeof(Impl));
|
|
_text = Marshal.PtrToStringUTF8(impl.Text);
|
|
}
|
|
|
|
[StructLayout(LayoutKind.Sequential)]
|
|
struct Impl
|
|
{
|
|
public IntPtr Text;
|
|
}
|
|
|
|
private String _text;
|
|
public String Text => _text;
|
|
}
|
|
|
|
public class OfflineStream : IDisposable
|
|
{
|
|
public OfflineStream(IntPtr p)
|
|
{
|
|
_handle = new HandleRef(this, p);
|
|
}
|
|
|
|
public void AcceptWaveform(int sampleRate, float[] samples)
|
|
{
|
|
AcceptWaveform(Handle, sampleRate, samples, samples.Length);
|
|
}
|
|
|
|
public OfflineRecognizerResult Result
|
|
{
|
|
get
|
|
{
|
|
IntPtr h = GetResult(_handle.Handle);
|
|
OfflineRecognizerResult result = new OfflineRecognizerResult(h);
|
|
DestroyResult(h);
|
|
return result;
|
|
}
|
|
}
|
|
|
|
~OfflineStream()
|
|
{
|
|
Cleanup();
|
|
}
|
|
|
|
public void Dispose()
|
|
{
|
|
Cleanup();
|
|
// Prevent the object from being placed on the
|
|
// finalization queue
|
|
System.GC.SuppressFinalize(this);
|
|
}
|
|
|
|
private void Cleanup()
|
|
{
|
|
DestroyOfflineStream(Handle);
|
|
|
|
// Don't permit the handle to be used again.
|
|
_handle = new HandleRef(this, IntPtr.Zero);
|
|
}
|
|
|
|
private HandleRef _handle;
|
|
public IntPtr Handle => _handle.Handle;
|
|
|
|
[DllImport(Dll.Filename)]
|
|
private static extern void DestroyOfflineStream(IntPtr handle);
|
|
|
|
[DllImport(Dll.Filename, EntryPoint = "AcceptWaveformOffline")]
|
|
private static extern void AcceptWaveform(IntPtr handle, int sampleRate, float[] samples, int n);
|
|
|
|
[DllImport(Dll.Filename, EntryPoint = "GetOfflineStreamResult")]
|
|
private static extern IntPtr GetResult(IntPtr handle);
|
|
|
|
[DllImport(Dll.Filename, EntryPoint = "DestroyOfflineRecognizerResult")]
|
|
private static extern void DestroyResult(IntPtr handle);
|
|
}
|
|
|
|
public class OfflineRecognizer : IDisposable
|
|
{
|
|
public OfflineRecognizer(OfflineRecognizerConfig config)
|
|
{
|
|
IntPtr h = CreateOfflineRecognizer(ref config);
|
|
_handle = new HandleRef(this, h);
|
|
}
|
|
|
|
public OfflineStream CreateStream()
|
|
{
|
|
IntPtr p = CreateOfflineStream(_handle.Handle);
|
|
return new OfflineStream(p);
|
|
}
|
|
|
|
/// You have to ensure that IsReady(stream) returns true before
|
|
/// you call this method
|
|
public void Decode(OfflineStream stream)
|
|
{
|
|
Decode(_handle.Handle, stream.Handle);
|
|
}
|
|
|
|
// The caller should ensure all passed streams are ready for decoding.
|
|
public void Decode(IEnumerable<OfflineStream> streams)
|
|
{
|
|
IntPtr[] ptrs = streams.Select(s => s.Handle).ToArray();
|
|
Decode(_handle.Handle, ptrs, ptrs.Length);
|
|
}
|
|
|
|
public void Dispose()
|
|
{
|
|
Cleanup();
|
|
// Prevent the object from being placed on the
|
|
// finalization queue
|
|
System.GC.SuppressFinalize(this);
|
|
}
|
|
|
|
~OfflineRecognizer()
|
|
{
|
|
Cleanup();
|
|
}
|
|
|
|
private void Cleanup()
|
|
{
|
|
DestroyOfflineRecognizer(_handle.Handle);
|
|
|
|
// Don't permit the handle to be used again.
|
|
_handle = new HandleRef(this, IntPtr.Zero);
|
|
}
|
|
|
|
private HandleRef _handle;
|
|
|
|
[DllImport(Dll.Filename)]
|
|
private static extern IntPtr CreateOfflineRecognizer(ref OfflineRecognizerConfig config);
|
|
|
|
[DllImport(Dll.Filename)]
|
|
private static extern void DestroyOfflineRecognizer(IntPtr handle);
|
|
|
|
[DllImport(Dll.Filename)]
|
|
private static extern IntPtr CreateOfflineStream(IntPtr handle);
|
|
|
|
[DllImport(Dll.Filename, EntryPoint = "DecodeOfflineStream")]
|
|
private static extern void Decode(IntPtr handle, IntPtr stream);
|
|
|
|
[DllImport(Dll.Filename, EntryPoint = "DecodeMultipleOfflineStreams")]
|
|
private static extern void Decode(IntPtr handle, IntPtr[] streams, int n);
|
|
}
|
|
|
|
}
|