Add Speaker ID demo for C# (#862)
This commit is contained in:
@@ -222,6 +222,14 @@ namespace SherpaOnnx
|
||||
}
|
||||
}
|
||||
|
||||
public int NumSpeakers
|
||||
{
|
||||
get
|
||||
{
|
||||
return SherpaOnnxOfflineTtsNumSpeakers(_handle.Handle);
|
||||
}
|
||||
}
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxCreateOfflineTts(ref OfflineTtsConfig config);
|
||||
|
||||
@@ -231,6 +239,9 @@ namespace SherpaOnnx
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxOfflineTtsSampleRate(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxOfflineTtsNumSpeakers(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxOfflineTtsGenerate(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string text, int sid, float speed);
|
||||
|
||||
@@ -556,6 +567,112 @@ namespace SherpaOnnx
|
||||
private static extern void Decode(IntPtr handle, IntPtr[] streams, int n);
|
||||
}
|
||||
|
||||
[StructLayout(LayoutKind.Sequential)]
|
||||
public struct SpeakerEmbeddingExtractorConfig
|
||||
{
|
||||
public SpeakerEmbeddingExtractorConfig()
|
||||
{
|
||||
Model = "";
|
||||
NumThreads = 1;
|
||||
Debug = 0;
|
||||
Provider = "cpu";
|
||||
}
|
||||
|
||||
[MarshalAs(UnmanagedType.LPStr)]
|
||||
public string Model;
|
||||
|
||||
public int NumThreads;
|
||||
public int Debug;
|
||||
|
||||
[MarshalAs(UnmanagedType.LPStr)]
|
||||
public string Provider;
|
||||
}
|
||||
|
||||
public class SpeakerEmbeddingExtractor : IDisposable
|
||||
{
|
||||
public SpeakerEmbeddingExtractor(SpeakerEmbeddingExtractorConfig config)
|
||||
{
|
||||
IntPtr h = SherpaOnnxCreateSpeakerEmbeddingExtractor(ref config);
|
||||
_handle = new HandleRef(this, h);
|
||||
}
|
||||
|
||||
public OnlineStream CreateStream()
|
||||
{
|
||||
IntPtr p = SherpaOnnxSpeakerEmbeddingExtractorCreateStream(_handle.Handle);
|
||||
return new OnlineStream(p);
|
||||
}
|
||||
|
||||
public bool IsReady(OnlineStream stream)
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingExtractorIsReady(_handle.Handle, stream.Handle) != 0;
|
||||
}
|
||||
|
||||
public float[] Compute(OnlineStream stream)
|
||||
{
|
||||
IntPtr p = SherpaOnnxSpeakerEmbeddingExtractorComputeEmbedding(_handle.Handle, stream.Handle);
|
||||
|
||||
int dim = Dim;
|
||||
float[] ans = new float[dim];
|
||||
Marshal.Copy(p, ans, 0, dim);
|
||||
|
||||
SherpaOnnxSpeakerEmbeddingExtractorDestroyEmbedding(p);
|
||||
|
||||
return ans;
|
||||
}
|
||||
|
||||
public int Dim
|
||||
{
|
||||
get
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingExtractorDim(_handle.Handle);
|
||||
}
|
||||
}
|
||||
|
||||
public void Dispose()
|
||||
{
|
||||
Cleanup();
|
||||
// Prevent the object from being placed on the
|
||||
// finalization queue
|
||||
System.GC.SuppressFinalize(this);
|
||||
}
|
||||
|
||||
~SpeakerEmbeddingExtractor()
|
||||
{
|
||||
Cleanup();
|
||||
}
|
||||
|
||||
private void Cleanup()
|
||||
{
|
||||
SherpaOnnxDestroySpeakerEmbeddingExtractor(_handle.Handle);
|
||||
|
||||
// Don't permit the handle to be used again.
|
||||
_handle = new HandleRef(this, IntPtr.Zero);
|
||||
}
|
||||
|
||||
private HandleRef _handle;
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxCreateSpeakerEmbeddingExtractor(ref SpeakerEmbeddingExtractorConfig config);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern void SherpaOnnxDestroySpeakerEmbeddingExtractor(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingExtractorDim(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxSpeakerEmbeddingExtractorCreateStream(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingExtractorIsReady(IntPtr handle, IntPtr stream);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxSpeakerEmbeddingExtractorComputeEmbedding(IntPtr handle, IntPtr stream);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern void SherpaOnnxSpeakerEmbeddingExtractorDestroyEmbedding(IntPtr p);
|
||||
}
|
||||
|
||||
[StructLayout(LayoutKind.Sequential)]
|
||||
public struct SpokenLanguageIdentificationWhisperConfig
|
||||
{
|
||||
@@ -593,6 +710,185 @@ namespace SherpaOnnx
|
||||
public string Provider;
|
||||
}
|
||||
|
||||
public class SpeakerEmbeddingManager : IDisposable
|
||||
{
|
||||
public SpeakerEmbeddingManager(int dim)
|
||||
{
|
||||
IntPtr h = SherpaOnnxCreateSpeakerEmbeddingManager(dim);
|
||||
_handle = new HandleRef(this, h);
|
||||
this._dim = dim;
|
||||
}
|
||||
|
||||
public bool Add(string name, float[] v)
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingManagerAdd(_handle.Handle, name, v) == 1;
|
||||
}
|
||||
|
||||
public bool Add(string name, ICollection<float[]> v_list)
|
||||
{
|
||||
int n = v_list.Count;
|
||||
float[] v = new float[n * _dim];
|
||||
int i = 0;
|
||||
foreach (var item in v_list)
|
||||
{
|
||||
item.CopyTo(v, i);
|
||||
i += _dim;
|
||||
}
|
||||
|
||||
return SherpaOnnxSpeakerEmbeddingManagerAddListFlattened(_handle.Handle, name, v, n) == 1;
|
||||
}
|
||||
|
||||
public bool Remove(string name)
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingManagerRemove(_handle.Handle, name) == 1;
|
||||
}
|
||||
|
||||
public string Search(float[] v, float threshold)
|
||||
{
|
||||
IntPtr p = SherpaOnnxSpeakerEmbeddingManagerSearch(_handle.Handle, v, threshold);
|
||||
|
||||
string s = "";
|
||||
int length = 0;
|
||||
|
||||
unsafe
|
||||
{
|
||||
byte* b = (byte*)p;
|
||||
if (b != null)
|
||||
{
|
||||
while (*b != 0)
|
||||
{
|
||||
++b;
|
||||
length += 1;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (length > 0)
|
||||
{
|
||||
byte[] stringBuffer = new byte[length];
|
||||
Marshal.Copy(p, stringBuffer, 0, length);
|
||||
s = Encoding.UTF8.GetString(stringBuffer);
|
||||
}
|
||||
|
||||
SherpaOnnxSpeakerEmbeddingManagerFreeSearch(p);
|
||||
|
||||
return s;
|
||||
}
|
||||
|
||||
public bool Verify(string name, float[] v, float threshold)
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingManagerVerify(_handle.Handle, name, v, threshold) == 1;
|
||||
}
|
||||
|
||||
public bool Contains(string name)
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingManagerContains(_handle.Handle, name) == 1;
|
||||
}
|
||||
|
||||
public string[] GetAllSpeakers()
|
||||
{
|
||||
if (NumSpeakers == 0)
|
||||
{
|
||||
return new string[] { };
|
||||
}
|
||||
|
||||
IntPtr names = SherpaOnnxSpeakerEmbeddingManagerGetAllSpeakers(_handle.Handle);
|
||||
|
||||
string[] ans = new string[NumSpeakers];
|
||||
|
||||
unsafe
|
||||
{
|
||||
byte** p = (byte**)names;
|
||||
for (int i = 0; i != NumSpeakers; i++)
|
||||
{
|
||||
int length = 0;
|
||||
byte* s = p[i];
|
||||
while (*s != 0)
|
||||
{
|
||||
++s;
|
||||
length += 1;
|
||||
}
|
||||
byte[] stringBuffer = new byte[length];
|
||||
Marshal.Copy((IntPtr)p[i], stringBuffer, 0, length);
|
||||
ans[i] = Encoding.UTF8.GetString(stringBuffer);
|
||||
}
|
||||
}
|
||||
|
||||
SherpaOnnxSpeakerEmbeddingManagerFreeAllSpeakers(names);
|
||||
|
||||
return ans;
|
||||
}
|
||||
|
||||
public void Dispose()
|
||||
{
|
||||
Cleanup();
|
||||
// Prevent the object from being placed on the
|
||||
// finalization queue
|
||||
System.GC.SuppressFinalize(this);
|
||||
}
|
||||
|
||||
~SpeakerEmbeddingManager()
|
||||
{
|
||||
Cleanup();
|
||||
}
|
||||
|
||||
private void Cleanup()
|
||||
{
|
||||
SherpaOnnxDestroySpeakerEmbeddingManager(_handle.Handle);
|
||||
|
||||
// Don't permit the handle to be used again.
|
||||
_handle = new HandleRef(this, IntPtr.Zero);
|
||||
}
|
||||
|
||||
public int NumSpeakers
|
||||
{
|
||||
get
|
||||
{
|
||||
return SherpaOnnxSpeakerEmbeddingManagerNumSpeakers(_handle.Handle);
|
||||
}
|
||||
}
|
||||
|
||||
private HandleRef _handle;
|
||||
private int _dim;
|
||||
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxCreateSpeakerEmbeddingManager(int dim);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern void SherpaOnnxDestroySpeakerEmbeddingManager(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingManagerAdd(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string name, float[] v);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingManagerAddListFlattened(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string name, float[] v, int n);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingManagerRemove(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string name);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxSpeakerEmbeddingManagerSearch(IntPtr handle, float[] v, float threshold);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern void SherpaOnnxSpeakerEmbeddingManagerFreeSearch(IntPtr p);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingManagerVerify(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string name, float[] v, float threshold);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingManagerContains(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string name);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern int SherpaOnnxSpeakerEmbeddingManagerNumSpeakers(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern IntPtr SherpaOnnxSpeakerEmbeddingManagerGetAllSpeakers(IntPtr handle);
|
||||
|
||||
[DllImport(Dll.Filename)]
|
||||
private static extern void SherpaOnnxSpeakerEmbeddingManagerFreeAllSpeakers(IntPtr names);
|
||||
}
|
||||
|
||||
public class SpokenLanguageIdentificationResult
|
||||
{
|
||||
public SpokenLanguageIdentificationResult(IntPtr handle)
|
||||
|
||||
Reference in New Issue
Block a user