Add tts play example for .Net. (#676)
It plays the generated audio through a speaker while it is still being generated.
This commit is contained in:
2
.github/workflows/build-wheels-aarch64.yaml
vendored
2
.github/workflows/build-wheels-aarch64.yaml
vendored
@@ -24,7 +24,7 @@ jobs:
|
|||||||
matrix:
|
matrix:
|
||||||
os: [ubuntu-latest]
|
os: [ubuntu-latest]
|
||||||
python-version: ["cp37", "cp38", "cp39", "cp310", "cp311", "cp312"]
|
python-version: ["cp37", "cp38", "cp39", "cp310", "cp311", "cp312"]
|
||||||
manylinux: [manylinux2014, manylinux_2_28]
|
manylinux: [manylinux2014] #, manylinux_2_28]
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
|
|||||||
2
.github/workflows/build-wheels-linux.yaml
vendored
2
.github/workflows/build-wheels-linux.yaml
vendored
@@ -24,7 +24,7 @@ jobs:
|
|||||||
matrix:
|
matrix:
|
||||||
os: [ubuntu-latest]
|
os: [ubuntu-latest]
|
||||||
python-version: ["cp37", "cp38", "cp39", "cp310", "cp311", "cp312"]
|
python-version: ["cp37", "cp38", "cp39", "cp310", "cp311", "cp312"]
|
||||||
manylinux: [manylinux2014, manylinux_2_28]
|
manylinux: [manylinux2014] #, manylinux_2_28]
|
||||||
|
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
|
|||||||
2
.github/workflows/build-wheels-win32.yaml
vendored
2
.github/workflows/build-wheels-win32.yaml
vendored
@@ -43,8 +43,6 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
ls -lh ./wheelhouse/
|
ls -lh ./wheelhouse/
|
||||||
|
|
||||||
ls -lh ./wheelhouse/*.whl
|
|
||||||
|
|
||||||
- uses: actions/upload-artifact@v4
|
- uses: actions/upload-artifact@v4
|
||||||
with:
|
with:
|
||||||
name: wheel-${{ matrix.python-version }}
|
name: wheel-${{ matrix.python-version }}
|
||||||
|
|||||||
@@ -6,4 +6,14 @@ Please refer to the documentation
|
|||||||
https://k2-fsa.github.io/sherpa/onnx/csharp-api/index.html
|
https://k2-fsa.github.io/sherpa/onnx/csharp-api/index.html
|
||||||
for details.
|
for details.
|
||||||
|
|
||||||
|
```bash
|
||||||
|
dotnet new console -n offline-tts-play
|
||||||
|
dotnet sln ./sherpa-onnx.sln add ./offline-tts-play
|
||||||
|
```
|
||||||
|
|
||||||
|
```bash
|
||||||
|
dotnet nuget locals all --list
|
||||||
|
dotnet nuget locals all --clear
|
||||||
|
```
|
||||||
|
|
||||||
[sherpa-onnx]: https://github.com/k2-fsa/sherpa-onnx
|
[sherpa-onnx]: https://github.com/k2-fsa/sherpa-onnx
|
||||||
|
|||||||
1
dotnet-examples/offline-tts-play/.gitignore
vendored
Normal file
1
dotnet-examples/offline-tts-play/.gitignore
vendored
Normal file
@@ -0,0 +1 @@
|
|||||||
|
run-piper.sh
|
||||||
285
dotnet-examples/offline-tts-play/Program.cs
Normal file
285
dotnet-examples/offline-tts-play/Program.cs
Normal file
@@ -0,0 +1,285 @@
|
|||||||
|
// Copyright (c) 2024 Xiaomi Corporation
|
||||||
|
//
|
||||||
|
// This file shows how to use a non-streaming TTS model for text-to-speech
|
||||||
|
// Please refer to
|
||||||
|
// https://k2-fsa.github.io/sherpa/onnx/pretrained_models/index.html
|
||||||
|
// and
|
||||||
|
// https://github.com/k2-fsa/sherpa-onnx/releases/tag/tts-models
|
||||||
|
// to download pre-trained models
|
||||||
|
//
|
||||||
|
// Note that you need a speaker to run this file since it will play
|
||||||
|
// the generated audio while it is still being generated.
|
||||||
|
|
||||||
|
using CommandLine.Text;
|
||||||
|
using CommandLine;
|
||||||
|
using PortAudioSharp;
|
||||||
|
using SherpaOnnx;
|
||||||
|
using System.Collections.Concurrent;
|
||||||
|
using System.Collections.Generic;
|
||||||
|
using System.Runtime.InteropServices;
|
||||||
|
using System.Threading;
|
||||||
|
using System;
|
||||||
|
|
||||||
|
class OfflineTtsPlayDemo
|
||||||
|
{
|
||||||
|
/// <summary>
/// Command-line options of this example. Every property is bound by
/// CommandLineParser through its <c>[Option]</c> attribute; the property
/// initializers mirror the declared defaults so that no string property is
/// ever left null (the project enables nullable reference types).
/// </summary>
class Options
{
    [Option("tts-rule-fsts", Required = false, Default = "", HelpText = "path to rule.fst")]
    public string RuleFsts { get; set; } = "";

    [Option("vits-data-dir", Required = false, Default = "", HelpText = "Path to the directory containing dict for espeak-ng.")]
    public string DataDir { get; set; } = "";

    // The default is written as a float literal so that it has the same type
    // as the property it is assigned to.
    [Option("vits-length-scale", Required = false, Default = 1f, HelpText = "speech speed. Larger->Slower; Smaller->faster")]
    public float LengthScale { get; set; } = 1f;

    [Option("vits-noise-scale", Required = false, Default = 0.667f, HelpText = "noise_scale for VITS models")]
    public float NoiseScale { get; set; } = 0.667f;

    [Option("vits-noise-scale-w", Required = false, Default = 0.8f, HelpText = "noise_scale_w for VITS models")]
    public float NoiseScaleW { get; set; } = 0.8f;

    [Option("vits-lexicon", Required = false, Default = "", HelpText = "Path to lexicon.txt")]
    public string Lexicon { get; set; } = "";

    [Option("vits-tokens", Required = false, Default = "", HelpText = "Path to tokens.txt")]
    public string Tokens { get; set; } = "";

    [Option("tts-max-num-sentences", Required = false, Default = 1, HelpText = "Maximum number of sentences that we process at a time.")]
    public int MaxNumSentences { get; set; } = 1;

    // Named explicitly (the usage text passes --debug=1) instead of relying on
    // the name being derived from the property.
    [Option("debug", Required = false, Default = 0, HelpText = "1 to show debug messages.")]
    public int Debug { get; set; }

    [Option("vits-model", Required = true, HelpText = "Path to VITS model")]
    public string Model { get; set; } = "";

    [Option("sid", Required = false, Default = 0, HelpText = "Speaker ID")]
    public int SpeakerId { get; set; }

    [Option("text", Required = true, HelpText = "Text to synthesize")]
    public string Text { get; set; } = "";

    // Optional: a required option with a default value is contradictory, since
    // the default could never be used. Omitting the flag now falls back to
    // ./generated.wav.
    [Option("output-filename", Required = false, Default = "./generated.wav", HelpText = "Path to save the generated audio")]
    public string OutputFilename { get; set; } = "./generated.wav";
}
|
||||||
|
|
||||||
|
/// <summary>
/// Entry point: parses the command line into <see cref="Options"/> and either
/// runs the demo or prints the help text when parsing fails.
/// </summary>
/// <param name="args">Raw command-line arguments.</param>
static void Main(string[] args)
{
    // The built-in help writer is switched off; DisplayHelp prints the help instead.
    var cliParser = new CommandLine.Parser(settings => settings.HelpWriter = null);
    ParserResult<Options> parsed = cliParser.ParseArguments<Options>(args);

    parsed.WithParsed<Options>(Run);
    parsed.WithNotParsed(errors => DisplayHelp(parsed, errors));
}
|
||||||
|
|
||||||
|
/// <summary>
/// Prints the help text for a failed parse: example invocations as the
/// heading, followed by the option list and parsing errors produced by
/// CommandLineParser.
/// </summary>
/// <param name="result">The parser result that failed to parse.</param>
/// <param name="errs">The parsing errors (unused; the help builder reads them from <paramref name="result"/>).</param>
private static void DisplayHelp<T>(ParserResult<T> result, IEnumerable<Error> errs)
{
    string examples = @"
# vits-aishell3

wget -qq https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/vits-zh-aishell3.tar.bz2
tar xf vits-zh-aishell3.tar.bz2

dotnet run \
--vits-model=./vits-zh-aishell3/vits-aishell3.onnx \
--vits-tokens=./vits-zh-aishell3/tokens.txt \
--vits-lexicon=./vits-zh-aishell3/lexicon.txt \
--tts-rule-fsts=./vits-zh-aishell3/rule.fst \
--sid=66 \
--debug=1 \
--output-filename=./aishell3-66.wav \
--text=这是一个语音合成测试

# Piper models

wget -qq https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/vits-piper-en_US-amy-low.tar.bz2
tar xf vits-piper-en_US-amy-low.tar.bz2

dotnet run \
--vits-model=./vits-piper-en_US-amy-low/en_US-amy-low.onnx \
--vits-tokens=./vits-piper-en_US-amy-low/tokens.txt \
--vits-data-dir=./vits-piper-en_US-amy-low/espeak-ng-data \
--debug=1 \
--output-filename=./amy.wav \
--text='This is a text to speech application in dotnet with Next Generation Kaldi'

Please refer to
https://k2-fsa.github.io/sherpa/onnx/tts/pretrained_models/index.html
to download more models.
";

    // Applies this demo's heading and copyright, then lets the library append
    // its default rendering of the parsing errors.
    HelpText Customize(HelpText help)
    {
        help.AdditionalNewLineAfterOption = false;
        help.Heading = examples;
        help.Copyright = "Copyright (c) 2024 Xiaomi Corporation";
        return HelpText.DefaultParsingErrorsHandler(result, help);
    }

    var rendered = HelpText.AutoBuild(result, Customize, example => example);
    Console.WriteLine(rendered);
}
|
||||||
|
|
||||||
|
|
||||||
|
/// <summary>
/// Synthesizes <c>options.Text</c> with a VITS model, plays the audio on the
/// default output device while synthesis is still running, saves the complete
/// waveform to <c>options.OutputFilename</c>, and returns once playback has
/// drained.
/// </summary>
/// <param name="options">Parsed command-line options.</param>
private static void Run(Options options)
{
    OfflineTtsConfig config = new OfflineTtsConfig();
    config.Model.Vits.Model = options.Model;
    config.Model.Vits.Lexicon = options.Lexicon;
    config.Model.Vits.Tokens = options.Tokens;
    config.Model.Vits.DataDir = options.DataDir;
    config.Model.Vits.NoiseScale = options.NoiseScale;
    config.Model.Vits.NoiseScaleW = options.NoiseScaleW;
    config.Model.Vits.LengthScale = options.LengthScale;
    config.Model.NumThreads = 1;
    config.Model.Debug = options.Debug;
    config.Model.Provider = "cpu";
    config.RuleFsts = options.RuleFsts;
    config.MaxNumSentences = options.MaxNumSentences;

    // OfflineTts is IDisposable: release it when this method returns.
    using OfflineTts tts = new OfflineTts(config);
    float speed = 1.0f / options.LengthScale;
    int sid = options.SpeakerId;

    Console.WriteLine(PortAudio.VersionInfo.versionText);
    PortAudio.Initialize();
    Console.WriteLine($"Number of devices: {PortAudio.DeviceCount}");

    for (int i = 0; i != PortAudio.DeviceCount; ++i)
    {
        Console.WriteLine($" Device {i}");
        DeviceInfo deviceInfo = PortAudio.GetDeviceInfo(i);
        Console.WriteLine($" Name: {deviceInfo.name}");
        Console.WriteLine($" Max output channels: {deviceInfo.maxOutputChannels}");
        Console.WriteLine($" Default sample rate: {deviceInfo.defaultSampleRate}");
    }

    int deviceIndex = PortAudio.DefaultOutputDevice;
    if (deviceIndex == PortAudio.NoDevice)
    {
        Console.WriteLine("No default output device found. Please use ../offline-tts instead");
        Environment.Exit(1);
    }

    DeviceInfo info = PortAudio.GetDeviceInfo(deviceIndex);
    Console.WriteLine();
    Console.WriteLine($"Use output default device {deviceIndex} ({info.name})");

    StreamParameters param = new StreamParameters();
    param.device = deviceIndex;
    param.channelCount = 1;
    param.sampleFormat = SampleFormat.Float32;
    param.suggestedLatency = info.defaultLowOutputLatency;
    param.hostApiSpecificStreamInfo = IntPtr.Zero;

    // Queue of generated chunks: filled by the synthesis callback, drained by
    // the playback callback.
    // https://learn.microsoft.com/en-us/dotnet/standard/collections/thread-safe/blockingcollection-overview
    BlockingCollection<float[]> dataItems = new BlockingCollection<float[]>();

    // Called with each newly generated chunk of `n` float samples. The samples
    // are copied into managed memory before queueing.
    // NOTE(review): presumably the native buffer is only valid during the
    // callback - confirm against the C API.
    OfflineTtsCallback callback = (IntPtr samples, int n) =>
    {
        float[] data = new float[n];
        Marshal.Copy(samples, data, 0, n);
        dataItems.Add(data);
    };

    // Set by the playback callback, polled by this thread; accessed through
    // Volatile so the write is guaranteed to become visible to the poll loop.
    bool playFinished = false;

    // Chunk currently being played and the index of its first unplayed sample.
    float[]? pending = null;
    int pendingOffset = 0;

    // Fills output[start, end) with zeros (silence); sample format is Float32, mono.
    static void WriteSilence(IntPtr output, int start, int end)
    {
        int count = end - start;
        if (count <= 0)
        {
            return;
        }

        Marshal.Copy(new float[count], 0, IntPtr.Add(output, start * sizeof(float)), count);
    }

    PortAudioSharp.Stream.Callback playCallback = (IntPtr input, IntPtr output,
        UInt32 frameCount,
        ref StreamCallbackTimeInfo timeInfo,
        StreamCallbackFlags statusFlags,
        IntPtr userData) =>
    {
        int expected = Convert.ToInt32(frameCount);

        if (dataItems.IsCompleted && pending == null)
        {
            // The buffer handed to the final callback may still be played, so
            // fill it with silence instead of leaving it unwritten.
            WriteSilence(output, 0, expected);
            Console.WriteLine($"Finished playing");
            Volatile.Write(ref playFinished, true);
            return StreamCallbackResult.Complete;
        }

        int written = 0;
        while (written < expected)
        {
            if (pending == null)
            {
                // Never block inside the audio callback: stop when nothing is queued yet.
                if (!dataItems.TryTake(out pending))
                {
                    break;
                }

                pendingOffset = 0;
            }

            int count = Math.Min(pending.Length - pendingOffset, expected - written);

            // Copy straight from the chunk at its current offset; no temporary arrays.
            Marshal.Copy(pending, pendingOffset, IntPtr.Add(output, written * sizeof(float)), count);
            written += count;
            pendingOffset += count;

            if (pendingOffset == pending.Length)
            {
                pending = null;
                pendingOffset = 0;
            }
        }

        // Synthesis has not produced enough samples yet: pad with silence.
        WriteSilence(output, written, expected);

        return StreamCallbackResult.Continue;
    };

    PortAudioSharp.Stream stream = new PortAudioSharp.Stream(inParams: null, outParams: param, sampleRate: tts.SampleRate,
        framesPerBuffer: 0,
        streamFlags: StreamFlags.ClipOff,
        callback: playCallback,
        userData: IntPtr.Zero
        );

    stream.Start();

    OfflineTtsGeneratedAudio audio = tts.GenerateWithCallback(options.Text, speed, sid, callback);
    bool ok = audio.SaveToWaveFile(options.OutputFilename);

    if (ok)
    {
        Console.WriteLine($"Wrote to {options.OutputFilename} succeeded!");
    }
    else
    {
        Console.WriteLine($"Failed to write {options.OutputFilename}");
    }

    // No more chunks will arrive; the playback callback finishes once the queue is drained.
    dataItems.CompleteAdding();

    while (!Volatile.Read(ref playFinished))
    {
        Thread.Sleep(100); // 100ms
    }
}
|
||||||
|
}
|
||||||
21
dotnet-examples/offline-tts-play/offline-tts-play.csproj
Normal file
21
dotnet-examples/offline-tts-play/offline-tts-play.csproj
Normal file
@@ -0,0 +1,21 @@
|
|||||||
|
<Project Sdk="Microsoft.NET.Sdk">
|
||||||
|
|
||||||
|
<PropertyGroup>
|
||||||
|
<OutputType>Exe</OutputType>
|
||||||
|
<TargetFramework>net6.0</TargetFramework>
|
||||||
|
<RootNamespace>offline_tts_play</RootNamespace>
|
||||||
|
<ImplicitUsings>enable</ImplicitUsings>
|
||||||
|
<Nullable>enable</Nullable>
|
||||||
|
</PropertyGroup>
|
||||||
|
|
||||||
|
<PropertyGroup>
|
||||||
|
<RestoreSources>/tmp/packages;$(RestoreSources);https://api.nuget.org/v3/index.json</RestoreSources>
|
||||||
|
</PropertyGroup>
|
||||||
|
|
||||||
|
<ItemGroup>
|
||||||
|
<PackageReference Include="CommandLineParser" Version="2.9.1" />
|
||||||
|
<PackageReference Include="org.k2fsa.sherpa.onnx" Version="*" />
|
||||||
|
<PackageReference Include="PortAudioSharp2" Version="*" />
|
||||||
|
</ItemGroup>
|
||||||
|
|
||||||
|
</Project>
|
||||||
@@ -11,6 +11,8 @@ Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "speech-recognition-from-mic
|
|||||||
EndProject
|
EndProject
|
||||||
Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "offline-tts", "offline-tts\offline-tts.csproj", "{72196886-7143-4043-96E2-BCACEC6C79EB}"
|
Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "offline-tts", "offline-tts\offline-tts.csproj", "{72196886-7143-4043-96E2-BCACEC6C79EB}"
|
||||||
EndProject
|
EndProject
|
||||||
|
Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "offline-tts-play", "offline-tts-play\offline-tts-play.csproj", "{40781464-5948-462B-BA4B-98932711513F}"
|
||||||
|
EndProject
|
||||||
Global
|
Global
|
||||||
GlobalSection(SolutionConfigurationPlatforms) = preSolution
|
GlobalSection(SolutionConfigurationPlatforms) = preSolution
|
||||||
Debug|Any CPU = Debug|Any CPU
|
Debug|Any CPU = Debug|Any CPU
|
||||||
@@ -36,5 +38,9 @@ Global
|
|||||||
{72196886-7143-4043-96E2-BCACEC6C79EB}.Debug|Any CPU.Build.0 = Debug|Any CPU
|
{72196886-7143-4043-96E2-BCACEC6C79EB}.Debug|Any CPU.Build.0 = Debug|Any CPU
|
||||||
{72196886-7143-4043-96E2-BCACEC6C79EB}.Release|Any CPU.ActiveCfg = Release|Any CPU
|
{72196886-7143-4043-96E2-BCACEC6C79EB}.Release|Any CPU.ActiveCfg = Release|Any CPU
|
||||||
{72196886-7143-4043-96E2-BCACEC6C79EB}.Release|Any CPU.Build.0 = Release|Any CPU
|
{72196886-7143-4043-96E2-BCACEC6C79EB}.Release|Any CPU.Build.0 = Release|Any CPU
|
||||||
|
{40781464-5948-462B-BA4B-98932711513F}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
|
||||||
|
{40781464-5948-462B-BA4B-98932711513F}.Debug|Any CPU.Build.0 = Debug|Any CPU
|
||||||
|
{40781464-5948-462B-BA4B-98932711513F}.Release|Any CPU.ActiveCfg = Release|Any CPU
|
||||||
|
{40781464-5948-462B-BA4B-98932711513F}.Release|Any CPU.Build.0 = Release|Any CPU
|
||||||
EndGlobalSection
|
EndGlobalSection
|
||||||
EndGlobal
|
EndGlobal
|
||||||
|
|||||||
21
scripts/dotnet/examples/offline-tts-play.csproj
Normal file
21
scripts/dotnet/examples/offline-tts-play.csproj
Normal file
@@ -0,0 +1,21 @@
|
|||||||
|
<Project Sdk="Microsoft.NET.Sdk">
|
||||||
|
|
||||||
|
<PropertyGroup>
|
||||||
|
<OutputType>Exe</OutputType>
|
||||||
|
<TargetFramework>net6.0</TargetFramework>
|
||||||
|
<RootNamespace>offline_tts_play</RootNamespace>
|
||||||
|
<ImplicitUsings>enable</ImplicitUsings>
|
||||||
|
<Nullable>enable</Nullable>
|
||||||
|
</PropertyGroup>
|
||||||
|
|
||||||
|
<PropertyGroup>
|
||||||
|
<RestoreSources>/tmp/packages;$(RestoreSources);https://api.nuget.org/v3/index.json</RestoreSources>
|
||||||
|
</PropertyGroup>
|
||||||
|
|
||||||
|
<ItemGroup>
|
||||||
|
<PackageReference Include="CommandLineParser" Version="2.9.1" />
|
||||||
|
<PackageReference Include="org.k2fsa.sherpa.onnx" Version="*" />
|
||||||
|
<PackageReference Include="PortAudioSharp2" Version="*" />
|
||||||
|
</ItemGroup>
|
||||||
|
|
||||||
|
</Project>
|
||||||
@@ -159,6 +159,9 @@ namespace SherpaOnnx
|
|||||||
private static extern int SherpaOnnxWriteWave(IntPtr samples, int n, int sample_rate, [MarshalAs(UnmanagedType.LPStr)] string filename);
|
private static extern int SherpaOnnxWriteWave(IntPtr samples, int n, int sample_rate, [MarshalAs(UnmanagedType.LPStr)] string filename);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Callback passed to the native TTS generate-with-callback function.
// `samples` is actually a `const float*` from C++ and `n` is the number of
// floats it points to.
//
// The P/Invoke that receives this delegate is declared with
// CallingConvention.Cdecl, so the delegate is marked Cdecl as well; without
// the attribute the platform default would be used for the native-to-managed
// thunk, which differs from cdecl on 32-bit Windows.
[UnmanagedFunctionPointer(CallingConvention.Cdecl)]
public delegate void OfflineTtsCallback(IntPtr samples, int n);
|
||||||
|
|
||||||
public class OfflineTts : IDisposable
|
public class OfflineTts : IDisposable
|
||||||
{
|
{
|
||||||
public OfflineTts(OfflineTtsConfig config)
|
public OfflineTts(OfflineTtsConfig config)
|
||||||
@@ -173,6 +176,12 @@ namespace SherpaOnnx
|
|||||||
return new OfflineTtsGeneratedAudio(p);
|
return new OfflineTtsGeneratedAudio(p);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// <summary>
/// Generates speech for <paramref name="text"/> and passes
/// <paramref name="callback"/> to the native generator together with the text.
/// </summary>
/// <param name="text">Text to synthesize.</param>
/// <param name="speed">Speech speed passed through to the native generator.</param>
/// <param name="speakerId">Speaker ID passed through to the native generator.</param>
/// <param name="callback">Delegate receiving a pointer to float samples and their count.</param>
/// <returns>A wrapper around the native generated-audio handle.</returns>
/// <exception cref="ArgumentNullException">
/// <paramref name="text"/> or <paramref name="callback"/> is null.
/// </exception>
public OfflineTtsGeneratedAudio GenerateWithCallback(String text, float speed, int speakerId, OfflineTtsCallback callback)
{
    // Fail in managed code rather than handing null pointers to native code.
    if (text == null)
    {
        throw new ArgumentNullException(nameof(text));
    }

    if (callback == null)
    {
        throw new ArgumentNullException(nameof(callback));
    }

    // The native signature takes the speaker id before the speed.
    IntPtr p = SherpaOnnxOfflineTtsGenerateWithCallback(_handle.Handle, text, speakerId, speed, callback);

    // Keep the delegate reachable until the native call has returned.
    GC.KeepAlive(callback);

    return new OfflineTtsGeneratedAudio(p);
}
|
||||||
|
|
||||||
public void Dispose()
|
public void Dispose()
|
||||||
{
|
{
|
||||||
Cleanup();
|
Cleanup();
|
||||||
@@ -215,6 +224,9 @@ namespace SherpaOnnx
|
|||||||
|
|
||||||
[DllImport(Dll.Filename)]
|
[DllImport(Dll.Filename)]
|
||||||
private static extern IntPtr SherpaOnnxOfflineTtsGenerate(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string text, int sid, float speed);
|
private static extern IntPtr SherpaOnnxOfflineTtsGenerate(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string text, int sid, float speed);
|
||||||
|
|
||||||
|
// P/Invoke binding for the native generate-with-callback entry point.
// Argument order is (handle, text, sid, speed, callback); the return value is
// an opaque pointer that the caller wraps in OfflineTtsGeneratedAudio.
// NOTE(review): `text` is marshalled as LPStr, which uses the system ANSI code
// page on Windows. If the native side expects UTF-8, non-ASCII text (e.g.
// Chinese) would be garbled there - confirm.
[DllImport(Dll.Filename, CallingConvention = CallingConvention.Cdecl)]
|
||||||
|
private static extern IntPtr SherpaOnnxOfflineTtsGenerateWithCallback(IntPtr handle, [MarshalAs(UnmanagedType.LPStr)] string text, int sid, float speed, OfflineTtsCallback callback);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@@ -10,6 +10,9 @@ echo "SHERPA_ONNX_DIR: $SHERPA_ONNX_DIR"
|
|||||||
|
|
||||||
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" $SHERPA_ONNX_DIR/CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" $SHERPA_ONNX_DIR/CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
||||||
|
|
||||||
|
# HF_MIRROR=hf-mirror.com
|
||||||
|
HF_MIRROR=hf.co
|
||||||
|
|
||||||
mkdir -p /tmp/
|
mkdir -p /tmp/
|
||||||
pushd /tmp
|
pushd /tmp
|
||||||
|
|
||||||
@@ -18,7 +21,7 @@ mkdir -p linux macos windows
|
|||||||
# You can pre-download the required wheels to /tmp
|
# You can pre-download the required wheels to /tmp
|
||||||
src_dir=/tmp
|
src_dir=/tmp
|
||||||
|
|
||||||
linux_wheel=$src_dir/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_x86_64.whl
|
linux_wheel=$src_dir/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
|
||||||
macos_wheel=$src_dir/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-macosx_11_0_x86_64.whl
|
macos_wheel=$src_dir/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-macosx_11_0_x86_64.whl
|
||||||
windows_wheel=$src_dir/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-win_amd64.whl
|
windows_wheel=$src_dir/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-win_amd64.whl
|
||||||
|
|
||||||
@@ -30,9 +33,9 @@ if [ ! -f /tmp/linux/libsherpa-onnx-core.so ]; then
|
|||||||
if [ -f $linux_wheel ]; then
|
if [ -f $linux_wheel ]; then
|
||||||
cp -v $linux_wheel .
|
cp -v $linux_wheel .
|
||||||
else
|
else
|
||||||
curl -OL https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_x86_64.whl
|
curl -OL https://$HF_MIRROR/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
|
||||||
fi
|
fi
|
||||||
unzip sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_x86_64.whl
|
unzip sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
|
||||||
cp -v sherpa_onnx/lib/*.so* ../
|
cp -v sherpa_onnx/lib/*.so* ../
|
||||||
cd ..
|
cd ..
|
||||||
rm -v libpiper_phonemize.so libpiper_phonemize.so.1.2.0
|
rm -v libpiper_phonemize.so libpiper_phonemize.so.1.2.0
|
||||||
@@ -52,7 +55,7 @@ if [ ! -f /tmp/macos/libsherpa-onnx-core.dylib ]; then
|
|||||||
if [ -f $macos_wheel ]; then
|
if [ -f $macos_wheel ]; then
|
||||||
cp -v $macos_wheel .
|
cp -v $macos_wheel .
|
||||||
else
|
else
|
||||||
curl -OL https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-macosx_11_0_x86_64.whl
|
curl -OL https://$HF_MIRROR/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-macosx_11_0_x86_64.whl
|
||||||
fi
|
fi
|
||||||
unzip sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-macosx_11_0_x86_64.whl
|
unzip sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-macosx_11_0_x86_64.whl
|
||||||
cp -v sherpa_onnx/lib/*.dylib ../
|
cp -v sherpa_onnx/lib/*.dylib ../
|
||||||
@@ -69,7 +72,7 @@ if [ ! -f /tmp/macos/libsherpa-onnx-core.dylib ]; then
|
|||||||
fi
|
fi
|
||||||
|
|
||||||
|
|
||||||
if [ ! -f /tmp/windows/libsherpa-onnx-core.dll ]; then
|
if [ ! -f /tmp/windows/sherpa-onnx-core.dll ]; then
|
||||||
echo "---windows x64---"
|
echo "---windows x64---"
|
||||||
cd windows
|
cd windows
|
||||||
mkdir -p wheel
|
mkdir -p wheel
|
||||||
@@ -77,7 +80,7 @@ if [ ! -f /tmp/windows/libsherpa-onnx-core.dll ]; then
|
|||||||
if [ -f $windows_wheel ]; then
|
if [ -f $windows_wheel ]; then
|
||||||
cp -v $windows_wheel .
|
cp -v $windows_wheel .
|
||||||
else
|
else
|
||||||
curl -OL https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-win_amd64.whl
|
curl -OL https://$HF_MIRROR/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-win_amd64.whl
|
||||||
fi
|
fi
|
||||||
unzip sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-win_amd64.whl
|
unzip sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-win_amd64.whl
|
||||||
cp -v sherpa_onnx-${SHERPA_ONNX_VERSION}.data/data/bin/*.dll ../
|
cp -v sherpa_onnx-${SHERPA_ONNX_VERSION}.data/data/bin/*.dll ../
|
||||||
|
|||||||
@@ -24,8 +24,8 @@ function linux() {
|
|||||||
dst=$(realpath sherpa-onnx-go-linux/lib/x86_64-unknown-linux-gnu)
|
dst=$(realpath sherpa-onnx-go-linux/lib/x86_64-unknown-linux-gnu)
|
||||||
mkdir t
|
mkdir t
|
||||||
cd t
|
cd t
|
||||||
wget -q https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_x86_64.whl
|
wget -q https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
|
||||||
unzip ./sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_x86_64.whl
|
unzip ./sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
|
||||||
|
|
||||||
cp -v sherpa_onnx/lib/*.so* $dst
|
cp -v sherpa_onnx/lib/*.so* $dst
|
||||||
|
|
||||||
@@ -36,8 +36,8 @@ function linux() {
|
|||||||
dst=$(realpath sherpa-onnx-go-linux/lib/aarch64-unknown-linux-gnu)
|
dst=$(realpath sherpa-onnx-go-linux/lib/aarch64-unknown-linux-gnu)
|
||||||
mkdir t
|
mkdir t
|
||||||
cd t
|
cd t
|
||||||
wget -q https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_aarch64.whl
|
wget -q https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
|
||||||
unzip ./sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_28_aarch64.whl
|
unzip ./sherpa_onnx-${SHERPA_ONNX_VERSION}-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
|
||||||
|
|
||||||
cp -v sherpa_onnx/lib/*.so* $dst
|
cp -v sherpa_onnx/lib/*.so* $dst
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user