Add dict_dir arg to C API to support Chinese TTS models using jieba (#809)

2024-04-25 12:28:31 +08:00
parent 83cd533f67
commit 6686c7d3e6
12 changed files with 48 additions and 6 deletions
--- a/scripts/go/sherpa_onnx.go
+++ b/scripts/go/sherpa_onnx.go
@@ -532,10 +532,11 @@ type OfflineTtsVitsModelConfig struct {
 	Model       string  // Path to the VITS onnx model
 	Lexicon     string  // Path to lexicon.txt
 	Tokens      string  // Path to tokens.txt
-	DataDir     string  // Path to tokens.txt
+	DataDir     string  // Path to espeak-ng-data directory
 	NoiseScale  float32 // noise scale for vits models. Please use 0.667 in general
 	NoiseScaleW float32 // noise scale for vits models. Please use 0.8 in general
 	LengthScale float32 // Please use 1.0 in general. Smaller -> Faster speech speed. Larger -> Slower speech speed
+	DictDir     string  // Path to dict directory for jieba (used only in Chinese tts)
 }

 type OfflineTtsModelConfig struct {
@@ -605,6 +606,9 @@ func NewOfflineTts(config *OfflineTtsConfig) *OfflineTts {
 	c.model.vits.noise_scale_w = C.float(config.Model.Vits.NoiseScaleW)
 	c.model.vits.length_scale = C.float(config.Model.Vits.LengthScale)

+	c.model.vits.dict_dir = C.CString(config.Model.Vits.DictDir)
+	defer C.free(unsafe.Pointer(c.model.vits.dict_dir))
+
 	c.model.num_threads = C.int(config.Model.NumThreads)
 	c.model.debug = C.int(config.Model.Debug)