Add HarmonyOS examples for MatchaTTS. (#1678)

2025-01-03 17:09:29 +08:00
parent 0e299f30f5
commit bf3330c906
9 changed files with 141 additions and 15 deletions
--- a/harmony-os/SherpaOnnxHar/sherpa_onnx/BuildProfile.ets
+++ b/harmony-os/SherpaOnnxHar/sherpa_onnx/BuildProfile.ets
@@ -1,7 +1,7 @@
 /**
 * Use these variables when you tailor your ArkTS code. They must be of the const type.
 */
-export const HAR_VERSION = '1.10.35';
+export const HAR_VERSION = '1.10.37';
 export const BUILD_MODE_NAME = 'debug';
 export const DEBUG = true;
 export const TARGET_NAME = 'default';
--- a/harmony-os/SherpaOnnxHar/sherpa_onnx/Index.ets
+++ b/harmony-os/SherpaOnnxHar/sherpa_onnx/Index.ets
@@ -1,11 +1,6 @@
 export { listRawfileDir, readWave, readWaveFromBinary, } from "libsherpa_onnx.so";

-export { CircularBuffer,
-  SileroVadConfig,
-  SpeechSegment,
-  Vad,
-  VadConfig,
-} from './src/main/ets/components/Vad';
+export { CircularBuffer, SileroVadConfig, SpeechSegment, Vad, VadConfig, } from './src/main/ets/components/Vad';


 export { Samples,
@@ -36,7 +31,8 @@ export { OnlineStream,
  OnlineRecognizer,
 } from './src/main/ets/components/StreamingAsr';

-export { OfflineTtsVitsModelConfig,
+export { OfflineTtsMatchaModelConfig,
+  OfflineTtsVitsModelConfig,
  OfflineTtsModelConfig,
  OfflineTtsConfig,
  OfflineTts,
--- a/harmony-os/SherpaOnnxHar/sherpa_onnx/src/main/ets/components/NonStreamingTts.ets
+++ b/harmony-os/SherpaOnnxHar/sherpa_onnx/src/main/ets/components/NonStreamingTts.ets
@@ -17,8 +17,20 @@ export class OfflineTtsVitsModelConfig {
  public lengthScale: number = 1.0;
 }

+export class OfflineTtsMatchaModelConfig {
+  public acousticModel: string = '';
+  public vocoder: string = '';
+  public lexicon: string = '';
+  public tokens: string = '';
+  public dataDir: string = '';
+  public dictDir: String = '';
+  public noiseScale: number = 0.667;
+  public lengthScale: number = 1.0;
+}
+
 export class OfflineTtsModelConfig {
  public vits: OfflineTtsVitsModelConfig = new OfflineTtsVitsModelConfig();
+  public matcha: OfflineTtsMatchaModelConfig = new OfflineTtsMatchaModelConfig();
  public numThreads: number = 1;
  public debug: boolean = false;
  public provider: string = 'cpu';
--- a/harmony-os/SherpaOnnxTts/entry/src/main/ets/workers/NonStreamingTtsWorker.ets
+++ b/harmony-os/SherpaOnnxTts/entry/src/main/ets/workers/NonStreamingTtsWorker.ets
@@ -73,7 +73,16 @@ function initTts(context: Context): OfflineTts {
  // for details

  let modelDir = '';
+
+  // for VITS begin
  let modelName = '';
+  // for VITS end
+
+  // for Matcha begin
+  let acousticModelName = '';
+  let vocoder = '';
+  // for Matcha end
+
  let ruleFsts = '';
  let ruleFars = '';
  let lexicon = '';
@@ -134,15 +143,47 @@ function initTts(context: Context): OfflineTts {
  // dictDir = 'dict';
  // ruleFsts = `date.fst,phone.fst,number.fst`;

+  // Example 8
+  // https://github.com/k2-fsa/sherpa-onnx/releases/tag/tts-models
+  // https://k2-fsa.github.io/sherpa/onnx/tts/pretrained_models/matcha.html#matcha-icefall-zh-baker-chinese-1-female-speaker
+  // modelDir = 'matcha-icefall-zh-baker'
+  // acousticModelName = 'model-steps-3.onnx'
+  // vocoder = 'hifigan_v2.onnx'
+  // lexicon = 'lexicon.txt'
+  // dictDir = 'dict';
+  // ruleFsts = `date.fst,phone.fst,number.fst`;
+
+  // Example 9
+  // https://github.com/k2-fsa/sherpa-onnx/releases/tag/tts-models
+  // https://k2-fsa.github.io/sherpa/onnx/tts/pretrained_models/matcha.html#matcha-icefall-en-us-ljspeech-american-english-1-female-speaker
+  // modelDir = 'matcha-icefall-en_US-ljspeech'
+  // acousticModelName = 'model-steps-3.onnx'
+  // vocoder = 'hifigan_v2.onnx'
+  // dataDir = 'espeak-ng-data';
+
  // ============================================================
  // Please don't change the remaining part of this function
  // ============================================================

-  if (modelName == '') {
+  if (modelName == '' && acousticModelName == '' && vocoder == '') {
    throw new Error('You are supposed to select a model by changing the code before you run the app');
  }

-  modelName = modelDir + '/' + modelName;
+  if (modelName != '' && acousticModelName != '') {
+    throw new Error('Please select either VITS or Matcha, not both');
+  }
+
+  if (acousticModelName != '' && vocoder == '') {
+    throw new Error('Please provider vocoder for matcha tts models');
+  }
+
+  if (modelName != '') {
+    modelName = modelDir + '/' + modelName;
+  }
+
+  if (acousticModelName != '') {
+    acousticModelName = modelDir + '/' + acousticModelName;
+  }

  if (ruleFsts != '') {
    let fsts = ruleFsts.split(',')
@@ -186,6 +227,14 @@ function initTts(context: Context): OfflineTts {
  config.model.vits.tokens = tokens;
  config.model.vits.dataDir = dataDir;
  config.model.vits.dictDir = dictDir;
+
+  config.model.matcha.acousticModel = acousticModelName;
+  config.model.matcha.vocoder = vocoder;
+  config.model.matcha.lexicon = lexicon;
+  config.model.matcha.tokens = tokens;
+  config.model.matcha.dataDir = dataDir;
+  config.model.matcha.dictDir = dictDir;
+
  config.model.numThreads = 2;
  config.model.debug = true;
  config.ruleFsts = ruleFsts;