Use piper-phonemize to convert text to token IDs (#453)

2023-11-30 23:57:43 +08:00
parent db41778e99
commit 62dc3c3e46
55 changed files with 1048 additions and 192 deletions
--- a/sherpa-onnx/csrc/offline-tts.h
+++ b/sherpa-onnx/csrc/offline-tts.h
@@ -28,10 +28,17 @@ struct OfflineTtsConfig {
  // If there are multiple rules, they are applied from left to right.
  std::string rule_fsts;

+  // Maximum number of sentences to process in a single batch.
+  // Limiting the batch size avoids running out of memory (OOM) on very long input text.
+  // Set it to -1 to process all sentences in a single batch.
+  int32_t max_num_sentences = 2;
+
  OfflineTtsConfig() = default;
  OfflineTtsConfig(const OfflineTtsModelConfig &model,
-                   const std::string &rule_fsts)
-      : model(model), rule_fsts(rule_fsts) {}
+                   const std::string &rule_fsts, int32_t max_num_sentences)
+      : model(model),
+        rule_fsts(rule_fsts),
+        max_num_sentences(max_num_sentences) {}

  void Register(ParseOptions *po);
  bool Validate() const;