Add C++ and Python API for Kokoro TTS models. (#1715)

This commit is contained in:
Fangjun Kuang
2025-01-16 14:24:51 +08:00
committed by GitHub
parent 9efe26a646
commit ffc6b480a0
27 changed files with 1193 additions and 29 deletions

View File

@@ -0,0 +1,96 @@
// sherpa-onnx/csrc/offline-tts-kokoro-model-config.cc
//
// Copyright (c) 2025 Xiaomi Corporation
#include "sherpa-onnx/csrc/offline-tts-kokoro-model-config.h"
#include <vector>
#include "sherpa-onnx/csrc/file-utils.h"
#include "sherpa-onnx/csrc/macros.h"
namespace sherpa_onnx {
void OfflineTtsKokoroModelConfig::Register(ParseOptions *po) {
po->Register("kokoro-model", &model, "Path to Kokoro model");
po->Register("kokoro-voices", &voices,
"Path to voices.bin for Kokoro models");
po->Register("kokoro-tokens", &tokens,
"Path to tokens.txt for Kokoro models");
po->Register("kokoro-data-dir", &data_dir,
"Path to the directory containing dict for espeak-ng.");
po->Register("kokoro-length-scale", &length_scale,
"Speech speed. Larger->Slower; Smaller->faster.");
}
bool OfflineTtsKokoroModelConfig::Validate() const {
if (model.empty()) {
SHERPA_ONNX_LOGE("Please provide --kokoro-model");
return false;
}
if (!FileExists(model)) {
SHERPA_ONNX_LOGE("--kokoro-model: '%s' does not exist", model.c_str());
return false;
}
if (tokens.empty()) {
SHERPA_ONNX_LOGE("Please provide --kokoro-tokens");
return false;
}
if (!FileExists(tokens)) {
SHERPA_ONNX_LOGE("--kokoro-tokens: '%s' does not exist", tokens.c_str());
return false;
}
if (data_dir.empty()) {
SHERPA_ONNX_LOGE("Please provide --kokoro-data-dir");
return false;
}
if (!FileExists(data_dir + "/phontab")) {
SHERPA_ONNX_LOGE(
"'%s/phontab' does not exist. Please check --kokoro-data-dir",
data_dir.c_str());
return false;
}
if (!FileExists(data_dir + "/phonindex")) {
SHERPA_ONNX_LOGE(
"'%s/phonindex' does not exist. Please check --kokoro-data-dir",
data_dir.c_str());
return false;
}
if (!FileExists(data_dir + "/phondata")) {
SHERPA_ONNX_LOGE(
"'%s/phondata' does not exist. Please check --kokoro-data-dir",
data_dir.c_str());
return false;
}
if (!FileExists(data_dir + "/intonations")) {
SHERPA_ONNX_LOGE(
"'%s/intonations' does not exist. Please check --kokoro-data-dir",
data_dir.c_str());
return false;
}
return true;
}
std::string OfflineTtsKokoroModelConfig::ToString() const {
std::ostringstream os;
os << "OfflineTtsKokoroModelConfig(";
os << "model=\"" << model << "\", ";
os << "voices=\"" << voices << "\", ";
os << "tokens=\"" << tokens << "\", ";
os << "data_dir=\"" << data_dir << "\", ";
os << "length_scale=" << length_scale << ")";
return os.str();
}
} // namespace sherpa_onnx