Add C++ runtime for MeloTTS (#1138)
This commit is contained in:
@@ -17,6 +17,7 @@ namespace sherpa_onnx {
|
||||
|
||||
// implemented in ./lexicon.cc
|
||||
std::unordered_map<std::string, int32_t> ReadTokens(std::istream &is);
|
||||
|
||||
std::vector<int32_t> ConvertTokensToIds(
|
||||
const std::unordered_map<std::string, int32_t> &token2id,
|
||||
const std::vector<std::string> &tokens);
|
||||
@@ -53,8 +54,7 @@ class JiebaLexicon::Impl {
|
||||
}
|
||||
}
|
||||
|
||||
std::vector<std::vector<int64_t>> ConvertTextToTokenIds(
|
||||
const std::string &text) const {
|
||||
std::vector<TokenIDs> ConvertTextToTokenIds(const std::string &text) const {
|
||||
// see
|
||||
// https://github.com/Plachtaa/VITS-fast-fine-tuning/blob/main/text/mandarin.py#L244
|
||||
std::regex punct_re{":|、|;"};
|
||||
@@ -87,7 +87,7 @@ class JiebaLexicon::Impl {
|
||||
SHERPA_ONNX_LOGE("after jieba processing: %s", os.str().c_str());
|
||||
}
|
||||
|
||||
std::vector<std::vector<int64_t>> ans;
|
||||
std::vector<TokenIDs> ans;
|
||||
std::vector<int64_t> this_sentence;
|
||||
|
||||
int32_t blank = token2id_.at(" ");
|
||||
@@ -217,7 +217,7 @@ JiebaLexicon::JiebaLexicon(const std::string &lexicon,
|
||||
: impl_(std::make_unique<Impl>(lexicon, tokens, dict_dir, meta_data,
|
||||
debug)) {}
|
||||
|
||||
std::vector<std::vector<int64_t>> JiebaLexicon::ConvertTextToTokenIds(
|
||||
std::vector<TokenIDs> JiebaLexicon::ConvertTextToTokenIds(
|
||||
const std::string &text, const std::string & /*unused_voice = ""*/) const {
|
||||
return impl_->ConvertTextToTokenIds(text);
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user