diff --git a/sherpa-onnx/csrc/lexicon.cc b/sherpa-onnx/csrc/lexicon.cc index 9cdfd8f4..5d9ad8ff 100644 --- a/sherpa-onnx/csrc/lexicon.cc +++ b/sherpa-onnx/csrc/lexicon.cc @@ -214,7 +214,9 @@ std::vector Lexicon::ConvertTextToTokenIdsChinese( for (const auto &w : words) { if (punctuations_.count(w)) { - if (sil != -1) { + if (token2id_.count(w)) { + ans.push_back(token2id_.at(w)); + } else if (sil != -1) { ans.push_back(sil); } continue;