Support removing invalid utf-8 sequences. (#1648)
This commit is contained in:
@@ -194,6 +194,8 @@ OnlineRecognizerImpl::OnlineRecognizerImpl(Manager *mgr,
|
||||
|
||||
std::string OnlineRecognizerImpl::ApplyInverseTextNormalization(
|
||||
std::string text) const {
|
||||
text = RemoveInvalidUtf8Sequences(text);
|
||||
|
||||
if (!itn_list_.empty()) {
|
||||
for (const auto &tn : itn_list_) {
|
||||
text = tn->Normalize(text);
|
||||
|
||||
Reference in New Issue
Block a user