Add C++ runtime for Tele-AI/TeleSpeech-ASR (#970)

2024-06-05 00:26:40 +08:00
parent f8dbc10146
commit fd5a0d1e00
52 changed files with 1052 additions and 145 deletions
--- a/go-api-examples/non-streaming-decode-files/main.go
+++ b/go-api-examples/non-streaming-decode-files/main.go
@@ -40,6 +40,9 @@ func main() {
 	flag.IntVar(&config.ModelConfig.Debug, "debug", 0, "Whether to show debug message")
 	flag.StringVar(&config.ModelConfig.ModelType, "model-type", "", "Optional. Used for loading the model in a faster way")
 	flag.StringVar(&config.ModelConfig.Provider, "provider", "cpu", "Provider to use")
+	flag.StringVar(&config.ModelConfig.ModelingUnit, "modeling-unit", "cjkchar", "cjkchar, bpe, cjkchar+bpe, or leave it to empty")
+	flag.StringVar(&config.ModelConfig.BpeVocab, "bpe-vocab", "", "")
+	flag.StringVar(&config.ModelConfig.TeleSpeechCtc, "telespeech-ctc", "", "Used for TeleSpeechCtc model")
 	flag.StringVar(&config.LmConfig.Model, "lm-model", "", "Optional. Path to the LM model")
 	flag.Float32Var(&config.LmConfig.Scale, "lm-scale", 1.0, "Optional. Scale for the LM model")

--- a/go-api-examples/non-streaming-decode-files/run-telespeech-ctc.sh
+++ b/go-api-examples/non-streaming-decode-files/run-telespeech-ctc.sh
@@ -0,0 +1,19 @@
+#!/usr/bin/env bash
+# Downloads the TeleSpeech CTC int8 model archive if needed, builds this example, and runs it on a test wave from the model directory.
+set -ex  # -e: stop at the first failing command; -x: echo each command before running it
+
+if [ ! -d sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04 ]; then  # fetch the model only when its directory is not already present
+  curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04.tar.bz2  # -L follows redirects; -O saves under the remote file name
+  tar xvf sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04.tar.bz2  # presumably unpacks into the directory tested above; confirm against the archive layout
+  rm sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04.tar.bz2  # the archive is not used again after extraction
+fi
+
+go mod tidy  # bring go.mod/go.sum in line with the example's imports before building
+go build  # presumably produces the ./non-streaming-decode-files binary invoked below
+
+./non-streaming-decode-files \
+  --telespeech-ctc ./sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04/model.int8.onnx \
+  --tokens ./sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04/tokens.txt \
+  --model-type telespeech-ctc \
+  --debug 0 \
+  ./sherpa-onnx-telespeech-ctc-int8-zh-2024-06-04/test_wavs/3-sichuan.wav  # positional argument: presumably the wave file to decode