Export nvidia/canary-180m-flash to sherpa-onnx (#2272)

This commit is contained in:
Fangjun Kuang
2025-06-02 22:28:15 +08:00
committed by GitHub
parent 2b2788332e
commit 6cb44d44e9
4 changed files with 851 additions and 0 deletions

View File

@@ -0,0 +1,131 @@
#!/usr/bin/env bash
# Copyright 2025 Xiaomi Corp. (authors: Fangjun Kuang)
#
# Downloads two sample recordings (de.wav and en.wav), installs the Python
# dependencies, runs ./export_onnx_180m_flash.py, and then runs
# ./test_180m_flash.py on the fp32, int8 and fp16 ONNX files for each
# en/de source/target language pairing.
#
# All scripts and model files are referenced through ./ relative paths, so
# this must be run from the directory that contains them.
#
# -e: abort on the first command that fails.
# -x: print every command before it is executed.
set -ex
log() {
  # Print "<timestamp> (<file>:<line>:<function>) <message>" to stdout.
  # (Helper borrowed from espnet.)
  #
  # Arguments: the message words; they are joined with spaces.
  # <file> is the basename of the script that called log, <line> is the line
  # of that call, and <function> is the name of the calling function.
  # The message goes through `echo -e`, so backslash escapes such as \t in it
  # are interpreted.
  local caller_path=${BASH_SOURCE[1]}
  local call_site="${caller_path##*/}:${BASH_LINENO[0]}:${FUNCNAME[1]}"
  echo -e "$(date '+%Y-%m-%d %H:%M:%S') (${call_site}) $*"
}
# Fetch the two sample recordings that the test runs below read.
# --fail makes curl exit non-zero on an HTTP error (e.g. 404) instead of
# saving the server's error page under the .wav name, so a bad download stops
# the script here (set -e) rather than surfacing later inside the test script.
curl --fail -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/de.wav
curl --fail -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/en.wav

# Install the Python dependencies before running the export and test scripts.
# The requirement with an extras marker is quoted as a whole: an unquoted
# [...] is a shell glob pattern and could be replaced by a matching file name
# in the current directory.
pip install \
  "nemo_toolkit[asr]" \
  "numpy<2" \
  ipython \
  kaldi-native-fbank \
  librosa \
  onnx==1.17.0 \
  onnxmltools \
  onnxruntime==1.17.1 \
  soundfile

# Run the export step, then list the .onnx files now present in this directory.
python3 ./export_onnx_180m_flash.py
# "./" keeps a file whose name starts with "-" from being parsed as an option.
ls -lh ./*.onnx
log "-----fp32------"
# Run the test script with the fp32 encoder/decoder for every language
# pairing. Each table entry is "<source-lang> <target-lang> <wav>"; entries
# are processed top to bottom.
for case_spec in \
  "en en ./en.wav" \
  "en de ./en.wav" \
  "de de ./de.wav" \
  "de en ./de.wav"; do
  # Split the entry on whitespace into its three fields.
  read -r src_lang tgt_lang wav_path <<< "$case_spec"
  python3 ./test_180m_flash.py \
    --encoder ./encoder.onnx \
    --decoder ./decoder.onnx \
    --source-lang "$src_lang" \
    --target-lang "$tgt_lang" \
    --tokens ./tokens.txt \
    --wav "$wav_path"
done
log "-----int8------"
# Run the test script with the int8 encoder AND the int8 decoder for every
# language pairing. Previously this section passed ./decoder.fp16.onnx, so the
# int8 decoder was never exercised and the runs did not match the section
# label; the fp32 and fp16 sections both pair encoder and decoder of the same
# precision.
# NOTE(review): assumes ./export_onnx_180m_flash.py writes ./decoder.int8.onnx
# next to ./encoder.int8.onnx -- confirm against the export script.
#
# Each table entry is "<source-lang> <target-lang> <wav>"; entries are
# processed top to bottom.
for case_spec in \
  "en en ./en.wav" \
  "en de ./en.wav" \
  "de de ./de.wav" \
  "de en ./de.wav"; do
  # Split the entry on whitespace into its three fields.
  read -r src_lang tgt_lang wav_path <<< "$case_spec"
  python3 ./test_180m_flash.py \
    --encoder ./encoder.int8.onnx \
    --decoder ./decoder.int8.onnx \
    --source-lang "$src_lang" \
    --target-lang "$tgt_lang" \
    --tokens ./tokens.txt \
    --wav "$wav_path"
done
log "-----fp16------"
# Run the test script with the fp16 encoder/decoder for every language
# pairing. Each table entry is "<source-lang> <target-lang> <wav>"; entries
# are processed top to bottom.
for case_spec in \
  "en en ./en.wav" \
  "en de ./en.wav" \
  "de de ./de.wav" \
  "de en ./de.wav"; do
  # Split the entry on whitespace into its three fields.
  read -r src_lang tgt_lang wav_path <<< "$case_spec"
  python3 ./test_180m_flash.py \
    --encoder ./encoder.fp16.onnx \
    --decoder ./decoder.fp16.onnx \
    --source-lang "$src_lang" \
    --target-lang "$tgt_lang" \
    --tokens ./tokens.txt \
    --wav "$wav_path"
done