Add JavaScript API (WASM) for homophone replacer (#2157)
This commit is contained in:
@@ -182,10 +182,32 @@ tar xvf sherpa-onnx-paraformer-zh-2023-09-14.tar.bz2
|
||||
node ./test-offline-paraformer.js
|
||||
```
|
||||
|
||||
## ./test-offline-sense-voice-with-hr.js
|
||||
|
||||
[./test-offline-sense-voice-with-hr.js](./test-offline-sense-voice-with-hr.js) demonstrates
|
||||
how to decode a file with a non-streaming SenseVoice model with homophone replacer.
|
||||
|
||||
You can use the following command to run it:
|
||||
|
||||
```bash
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17.tar.bz2
|
||||
tar xvf sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17.tar.bz2
|
||||
rm sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17.tar.bz2
|
||||
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/hr-files/dict.tar.bz2
|
||||
tar xf dict.tar.bz2
|
||||
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/hr-files/replace.fst
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/hr-files/test-hr.wav
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/hr-files/lexicon.txt
|
||||
|
||||
node ./test-offline-sense-voice-with-hr.js
|
||||
```
|
||||
|
||||
## ./test-offline-sense-voice.js
|
||||
|
||||
[./test-offline-sense-voice.js](./test-offline-sense-voice.js) demonstrates
|
||||
how to decode a file with a non-streaming Paraformer model.
|
||||
how to decode a file with a non-streaming SenseVoice model.
|
||||
|
||||
You can use the following command to run it:
|
||||
|
||||
|
||||
40
nodejs-examples/test-offline-sense-voice-with-hr.js
Normal file
40
nodejs-examples/test-offline-sense-voice-with-hr.js
Normal file
@@ -0,0 +1,40 @@
|
||||
// Copyright (c) 2024-2025 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
|
||||
const sherpa_onnx = require('sherpa-onnx');
|
||||
|
||||
function createOfflineRecognizer() {
|
||||
let modelConfig = {
|
||||
senseVoice: {
|
||||
model:
|
||||
'./sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17/model.int8.onnx',
|
||||
language: '',
|
||||
useInverseTextNormalization: 1,
|
||||
},
|
||||
tokens: './sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17/tokens.txt',
|
||||
};
|
||||
|
||||
let config = {
|
||||
modelConfig: modelConfig,
|
||||
hr: {
|
||||
dictDir: './dict',
|
||||
lexicon: './lexicon.txt',
|
||||
ruleFsts: './replace.fst',
|
||||
},
|
||||
};
|
||||
|
||||
return sherpa_onnx.createOfflineRecognizer(config);
|
||||
}
|
||||
|
||||
const recognizer = createOfflineRecognizer();
|
||||
const stream = recognizer.createStream();
|
||||
|
||||
const waveFilename = './test-hr.wav';
|
||||
const wave = sherpa_onnx.readWave(waveFilename);
|
||||
stream.acceptWaveform(wave.sampleRate, wave.samples);
|
||||
|
||||
recognizer.decode(stream);
|
||||
const text = recognizer.getResult(stream).text;
|
||||
console.log(text);
|
||||
|
||||
stream.free();
|
||||
recognizer.free();
|
||||
Reference in New Issue
Block a user