Add JavaScript API (WASM) for homophone replacer (#2157)

This commit is contained in:
Fangjun Kuang
2025-04-28 20:47:49 +08:00
committed by GitHub
parent e51c37eb2f
commit a0aef1f6cd
13 changed files with 165 additions and 24 deletions

View File

@@ -0,0 +1,40 @@
// Copyright (c) 2024-2025 Xiaomi Corporation (authors: Fangjun Kuang)
const sherpa_onnx = require('sherpa-onnx');
function createOfflineRecognizer() {
let modelConfig = {
senseVoice: {
model:
'./sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17/model.int8.onnx',
language: '',
useInverseTextNormalization: 1,
},
tokens: './sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17/tokens.txt',
};
let config = {
modelConfig: modelConfig,
hr: {
dictDir: './dict',
lexicon: './lexicon.txt',
ruleFsts: './replace.fst',
},
};
return sherpa_onnx.createOfflineRecognizer(config);
}
const recognizer = createOfflineRecognizer();
const stream = recognizer.createStream();
const waveFilename = './test-hr.wav';
const wave = sherpa_onnx.readWave(waveFilename);
stream.acceptWaveform(wave.sampleRate, wave.samples);
recognizer.decode(stream);
const text = recognizer.getResult(stream).text;
console.log(text);
stream.free();
recognizer.free();