Add JavaScript (WebAssembly) API for Kokoro TTS models. (#1726)

This commit is contained in:
Fangjun Kuang
2025-01-17 11:17:18 +08:00
committed by GitHub
parent e8d499d218
commit 3a1de0bfc1
5 changed files with 154 additions and 6 deletions

View File

@@ -42,6 +42,22 @@ node ./test-offline-speaker-diarization.js
In the following, we demonstrate how to run text-to-speech.
## ./test-offline-tts-kokoro-en.js
[./test-offline-tts-kokoro-en.js](./test-offline-tts-kokoro-en.js) shows how to use
[kokoro-en-v0_19](https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/kokoro-en-v0_19.tar.bz2)
for text-to-speech.
You can use the following command to run it:
```bash
wget https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/kokoro-en-v0_19.tar.bz2
tar xf kokoro-en-v0_19.tar.bz2
rm kokoro-en-v0_19.tar.bz2
node ./test-offline-tts-kokoro-en.js
```
## ./test-offline-tts-matcha-zh.js
[./test-offline-tts-matcha-zh.js](./test-offline-tts-matcha-zh.js) shows how to use

View File

@@ -0,0 +1,37 @@
// Copyright (c) 2025 Xiaomi Corporation (authors: Fangjun Kuang)
const sherpa_onnx = require('sherpa-onnx');
function createOfflineTts() {
let offlineTtsKokoroModelConfig = {
model: './kokoro-en-v0_19/model.onnx',
voices: './kokoro-en-v0_19/voices.bin',
tokens: './kokoro-en-v0_19/tokens.txt',
dataDir: './kokoro-en-v0_19/espeak-ng-data',
lengthScale: 1.0,
};
let offlineTtsModelConfig = {
offlineTtsKokoroModelConfig: offlineTtsKokoroModelConfig,
numThreads: 1,
debug: 1,
provider: 'cpu',
};
let offlineTtsConfig = {
offlineTtsModelConfig: offlineTtsModelConfig,
maxNumSentences: 1,
};
return sherpa_onnx.createOfflineTts(offlineTtsConfig);
}
const tts = createOfflineTts();
const speakerId = 0;
const speed = 1.0;
const text =
'Today as always, men fall into two groups: slaves and free men. Whoever does not have two-thirds of his day for himself, is a slave, whatever he may be: a statesman, a businessman, an official, or a scholar.'
const audio = tts.generate({text: text, sid: speakerId, speed: speed});
tts.save('./test-kokoro-en.wav', audio);
console.log('Saved to test-kokoro-en.wav successfully.');
tts.free();