Add C++ and Python API for Kokoro 1.0 multilingual TTS model (#1795)
This commit is contained in:
.github/scripts/test-python.sh (vendored) — 24 lines changed
@@ -267,6 +267,27 @@ log "Offline TTS test"
|
||||
# test waves are saved in ./tts
|
||||
mkdir ./tts
|
||||
|
||||
log "kokoro-multi-lang-v1_0 test"
|
||||
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/kokoro-multi-lang-v1_0.tar.bz2
|
||||
tar xf kokoro-multi-lang-v1_0.tar.bz2
|
||||
rm kokoro-multi-lang-v1_0.tar.bz2
|
||||
|
||||
python3 ./python-api-examples/offline-tts.py \
|
||||
--debug=1 \
|
||||
--kokoro-model=./kokoro-multi-lang-v1_0/model.onnx \
|
||||
--kokoro-voices=./kokoro-multi-lang-v1_0/voices.bin \
|
||||
--kokoro-tokens=./kokoro-multi-lang-v1_0/tokens.txt \
|
||||
--kokoro-data-dir=./kokoro-multi-lang-v1_0/espeak-ng-data \
|
||||
--kokoro-dict-dir=./kokoro-multi-lang-v1_0/dict \
|
||||
--kokoro-lexicon=./kokoro-multi-lang-v1_0/lexicon-us-en.txt,./kokoro-multi-lang-v1_0/lexicon-zh.txt \
|
||||
--num-threads=2 \
|
||||
--sid=18 \
|
||||
--output-filename="./tts/kokoro-18-zh-en.wav" \
|
||||
"中英文语音合成测试。This is generated by next generation Kaldi using Kokoro without Misaki. 你觉得中英文说的如何呢?"
|
||||
|
||||
rm -rf kokoro-multi-lang-v1_0
|
||||
|
||||
log "kokoro-en-v0_19 test"
|
||||
|
||||
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/kokoro-en-v0_19.tar.bz2
|
||||
@@ -580,13 +601,10 @@ if [[ x$OS != x'windows-latest' ]]; then
|
||||
repo=sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01
|
||||
log "Start testing ${repo}"
|
||||
|
||||
pushd $dir
|
||||
curl -LS -O https://github.com/pkufool/keyword-spotting-models/releases/download/v0.1/sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01.tar.bz
|
||||
tar xf sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01.tar.bz
|
||||
rm sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01.tar.bz
|
||||
popd
|
||||
|
||||
repo=$dir/$repo
|
||||
ls -lh $repo
|
||||
|
||||
python3 ./python-api-examples/keyword-spotter.py
|
||||
|
||||
.github/workflows/export-kokoro.yaml (vendored) — 16 lines changed
@@ -4,7 +4,6 @@ on:
|
||||
push:
|
||||
branches:
|
||||
- export-kokoro
|
||||
- kokoro-1.0-2
|
||||
|
||||
workflow_dispatch:
|
||||
|
||||
@@ -76,6 +75,14 @@ jobs:
|
||||
if: matrix.version == '1.0'
|
||||
shell: bash
|
||||
run: |
|
||||
curl -SL -O https://github.com/csukuangfj/cppjieba/releases/download/sherpa-onnx-2024-04-19/dict.tar.bz2
|
||||
tar xvf dict.tar.bz2
|
||||
rm dict.tar.bz2
|
||||
|
||||
curl -SL -o date-zh.fst https://huggingface.co/csukuangfj/icefall-tts-aishell3-vits-low-2024-04-06/resolve/main/data/date.fst
|
||||
curl -SL -o number-zh.fst https://huggingface.co/csukuangfj/icefall-tts-aishell3-vits-low-2024-04-06/resolve/main/data/number.fst
|
||||
curl -SL -o phone-zh.fst https://huggingface.co/csukuangfj/icefall-tts-aishell3-vits-low-2024-04-06/resolve/main/data/phone.fst
|
||||
|
||||
src=scripts/kokoro/v1.0
|
||||
|
||||
d=kokoro-multi-lang-v1_0
|
||||
@@ -87,7 +94,12 @@ jobs:
|
||||
cp -v $src/tokens.txt $d/
|
||||
cp -v $src/lexicon*.txt $d/
|
||||
cp -v $src/README.md $d/README.md
|
||||
cp -av dict $d/
|
||||
cp -v ./*.fst $d/
|
||||
ls -lh $d/
|
||||
echo "---"
|
||||
ls -lh $d/dict
|
||||
|
||||
tar cjfv $d.tar.bz2 $d
|
||||
rm -rf $d
|
||||
|
||||
@@ -180,6 +192,8 @@ jobs:
|
||||
cp -v ../scripts/kokoro/v1.0/lexicon*.txt .
|
||||
cp -v ../scripts/kokoro/v1.0/README.md ./README.md
|
||||
cp -v ../LICENSE ./
|
||||
cp -av ../dict ./
|
||||
cp -v ../*.fst $d/
|
||||
|
||||
git lfs track "*.onnx"
|
||||
git add .
|
||||
|
||||
Reference in New Issue
Block a user