From 598213f4669ada9933393da2559b79d5556021a2 Mon Sep 17 00:00:00 2001 From: luopingyi Date: Wed, 10 Sep 2025 11:06:39 +0800 Subject: [PATCH] update README --- README.md | 125 ++++++++++++++++++++++++++++++ mr_v100-f5-tts/Dockerfile_f5 | 8 +- mr_v100-f5-tts/launch.sh | 3 - mr_v100-gpt-sovits/Dockerfile_gsv | 6 +- mr_v100-gpt-sovits/launch.sh | 17 ---- mr_v100-kokoro/Dockerfile_kokoro | 8 +- mr_v100-kokoro/launch.sh | 4 - mr_v100-matcha/Dockerfile_matcha | 5 +- mr_v100-matcha/launch.sh | 4 - mr_v100-piper/Dockerfile_piper | 5 +- mr_v100-piper/launch.sh | 3 - 11 files changed, 135 insertions(+), 53 deletions(-) create mode 100644 README.md delete mode 100755 mr_v100-f5-tts/launch.sh delete mode 100755 mr_v100-gpt-sovits/launch.sh delete mode 100755 mr_v100-kokoro/launch.sh delete mode 100755 mr_v100-matcha/launch.sh delete mode 100755 mr_v100-piper/launch.sh diff --git a/README.md b/README.md new file mode 100644 index 0000000..2c9fee5 --- /dev/null +++ b/README.md @@ -0,0 +1,125 @@ +# 天数智芯 智铠100 语音合成 + +该模型测试框架在智铠100加速卡上,适配了 Kokoro, F5-TTS, GPT-SoVITS 等模型,将文本转换为语音信号。 + +GPT-SoVITS 模型是一个集成了语音转换和文本转语音功能的先进 AI 系统,基于 GPT 和 SoVITS 技术构建。 +Kokoro 是由 hexgrad 团队开发并开源的轻量级、高性能文本转语音(TTS)模型。 +F5-TTS 模型由上海交通大学团队发布,是基于扩散 Transformer 和 ConvNeXt V2 的文本转语音(TTS)模型。 + + + +## 如何使用语音合成模型测试框架 +代码实现了一个接收文本并返回合成音频的语音合成 HTTP 服务,将该 HTTP 服务重新打包成 docker 镜像,通过 k8s 集群sut容器去请求这个 HTTP 服务。 + +## 智铠100系列上语音合成模型运行测试结果 +在智铠100系列上对部分语音合成模型进行适配,测试方式为在 Nvidia A100 和 智铠100加速卡上对同一段text进行语音合成任务,获取运行时间 + + +| 模型名称 | 模型类型 | 适配状态 | 智铠100运行时间/s | Nvidia A100运行时间/s | +| ---------- | ---------------------- | -------- | ----------------- | --------------------- | +| kokoro | StyleTTS 2, ISTFTNet | 成功 | 2.1 | 5.4 | +| f5-TTS | DiT, ConvNeXt V2 | 成功 | 6.5 | 5.4 | +| gpt-sovits | VITS | 成功 | 17.7 | 20.5 | +| matcha | OT-CFM, Transformer | 成功 | 3.7 | 3.2 | +| piper | - | 成功 | 0.3 | 1.7 | diff --git a/mr_v100-f5-tts/Dockerfile_f5 b/mr_v100-f5-tts/Dockerfile_f5 index ba6c267..288f5c7 100644 --- 
a/mr_v100-f5-tts/Dockerfile_f5 +++ b/mr_v100-f5-tts/Dockerfile_f5 @@ -2,10 +2,8 @@ FROM git.modelhub.org.cn:9443/enginex-iluvatar/mr100_corex:4.3.0 WORKDIR /workspace COPY . /workspace/ -RUN pip install -r requirements_f5.txt -c constraints_f5.txt -i https://nexus.4pd.io/repository/pypi-all/simple -RUN cd F5-TTS && pip install -e . -c ../constraints_f5.txt -i https://nexus.4pd.io/repository/pypi-all/simple +RUN pip install -r requirements_f5.txt -c constraints_f5.txt +RUN cd F5-TTS && pip install -e . -c ../constraints_f5.txt - -#ENTRYPOINT ["/bin/bash", "launch_f5.sh"] -ENTRYPOINT ["/bin/bash", "launch.sh"] +ENTRYPOINT ["/bin/bash", "launch_f5.sh"] diff --git a/mr_v100-f5-tts/launch.sh b/mr_v100-f5-tts/launch.sh deleted file mode 100755 index c4561a8..0000000 --- a/mr_v100-f5-tts/launch.sh +++ /dev/null @@ -1,3 +0,0 @@ -#!/bin/bash - -python3 f5_server.py diff --git a/mr_v100-gpt-sovits/Dockerfile_gsv b/mr_v100-gpt-sovits/Dockerfile_gsv index cdf56a7..df5845f 100644 --- a/mr_v100-gpt-sovits/Dockerfile_gsv +++ b/mr_v100-gpt-sovits/Dockerfile_gsv @@ -13,7 +13,5 @@ COPY constraints_gsv.txt /workspace/ RUN pip install -r GPT-SoVITS/extra-req.txt --no-deps \ && pip install -r GPT-SoVITS/requirements.txt -c constraints_gsv.txt -#COPY launch_gsv.sh /workspace/ -#ENTRYPOINT ["/bin/bash", "launch_gsv.sh"] -COPY launch.sh /workspace/ -ENTRYPOINT ["/bin/bash", "launch.sh"] +COPY launch_gsv.sh /workspace/ +ENTRYPOINT ["/bin/bash", "launch_gsv.sh"] diff --git a/mr_v100-gpt-sovits/launch.sh b/mr_v100-gpt-sovits/launch.sh deleted file mode 100755 index cdbf493..0000000 --- a/mr_v100-gpt-sovits/launch.sh +++ /dev/null @@ -1,17 +0,0 @@ -#!/bin/bash - -redis-server --daemonize yes - -if [ -z "$MODEL_DIR" ]; then - export MODEL_DIR="/models/GPT-SoVITS" -fi - -if [ -z "$NLTK_DATA" ]; then - export NLTK_DATA="/models/GPT-SoVITS/nltk_data" -fi - -if [ -z "$bert_path" ]; then - export bert_path="${MODEL_DIR}/chinese-roberta-wwm-ext-large" -fi - -cd GPT-SoVITS && python3 gsv_server.py 
diff --git a/mr_v100-kokoro/Dockerfile_kokoro b/mr_v100-kokoro/Dockerfile_kokoro index c814da4..9f5840e 100644 --- a/mr_v100-kokoro/Dockerfile_kokoro +++ b/mr_v100-kokoro/Dockerfile_kokoro @@ -7,11 +7,9 @@ RUN apt-get update && \ rm -rf /var/lib/apt/lists/* COPY requirements_kokoro.txt constraints_kokoro.txt kokoro_server.py en_core_web_sm-3.8.0.tar.gz /workspace/ -RUN pip install -r requirements_kokoro.txt -c constraints_kokoro.txt -i https://nexus.4pd.io/repository/pypi-all/simple +RUN pip install -r requirements_kokoro.txt -c constraints_kokoro.txt RUN pip install en_core_web_sm-3.8.0.tar.gz -#COPY launch_kokoro.sh /workspace/ -#ENTRYPOINT ["/bin/bash", "launch_kokoro.sh"] -COPY launch.sh /workspace/ -ENTRYPOINT ["/bin/bash", "launch.sh"] +COPY launch_kokoro.sh /workspace/ +ENTRYPOINT ["/bin/bash", "launch_kokoro.sh"] diff --git a/mr_v100-kokoro/launch.sh b/mr_v100-kokoro/launch.sh deleted file mode 100755 index 7dfbcd9..0000000 --- a/mr_v100-kokoro/launch.sh +++ /dev/null @@ -1,4 +0,0 @@ -#!/bin/bash - -python3 kokoro_server.py - diff --git a/mr_v100-matcha/Dockerfile_matcha b/mr_v100-matcha/Dockerfile_matcha index 1a18d65..56d42ef 100644 --- a/mr_v100-matcha/Dockerfile_matcha +++ b/mr_v100-matcha/Dockerfile_matcha @@ -11,10 +11,7 @@ COPY requirements_matcha.txt constraints_matcha.txt matcha_server.py launch_matc RUN pip install -r requirements_matcha.txt -c constraints_matcha.txt RUN pip install matcha-tts -c constraints_matcha.txt -#ENTRYPOINT ["/bin/bash", "launch_matcha.sh"] - -COPY launch.sh /workspace/ -ENTRYPOINT ["/bin/bash", "launch.sh"] +ENTRYPOINT ["/bin/bash", "launch_matcha.sh"] diff --git a/mr_v100-matcha/launch.sh b/mr_v100-matcha/launch.sh deleted file mode 100755 index c9ec741..0000000 --- a/mr_v100-matcha/launch.sh +++ /dev/null @@ -1,4 +0,0 @@ -#!/bin/bash - -python3 matcha_server.py - diff --git a/mr_v100-piper/Dockerfile_piper b/mr_v100-piper/Dockerfile_piper index 5ff11f3..0a56146 100644 --- a/mr_v100-piper/Dockerfile_piper +++ 
b/mr_v100-piper/Dockerfile_piper @@ -9,7 +9,4 @@ RUN pip install -r requirements_piper.txt -c constraints_piper.txt ENV PYTHONPATH=/workspace/piper/src/python:$PYTHONPATH RUN cd /workspace/piper/src/python && pip install -e . && ./build_monotonic_align.sh -#ENTRYPOINT ["/bin/bash", "launch_piper.sh"] - -COPY launch.sh /workspace/ -ENTRYPOINT ["/bin/bash", "launch.sh"] +ENTRYPOINT ["/bin/bash", "launch_piper.sh"] diff --git a/mr_v100-piper/launch.sh b/mr_v100-piper/launch.sh deleted file mode 100755 index fcbd834..0000000 --- a/mr_v100-piper/launch.sh +++ /dev/null @@ -1,3 +0,0 @@ -#!/bin/bash -python3 piper_server.py -