Upload speaker embedding models to huggingface (#1428)
See also https://huggingface.co/spaces/k2-fsa/speaker-diarization
This commit is contained in:
@@ -4,10 +4,10 @@ set -e
|
||||
|
||||
function install_3d_speaker() {
|
||||
echo "Install 3D-Speaker"
|
||||
git clone https://github.com/alibaba-damo-academy/3D-Speaker.git
|
||||
git clone https://github.com/modelscope/3D-Speaker
|
||||
pushd 3D-Speaker
|
||||
pip install -q -r ./requirements.txt
|
||||
pip install -q modelscope onnx onnxruntime kaldi-native-fbank
|
||||
pip install -q modelscope==1.14.0 onnx onnxruntime kaldi-native-fbank
|
||||
popd
|
||||
}
|
||||
|
||||
|
||||
@@ -7,14 +7,17 @@ function install_nemo() {
|
||||
curl https://bootstrap.pypa.io/get-pip.py -o get-pip.py
|
||||
python3 get-pip.py
|
||||
|
||||
pip install torch==2.1.0+cpu torchaudio==2.1.0+cpu -f https://download.pytorch.org/whl/torch_stable.html
|
||||
pip install torch==2.1.0 torchaudio==2.1.0 -f https://download.pytorch.org/whl/torch_stable.html
|
||||
|
||||
pip install wget text-unidecode matplotlib>=3.3.2 onnx onnxruntime pybind11 Cython einops kaldi-native-fbank soundfile
|
||||
pip install -qq wget text-unidecode matplotlib>=3.3.2 onnx onnxruntime pybind11 Cython einops kaldi-native-fbank soundfile
|
||||
pip install -qq ipython
|
||||
|
||||
sudo apt-get install -q -y sox libsndfile1 ffmpeg python3-pip
|
||||
# sudo apt-get install -q -y sox libsndfile1 ffmpeg python3-pip ipython
|
||||
|
||||
BRANCH='main'
|
||||
python3 -m pip install git+https://github.com/NVIDIA/NeMo.git@$BRANCH#egg=nemo_toolkit[asr]
|
||||
|
||||
pip install numpy==1.26.4
|
||||
}
|
||||
|
||||
install_nemo
|
||||
|
||||
Reference in New Issue
Block a user