diff --git a/scripts/tele-speech/test.py b/scripts/tele-speech/test.py index 71953700..b52174d1 100755 --- a/scripts/tele-speech/test.py +++ b/scripts/tele-speech/test.py @@ -80,7 +80,7 @@ def get_features(test_wav_filename): samples = librosa.resample(samples, orig_sr=sample_rate, target_sr=16000) sample_rate = 16000 - samples *= 372768 + samples *= 32768 opts = knf.MfccOptions() # See https://github.com/Tele-AI/TeleSpeech-ASR/blob/master/mfcc_hires.conf diff --git a/scripts/wenet/test-onnx-streaming.py b/scripts/wenet/test-onnx-streaming.py index 45a4b5b7..cbf27b74 100755 --- a/scripts/wenet/test-onnx-streaming.py +++ b/scripts/wenet/test-onnx-streaming.py @@ -112,7 +112,7 @@ def get_features(test_wav_filename): audio = torchaudio.functional.resample( audio, orig_freq=sample_rate, new_freq=16000 ) - audio *= 372768 + audio *= 32768 opts = knf.FbankOptions() opts.frame_opts.dither = 0 diff --git a/scripts/wenet/test-onnx.py b/scripts/wenet/test-onnx.py index 988fef4b..b9631ddb 100755 --- a/scripts/wenet/test-onnx.py +++ b/scripts/wenet/test-onnx.py @@ -52,7 +52,7 @@ def get_features(test_wav_filename): audio = torchaudio.functional.resample( audio, orig_freq=sample_rate, new_freq=16000 ) - audio *= 372768 + audio *= 32768 opts = knf.FbankOptions() opts.frame_opts.dither = 0