zhifu gao
2024-02-01 2ddfc27d5b69e5c1a38021554e97dae958328c20
examples/industrial_data_pretraining/seaco_paraformer/demo.py
@@ -25,6 +25,7 @@
# example2: load the example wav as a tensor using torchaudio
import torchaudio
import os
# Path of the example audio under model.model_path (`model` is defined outside this excerpt).
wav_file = os.path.join(model.model_path, "example/asr_example.wav")
# torchaudio.load returns the decoded audio tensor together with its sample rate.
input_tensor, sample_rate = torchaudio.load(wav_file)
# Average over dim 0 -- presumably the channel axis, yielding a mono signal
# (torchaudio.load is channels-first by default); TODO confirm.
input_tensor = input_tensor.mean(0)
@@ -33,7 +34,7 @@
# example3: read the example wav with soundfile and pass the decoded samples to generate()
import soundfile
import os
# Path of the example audio under model.model_path (`model` is defined outside this excerpt).
wav_file = os.path.join(model.model_path, "example/asr_example.wav")
# NOTE(review): sample_rate is not used in the visible lines -- presumably the
# example file already has the rate the model expects; confirm.
speech, sample_rate = soundfile.read(wav_file)
# The decoded samples are passed as a one-element list via the `input` keyword.
res = model.generate(input=[speech], batch_size_s=300, is_final=True)