From aa45aeeaa7e8abd11bc1be392b4547685645ca5e Mon Sep 17 00:00:00 2001
From: 语帆 <yf352572@alibaba-inc.com>
Date: 星期一, 04 三月 2024 14:29:52 +0800
Subject: [PATCH] atsr

---
 examples/industrial_data_pretraining/lcbnet/demp.py |   35 +++++++++++++++++++++++++++++++++++
 1 files changed, 35 insertions(+), 0 deletions(-)

diff --git a/examples/industrial_data_pretraining/lcbnet/demp.py b/examples/industrial_data_pretraining/lcbnet/demp.py
new file mode 100644
index 0000000..cb08290
--- /dev/null
+++ b/examples/industrial_data_pretraining/lcbnet/demp.py
@@ -0,0 +1,35 @@
+#!/usr/bin/env python3
+# -*- encoding: utf-8 -*-
+# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
+# MIT License (https://opensource.org/licenses/MIT)
+
+from funasr import AutoModel
+
+# Instantiate AutoModel for the "iic/LCB-NET" model id; the examples below reuse it.
+model = AutoModel(model="iic/LCB-NET")
+
+
+# example1 (disabled): audio URL as input. Keep EVERY line of the call commented out.
+#res = model.generate(input="https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_audio/asr_example_zh.wav",
+#                     )
+#print(res)
+
+
+'''
+# tensor or numpy as input
+# example2
+import torchaudio
+import os
+wav_file = os.path.join(model.model_path, "example/asr_example.wav")
+input_tensor, sample_rate = torchaudio.load(wav_file)
+input_tensor = input_tensor.mean(0)
+res = model.generate(input=[input_tensor], batch_size_s=300, is_final=True)
+
+
+# example3
+import soundfile
+
+wav_file = os.path.join(model.model_path, "example/asr_example.wav")
+speech, sample_rate = soundfile.read(wav_file)
+res = model.generate(input=[speech], batch_size_s=300, is_final=True)
+'''
--
Gitblit v1.9.1