From 3a4281f4959534b1bf5d01acf0085f4f8e6f2ec8 Mon Sep 17 00:00:00 2001 From: wuhongsheng <664116298@qq.com> Date: 星期五, 05 七月 2024 00:55:32 +0800 Subject: [PATCH] 优化speakid和语句匹配逻辑,部分解决speakid不从0递增问题 (#1870) --- examples/industrial_data_pretraining/qwen_audio/demo_from_local.py | 12 ++++++++---- 1 files changed, 8 insertions(+), 4 deletions(-) diff --git a/examples/industrial_data_pretraining/qwen_audio/demo_from_local.py b/examples/industrial_data_pretraining/qwen_audio/demo_from_local.py index 54ae1f0..5ade205 100644 --- a/examples/industrial_data_pretraining/qwen_audio/demo_from_local.py +++ b/examples/industrial_data_pretraining/qwen_audio/demo_from_local.py @@ -7,9 +7,13 @@ from funasr import AutoModel -model = AutoModel(model="Qwen-Audio", - model_path="/nfs/zhifu.gzf/init_model/qwen/Qwen-Audio", - ) +model = AutoModel( + model="Qwen-Audio", + model_path="/nfs/zhifu.gzf/init_model/qwen/Qwen-Audio", +) -res = model.generate(input="https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_audio/asr_example_zh.wav", language=None) +audio_in = "https://github.com/QwenLM/Qwen-Audio/raw/main/assets/audio/1272-128104-0000.flac" +prompt = "<|startoftranscription|><|en|><|transcribe|><|en|><|notimestamps|><|wo_itn|>" + +res = model.generate(input=audio_in, prompt=prompt) print(res) -- Gitblit v1.9.1