From 3a4281f4959534b1bf5d01acf0085f4f8e6f2ec8 Mon Sep 17 00:00:00 2001
From: wuhongsheng <664116298@qq.com>
Date: 星期五, 05 七月 2024 00:55:32 +0800
Subject: [PATCH] 优化speakid和语句匹配逻辑,部分解决speakid不从0递增问题 (#1870)

---
 examples/industrial_data_pretraining/qwen_audio/demo.py |    9 +++++----
 1 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/examples/industrial_data_pretraining/qwen_audio/demo.py b/examples/industrial_data_pretraining/qwen_audio/demo.py
index 5c1e2a0..04a8e58 100644
--- a/examples/industrial_data_pretraining/qwen_audio/demo.py
+++ b/examples/industrial_data_pretraining/qwen_audio/demo.py
@@ -7,9 +7,10 @@
 
 from funasr import AutoModel
 
-model = AutoModel(model="Qwen/Qwen-Audio",
-                  model_path=None,
-                  )
+model = AutoModel(model="Qwen-Audio")
 
-res = model.generate(input="https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_audio/asr_example_zh.wav", language=None)
+audio_in = "https://github.com/QwenLM/Qwen-Audio/raw/main/assets/audio/1272-128104-0000.flac"
+prompt = "<|startoftranscription|><|en|><|transcribe|><|en|><|notimestamps|><|wo_itn|>"
+
+res = model.generate(input=audio_in, prompt=prompt)
 print(res)
-- 
Gitblit v1.9.1