From 3a4281f4959534b1bf5d01acf0085f4f8e6f2ec8 Mon Sep 17 00:00:00 2001
From: wuhongsheng <664116298@qq.com>
Date: 星期五, 05 七月 2024 00:55:32 +0800
Subject: [PATCH] 优化speakid和语句匹配逻辑,部分解决speakid不从0递增问题 (#1870)
---
examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml | 4 ++--
1 files changed, 2 insertions(+), 2 deletions(-)
diff --git a/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml b/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml
index c2f6419..48bd0cf 100644
--- a/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml
+++ b/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml
@@ -28,7 +28,7 @@
downsample_rate: 2
llm_dim: 4096
encoder_dim: 1280
- n_layer: 2
+ n_layer: 0
# frontend related
frontend: WhisperFrontend
@@ -69,7 +69,7 @@
batch_size_scale_ratio_max: 2
num_workers: 4
audio_adaptor_downsample_rate: ${audio_adaptor_conf.downsample_rate}
- audio_encoder_downsample_rate: 2
+ audio_encoder_downsample_rate: 4
data_split_num: 512
batch_size_sample_max: 15
retry: 20
--
Gitblit v1.9.1