From 68f0603b10d13b8b8e6e090324c7e24e009df90b Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: Tue, 12 Mar 2024 09:23:04 +0800
Subject: [PATCH] Dev gzf (#1475)

---
 examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml |   18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml b/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml
index 4603f80..fb00b12 100644
--- a/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml
+++ b/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml
@@ -12,17 +12,16 @@
     length_normalized_loss: true
 
 # encoder
-audio_encoder: iic/Whisper-large-v2 #iic/Whisper-large-v3
+audio_encoder: "/nfs/zhifu.gzf/init_model/Whisper-large-v3" #iic/Whisper-large-v3
 audio_encoder_conf:
     hub: ms
     freeze: true
-    init_param_path: "/nfs/maziyang.mzy/models/vicuna-7b-v1.5"
 
-llm: Vicuna
+llm: Qwen1.5-7b-chat
 llm_conf:
   hub: hf
   freeze: true
-  init_param_path: "/nfs/maziyang.mzy/models/vicuna-7b-v1.5"
+  init_param_path: "/nfs/zhifu.gzf/init_model/qwen/Qwen1___5-7B-Chat"
 
 audio_adaptor: Linear
 audio_adaptor_conf:
@@ -34,7 +33,7 @@
 frontend: WhisperFrontend
 frontend_conf:
     fs: 16000
-    whisper_model: large-v2
+    whisper_model: large-v3
     do_pad_trim: true
     permute: true # true: [bs, frames, dims]; false: [bs, dims, frames]
 
@@ -66,8 +65,9 @@
 optim: adamw
 optim_conf:
    lr: 0.0001
-   weight_decay: 0.000001
-scheduler: warmuplr
+   weight_decay: 0.000000
+
+scheduler: custom_lambdalr
 scheduler_conf:
    warmup_steps: 1000
 
@@ -83,12 +83,12 @@
     preprocessor_text: TextPreprocessRemovePunctuation
     audio_adaptor_downsample_rate: ${audio_adaptor_conf.downsample_rate}
     audio_encoder_downsample_rate: 2
-    prompt: "<|startoftranscription|><|zh|><|transcribe|><|zh|><|notimestamps|><|wo_itn|>"
+#    prompt: "<|startoftranscription|><|zh|><|transcribe|><|zh|><|notimestamps|><|wo_itn|>"
 
 
 
 tokenizer: HuggingfaceTokenizer
 tokenizer_conf:
   unk_symbol: <unk>
-  init_param_path: "/nfs/maziyang.mzy/models/vicuna-7b-v1.5"
+  init_param_path: "/nfs/zhifu.gzf/init_model/qwen/Qwen1___5-7B-Chat"
 

--
Gitblit v1.9.1