From 68f0603b10d13b8b8e6e090324c7e24e009df90b Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: 星期二, 12 三月 2024 09:23:04 +0800
Subject: [PATCH] Dev gzf (#1475)

---
 .github/ISSUE_TEMPLATE/ask_questions.md                                    |    4 ++++
 .github/ISSUE_TEMPLATE/bug_report.md                                       |    3 +++
 examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml |   18 +++++++++---------
 funasr/datasets/audio_datasets/index_ds.py                                 |    3 ++-
 4 files changed, 18 insertions(+), 10 deletions(-)

diff --git a/.github/ISSUE_TEMPLATE/ask_questions.md b/.github/ISSUE_TEMPLATE/ask_questions.md
index 23a5a7f..4716faa 100644
--- a/.github/ISSUE_TEMPLATE/ask_questions.md
+++ b/.github/ISSUE_TEMPLATE/ask_questions.md
@@ -4,8 +4,12 @@
 labels: 'question, needs triage'
 ---
 
+Notice: In order to resolve issues more efficiently, please raise issue following the template.
+（注意：为了更加高效率解决您遇到的问题，请按照模板提问，补充细节）
+
 ## ❓ Questions and Help
 
+
 ### Before asking:
 1. search the issues.
 2. search the docs.
diff --git a/.github/ISSUE_TEMPLATE/bug_report.md b/.github/ISSUE_TEMPLATE/bug_report.md
index 82ba025..80b0317 100644
--- a/.github/ISSUE_TEMPLATE/bug_report.md
+++ b/.github/ISSUE_TEMPLATE/bug_report.md
@@ -4,6 +4,9 @@
 labels: 'bug, needs triage'
 ---
 
+Notice: In order to resolve issues more efficiently, please raise issue following the template.
+（注意：为了更加高效率解决您遇到的问题，请按照模板提问，补充细节）
+
 ## 🐛 Bug
 
 <!-- A clear and concise description of what the bug is. -->
diff --git a/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml b/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml
index 4603f80..fb00b12 100644
--- a/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml
+++ b/examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear.yaml
@@ -12,17 +12,16 @@
     length_normalized_loss: true
 
 # encoder
-audio_encoder: iic/Whisper-large-v2 #iic/Whisper-large-v3
+audio_encoder: "/nfs/zhifu.gzf/init_model/Whisper-large-v3" #iic/Whisper-large-v3
 audio_encoder_conf:
     hub: ms
     freeze: true
-    init_param_path: "/nfs/maziyang.mzy/models/vicuna-7b-v1.5"
 
-llm: Vicuna
+llm: Qwen1.5-7b-chat
 llm_conf:
   hub: hf
   freeze: true
-  init_param_path: "/nfs/maziyang.mzy/models/vicuna-7b-v1.5"
+  init_param_path: "/nfs/zhifu.gzf/init_model/qwen/Qwen1___5-7B-Chat"
 
 audio_adaptor: Linear
 audio_adaptor_conf:
@@ -34,7 +33,7 @@
 frontend: WhisperFrontend
 frontend_conf:
     fs: 16000
-    whisper_model: large-v2
+    whisper_model: large-v3
     do_pad_trim: true
     permute: true # true: [bs, frames, dims]; false: [bs, dims, frames]
 
@@ -66,8 +65,9 @@
 optim: adamw
 optim_conf:
    lr: 0.0001
-   weight_decay: 0.000001
-scheduler: warmuplr
+   weight_decay: 0.000000
+
+scheduler: custom_lambdalr
 scheduler_conf:
    warmup_steps: 1000
 
@@ -83,12 +83,12 @@
     preprocessor_text: TextPreprocessRemovePunctuation
     audio_adaptor_downsample_rate: ${audio_adaptor_conf.downsample_rate}
     audio_encoder_downsample_rate: 2
-    prompt: "<|startoftranscription|><|zh|><|transcribe|><|zh|><|notimestamps|><|wo_itn|>"
+#    prompt: "<|startoftranscription|><|zh|><|transcribe|><|zh|><|notimestamps|><|wo_itn|>"
 
 
 
 tokenizer: HuggingfaceTokenizer
 tokenizer_conf:
   unk_symbol: <unk>
-  init_param_path: "/nfs/maziyang.mzy/models/vicuna-7b-v1.5"
+  init_param_path: "/nfs/zhifu.gzf/init_model/qwen/Qwen1___5-7B-Chat"
 
diff --git a/funasr/datasets/audio_datasets/index_ds.py b/funasr/datasets/audio_datasets/index_ds.py
index 12ffd23..34f7b4f 100644
--- a/funasr/datasets/audio_datasets/index_ds.py
+++ b/funasr/datasets/audio_datasets/index_ds.py
@@ -99,7 +99,8 @@
                     target = data["target"]
                     source_len = data.get("source_len", 1)
                     target_len = data.get("target_len", 0)
-                    
+                    if "aishell" in source:
+                        target = target.replace(" ", "")
                     contents.append({"source": source,
                                      "prompt": prompt,
                                      "target": target,

--
Gitblit v1.9.1