From 82e5ca37a8bd80f56c99f9d790a03b458ced716b Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Tue, 25 Feb 2025 14:28:34 +0800
Subject: [PATCH] Large-Scale Data Training
---
examples/industrial_data_pretraining/llm_asr/conf/whisper_vicuna_linear.yaml | 5 +++--
1 file changed, 3 insertions(+), 2 deletions(-)
diff --git a/examples/industrial_data_pretraining/llm_asr/conf/whisper_vicuna_linear.yaml b/examples/industrial_data_pretraining/llm_asr/conf/whisper_vicuna_linear.yaml
index 331ac0d..f4f8c01 100644
--- a/examples/industrial_data_pretraining/llm_asr/conf/whisper_vicuna_linear.yaml
+++ b/examples/industrial_data_pretraining/llm_asr/conf/whisper_vicuna_linear.yaml
@@ -65,10 +65,11 @@
optim: adamw
optim_conf:
lr: 0.0001
- weight_decay: 0.000001
+ weight_decay: 0
+
scheduler: warmuplr
scheduler_conf:
- warmup_steps: 1000
+ warmup_steps: 1500
dataset: AudioLLMVicunaDataset
dataset_conf:
--
Gitblit v1.9.1