liugz18
2024-07-18 d80ac2fd2df4e7fb8a28acfa512bb11472b5cc99
examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml
@@ -28,7 +28,7 @@
  downsample_rate: 2
  llm_dim: 4096
  encoder_dim: 1280
  n_layer: 2
  n_layer: 0
# frontend related
frontend: WhisperFrontend
@@ -69,7 +69,7 @@
  batch_size_scale_ratio_max: 2
  num_workers: 4
  audio_adaptor_downsample_rate: ${audio_adaptor_conf.downsample_rate}
  audio_encoder_downsample_rate: 2
  audio_encoder_downsample_rate: 4
  data_split_num: 512
  batch_size_sample_max: 15
  retry: 20