北念
2024-07-10 0fe232fd7b41ad24320447d51c07f14d0a807cf3
examples/industrial_data_pretraining/llm_asr/conf/whisper_qwen_linear2.yaml
@@ -28,7 +28,7 @@
  downsample_rate: 2
  llm_dim: 4096
  encoder_dim: 1280
  n_layer: 2
  n_layer: 0
# frontend related
frontend: WhisperFrontend
@@ -69,7 +69,7 @@
  batch_size_scale_ratio_max: 2
  num_workers: 4
  audio_adaptor_downsample_rate: ${audio_adaptor_conf.downsample_rate}
  audio_encoder_downsample_rate: 2
  audio_encoder_downsample_rate: 4
  data_split_num: 512
  batch_size_sample_max: 15
  retry: 20