| | |
| | | decoder_attention_chunk_type2: chunk |
| | | loss_weight_model1: 0.5 |
| | | |
| | | |
| | | # encoder |
| | | encoder: SANMEncoderChunkOpt |
| | | encoder_conf: |
| | |
| | | kernel_size: 11 |
| | | sanm_shfit: 0 |
| | | selfattention_layer_type: sanm |
| | | chunk_size: [20, 60] |
| | | stride: [10, 40] |
| | | pad_left: [5, 10] |
| | | encoder_att_look_back_factor: [0, 0] |
| | | decoder_att_look_back_factor: [0, 0] |
| | | chunk_size: |
| | | - 20 |
| | | - 60 |
| | | stride: |
| | | - 10 |
| | | - 40 |
| | | pad_left: |
| | | - 5 |
| | | - 10 |
| | | encoder_att_look_back_factor: |
| | | - 0 |
| | | - 0 |
| | | decoder_att_look_back_factor: |
| | | - 0 |
| | | - 0 |
| | | |
| | | # decoder |
| | | decoder: FsmnDecoderSCAMAOpt |
| | |
| | | kernel_size: 11 |
| | | concat_embeds: true |
| | | |
| | | # predictor |
| | | predictor: CifPredictorV2 |
| | | predictor_conf: |
| | | idim: 320 |
| | |
| | | l_order: 1 |
| | | r_order: 1 |
| | | |
| | | |
| | | # encoder2 |
| | | encoder2: SANMEncoderChunkOpt |
| | | encoder2_conf: |
| | | output_size: 320 |
| | |
| | | kernel_size: 21 |
| | | sanm_shfit: 0 |
| | | selfattention_layer_type: sanm |
| | | chunk_size: [45, 70] |
| | | stride: [35, 50] |
| | | pad_left: [5, 10] |
| | | encoder_att_look_back_factor: [0, 0] |
| | | decoder_att_look_back_factor: [0, 0] |
| | | chunk_size: |
| | | - 45 |
| | | - 70 |
| | | stride: |
| | | - 35 |
| | | - 50 |
| | | pad_left: |
| | | - 5 |
| | | - 10 |
| | | encoder_att_look_back_factor: |
| | | - 0 |
| | | - 0 |
| | | decoder_att_look_back_factor: |
| | | - 0 |
| | | - 0 |
| | | |
| | | # decoder2 |
| | | decoder2: FsmnDecoderSCAMAOpt |
| | | decoder2_conf: |
| | | attention_dim: 320 |
| | |
| | | stride_conv_conf: |
| | | kernel_size: 2 |
| | | stride: 2 |
| | | pad: [0, 1] |
| | | pad: |
| | | - 0 |
| | | - 1 |
| | | |
| | | # frontend related |
| | | frontend: WavFrontendOnline |
| | | frontend: WavFrontend |
| | | frontend_conf: |
| | | fs: 16000 |
| | | window: hamming |
| | |
| | | frame_shift: 10 |
| | | lfr_m: 7 |
| | | lfr_n: 6 |
| | | dither: 0.0 |
| | | |
| | | specaug: SpecAugLFR |
| | | specaug_conf: |