# Source path: egs/callhome/diarization/sond/sond.yaml
# Excerpt recovered from diff hunk "@@ -2660,13 +2660,14 @@". The original
# line breaks and indentation were lost, so the layout below is reconstructed.
# NOTE(review): these keys may sit under a parent mapping that is not visible
# in this excerpt; confirm the nesting level against the full file.
lsm_weight: 0.1
length_normalized_loss: true
max_spk_num: 16
# NOTE(review): "normlize_speech_speaker" looks like a misspelling of the key
# on the following line. Both spellings are kept so that whichever name the
# consumer reads still resolves; remove the misspelled one only after
# confirming the consumer uses the corrected name.
normlize_speech_speaker: true
normalize_speech_speaker: true

# speech encoder
encoder: resnet34_sp_l2reg
# NOTE(review): the keys below are assumed to be children of encoder_conf,
# since encoder_conf has no inline value; verify against the full file.
encoder_conf:
  # pass by model, equal to feature dim
  # input_size: 80
  pooling_type: "window_shift"
  batchnorm_momentum: 0.01
  pool_size: 20
  stride: 1
  tf2torch_tensor_name_prefix_torch: encoder