志浩
2023-03-16 2868fe3df4e92a6ae3e327faf6e57ea492e04124
egs/callhome/diarization/sond/sond.yaml
@@ -2660,13 +2660,14 @@
    lsm_weight: 0.1
    length_normalized_loss: true
    max_spk_num: 16
    # NOTE(review): the next two keys differ only by one letter
    # ("normlize" vs "normalize") and carry the same value. The first looks
    # like a misspelling; confirm which spelling the consuming code reads
    # and remove the other so the setting cannot silently diverge.
    normlize_speech_speaker: true
    normalize_speech_speaker: true
# speech encoder
# `encoder` names the speech encoder; its options live in `encoder_conf`.
encoder: resnet34_sp_l2reg
encoder_conf:
    # input_size is passed in by the model and equals the feature dimension,
    # so it is left commented out here.
    # input_size: 80
    pooling_type: "window_shift"
    batchnorm_momentum: 0.01
    # NOTE(review): pool_size and stride presumably parameterize the
    # "window_shift" pooling above; confirm against the encoder code.
    pool_size: 20
    stride: 1
    # NOTE(review): presumably the name prefix used when mapping TensorFlow
    # checkpoint tensors onto the torch encoder parameters; confirm.
    tf2torch_tensor_name_prefix_torch: encoder