zhaomingwork
2023-05-19 b63e73ae4f5df9d4ed9fb0bee12ac2cc09d7f523
egs/callhome/diarization/sond/sond.yaml
@@ -2660,13 +2660,14 @@
    # Entries of a mapping whose parent key lies above this excerpt.
    # NOTE(review): presumably the label-smoothing weight -- confirm against
    # the consumer of this config.
    lsm_weight: 0.1
    length_normalized_loss: true
    # NOTE(review): presumably the maximum number of speakers -- confirm.
    max_spk_num: 16
    # NOTE(review): the next two keys differ only in spelling ("normlize" vs
    # "normalize"). Confirm which spelling the consumer actually reads; the
    # other one is likely a leftover and may be ignored or rejected.
    normlize_speech_speaker: true
    normalize_speech_speaker: true
# Speech encoder selection (`encoder`) and its options (`encoder_conf`).
encoder: resnet34_sp_l2reg
encoder_conf:
    # input_size is intentionally left commented out: it is passed in by the
    # model and equals the feature dimension.
    # input_size: 80
    pooling_type: "window_shift"
    batchnorm_momentum: 0.01
    # NOTE(review): pool_size and stride presumably parameterize the
    # "window_shift" pooling above -- confirm against the encoder code.
    pool_size: 20
    stride: 1
    # NOTE(review): presumably the PyTorch-side parameter-name prefix used
    # when mapping TensorFlow weights to this encoder -- confirm.
    tf2torch_tensor_name_prefix_torch: encoder