仁迷
2023-02-09 fdf74bb85cfe3dd0ce6cbaf51ec8d5b3ca3d2039
egs/aishell2/data2vec_pretrain/conf/train_pretrain_transformer.yaml
@@ -63,3 +63,17 @@
# Learning-rate scheduler selection and its settings.
scheduler: tri_stage
scheduler_conf:
    # Three ratios that sum to 1.0; presumably the share of training spent in
    # each of the scheduler's three stages -- TODO confirm against the
    # tri_stage scheduler implementation.
    phase_ratio: [0.03, 0.9, 0.07]
# Dataset / data-loading settings.
dataset_conf:
    batch_mode: clipping
    # Comma-separated lists kept as single strings; both lists have the same
    # number of entries (presumably paired by position -- confirm in loader).
    data_names: 'speech,none'
    data_types: 'kaldi_ark,none'
    shuffle: true
    shuffle_conf:
        shuffle_size: 12800
        sort_size: 12800
    batch_conf:
        # NOTE(review): with batch_type "token", batch_size is presumably a
        # token/frame budget rather than an utterance count -- confirm.
        batch_type: token
        batch_size: 64000
    num_workers: 8