python/FunASR-XL.git

			@@ -6,7 +6,6 @@
			# tables.print()

			# network architecture
			# NOTE(review): the hunk header above declares 7 old lines vs 6 new, so one
			# line of this stanza was deleted by the change — presumably the
			# commented-out fully-qualified model path below; confirm.
			# model: funasr.models.paraformer.model:Paraformer
			model: Paraformer
			# NOTE(review): indentation was lost in this fragment; ctc_weight presumably
			# nests under model_conf — confirm against the original file.
			model_conf:
			ctc_weight: 0.0
			@@ -30,7 +29,7 @@
			pos_enc_class: SinusoidalPositionEncoder
			normalize_before: true
			kernel_size: 11
			# NOTE(review): the next two keys differ only in spelling ("shfit" vs
			# "shift"). The hunk header above declares 7 lines on each side while 8
			# follow, so these look like the removed/added pair of a one-line rename
			# whose +/- markers were lost. Presumably the consumer accepts only one
			# spelling — confirm which and drop the other.
			sanm_shfit: 0
			sanm_shift: 0
			selfattention_layer_type: sanm

			# decoder
			@@ -45,7 +44,7 @@
			src_attention_dropout_rate: 0.1
			att_layer_num: 16
			kernel_size: 11
			# NOTE(review): the next two keys differ only in spelling ("shfit" vs
			# "shift"). The hunk header above declares 7 lines on each side while 8
			# follow, so these look like the removed/added pair of a one-line rename
			# whose +/- markers were lost. Presumably the consumer accepts only one
			# spelling — confirm which and drop the other.
			sanm_shfit: 0
			sanm_shift: 0

			# NOTE(review): indentation was lost; the settings for CifPredictorV2
			# presumably nest under predictor_conf, beyond what this fragment shows.
			predictor: CifPredictorV2
			predictor_conf:
			@@ -87,14 +86,8 @@
			accum_grad: 1
			grad_clip: 5
			max_epoch: 150
			# NOTE(review): the hunk header above declares 14 old lines vs 8 new, yet
			# 15 lines follow — i.e. seven lines removed and one added. The seven
			# *_criterion lines below are the likely removals; the +/- markers are
			# gone, so confirm against the original change.
			# NOTE(review): list nesting was flattened. Read at the indentation shown,
			# `- - valid` opens an inner list holding only `valid`, with `acc` and
			# `max` as sibling entries; presumably the intent is a single
			# [valid, acc, max] entry — restore the indentation and confirm.
			val_scheduler_criterion:
			- valid
			- acc
			best_model_criterion:
			- - valid
			- acc
			- max
			keep_nbest_models: 10
			avg_nbest_model: 10
			log_interval: 50

			optim: adam
			@@ -107,7 +100,7 @@
			# Dataset selection and batching options.
			# NOTE(review): indentation was lost in this fragment; the keys after
			# dataset_conf presumably nest under it — confirm against the original file.
			dataset: AudioDataset
			dataset_conf:
			index_ds: IndexDSJsonl
			# batch_sampler was listed twice (DynamicBatchLocalShuffleSampler, then
			# BatchSampler). Duplicate mapping keys are invalid YAML; parsers that
			# tolerate them keep the last one, so only that effective value is kept.
			batch_sampler: BatchSampler
			# batch_type is either "example" or "length".
			batch_type: example
			# If batch_type is example, batch_size is the number of samples; if length,
			# batch_size is source_token_len + target_token_len.
			batch_size: 1
			# Samples with source_token_len + target_token_len > max_token_length are
			# filtered out.
			max_token_length: 2048