python/FunASR-XL.git

			@@ -73,8 +73,8 @@
			seg_dict = load_seg_dict(args.seg_dict_file)
			if hasattr(args, "punc_dict_file") and args.punc_dict_file is not None:
			punc_dict = read_symbol_table(args.punc_dict_file)
			- if hasattr(args, "bpemodel_file") and args.bpemodel_file is not None:
			- bpe_tokenizer = SentencepiecesTokenizer(args.bpemodel_file)
			+ if hasattr(args, "bpemodel") and args.bpemodel is not None:
			+ bpe_tokenizer = SentencepiecesTokenizer(args.bpemodel)
			self.dataset_conf = args.dataset_conf
			self.frontend_conf = args.frontend_conf
			logging.info("dataloader config: {}".format(self.dataset_conf))

			@@ -46,10 +46,8 @@
			text = data["text"]
			token = []
			vad = -2

			if bpe_tokenizer is not None:
			- text = bpe_tokenizer.text2tokens(text)

			+ text = bpe_tokenizer.text2tokens(" ".join(text))
			if seg_dict is not None:
			assert isinstance(seg_dict, dict)
			text = seg_tokenize(text, seg_dict)

			@@ -506,9 +506,9 @@
			)

			self.conv = torch.nn.Sequential(
			- torch.nn.Conv2d(1, conv_size, 3, 2),
			+ torch.nn.Conv2d(1, conv_size, 3, 2, [1,0]),
			torch.nn.ReLU(),
			- torch.nn.Conv2d(conv_size, conv_size, kernel_2, stride_2),
			+ torch.nn.Conv2d(conv_size, conv_size, kernel_2, stride_2, [(kernel_2-1)//2, 0]),
			torch.nn.ReLU(),
			)

			@@ -597,7 +597,7 @@
			mask: Mask of output sequences. (B, sub(T))
			"""
			if self.subsampling_factor > 1:
			- return mask[:, :-2:2][:, : -(self.kernel_2 - 1) : self.stride_2]
			+ return mask[:, ::2][:, ::self.stride_2]
			else:
			return mask

	funasr/datasets/large_datasets/build_dataloader.py	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	funasr/datasets/large_datasets/utils/tokenize.py	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	funasr/modules/subsampling.py	6 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史