python/FunASR-XL.git

			@@ -46,7 +46,7 @@

			Examples:
			>>> import soundfile
			>>> speech2text = Speech2Text("asr_config.yml", "asr.pth")
			>>> speech2text = Speech2Text("asr_config.yml", "asr.pb")
			>>> audio, rate = soundfile.read("speech.wav")
			>>> speech2text(audio)
			[(text, token, token_int, hypothesis object), ...]
			@@ -398,6 +398,19 @@
			else:
			device = "cpu"

			if param_dict is not None and "decoding_model" in param_dict:
			if param_dict["decoding_model"] == "fast":
			decoding_ind = 0
			decoding_mode = "model1"
			elif param_dict["decoding_model"] == "normal":
			decoding_ind = 0
			decoding_mode = "model2"
			elif param_dict["decoding_model"] == "offline":
			decoding_ind = 1
			decoding_mode = "model2"
			else:
			raise NotImplementedError("unsupported decoding model {}".format(param_dict["decoding_model"]))

			# 1. Set random-seed
			set_all_random_seed(seed)

			@@ -433,6 +446,7 @@
			output_dir_v2: Optional[str] = None,
			fs: dict = None,
			param_dict: dict = None,
			**kwargs,
			):
			# 3. Build data-iterator
			if data_path_and_name_and_type is None and raw_inputs is not None: