python/FunASR-XL.git

			@@ -27,7 +27,6 @@
			from funasr.utils.types import str2triple_str
			from funasr.utils.types import str_or_none


			class Speech2Diarization:
			"""Speech2Diarization class

			@@ -121,7 +120,7 @@
			Currently, the tags of espnet_model_zoo are supported.

			Returns:
			Speech2Xvector: Speech2Xvector instance.
			Speech2Diarization: Speech2Diarization instance.

			"""
			if model_tag is not None:
			@@ -179,7 +178,6 @@
			diar_model_file=diar_model_file,
			device=device,
			dtype=dtype,
			streaming=streaming,
			)
			logging.info("speech2diarization_kwargs: {}".format(speech2diar_kwargs))
			speech2diar = Speech2Diarization.from_pretrained(
			@@ -209,7 +207,7 @@
			if data_path_and_name_and_type is None and raw_inputs is not None:
			if isinstance(raw_inputs, torch.Tensor):
			raw_inputs = raw_inputs.numpy()
			data_path_and_name_and_type = [raw_inputs, "speech", "waveform"]
			data_path_and_name_and_type = [raw_inputs[0], "speech", "bytes"]
			loader = EENDOLADiarTask.build_streaming_iterator(
			data_path_and_name_and_type,
			dtype=dtype,
			@@ -229,6 +227,8 @@
			output_writer = open("{}/result.txt".format(output_path), "w")
			result_list = []
			for keys, batch in loader:
			logger.info("keys: {}".format(keys))
			logger.info("batch: {}".format(batch))
			assert isinstance(batch, dict), type(batch)
			assert all(isinstance(s, str) for s in keys), keys
			_bs = len(next(iter(batch.values())))