python/FunASR-XL.git

			@@ -12,12 +12,10 @@

			class SlidingWindow(AbsFrontend):
			"""Sliding Window.

			Provides a sliding window over a batched continuous raw audio tensor.
			Optionally, provides padding (currently not implemented).
			Combine this module with a pre-encoder compatible with raw audio data,
			for example Sinc convolutions.

			Known issues:
			Output length is calculated incorrectly if the audio is shorter than win_length.
			WARNING: trailing values are discarded - padding not implemented yet.
			@@ -33,7 +31,6 @@
			fs=None,
			):
			"""Initialize.

			Args:
			win_length: Length of frame.
			hop_length: Relative starting point of next frame.
			@@ -53,11 +50,9 @@
			self, input: torch.Tensor, input_lengths: torch.Tensor
			) -> Tuple[torch.Tensor, torch.Tensor]:
			"""Apply a sliding window on the input.

			Args:
			input: Input (B, T, C*D) or (B, T*C*D), with D=C=1.
			input_lengths: Input lengths within batch.

			Returns:
			Tensor: Output with dimensions (B, T, C, D), with D=win_length.
			Tensor: Output lengths within batch.
			@@ -78,4 +73,4 @@

			def output_size(self) -> int:
				"""Return output length of feature dimension D, i.e. the window length.

				Returns:
					int: The value of ``self.win_length``.
				"""
				# A single return suffices; the duplicated trailing return was unreachable.
				return self.win_length