python/FunASR-XL.git

			@@ -6,18 +6,15 @@

			from funasr.models.frontend.abs_frontend import AbsFrontend
			import torch
			from typeguard import check_argument_types
			from typing import Tuple


			class SlidingWindow(AbsFrontend):
			"""Sliding Window.

			Provides a sliding window over a batched continuous raw audio tensor.
			Optionally, provides padding (Currently not implemented).
			Combine this module with a pre-encoder compatible with raw audio data,
			for example Sinc convolutions.

			Known issues:
			Output length is calculated incorrectly if audio shorter than win_length.
			WARNING: trailing values are discarded - padding not implemented yet.
			@@ -33,7 +30,6 @@
			fs=None,
			):
			"""Initialize.

			Args:
			win_length: Length of frame.
			hop_length: Relative starting point of next frame.
			@@ -41,7 +37,6 @@
			padding: Padding (placeholder, currently not implemented).
			fs: Sampling rate (placeholder for compatibility, not used).
			"""
			assert check_argument_types()
			super().__init__()
			self.fs = fs
			self.win_length = win_length
			@@ -53,11 +48,9 @@
			self, input: torch.Tensor, input_lengths: torch.Tensor
			) -> Tuple[torch.Tensor, torch.Tensor]:
			"""Apply a sliding window on the input.

			Args:
			input: Input (B, T, CD) or (B, TC*D), with D=C=1.
			input_lengths: Input lengths within batch.

			Returns:
			Tensor: Output with dimensions (B, T, C, D), with D=win_length.
			Tensor: Output lengths within batch.
			@@ -78,4 +71,4 @@

			def output_size(self) -> int:
			"""Return output length of feature dimension D, i.e. the window length."""
			return self.win_length
			return self.win_length