VirtuosoQ
2024-04-26 e9d2cfc3a134b00f4e98271fbee3838d1ccecbcc
funasr/models/sense_voice/whisper_lib/audio.py
@@ -89,7 +89,7 @@
@lru_cache(maxsize=None)
def mel_filters(device, n_mels: int) -> torch.Tensor:
def mel_filters(device, n_mels: int, filters_path: str=None) -> torch.Tensor:
    """
    load the mel filterbank matrix for projecting STFT into a Mel spectrogram.
    Allows decoupling librosa dependency; saved using:
@@ -101,8 +101,8 @@
        )
    """
    assert n_mels in {80, 128}, f"Unsupported n_mels: {n_mels}"
    filters_path = os.path.join(os.path.dirname(__file__), "assets", "mel_filters.npz")
    if filters_path is None:
        filters_path = os.path.join(os.path.dirname(__file__), "assets", "mel_filters.npz")
    with np.load(filters_path, allow_pickle=False) as f:
        return torch.from_numpy(f[f"mel_{n_mels}"]).to(device)