From 2acef4bdaea588adee3098a057a395937dff4e6a Mon Sep 17 00:00:00 2001 From: 雾聪 <wucong.lyb@alibaba-inc.com> Date: 星期一, 08 一月 2024 16:51:42 +0800 Subject: [PATCH] json stamp_sents for websocket-server --- funasr/datasets/dataset_jsonl.py | 8 +++++--- 1 files changed, 5 insertions(+), 3 deletions(-) diff --git a/funasr/datasets/dataset_jsonl.py b/funasr/datasets/dataset_jsonl.py index ec2bf07..543b60e 100644 --- a/funasr/datasets/dataset_jsonl.py +++ b/funasr/datasets/dataset_jsonl.py @@ -4,8 +4,8 @@ import numpy as np import kaldiio import librosa - - +import torchaudio +import time def load_audio(audio_path: str, fs: int=16000): audio = None @@ -17,7 +17,9 @@ if ".ark:" in audio_path: audio = kaldiio.load_mat(audio_path) else: - audio, fs = librosa.load(audio_path, sr=fs) + # audio, fs = librosa.load(audio_path, sr=fs) + audio, fs = torchaudio.load(audio_path) + audio = audio[0, :] return audio def extract_features(data, date_type: str="sound", frontend=None): -- Gitblit v1.9.1