From 2acef4bdaea588adee3098a057a395937dff4e6a Mon Sep 17 00:00:00 2001
From: 雾聪 <wucong.lyb@alibaba-inc.com>
Date: 星期一, 08 一月 2024 16:51:42 +0800
Subject: [PATCH] json stamp_sents for websocket-server

---
 funasr/datasets/dataset_jsonl.py |    8 +++++---
 1 files changed, 5 insertions(+), 3 deletions(-)

diff --git a/funasr/datasets/dataset_jsonl.py b/funasr/datasets/dataset_jsonl.py
index ec2bf07..543b60e 100644
--- a/funasr/datasets/dataset_jsonl.py
+++ b/funasr/datasets/dataset_jsonl.py
@@ -4,8 +4,8 @@
 import numpy as np
 import kaldiio
 import librosa
-
-
+import torchaudio
+import time
 
 def load_audio(audio_path: str, fs: int=16000):
 	audio = None
@@ -17,7 +17,9 @@
 		if ".ark:" in audio_path:
 			audio = kaldiio.load_mat(audio_path)
 		else:
-			audio, fs = librosa.load(audio_path, sr=fs)
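+			# audio, fs = librosa.load(audio_path, sr=fs)  # NOTE(review): librosa resampled to `fs`; torchaudio.load below keeps the file's native rate and returns a torch.Tensor -- confirm callers expect this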
+			audio, fs = torchaudio.load(audio_path)
+			audio = audio[0, :]
 	return audio
 
 def extract_features(data, date_type: str="sound", frontend=None):

--
Gitblit v1.9.1