From 5b9c073f43dbecc3ae9d771af50a8f52f87931e8 Mon Sep 17 00:00:00 2001
From: 语帆 <yf352572@alibaba-inc.com>
Date: Wed, 28 Feb 2024 15:49:41 +0800
Subject: [PATCH] Remove leftover pdb.set_trace() debug breakpoints from load_utils
---
funasr/utils/load_utils.py | 7 ++-----
1 file changed, 2 insertions(+), 5 deletions(-)
diff --git a/funasr/utils/load_utils.py b/funasr/utils/load_utils.py
index 20fa0fd..8b75cbd 100644
--- a/funasr/utils/load_utils.py
+++ b/funasr/utils/load_utils.py
@@ -38,7 +38,6 @@
if kwargs.get("reduce_channels", True):
data_or_path_or_list = data_or_path_or_list.mean(0)
elif data_type == "text" and tokenizer is not None:
- pdb.set_trace()
data_or_path_or_list = tokenizer.encode(data_or_path_or_list)
elif data_type == "image": # undo
pass
@@ -68,7 +67,7 @@
else:
pass
# print(f"unsupport data type: {data_or_path_or_list}, return raw data")
- pdb.set_trace()
+
if audio_fs != fs and data_type != "text":
resampler = torchaudio.transforms.Resample(audio_fs, fs)
data_or_path_or_list = resampler(data_or_path_or_list[None, :])[0, :]
@@ -109,9 +108,7 @@
data_list.append(data_i)
data_len.append(data_i.shape[0])
data = pad_sequence(data_list, batch_first=True) # data: [batch, N]
- # import pdb;
- # pdb.set_trace()
- # if data_type == "sound":
+
data, data_len = frontend(data, data_len, **kwargs)
if isinstance(data_len, (list, tuple)):
--
Gitblit v1.9.1