From 7458e39ff0756d0bae38b139e0e534e61e1fa0cf Mon Sep 17 00:00:00 2001
From: shixian.shi <shixian.shi@alibaba-inc.com>
Date: Wed, 17 Jan 2024 19:21:08 +0800
Subject: [PATCH] bug fix: cast sampler batch_size to int and shuffle only when is_training
---
funasr/datasets/audio_datasets/samplers.py | 5 +++--
1 file changed, 3 insertions(+), 2 deletions(-)
diff --git a/funasr/datasets/audio_datasets/samplers.py b/funasr/datasets/audio_datasets/samplers.py
index bc71b28..e170c68 100644
--- a/funasr/datasets/audio_datasets/samplers.py
+++ b/funasr/datasets/audio_datasets/samplers.py
@@ -13,6 +13,7 @@
buffer_size: int = 30,
drop_last: bool = False,
shuffle: bool = True,
+ is_training: bool = True,
**kwargs):
self.drop_last = drop_last
@@ -20,11 +21,11 @@
self.dataset = dataset
self.total_samples = len(dataset)
self.batch_type = batch_type
- self.batch_size = batch_size
+ self.batch_size = int(batch_size)
self.buffer_size = buffer_size
self.max_token_length = kwargs.get("max_token_length", 5000)
self.shuffle_idx = np.arange(self.total_samples)
- self.shuffle = shuffle
+ self.shuffle = shuffle and is_training
def __len__(self):
return self.total_samples
--
Gitblit v1.9.1