From 02f580b86aa395178aaa559a163208d166a19e4a Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: 星期五, 12 一月 2024 00:02:10 +0800
Subject: [PATCH] Merge branch 'funasr1.0' of github.com:alibaba-damo-academy/FunASR into funasr1.0 add
---
funasr/bin/inference.py | 5 ++++-
1 files changed, 4 insertions(+), 1 deletions(-)
diff --git a/funasr/bin/inference.py b/funasr/bin/inference.py
index cf29d91..515170b 100644
--- a/funasr/bin/inference.py
+++ b/funasr/bin/inference.py
@@ -137,6 +137,9 @@
if spk_mode not in ["default", "vad_segment", "punc_segment"]:
logging.error("spk_mode should be one of default, vad_segment and punc_segment.")
self.spk_mode = spk_mode
+ self.preset_spk_num = kwargs.get("preset_spk_num", None)
+ if self.preset_spk_num:
+ logging.warning("Using preset speaker number: {}".format(self.preset_spk_num))
logging.warning("Many to print when using speaker model...")
self.kwargs = kwargs
@@ -397,7 +400,7 @@
if self.spk_model is not None:
all_segments = sorted(all_segments, key=lambda x: x[0])
spk_embedding = result['spk_embedding']
- labels = self.cb_model(spk_embedding)
+ labels = self.cb_model(spk_embedding, oracle_num=self.preset_spk_num)
del result['spk_embedding']
sv_output = postprocess(all_segments, None, labels, spk_embedding)
if self.spk_mode == 'vad_segment':
--
Gitblit v1.9.1