From a0d77813ac2221fb2b5b845cce29317c9bc0beea Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Fri, 12 Jan 2024 12:04:08 +0800
Subject: [PATCH] funasr1.0 streaming demo

---
 funasr/bin/inference.py |    6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/funasr/bin/inference.py b/funasr/bin/inference.py
index cf29d91..7d9c1b9 100644
--- a/funasr/bin/inference.py
+++ b/funasr/bin/inference.py
@@ -137,6 +137,9 @@
             if spk_mode not in ["default", "vad_segment", "punc_segment"]:
                 logging.error("spk_mode should be one of default, vad_segment and punc_segment.")
             self.spk_mode = spk_mode
+            self.preset_spk_num = kwargs.get("preset_spk_num", None)
+            if self.preset_spk_num:
+                logging.warning("Using preset speaker number: {}".format(self.preset_spk_num))
             logging.warning("Many to print when using speaker model...")
             
         self.kwargs = kwargs
@@ -147,6 +150,7 @@
         self.punc_kwargs = punc_kwargs
         self.spk_model = spk_model
         self.spk_kwargs = spk_kwargs
+        self.model_path = kwargs["model_path"]
   
         
     def build_model(self, **kwargs):
@@ -397,7 +401,7 @@
             if self.spk_model is not None:
                 all_segments = sorted(all_segments, key=lambda x: x[0])
                 spk_embedding = result['spk_embedding']
-                labels = self.cb_model(spk_embedding)
+                labels = self.cb_model(spk_embedding, oracle_num=self.preset_spk_num)
                 del result['spk_embedding']
                 sv_output = postprocess(all_segments, None, labels, spk_embedding)
                 if self.spk_mode == 'vad_segment':

--
Gitblit v1.9.1