From 40d1f80030d38b3377a95ead8837e82c67aa59f6 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Fri, 12 Jan 2024 12:05:08 +0800
Subject: [PATCH] funasr1.0 streaming demo
---
funasr/models/paraformer_streaming/model.py | 8 ++++----
1 file changed, 4 insertions(+), 4 deletions(-)
diff --git a/funasr/models/paraformer_streaming/model.py b/funasr/models/paraformer_streaming/model.py
index fdc0c93..b736aa9 100644
--- a/funasr/models/paraformer_streaming/model.py
+++ b/funasr/models/paraformer_streaming/model.py
@@ -523,7 +523,7 @@
meta_data = {}
chunk_size = kwargs.get("chunk_size", [0, 10, 5])
- chunk_stride_samples = chunk_size[1] * 960 # 600ms
+ chunk_stride_samples = int(chunk_size[1] * 960) # 600ms
time1 = time.perf_counter()
cfg = {"is_final": kwargs.get("is_final", False)}
@@ -532,7 +532,7 @@
audio_fs=kwargs.get("fs", 16000),
data_type=kwargs.get("data_type", "sound"),
tokenizer=tokenizer,
- **cfg,
+ cache=cfg,
)
_is_final = cfg["is_final"] # if data_in is a file or url, set is_final=True
@@ -542,8 +542,8 @@
audio_sample = torch.cat((cache["prev_samples"], audio_sample_list[0]))
- n = len(audio_sample) // chunk_stride_samples + int(_is_final)
- m = len(audio_sample) % chunk_stride_samples * (1-int(_is_final))
+ n = int(len(audio_sample) // chunk_stride_samples + int(_is_final))
+ m = int(len(audio_sample) % chunk_stride_samples * (1-int(_is_final)))
tokens = []
for i in range(n):
kwargs["is_final"] = _is_final and i == n -1
--
Gitblit v1.9.1