From 8b0fb74bded1f8a162e6c0e94c3522be6216ea03 Mon Sep 17 00:00:00 2001
From: chengligen <101448376+chengligen@users.noreply.github.com>
Date: Mon, 26 May 2025 14:11:33 +0800
Subject: [PATCH] feat: add 'words' key aligned with timestamps in sensevoice model output (#2531)

---
 runtime/onnxruntime/src/audio.cpp |    3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/runtime/onnxruntime/src/audio.cpp b/runtime/onnxruntime/src/audio.cpp
index a5a44ca..22a9ecd 100644
--- a/runtime/onnxruntime/src/audio.cpp
+++ b/runtime/onnxruntime/src/audio.cpp
@@ -1061,8 +1061,9 @@
     #ifdef USE_GPU
         max_batch = batch_size;
     #endif
+    max_batch = std::min(max_batch, (int)frame_queue.size());
 
-    for(int idx=0; idx < std::min(max_batch, (int)frame_queue.size()); idx++){
+    for(int idx=0; idx < max_batch; idx++){
         AudioFrame *frame = frame_queue.front();
         int length = frame->GetLen();
         if(length >= max_sent){

--
Gitblit v1.9.1