From ae3e2567602546e66c0f358463617e560fc70e20 Mon Sep 17 00:00:00 2001
From: lyblsgo <lyblsgo@163.com>
Date: 星期四, 20 四月 2023 14:50:55 +0800
Subject: [PATCH] add offline vad for onnxruntime
---
funasr/runtime/onnxruntime/src/libfunasrapi.cpp | 33 +++++++++++++++++++--------------
1 files changed, 19 insertions(+), 14 deletions(-)
diff --git a/funasr/runtime/onnxruntime/src/libfunasrapi.cpp b/funasr/runtime/onnxruntime/src/libfunasrapi.cpp
index a4780b2..f15e86f 100644
--- a/funasr/runtime/onnxruntime/src/libfunasrapi.cpp
+++ b/funasr/runtime/onnxruntime/src/libfunasrapi.cpp
@@ -4,14 +4,14 @@
extern "C" {
#endif
- // APIs for qmasr
- _FUNASRAPI FUNASR_HANDLE FunASRInit(const char* szModelDir, int nThreadNum, bool quantize)
+ // APIs for funasr
+ _FUNASRAPI FUNASR_HANDLE FunASRInit(const char* szModelDir, int nThreadNum, bool quantize, bool use_vad)
{
- Model* mm = create_model(szModelDir, nThreadNum, quantize);
+ Model* mm = create_model(szModelDir, nThreadNum, quantize, use_vad);
return mm;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
@@ -21,7 +21,9 @@
Audio audio(1);
if (!audio.loadwav(szBuf, nLen, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -31,7 +33,6 @@
int nStep = 0;
int nTotal = audio.get_queue_size();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg += msg;
nStep++;
@@ -42,7 +43,7 @@
return pResult;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogPCMBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, int sampling_rate, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogPCMBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, int sampling_rate, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
@@ -51,7 +52,9 @@
Audio audio(1);
if (!audio.loadpcmwav(szBuf, nLen, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -61,7 +64,6 @@
int nStep = 0;
int nTotal = audio.get_queue_size();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg += msg;
nStep++;
@@ -72,7 +74,7 @@
return pResult;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogPCMFile(FUNASR_HANDLE handle, const char* szFileName, int sampling_rate, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogPCMFile(FUNASR_HANDLE handle, const char* szFileName, int sampling_rate, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
@@ -81,7 +83,9 @@
Audio audio(1);
if (!audio.loadpcmwav(szFileName, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -91,7 +95,6 @@
int nStep = 0;
int nTotal = audio.get_queue_size();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg += msg;
nStep++;
@@ -102,7 +105,7 @@
return pResult;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogFile(FUNASR_HANDLE handle, const char* szWavfile, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogFile(FUNASR_HANDLE handle, const char* szWavfile, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
@@ -112,7 +115,9 @@
Audio audio(1);
if(!audio.loadwav(szWavfile, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
--
Gitblit v1.9.1