From 965797ecf087dd71ff6fb3b2bb3c18fdede07db0 Mon Sep 17 00:00:00 2001
From: zhuzizyf <42790740+zhuzizyf@users.noreply.github.com>
Date: Sat, 22 Apr 2023 14:22:17 +0800
Subject: [PATCH] Create OnlineFeature.h
---
funasr/runtime/onnxruntime/src/libfunasrapi.cpp | 46 ++++++++++++++++++++++++++--------------------
1 file changed, 26 insertions(+), 20 deletions(-)
diff --git a/funasr/runtime/onnxruntime/src/libfunasrapi.cpp b/funasr/runtime/onnxruntime/src/libfunasrapi.cpp
index 0d77d20..f15e86f 100644
--- a/funasr/runtime/onnxruntime/src/libfunasrapi.cpp
+++ b/funasr/runtime/onnxruntime/src/libfunasrapi.cpp
@@ -4,23 +4,26 @@
extern "C" {
#endif
- // APIs for qmasr
- _FUNASRAPI FUNASR_HANDLE FunASRInit(const char* szModelDir, int nThreadNum, bool quantize)
+ // APIs for funasr
+ _FUNASRAPI FUNASR_HANDLE FunASRInit(const char* szModelDir, int nThreadNum, bool quantize, bool use_vad)
{
- Model* mm = create_model(szModelDir, nThreadNum, quantize);
+ Model* mm = create_model(szModelDir, nThreadNum, quantize, use_vad);
return mm;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
return nullptr;
+ int32_t sampling_rate = -1;
Audio audio(1);
- if (!audio.loadwav(szBuf, nLen))
+ if (!audio.loadwav(szBuf, nLen, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -30,7 +33,6 @@
int nStep = 0;
int nTotal = audio.get_queue_size();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg += msg;
nStep++;
@@ -41,16 +43,18 @@
return pResult;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogPCMBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogPCMBuffer(FUNASR_HANDLE handle, const char* szBuf, int nLen, int sampling_rate, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
return nullptr;
Audio audio(1);
- if (!audio.loadpcmwav(szBuf, nLen))
+ if (!audio.loadpcmwav(szBuf, nLen, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -60,7 +64,6 @@
int nStep = 0;
int nTotal = audio.get_queue_size();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg += msg;
nStep++;
@@ -71,16 +74,18 @@
return pResult;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogPCMFile(FUNASR_HANDLE handle, const char* szFileName, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogPCMFile(FUNASR_HANDLE handle, const char* szFileName, int sampling_rate, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
return nullptr;
Audio audio(1);
- if (!audio.loadpcmwav(szFileName))
+ if (!audio.loadpcmwav(szFileName, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -90,7 +95,6 @@
int nStep = 0;
int nTotal = audio.get_queue_size();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg += msg;
nStep++;
@@ -101,16 +105,19 @@
return pResult;
}
- _FUNASRAPI FUNASR_RESULT FunASRRecogFile(FUNASR_HANDLE handle, const char* szWavfile, FUNASR_MODE Mode, QM_CALLBACK fnCallback)
+ _FUNASRAPI FUNASR_RESULT FunASRRecogFile(FUNASR_HANDLE handle, const char* szWavfile, FUNASR_MODE Mode, QM_CALLBACK fnCallback, bool use_vad)
{
Model* pRecogObj = (Model*)handle;
if (!pRecogObj)
return nullptr;
-
+
+ int32_t sampling_rate = -1;
Audio audio(1);
- if(!audio.loadwav(szWavfile))
+ if(!audio.loadwav(szWavfile, &sampling_rate))
return nullptr;
- //audio.split();
+ if(use_vad){
+ audio.split(pRecogObj);
+ }
float* buff;
int len;
@@ -120,7 +127,6 @@
FUNASR_RECOG_RESULT* pResult = new FUNASR_RECOG_RESULT;
pResult->snippet_time = audio.get_time_len();
while (audio.fetch(buff, len, flag) > 0) {
- //pRecogObj->reset();
string msg = pRecogObj->forward(buff, len, flag);
pResult->msg+= msg;
nStep++;
--
Gitblit v1.9.1