游雁
2023-06-29 bc723ea200144bd6fa8a5dff4b9a780feda144fc
funasr/runtime/onnxruntime/src/funasrruntime.cpp
@@ -7,73 +7,53 @@
   // APIs for Init
   // Builds an ASR model by forwarding model_path and thread_num to CreateModel and returns
   // the resulting pointer as an opaque FUNASR_HANDLE.
   // NOTE(review): `mm` is declared twice below (an unqualified form and a funasr::-qualified
   // form). This looks like the before/after lines of a diff kept side by side; presumably only
   // the funasr:: line is current — confirm against the repository.
   _FUNASRAPI FUNASR_HANDLE  FunASRInit(std::map<std::string, std::string>& model_path, int thread_num)
   {
      Model* mm = CreateModel(model_path, thread_num);
      funasr::Model* mm = funasr::CreateModel(model_path, thread_num);
      return mm;
   }
   // Builds a VAD model by forwarding model_path and thread_num to CreateVadModel and returns
   // the resulting pointer as an opaque FUNASR_HANDLE.
   // NOTE(review): `mm` is declared twice below (unqualified and funasr::-qualified). This looks
   // like the old and new sides of a diff kept together — confirm which line is current.
   _FUNASRAPI FUNASR_HANDLE  FsmnVadInit(std::map<std::string, std::string>& model_path, int thread_num)
   {
      VadModel* mm = CreateVadModel(model_path, thread_num);
      funasr::VadModel* mm = funasr::CreateVadModel(model_path, thread_num);
      return mm;
   }
   // NOTE(review): two function headers share one body here. The FunPuncInit header pairs with
   // the CreatePuncModel(model_path, thread_num) line, and the FsmnVadOnlineInit header pairs
   // with the funasr::CreateVadModel(fsmnvad_handle) line. This looks like the old and new sides
   // of a diff kept together — confirm which pair is current.
   // FsmnVadOnlineInit: passes an existing VAD handle to funasr::CreateVadModel and returns the
   // resulting pointer as an opaque handle.
   _FUNASRAPI FUNASR_HANDLE  FunPuncInit(std::map<std::string, std::string>& model_path, int thread_num)
   _FUNASRAPI FUNASR_HANDLE  FsmnVadOnlineInit(FUNASR_HANDLE fsmnvad_handle)
   {
      PuncModel* mm = CreatePuncModel(model_path, thread_num);
      funasr::VadModel* mm = funasr::CreateVadModel(fsmnvad_handle);
      return mm;
   }
   _FUNASRAPI FUNASR_HANDLE  CTTransformerInit(std::map<std::string, std::string>& model_path, int thread_num, PUNC_TYPE type)
   {
      funasr::PuncModel* mm = funasr::CreatePuncModel(model_path, thread_num, type);
      return mm;
   }
   // Builds an offline stream by forwarding model_path and thread_num to CreateOfflineStream and
   // returns the resulting pointer as an opaque FUNASR_HANDLE.
   // NOTE(review): `mm` is declared twice below (unqualified and funasr::-qualified). This looks
   // like the old and new sides of a diff kept together — confirm which line is current.
   _FUNASRAPI FUNASR_HANDLE  FunOfflineInit(std::map<std::string, std::string>& model_path, int thread_num)
   {
      OfflineStream* mm = CreateOfflineStream(model_path, thread_num);
      funasr::OfflineStream* mm = funasr::CreateOfflineStream(model_path, thread_num);
      return mm;
   }
   // APIs for ASR Infer
   // Runs ASR over an in-memory audio buffer: the buffer is loaded into an Audio object with
   // LoadWav, every chunk returned by Fetch() is passed to the model's Forward(), and the
   // returned text is appended to the result message.
   // Returns nullptr when the handle is null or the buffer fails to load; otherwise a
   // heap-allocated FUNASR_RECOG_RESULT holding the concatenated text and audio.GetTimeLen().
   // fn_callback, when non-null, is called after each chunk with (chunks processed, queue size).
   // `mode` is not read in the visible body.
   // NOTE(review): two headers and two `recog_obj` declarations appear below, and the local
   // `sampling_rate` collides with the parameter of the second header. This looks like the old
   // and new sides of a diff kept together — confirm which lines are current.
   _FUNASRAPI FUNASR_RESULT FunASRRecogBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   _FUNASRAPI FUNASR_RESULT FunASRInferBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, FUNASR_MODE mode, QM_CALLBACK fn_callback, int sampling_rate)
   {
      Model* recog_obj = (Model*)handle;
      funasr::Model* recog_obj = (funasr::Model*)handle;
      if (!recog_obj)
         return nullptr;
      int32_t sampling_rate = -1;
      Audio audio(1);
      if (!audio.LoadWav(sz_buf, n_len, &sampling_rate))
         return nullptr;
      float* buff;
      int len;
      int flag=0;
      FUNASR_RECOG_RESULT* p_result = new FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      int n_step = 0;
      // Queue size is sampled once, before draining, and used as the progress total.
      int n_total = audio.GetQueueSize();
      while (audio.Fetch(buff, len, flag) > 0) {
         string msg = recog_obj->Forward(buff, len, flag);
         p_result->msg += msg;
         n_step++;
         if (fn_callback)
            fn_callback(n_step, n_total);
      }
      return p_result;
   }
   _FUNASRAPI FUNASR_RESULT FunASRRecogPCMBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, int sampling_rate, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   {
      Model* recog_obj = (Model*)handle;
      if (!recog_obj)
         return nullptr;
      Audio audio(1);
      funasr::Audio audio(1);
      if (!audio.LoadPcmwav(sz_buf, n_len, &sampling_rate))
         return nullptr;
      float* buff;
      int len;
      int flag = 0;
      FUNASR_RECOG_RESULT* p_result = new FUNASR_RECOG_RESULT;
      funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      if(p_result->snippet_time == 0){
            return p_result;
        }
      int n_step = 0;
      int n_total = audio.GetQueueSize();
      while (audio.Fetch(buff, len, flag) > 0) {
@@ -87,23 +67,35 @@
      return p_result;
   }
   _FUNASRAPI FUNASR_RESULT FunASRRecogPCMFile(FUNASR_HANDLE handle, const char* sz_filename, int sampling_rate, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   _FUNASRAPI FUNASR_RESULT FunASRInfer(FUNASR_HANDLE handle, const char* sz_filename, FUNASR_MODE mode, QM_CALLBACK fn_callback, int sampling_rate)
   {
      Model* recog_obj = (Model*)handle;
      funasr::Model* recog_obj = (funasr::Model*)handle;
      if (!recog_obj)
         return nullptr;
      Audio audio(1);
      if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
         return nullptr;
      funasr::Audio audio(1);
      if(funasr::is_target_file(sz_filename, "wav")){
         int32_t sampling_rate_ = -1;
         if(!audio.LoadWav(sz_filename, &sampling_rate_))
            return nullptr;
      }else if(funasr::is_target_file(sz_filename, "pcm")){
         if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
            return nullptr;
      }else{
         LOG(ERROR)<<"Wrong wav extension";
         exit(-1);
      }
      float* buff;
      int len;
      int flag = 0;
      FUNASR_RECOG_RESULT* p_result = new FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      int n_step = 0;
      int n_total = audio.GetQueueSize();
      funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      if(p_result->snippet_time == 0){
            return p_result;
        }
      while (audio.Fetch(buff, len, flag) > 0) {
         string msg = recog_obj->Forward(buff, len, flag);
         p_result->msg += msg;
@@ -112,117 +104,105 @@
            fn_callback(n_step, n_total);
      }
      return p_result;
   }
   _FUNASRAPI FUNASR_RESULT FunASRRecogFile(FUNASR_HANDLE handle, const char* sz_wavfile, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   {
      Model* recog_obj = (Model*)handle;
      if (!recog_obj)
         return nullptr;
      int32_t sampling_rate = -1;
      Audio audio(1);
      if(!audio.LoadWav(sz_wavfile, &sampling_rate))
         return nullptr;
      float* buff;
      int len;
      int flag = 0;
      int n_step = 0;
      int n_total = audio.GetQueueSize();
      FUNASR_RECOG_RESULT* p_result = new FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      while (audio.Fetch(buff, len, flag) > 0) {
         string msg = recog_obj->Forward(buff, len, flag);
         p_result->msg+= msg;
         n_step++;
         if (fn_callback)
            fn_callback(n_step, n_total);
      }
      return p_result;
   }
   // APIs for VAD Infer
   // Runs VAD over audio and returns the detected segments in a heap-allocated
   // FUNASR_VAD_RESULT (snippet_time = audio.GetTimeLen(), segments = copy of what Split() filled).
   // Returns nullptr when the handle is null or the audio fails to load. When the reported
   // duration is 0 the result is returned before Split() is called.
   // fn_callback is not used in the visible body.
   // NOTE(review): two headers, two `vad_obj` / `audio` / `p_result` declarations, two load
   // calls and two Split() calls appear below. This looks like the old (wav file) and new (PCM
   // buffer, with input_finished) sides of a diff kept together — confirm which lines are current.
   _FUNASRAPI FUNASR_RESULT FsmnVadWavFile(FUNASR_HANDLE handle, const char* sz_wavfile, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   _FUNASRAPI FUNASR_RESULT FsmnVadInferBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, QM_CALLBACK fn_callback, bool input_finished, int sampling_rate)
   {
      VadModel* vad_obj = (VadModel*)handle;
      funasr::VadModel* vad_obj = (funasr::VadModel*)handle;
      if (!vad_obj)
         return nullptr;
      int32_t sampling_rate = -1;
      Audio audio(1);
      if(!audio.LoadWav(sz_wavfile, &sampling_rate))
      funasr::Audio audio(1);
      if (!audio.LoadPcmwav(sz_buf, n_len, &sampling_rate))
         return nullptr;
      FUNASR_VAD_RESULT* p_result = new FUNASR_VAD_RESULT;
      funasr::FUNASR_VAD_RESULT* p_result = new funasr::FUNASR_VAD_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      // NOTE(review): `segments` has not been assigned on this path; unless the struct gives it
      // a default value, the returned result carries an indeterminate pointer — verify.
      if(p_result->snippet_time == 0){
            return p_result;
        }
      
      vector<std::vector<int>> vad_segments;
      audio.Split(vad_obj, vad_segments);
      audio.Split(vad_obj, vad_segments, input_finished);
      p_result->segments = new vector<std::vector<int>>(vad_segments);
      return p_result;
   }
   _FUNASRAPI FUNASR_RESULT FsmnVadInfer(FUNASR_HANDLE handle, const char* sz_filename, QM_CALLBACK fn_callback, int sampling_rate)
   {
      funasr::VadModel* vad_obj = (funasr::VadModel*)handle;
      if (!vad_obj)
         return nullptr;
      funasr::Audio audio(1);
      if(funasr::is_target_file(sz_filename, "wav")){
         int32_t sampling_rate_ = -1;
         if(!audio.LoadWav(sz_filename, &sampling_rate_))
            return nullptr;
      }else if(funasr::is_target_file(sz_filename, "pcm")){
         if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
            return nullptr;
      }else{
         LOG(ERROR)<<"Wrong wav extension";
         exit(-1);
      }
      funasr::FUNASR_VAD_RESULT* p_result = new funasr::FUNASR_VAD_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      if(p_result->snippet_time == 0){
            return p_result;
        }
      vector<std::vector<int>> vad_segments;
      audio.Split(vad_obj, vad_segments, true);
      p_result->segments = new vector<std::vector<int>>(vad_segments);
      return p_result;
   }
   // APIs for PUNC Infer
   // NOTE(review): this span interleaves three definitions — FunPuncInfer (returns the punctuated
   // string directly), CTTransformerInfer (returns a FUNASR_PUNC_RESULT), and
   // FunOfflineRecogFile (wav file -> optional VAD -> ASR -> optional punctuation). Braces do not
   // balance as written (the UseVad() block below is never closed). This looks like the old and
   // new sides of a diff kept together — confirm which lines are current before relying on it.
   _FUNASRAPI const std::string FunPuncInfer(FUNASR_HANDLE handle, const char* sz_sentence, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   _FUNASRAPI FUNASR_RESULT CTTransformerInfer(FUNASR_HANDLE handle, const char* sz_sentence, FUNASR_MODE mode, QM_CALLBACK fn_callback, PUNC_TYPE type, FUNASR_RESULT pre_result)
   {
      PuncModel* punc_obj = (PuncModel*)handle;
      funasr::PuncModel* punc_obj = (funasr::PuncModel*)handle;
      if (!punc_obj)
         return nullptr;
      string punc_res = punc_obj->AddPunc(sz_sentence);
      return punc_res;
   }
   // APIs for Offline-stream Infer
   _FUNASRAPI FUNASR_RESULT FunOfflineRecogFile(FUNASR_HANDLE handle, const char* sz_wavfile, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   {
      OfflineStream* offline_stream = (OfflineStream*)handle;
      if (!offline_stream)
         return nullptr;
      
      int32_t sampling_rate = -1;
      Audio audio(1);
      if(!audio.LoadWav(sz_wavfile, &sampling_rate))
         return nullptr;
      if(offline_stream->UseVad()){
         audio.Split(offline_stream);
      // CTTransformerInfer lines: PUNC_OFFLINE always allocates a fresh FUNASR_PUNC_RESULT;
      // PUNC_ONLINE reuses pre_result when it is non-null (allocating otherwise) and passes the
      // result's arr_cache to AddPunc; any other type logs an error and exits the process.
      FUNASR_RESULT p_result = nullptr;
      if (type==PUNC_OFFLINE){
         p_result = (FUNASR_RESULT)new funasr::FUNASR_PUNC_RESULT;
         ((funasr::FUNASR_PUNC_RESULT*)p_result)->msg = punc_obj->AddPunc(sz_sentence);
      }else if(type==PUNC_ONLINE){
         if (!pre_result)
            p_result = (FUNASR_RESULT)new funasr::FUNASR_PUNC_RESULT;
         else
            p_result = pre_result;
         ((funasr::FUNASR_PUNC_RESULT*)p_result)->msg = punc_obj->AddPunc(sz_sentence, ((funasr::FUNASR_PUNC_RESULT*)p_result)->arr_cache);
      }else{
         LOG(ERROR) << "Wrong PUNC_TYPE";
         exit(-1);
      }
      // FunOfflineRecogFile lines: run the stream's ASR handle over every fetched chunk, report
      // progress through fn_callback, then punctuate the whole message when UsePunc() is true.
      float* buff;
      int len;
      int flag = 0;
      int n_step = 0;
      int n_total = audio.GetQueueSize();
      FUNASR_RECOG_RESULT* p_result = new FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      while (audio.Fetch(buff, len, flag) > 0) {
         string msg = (offline_stream->asr_handle)->Forward(buff, len, flag);
         p_result->msg+= msg;
         n_step++;
         if (fn_callback)
            fn_callback(n_step, n_total);
      }
      if(offline_stream->UsePunc()){
         string punc_res = (offline_stream->punc_handle)->AddPunc((p_result->msg).c_str());
         p_result->msg = punc_res;
      }
      return p_result;
   }
   _FUNASRAPI FUNASR_RESULT FunOfflineRecogPCMBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, int sampling_rate, FUNASR_MODE mode, QM_CALLBACK fn_callback)
   // APIs for Offline-stream Infer
   _FUNASRAPI FUNASR_RESULT FunOfflineInferBuffer(FUNASR_HANDLE handle, const char* sz_buf, int n_len, FUNASR_MODE mode, QM_CALLBACK fn_callback, int sampling_rate)
   {
      OfflineStream* offline_stream = (OfflineStream*)handle;
      funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
      if (!offline_stream)
         return nullptr;
      Audio audio(1);
      funasr::Audio audio(1);
      if (!audio.LoadPcmwav(sz_buf, n_len, &sampling_rate))
         return nullptr;
      funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      if(p_result->snippet_time == 0){
            return p_result;
        }
      if(offline_stream->UseVad()){
         audio.Split(offline_stream);
      }
@@ -230,8 +210,7 @@
      float* buff;
      int len;
      int flag = 0;
      FUNASR_RECOG_RESULT* p_result = new FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      int n_step = 0;
      int n_total = audio.GetQueueSize();
      while (audio.Fetch(buff, len, flag) > 0) {
@@ -246,6 +225,53 @@
         p_result->msg = punc_res;
      }
      return p_result;
   }
   _FUNASRAPI FUNASR_RESULT FunOfflineInfer(FUNASR_HANDLE handle, const char* sz_filename, FUNASR_MODE mode, QM_CALLBACK fn_callback, int sampling_rate)
   {
      funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
      if (!offline_stream)
         return nullptr;
      funasr::Audio audio(1);
      if(funasr::is_target_file(sz_filename, "wav")){
         int32_t sampling_rate_ = -1;
         if(!audio.LoadWav(sz_filename, &sampling_rate_))
            return nullptr;
      }else if(funasr::is_target_file(sz_filename, "pcm")){
         if (!audio.LoadPcmwav(sz_filename, &sampling_rate))
            return nullptr;
      }else{
         LOG(ERROR)<<"Wrong wav extension";
         exit(-1);
      }
      funasr::FUNASR_RECOG_RESULT* p_result = new funasr::FUNASR_RECOG_RESULT;
      p_result->snippet_time = audio.GetTimeLen();
      if(p_result->snippet_time == 0){
            return p_result;
        }
      if(offline_stream->UseVad()){
         audio.Split(offline_stream);
      }
      float* buff;
      int len;
      int flag = 0;
      int n_step = 0;
      int n_total = audio.GetQueueSize();
      while (audio.Fetch(buff, len, flag) > 0) {
         string msg = (offline_stream->asr_handle)->Forward(buff, len, flag);
         p_result->msg+= msg;
         n_step++;
         if (fn_callback)
            fn_callback(n_step, n_total);
      }
      if(offline_stream->UsePunc()){
         string punc_res = (offline_stream->punc_handle)->AddPunc((p_result->msg).c_str());
         p_result->msg = punc_res;
      }
      return p_result;
   }
@@ -263,7 +289,7 @@
      if (!result)
         return 0.0f;
      return ((FUNASR_RECOG_RESULT*)result)->snippet_time;
      return ((funasr::FUNASR_RECOG_RESULT*)result)->snippet_time;
   }
   _FUNASRAPI const float FsmnVadGetRetSnippetTime(FUNASR_RESULT result)
@@ -271,13 +297,22 @@
      if (!result)
         return 0.0f;
      return ((FUNASR_VAD_RESULT*)result)->snippet_time;
      return ((funasr::FUNASR_VAD_RESULT*)result)->snippet_time;
   }
   // APIs for GetResult
   // Returns the recognized text stored in a recognition result as a C string, or nullptr when
   // `result` is null. The pointer comes from msg.c_str(), so it refers to storage owned by the
   // result object. n_index is not read in the visible body.
   // NOTE(review): `p_result` is declared twice below (unqualified and funasr::-qualified). This
   // looks like the old and new sides of a diff kept together — confirm which line is current.
   _FUNASRAPI const char* FunASRGetResult(FUNASR_RESULT result,int n_index)
   {
      FUNASR_RECOG_RESULT * p_result = (FUNASR_RECOG_RESULT*)result;
      funasr::FUNASR_RECOG_RESULT * p_result = (funasr::FUNASR_RECOG_RESULT*)result;
      if(!p_result)
         return nullptr;
      return p_result->msg.c_str();
   }
   _FUNASRAPI const char* CTTransformerGetResult(FUNASR_RESULT result,int n_index)
   {
      funasr::FUNASR_PUNC_RESULT * p_result = (funasr::FUNASR_PUNC_RESULT*)result;
      if(!p_result)
         return nullptr;
@@ -286,7 +321,7 @@
   _FUNASRAPI vector<std::vector<int>>* FsmnVadGetResult(FUNASR_RESULT result,int n_index)
   {
      FUNASR_VAD_RESULT * p_result = (FUNASR_VAD_RESULT*)result;
      funasr::FUNASR_VAD_RESULT * p_result = (funasr::FUNASR_VAD_RESULT*)result;
      if(!p_result)
         return nullptr;
@@ -298,13 +333,21 @@
   {
      if (result)
      {
         delete (FUNASR_RECOG_RESULT*)result;
         delete (funasr::FUNASR_RECOG_RESULT*)result;
      }
   }
   _FUNASRAPI void CTTransformerFreeResult(FUNASR_RESULT result)
   {
      if (result)
      {
         delete (funasr::FUNASR_PUNC_RESULT*)result;
      }
   }
   _FUNASRAPI void FsmnVadFreeResult(FUNASR_RESULT result)
   {
      FUNASR_VAD_RESULT * p_result = (FUNASR_VAD_RESULT*)result;
      funasr::FUNASR_VAD_RESULT * p_result = (funasr::FUNASR_VAD_RESULT*)result;
      if (p_result)
      {
         if(p_result->segments){
@@ -317,7 +360,7 @@
   // APIs for Uninit
   _FUNASRAPI void FunASRUninit(FUNASR_HANDLE handle)
   {
      Model* recog_obj = (Model*)handle;
      funasr::Model* recog_obj = (funasr::Model*)handle;
      if (!recog_obj)
         return;
@@ -327,7 +370,7 @@
   _FUNASRAPI void FsmnVadUninit(FUNASR_HANDLE handle)
   {
      VadModel* recog_obj = (VadModel*)handle;
      funasr::VadModel* recog_obj = (funasr::VadModel*)handle;
      if (!recog_obj)
         return;
@@ -335,9 +378,9 @@
      delete recog_obj;
   }
   _FUNASRAPI void FunPuncUninit(FUNASR_HANDLE handle)
   _FUNASRAPI void CTTransformerUninit(FUNASR_HANDLE handle)
   {
      PuncModel* punc_obj = (PuncModel*)handle;
      funasr::PuncModel* punc_obj = (funasr::PuncModel*)handle;
      if (!punc_obj)
         return;
@@ -347,7 +390,7 @@
   _FUNASRAPI void FunOfflineUninit(FUNASR_HANDLE handle)
   {
      OfflineStream* offline_stream = (OfflineStream*)handle;
      funasr::OfflineStream* offline_stream = (funasr::OfflineStream*)handle;
      if (!offline_stream)
         return;