From c8f3af885543aff5018a4897909ade8517d820ca Mon Sep 17 00:00:00 2001
From: lyblsgo <lyblsgo@163.com>
Date: 星期二, 21 三月 2023 16:50:30 +0800
Subject: [PATCH] add onnx quantize model for onnx; add tester_rtf
---
funasr/runtime/onnxruntime/tester/tester.cpp | 18 +++++++-----------
1 files changed, 7 insertions(+), 11 deletions(-)
diff --git a/funasr/runtime/onnxruntime/tester/tester.cpp b/funasr/runtime/onnxruntime/tester/tester.cpp
index f2491a9..1739f0b 100644
--- a/funasr/runtime/onnxruntime/tester/tester.cpp
+++ b/funasr/runtime/onnxruntime/tester/tester.cpp
@@ -9,39 +9,38 @@
#include <iostream>
#include <fstream>
+#include <sstream>
using namespace std;
int main(int argc, char *argv[])
{
- if (argc < 2)
+ if (argc < 3)
{
- printf("Usage: %s /path/to/model_dir /path/to/wav/file", argv[0]);
+ printf("Usage: %s /path/to/model_dir /path/to/wav/file quantize(true or false)", argv[0]);
exit(-1);
}
struct timeval start, end;
gettimeofday(&start, NULL);
int nThreadNum = 4;
- RPASR_HANDLE AsrHanlde=RapidAsrInit(argv[1], nThreadNum);
+ // is quantize
+ bool quantize = false;
+ istringstream(argv[3]) >> boolalpha >> quantize;
+ RPASR_HANDLE AsrHanlde=RapidAsrInit(argv[1], nThreadNum, quantize);
if (!AsrHanlde)
{
printf("Cannot load ASR Model from: %s, there must be files model.onnx and vocab.txt", argv[1]);
exit(-1);
}
-
-
gettimeofday(&end, NULL);
long seconds = (end.tv_sec - start.tv_sec);
long modle_init_micros = ((seconds * 1000000) + end.tv_usec) - (start.tv_usec);
printf("Model initialization takes %lfs.\n", (double)modle_init_micros / 1000000);
-
-
gettimeofday(&start, NULL);
float snippet_time = 0.0f;
-
RPASR_RESULT Result=RapidAsrRecogFile(AsrHanlde, argv[2], RASR_NONE, NULL);
@@ -61,7 +60,6 @@
{
cout <<"no return data!";
}
-
//char* buff = nullptr;
//int len = 0;
@@ -101,13 +99,11 @@
//
//delete[]buff;
//}
-
printf("Audio length %lfs.\n", (double)snippet_time);
seconds = (end.tv_sec - start.tv_sec);
long taking_micros = ((seconds * 1000000) + end.tv_usec) - (start.tv_usec);
printf("Model inference takes %lfs.\n", (double)taking_micros / 1000000);
-
printf("Model inference RTF: %04lf.\n", (double)taking_micros/ (snippet_time*1000000));
RapidAsrUninit(AsrHanlde);
--
Gitblit v1.9.1