From 03d4ce829814b4a7f57235fda049351c524ba32b Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: Fri, 17 Mar 2023 14:06:56 +0800
Subject: [PATCH] Merge branch 'main' into dev_xw

---
 funasr/runtime/python/benchmark_onnx.md |   53 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 files changed, 53 insertions(+), 0 deletions(-)

diff --git a/funasr/runtime/python/benchmark_onnx.md b/funasr/runtime/python/benchmark_onnx.md
new file mode 100644
index 0000000..02adc79
--- /dev/null
+++ b/funasr/runtime/python/benchmark_onnx.md
@@ -0,0 +1,53 @@
+# Benchmark 
+
+Evaluated on the Aishell1 test set; the total audio duration is 36108.919 seconds. (Note: The service has been fully warmed up.)
+
+## [Paraformer-large](https://www.modelscope.cn/models/damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch/summary) 
+
+### Intel(R) Xeon(R) Platinum 8369B CPU @ 2.90GHz   16core-32processor    with avx512_vnni
+
+| concurrent-tasks | processing time(s) |   RTF   | Speedup Rate |
+|:----------------:|:------------------:|:-------:|:------------:|
+|  1 (onnx fp32)   |        2806        | 0.0777  |     12.9     |
+|  1 (onnx int8)   |        1611        | 0.0446  |     22.4     |
+|  8 (onnx fp32)   |        538         | 0.0149  |     67.1     |
+|  8 (onnx int8)   |        210         | 0.0058  |    172.4     |
+|  16 (onnx fp32)  |        288         | 0.0080  |    125.2     |
+|  16 (onnx int8)  |        117         | 0.0032  |    309.9     |
+|  32 (onnx fp32)  |        167         | 0.0046  |    216.5     |
+|  32 (onnx int8)  |         86         | 0.0024  |    420.0     |
+|  64 (onnx fp32)  |        158         | 0.0044  |    228.1     |
+|  64 (onnx int8)  |         82         | 0.0023  |    442.8     |
+|  96 (onnx fp32)  |        151         | 0.0042  |    238.0     |
+|  96 (onnx int8)  |         80         | 0.0022  |    452.0     |
+
+
+### Intel(R) Xeon(R) Platinum 8269CY CPU @ 2.50GHz   16core-32processor    with avx512_vnni
+
+| concurrent-tasks | processing time(s) |  RTF   | Speedup Rate |
+|:----------------:|:------------------:|:------:|:------------:|
+|  1 (onnx fp32)   |        2613        | 0.0724 |     13.8     |
+|  1 (onnx int8)   |        1321        | 0.0366 |     27.3     |
+|  32 (onnx fp32)  |        170         | 0.0047 |    212.7     |
+|  32 (onnx int8)  |         89         | 0.0025 |    407.0     |
+|  64 (onnx fp32)  |        166         | 0.0046 |    217.1     |
+|  64 (onnx int8)  |         87         | 0.0024 |    414.7     |
+
+
+### Intel(R) Xeon(R) Platinum 8163 CPU @ 2.50GHz    32core-64processor   without avx512_vnni
+
+
+| concurrent-tasks | processing time(s) |  RTF   | Speedup Rate |
+|:----------------:|:------------------:|:------:|:------------:|
+|  1 (onnx fp32)   |        2959        | 0.0820 |     12.2     |
+|  1 (onnx int8)   |        2814        | 0.0778 |     12.8     |
+|  16 (onnx fp32)  |        373         | 0.0103 |     96.9     |
+|  16 (onnx int8)  |        331         | 0.0091 |    109.0     |
+|  32 (onnx fp32)  |        211         | 0.0058 |    171.4     |
+|  32 (onnx int8)  |        181         | 0.0050 |    200.0     |
+|  64 (onnx fp32)  |        153         | 0.0042 |    235.9     |
+|  64 (onnx int8)  |        103         | 0.0029 |    349.9     |
+|  96 (onnx fp32)  |        146         | 0.0041 |    247.0     |
+|  96 (onnx int8)  |        108         | 0.0030 |    334.1     |
+
+## [Paraformer](https://modelscope.cn/models/damo/speech_paraformer_asr_nat-zh-cn-16k-common-vocab8358-tensorflow1/summary)

--
Gitblit v1.9.1