From 03d4ce829814b4a7f57235fda049351c524ba32b Mon Sep 17 00:00:00 2001 From: zhifu gao <zhifu.gzf@alibaba-inc.com> Date: 星期五, 17 三月 2023 14:06:56 +0800 Subject: [PATCH] Merge branch 'main' into dev_xw --- funasr/runtime/python/benchmark_onnx.md | 53 +++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 files changed, 53 insertions(+), 0 deletions(-) diff --git a/funasr/runtime/python/benchmark_onnx.md b/funasr/runtime/python/benchmark_onnx.md new file mode 100644 index 0000000..02adc79 --- /dev/null +++ b/funasr/runtime/python/benchmark_onnx.md @@ -0,0 +1,53 @@ +# Benchmark + +Aishell1 test set, the total audio duration is 36108.919 seconds. (Note: The service has been fully warmed up.) + +## [Paraformer-large](https://www.modelscope.cn/models/damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch/summary) + + ### Intel(R) Xeon(R) Platinum 8369B CPU @ 2.90GHz 16core-32processor with avx512_vnni + +| concurrent-tasks | processing time(s) | RTF | Speedup Rate | +|:----------------:|:------------------:|:-------:|:------------:| +| 1 (onnx fp32) | 2806 | 0.0777 | 12.9 | +| 1 (onnx int8) | 1611 | 0.0446 | 22.4 | +| 8 (onnx fp32) | 538 | 0.0149 | 67.1 | +| 8 (onnx int8) | 210 | 0.0058 | 172.4 | +| 16 (onnx fp32) | 288 | 0.0080 | 125.2 | +| 16 (onnx int8) | 117 | 0.0032 | 309.9 | +| 32 (onnx fp32) | 167 | 0.0046 | 216.5 | +| 32 (onnx int8) | 86 | 0.0024 | 420.0 | +| 64 (onnx fp32) | 158 | 0.0044 | 228.1 | +| 64 (onnx int8) | 82 | 0.0023 | 442.8 | +| 96 (onnx fp32) | 151 | 0.0042 | 238.0 | +| 96 (onnx int8) | 80 | 0.0022 | 452.0 | + + +### Intel(R) Xeon(R) Platinum 8269CY CPU @ 2.50GHz 16core-32processor with avx512_vnni + +| concurrent-tasks | processing time(s) | RTF | Speedup Rate | +|:----------------:|:------------------:|:------:|:------------:| +| 1 (onnx fp32) | 2613 | 0.0724 | 13.8 | +| 1 (onnx int8) | 1321 | 0.0366 | 27.3 | +| 32 (onnx fp32) | 170 | 0.0047 | 212.7 | +| 32 (onnx int8) | 89 | 0.0025 | 407.0 | +| 64 (onnx fp32) | 166 | 0.0046 | 
217.1 | +| 64 (onnx int8) | 87 | 0.0024 | 414.7 | + + +### Intel(R) Xeon(R) Platinum 8163 CPU @ 2.50GHz 32core-64processor without avx512_vnni + + +| concurrent-tasks | processing time(s) | RTF | Speedup Rate | +|:----------------:|:------------------:|:------:|:------------:| +| 1 (onnx fp32) | 2959 | 0.0820 | 12.2 | +| 1 (onnx int8) | 2814 | 0.0778 | 12.8 | +| 16 (onnx fp32) | 373 | 0.0103 | 96.9 | +| 16 (onnx int8) | 331 | 0.0091 | 109.0 | +| 32 (onnx fp32) | 211 | 0.0058 | 171.4 | +| 32 (onnx int8) | 181 | 0.0050 | 200.0 | +| 64 (onnx fp32) | 153 | 0.0042 | 235.9 | +| 64 (onnx int8) | 103 | 0.0029 | 349.9 | +| 96 (onnx fp32) | 146 | 0.0041 | 247.0 | +| 96 (onnx int8) | 108 | 0.0030 | 334.1 | + +## [Paraformer](https://modelscope.cn/models/damo/speech_paraformer_asr_nat-zh-cn-16k-common-vocab8358-tensorflow1/summary) -- Gitblit v1.9.1