diff --git "a/benchmark/README.md" "b/benchmark/README.md" --- "a/benchmark/README.md" +++ "b/benchmark/README.md" @@ -55,7 +55,7 @@ python benchmark.py --all --cfg_overwrite_backend_target 1 ## Detailed Results -Benchmark is done with latest `opencv-python==4.7.0.72` and `opencv-contrib-python==4.7.0.72` on the following platforms. Some models are excluded because of support issues. +Benchmark is done with latest `opencv-python==4.8.0.74` and `opencv-contrib-python==4.8.0.74` on the following platforms. Some models are excluded because of support issues. ### Intel 12700K @@ -67,50 +67,51 @@ Specs: [details](https://www.intel.com/content/www/us/en/products/sku/134594/int CPU: ``` -$ python benchmark.py --all --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -0.58 0.67 0.48 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -0.82 0.81 0.48 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -6.18 6.33 5.83 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -7.42 7.42 5.83 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -3.32 3.46 2.76 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -4.27 4.22 2.76 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -4.68 5.04 4.36 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -4.82 4.98 4.36 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -8.20 9.33 6.66 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -6.25 7.02 5.49 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -6.00 6.31 5.49 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -6.23 5.64 5.49 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -6.50 6.87 5.49 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -35.40 36.58 33.63 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -35.79 35.53 33.48 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -8.53 8.59 7.55 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -65.15 77.44 45.40 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -58.82 69.99 45.26 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -137.53 136.70 119.95 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -139.60 147.79 119.95 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -29.46 42.21 25.82 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -6.14 6.02 5.91 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -8.51 9.89 5.91 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -13.88 14.82 12.39 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -30.87 30.69 29.85 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -30.77 30.02 27.97 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -7.72 8.84 6.13 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -1.35 1.37 1.30 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] -75.82 75.37 69.18 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -74.80 75.16 69.05 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -21.37 24.50 16.04 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -23.08 25.14 16.04 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -20.43 31.14 11.74 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@145.253] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -20.71 17.95 11.74 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -19.48 25.14 11.74 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -19.38 18.85 11.74 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -19.52 25.97 11.74 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -18.55 15.29 10.35 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +0.73 0.81 0.58 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +0.85 0.78 0.58 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +4.52 4.70 4.25 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +6.67 7.25 4.25 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +2.53 2.33 2.18 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +3.77 3.71 2.18 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +3.91 3.84 3.65 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +4.66 4.99 3.65 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +8.21 8.97 6.22 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +8.73 10.08 6.22 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +4.33 4.70 3.65 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +4.20 4.05 3.19 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +4.87 3.92 3.19 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +5.30 6.19 3.19 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +24.26 23.81 23.25 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +29.45 30.19 23.25 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +9.06 8.40 7.64 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +10.25 12.59 7.64 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +44.85 45.84 43.06 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +46.10 47.53 43.06 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +144.89 149.58 125.71 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +143.83 146.39 119.75 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +23.43 22.82 20.90 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +12.99 13.11 12.14 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +12.64 12.44 10.82 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +12.64 11.83 11.03 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +22.13 21.99 21.48 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +26.37 33.51 21.48 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +10.07 9.68 8.16 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +1.19 1.30 1.07 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] +80.97 80.06 73.20 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +80.73 85.47 72.06 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +17.97 16.18 12.43 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +19.54 20.66 12.43 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +17.73 24.25 9.65 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +17.65 18.90 9.65 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +16.97 15.14 9.65 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +17.21 16.47 9.65 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +17.68 14.54 9.65 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +17.31 16.09 9.65 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### Rasberry Pi 4B @@ -121,50 +122,51 @@ Specs: [details](https://www.raspberrypi.com/products/raspberry-pi-4-model-b/spe CPU: ``` -$ python benchmark.py --all --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -5.45 5.44 5.39 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -6.12 6.15 5.39 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -78.04 77.96 77.62 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -91.44 93.03 77.62 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -32.21 31.86 31.85 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -38.22 39.27 31.85 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -43.85 43.76 43.51 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -46.66 47.00 43.51 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -73.29 73.70 72.86 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -74.51 87.71 73.83 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -67.29 68.22 61.55 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -68.53 61.77 61.55 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -68.31 72.16 61.55 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -547.70 547.68 494.91 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -527.14 567.06 465.02 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -192.61 194.08 156.62 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -248.03 229.41 209.65 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -246.41 247.64 207.91 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -1932.97 1941.47 1859.96 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -1866.98 1866.50 1746.67 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -762.56 738.04 654.25 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -91.48 91.28 91.15 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -115.58 135.17 91.15 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -98.52 98.95 97.58 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -676.15 655.20 636.06 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -548.93 582.29 443.32 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -90.26 92.06 88.80 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -8.18 8.15 8.13 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] -2025.09 2046.92 1971.57 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -2041.85 2048.24 1971.57 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -272.81 285.66 259.93 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -293.83 289.93 259.93 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -271.57 317.17 223.36 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@2039.612] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -266.67 269.64 223.36 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -259.06 239.43 223.36 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -251.39 257.43 221.20 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -248.27 253.01 221.20 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -239.42 238.72 190.04 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +5.96 5.93 5.90 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +6.09 6.11 5.90 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +73.30 73.22 72.32 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +88.20 89.95 72.32 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +32.33 32.20 31.99 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +39.82 40.78 31.99 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +108.37 108.31 106.93 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +75.91 78.95 49.78 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +76.29 77.10 75.21 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +77.33 77.73 75.21 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +66.22 66.09 65.90 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +59.91 60.72 54.63 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +62.83 54.85 54.63 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +62.47 62.13 54.63 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +625.82 667.05 425.55 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +508.92 667.04 373.14 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +147.19 146.62 146.31 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +143.70 155.87 139.90 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +214.87 214.19 213.21 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +212.90 212.93 209.55 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +1690.06 2303.34 1480.63 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +1489.54 1435.48 1308.12 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +564.90 580.35 527.49 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +356.63 357.29 354.42 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +217.52 229.39 101.61 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +198.63 198.25 196.68 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +417.23 434.54 388.38 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +381.72 394.15 308.62 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +194.47 195.18 191.67 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +5.90 5.90 5.81 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] +2033.55 2454.13 1769.20 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +1896.61 1977.38 1769.20 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +237.73 237.57 236.82 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +265.16 270.22 236.82 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +239.69 298.68 198.88 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +234.90 249.29 198.88 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +227.47 200.42 198.88 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +226.39 213.26 198.88 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +226.10 227.18 198.88 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +220.63 217.04 193.47 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### Jetson Nano B01 @@ -176,111 +178,113 @@ Specs: [details](https://developer.nvidia.com/embedded/jetson-nano-developer-kit CPU: ``` -$ python3 benchmark.py --all --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -5.37 5.44 5.27 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -6.11 7.99 5.27 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -65.14 65.13 64.93 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -79.33 88.12 64.93 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -28.19 28.17 28.05 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -34.85 35.66 28.05 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -41.02 42.37 40.80 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -44.20 44.39 40.80 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -65.91 65.93 65.68 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -68.94 68.95 68.77 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -62.12 62.24 55.29 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -66.04 55.58 55.29 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -65.31 64.86 55.29 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -376.88 368.22 367.11 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -390.32 385.28 367.11 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -133.15 130.57 129.38 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -215.57 225.11 212.66 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -217.37 214.85 212.66 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -1228.13 1233.90 1219.11 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -1257.34 1256.26 1219.11 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -466.19 457.89 442.88 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -69.60 69.69 69.13 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -81.65 82.20 69.13 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -98.38 98.20 97.69 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -411.49 417.53 402.57 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -372.94 370.17 335.95 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -74.36 75.15 72.22 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -5.62 5.64 5.55 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] -1089.89 1091.85 1071.95 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -1089.94 1095.07 1071.95 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -274.45 286.03 270.52 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -290.82 288.87 270.52 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -269.52 311.59 228.47 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@1497.159] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -269.66 267.98 228.47 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -261.39 231.92 228.47 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -259.68 249.43 228.47 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -260.89 283.44 228.47 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -255.61 249.41 222.38 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +5.64 5.55 5.50 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +5.91 6.00 5.50 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +61.32 61.38 61.08 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +76.85 78.69 61.08 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +27.39 27.54 27.26 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +34.69 35.62 27.26 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +50.39 50.31 50.22 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +48.97 49.42 47.46 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +68.07 67.81 67.72 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +73.97 74.83 67.72 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +63.85 63.63 63.51 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +55.14 55.93 47.84 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +60.80 48.09 47.84 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +60.99 61.22 47.84 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +352.73 352.51 351.53 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +374.22 376.71 351.53 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +134.60 135.00 133.68 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +137.10 137.32 133.68 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +215.10 215.30 214.30 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +216.18 216.19 214.30 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +1207.83 1208.71 1203.64 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +1236.98 1250.21 1203.64 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +456.79 456.90 445.83 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +124.89 125.25 124.53 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +107.99 109.82 94.05 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +108.41 108.33 107.91 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +354.88 354.70 354.34 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +343.35 344.56 333.41 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +89.93 91.58 88.28 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +5.69 5.72 5.66 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] +1070.55 1072.14 1055.67 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +1071.56 1071.38 1055.67 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +258.11 258.13 257.64 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +275.27 277.20 257.64 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +254.90 295.88 221.12 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +252.73 258.90 221.12 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +245.08 222.01 221.12 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +245.75 236.58 221.12 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +248.42 251.65 221.12 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +244.31 236.64 221.12 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` GPU (CUDA-FP32): + ``` $ python3 benchmark.py --all --fp32 --cfg_exclude wechat --cfg_overwrite_backend_target 1 Benchmarking ... backend=cv.dnn.DNN_BACKEND_CUDA target=cv.dnn.DNN_TARGET_CUDA mean median min input size model -11.22 11.49 9.59 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -24.60 25.91 24.16 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -20.64 24.00 18.88 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -41.15 41.18 40.95 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -90.86 90.79 84.96 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -69.24 69.11 68.87 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -62.12 62.30 55.28 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -148.58 153.17 144.61 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -53.50 54.29 51.48 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -214.99 218.04 212.94 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -1238.91 1244.87 1227.30 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -76.54 76.09 74.51 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -67.34 67.83 62.38 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -56.69 55.54 48.96 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -126.65 126.63 124.96 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -73.84 75.25 72.19 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -303.12 302.80 299.30 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -302.58 299.78 297.83 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -58.05 62.90 52.47 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -59.39 56.82 52.47 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -45.60 62.40 21.73 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +11.16 10.31 10.23 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +24.82 24.90 24.33 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +14.39 14.44 13.83 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +24.52 24.01 23.84 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +69.63 69.88 64.73 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +29.06 29.10 28.80 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +28.54 28.57 27.88 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +99.05 99.65 93.60 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +54.24 55.24 52.87 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +63.63 63.43 63.32 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +371.45 378.00 366.39 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +77.50 77.73 76.16 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +33.85 33.90 33.61 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +38.16 37.33 37.10 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +91.65 91.98 89.90 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +91.40 92.74 89.76 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +223.24 224.30 216.37 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +223.03 222.28 216.37 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +44.24 45.21 41.87 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +45.15 44.15 41.87 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +36.82 46.54 21.75 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] ``` GPU (CUDA-FP16): - + ``` $ python3 benchmark.py --all --fp32 --cfg_exclude wechat --cfg_overwrite_backend_target 2 Benchmarking ... backend=cv.dnn.DNN_BACKEND_CUDA target=cv.dnn.DNN_TARGET_CUDA_FP16 mean median min input size model -26.17 26.40 25.87 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -116.07 115.93 112.39 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -119.85 121.62 114.63 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -40.94 40.92 40.70 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -99.88 100.49 93.24 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -69.00 68.81 68.60 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -61.93 62.18 55.17 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -141.11 145.82 136.02 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -364.70 363.48 360.28 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -215.23 213.49 213.06 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -1223.32 1248.88 1213.25 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -52.91 52.96 50.17 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -212.86 213.21 210.03 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -221.12 255.53 217.16 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -96.68 94.21 89.24 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -73.68 77.30 69.17 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -343.38 344.17 337.62 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -344.29 345.07 337.62 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -48.91 50.31 45.41 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -50.20 49.66 45.41 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -39.56 52.56 20.76 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +25.41 25.43 25.31 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +113.14 112.02 111.74 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +89.04 88.90 88.59 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +96.62 96.39 96.26 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +69.78 70.65 66.74 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +118.47 118.45 118.10 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +125.69 126.63 118.10 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +64.08 62.97 62.33 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +366.46 366.88 363.46 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +163.06 163.34 161.77 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +301.10 311.52 297.74 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +53.34 54.30 51.79 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +149.37 149.95 148.01 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +153.89 153.96 153.43 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +44.29 44.03 43.62 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +91.28 92.89 89.79 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +254.78 256.13 245.60 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +254.98 255.20 245.60 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +33.07 32.88 32.00 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +33.88 33.64 32.00 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +29.32 33.70 20.69 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] ``` ### Khadas VIM3 @@ -292,74 +296,74 @@ Specs: [details](https://www.khadas.com/vim3) CPU: ``` -$ python3 benchmark.py --all --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -4.93 4.91 4.83 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -5.30 5.31 4.83 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -60.02 61.00 57.85 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -70.27 74.77 57.85 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -29.36 28.28 27.97 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -34.66 34.12 27.97 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -38.60 37.72 36.79 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -41.57 41.91 36.79 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -70.82 72.70 67.14 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -64.73 64.22 62.19 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -58.18 59.29 49.97 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -59.15 52.27 49.97 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -57.38 55.13 49.97 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -385.29 361.27 348.96 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -352.90 395.79 328.06 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -122.17 123.58 119.43 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -208.25 217.96 195.76 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -203.04 213.99 161.37 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -1189.83 1150.85 1138.93 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -1137.18 1142.89 1080.23 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -428.66 524.98 391.33 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -66.91 67.09 64.90 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -79.42 81.44 64.90 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -84.42 85.99 83.30 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -439.53 431.92 406.03 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -358.63 379.93 296.32 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -68.51 66.87 66.53 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -5.29 5.30 5.21 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] -973.75 968.68 954.58 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -961.44 959.29 935.29 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -202.74 202.73 200.75 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -217.07 217.26 200.75 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -199.81 231.31 169.27 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@1277.652] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -199.73 203.96 169.27 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -192.97 175.68 169.27 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -189.65 189.43 169.27 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -188.98 202.49 169.27 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -183.49 188.71 149.81 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +4.60 4.57 4.47 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +5.10 5.15 4.47 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +53.88 52.80 51.99 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +67.86 67.67 51.99 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +40.93 41.29 27.33 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +42.81 56.31 27.33 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +58.84 56.15 53.14 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +56.36 60.14 45.29 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +76.53 67.95 65.13 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +72.25 69.88 65.13 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +66.50 64.06 58.56 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +59.10 75.36 45.69 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +62.44 48.81 45.69 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +60.46 54.93 45.69 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +372.65 404.31 326.91 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +359.72 336.21 326.91 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +145.21 125.62 124.87 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +130.10 139.45 116.10 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +218.21 216.01 199.88 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +212.69 262.75 170.88 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +1110.87 1112.27 1085.31 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +1128.73 1157.12 1085.31 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +382.57 464.42 354.66 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +147.01 144.01 139.27 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +119.70 118.95 94.09 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +107.63 107.09 105.61 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +333.03 346.65 322.37 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +322.95 315.22 303.07 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +127.16 173.93 99.77 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +975.49 977.45 952.43 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +970.16 970.83 928.66 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +194.80 195.37 192.65 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +209.49 208.33 192.65 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +192.90 227.02 161.94 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +192.52 197.03 161.94 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +185.92 168.22 161.94 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +185.01 183.14 161.94 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +186.09 194.14 161.94 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +181.79 181.65 154.21 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` NPU (TIMVX): - + ``` -$ python3 benchmark.py --all --int8 --cfg_overwrite_backend_target 3 --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all --int8 --cfg_overwrite_backend_target 3 --cfg_exclude face_detection:license_plate Benchmarking ... backend=cv.dnn.DNN_BACKEND_TIMVX target=cv.dnn.DNN_TARGET_NPU mean median min input size model -5.67 5.74 5.59 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -76.97 77.86 75.59 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -40.38 39.41 38.12 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -44.36 45.77 42.06 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -60.75 62.46 56.34 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -57.40 58.10 52.11 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -340.20 347.74 330.70 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -200.50 224.02 160.81 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -1103.24 1091.76 1059.77 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -95.92 102.80 92.77 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -307.90 310.52 302.46 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -178.71 178.87 177.84 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -183.51 183.72 177.84 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -172.06 189.19 149.19 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +45.83 47.06 43.04 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +29.20 27.55 26.25 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +18.47 18.16 17.96 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +28.25 28.35 27.98 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +149.05 155.10 144.42 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +147.40 147.49 135.90 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +75.91 79.27 71.98 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +117.71 119.69 107.37 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +379.46 366.19 360.02 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +33.90 36.32 31.71 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +40.34 41.50 38.47 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +239.68 239.31 236.03 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +199.42 203.20 166.15 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +197.49 169.51 166.15 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### Atlas 200 DK @@ -369,54 +373,55 @@ Specs: [details_en](https://e.huawei.com/uk/products/cloud-computing-dc/atlas/at - NPU: Ascend 310, dual DaVinci AI cores, 22/16/8 TOPS INT8. CPU: - + ``` -$ python3 benchmark.py --all --cfg_exclude wechat --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all --cfg_exclude wechat Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -8.02 8.07 7.93 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -9.44 9.34 7.93 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -104.51 112.90 102.07 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -131.49 147.17 102.07 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -47.71 57.86 46.48 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -59.26 59.07 46.48 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -57.95 58.02 57.30 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -65.52 70.76 57.30 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -107.98 127.65 106.59 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -103.96 124.91 102.87 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -90.46 90.53 76.14 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -98.40 76.49 76.14 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -98.06 95.36 76.14 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -564.69 556.79 537.84 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -621.54 661.56 537.84 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -226.08 216.89 216.07 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -343.08 346.39 315.99 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -351.64 346.41 315.99 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -1995.97 1996.82 1967.76 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -2060.87 2055.60 1967.76 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -701.08 708.52 685.49 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -105.23 105.14 105.00 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -123.41 125.65 105.00 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -134.10 134.43 133.62 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -631.70 631.81 630.61 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -595.32 599.48 565.32 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -108.55 117.88 106.66 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -1452.55 1453.75 1450.98 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -1433.26 1432.08 1409.78 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -299.36 299.92 298.75 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -329.84 333.32 298.75 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -303.65 367.68 262.48 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@760.743] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -299.60 315.91 262.48 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -290.29 263.05 262.48 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -290.41 279.30 262.48 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -294.61 295.36 262.48 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -289.53 279.60 262.48 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +7.82 7.82 7.77 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +8.57 8.77 7.77 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +92.21 92.11 91.87 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +122.07 126.02 91.87 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +42.93 43.26 42.75 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +55.91 57.40 42.75 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +67.85 67.91 67.47 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +70.06 70.21 67.47 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +102.49 102.65 102.10 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +114.02 116.16 102.10 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +92.66 92.49 92.36 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +79.39 80.75 68.47 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +89.66 68.66 68.47 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +90.59 92.13 68.47 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +499.55 500.15 498.36 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +571.85 580.88 498.36 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +201.99 201.55 200.62 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +216.72 217.34 200.62 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +313.66 313.85 312.13 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +322.98 323.45 312.13 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +1875.33 1877.53 1871.26 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +1989.04 2005.25 1871.26 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +637.54 640.61 626.98 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +159.80 159.62 159.40 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +152.18 152.86 145.56 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +145.83 145.77 145.45 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +521.46 521.66 520.28 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +541.50 544.02 520.28 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +134.02 136.01 132.06 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +1441.73 1442.80 1440.26 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +1436.45 1437.89 1430.58 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +285.19 284.91 284.69 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +318.96 323.30 284.69 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +289.82 360.87 244.07 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +285.40 303.13 244.07 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +274.67 244.47 243.87 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +277.84 262.99 243.87 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +283.02 280.77 243.87 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +279.21 262.55 243.87 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` -NPU: +NPU (CANN): ``` $ python3 benchmark.py --all --fp32 --cfg_exclude wechat:dasiamrpn:crnn --model_exclude pose_estimation_mediapipe_2023mar.onnx --cfg_overwrite_backend_target 4 @@ -449,51 +454,52 @@ Specs: [details](https://t.rock-chips.com/en/portal.php?mod=view&aid=26) - NPU (Not supported by OpenCV): 2.0TOPS, support 8bit / 16bit CPU: - + ``` -$ python3 benchmark.py --all --cfg_exclude wechat --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all --cfg_exclude wechat Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -68.89 68.59 68.23 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -60.98 61.11 52.00 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -1550.71 1578.99 1527.58 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -1214.15 1261.66 920.50 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -604.36 611.24 578.99 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -496.42 537.75 397.23 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -460.56 470.15 440.77 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -387.63 379.96 318.71 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -1610.78 1599.92 1583.95 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -1546.16 1539.50 1513.14 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -1166.56 1211.97 827.10 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -983.80 868.18 689.32 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -840.38 801.83 504.54 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -11793.09 11817.73 11741.04 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -7740.03 8134.99 4464.30 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -3222.92 3225.18 3170.71 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -2303.55 2307.46 2289.41 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -1888.15 1920.41 1528.78 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -38359.93 39021.21 37180.85 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -24504.50 25439.34 13443.63 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -14738.64 14764.84 14655.76 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -872.09 877.72 838.99 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -764.48 775.55 653.25 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -1326.56 1327.10 1305.18 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -11117.07 11109.12 11058.49 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -7037.96 7424.89 3750.12 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -704.44 704.77 672.58 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -49065.03 49144.55 48943.50 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -49052.24 48992.64 48927.44 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -2200.08 2193.78 2175.77 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -2244.03 2240.25 2175.77 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -2230.12 2290.28 2175.77 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@1315.065] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -2220.33 2281.75 2171.61 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -2216.44 2212.48 2171.61 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -2041.65 2209.50 1268.91 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -1933.06 2210.81 1268.91 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -1826.34 2234.66 1184.53 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +56.45 56.29 56.18 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +48.83 49.41 41.52 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +1554.78 1545.63 1523.62 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +1215.44 1251.08 921.26 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +612.58 613.61 587.83 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +502.02 513.29 399.51 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +525.72 532.34 502.00 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +415.87 442.23 318.14 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +1631.40 1635.83 1608.43 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +1115.29 1159.60 675.51 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +1546.54 1547.64 1516.69 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +1163.10 1227.05 816.99 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +980.56 852.38 689.31 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +837.72 778.61 507.03 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +11819.74 11778.79 11758.31 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +7742.66 8151.17 4442.93 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +3266.08 3250.08 3216.03 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +2260.88 2368.00 1437.58 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +2335.65 2342.12 2304.69 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +1903.82 1962.71 1533.79 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +37604.10 37569.30 37502.48 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +24229.20 25577.94 13483.54 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +14860.23 14988.15 14769.91 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +1133.44 1131.54 1124.83 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +883.96 919.07 655.33 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +1430.98 1424.55 1415.68 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +11131.81 11141.37 11080.20 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +7065.00 7461.37 3748.85 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +790.98 823.19 755.99 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +49331.32 49285.30 49210.67 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +49327.34 49489.22 49210.67 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +2183.70 2172.36 2156.29 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +2225.19 2222.58 2156.29 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +2214.03 2302.61 2156.29 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +2203.45 2231.47 2150.19 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +2201.14 2188.00 2150.19 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +2029.28 2178.36 1268.17 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +1923.12 2219.63 1268.17 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +1818.21 2196.98 1184.98 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### Khadas Edge2 (with RK3588) @@ -504,51 +510,52 @@ SoC specs: [details](https://www.rock-chips.com/a/en/products/RK35_Series/2022/0 - NPU (Not supported by OpenCV): Build-in 6 TOPS Performance NPU, triple core, support int4 / int8 / int16 / fp16 / bf16 / tf32 CPU: - + ``` -$ python3 benchmark.py --all --cfg_exclude wechat --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all --cfg_exclude wechat Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -2.47 2.55 2.44 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -2.81 2.84 2.44 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -33.79 33.83 33.24 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -39.96 40.77 33.24 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -15.99 16.12 15.92 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -19.09 19.48 15.92 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -20.27 20.45 20.11 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -23.14 23.62 20.11 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -34.58 34.53 33.55 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -32.78 32.94 31.99 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -28.38 28.80 24.59 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -31.49 24.66 24.59 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -31.45 32.34 24.59 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -178.87 178.49 173.57 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -197.19 200.06 173.57 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -57.57 65.48 51.34 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -118.38 132.59 88.34 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -120.74 110.82 88.34 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -577.93 577.17 553.81 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -607.96 604.88 553.81 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -152.78 155.89 121.26 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -38.03 38.26 37.51 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -47.12 48.12 37.51 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -46.07 46.77 45.10 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -195.67 198.02 182.97 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -181.91 182.28 169.98 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -35.47 37.63 33.55 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -394.77 407.60 371.95 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -392.52 404.80 367.96 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -77.32 77.72 75.27 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -82.93 82.93 75.27 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -77.51 93.01 67.44 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@598.857] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -77.02 84.11 67.44 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -75.11 69.82 63.98 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -74.55 73.36 63.98 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -75.06 77.44 63.98 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -73.91 74.25 63.98 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +2.29 2.30 2.25 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +2.62 2.64 2.25 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +28.19 28.12 28.01 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +36.68 37.80 28.01 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +12.56 12.55 12.50 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +17.28 17.83 12.50 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +22.74 22.87 22.43 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +24.56 24.61 22.43 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +29.91 30.23 28.16 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +35.54 35.46 28.16 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +27.28 27.20 27.20 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +22.91 23.33 19.28 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +27.36 19.46 19.28 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +28.28 29.17 19.28 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +150.06 150.89 147.05 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +180.91 184.75 147.05 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +54.14 52.95 49.31 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +60.01 61.20 49.31 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +117.60 128.98 83.33 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +117.28 150.31 83.33 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +553.58 558.76 535.47 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +594.18 592.64 535.47 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +138.82 151.00 113.82 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +56.35 55.73 55.25 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +57.07 57.19 55.25 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +47.94 48.41 47.05 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +146.02 145.89 139.08 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +157.60 158.88 139.08 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +41.26 42.74 40.08 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +384.47 401.25 360.71 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +377.91 381.15 336.30 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +68.70 68.63 68.54 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +78.17 80.48 68.54 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +71.42 91.44 61.14 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +70.07 76.28 61.14 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +67.69 61.72 61.14 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +68.29 65.04 61.14 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +69.58 68.63 61.14 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +68.99 65.02 61.14 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### Horizon Sunrise X3 PI @@ -560,49 +567,51 @@ Specs: [details_cn](https://developer.horizon.ai/sunrise) CPU: ``` -$ python3 benchmark.py --all --cfg_exclude wechat --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -11.04 11.01 10.98 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -12.59 12.75 10.98 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -140.83 140.85 140.52 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -171.71 175.65 140.52 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -64.96 64.94 64.77 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -80.20 81.82 64.77 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -80.67 80.72 80.45 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -89.25 90.39 80.45 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -144.23 144.34 143.84 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -140.60 140.62 140.33 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -122.53 124.23 107.71 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -128.22 107.87 107.71 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -125.77 123.77 107.71 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -759.81 760.01 759.11 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -764.17 764.43 759.11 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -283.75 284.17 282.15 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -408.16 408.31 402.71 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -408.82 407.99 402.71 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -2749.22 2756.23 2737.96 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -2671.54 2692.18 2601.24 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -929.63 936.01 914.86 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -142.23 142.03 141.78 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -179.74 184.79 141.78 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -191.41 191.48 191.00 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -898.23 897.52 896.58 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -749.83 765.90 630.39 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -158.50 160.55 155.64 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -1908.87 1905.00 1903.13 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -1922.34 1920.65 1896.97 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -470.78 469.17 467.92 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -495.94 497.12 467.92 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -464.58 528.72 408.69 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@2820.735] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -465.04 467.01 408.69 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -452.90 409.34 408.69 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -450.23 438.57 408.69 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -453.52 468.72 408.69 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -443.38 447.29 381.90 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +10.15 10.07 10.04 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +11.27 11.40 10.04 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +116.44 116.29 116.15 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +158.75 164.22 116.15 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +55.42 55.80 55.27 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +76.04 78.44 55.27 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +91.39 95.06 90.66 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +95.54 95.39 90.66 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +135.16 134.82 134.75 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +148.05 149.55 134.75 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +115.69 115.73 115.38 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +99.37 100.71 85.65 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +111.02 85.94 85.65 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +112.94 112.72 85.65 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +641.92 643.42 640.64 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +700.42 708.18 640.64 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +251.52 250.97 250.36 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +261.00 280.82 250.36 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +395.23 398.77 385.68 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +406.28 416.58 385.68 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +2608.90 2612.42 2597.93 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +2609.88 2609.39 2597.93 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +809.55 814.66 794.67 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +228.95 228.74 228.35 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +227.97 228.61 226.76 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +192.29 192.26 191.74 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +660.62 662.28 659.49 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +646.25 647.89 631.03 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +182.57 185.52 179.71 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +9.93 9.97 9.82 [100, 100] WeChatQRCode with ['detect_2021nov.prototxt', 'detect_2021nov.caffemodel', 'sr_2021nov.prototxt', 'sr_2021nov.caffemodel'] +1914.15 1913.70 1902.25 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +1920.07 1929.80 1902.25 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +439.96 441.91 436.49 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +465.56 466.86 436.49 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +431.93 495.94 373.61 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +432.47 435.40 373.61 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +418.75 375.76 373.61 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +421.81 410.25 373.61 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +429.30 437.71 373.61 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +422.15 406.50 373.61 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### MAIX-III AX-PI @@ -613,51 +622,52 @@ SoC specs: [details_cn](https://axera-tech.com/product/T7297367876123493768) - NPU (Not supported by OpenCV): 14.4Tops@int4,3.6Tops@int8 CPU: - + ``` -$ python3 benchmark.py --all --cfg_exclude wechat --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all --cfg_exclude wechat Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -98.16 98.99 97.73 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -93.21 93.81 89.15 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -2093.12 2093.02 2092.54 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -1845.87 1871.17 1646.65 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -811.32 811.47 810.80 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -743.24 750.04 688.44 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -636.22 635.89 635.43 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -588.83 594.01 550.49 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -2157.86 2157.82 2156.99 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -2091.13 2091.61 2090.72 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -1583.25 1634.14 1176.19 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -1450.55 1177.07 1176.19 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -1272.81 1226.00 873.94 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -15753.56 15751.29 15748.97 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -11610.11 12023.99 8290.04 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -4300.13 4301.43 4298.29 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -3360.20 3357.84 3356.70 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -2961.58 3005.40 2641.27 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -49994.75 49968.90 49958.48 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -35966.66 37391.40 24670.30 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -19800.14 19816.02 19754.69 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] -1191.81 1192.42 1191.40 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -1162.64 1165.77 1138.35 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -1835.97 1836.24 1835.34 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -14886.02 14884.48 14881.73 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -10491.63 10930.80 6975.34 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -987.30 992.59 982.71 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -65681.91 65674.89 65612.09 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -65630.56 65652.90 65531.21 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -3248.11 3242.59 3241.18 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -3330.69 3350.38 3241.18 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -3277.07 3427.65 3195.84 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -[ WARN:0@17240.397] global onnx_graph_simplifier.cpp:804 getMatFromTensor DNN: load FP16 model as FP32 model, and it takes twice the FP16 RAM requirement. -3263.48 3319.83 3195.84 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] -3258.78 3196.90 3195.84 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] -3090.12 3224.64 2353.81 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -3001.31 3237.93 2353.81 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -2887.05 3224.12 2206.89 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +83.67 83.60 83.50 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +76.45 77.17 70.53 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +2102.93 2102.75 2102.23 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +1846.25 1872.36 1639.46 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +825.27 825.74 824.83 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +752.57 759.68 693.90 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +742.35 742.87 741.42 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +630.16 641.82 539.73 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +2190.53 2188.01 2187.75 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +1662.81 1712.08 1235.22 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +2099.43 2099.39 2098.89 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +1589.86 1641.45 1181.62 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +1451.24 1182.16 1181.62 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +1277.21 1224.66 888.62 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +15832.31 15832.41 15830.59 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +11649.30 12067.68 8300.79 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +4376.55 4398.44 4371.68 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +3376.78 3480.89 2574.72 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +3422.70 3414.45 3413.72 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +3002.36 3047.94 2655.38 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +50678.08 50651.82 50651.19 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +36249.71 37771.22 24606.37 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +19974.99 19984.80 19948.63 [1280, 720] DaSiamRPN with ['object_tracking_dasiamrpn_kernel_cls1_2021nov.onnx', 'object_tracking_dasiamrpn_kernel_r1_2021nov.onnx', 'object_tracking_dasiamrpn_model_2021nov.onnx'] +1502.15 1501.98 1500.99 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +1300.15 1320.44 1137.60 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +1993.05 1993.98 1991.86 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +14925.56 14926.90 14912.28 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +10507.96 10944.15 6974.74 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +1113.51 1124.83 1106.81 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +66015.47 65997.60 65993.81 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +66023.14 66034.99 65993.81 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +3230.93 3228.61 3228.29 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +3312.02 3323.17 3228.29 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +3262.32 3413.03 3182.11 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +3250.66 3298.06 3182.11 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +3231.37 3185.37 3179.37 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +3064.17 3213.91 2345.80 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +2975.21 3227.38 2345.80 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +2862.33 3212.57 2205.48 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ``` ### StarFive VisionFive 2 @@ -667,47 +677,50 @@ Specs: [details_cn](https://doc.rvspace.org/VisionFive2/PB/VisionFive_2/specific - GPU: IMG BXE-4-32 MC1 with work frequency up to 600 MHz CPU: - + + ``` -$ python3 benchmark.py --all --cfg_exclude wechat:dasiam --model_exclude license_plate_detection_lpd_yunet_2023mar_int8.onnx:human_segmentation_pphumanseg_2023mar_int8.onnx +$ python3 benchmark.py --all --cfg_exclude wechat:dasiam Benchmarking ... backend=cv.dnn.DNN_BACKEND_OPENCV target=cv.dnn.DNN_TARGET_CPU mean median min input size model -50.28 50.42 50.08 [160, 120] YuNet with ['face_detection_yunet_2022mar.onnx'] -44.45 44.84 39.29 [160, 120] YuNet with ['face_detection_yunet_2022mar_int8.onnx'] -1059.87 1059.79 1058.95 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] -838.07 859.42 658.86 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] -424.55 424.74 424.06 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] -350.30 357.95 290.66 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] -314.50 313.75 313.67 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -275.80 280.48 243.97 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -1131.91 1132.16 1131.08 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] -1072.77 1073.31 1072.07 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] -811.64 837.32 602.08 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] -692.68 602.74 516.39 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] -596.12 559.52 382.75 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] -8131.86 8132.90 8128.55 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] -5412.98 5684.12 3236.35 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] -2265.62 2264.83 2263.38 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] -1727.39 1727.31 1726.31 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] -1429.48 1458.69 1189.19 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] -26156.87 26169.88 26134.95 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] -17151.71 17933.90 9675.03 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] -316.26 315.72 315.55 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] -276.38 280.84 243.11 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] -586.18 586.28 585.62 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] -542.79 546.26 506.12 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] -910.67 910.62 909.72 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] -7628.31 7624.65 7623.26 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] -4899.76 5171.88 2714.07 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] -486.59 490.33 484.31 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] -34888.37 34834.51 34103.30 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] -35123.00 35996.09 34103.30 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] -1425.08 1543.33 1413.01 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] -1455.55 1580.51 1413.01 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] -1457.01 1484.13 1413.01 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] -1281.84 1468.77 810.51 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] -1191.52 1517.48 810.51 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] -1111.95 1131.27 775.96 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] +41.10 41.09 41.04 [160, 120] YuNet with ['face_detection_yunet_2023mar.onnx'] +35.87 36.37 31.62 [160, 120] YuNet with ['face_detection_yunet_2023mar_int8.onnx'] +1050.45 1050.38 1050.01 [150, 150] SFace with ['face_recognition_sface_2021dec.onnx'] +832.25 854.08 657.41 [150, 150] SFace with ['face_recognition_sface_2021dec_int8.onnx'] +425.36 425.42 425.19 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july.onnx'] +351.86 372.26 292.72 [112, 112] FacialExpressionRecog with ['facial_expression_recognition_mobilefacenet_2022july_int8.onnx'] +348.67 347.98 347.67 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb.onnx'] +290.95 297.03 243.79 [224, 224] MPHandPose with ['handpose_estimation_mediapipe_2023feb_int8.onnx'] +1135.09 1135.25 1134.72 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar.onnx'] +788.33 822.69 509.67 [192, 192] PPHumanSeg with ['human_segmentation_pphumanseg_2023mar_int8.onnx'] +1065.61 1065.99 1065.30 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr.onnx'] +805.26 830.66 595.78 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr.onnx'] +687.98 609.35 514.14 [224, 224] MobileNet with ['image_classification_mobilenetv1_2022apr_int8.onnx'] +592.59 555.25 381.33 [224, 224] MobileNet with ['image_classification_mobilenetv2_2022apr_int8.onnx'] +8091.50 8090.44 8088.72 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan.onnx'] +5394.46 5666.14 3235.23 [224, 224] PPResNet with ['image_classification_ppresnet50_2022jan_int8.onnx'] +2270.14 2270.29 2267.51 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar.onnx'] +1584.83 1656.13 1033.23 [320, 240] LPD_YuNet with ['license_plate_detection_lpd_yunet_2023mar_int8.onnx'] +1732.53 1732.14 1731.47 [416, 416] NanoDet with ['object_detection_nanodet_2022nov.onnx'] +1434.56 1463.32 1194.57 [416, 416] NanoDet with ['object_detection_nanodet_2022nov_int8.onnx'] +26172.62 26160.04 26151.67 [640, 640] YoloX with ['object_detection_yolox_2022nov.onnx'] +17004.06 17909.88 9659.54 [640, 640] YoloX with ['object_detection_yolox_2022nov_int8.onnx'] +734.97 735.58 733.95 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb.onnx'] +609.61 621.69 508.04 [192, 192] MPPalmDet with ['palm_detection_mediapipe_2023feb_int8.onnx'] +961.41 962.26 960.39 [224, 224] MPPersonDet with ['person_detection_mediapipe_2023mar.onnx'] +7594.21 7590.75 7589.16 [128, 256] YoutuReID with ['person_reid_youtu_2021nov.onnx'] +4884.04 5154.38 2715.94 [128, 256] YoutuReID with ['person_reid_youtu_2021nov_int8.onnx'] +548.41 550.86 546.09 [256, 256] MPPose with ['pose_estimation_mediapipe_2023mar.onnx'] +34074.19 34077.97 34058.43 [640, 480] DB with ['text_detection_DB_IC15_resnet18_2021sep.onnx'] +34073.67 34069.82 34054.29 [640, 480] DB with ['text_detection_DB_TD500_resnet18_2021sep.onnx'] +1397.09 1396.95 1396.74 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2021sep.onnx'] +1428.65 1432.59 1396.74 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov.onnx'] +1429.56 1467.34 1396.74 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2021sep.onnx'] +1419.29 1450.55 1395.55 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2023feb_fp16.onnx'] +1421.72 1434.46 1395.55 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2023feb_fp16.onnx'] +1307.27 1415.63 807.66 [1280, 720] CRNN with ['text_recognition_CRNN_CH_2022oct_int8.onnx'] +1237.00 1395.68 807.66 [1280, 720] CRNN with ['text_recognition_CRNN_CN_2021nov_int8.onnx'] +1169.59 1415.29 774.09 [1280, 720] CRNN with ['text_recognition_CRNN_EN_2022oct_int8.onnx'] ```