Skip to content

Commit

Permalink
Added 5 devices(AMD*2, Intel*2, NVIDIA*1) benchmark result. (#5085)
Browse files Browse the repository at this point in the history
  • Loading branch information
whyb authored Oct 20, 2023
1 parent b82d395 commit 84aaedb
Showing 1 changed file with 250 additions and 0 deletions.
250 changes: 250 additions & 0 deletions benchmark/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -6648,3 +6648,253 @@ cooling_down = 0
vision_transformer min = 600.83 max = 666.35 avg = 617.33
FastestDet min = 6.05 max = 6.72 avg = 6.23
```

### AMD Ryzen 9 5950X 16-Core (Desktop) [2023-10-12]
```
E:\github\ncnn\build-ncnn-vs2019\benchmark\Release>benchncnn.exe 100 16 0 -1 0
loop_count = 100
num_threads = 16
powersave = 0
gpu_device = -1
cooling_down = 0
squeezenet min = 2.68 max = 3.10 avg = 2.77
squeezenet_int8 min = 3.57 max = 4.72 avg = 4.04
mobilenet min = 3.09 max = 5.44 avg = 3.38
mobilenet_int8 min = 2.36 max = 3.40 avg = 2.74
mobilenet_v2 min = 4.24 max = 4.81 avg = 4.40
mobilenet_v3 min = 3.46 max = 3.93 avg = 3.58
shufflenet min = 3.21 max = 4.54 avg = 4.01
shufflenet_v2 min = 2.99 max = 4.49 avg = 3.34
mnasnet min = 3.62 max = 4.31 avg = 3.83
proxylessnasnet min = 4.06 max = 5.70 avg = 4.23
efficientnet_b0 min = 5.60 max = 6.55 avg = 5.81
efficientnetv2_b0 min = 6.83 max = 8.82 avg = 7.12
regnety_400m min = 8.02 max = 9.75 avg = 8.34
blazeface min = 1.34 max = 1.77 avg = 1.46
googlenet min = 11.62 max = 15.95 avg = 12.70
googlenet_int8 min = 7.43 max = 10.06 avg = 7.92
resnet18 min = 8.39 max = 10.39 avg = 9.04
resnet18_int8 min = 6.23 max = 8.64 avg = 6.75
alexnet min = 7.78 max = 12.51 avg = 8.51
vgg16 min = 53.85 max = 63.39 avg = 56.36
vgg16_int8 min = 35.61 max = 46.94 avg = 38.08
resnet50 min = 18.55 max = 24.46 avg = 19.81
resnet50_int8 min = 11.95 max = 23.21 avg = 13.51
squeezenet_ssd min = 10.01 max = 13.16 avg = 10.69
squeezenet_ssd_int8 min = 9.29 max = 14.02 avg = 10.47
mobilenet_ssd min = 6.38 max = 10.26 avg = 7.15
mobilenet_ssd_int8 min = 4.69 max = 6.98 avg = 5.42
mobilenet_yolo min = 17.63 max = 22.59 avg = 19.45
mobilenetv2_yolov3 min = 11.79 max = 15.67 avg = 12.76
yolov4-tiny min = 21.53 max = 25.79 avg = 22.46
nanodet_m min = 7.16 max = 9.99 avg = 8.01
yolo-fastest-1.1 min = 3.66 max = 5.00 avg = 4.38
yolo-fastestv2 min = 3.52 max = 5.20 avg = 4.60
vision_transformer min = 67.01 max = 93.71 avg = 78.48
FastestDet min = 4.44 max = 8.62 avg = 4.69
```

### AMD Radeon RX 6900 XT (Desktop) [2023-10-12]
```
E:\github\ncnn\build-ncnn-vs2019\benchmark\Release>benchncnn.exe 100 16 0 0 0
[0 AMD Radeon RX 6900 XT] queueC=1[2] queueG=0[1] queueT=2[2]
[0 AMD Radeon RX 6900 XT] bugsbn1=0 bugbilz=0 bugcopc=0 bugihfa=0
[0 AMD Radeon RX 6900 XT] fp16-p/s/a=1/1/1 int8-p/s/a=1/1/1
[0 AMD Radeon RX 6900 XT] subgroup=64 basic/vote/ballot/shuffle=1/1/1/1
[0 AMD Radeon RX 6900 XT] fp16-matrix-16_8_8/16_8_16/16_16_16=0/0/0
loop_count = 100
num_threads = 16
powersave = 0
gpu_device = 0
cooling_down = 0
squeezenet min = 2.19 max = 2.70 avg = 2.47
squeezenet_int8 min = 3.94 max = 4.51 avg = 4.18
mobilenet min = 2.03 max = 2.63 avg = 2.28
mobilenet_int8 min = 2.56 max = 3.34 avg = 2.69
mobilenet_v2 min = 2.29 max = 2.98 avg = 2.62
mobilenet_v3 min = 2.31 max = 3.10 avg = 2.75
shufflenet min = 1.89 max = 2.61 avg = 2.30
shufflenet_v2 min = 2.17 max = 3.04 avg = 2.59
mnasnet min = 2.19 max = 2.98 avg = 2.69
proxylessnasnet min = 2.12 max = 4.08 avg = 2.62
efficientnet_b0 min = 3.62 max = 5.27 avg = 4.21
efficientnetv2_b0 min = 6.09 max = 7.15 avg = 6.49
regnety_400m min = 2.55 max = 3.82 avg = 3.00
blazeface min = 1.93 max = 2.56 avg = 2.28
googlenet min = 3.35 max = 4.46 avg = 3.75
googlenet_int8 min = 8.02 max = 12.84 avg = 9.15
resnet18 min = 2.46 max = 3.14 avg = 2.84
resnet18_int8 min = 6.37 max = 9.15 avg = 7.30
alexnet min = 2.31 max = 2.91 avg = 2.69
vgg16 min = 4.76 max = 5.79 avg = 5.24
vgg16_int8 min = 35.94 max = 46.27 avg = 39.05
resnet50 min = 3.25 max = 4.09 avg = 3.75
resnet50_int8 min = 12.04 max = 20.53 avg = 14.61
squeezenet_ssd min = 3.03 max = 5.31 avg = 3.66
squeezenet_ssd_int8 min = 9.74 max = 13.46 avg = 10.42
mobilenet_ssd min = 2.82 max = 4.75 avg = 3.39
mobilenet_ssd_int8 min = 4.67 max = 6.76 avg = 5.30
mobilenet_yolo min = 3.01 max = 3.67 avg = 3.34
mobilenetv2_yolov3 min = 4.04 max = 6.46 avg = 4.55
yolov4-tiny min = 5.75 max = 8.05 avg = 6.52
nanodet_m min = 10.16 max = 14.97 avg = 13.11
yolo-fastest-1.1 min = 2.36 max = 3.80 avg = 2.88
yolo-fastestv2 min = 2.24 max = 3.19 avg = 2.80
vision_transformer min = 20.43 max = 25.06 avg = 21.07
FastestDet min = 2.49 max = 3.18 avg = 2.93
```

### NVIDIA GeForce RTX 3060 Ti (Desktop) [2023-10-12]
```
E:\github\ncnn\build-ncnn-vs2019\benchmark\Release>benchncnn.exe 100 16 0 0 0
[0 NVIDIA GeForce RTX 3060 Ti] queueC=2[8] queueG=0[16] queueT=1[2]
[0 NVIDIA GeForce RTX 3060 Ti] bugsbn1=0 bugbilz=0 bugcopc=0 bugihfa=0
[0 NVIDIA GeForce RTX 3060 Ti] fp16-p/s/a=1/1/1 int8-p/s/a=1/1/1
[0 NVIDIA GeForce RTX 3060 Ti] subgroup=32 basic/vote/ballot/shuffle=1/1/1/1
[0 NVIDIA GeForce RTX 3060 Ti] fp16-matrix-16_8_8/16_8_16/16_16_16=1/1/1
[1 Intel(R) UHD Graphics 770] queueC=0[1] queueG=0[1] queueT=0[1]
[1 Intel(R) UHD Graphics 770] bugsbn1=0 bugbilz=0 bugcopc=0 bugihfa=0
[1 Intel(R) UHD Graphics 770] fp16-p/s/a=1/1/1 int8-p/s/a=1/1/1
[1 Intel(R) UHD Graphics 770] subgroup=32 basic/vote/ballot/shuffle=1/1/1/1
[1 Intel(R) UHD Graphics 770] fp16-matrix-16_8_8/16_8_16/16_16_16=0/0/0
loop_count = 100
num_threads = 16
powersave = 0
gpu_device = 0
cooling_down = 0
squeezenet min = 0.80 max = 2.51 avg = 0.89
squeezenet_int8 min = 2.81 max = 3.51 avg = 2.96
mobilenet min = 0.70 max = 0.79 avg = 0.71
mobilenet_int8 min = 2.95 max = 3.44 avg = 3.03
mobilenet_v2 min = 1.09 max = 1.25 avg = 1.12
mobilenet_v3 min = 1.33 max = 2.04 avg = 1.56
shufflenet min = 1.20 max = 1.39 avg = 1.27
shufflenet_v2 min = 1.50 max = 1.66 avg = 1.57
mnasnet min = 1.11 max = 1.22 avg = 1.15
proxylessnasnet min = 1.20 max = 1.63 avg = 1.24
efficientnet_b0 min = 2.38 max = 3.21 avg = 2.61
efficientnetv2_b0 min = 9.16 max = 11.35 avg = 9.63
regnety_400m min = 1.86 max = 2.03 avg = 1.94
blazeface min = 0.70 max = 1.10 avg = 0.76
googlenet min = 2.11 max = 2.40 avg = 2.30
googlenet_int8 min = 6.91 max = 7.88 avg = 7.17
resnet18 min = 1.14 max = 1.47 avg = 1.19
resnet18_int8 min = 4.96 max = 6.82 avg = 5.40
alexnet min = 1.10 max = 1.85 avg = 1.19
vgg16 min = 2.27 max = 3.97 avg = 2.46
vgg16_int8 min = 19.02 max = 22.20 avg = 20.28
resnet50 min = 2.00 max = 2.99 avg = 2.10
resnet50_int8 min = 10.66 max = 13.30 avg = 11.29
squeezenet_ssd min = 2.74 max = 3.44 avg = 2.90
squeezenet_ssd_int8 min = 6.93 max = 7.95 avg = 7.19
mobilenet_ssd min = 1.86 max = 2.07 avg = 1.96
mobilenet_ssd_int8 min = 5.92 max = 6.48 avg = 6.09
mobilenet_yolo min = 1.65 max = 2.58 avg = 1.78
mobilenetv2_yolov3 min = 3.85 max = 4.11 avg = 3.96
yolov4-tiny min = 6.54 max = 7.05 avg = 6.69
nanodet_m min = 2.38 max = 3.28 avg = 2.72
yolo-fastest-1.1 min = 1.73 max = 2.07 avg = 1.83
yolo-fastestv2 min = 1.72 max = 1.92 avg = 1.80
vision_transformer min = 53.91 max = 56.59 avg = 55.27
FastestDet min = 1.48 max = 1.83 avg = 1.69
```

### Intel(R) UHD Graphics 770 (Desktop) [2023-10-12]
```
E:\github\ncnn\build-ncnn-vs2019\benchmark\Release>benchncnn.exe 100 16 0 1 0
[0 NVIDIA GeForce RTX 3060 Ti] queueC=2[8] queueG=0[16] queueT=1[2]
[0 NVIDIA GeForce RTX 3060 Ti] bugsbn1=0 bugbilz=0 bugcopc=0 bugihfa=0
[0 NVIDIA GeForce RTX 3060 Ti] fp16-p/s/a=1/1/1 int8-p/s/a=1/1/1
[0 NVIDIA GeForce RTX 3060 Ti] subgroup=32 basic/vote/ballot/shuffle=1/1/1/1
[0 NVIDIA GeForce RTX 3060 Ti] fp16-matrix-16_8_8/16_8_16/16_16_16=1/1/1
[1 Intel(R) UHD Graphics 770] queueC=0[1] queueG=0[1] queueT=0[1]
[1 Intel(R) UHD Graphics 770] bugsbn1=0 bugbilz=0 bugcopc=0 bugihfa=0
[1 Intel(R) UHD Graphics 770] fp16-p/s/a=1/1/1 int8-p/s/a=1/1/1
[1 Intel(R) UHD Graphics 770] subgroup=32 basic/vote/ballot/shuffle=1/1/1/1
[1 Intel(R) UHD Graphics 770] fp16-matrix-16_8_8/16_8_16/16_16_16=0/0/0
loop_count = 100
num_threads = 16
powersave = 0
gpu_device = 1
cooling_down = 0
squeezenet min = 3.11 max = 4.47 avg = 3.45
squeezenet_int8 min = 1.89 max = 2.84 avg = 2.23
mobilenet min = 4.98 max = 5.67 avg = 5.18
mobilenet_int8 min = 2.54 max = 3.17 avg = 2.98
mobilenet_v2 min = 4.03 max = 4.89 avg = 4.37
mobilenet_v3 min = 4.45 max = 5.68 avg = 4.86
shufflenet min = 3.42 max = 4.42 avg = 3.79
shufflenet_v2 min = 3.00 max = 4.01 avg = 3.30
mnasnet min = 4.21 max = 5.12 avg = 4.51
proxylessnasnet min = 4.62 max = 5.64 avg = 4.90
efficientnet_b0 min = 7.82 max = 8.63 avg = 8.10
efficientnetv2_b0 min = 34.52 max = 36.34 avg = 35.29
regnety_400m min = 6.07 max = 7.31 avg = 6.44
blazeface min = 1.54 max = 1.67 avg = 1.59
googlenet min = 11.53 max = 12.64 avg = 11.89
googlenet_int8 min = 13.71 max = 15.52 avg = 14.38
resnet18 min = 10.75 max = 12.94 avg = 11.07
resnet18_int8 min = 9.04 max = 11.05 avg = 9.53
alexnet min = 13.64 max = 14.37 avg = 13.98
vgg16 min = 38.53 max = 40.16 avg = 39.22
vgg16_int8 min = 16.04 max = 21.16 avg = 19.35
resnet50 min = 25.61 max = 28.22 avg = 26.62
resnet50_int8 min = 7.72 max = 12.83 avg = 10.29
squeezenet_ssd min = 10.34 max = 15.88 avg = 14.75
squeezenet_ssd_int8 min = 4.63 max = 7.13 avg = 5.66
mobilenet_ssd min = 11.35 max = 13.06 avg = 12.44
mobilenet_ssd_int8 min = 4.21 max = 6.31 avg = 5.32
mobilenet_yolo min = 20.14 max = 22.92 avg = 21.94
mobilenetv2_yolov3 min = 12.58 max = 14.88 avg = 14.21
yolov4-tiny min = 20.62 max = 25.58 avg = 24.39
nanodet_m min = 7.75 max = 12.49 avg = 11.42
yolo-fastest-1.1 min = 3.68 max = 6.49 avg = 5.54
yolo-fastestv2 min = 4.32 max = 5.39 avg = 4.51
vision_transformer min = 796.51 max = 805.29 avg = 802.39
FastestDet min = 2.89 max = 4.83 avg = 3.95
```

### Intel® Core™ i7-13700K (Desktop) [2023-10-12]
```
E:\github\ncnn\build-ncnn-vs2019\benchmark\Release>benchncnn.exe 100 16 0 -1 0
loop_count = 100
num_threads = 16
powersave = 0
gpu_device = -1
cooling_down = 0
squeezenet min = 1.69 max = 2.63 avg = 2.12
squeezenet_int8 min = 1.83 max = 3.03 avg = 2.26
mobilenet min = 1.69 max = 2.64 avg = 2.24
mobilenet_int8 min = 2.47 max = 3.06 avg = 2.84
mobilenet_v2 min = 1.94 max = 3.47 avg = 2.47
mobilenet_v3 min = 1.49 max = 2.74 avg = 1.87
shufflenet min = 1.57 max = 3.00 avg = 1.82
shufflenet_v2 min = 1.41 max = 1.72 avg = 1.51
mnasnet min = 1.73 max = 2.94 avg = 2.13
proxylessnasnet min = 2.08 max = 3.31 avg = 2.69
efficientnet_b0 min = 3.20 max = 4.99 avg = 3.78
efficientnetv2_b0 min = 3.51 max = 5.16 avg = 4.08
regnety_400m min = 4.51 max = 10.29 avg = 6.18
blazeface min = 0.52 max = 0.92 avg = 0.59
googlenet min = 5.49 max = 7.48 avg = 6.26
googlenet_int8 min = 4.83 max = 7.54 avg = 5.90
resnet18 min = 4.05 max = 6.61 avg = 4.83
resnet18_int8 min = 3.77 max = 5.70 avg = 4.57
alexnet min = 3.60 max = 5.09 avg = 4.26
vgg16 min = 25.19 max = 28.79 avg = 26.81
vgg16_int8 min = 17.52 max = 21.79 avg = 19.80
resnet50 min = 9.23 max = 13.15 avg = 11.34
resnet50_int8 min = 7.77 max = 12.00 avg = 10.18
squeezenet_ssd min = 4.33 max = 6.73 avg = 4.96
squeezenet_ssd_int8 min = 4.77 max = 7.62 avg = 5.71
mobilenet_ssd min = 3.70 max = 6.43 avg = 4.53
mobilenet_ssd_int8 min = 4.16 max = 6.53 avg = 5.38
mobilenet_yolo min = 11.27 max = 14.93 avg = 12.90
mobilenetv2_yolov3 min = 7.41 max = 11.52 avg = 9.11
yolov4-tiny min = 12.05 max = 18.96 avg = 14.15
nanodet_m min = 3.39 max = 5.77 avg = 4.07
yolo-fastest-1.1 min = 1.95 max = 3.85 avg = 2.30
yolo-fastestv2 min = 1.91 max = 3.52 avg = 2.27
vision_transformer min = 79.50 max = 99.93 avg = 88.91
FastestDet min = 1.92 max = 2.72 avg = 2.19
```

0 comments on commit 84aaedb

Please sign in to comment.