OVHcloud GPU benchmark - YOLO Prediction FP32
Go back to list
Like many deep learning models, YOLO offers 16-bit and 32-bit precision. This part covers FP32 performance:
# Select a sample by its size: uncomment exactly ONE of the sample= lines below.
# The first four URLs are 640px, 1024px, 1280px and 2560px wide thumbnails of the
# same picture; the last URL is the original, full-size file.
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/640px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/1024px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/1280px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/2560px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# Run the prediction benchmark on the selected image with the yolov8n model on the
# CUDA device. The expansion is quoted so the URL is passed as a single argument,
# and ${sample:?...} aborts with a clear message if no sample line was uncommented
# (instead of silently invoking the tool without an input image).
yolo-benchmark --model yolov8n.pt predict --conf 0.25 --iou 0.7 --device cuda "${sample:?uncomment one of the sample= lines above}"
{
"configuration": {
"chart": {
"type": "bar",
"polar": false,
"zoomType": "",
"options3d": {},
"height": 550,
"width": null,
"margin": null,
"inverted": false,
"zooming": {}
},
"credits": {
"enabled": false
},
"title": {
"text": "Input size: 69.7 KiB"
},
"colorAxis": null,
"subtitle": {
"text": ""
},
"xAxis": {
"title": {
"text": [
""
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": [
"provider__short_name",
"flavor__name",
"flavor__gpu_model"
],
"lineWidth": 1,
"tickInterval": null,
"tickWidth": 0,
"tickLength": 10,
"tickPixelInterval": null,
"plotLines": null,
"labels": {
"enabled": false,
"format": null,
"formatter": "",
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false,
"step": 0
},
"plotBands": null,
"visible": true,
"floor": null,
"ceiling": null,
"type": "linear",
"min": null,
"gridLineWidth": null,
"gridLineColor": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"tickmarkPlacement": null,
"units": null,
"minRange": null
},
"yAxis": {
"title": {
"text": [
"In msec<br>Lower is better"
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": null,
"plotLines": null,
"plotBands": null,
"lineWidth": null,
"tickInterval": null,
"tickLength": 10,
"floor": null,
"ceiling": null,
"gridLineInterpolation": null,
"gridLineWidth": 1,
"gridLineColor": "#CCC",
"min": null,
"max": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"minRange": null,
"type": "linear",
"tickmarkPlacement": null,
"labels": {
"enabled": true,
"formatter": null,
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false
}
},
"zAxis": {
"title": {
"text": "In msec<br>Lower is better"
}
},
"plotOptions": {
"series": {
"dataLabels": {
"enabled": true,
"format": "{series.name}",
"distance": 30,
"align": "left",
"inside": true,
"allowOverlap": false,
"style": {
"fontSize": "17px"
}
},
"showInLegend": null,
"turboThreshold": 1000,
"stacking": "",
"groupPadding": 0,
"centerInCategory": false,
"findNearestPointBy": "x"
}
},
"navigator": {
"enabled": false
},
"scrollbar": {
"enabled": false
},
"rangeSelector": {
"enabled": false,
"inputEnabled": false
},
"legend": {
"enabled": true,
"maxHeight": null,
"align": "center",
"verticalAlign": "bottom",
"layout": "horizontal",
"width": null,
"margin": 12,
"reversed": false
},
"series": [
{
"name": "AWS g5.xlarge NVIDIA A10G",
"data": [
[
0,
63.541014989217125
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "AWS p3.2xlarge Tesla V100-SXM2-16GB",
"data": [
[
1,
44.731855392456055
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL",
"data": [
[
2,
32.56034851074219
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB",
"data": [
[
3,
42.78095563252767
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB",
"data": [
[
4,
56.84415499369303
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB",
"data": [
[
5,
52.193800608317055
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google g2-standard-16 NVIDIA L4",
"data": [
[
6,
61.9044303894043
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB",
"data": [
[
7,
42.34556357065836
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "OVH H100-380 NVIDIA H100 PCIe",
"data": [
[
8,
32.1810245513916
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L4-90 NVIDIA L4",
"data": [
[
9,
30.471007029215496
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L40S-90 NVIDIA L40S",
"data": [
[
10,
31.811753908793133
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH T1-LE-45 Tesla V100-PCIE-16GB",
"data": [
[
11,
46.828111012776695
]
],
"grouping": false,
"color": "#484848"
}
],
"drilldown": {},
"tooltip": {
"enabled": true,
"useHTML": false,
"format": null,
"headerFormat": "",
"pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>",
"footerFormat": "",
"shared": false,
"outside": false,
"valueDecimals": null,
"split": false
},
"annotations": null
},
"hc_type": "chart",
"id": "71400"
}
{
"configuration": {
"chart": {
"type": "bar",
"polar": false,
"zoomType": "",
"options3d": {},
"height": 550,
"width": null,
"margin": null,
"inverted": false,
"zooming": {}
},
"credits": {
"enabled": false
},
"title": {
"text": "Input size: 135.4 KiB"
},
"colorAxis": null,
"subtitle": {
"text": ""
},
"xAxis": {
"title": {
"text": [
""
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": [
"provider__short_name",
"flavor__name",
"flavor__gpu_model"
],
"lineWidth": 1,
"tickInterval": null,
"tickWidth": 0,
"tickLength": 10,
"tickPixelInterval": null,
"plotLines": null,
"labels": {
"enabled": false,
"format": null,
"formatter": "",
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false,
"step": 0
},
"plotBands": null,
"visible": true,
"floor": null,
"ceiling": null,
"type": "linear",
"min": null,
"gridLineWidth": null,
"gridLineColor": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"tickmarkPlacement": null,
"units": null,
"minRange": null
},
"yAxis": {
"title": {
"text": [
"In msec<br>Lower is better"
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": null,
"plotLines": null,
"plotBands": null,
"lineWidth": null,
"tickInterval": null,
"tickLength": 10,
"floor": null,
"ceiling": null,
"gridLineInterpolation": null,
"gridLineWidth": 1,
"gridLineColor": "#CCC",
"min": null,
"max": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"minRange": null,
"type": "linear",
"tickmarkPlacement": null,
"labels": {
"enabled": true,
"formatter": null,
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false
}
},
"zAxis": {
"title": {
"text": "In msec<br>Lower is better"
}
},
"plotOptions": {
"series": {
"dataLabels": {
"enabled": true,
"format": "{series.name}",
"distance": 30,
"align": "left",
"inside": true,
"allowOverlap": false,
"style": {
"fontSize": "17px"
}
},
"showInLegend": null,
"turboThreshold": 1000,
"stacking": "",
"groupPadding": 0,
"centerInCategory": false,
"findNearestPointBy": "x"
}
},
"navigator": {
"enabled": false
},
"scrollbar": {
"enabled": false
},
"rangeSelector": {
"enabled": false,
"inputEnabled": false
},
"legend": {
"enabled": true,
"maxHeight": null,
"align": "center",
"verticalAlign": "bottom",
"layout": "horizontal",
"width": null,
"margin": 12,
"reversed": false
},
"series": [
{
"name": "AWS g5.xlarge NVIDIA A10G",
"data": [
[
0,
58.82620811462402
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "AWS p3.2xlarge Tesla V100-SXM2-16GB",
"data": [
[
1,
45.35531997680664
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL",
"data": [
[
2,
32.769362131754555
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB",
"data": [
[
3,
41.556755701700844
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB",
"data": [
[
4,
52.40329106648763
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB",
"data": [
[
5,
51.0107676188151
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google g2-standard-16 NVIDIA L4",
"data": [
[
6,
61.499993006388344
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB",
"data": [
[
7,
39.97830549875895
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "OVH H100-380 NVIDIA H100 PCIe",
"data": [
[
8,
32.185872395833336
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L4-90 NVIDIA L4",
"data": [
[
9,
30.333280563354492
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L40S-90 NVIDIA L40S",
"data": [
[
10,
32.119552294413246
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH T1-LE-45 Tesla V100-PCIE-16GB",
"data": [
[
11,
45.29102643330892
]
],
"grouping": false,
"color": "#484848"
}
],
"drilldown": {},
"tooltip": {
"enabled": true,
"useHTML": false,
"format": null,
"headerFormat": "",
"pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>",
"footerFormat": "",
"shared": false,
"outside": false,
"valueDecimals": null,
"split": false
},
"annotations": null
},
"hc_type": "chart",
"id": "138602"
}
{
"configuration": {
"chart": {
"type": "bar",
"polar": false,
"zoomType": "",
"options3d": {},
"height": 550,
"width": null,
"margin": null,
"inverted": false,
"zooming": {}
},
"credits": {
"enabled": false
},
"title": {
"text": "Input size: 186.7 KiB"
},
"colorAxis": null,
"subtitle": {
"text": ""
},
"xAxis": {
"title": {
"text": [
""
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": [
"provider__short_name",
"flavor__name",
"flavor__gpu_model"
],
"lineWidth": 1,
"tickInterval": null,
"tickWidth": 0,
"tickLength": 10,
"tickPixelInterval": null,
"plotLines": null,
"labels": {
"enabled": false,
"format": null,
"formatter": "",
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false,
"step": 0
},
"plotBands": null,
"visible": true,
"floor": null,
"ceiling": null,
"type": "linear",
"min": null,
"gridLineWidth": null,
"gridLineColor": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"tickmarkPlacement": null,
"units": null,
"minRange": null
},
"yAxis": {
"title": {
"text": [
"In msec<br>Lower is better"
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": null,
"plotLines": null,
"plotBands": null,
"lineWidth": null,
"tickInterval": null,
"tickLength": 10,
"floor": null,
"ceiling": null,
"gridLineInterpolation": null,
"gridLineWidth": 1,
"gridLineColor": "#CCC",
"min": null,
"max": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"minRange": null,
"type": "linear",
"tickmarkPlacement": null,
"labels": {
"enabled": true,
"formatter": null,
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false
}
},
"zAxis": {
"title": {
"text": "In msec<br>Lower is better"
}
},
"plotOptions": {
"series": {
"dataLabels": {
"enabled": true,
"format": "{series.name}",
"distance": 30,
"align": "left",
"inside": true,
"allowOverlap": false,
"style": {
"fontSize": "17px"
}
},
"showInLegend": null,
"turboThreshold": 1000,
"stacking": "",
"groupPadding": 0,
"centerInCategory": false,
"findNearestPointBy": "x"
}
},
"navigator": {
"enabled": false
},
"scrollbar": {
"enabled": false
},
"rangeSelector": {
"enabled": false,
"inputEnabled": false
},
"legend": {
"enabled": true,
"maxHeight": null,
"align": "center",
"verticalAlign": "bottom",
"layout": "horizontal",
"width": null,
"margin": 12,
"reversed": false
},
"series": [
{
"name": "AWS g5.xlarge NVIDIA A10G",
"data": [
[
0,
59.05787150065104
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "AWS p3.2xlarge Tesla V100-SXM2-16GB",
"data": [
[
1,
44.096151987711586
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL",
"data": [
[
2,
32.49502182006836
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB",
"data": [
[
3,
40.10136922200521
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB",
"data": [
[
4,
55.02160390218099
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB",
"data": [
[
5,
50.93057950337728
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google g2-standard-16 NVIDIA L4",
"data": [
[
6,
61.77063783009847
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB",
"data": [
[
7,
40.11444250742594
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "OVH H100-380 NVIDIA H100 PCIe",
"data": [
[
8,
32.392263412475586
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L4-90 NVIDIA L4",
"data": [
[
9,
30.46703338623047
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L40S-90 NVIDIA L40S",
"data": [
[
10,
32.416343688964844
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH T1-LE-45 Tesla V100-PCIE-16GB",
"data": [
[
11,
46.94358507792155
]
],
"grouping": false,
"color": "#484848"
}
],
"drilldown": {},
"tooltip": {
"enabled": true,
"useHTML": false,
"format": null,
"headerFormat": "",
"pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>",
"footerFormat": "",
"shared": false,
"outside": false,
"valueDecimals": null,
"split": false
},
"annotations": null
},
"hc_type": "chart",
"id": "191185"
}
{
"configuration": {
"chart": {
"type": "bar",
"polar": false,
"zoomType": "",
"options3d": {},
"height": 550,
"width": null,
"margin": null,
"inverted": false,
"zooming": {}
},
"credits": {
"enabled": false
},
"title": {
"text": "Input size: 647.1 KiB"
},
"colorAxis": null,
"subtitle": {
"text": ""
},
"xAxis": {
"title": {
"text": [
""
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": [
"provider__short_name",
"flavor__name",
"flavor__gpu_model"
],
"lineWidth": 1,
"tickInterval": null,
"tickWidth": 0,
"tickLength": 10,
"tickPixelInterval": null,
"plotLines": null,
"labels": {
"enabled": false,
"format": null,
"formatter": "",
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false,
"step": 0
},
"plotBands": null,
"visible": true,
"floor": null,
"ceiling": null,
"type": "linear",
"min": null,
"gridLineWidth": null,
"gridLineColor": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"tickmarkPlacement": null,
"units": null,
"minRange": null
},
"yAxis": {
"title": {
"text": [
"In msec<br>Lower is better"
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": null,
"plotLines": null,
"plotBands": null,
"lineWidth": null,
"tickInterval": null,
"tickLength": 10,
"floor": null,
"ceiling": null,
"gridLineInterpolation": null,
"gridLineWidth": 1,
"gridLineColor": "#CCC",
"min": null,
"max": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"minRange": null,
"type": "linear",
"tickmarkPlacement": null,
"labels": {
"enabled": true,
"formatter": null,
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false
}
},
"zAxis": {
"title": {
"text": "In msec<br>Lower is better"
}
},
"plotOptions": {
"series": {
"dataLabels": {
"enabled": true,
"format": "{series.name}",
"distance": 30,
"align": "left",
"inside": true,
"allowOverlap": false,
"style": {
"fontSize": "17px"
}
},
"showInLegend": null,
"turboThreshold": 1000,
"stacking": "",
"groupPadding": 0,
"centerInCategory": false,
"findNearestPointBy": "x"
}
},
"navigator": {
"enabled": false
},
"scrollbar": {
"enabled": false
},
"rangeSelector": {
"enabled": false,
"inputEnabled": false
},
"legend": {
"enabled": true,
"maxHeight": null,
"align": "center",
"verticalAlign": "bottom",
"layout": "horizontal",
"width": null,
"margin": 12,
"reversed": false
},
"series": [
{
"name": "AWS g5.xlarge NVIDIA A10G",
"data": [
[
0,
58.95638465881348
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "AWS p3.2xlarge Tesla V100-SXM2-16GB",
"data": [
[
1,
45.36318778991699
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL",
"data": [
[
2,
32.25954373677572
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB",
"data": [
[
3,
43.50113868713379
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB",
"data": [
[
4,
52.22320556640625
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB",
"data": [
[
5,
51.247358322143555
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google g2-standard-16 NVIDIA L4",
"data": [
[
6,
61.21468544006348
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB",
"data": [
[
7,
40.665229161580406
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "OVH H100-380 NVIDIA H100 PCIe",
"data": [
[
8,
33.150831858317055
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L4-90 NVIDIA L4",
"data": [
[
9,
30.71769078572591
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L40S-90 NVIDIA L40S",
"data": [
[
10,
32.66290823618571
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH T1-LE-45 Tesla V100-PCIE-16GB",
"data": [
[
11,
45.86418469746908
]
],
"grouping": false,
"color": "#484848"
}
],
"drilldown": {},
"tooltip": {
"enabled": true,
"useHTML": false,
"format": null,
"headerFormat": "",
"pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>",
"footerFormat": "",
"shared": false,
"outside": false,
"valueDecimals": null,
"split": false
},
"annotations": null
},
"hc_type": "chart",
"id": "662665"
}
{
"configuration": {
"chart": {
"type": "bar",
"polar": false,
"zoomType": "",
"options3d": {},
"height": 550,
"width": null,
"margin": null,
"inverted": false,
"zooming": {}
},
"credits": {
"enabled": false
},
"title": {
"text": "Input size: 13.0 MiB"
},
"colorAxis": null,
"subtitle": {
"text": ""
},
"xAxis": {
"title": {
"text": [
""
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": [
"provider__short_name",
"flavor__name",
"flavor__gpu_model"
],
"lineWidth": 1,
"tickInterval": null,
"tickWidth": 0,
"tickLength": 10,
"tickPixelInterval": null,
"plotLines": null,
"labels": {
"enabled": false,
"format": null,
"formatter": "",
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false,
"step": 0
},
"plotBands": null,
"visible": true,
"floor": null,
"ceiling": null,
"type": "linear",
"min": null,
"gridLineWidth": null,
"gridLineColor": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"tickmarkPlacement": null,
"units": null,
"minRange": null
},
"yAxis": {
"title": {
"text": [
"In msec<br>Lower is better"
],
"useHTML": false,
"style": {
"color": "#666666"
}
},
"categories": null,
"plotLines": null,
"plotBands": null,
"lineWidth": null,
"tickInterval": null,
"tickLength": 10,
"floor": null,
"ceiling": null,
"gridLineInterpolation": null,
"gridLineWidth": 1,
"gridLineColor": "#CCC",
"min": null,
"max": null,
"minorTickInterval": null,
"minorTickWidth": 0,
"minTickInterval": null,
"startOnTick": true,
"endOnTick": null,
"minRange": null,
"type": "linear",
"tickmarkPlacement": null,
"labels": {
"enabled": true,
"formatter": null,
"style": {
"color": "#666666",
"cursor": "default",
"fontSize": "11px"
},
"useHTML": false
}
},
"zAxis": {
"title": {
"text": "In msec<br>Lower is better"
}
},
"plotOptions": {
"series": {
"dataLabels": {
"enabled": true,
"format": "{series.name}",
"distance": 30,
"align": "left",
"inside": true,
"allowOverlap": false,
"style": {
"fontSize": "17px"
}
},
"showInLegend": null,
"turboThreshold": 1000,
"stacking": "",
"groupPadding": 0,
"centerInCategory": false,
"findNearestPointBy": "x"
}
},
"navigator": {
"enabled": false
},
"scrollbar": {
"enabled": false
},
"rangeSelector": {
"enabled": false,
"inputEnabled": false
},
"legend": {
"enabled": true,
"maxHeight": null,
"align": "center",
"verticalAlign": "bottom",
"layout": "horizontal",
"width": null,
"margin": 12,
"reversed": false
},
"series": [
{
"name": "AWS g5.xlarge NVIDIA A10G",
"data": [
[
0,
58.710177739461265
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "AWS p3.2xlarge Tesla V100-SXM2-16GB",
"data": [
[
1,
44.76610819498698
]
],
"grouping": false,
"color": "#f7981d"
},
{
"name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL",
"data": [
[
2,
32.493034998575844
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB",
"data": [
[
3,
40.297905604044594
]
],
"grouping": false,
"color": "#55b3ff"
},
{
"name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB",
"data": [
[
4,
53.98313204447428
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB",
"data": [
[
5,
51.91572507222494
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google g2-standard-16 NVIDIA L4",
"data": [
[
6,
61.28187974294027
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB",
"data": [
[
7,
40.47147432963053
]
],
"grouping": false,
"color": "#55b400"
},
{
"name": "OVH H100-380 NVIDIA H100 PCIe",
"data": [
[
8,
31.942208607991535
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L4-90 NVIDIA L4",
"data": [
[
9,
29.933929443359375
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH L40S-90 NVIDIA L40S",
"data": [
[
10,
31.40572706858317
]
],
"grouping": false,
"color": "#484848"
},
{
"name": "OVH T1-LE-45 Tesla V100-PCIE-16GB",
"data": [
[
11,
42.141358057657875
]
],
"grouping": false,
"color": "#484848"
}
],
"drilldown": {},
"tooltip": {
"enabled": true,
"useHTML": false,
"format": null,
"headerFormat": "",
"pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>",
"footerFormat": "",
"shared": false,
"outside": false,
"valueDecimals": null,
"split": false
},
"annotations": null
},
"hc_type": "chart",
"id": "13601264"
}
Cloud Mercato's observations:
- The image size doesn't influence the inference performance
- The H100 and L40S instances, along with OVH's L4, have the best timings in the panel (Google's L4 instance is among the slowest)