OVHcloud GPU benchmark - YOLO Prediction FP16

Go back to list

YOLO is a family of real-time object detection and image segmentation models. For this benchmark we used YOLOv8, built by Ultralytics. We evaluate computer vision inference speed with our tool, yolo-benchmark.

# Select a sample by its size:
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/640px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/1024px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/1280px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/thumb/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg/2560px-2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"
# sample="https://upload.wikimedia.org/wikipedia/commons/f/f3/2018-10-12_Wrestling_Boys_Greco-Roman_45kg_at_2018_Summer_Youth_Olympics_%E2%80%93_Medal_Ceremony_%28Martin_Rulsch%29_16.jpg"

yolo-benchmark --model yolov8n.pt predict --conf 0.25 --iou 0.7 --device cuda --half $sample
{ "configuration": { "chart": { "type": "bar", "polar": false, "zoomType": "", "options3d": {}, "height": 550, "width": null, "margin": null, "inverted": false, "zooming": {} }, "credits": { "enabled": false }, "title": { "text": "Input size: 69.7 KiB" }, "colorAxis": null, "subtitle": { "text": "" }, "xAxis": { "title": { "text": [ "" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": [ "provider__short_name", "flavor__name", "flavor__gpu_model" ], "lineWidth": 1, "tickInterval": null, "tickWidth": 0, "tickLength": 10, "tickPixelInterval": null, "plotLines": null, "labels": { "enabled": false, "format": null, "formatter": "", "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false, "step": 0 }, "plotBands": null, "visible": true, "floor": null, "ceiling": null, "type": "linear", "min": null, "gridLineWidth": null, "gridLineColor": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "tickmarkPlacement": null, "units": null, "minRange": null }, "yAxis": { "title": { "text": [ "In msec<br>Lower is better" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": null, "plotLines": null, "plotBands": null, "lineWidth": null, "tickInterval": null, "tickLength": 10, "floor": null, "ceiling": null, "gridLineInterpolation": null, "gridLineWidth": 1, "gridLineColor": "#CCC", "min": null, "max": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "minRange": null, "type": "linear", "tickmarkPlacement": null, "labels": { "enabled": true, "formatter": null, "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false } }, "zAxis": { "title": { "text": "In msec<br>Lower is better" } }, "plotOptions": { "series": { "dataLabels": { "enabled": true, "format": "{series.name}", "distance": 30, "align": "left", "inside": true, "allowOverlap": false, 
"style": { "fontSize": "17px" } }, "showInLegend": null, "turboThreshold": 1000, "stacking": "", "groupPadding": 0, "centerInCategory": false, "findNearestPointBy": "x" } }, "navigator": { "enabled": false }, "scrollbar": { "enabled": false }, "rangeSelector": { "enabled": false, "inputEnabled": false }, "legend": { "enabled": true, "maxHeight": null, "align": "center", "verticalAlign": "bottom", "layout": "horizontal", "width": null, "margin": 12, "reversed": false }, "series": [ { "name": "AWS g5.xlarge NVIDIA A10G", "data": [ [ 0, 76.26144091288249 ] ], "grouping": false, "color": "#f7981d" }, { "name": "AWS p3.2xlarge Tesla V100-SXM2-16GB", "data": [ [ 1, 118.66251627604167 ] ], "grouping": false, "color": "#f7981d" }, { "name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL", "data": [ [ 2, 37.31489181518555 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB", "data": [ [ 3, 108.90849431355794 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB", "data": [ [ 4, 84.58916346232097 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB", "data": [ [ 5, 81.57706260681152 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google g2-standard-16 NVIDIA L4", "data": [ [ 6, 97.2826878229777 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB", "data": [ [ 7, 113.28983306884766 ] ], "grouping": false, "color": "#55b400" }, { "name": "OVH H100-380 NVIDIA H100 PCIe", "data": [ [ 8, 200.04717508951822 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L4-90 NVIDIA L4", "data": [ [ 9, 49.28978284200033 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L40S-90 NVIDIA L40S", "data": [ [ 10, 50.87423324584961 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH T1-LE-45 Tesla V100-PCIE-16GB", "data": [ [ 11, 121.71395619710286 ] 
], "grouping": false, "color": "#484848" } ], "drilldown": {}, "tooltip": { "enabled": true, "useHTML": false, "format": null, "headerFormat": "", "pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>", "footerFormat": "", "shared": false, "outside": false, "valueDecimals": null, "split": false }, "annotations": null }, "hc_type": "chart", "id": "71400" }
{ "configuration": { "chart": { "type": "bar", "polar": false, "zoomType": "", "options3d": {}, "height": 550, "width": null, "margin": null, "inverted": false, "zooming": {} }, "credits": { "enabled": false }, "title": { "text": "Input size: 135.4 KiB" }, "colorAxis": null, "subtitle": { "text": "" }, "xAxis": { "title": { "text": [ "" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": [ "provider__short_name", "flavor__name", "flavor__gpu_model" ], "lineWidth": 1, "tickInterval": null, "tickWidth": 0, "tickLength": 10, "tickPixelInterval": null, "plotLines": null, "labels": { "enabled": false, "format": null, "formatter": "", "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false, "step": 0 }, "plotBands": null, "visible": true, "floor": null, "ceiling": null, "type": "linear", "min": null, "gridLineWidth": null, "gridLineColor": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "tickmarkPlacement": null, "units": null, "minRange": null }, "yAxis": { "title": { "text": [ "In msec<br>Lower is better" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": null, "plotLines": null, "plotBands": null, "lineWidth": null, "tickInterval": null, "tickLength": 10, "floor": null, "ceiling": null, "gridLineInterpolation": null, "gridLineWidth": 1, "gridLineColor": "#CCC", "min": null, "max": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "minRange": null, "type": "linear", "tickmarkPlacement": null, "labels": { "enabled": true, "formatter": null, "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false } }, "zAxis": { "title": { "text": "In msec<br>Lower is better" } }, "plotOptions": { "series": { "dataLabels": { "enabled": true, "format": "{series.name}", "distance": 30, "align": "left", "inside": true, "allowOverlap": false, 
"style": { "fontSize": "17px" } }, "showInLegend": null, "turboThreshold": 1000, "stacking": "", "groupPadding": 0, "centerInCategory": false, "findNearestPointBy": "x" } }, "navigator": { "enabled": false }, "scrollbar": { "enabled": false }, "rangeSelector": { "enabled": false, "inputEnabled": false }, "legend": { "enabled": true, "maxHeight": null, "align": "center", "verticalAlign": "bottom", "layout": "horizontal", "width": null, "margin": 12, "reversed": false }, "series": [ { "name": "AWS g5.xlarge NVIDIA A10G", "data": [ [ 0, 75.60261090596516 ] ], "grouping": false, "color": "#f7981d" }, { "name": "AWS p3.2xlarge Tesla V100-SXM2-16GB", "data": [ [ 1, 118.8672383626302 ] ], "grouping": false, "color": "#f7981d" }, { "name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL", "data": [ [ 2, 37.12813059488932 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB", "data": [ [ 3, 107.02848434448242 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB", "data": [ [ 4, 86.71895662943523 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB", "data": [ [ 5, 80.18716176350911 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google g2-standard-16 NVIDIA L4", "data": [ [ 6, 97.41075833638509 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB", "data": [ [ 7, 110.44355233510335 ] ], "grouping": false, "color": "#55b400" }, { "name": "OVH H100-380 NVIDIA H100 PCIe", "data": [ [ 8, 207.612673441569 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L4-90 NVIDIA L4", "data": [ [ 9, 49.45063591003418 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L40S-90 NVIDIA L40S", "data": [ [ 10, 51.17424329121908 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH T1-LE-45 Tesla V100-PCIE-16GB", "data": [ [ 11, 109.5736026763916 ] ], 
"grouping": false, "color": "#484848" } ], "drilldown": {}, "tooltip": { "enabled": true, "useHTML": false, "format": null, "headerFormat": "", "pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>", "footerFormat": "", "shared": false, "outside": false, "valueDecimals": null, "split": false }, "annotations": null }, "hc_type": "chart", "id": "138602" }
{ "configuration": { "chart": { "type": "bar", "polar": false, "zoomType": "", "options3d": {}, "height": 550, "width": null, "margin": null, "inverted": false, "zooming": {} }, "credits": { "enabled": false }, "title": { "text": "Input size: 186.7 KiB" }, "colorAxis": null, "subtitle": { "text": "" }, "xAxis": { "title": { "text": [ "" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": [ "provider__short_name", "flavor__name", "flavor__gpu_model" ], "lineWidth": 1, "tickInterval": null, "tickWidth": 0, "tickLength": 10, "tickPixelInterval": null, "plotLines": null, "labels": { "enabled": false, "format": null, "formatter": "", "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false, "step": 0 }, "plotBands": null, "visible": true, "floor": null, "ceiling": null, "type": "linear", "min": null, "gridLineWidth": null, "gridLineColor": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "tickmarkPlacement": null, "units": null, "minRange": null }, "yAxis": { "title": { "text": [ "In msec<br>Lower is better" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": null, "plotLines": null, "plotBands": null, "lineWidth": null, "tickInterval": null, "tickLength": 10, "floor": null, "ceiling": null, "gridLineInterpolation": null, "gridLineWidth": 1, "gridLineColor": "#CCC", "min": null, "max": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "minRange": null, "type": "linear", "tickmarkPlacement": null, "labels": { "enabled": true, "formatter": null, "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false } }, "zAxis": { "title": { "text": "In msec<br>Lower is better" } }, "plotOptions": { "series": { "dataLabels": { "enabled": true, "format": "{series.name}", "distance": 30, "align": "left", "inside": true, "allowOverlap": false, 
"style": { "fontSize": "17px" } }, "showInLegend": null, "turboThreshold": 1000, "stacking": "", "groupPadding": 0, "centerInCategory": false, "findNearestPointBy": "x" } }, "navigator": { "enabled": false }, "scrollbar": { "enabled": false }, "rangeSelector": { "enabled": false, "inputEnabled": false }, "legend": { "enabled": true, "maxHeight": null, "align": "center", "verticalAlign": "bottom", "layout": "horizontal", "width": null, "margin": 12, "reversed": false }, "series": [ { "name": "AWS g5.xlarge NVIDIA A10G", "data": [ [ 0, 75.37023226420085 ] ], "grouping": false, "color": "#f7981d" }, { "name": "AWS p3.2xlarge Tesla V100-SXM2-16GB", "data": [ [ 1, 118.09444427490234 ] ], "grouping": false, "color": "#f7981d" }, { "name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL", "data": [ [ 2, 37.46565183003744 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB", "data": [ [ 3, 105.00009854634602 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB", "data": [ [ 4, 81.18716875712077 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB", "data": [ [ 5, 78.89080047607422 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google g2-standard-16 NVIDIA L4", "data": [ [ 6, 97.16959794362386 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB", "data": [ [ 7, 110.89591185251872 ] ], "grouping": false, "color": "#55b400" }, { "name": "OVH H100-380 NVIDIA H100 PCIe", "data": [ [ 8, 201.9814650217692 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L4-90 NVIDIA L4", "data": [ [ 9, 48.88478914896647 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L40S-90 NVIDIA L40S", "data": [ [ 10, 51.178812980651855 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH T1-LE-45 Tesla V100-PCIE-16GB", "data": [ [ 11, 114.0898068745931 ] 
], "grouping": false, "color": "#484848" } ], "drilldown": {}, "tooltip": { "enabled": true, "useHTML": false, "format": null, "headerFormat": "", "pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>", "footerFormat": "", "shared": false, "outside": false, "valueDecimals": null, "split": false }, "annotations": null }, "hc_type": "chart", "id": "191185" }
{ "configuration": { "chart": { "type": "bar", "polar": false, "zoomType": "", "options3d": {}, "height": 550, "width": null, "margin": null, "inverted": false, "zooming": {} }, "credits": { "enabled": false }, "title": { "text": "Input size: 647.1 KiB" }, "colorAxis": null, "subtitle": { "text": "" }, "xAxis": { "title": { "text": [ "" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": [ "provider__short_name", "flavor__name", "flavor__gpu_model" ], "lineWidth": 1, "tickInterval": null, "tickWidth": 0, "tickLength": 10, "tickPixelInterval": null, "plotLines": null, "labels": { "enabled": false, "format": null, "formatter": "", "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false, "step": 0 }, "plotBands": null, "visible": true, "floor": null, "ceiling": null, "type": "linear", "min": null, "gridLineWidth": null, "gridLineColor": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "tickmarkPlacement": null, "units": null, "minRange": null }, "yAxis": { "title": { "text": [ "In msec<br>Lower is better" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": null, "plotLines": null, "plotBands": null, "lineWidth": null, "tickInterval": null, "tickLength": 10, "floor": null, "ceiling": null, "gridLineInterpolation": null, "gridLineWidth": 1, "gridLineColor": "#CCC", "min": null, "max": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "minRange": null, "type": "linear", "tickmarkPlacement": null, "labels": { "enabled": true, "formatter": null, "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false } }, "zAxis": { "title": { "text": "In msec<br>Lower is better" } }, "plotOptions": { "series": { "dataLabels": { "enabled": true, "format": "{series.name}", "distance": 30, "align": "left", "inside": true, "allowOverlap": false, 
"style": { "fontSize": "17px" } }, "showInLegend": null, "turboThreshold": 1000, "stacking": "", "groupPadding": 0, "centerInCategory": false, "findNearestPointBy": "x" } }, "navigator": { "enabled": false }, "scrollbar": { "enabled": false }, "rangeSelector": { "enabled": false, "inputEnabled": false }, "legend": { "enabled": true, "maxHeight": null, "align": "center", "verticalAlign": "bottom", "layout": "horizontal", "width": null, "margin": 12, "reversed": false }, "series": [ { "name": "AWS g5.xlarge NVIDIA A10G", "data": [ [ 0, 75.2865473429362 ] ], "grouping": false, "color": "#f7981d" }, { "name": "AWS p3.2xlarge Tesla V100-SXM2-16GB", "data": [ [ 1, 117.53646532694499 ] ], "grouping": false, "color": "#f7981d" }, { "name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL", "data": [ [ 2, 36.9873841603597 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB", "data": [ [ 3, 112.85018920898438 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB", "data": [ [ 4, 84.50357119242351 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB", "data": [ [ 5, 79.35349146525066 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google g2-standard-16 NVIDIA L4", "data": [ [ 6, 97.25594520568848 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB", "data": [ [ 7, 113.36350440979004 ] ], "grouping": false, "color": "#55b400" }, { "name": "OVH H100-380 NVIDIA H100 PCIe", "data": [ [ 8, 211.49571736653647 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L4-90 NVIDIA L4", "data": [ [ 9, 49.29216702779134 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L40S-90 NVIDIA L40S", "data": [ [ 10, 51.41135056813558 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH T1-LE-45 Tesla V100-PCIE-16GB", "data": [ [ 11, 108.14380645751953 ] ], 
"grouping": false, "color": "#484848" } ], "drilldown": {}, "tooltip": { "enabled": true, "useHTML": false, "format": null, "headerFormat": "", "pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>", "footerFormat": "", "shared": false, "outside": false, "valueDecimals": null, "split": false }, "annotations": null }, "hc_type": "chart", "id": "662665" }
{ "configuration": { "chart": { "type": "bar", "polar": false, "zoomType": "", "options3d": {}, "height": 550, "width": null, "margin": null, "inverted": false, "zooming": {} }, "credits": { "enabled": false }, "title": { "text": "Input size: 13.0 MiB" }, "colorAxis": null, "subtitle": { "text": "" }, "xAxis": { "title": { "text": [ "" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": [ "provider__short_name", "flavor__name", "flavor__gpu_model" ], "lineWidth": 1, "tickInterval": null, "tickWidth": 0, "tickLength": 10, "tickPixelInterval": null, "plotLines": null, "labels": { "enabled": false, "format": null, "formatter": "", "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false, "step": 0 }, "plotBands": null, "visible": true, "floor": null, "ceiling": null, "type": "linear", "min": null, "gridLineWidth": null, "gridLineColor": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "tickmarkPlacement": null, "units": null, "minRange": null }, "yAxis": { "title": { "text": [ "In msec<br>Lower is better" ], "useHTML": false, "style": { "color": "#666666" } }, "categories": null, "plotLines": null, "plotBands": null, "lineWidth": null, "tickInterval": null, "tickLength": 10, "floor": null, "ceiling": null, "gridLineInterpolation": null, "gridLineWidth": 1, "gridLineColor": "#CCC", "min": null, "max": null, "minorTickInterval": null, "minorTickWidth": 0, "minTickInterval": null, "startOnTick": true, "endOnTick": null, "minRange": null, "type": "linear", "tickmarkPlacement": null, "labels": { "enabled": true, "formatter": null, "style": { "color": "#666666", "cursor": "default", "fontSize": "11px" }, "useHTML": false } }, "zAxis": { "title": { "text": "In msec<br>Lower is better" } }, "plotOptions": { "series": { "dataLabels": { "enabled": true, "format": "{series.name}", "distance": 30, "align": "left", "inside": true, "allowOverlap": false, 
"style": { "fontSize": "17px" } }, "showInLegend": null, "turboThreshold": 1000, "stacking": "", "groupPadding": 0, "centerInCategory": false, "findNearestPointBy": "x" } }, "navigator": { "enabled": false }, "scrollbar": { "enabled": false }, "rangeSelector": { "enabled": false, "inputEnabled": false }, "legend": { "enabled": true, "maxHeight": null, "align": "center", "verticalAlign": "bottom", "layout": "horizontal", "width": null, "margin": 12, "reversed": false }, "series": [ { "name": "AWS g5.xlarge NVIDIA A10G", "data": [ [ 0, 75.08659362792969 ] ], "grouping": false, "color": "#f7981d" }, { "name": "AWS p3.2xlarge Tesla V100-SXM2-16GB", "data": [ [ 1, 118.12901496887207 ] ], "grouping": false, "color": "#f7981d" }, { "name": "Azure Standard_NC40ads_H100_v5 NVIDIA H100 NVL", "data": [ [ 2, 37.099202473958336 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Azure Standard_NC6s_v3 Tesla V100-PCIE-16GB", "data": [ [ 3, 103.59398523966472 ] ], "grouping": false, "color": "#55b3ff" }, { "name": "Google a2-highgpu-1g NVIDIA A100-SXM4-40GB", "data": [ [ 4, 82.08942413330078 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google a2-ultragpu-1g NVIDIA A100-SXM4-80GB", "data": [ [ 5, 80.28968175252278 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google g2-standard-16 NVIDIA L4", "data": [ [ 6, 96.88623746236165 ] ], "grouping": false, "color": "#55b400" }, { "name": "Google n1-highmem-8 Intel Skylake Tesla V100 Tesla V100-SXM2-16GB", "data": [ [ 7, 110.62288284301758 ] ], "grouping": false, "color": "#55b400" }, { "name": "OVH H100-380 NVIDIA H100 PCIe", "data": [ [ 8, 216.74148241678873 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L4-90 NVIDIA L4", "data": [ [ 9, 48.51492245992025 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH L40S-90 NVIDIA L40S", "data": [ [ 10, 49.88996187845866 ] ], "grouping": false, "color": "#484848" }, { "name": "OVH T1-LE-45 Tesla V100-PCIE-16GB", "data": [ [ 11, 109.15525754292806 ] 
], "grouping": false, "color": "#484848" } ], "drilldown": {}, "tooltip": { "enabled": true, "useHTML": false, "format": null, "headerFormat": "", "pointFormat": "<span style=\"color:{series.color}\">{series.name}</span>: <b>{point.y:.1f} ms</b>", "footerFormat": "", "shared": false, "outside": false, "valueDecimals": null, "split": false }, "annotations": null }, "hc_type": "chart", "id": "13601264" }

Cloud Mercato's observations:

  • The image size doesn't influence the inference performance
  • In FP16, OVHcloud's H100 (H100-380, H100 PCIe) does not perform well: at roughly 200–217 ms it is the slowest instance in every chart
  • Azure's H100 and OVHcloud's L4/L40S have the best timings in the panel