Skip to content

Commit

Permalink
add more panels to dashboards
Browse files Browse the repository at this point in the history
  • Loading branch information
kondratyevd committed Jan 29, 2025
1 parent 4d901ee commit 3e0f3d3
Showing 1 changed file with 270 additions and 2 deletions.
272 changes: 270 additions & 2 deletions helm/supersonic/dashboards/default.json
Original file line number Diff line number Diff line change
Expand Up @@ -184,6 +184,103 @@
"title": "Server Load Metric",
"type": "timeseries"
},
{
  "datasource": {
    "type": "prometheus",
    "uid": "prometheus"
  },
  "description": "",
  "fieldConfig": {
    "defaults": {
      "color": {
        "mode": "palette-classic"
      },
      "custom": {
        "axisBorderShow": false,
        "axisCenteredZero": false,
        "axisColorMode": "text",
        "axisLabel": "",
        "axisPlacement": "auto",
        "barAlignment": 0,
        "drawStyle": "line",
        "fillOpacity": 0,
        "gradientMode": "none",
        "hideFrom": {
          "legend": false,
          "tooltip": false,
          "viz": false
        },
        "insertNulls": false,
        "lineInterpolation": "linear",
        "lineWidth": 1,
        "pointSize": 5,
        "scaleDistribution": {
          "type": "linear"
        },
        "showPoints": "auto",
        "spanNulls": false,
        "stacking": {
          "group": "A",
          "mode": "none"
        },
        "thresholdsStyle": {
          "mode": "off"
        }
      },
      "mappings": [],
      "min": 0,
      "thresholds": {
        "mode": "absolute",
        "steps": [
          {
            "color": "green",
            "value": null
          }
        ]
      },
      "unit": "none"
    },
    "overrides": []
  },
  "gridPos": {
    "h": 10,
    "w": 10,
    "x": 0,
    "y": 14
  },
  "id": 5,
  "options": {
    "legend": {
      "calcs": [],
      "displayMode": "list",
      "placement": "bottom",
      "showLegend": true
    },
    "tooltip": {
      "mode": "single",
      "sort": "none"
    }
  },
  "pluginVersion": "10.2.3",
  "targets": [
    {
      "datasource": {
        "type": "prometheus",
        "uid": "prometheus"
      },
      "editorMode": "code",
      "exemplar": false,
      "expr": "sum (\n rate(\n nv_inference_count{job=\"%RELEASE_NAME%-triton\"}[15s]\n )\n) by (job)",
      "instant": false,
      "interval": "",
      "legendFormat": "{{ job }}",
      "range": true,
      "refId": "A"
    }
  ],
  "title": "Inferences per second (all models)",
  "type": "timeseries"
},
{
"datasource": {
"type": "prometheus",
Expand Down Expand Up @@ -282,8 +379,179 @@
],
"title": "Number of Triton Servers",
"type": "timeseries"
}
],
},
{
  "datasource": {
    "type": "prometheus",
    "uid": "prometheus"
  },
  "description": "Average latency in milliseconds per Triton model execution, stacked by stage (queue, input, inference, output). The total request time measured at the Envoy proxy is overlaid as an unstacked line.",
  "fieldConfig": {
    "defaults": {
      "color": {
        "mode": "palette-classic"
      },
      "custom": {
        "axisBorderShow": false,
        "axisCenteredZero": false,
        "axisColorMode": "text",
        "axisLabel": "",
        "axisPlacement": "auto",
        "barAlignment": 0,
        "drawStyle": "line",
        "fillOpacity": 100,
        "gradientMode": "opacity",
        "hideFrom": {
          "legend": false,
          "tooltip": false,
          "viz": false
        },
        "insertNulls": false,
        "lineInterpolation": "linear",
        "lineWidth": 1,
        "pointSize": 5,
        "scaleDistribution": {
          "type": "linear"
        },
        "showPoints": "auto",
        "spanNulls": false,
        "stacking": {
          "group": "A",
          "mode": "normal"
        },
        "thresholdsStyle": {
          "mode": "off"
        }
      },
      "mappings": [],
      "thresholds": {
        "mode": "absolute",
        "steps": [
          {
            "color": "green",
            "value": null
          },
          {
            "color": "red",
            "value": 80
          }
        ]
      },
      "unit": "ms"
    },
    "overrides": [
      {
        "matcher": {
          "id": "byName",
          "options": "Total (measured at proxy)"
        },
        "properties": [
          {
            "id": "custom.stacking",
            "value": {
              "group": "A",
              "mode": "none"
            }
          },
          {
            "id": "custom.fillOpacity",
            "value": 0
          },
          {
            "id": "custom.lineWidth",
            "value": 2
          }
        ]
      }
    ]
  },
  "gridPos": {
    "h": 10,
    "w": 10,
    "x": 14,
    "y": 4
  },
  "id": 6,
  "options": {
    "legend": {
      "calcs": [],
      "displayMode": "list",
      "placement": "right",
      "showLegend": true
    },
    "tooltip": {
      "mode": "single",
      "sort": "none"
    }
  },
  "targets": [
    {
      "datasource": {
        "type": "prometheus",
        "uid": "prometheus"
      },
      "editorMode": "code",
      "expr": "sum by (job) ( rate(nv_inference_compute_infer_duration_us{job=\"%RELEASE_NAME%-triton\"}[15s])) /sum by (job) ( (rate(nv_inference_exec_count{job=\"%RELEASE_NAME%-triton\"}[15s]) * 1000) + 0.001)",
      "instant": false,
      "legendFormat": "Inference",
      "range": true,
      "refId": "A"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "prometheus"
      },
      "editorMode": "code",
      "expr": "sum by (job) ( rate(nv_inference_queue_duration_us{job=\"%RELEASE_NAME%-triton\"}[15s])) /sum by (job) ( (rate(nv_inference_exec_count{job=\"%RELEASE_NAME%-triton\"}[15s]) * 1000) + 0.001)",
      "hide": false,
      "instant": false,
      "legendFormat": "Queue",
      "range": true,
      "refId": "B"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "prometheus"
      },
      "editorMode": "code",
      "expr": "sum by (job) ( rate(nv_inference_compute_input_duration_us{job=\"%RELEASE_NAME%-triton\"}[15s])) /sum by (job) ( (rate(nv_inference_exec_count{job=\"%RELEASE_NAME%-triton\"}[15s]) * 1000) + 0.001)",
      "hide": false,
      "instant": false,
      "legendFormat": "Input",
      "range": true,
      "refId": "C"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "prometheus"
      },
      "editorMode": "code",
      "expr": "sum by (job) ( rate(nv_inference_compute_output_duration_us{job=\"%RELEASE_NAME%-triton\"}[15s])) /sum by (job) ( (rate(nv_inference_exec_count{job=\"%RELEASE_NAME%-triton\"}[15s]) * 1000) + 0.001)",
      "hide": false,
      "instant": false,
      "legendFormat": "Output",
      "range": true,
      "refId": "D"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "prometheus"
      },
      "editorMode": "code",
      "expr": "sum by (job) (\n  rate(envoy_http_downstream_rq_time_sum{envoy_http_conn_manager_prefix=\"ingress_grpc\", job=~\"%RELEASE_NAME%\"}[15s])\n)\n/\nsum by (job) (\n  rate(envoy_http_downstream_rq_time_count{envoy_http_conn_manager_prefix=\"ingress_grpc\", job=~\"%RELEASE_NAME%\"}[15s])\n)",
      "hide": false,
      "instant": false,
      "legendFormat": "Total (measured at proxy)",
      "range": true,
      "refId": "E"
    }
  ],
  "title": "Latency Breakdown",
  "type": "timeseries"
}
],
"refresh": "5s",
"schemaVersion": 38,
"style": "dark",
Expand Down

0 comments on commit 3e0f3d3

Please sign in to comment.