Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
cea64430
Unverified
Commit
cea64430
authored
May 09, 2024
by
Robert Shaw
Committed by
GitHub
May 09, 2024
Browse files
[Bugfix] Update grafana.json (#4711)
parent
a3c12457
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
239 additions
and
193 deletions
+239
-193
examples/production_monitoring/grafana.json
examples/production_monitoring/grafana.json
+239
-193
No files found.
examples/production_monitoring/grafana.json
View file @
cea64430
{
{
"__inputs"
:
[
{
"name"
:
"DS_PROMETHEUS"
,
"label"
:
"prometheus"
,
"description"
:
""
,
"type"
:
"datasource"
,
"pluginId"
:
"prometheus"
,
"pluginName"
:
"Prometheus"
}
],
"__elements"
:
{},
"__requires"
:
[
{
"type"
:
"grafana"
,
"id"
:
"grafana"
,
"name"
:
"Grafana"
,
"version"
:
"10.4.2"
},
{
"type"
:
"panel"
,
"id"
:
"heatmap"
,
"name"
:
"Heatmap"
,
"version"
:
""
},
{
"type"
:
"datasource"
,
"id"
:
"prometheus"
,
"name"
:
"Prometheus"
,
"version"
:
"1.0.0"
},
{
"type"
:
"panel"
,
"id"
:
"timeseries"
,
"name"
:
"Time series"
,
"version"
:
""
}
],
"annotations"
:
{
"annotations"
:
{
"list"
:
[
"list"
:
[
{
{
...
@@ -25,14 +62,14 @@
...
@@ -25,14 +62,14 @@
"editable"
:
true
,
"editable"
:
true
,
"fiscalYearStartMonth"
:
0
,
"fiscalYearStartMonth"
:
0
,
"graphTooltip"
:
0
,
"graphTooltip"
:
0
,
"id"
:
29
,
"id"
:
null
,
"links"
:
[],
"links"
:
[],
"liveNow"
:
false
,
"liveNow"
:
false
,
"panels"
:
[
"panels"
:
[
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"End to end request latency measured in seconds."
,
"description"
:
"End to end request latency measured in seconds."
,
"fieldConfig"
:
{
"fieldConfig"
:
{
...
@@ -41,6 +78,7 @@
...
@@ -41,6 +78,7 @@
"mode"
:
"palette-classic"
"mode"
:
"palette-classic"
},
},
"custom"
:
{
"custom"
:
{
"axisBorderShow"
:
false
,
"axisCenteredZero"
:
false
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisLabel"
:
""
,
...
@@ -54,6 +92,7 @@
...
@@ -54,6 +92,7 @@
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
"viz"
:
false
},
},
"insertNulls"
:
false
,
"lineInterpolation"
:
"linear"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
...
@@ -111,7 +150,7 @@
...
@@ -111,7 +150,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -127,7 +166,7 @@
...
@@ -127,7 +166,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -144,7 +183,7 @@
...
@@ -144,7 +183,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -161,7 +200,7 @@
...
@@ -161,7 +200,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -178,7 +217,7 @@
...
@@ -178,7 +217,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"editorMode"
:
"code"
,
"editorMode"
:
"code"
,
"expr"
:
"rate(vllm:e2e_request_latency_seconds_sum{model_name=
\"
$model_name
\"
}[$__rate_interval])
\n
/
\n
rate(vllm:e2e_request_latency_seconds_count{model_name=
\"
$model_name
\"
}[$__rate_interval])"
,
"expr"
:
"rate(vllm:e2e_request_latency_seconds_sum{model_name=
\"
$model_name
\"
}[$__rate_interval])
\n
/
\n
rate(vllm:e2e_request_latency_seconds_count{model_name=
\"
$model_name
\"
}[$__rate_interval])"
,
...
@@ -195,7 +234,7 @@
...
@@ -195,7 +234,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"Number of tokens processed per second"
,
"description"
:
"Number of tokens processed per second"
,
"fieldConfig"
:
{
"fieldConfig"
:
{
...
@@ -204,6 +243,7 @@
...
@@ -204,6 +243,7 @@
"mode"
:
"palette-classic"
"mode"
:
"palette-classic"
},
},
"custom"
:
{
"custom"
:
{
"axisBorderShow"
:
false
,
"axisCenteredZero"
:
false
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisLabel"
:
""
,
...
@@ -217,6 +257,7 @@
...
@@ -217,6 +257,7 @@
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
"viz"
:
false
},
},
"insertNulls"
:
false
,
"lineInterpolation"
:
"linear"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
...
@@ -273,7 +314,7 @@
...
@@ -273,7 +314,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -289,7 +330,7 @@
...
@@ -289,7 +330,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -310,7 +351,7 @@
...
@@ -310,7 +351,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"Inter token latency in seconds."
,
"description"
:
"Inter token latency in seconds."
,
"fieldConfig"
:
{
"fieldConfig"
:
{
...
@@ -319,6 +360,7 @@
...
@@ -319,6 +360,7 @@
"mode"
:
"palette-classic"
"mode"
:
"palette-classic"
},
},
"custom"
:
{
"custom"
:
{
"axisBorderShow"
:
false
,
"axisCenteredZero"
:
false
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisLabel"
:
""
,
...
@@ -332,6 +374,7 @@
...
@@ -332,6 +374,7 @@
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
"viz"
:
false
},
},
"insertNulls"
:
false
,
"lineInterpolation"
:
"linear"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
...
@@ -389,7 +432,7 @@
...
@@ -389,7 +432,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -405,7 +448,7 @@
...
@@ -405,7 +448,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -422,7 +465,7 @@
...
@@ -422,7 +465,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -439,7 +482,7 @@
...
@@ -439,7 +482,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -456,7 +499,7 @@
...
@@ -456,7 +499,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"editorMode"
:
"code"
,
"editorMode"
:
"code"
,
"expr"
:
"rate(vllm:time_per_output_token_seconds_sum{model_name=
\"
$model_name
\"
}[$__rate_interval])
\n
/
\n
rate(vllm:time_per_output_token_seconds_count{model_name=
\"
$model_name
\"
}[$__rate_interval])"
,
"expr"
:
"rate(vllm:time_per_output_token_seconds_sum{model_name=
\"
$model_name
\"
}[$__rate_interval])
\n
/
\n
rate(vllm:time_per_output_token_seconds_count{model_name=
\"
$model_name
\"
}[$__rate_interval])"
,
...
@@ -473,7 +516,7 @@
...
@@ -473,7 +516,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"Number of requests in RUNNING, WAITING, and SWAPPED state"
,
"description"
:
"Number of requests in RUNNING, WAITING, and SWAPPED state"
,
"fieldConfig"
:
{
"fieldConfig"
:
{
...
@@ -482,6 +525,7 @@
...
@@ -482,6 +525,7 @@
"mode"
:
"palette-classic"
"mode"
:
"palette-classic"
},
},
"custom"
:
{
"custom"
:
{
"axisBorderShow"
:
false
,
"axisCenteredZero"
:
false
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisLabel"
:
""
,
...
@@ -495,6 +539,7 @@
...
@@ -495,6 +539,7 @@
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
"viz"
:
false
},
},
"insertNulls"
:
false
,
"lineInterpolation"
:
"linear"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
...
@@ -552,7 +597,7 @@
...
@@ -552,7 +597,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -568,7 +613,7 @@
...
@@ -568,7 +613,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -585,7 +630,7 @@
...
@@ -585,7 +630,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -606,7 +651,7 @@
...
@@ -606,7 +651,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"P50, P90, P95, and P99 TTFT latency in seconds."
,
"description"
:
"P50, P90, P95, and P99 TTFT latency in seconds."
,
"fieldConfig"
:
{
"fieldConfig"
:
{
...
@@ -615,6 +660,7 @@
...
@@ -615,6 +660,7 @@
"mode"
:
"palette-classic"
"mode"
:
"palette-classic"
},
},
"custom"
:
{
"custom"
:
{
"axisBorderShow"
:
false
,
"axisCenteredZero"
:
false
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisLabel"
:
""
,
...
@@ -628,6 +674,7 @@
...
@@ -628,6 +674,7 @@
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
"viz"
:
false
},
},
"insertNulls"
:
false
,
"lineInterpolation"
:
"linear"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
...
@@ -685,7 +732,7 @@
...
@@ -685,7 +732,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -702,7 +749,7 @@
...
@@ -702,7 +749,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -718,7 +765,7 @@
...
@@ -718,7 +765,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -735,7 +782,7 @@
...
@@ -735,7 +782,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -752,7 +799,7 @@
...
@@ -752,7 +799,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"editorMode"
:
"code"
,
"editorMode"
:
"code"
,
"expr"
:
"rate(vllm:time_to_first_token_seconds_sum{model_name=
\"
$model_name
\"
}[$__rate_interval])
\n
/
\n
rate(vllm:time_to_first_token_seconds_count{model_name=
\"
$model_name
\"
}[$__rate_interval])"
,
"expr"
:
"rate(vllm:time_to_first_token_seconds_sum{model_name=
\"
$model_name
\"
}[$__rate_interval])
\n
/
\n
rate(vllm:time_to_first_token_seconds_count{model_name=
\"
$model_name
\"
}[$__rate_interval])"
,
...
@@ -769,7 +816,7 @@
...
@@ -769,7 +816,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"Percentage of used cache blocks by vLLM."
,
"description"
:
"Percentage of used cache blocks by vLLM."
,
"fieldConfig"
:
{
"fieldConfig"
:
{
...
@@ -778,6 +825,7 @@
...
@@ -778,6 +825,7 @@
"mode"
:
"palette-classic"
"mode"
:
"palette-classic"
},
},
"custom"
:
{
"custom"
:
{
"axisBorderShow"
:
false
,
"axisCenteredZero"
:
false
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisLabel"
:
""
,
...
@@ -791,6 +839,7 @@
...
@@ -791,6 +839,7 @@
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
"viz"
:
false
},
},
"insertNulls"
:
false
,
"lineInterpolation"
:
"linear"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
...
@@ -848,7 +897,7 @@
...
@@ -848,7 +897,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"editorMode"
:
"code"
,
"editorMode"
:
"code"
,
"expr"
:
"vllm:gpu_cache_usage_perc{model_name=
\"
$model_name
\"
}"
,
"expr"
:
"vllm:gpu_cache_usage_perc{model_name=
\"
$model_name
\"
}"
,
...
@@ -860,7 +909,7 @@
...
@@ -860,7 +909,7 @@
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"editorMode"
:
"code"
,
"editorMode"
:
"code"
,
"expr"
:
"vllm:cpu_cache_usage_perc{model_name=
\"
$model_name
\"
}"
,
"expr"
:
"vllm:cpu_cache_usage_perc{model_name=
\"
$model_name
\"
}"
,
...
@@ -875,229 +924,232 @@
...
@@ -875,229 +924,232 @@
"type"
:
"timeseries"
"type"
:
"timeseries"
},
},
{
{
"type"
:
"heatmap"
,
"datasource"
:
{
"title"
:
"Request Prompt Length"
,
"type"
:
"prometheus"
,
"uid"
:
"${DS_PROMETHEUS}"
},
"description"
:
"Heatmap of request prompt length"
,
"description"
:
"Heatmap of request prompt length"
,
"fieldConfig"
:
{
"defaults"
:
{
"custom"
:
{
"hideFrom"
:
{
"legend"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
},
"scaleDistribution"
:
{
"type"
:
"linear"
}
}
},
"overrides"
:
[]
},
"gridPos"
:
{
"gridPos"
:
{
"x"
:
0
,
"h"
:
8
,
"y"
:
24
,
"w"
:
12
,
"w"
:
12
,
"h"
:
8
"x"
:
0
,
},
"y"
:
24
"datasource"
:
{
"uid"
:
"prometheus"
,
"type"
:
"prometheus"
},
},
"id"
:
12
,
"id"
:
12
,
"targets"
:
[
{
"datasource"
:
{
"type"
:
"prometheus"
,
"uid"
:
"prometheus"
},
"refId"
:
"A"
,
"expr"
:
"sum by(le) (increase(vllm:request_prompt_tokens_bucket{model_name=
\"
$model_name
\"
}[$__rate_interval]))"
,
"range"
:
true
,
"instant"
:
false
,
"editorMode"
:
"builder"
,
"legendFormat"
:
"{{le}}"
,
"useBackend"
:
false
,
"disableTextWrap"
:
false
,
"fullMetaSearch"
:
false
,
"includeNullMetadata"
:
true
,
"format"
:
"heatmap"
}
],
"options"
:
{
"options"
:
{
"calculate"
:
false
,
"calculate"
:
false
,
"yAxis"
:
{
"cellGap"
:
1
,
"axisPlacement"
:
"left"
,
"cellValues"
:
{
"reverse"
:
false
,
"unit"
:
"none"
"unit"
:
"none"
,
"axisLabel"
:
"Prompt Length"
},
"rowsFrame"
:
{
"layout"
:
"auto"
,
"value"
:
"Request count"
},
},
"color"
:
{
"color"
:
{
"
mode"
:
"scheme"
,
"
exponent"
:
0.5
,
"fill"
:
"dark-orange"
,
"fill"
:
"dark-orange"
,
"min"
:
0
,
"mode"
:
"scheme"
,
"reverse"
:
false
,
"scale"
:
"exponential"
,
"scale"
:
"exponential"
,
"exponent"
:
0.5
,
"scheme"
:
"Spectral"
,
"scheme"
:
"Spectral"
,
"steps"
:
64
,
"steps"
:
64
"reverse"
:
false
,
},
"min"
:
0
"exemplars"
:
{
"color"
:
"rgba(255,0,255,0.7)"
},
},
"cellGap"
:
1
,
"filterValues"
:
{
"filterValues"
:
{
"le"
:
1e-9
"le"
:
1e-9
},
},
"tooltip"
:
{
"show"
:
true
,
"yHistogram"
:
true
},
"legend"
:
{
"legend"
:
{
"show"
:
true
"show"
:
true
},
},
"exemplars"
:
{
"rowsFrame"
:
{
"color"
:
"rgba(255,0,255,0.7)"
"layout"
:
"auto"
,
"value"
:
"Request count"
},
},
"cellValues"
:
{
"tooltip"
:
{
"mode"
:
"single"
,
"showColorScale"
:
false
,
"yHistogram"
:
true
},
"yAxis"
:
{
"axisLabel"
:
"Prompt Length"
,
"axisPlacement"
:
"left"
,
"reverse"
:
false
,
"unit"
:
"none"
"unit"
:
"none"
}
}
},
},
"pluginVersion"
:
"10.4.2"
,
"targets"
:
[
{
"datasource"
:
{
"type"
:
"prometheus"
,
"uid"
:
"${DS_PROMETHEUS}"
},
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"expr"
:
"sum by(le) (increase(vllm:request_prompt_tokens_bucket{model_name=
\"
$model_name
\"
}[$__rate_interval]))"
,
"format"
:
"heatmap"
,
"fullMetaSearch"
:
false
,
"includeNullMetadata"
:
true
,
"instant"
:
false
,
"legendFormat"
:
"{{le}}"
,
"range"
:
true
,
"refId"
:
"A"
,
"useBackend"
:
false
}
],
"title"
:
"Request Prompt Length"
,
"type"
:
"heatmap"
},
{
"datasource"
:
{
"type"
:
"prometheus"
,
"uid"
:
"${DS_PROMETHEUS}"
},
"description"
:
"Heatmap of request generation length"
,
"fieldConfig"
:
{
"fieldConfig"
:
{
"defaults"
:
{
"defaults"
:
{
"custom"
:
{
"custom"
:
{
"scaleDistribution"
:
{
"type"
:
"linear"
},
"hideFrom"
:
{
"hideFrom"
:
{
"legend"
:
false
,
"tooltip"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
,
"viz"
:
false
"legend"
:
false
},
"scaleDistribution"
:
{
"type"
:
"linear"
}
}
}
}
},
},
"overrides"
:
[]
"overrides"
:
[]
},
},
"pluginVersion"
:
"10.2.0"
},
{
"datasource"
:
{
"uid"
:
"prometheus"
,
"type"
:
"prometheus"
},
"type"
:
"heatmap"
,
"title"
:
"Request Generation Length"
,
"description"
:
"Heatmap of request generation length"
,
"gridPos"
:
{
"gridPos"
:
{
"x"
:
12
,
"h"
:
8
,
"y"
:
24
,
"w"
:
12
,
"w"
:
12
,
"h"
:
8
"x"
:
12
,
"y"
:
24
},
},
"id"
:
13
,
"id"
:
13
,
"targets"
:
[
{
"datasource"
:
{
"type"
:
"prometheus"
,
"uid"
:
"prometheus"
},
"refId"
:
"A"
,
"expr"
:
"sum by(le) (increase(vllm:request_generation_tokens_bucket{model_name=
\"
$model_name
\"
}[$__rate_interval]))"
,
"range"
:
true
,
"instant"
:
false
,
"editorMode"
:
"builder"
,
"legendFormat"
:
"{{le}}"
,
"useBackend"
:
false
,
"disableTextWrap"
:
false
,
"fullMetaSearch"
:
false
,
"includeNullMetadata"
:
true
,
"format"
:
"heatmap"
}
],
"options"
:
{
"options"
:
{
"calculate"
:
false
,
"calculate"
:
false
,
"yAxis"
:
{
"cellGap"
:
1
,
"axisPlacement"
:
"left"
,
"cellValues"
:
{
"reverse"
:
false
,
"unit"
:
"none"
"unit"
:
"none"
,
"axisLabel"
:
"Generation Length"
},
"rowsFrame"
:
{
"layout"
:
"auto"
,
"value"
:
"Request count"
},
},
"color"
:
{
"color"
:
{
"
mode"
:
"scheme"
,
"
exponent"
:
0.5
,
"fill"
:
"dark-orange"
,
"fill"
:
"dark-orange"
,
"min"
:
0
,
"mode"
:
"scheme"
,
"reverse"
:
false
,
"scale"
:
"exponential"
,
"scale"
:
"exponential"
,
"exponent"
:
0.5
,
"scheme"
:
"Spectral"
,
"scheme"
:
"Spectral"
,
"steps"
:
64
,
"steps"
:
64
"reverse"
:
false
,
},
"min"
:
0
"exemplars"
:
{
"color"
:
"rgba(255,0,255,0.7)"
},
},
"cellGap"
:
1
,
"filterValues"
:
{
"filterValues"
:
{
"le"
:
1e-9
"le"
:
1e-9
},
},
"tooltip"
:
{
"show"
:
true
,
"yHistogram"
:
true
},
"legend"
:
{
"legend"
:
{
"show"
:
true
"show"
:
true
},
},
"exemplars"
:
{
"rowsFrame"
:
{
"color"
:
"rgba(255,0,255,0.7)"
"layout"
:
"auto"
,
"value"
:
"Request count"
},
},
"cellValues"
:
{
"tooltip"
:
{
"mode"
:
"single"
,
"showColorScale"
:
false
,
"yHistogram"
:
true
},
"yAxis"
:
{
"axisLabel"
:
"Generation Length"
,
"axisPlacement"
:
"left"
,
"reverse"
:
false
,
"unit"
:
"none"
"unit"
:
"none"
}
}
},
},
"fieldConfig"
:
{
"pluginVersion"
:
"10.4.2"
,
"defaults"
:
{
"targets"
:
[
"custom"
:
{
{
"scaleDistribution"
:
{
"datasource"
:
{
"type"
:
"linear"
"type"
:
"prometheus"
,
},
"uid"
:
"${DS_PROMETHEUS}"
"hideFrom"
:
{
},
"tooltip"
:
false
,
"disableTextWrap"
:
false
,
"viz"
:
false
,
"editorMode"
:
"builder"
,
"legend"
:
false
"expr"
:
"sum by(le) (increase(vllm:request_generation_tokens_bucket{model_name=
\"
$model_name
\"
}[$__rate_interval]))"
,
}
"format"
:
"heatmap"
,
}
"fullMetaSearch"
:
false
,
},
"includeNullMetadata"
:
true
,
"overrides"
:
[]
"instant"
:
false
,
},
"legendFormat"
:
"{{le}}"
,
"pluginVersion"
:
"10.2.0"
"range"
:
true
,
"refId"
:
"A"
,
"useBackend"
:
false
}
],
"title"
:
"Request Generation Length"
,
"type"
:
"heatmap"
},
},
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"description"
:
"Number of finished requests by their finish reason: either an EOS token was generated or the max sequence length was reached."
,
"fieldConfig"
:
{
"fieldConfig"
:
{
"defaults"
:
{
"defaults"
:
{
"color"
:
{
"mode"
:
"palette-classic"
},
"custom"
:
{
"custom"
:
{
"drawStyle"
:
"line"
,
"axisBorderShow"
:
false
,
"lineInterpolation"
:
"linear"
,
"axisCenteredZero"
:
false
,
"axisColorMode"
:
"text"
,
"axisLabel"
:
""
,
"axisPlacement"
:
"auto"
,
"barAlignment"
:
0
,
"barAlignment"
:
0
,
"
lineWidth"
:
1
,
"
drawStyle"
:
"line"
,
"fillOpacity"
:
0
,
"fillOpacity"
:
0
,
"gradientMode"
:
"none"
,
"gradientMode"
:
"none"
,
"spanNulls"
:
false
,
"hideFrom"
:
{
"legend"
:
false
,
"tooltip"
:
false
,
"viz"
:
false
},
"insertNulls"
:
false
,
"insertNulls"
:
false
,
"showPoints"
:
"auto"
,
"lineInterpolation"
:
"linear"
,
"lineWidth"
:
1
,
"pointSize"
:
5
,
"pointSize"
:
5
,
"stacking"
:
{
"mode"
:
"none"
,
"group"
:
"A"
},
"axisPlacement"
:
"auto"
,
"axisLabel"
:
""
,
"axisColorMode"
:
"text"
,
"axisBorderShow"
:
false
,
"scaleDistribution"
:
{
"scaleDistribution"
:
{
"type"
:
"linear"
"type"
:
"linear"
},
},
"
axisCenteredZero"
:
false
,
"
showPoints"
:
"auto"
,
"
hideFrom"
:
{
"
spanNulls"
:
false
,
"tooltip"
:
false
,
"stacking"
:
{
"
viz"
:
false
,
"
group"
:
"A"
,
"
legend"
:
false
"
mode"
:
"none"
},
},
"thresholdsStyle"
:
{
"thresholdsStyle"
:
{
"mode"
:
"off"
"mode"
:
"off"
}
}
},
},
"color"
:
{
"mode"
:
"palette-classic"
},
"mappings"
:
[],
"mappings"
:
[],
"thresholds"
:
{
"thresholds"
:
{
"mode"
:
"absolute"
,
"mode"
:
"absolute"
,
...
@@ -1123,22 +1175,22 @@
...
@@ -1123,22 +1175,22 @@
},
},
"id"
:
11
,
"id"
:
11
,
"options"
:
{
"options"
:
{
"tooltip"
:
{
"mode"
:
"single"
,
"sort"
:
"none"
},
"legend"
:
{
"legend"
:
{
"
showLegend"
:
true
,
"
calcs"
:
[]
,
"displayMode"
:
"list"
,
"displayMode"
:
"list"
,
"placement"
:
"bottom"
,
"placement"
:
"bottom"
,
"calcs"
:
[]
"showLegend"
:
true
},
"tooltip"
:
{
"mode"
:
"single"
,
"sort"
:
"none"
}
}
},
},
"targets"
:
[
"targets"
:
[
{
{
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"disableTextWrap"
:
false
,
"disableTextWrap"
:
false
,
"editorMode"
:
"builder"
,
"editorMode"
:
"builder"
,
...
@@ -1154,25 +1206,19 @@
...
@@ -1154,25 +1206,19 @@
}
}
],
],
"title"
:
"Finish Reason"
,
"title"
:
"Finish Reason"
,
"description"
:
"Number of finished requests by their finish reason: either an EOS token was generated or the max sequence length was reached."
,
"type"
:
"timeseries"
"type"
:
"timeseries"
}
}
],
],
"refresh"
:
""
,
"refresh"
:
""
,
"schemaVersion"
:
37
,
"schemaVersion"
:
39
,
"style"
:
"dark"
,
"tags"
:
[],
"tags"
:
[],
"templating"
:
{
"templating"
:
{
"list"
:
[
"list"
:
[
{
{
"current"
:
{
"current"
:
{},
"selected"
:
false
,
"text"
:
"vllm"
,
"value"
:
"vllm"
},
"datasource"
:
{
"datasource"
:
{
"type"
:
"prometheus"
,
"type"
:
"prometheus"
,
"uid"
:
"
prometheus
"
"uid"
:
"
${DS_PROMETHEUS}
"
},
},
"definition"
:
"label_values(model_name)"
,
"definition"
:
"label_values(model_name)"
,
"hide"
:
0
,
"hide"
:
0
,
...
@@ -1201,6 +1247,6 @@
...
@@ -1201,6 +1247,6 @@
"timezone"
:
""
,
"timezone"
:
""
,
"title"
:
"vLLM"
,
"title"
:
"vLLM"
,
"uid"
:
"b281712d-8bff-41ef-9f3f-71ad43c05e9b"
,
"uid"
:
"b281712d-8bff-41ef-9f3f-71ad43c05e9b"
,
"version"
:
2
,
"version"
:
1
,
"weekStart"
:
""
"weekStart"
:
""
}
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment