Skip to content

Commit e6176fb

Browse files
mac0netarinkk
authored and committed
Correct grafana heatmap. (sgl-project#5019)
1 parent 939b6c2 commit e6176fb

File tree

1 file changed

+63
-41
lines changed

1 file changed

+63
-41
lines changed

examples/monitoring/grafana.json

Lines changed: 63 additions & 41 deletions
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@
1818
"editable": true,
1919
"fiscalYearStartMonth": 0,
2020
"graphTooltip": 0,
21-
"id": 1,
21+
"id": 8,
2222
"links": [],
2323
"panels": [
2424
{
@@ -69,8 +69,7 @@
6969
"mode": "absolute",
7070
"steps": [
7171
{
72-
"color": "green",
73-
"value": null
72+
"color": "green"
7473
},
7574
{
7675
"color": "red",
@@ -96,10 +95,12 @@
9695
"showLegend": true
9796
},
9897
"tooltip": {
98+
"hideZeros": false,
9999
"mode": "single",
100100
"sort": "none"
101101
}
102102
},
103+
"pluginVersion": "11.6.0",
103104
"targets": [
104105
{
105106
"datasource": {
@@ -199,9 +200,18 @@
199200
"y": 0
200201
},
201202
"id": 17,
203+
"maxDataPoints": 30,
202204
"options": {
203-
"calculate": true,
205+
"calculate": false,
206+
"calculation": {
207+
"yBuckets": {
208+
"scale": {
209+
"type": "linear"
210+
}
211+
}
212+
},
204213
"cellGap": 1,
214+
"cellValues": {},
205215
"color": {
206216
"exponent": 0.5,
207217
"fill": "dark-orange",
@@ -215,7 +225,7 @@
215225
"color": "rgba(255,0,255,0.7)"
216226
},
217227
"filterValues": {
218-
"le": 1e-09
228+
"le": 1e-9
219229
},
220230
"legend": {
221231
"show": true
@@ -230,19 +240,21 @@
230240
},
231241
"yAxis": {
232242
"axisPlacement": "left",
233-
"reverse": false
243+
"reverse": false,
244+
"unit": "secs"
234245
}
235246
},
236-
"pluginVersion": "11.2.0",
247+
"pluginVersion": "11.6.0",
237248
"targets": [
238249
{
239250
"datasource": {
240251
"type": "prometheus",
241252
"uid": "ddyfngn31dg5cf"
242253
},
243254
"disableTextWrap": false,
244-
"editorMode": "code",
245-
"expr": "rate(sglang:e2e_request_latency_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval])\r\n",
255+
"editorMode": "builder",
256+
"expr": "sum(increase(sglang:e2e_request_latency_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval])) by (le)\r\n",
257+
"format": "heatmap",
246258
"fullMetaSearch": false,
247259
"includeNullMetadata": true,
248260
"instant": false,
@@ -252,7 +264,7 @@
252264
"useBackend": false
253265
}
254266
],
255-
"title": "End-to-End Request Latency Heatmap",
267+
"title": "End-to-End Request Latency(s) Heatmap",
256268
"type": "heatmap"
257269
},
258270
{
@@ -303,8 +315,7 @@
303315
"mode": "absolute",
304316
"steps": [
305317
{
306-
"color": "green",
307-
"value": null
318+
"color": "green"
308319
},
309320
{
310321
"color": "red",
@@ -330,10 +341,12 @@
330341
"showLegend": true
331342
},
332343
"tooltip": {
344+
"hideZeros": false,
333345
"mode": "single",
334346
"sort": "none"
335347
}
336348
},
349+
"pluginVersion": "11.6.0",
337350
"targets": [
338351
{
339352
"datasource": {
@@ -403,7 +416,7 @@
403416
"useBackend": false
404417
}
405418
],
406-
"title": "End-to-End Request Latency",
419+
"title": "Time-To-First-Token Latency",
407420
"type": "timeseries"
408421
},
409422
{
@@ -433,8 +446,21 @@
433446
"y": 8
434447
},
435448
"id": 19,
449+
"maxDataPoints": 30,
436450
"options": {
437-
"calculate": true,
451+
"calculate": false,
452+
"calculation": {
453+
"xBuckets": {
454+
"value": ""
455+
},
456+
"yBuckets": {
457+
"mode": "size",
458+
"scale": {
459+
"type": "linear"
460+
},
461+
"value": ""
462+
}
463+
},
438464
"cellGap": 1,
439465
"color": {
440466
"exponent": 0.5,
@@ -449,7 +475,7 @@
449475
"color": "rgba(255,0,255,0.7)"
450476
},
451477
"filterValues": {
452-
"le": 1e-09
478+
"le": 1e-9
453479
},
454480
"legend": {
455481
"show": true
@@ -464,23 +490,25 @@
464490
},
465491
"yAxis": {
466492
"axisPlacement": "left",
467-
"reverse": false,
468-
"unit": "s"
493+
"reverse": false
469494
}
470495
},
471-
"pluginVersion": "11.2.0",
496+
"pluginVersion": "11.6.0",
472497
"targets": [
473498
{
474499
"datasource": {
475500
"type": "prometheus",
476501
"uid": "ddyfngn31dg5cf"
477502
},
478503
"disableTextWrap": false,
479-
"editorMode": "code",
480-
"expr": "rate(sglang:time_to_first_token_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval])\r\n",
504+
"editorMode": "builder",
505+
"exemplar": false,
506+
"expr": "sum by(le) (increase(sglang:time_to_first_token_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval]))",
507+
"format": "heatmap",
481508
"fullMetaSearch": false,
482509
"includeNullMetadata": true,
483510
"instant": false,
511+
"interval": "",
484512
"legendFormat": "{{le}}",
485513
"range": true,
486514
"refId": "A",
@@ -538,8 +566,7 @@
538566
"mode": "absolute",
539567
"steps": [
540568
{
541-
"color": "green",
542-
"value": null
569+
"color": "green"
543570
},
544571
{
545572
"color": "red",
@@ -565,10 +592,12 @@
565592
"showLegend": true
566593
},
567594
"tooltip": {
595+
"hideZeros": false,
568596
"mode": "single",
569597
"sort": "none"
570598
}
571599
},
600+
"pluginVersion": "11.6.0",
572601
"targets": [
573602
{
574603
"datasource": {
@@ -639,8 +668,7 @@
639668
"mode": "absolute",
640669
"steps": [
641670
{
642-
"color": "green",
643-
"value": null
671+
"color": "green"
644672
},
645673
{
646674
"color": "red",
@@ -666,10 +694,12 @@
666694
"showLegend": true
667695
},
668696
"tooltip": {
697+
"hideZeros": false,
669698
"mode": "single",
670699
"sort": "none"
671700
}
672701
},
702+
"pluginVersion": "11.6.0",
673703
"targets": [
674704
{
675705
"datasource": {
@@ -735,8 +765,7 @@
735765
"mode": "absolute",
736766
"steps": [
737767
{
738-
"color": "green",
739-
"value": null
768+
"color": "green"
740769
},
741770
{
742771
"color": "red",
@@ -762,10 +791,12 @@
762791
"showLegend": true
763792
},
764793
"tooltip": {
794+
"hideZeros": false,
765795
"mode": "single",
766796
"sort": "none"
767797
}
768798
},
799+
"pluginVersion": "11.6.0",
769800
"targets": [
770801
{
771802
"datasource": {
@@ -835,8 +866,7 @@
835866
"mode": "absolute",
836867
"steps": [
837868
{
838-
"color": "green",
839-
"value": null
869+
"color": "green"
840870
},
841871
{
842872
"color": "red",
@@ -862,10 +892,12 @@
862892
"showLegend": true
863893
},
864894
"tooltip": {
895+
"hideZeros": false,
865896
"mode": "single",
866897
"sort": "none"
867898
}
868899
},
900+
"pluginVersion": "11.6.0",
869901
"targets": [
870902
{
871903
"datasource": {
@@ -888,25 +920,23 @@
888920
"type": "timeseries"
889921
}
890922
],
923+
"preload": false,
891924
"refresh": "5s",
892-
"schemaVersion": 39,
925+
"schemaVersion": 41,
893926
"tags": [],
894927
"templating": {
895928
"list": [
896929
{
897930
"current": {
898-
"selected": false,
899931
"text": "127.0.0.1:30000",
900932
"value": "127.0.0.1:30000"
901933
},
902934
"datasource": {
903935
"type": "prometheus"
904936
},
905937
"definition": "label_values(instance)",
906-
"hide": 0,
907938
"includeAll": false,
908939
"label": "instance",
909-
"multi": false,
910940
"name": "instance",
911941
"options": [],
912942
"query": {
@@ -916,24 +946,19 @@
916946
},
917947
"refresh": 1,
918948
"regex": "",
919-
"skipUrlSync": false,
920-
"sort": 0,
921949
"type": "query"
922950
},
923951
{
924952
"current": {
925-
"selected": false,
926953
"text": "meta-llama/Llama-3.1-8B-Instruct",
927954
"value": "meta-llama/Llama-3.1-8B-Instruct"
928955
},
929956
"datasource": {
930957
"type": "prometheus"
931958
},
932959
"definition": "label_values(model_name)",
933-
"hide": 0,
934960
"includeAll": false,
935961
"label": "model name",
936-
"multi": false,
937962
"name": "model_name",
938963
"options": [],
939964
"query": {
@@ -943,8 +968,6 @@
943968
},
944969
"refresh": 1,
945970
"regex": "",
946-
"skipUrlSync": false,
947-
"sort": 0,
948971
"type": "query"
949972
}
950973
]
@@ -957,6 +980,5 @@
957980
"timezone": "browser",
958981
"title": "SGLang Dashboard",
959982
"uid": "sglang-dashboard",
960-
"version": 5,
961-
"weekStart": ""
983+
"version": 11
962984
}

0 commit comments

Comments
 (0)