|
18 | 18 | "editable": true,
|
19 | 19 | "fiscalYearStartMonth": 0,
|
20 | 20 | "graphTooltip": 0,
|
21 |
| - "id": 1, |
| 21 | + "id": 8, |
22 | 22 | "links": [],
|
23 | 23 | "panels": [
|
24 | 24 | {
|
|
69 | 69 | "mode": "absolute",
|
70 | 70 | "steps": [
|
71 | 71 | {
|
72 |
| - "color": "green", |
73 |
| - "value": null |
| 72 | + "color": "green" |
74 | 73 | },
|
75 | 74 | {
|
76 | 75 | "color": "red",
|
|
96 | 95 | "showLegend": true
|
97 | 96 | },
|
98 | 97 | "tooltip": {
|
| 98 | + "hideZeros": false, |
99 | 99 | "mode": "single",
|
100 | 100 | "sort": "none"
|
101 | 101 | }
|
102 | 102 | },
|
| 103 | + "pluginVersion": "11.6.0", |
103 | 104 | "targets": [
|
104 | 105 | {
|
105 | 106 | "datasource": {
|
|
199 | 200 | "y": 0
|
200 | 201 | },
|
201 | 202 | "id": 17,
|
| 203 | + "maxDataPoints": 30, |
202 | 204 | "options": {
|
203 |
| - "calculate": true, |
| 205 | + "calculate": false, |
| 206 | + "calculation": { |
| 207 | + "yBuckets": { |
| 208 | + "scale": { |
| 209 | + "type": "linear" |
| 210 | + } |
| 211 | + } |
| 212 | + }, |
204 | 213 | "cellGap": 1,
|
| 214 | + "cellValues": {}, |
205 | 215 | "color": {
|
206 | 216 | "exponent": 0.5,
|
207 | 217 | "fill": "dark-orange",
|
|
215 | 225 | "color": "rgba(255,0,255,0.7)"
|
216 | 226 | },
|
217 | 227 | "filterValues": {
|
218 |
| - "le": 1e-09 |
| 228 | + "le": 1e-9 |
219 | 229 | },
|
220 | 230 | "legend": {
|
221 | 231 | "show": true
|
|
230 | 240 | },
|
231 | 241 | "yAxis": {
|
232 | 242 | "axisPlacement": "left",
|
233 |
| - "reverse": false |
| 243 | + "reverse": false, |
| 244 | + "unit": "secs" |
234 | 245 | }
|
235 | 246 | },
|
236 |
| - "pluginVersion": "11.2.0", |
| 247 | + "pluginVersion": "11.6.0", |
237 | 248 | "targets": [
|
238 | 249 | {
|
239 | 250 | "datasource": {
|
240 | 251 | "type": "prometheus",
|
241 | 252 | "uid": "ddyfngn31dg5cf"
|
242 | 253 | },
|
243 | 254 | "disableTextWrap": false,
|
244 |
| - "editorMode": "code", |
245 |
| - "expr": "rate(sglang:e2e_request_latency_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval])\r\n", |
| 255 | + "editorMode": "builder", |
| 256 | + "expr": "sum(increase(sglang:e2e_request_latency_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval])) by (le)\r\n", |
| 257 | + "format": "heatmap", |
246 | 258 | "fullMetaSearch": false,
|
247 | 259 | "includeNullMetadata": true,
|
248 | 260 | "instant": false,
|
|
252 | 264 | "useBackend": false
|
253 | 265 | }
|
254 | 266 | ],
|
255 |
| - "title": "End-to-End Request Latency Heatmap", |
| 267 | + "title": "End-to-End Request Latency(s) Heatmap", |
256 | 268 | "type": "heatmap"
|
257 | 269 | },
|
258 | 270 | {
|
|
303 | 315 | "mode": "absolute",
|
304 | 316 | "steps": [
|
305 | 317 | {
|
306 |
| - "color": "green", |
307 |
| - "value": null |
| 318 | + "color": "green" |
308 | 319 | },
|
309 | 320 | {
|
310 | 321 | "color": "red",
|
|
330 | 341 | "showLegend": true
|
331 | 342 | },
|
332 | 343 | "tooltip": {
|
| 344 | + "hideZeros": false, |
333 | 345 | "mode": "single",
|
334 | 346 | "sort": "none"
|
335 | 347 | }
|
336 | 348 | },
|
| 349 | + "pluginVersion": "11.6.0", |
337 | 350 | "targets": [
|
338 | 351 | {
|
339 | 352 | "datasource": {
|
|
403 | 416 | "useBackend": false
|
404 | 417 | }
|
405 | 418 | ],
|
406 |
| - "title": "End-to-End Request Latency", |
| 419 | + "title": "Time-To-First-Token Latency", |
407 | 420 | "type": "timeseries"
|
408 | 421 | },
|
409 | 422 | {
|
|
433 | 446 | "y": 8
|
434 | 447 | },
|
435 | 448 | "id": 19,
|
| 449 | + "maxDataPoints": 30, |
436 | 450 | "options": {
|
437 |
| - "calculate": true, |
| 451 | + "calculate": false, |
| 452 | + "calculation": { |
| 453 | + "xBuckets": { |
| 454 | + "value": "" |
| 455 | + }, |
| 456 | + "yBuckets": { |
| 457 | + "mode": "size", |
| 458 | + "scale": { |
| 459 | + "type": "linear" |
| 460 | + }, |
| 461 | + "value": "" |
| 462 | + } |
| 463 | + }, |
438 | 464 | "cellGap": 1,
|
439 | 465 | "color": {
|
440 | 466 | "exponent": 0.5,
|
|
449 | 475 | "color": "rgba(255,0,255,0.7)"
|
450 | 476 | },
|
451 | 477 | "filterValues": {
|
452 |
| - "le": 1e-09 |
| 478 | + "le": 1e-9 |
453 | 479 | },
|
454 | 480 | "legend": {
|
455 | 481 | "show": true
|
|
464 | 490 | },
|
465 | 491 | "yAxis": {
|
466 | 492 | "axisPlacement": "left",
|
467 |
| - "reverse": false, |
468 |
| - "unit": "s" |
| 493 | + "reverse": false |
469 | 494 | }
|
470 | 495 | },
|
471 |
| - "pluginVersion": "11.2.0", |
| 496 | + "pluginVersion": "11.6.0", |
472 | 497 | "targets": [
|
473 | 498 | {
|
474 | 499 | "datasource": {
|
475 | 500 | "type": "prometheus",
|
476 | 501 | "uid": "ddyfngn31dg5cf"
|
477 | 502 | },
|
478 | 503 | "disableTextWrap": false,
|
479 |
| - "editorMode": "code", |
480 |
| - "expr": "rate(sglang:time_to_first_token_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval])\r\n", |
| 504 | + "editorMode": "builder", |
| 505 | + "exemplar": false, |
| 506 | + "expr": "sum by(le) (increase(sglang:time_to_first_token_seconds_bucket{model_name=~\"$model_name\"}[$__rate_interval]))", |
| 507 | + "format": "heatmap", |
481 | 508 | "fullMetaSearch": false,
|
482 | 509 | "includeNullMetadata": true,
|
483 | 510 | "instant": false,
|
| 511 | + "interval": "", |
484 | 512 | "legendFormat": "{{le}}",
|
485 | 513 | "range": true,
|
486 | 514 | "refId": "A",
|
|
538 | 566 | "mode": "absolute",
|
539 | 567 | "steps": [
|
540 | 568 | {
|
541 |
| - "color": "green", |
542 |
| - "value": null |
| 569 | + "color": "green" |
543 | 570 | },
|
544 | 571 | {
|
545 | 572 | "color": "red",
|
|
565 | 592 | "showLegend": true
|
566 | 593 | },
|
567 | 594 | "tooltip": {
|
| 595 | + "hideZeros": false, |
568 | 596 | "mode": "single",
|
569 | 597 | "sort": "none"
|
570 | 598 | }
|
571 | 599 | },
|
| 600 | + "pluginVersion": "11.6.0", |
572 | 601 | "targets": [
|
573 | 602 | {
|
574 | 603 | "datasource": {
|
|
639 | 668 | "mode": "absolute",
|
640 | 669 | "steps": [
|
641 | 670 | {
|
642 |
| - "color": "green", |
643 |
| - "value": null |
| 671 | + "color": "green" |
644 | 672 | },
|
645 | 673 | {
|
646 | 674 | "color": "red",
|
|
666 | 694 | "showLegend": true
|
667 | 695 | },
|
668 | 696 | "tooltip": {
|
| 697 | + "hideZeros": false, |
669 | 698 | "mode": "single",
|
670 | 699 | "sort": "none"
|
671 | 700 | }
|
672 | 701 | },
|
| 702 | + "pluginVersion": "11.6.0", |
673 | 703 | "targets": [
|
674 | 704 | {
|
675 | 705 | "datasource": {
|
|
735 | 765 | "mode": "absolute",
|
736 | 766 | "steps": [
|
737 | 767 | {
|
738 |
| - "color": "green", |
739 |
| - "value": null |
| 768 | + "color": "green" |
740 | 769 | },
|
741 | 770 | {
|
742 | 771 | "color": "red",
|
|
762 | 791 | "showLegend": true
|
763 | 792 | },
|
764 | 793 | "tooltip": {
|
| 794 | + "hideZeros": false, |
765 | 795 | "mode": "single",
|
766 | 796 | "sort": "none"
|
767 | 797 | }
|
768 | 798 | },
|
| 799 | + "pluginVersion": "11.6.0", |
769 | 800 | "targets": [
|
770 | 801 | {
|
771 | 802 | "datasource": {
|
|
835 | 866 | "mode": "absolute",
|
836 | 867 | "steps": [
|
837 | 868 | {
|
838 |
| - "color": "green", |
839 |
| - "value": null |
| 869 | + "color": "green" |
840 | 870 | },
|
841 | 871 | {
|
842 | 872 | "color": "red",
|
|
862 | 892 | "showLegend": true
|
863 | 893 | },
|
864 | 894 | "tooltip": {
|
| 895 | + "hideZeros": false, |
865 | 896 | "mode": "single",
|
866 | 897 | "sort": "none"
|
867 | 898 | }
|
868 | 899 | },
|
| 900 | + "pluginVersion": "11.6.0", |
869 | 901 | "targets": [
|
870 | 902 | {
|
871 | 903 | "datasource": {
|
|
888 | 920 | "type": "timeseries"
|
889 | 921 | }
|
890 | 922 | ],
|
| 923 | + "preload": false, |
891 | 924 | "refresh": "5s",
|
892 |
| - "schemaVersion": 39, |
| 925 | + "schemaVersion": 41, |
893 | 926 | "tags": [],
|
894 | 927 | "templating": {
|
895 | 928 | "list": [
|
896 | 929 | {
|
897 | 930 | "current": {
|
898 |
| - "selected": false, |
899 | 931 | "text": "127.0.0.1:30000",
|
900 | 932 | "value": "127.0.0.1:30000"
|
901 | 933 | },
|
902 | 934 | "datasource": {
|
903 | 935 | "type": "prometheus"
|
904 | 936 | },
|
905 | 937 | "definition": "label_values(instance)",
|
906 |
| - "hide": 0, |
907 | 938 | "includeAll": false,
|
908 | 939 | "label": "instance",
|
909 |
| - "multi": false, |
910 | 940 | "name": "instance",
|
911 | 941 | "options": [],
|
912 | 942 | "query": {
|
|
916 | 946 | },
|
917 | 947 | "refresh": 1,
|
918 | 948 | "regex": "",
|
919 |
| - "skipUrlSync": false, |
920 |
| - "sort": 0, |
921 | 949 | "type": "query"
|
922 | 950 | },
|
923 | 951 | {
|
924 | 952 | "current": {
|
925 |
| - "selected": false, |
926 | 953 | "text": "meta-llama/Llama-3.1-8B-Instruct",
|
927 | 954 | "value": "meta-llama/Llama-3.1-8B-Instruct"
|
928 | 955 | },
|
929 | 956 | "datasource": {
|
930 | 957 | "type": "prometheus"
|
931 | 958 | },
|
932 | 959 | "definition": "label_values(model_name)",
|
933 |
| - "hide": 0, |
934 | 960 | "includeAll": false,
|
935 | 961 | "label": "model name",
|
936 |
| - "multi": false, |
937 | 962 | "name": "model_name",
|
938 | 963 | "options": [],
|
939 | 964 | "query": {
|
|
943 | 968 | },
|
944 | 969 | "refresh": 1,
|
945 | 970 | "regex": "",
|
946 |
| - "skipUrlSync": false, |
947 |
| - "sort": 0, |
948 | 971 | "type": "query"
|
949 | 972 | }
|
950 | 973 | ]
|
|
957 | 980 | "timezone": "browser",
|
958 | 981 | "title": "SGLang Dashboard",
|
959 | 982 | "uid": "sglang-dashboard",
|
960 |
| - "version": 5, |
961 |
| - "weekStart": "" |
| 983 | + "version": 11 |
962 | 984 | }
|
0 commit comments