auto-update-daily-20260202
1{
2 "annotations": {
3 "list": [
4 {
5 "builtIn": 1,
6 "datasource": {
7 "type": "grafana",
8 "uid": "-- Grafana --"
9 },
10 "enable": true,
11 "hide": true,
12 "iconColor": "rgba(0, 211, 255, 1)",
13 "name": "Annotations & Alerts",
14 "type": "dashboard"
15 }
16 ]
17 },
18 "editable": true,
19 "fiscalYearStartMonth": 0,
20 "graphTooltip": 0,
21 "id": null,
22 "links": [],
23 "liveNow": false,
24 "panels": [
25 {
26 "datasource": {
27 "type": "prometheus",
28 "uid": "${DS_PROMETHEUS}"
29 },
30 "fieldConfig": {
31 "defaults": {
32 "color": {
33 "mode": "palette-classic"
34 },
35 "custom": {
36 "axisBorderShow": false,
37 "axisCenteredZero": false,
38 "axisColorMode": "text",
39 "axisLabel": "",
40 "axisPlacement": "auto",
41 "barAlignment": 0,
42 "drawStyle": "line",
43 "fillOpacity": 10,
44 "gradientMode": "none",
45 "hideFrom": {
46 "legend": false,
47 "tooltip": false,
48 "vis": false,
49 "viz": false
50 },
51 "insertNulls": false,
52 "lineInterpolation": "linear",
53 "lineWidth": 1,
54 "pointSize": 5,
55 "scaleDistribution": {
56 "type": "linear"
57 },
58 "showPoints": "never",
59 "spanNulls": false,
60 "stacking": {
61 "group": "A",
62 "mode": "none"
63 },
64 "thresholdsStyle": {
65 "mode": "off"
66 }
67 },
68 "mappings": [],
69 "thresholds": {
70 "mode": "absolute",
71 "steps": [
72 {
73 "color": "green",
74 "value": null
75 },
76 {
77 "color": "red",
78 "value": 80
79 }
80 ]
81 },
82 "unit": "reqps"
83 },
84 "overrides": []
85 },
86 "gridPos": {
87 "h": 8,
88 "w": 12,
89 "x": 0,
90 "y": 0
91 },
92 "id": 1,
93 "options": {
94 "legend": {
95 "calcs": [],
96 "displayMode": "list",
97 "placement": "bottom",
98 "showLegend": true
99 },
100 "tooltip": {
101 "mode": "single",
102 "sort": "none"
103 }
104 },
105 "targets": [
106 {
107 "datasource": {
108 "type": "prometheus",
109 "uid": "${DS_PROMETHEUS}"
110 },
111 "editorMode": "code",
112 "expr": "rate(ollama_requests_total[$__rate_interval])",
113 "instant": false,
114 "legendFormat": "{{model}}",
115 "range": true,
116 "refId": "A"
117 }
118 ],
119 "title": "Request Rate by Model",
120 "type": "timeseries"
121 },
122 {
123 "datasource": {
124 "type": "prometheus",
125 "uid": "${DS_PROMETHEUS}"
126 },
127 "fieldConfig": {
128 "defaults": {
129 "color": {
130 "mode": "palette-classic"
131 },
132 "mappings": [],
133 "thresholds": {
134 "mode": "absolute",
135 "steps": [
136 {
137 "color": "green",
138 "value": null
139 },
140 {
141 "color": "red",
142 "value": 80
143 }
144 ]
145 },
146 "unit": "short"
147 },
148 "overrides": []
149 },
150 "gridPos": {
151 "h": 8,
152 "w": 12,
153 "x": 12,
154 "y": 0
155 },
156 "id": 2,
157 "options": {
158 "colorMode": "value",
159 "graphMode": "area",
160 "justifyMode": "auto",
161 "orientation": "auto",
162 "reduceOptions": {
163 "calcs": [
164 "lastNotNull"
165 ],
166 "fields": "",
167 "values": false
168 },
169 "textMode": "auto",
170 "wideLayout": true
171 },
172 "pluginVersion": "10.2.6",
173 "targets": [
174 {
175 "datasource": {
176 "type": "prometheus",
177 "uid": "${DS_PROMETHEUS}"
178 },
179 "editorMode": "code",
180 "expr": "ollama_requests_total",
181 "instant": false,
182 "legendFormat": "{{model}}",
183 "range": true,
184 "refId": "A"
185 }
186 ],
187 "title": "Total Requests by Model",
188 "type": "stat"
189 },
190 {
191 "datasource": {
192 "type": "prometheus",
193 "uid": "${DS_PROMETHEUS}"
194 },
195 "fieldConfig": {
196 "defaults": {
197 "color": {
198 "mode": "palette-classic"
199 },
200 "custom": {
201 "axisBorderShow": false,
202 "axisCenteredZero": false,
203 "axisColorMode": "text",
204 "axisLabel": "",
205 "axisPlacement": "auto",
206 "barAlignment": 0,
207 "drawStyle": "line",
208 "fillOpacity": 10,
209 "gradientMode": "none",
210 "hideFrom": {
211 "legend": false,
212 "tooltip": false,
213 "vis": false,
214 "viz": false
215 },
216 "insertNulls": false,
217 "lineInterpolation": "linear",
218 "lineWidth": 1,
219 "pointSize": 5,
220 "scaleDistribution": {
221 "type": "linear"
222 },
223 "showPoints": "never",
224 "spanNulls": false,
225 "stacking": {
226 "group": "A",
227 "mode": "none"
228 },
229 "thresholdsStyle": {
230 "mode": "off"
231 }
232 },
233 "mappings": [],
234 "thresholds": {
235 "mode": "absolute",
236 "steps": [
237 {
238 "color": "green",
239 "value": null
240 },
241 {
242 "color": "red",
243 "value": 80
244 }
245 ]
246 },
247 "unit": "s"
248 },
249 "overrides": []
250 },
251 "gridPos": {
252 "h": 8,
253 "w": 12,
254 "x": 0,
255 "y": 8
256 },
257 "id": 3,
258 "options": {
259 "legend": {
260 "calcs": [],
261 "displayMode": "list",
262 "placement": "bottom",
263 "showLegend": true
264 },
265 "tooltip": {
266 "mode": "single",
267 "sort": "none"
268 }
269 },
270 "targets": [
271 {
272 "datasource": {
273 "type": "prometheus",
274 "uid": "${DS_PROMETHEUS}"
275 },
276 "editorMode": "code",
277 "expr": "rate(ollama_response_seconds_sum[$__rate_interval]) / rate(ollama_response_seconds_count[$__rate_interval])",
278 "instant": false,
279 "legendFormat": "Average - {{model}}",
280 "range": true,
281 "refId": "A"
282 }
283 ],
284 "title": "Average Response Time",
285 "type": "timeseries"
286 },
287 {
288 "datasource": {
289 "type": "prometheus",
290 "uid": "${DS_PROMETHEUS}"
291 },
292 "fieldConfig": {
293 "defaults": {
294 "color": {
295 "mode": "palette-classic"
296 },
297 "custom": {
298 "axisBorderShow": false,
299 "axisCenteredZero": false,
300 "axisColorMode": "text",
301 "axisLabel": "",
302 "axisPlacement": "auto",
303 "barAlignment": 0,
304 "drawStyle": "line",
305 "fillOpacity": 10,
306 "gradientMode": "none",
307 "hideFrom": {
308 "legend": false,
309 "tooltip": false,
310 "vis": false,
311 "viz": false
312 },
313 "insertNulls": false,
314 "lineInterpolation": "linear",
315 "lineWidth": 1,
316 "pointSize": 5,
317 "scaleDistribution": {
318 "type": "linear"
319 },
320 "showPoints": "never",
321 "spanNulls": false,
322 "stacking": {
323 "group": "A",
324 "mode": "none"
325 },
326 "thresholdsStyle": {
327 "mode": "off"
328 }
329 },
330 "mappings": [],
331 "thresholds": {
332 "mode": "absolute",
333 "steps": [
334 {
335 "color": "green",
336 "value": null
337 },
338 {
339 "color": "red",
340 "value": 80
341 }
342 ]
343 },
344 "unit": "s"
345 },
346 "overrides": []
347 },
348 "gridPos": {
349 "h": 8,
350 "w": 12,
351 "x": 12,
352 "y": 8
353 },
354 "id": 4,
355 "options": {
356 "legend": {
357 "calcs": [],
358 "displayMode": "list",
359 "placement": "bottom",
360 "showLegend": true
361 },
362 "tooltip": {
363 "mode": "single",
364 "sort": "none"
365 }
366 },
367 "targets": [
368 {
369 "datasource": {
370 "type": "prometheus",
371 "uid": "${DS_PROMETHEUS}"
372 },
373 "editorMode": "code",
374 "expr": "rate(ollama_load_duration_seconds_sum[$__rate_interval]) / rate(ollama_load_duration_seconds_count[$__rate_interval])",
375 "instant": false,
376 "legendFormat": "Average Load Time - {{model}}",
377 "range": true,
378 "refId": "A"
379 }
380 ],
381 "title": "Average Model Load Time",
382 "type": "timeseries"
383 },
384 {
385 "datasource": {
386 "type": "prometheus",
387 "uid": "${DS_PROMETHEUS}"
388 },
389 "fieldConfig": {
390 "defaults": {
391 "color": {
392 "mode": "palette-classic"
393 },
394 "custom": {
395 "axisBorderShow": false,
396 "axisCenteredZero": false,
397 "axisColorMode": "text",
398 "axisLabel": "",
399 "axisPlacement": "auto",
400 "barAlignment": 0,
401 "drawStyle": "line",
402 "fillOpacity": 10,
403 "gradientMode": "none",
404 "hideFrom": {
405 "legend": false,
406 "tooltip": false,
407 "vis": false,
408 "viz": false
409 },
410 "insertNulls": false,
411 "lineInterpolation": "linear",
412 "lineWidth": 1,
413 "pointSize": 5,
414 "scaleDistribution": {
415 "type": "linear"
416 },
417 "showPoints": "never",
418 "spanNulls": false,
419 "stacking": {
420 "group": "A",
421 "mode": "none"
422 },
423 "thresholdsStyle": {
424 "mode": "off"
425 }
426 },
427 "mappings": [],
428 "thresholds": {
429 "mode": "absolute",
430 "steps": [
431 {
432 "color": "green",
433 "value": null
434 },
435 {
436 "color": "red",
437 "value": 80
438 }
439 ]
440 },
441 "unit": "tps"
442 },
443 "overrides": []
444 },
445 "gridPos": {
446 "h": 8,
447 "w": 12,
448 "x": 0,
449 "y": 16
450 },
451 "id": 5,
452 "options": {
453 "legend": {
454 "calcs": [],
455 "displayMode": "list",
456 "placement": "bottom",
457 "showLegend": true
458 },
459 "tooltip": {
460 "mode": "single",
461 "sort": "none"
462 }
463 },
464 "targets": [
465 {
466 "datasource": {
467 "type": "prometheus",
468 "uid": "${DS_PROMETHEUS}"
469 },
470 "editorMode": "code",
471 "expr": "rate(ollama_tokens_processed_total[$__rate_interval])",
472 "instant": false,
473 "legendFormat": "Input Tokens/s - {{model}}",
474 "range": true,
475 "refId": "A"
476 },
477 {
478 "datasource": {
479 "type": "prometheus",
480 "uid": "${DS_PROMETHEUS}"
481 },
482 "editorMode": "code",
483 "expr": "rate(ollama_tokens_generated_total[$__rate_interval])",
484 "instant": false,
485 "legendFormat": "Output Tokens/s - {{model}}",
486 "range": true,
487 "refId": "B"
488 }
489 ],
490 "title": "Token Processing Rate",
491 "type": "timeseries"
492 },
493 {
494 "datasource": {
495 "type": "prometheus",
496 "uid": "${DS_PROMETHEUS}"
497 },
498 "fieldConfig": {
499 "defaults": {
500 "color": {
501 "mode": "palette-classic"
502 },
503 "custom": {
504 "axisBorderShow": false,
505 "axisCenteredZero": false,
506 "axisColorMode": "text",
507 "axisLabel": "",
508 "axisPlacement": "auto",
509 "barAlignment": 0,
510 "drawStyle": "line",
511 "fillOpacity": 10,
512 "gradientMode": "none",
513 "hideFrom": {
514 "legend": false,
515 "tooltip": false,
516 "vis": false,
517 "viz": false
518 },
519 "insertNulls": false,
520 "lineInterpolation": "linear",
521 "lineWidth": 1,
522 "pointSize": 5,
523 "scaleDistribution": {
524 "type": "linear"
525 },
526 "showPoints": "never",
527 "spanNulls": false,
528 "stacking": {
529 "group": "A",
530 "mode": "none"
531 },
532 "thresholdsStyle": {
533 "mode": "off"
534 }
535 },
536 "mappings": [],
537 "thresholds": {
538 "mode": "absolute",
539 "steps": [
540 {
541 "color": "green",
542 "value": null
543 },
544 {
545 "color": "red",
546 "value": 80
547 }
548 ]
549 },
550 "unit": "tps"
551 },
552 "overrides": []
553 },
554 "gridPos": {
555 "h": 8,
556 "w": 12,
557 "x": 12,
558 "y": 16
559 },
560 "id": 6,
561 "options": {
562 "legend": {
563 "calcs": [],
564 "displayMode": "list",
565 "placement": "bottom",
566 "showLegend": true
567 },
568 "tooltip": {
569 "mode": "single",
570 "sort": "none"
571 }
572 },
573 "targets": [
574 {
575 "datasource": {
576 "type": "prometheus",
577 "uid": "${DS_PROMETHEUS}"
578 },
579 "editorMode": "code",
580 "expr": "rate(ollama_tokens_per_second_sum[$__rate_interval]) / rate(ollama_tokens_per_second_count[$__rate_interval])",
581 "instant": false,
582 "legendFormat": "Average - {{model}}",
583 "range": true,
584 "refId": "A"
585 }
586 ],
587 "title": "Average Generation Speed (Tokens/Second)",
588 "type": "timeseries"
589 },
590 {
591 "datasource": {
592 "type": "prometheus",
593 "uid": "${DS_PROMETHEUS}"
594 },
595 "fieldConfig": {
596 "defaults": {
597 "color": {
598 "mode": "palette-classic"
599 },
600 "custom": {
601 "axisBorderShow": false,
602 "axisCenteredZero": false,
603 "axisColorMode": "text",
604 "axisLabel": "",
605 "axisPlacement": "auto",
606 "barAlignment": 0,
607 "drawStyle": "line",
608 "fillOpacity": 10,
609 "gradientMode": "none",
610 "hideFrom": {
611 "legend": false,
612 "tooltip": false,
613 "vis": false,
614 "viz": false
615 },
616 "insertNulls": false,
617 "lineInterpolation": "linear",
618 "lineWidth": 1,
619 "pointSize": 5,
620 "scaleDistribution": {
621 "type": "linear"
622 },
623 "showPoints": "never",
624 "spanNulls": false,
625 "stacking": {
626 "group": "A",
627 "mode": "none"
628 },
629 "thresholdsStyle": {
630 "mode": "off"
631 }
632 },
633 "mappings": [],
634 "thresholds": {
635 "mode": "absolute",
636 "steps": [
637 {
638 "color": "green",
639 "value": null
640 },
641 {
642 "color": "red",
643 "value": 80
644 }
645 ]
646 },
647 "unit": "s"
648 },
649 "overrides": []
650 },
651 "gridPos": {
652 "h": 8,
653 "w": 12,
654 "x": 0,
655 "y": 24
656 },
657 "id": 7,
658 "options": {
659 "legend": {
660 "calcs": [],
661 "displayMode": "list",
662 "placement": "bottom",
663 "showLegend": true
664 },
665 "tooltip": {
666 "mode": "single",
667 "sort": "none"
668 }
669 },
670 "targets": [
671 {
672 "datasource": {
673 "type": "prometheus",
674 "uid": "${DS_PROMETHEUS}"
675 },
676 "editorMode": "code",
677 "expr": "rate(ollama_prompt_eval_duration_seconds_sum[$__rate_interval]) / rate(ollama_prompt_eval_duration_seconds_count[$__rate_interval])",
678 "instant": false,
679 "legendFormat": "Avg Prompt Eval - {{model}}",
680 "range": true,
681 "refId": "A"
682 },
683 {
684 "datasource": {
685 "type": "prometheus",
686 "uid": "${DS_PROMETHEUS}"
687 },
688 "editorMode": "code",
689 "expr": "rate(ollama_eval_duration_seconds_sum[$__rate_interval]) / rate(ollama_eval_duration_seconds_count[$__rate_interval])",
690 "instant": false,
691 "legendFormat": "Avg Response Gen - {{model}}",
692 "range": true,
693 "refId": "B"
694 }
695 ],
696 "title": "Average Processing Time Breakdown",
697 "type": "timeseries"
698 },
699 {
700 "datasource": {
701 "type": "prometheus",
702 "uid": "${DS_PROMETHEUS}"
703 },
704 "fieldConfig": {
705 "defaults": {
706 "color": {
707 "mode": "thresholds"
708 },
709 "custom": {
710 "align": "auto",
711 "cellOptions": {
712 "type": "auto"
713 },
714 "inspect": false
715 },
716 "mappings": [],
717 "thresholds": {
718 "mode": "absolute",
719 "steps": [
720 {
721 "color": "green",
722 "value": null
723 },
724 {
725 "color": "red",
726 "value": 80
727 }
728 ]
729 }
730 },
731 "overrides": [
732 {
733 "matcher": {
734 "id": "byName",
735 "options": "Avg Response Time"
736 },
737 "properties": [
738 {
739 "id": "unit",
740 "value": "s"
741 }
742 ]
743 },
744 {
745 "matcher": {
746 "id": "byName",
747 "options": "Avg Tokens/Second"
748 },
749 "properties": [
750 {
751 "id": "unit",
752 "value": "tps"
753 }
754 ]
755 }
756 ]
757 },
758 "gridPos": {
759 "h": 8,
760 "w": 12,
761 "x": 12,
762 "y": 24
763 },
764 "id": 8,
765 "options": {
766 "cellHeight": "sm",
767 "footer": {
768 "countRows": false,
769 "fields": "",
770 "reducer": [
771 "sum"
772 ],
773 "show": false
774 },
775 "showHeader": true
776 },
777 "pluginVersion": "10.2.6",
778 "targets": [
779 {
780 "datasource": {
781 "type": "prometheus",
782 "uid": "${DS_PROMETHEUS}"
783 },
784 "editorMode": "code",
785 "expr": "sum by (model) (ollama_requests_total)",
786 "format": "table",
787 "instant": true,
788 "legendFormat": "__auto",
789 "range": false,
790 "refId": "A"
791 },
792 {
793 "datasource": {
794 "type": "prometheus",
795 "uid": "${DS_PROMETHEUS}"
796 },
797 "editorMode": "code",
798 "expr": "sum by (model) (ollama_response_seconds_sum) / sum by (model) (ollama_response_seconds_count)",
799 "format": "table",
800 "instant": true,
801 "legendFormat": "__auto",
802 "range": false,
803 "refId": "B"
804 },
805 {
806 "datasource": {
807 "type": "prometheus",
808 "uid": "${DS_PROMETHEUS}"
809 },
810 "editorMode": "code",
811 "expr": "sum by (model) (ollama_tokens_per_second_sum) / sum by (model) (ollama_tokens_per_second_count)",
812 "format": "table",
813 "instant": true,
814 "legendFormat": "__auto",
815 "range": false,
816 "refId": "C"
817 }
818 ],
819 "title": "Model Performance Summary",
820 "transformations": [
821 {
822 "id": "merge",
823 "options": {}
824 },
825 {
826 "id": "organize",
827 "options": {
828 "excludeByName": {
829 "Time": true
830 },
831 "indexByName": {},
832 "renameByName": {
833 "Value #A": "Total Requests",
834 "Value #B": "Avg Response Time",
835 "Value #C": "Avg Tokens/Second",
836 "model": "Model"
837 }
838 }
839 }
840 ],
841 "type": "table"
842 }
843 ],
844 "refresh": "5s",
845 "schemaVersion": 39,
846 "tags": [
847 "ollama",
848 "ai",
849 "llm"
850 ],
851 "templating": {
852 "list": [
853 {
854 "current": {
855 "selected": false,
856 "text": "prometheus",
857 "value": "c09d1a89-4ff3-4c52-b8d5-dba793da5d90"
858 },
859 "hide": 0,
860 "includeAll": false,
861 "multi": false,
862 "name": "DS_PROMETHEUS",
863 "options": [],
864 "query": "prometheus",
865 "refresh": 1,
866 "regex": "",
867 "skipUrlSync": false,
868 "type": "datasource"
869 }
870 ]
871 },
872 "time": {
873 "from": "now-1h",
874 "to": "now"
875 },
876 "timepicker": {},
877 "timezone": "",
878 "title": "Ollama Performance Monitoring",
879 "uid": "ollama-dashboard",
880 "version": 1,
881 "weekStart": ""
882}