auto-update-daily-20260202
  1{
  2  "annotations": {
  3    "list": [
  4      {
  5        "builtIn": 1,
  6        "datasource": {
  7          "type": "grafana",
  8          "uid": "-- Grafana --"
  9        },
 10        "enable": true,
 11        "hide": true,
 12        "iconColor": "rgba(0, 211, 255, 1)",
 13        "name": "Annotations & Alerts",
 14        "type": "dashboard"
 15      }
 16    ]
 17  },
 18  "editable": true,
 19  "fiscalYearStartMonth": 0,
 20  "graphTooltip": 0,
 21  "id": 4,
 22  "links": [],
 23  "liveNow": false,
 24  "panels": [
 25    {
 26      "datasource": {
 27        "type": "prometheus",
 28        "uid": "${DS_PROMETHEUS}"
 29      },
 30      "fieldConfig": {
 31        "defaults": {
 32          "color": {
 33            "mode": "palette-classic"
 34          },
 35          "custom": {
 36            "axisBorderShow": false,
 37            "axisCenteredZero": false,
 38            "axisColorMode": "text",
 39            "axisLabel": "",
 40            "axisPlacement": "auto",
 41            "barAlignment": 0,
 42            "drawStyle": "line",
 43            "fillOpacity": 10,
 44            "gradientMode": "none",
 45            "hideFrom": {
 46              "legend": false,
 47              "tooltip": false,
 48              "vis": false,
 49              "viz": false
 50            },
 51            "insertNulls": false,
 52            "lineInterpolation": "linear",
 53            "lineWidth": 1,
 54            "pointSize": 5,
 55            "scaleDistribution": {
 56              "type": "linear"
 57            },
 58            "showPoints": "never",
 59            "spanNulls": false,
 60            "stacking": {
 61              "group": "A",
 62              "mode": "none"
 63            },
 64            "thresholdsStyle": {
 65              "mode": "off"
 66            }
 67          },
 68          "mappings": [],
 69          "thresholds": {
 70            "mode": "absolute",
 71            "steps": [
 72              {
 73                "color": "green",
 74                "value": null
 75              },
 76              {
 77                "color": "red",
 78                "value": 80
 79              }
 80            ]
 81          },
 82          "unit": "reqps"
 83        },
 84        "overrides": []
 85      },
 86      "gridPos": {
 87        "h": 8,
 88        "w": 12,
 89        "x": 0,
 90        "y": 0
 91      },
 92      "id": 1,
 93      "options": {
 94        "legend": {
 95          "calcs": [],
 96          "displayMode": "list",
 97          "placement": "bottom",
 98          "showLegend": true
 99        },
100        "tooltip": {
101          "mode": "single",
102          "sort": "none"
103        }
104      },
105      "targets": [
106        {
107          "datasource": {
108            "type": "prometheus",
109            "uid": "${DS_PROMETHEUS}"
110          },
111          "editorMode": "code",
112          "expr": "rate(ollama_requests_total[$__rate_interval])",
113          "instant": false,
114          "legendFormat": "{{model}}",
115          "range": true,
116          "refId": "A"
117        }
118      ],
119      "title": "Request Rate by Model",
120      "type": "timeseries"
121    },
122    {
123      "datasource": {
124        "type": "prometheus",
125        "uid": "${DS_PROMETHEUS}"
126      },
127      "fieldConfig": {
128        "defaults": {
129          "color": {
130            "mode": "thresholds"
131          },
132          "mappings": [],
133          "thresholds": {
134            "mode": "absolute",
135            "steps": [
136              {
137                "color": "green",
138                "value": null
139              },
140              {
141                "color": "red",
142                "value": 80
143              }
144            ]
145          },
146          "unit": "short"
147        },
148        "overrides": []
149      },
150      "gridPos": {
151        "h": 8,
152        "w": 12,
153        "x": 12,
154        "y": 0
155      },
156      "id": 2,
157      "options": {
158        "colorMode": "value",
159        "graphMode": "area",
160        "justifyMode": "auto",
161        "orientation": "auto",
162        "reduceOptions": {
163          "calcs": [
164            "lastNotNull"
165          ],
166          "fields": "",
167          "values": false
168        },
169        "textMode": "auto",
170        "wideLayout": true
171      },
172      "pluginVersion": "10.2.6",
173      "targets": [
174        {
175          "datasource": {
176            "type": "prometheus",
177            "uid": "${DS_PROMETHEUS}"
178          },
179          "editorMode": "code",
180          "expr": "ollama_requests_total",
181          "instant": false,
182          "legendFormat": "{{model}}",
183          "range": true,
184          "refId": "A"
185        }
186      ],
187      "title": "Total Requests by Model",
188      "type": "stat"
189    },
190    {
191      "datasource": {
192        "type": "prometheus",
193        "uid": "${DS_PROMETHEUS}"
194      },
195      "fieldConfig": {
196        "defaults": {
197          "color": {
198            "mode": "palette-classic"
199          },
200          "custom": {
201            "axisBorderShow": false,
202            "axisCenteredZero": false,
203            "axisColorMode": "text",
204            "axisLabel": "",
205            "axisPlacement": "auto",
206            "barAlignment": 0,
207            "drawStyle": "line",
208            "fillOpacity": 10,
209            "gradientMode": "none",
210            "hideFrom": {
211              "legend": false,
212              "tooltip": false,
213              "vis": false,
214              "viz": false
215            },
216            "insertNulls": false,
217            "lineInterpolation": "linear",
218            "lineWidth": 1,
219            "pointSize": 5,
220            "scaleDistribution": {
221              "type": "linear"
222            },
223            "showPoints": "never",
224            "spanNulls": false,
225            "stacking": {
226              "group": "A",
227              "mode": "none"
228            },
229            "thresholdsStyle": {
230              "mode": "off"
231            }
232          },
233          "mappings": [],
234          "thresholds": {
235            "mode": "absolute",
236            "steps": [
237              {
238                "color": "green",
239                "value": null
240              },
241              {
242                "color": "red",
243                "value": 80
244              }
245            ]
246          },
247          "unit": "s"
248        },
249        "overrides": []
250      },
251      "gridPos": {
252        "h": 8,
253        "w": 12,
254        "x": 0,
255        "y": 8
256      },
257      "id": 3,
258      "options": {
259        "legend": {
260          "calcs": [],
261          "displayMode": "list",
262          "placement": "bottom",
263          "showLegend": true
264        },
265        "tooltip": {
266          "mode": "single",
267          "sort": "none"
268        }
269      },
270      "targets": [
271        {
272          "datasource": {
273            "type": "prometheus",
274            "uid": "${DS_PROMETHEUS}"
275          },
276          "editorMode": "code",
277          "expr": "rate(ollama_response_seconds_sum[$__rate_interval]) / rate(ollama_response_seconds_count[$__rate_interval])",
278          "instant": false,
279          "legendFormat": "Average - {{model}}",
280          "range": true,
281          "refId": "A"
282        }
283      ],
284      "title": "Average Response Time",
285      "type": "timeseries"
286    },
287    {
288      "datasource": {
289        "type": "prometheus",
290        "uid": "${DS_PROMETHEUS}"
291      },
292      "fieldConfig": {
293        "defaults": {
294          "color": {
295            "mode": "palette-classic"
296          },
297          "custom": {
298            "axisBorderShow": false,
299            "axisCenteredZero": false,
300            "axisColorMode": "text",
301            "axisLabel": "",
302            "axisPlacement": "auto",
303            "barAlignment": 0,
304            "drawStyle": "line",
305            "fillOpacity": 10,
306            "gradientMode": "none",
307            "hideFrom": {
308              "legend": false,
309              "tooltip": false,
310              "vis": false,
311              "viz": false
312            },
313            "insertNulls": false,
314            "lineInterpolation": "linear",
315            "lineWidth": 1,
316            "pointSize": 5,
317            "scaleDistribution": {
318              "type": "linear"
319            },
320            "showPoints": "never",
321            "spanNulls": false,
322            "stacking": {
323              "group": "A",
324              "mode": "none"
325            },
326            "thresholdsStyle": {
327              "mode": "off"
328            }
329          },
330          "mappings": [],
331          "thresholds": {
332            "mode": "absolute",
333            "steps": [
334              {
335                "color": "green",
336                "value": null
337              },
338              {
339                "color": "red",
340                "value": 80
341              }
342            ]
343          },
344          "unit": "s"
345        },
346        "overrides": []
347      },
348      "gridPos": {
349        "h": 8,
350        "w": 12,
351        "x": 12,
352        "y": 8
353      },
354      "id": 4,
355      "options": {
356        "legend": {
357          "calcs": [],
358          "displayMode": "list",
359          "placement": "bottom",
360          "showLegend": true
361        },
362        "tooltip": {
363          "mode": "single",
364          "sort": "none"
365        }
366      },
367      "targets": [
368        {
369          "datasource": {
370            "type": "prometheus",
371            "uid": "${DS_PROMETHEUS}"
372          },
373          "editorMode": "code",
374          "expr": "rate(ollama_load_duration_seconds_sum[$__rate_interval]) / rate(ollama_load_duration_seconds_count[$__rate_interval])",
375          "instant": false,
376          "legendFormat": "Average Load Time - {{model}}",
377          "range": true,
378          "refId": "A"
379        }
380      ],
381      "title": "Average Model Load Time",
382      "type": "timeseries"
383    },
384    {
385      "datasource": {
386        "type": "prometheus",
387        "uid": "${DS_PROMETHEUS}"
388      },
389      "fieldConfig": {
390        "defaults": {
391          "color": {
392            "mode": "palette-classic"
393          },
394          "custom": {
395            "axisBorderShow": false,
396            "axisCenteredZero": false,
397            "axisColorMode": "text",
398            "axisLabel": "",
399            "axisPlacement": "auto",
400            "barAlignment": 0,
401            "drawStyle": "line",
402            "fillOpacity": 10,
403            "gradientMode": "none",
404            "hideFrom": {
405              "legend": false,
406              "tooltip": false,
407              "vis": false,
408              "viz": false
409            },
410            "insertNulls": false,
411            "lineInterpolation": "linear",
412            "lineWidth": 1,
413            "pointSize": 5,
414            "scaleDistribution": {
415              "type": "linear"
416            },
417            "showPoints": "never",
418            "spanNulls": false,
419            "stacking": {
420              "group": "A",
421              "mode": "none"
422            },
423            "thresholdsStyle": {
424              "mode": "off"
425            }
426          },
427          "mappings": [],
428          "thresholds": {
429            "mode": "absolute",
430            "steps": [
431              {
432                "color": "green",
433                "value": null
434              },
435              {
436                "color": "red",
437                "value": 80
438              }
439            ]
440          },
441          "unit": "tps"
442        },
443        "overrides": []
444      },
445      "gridPos": {
446        "h": 8,
447        "w": 12,
448        "x": 0,
449        "y": 16
450      },
451      "id": 5,
452      "options": {
453        "legend": {
454          "calcs": [],
455          "displayMode": "list",
456          "placement": "bottom",
457          "showLegend": true
458        },
459        "tooltip": {
460          "mode": "single",
461          "sort": "none"
462        }
463      },
464      "targets": [
465        {
466          "datasource": {
467            "type": "prometheus",
468            "uid": "${DS_PROMETHEUS}"
469          },
470          "editorMode": "code",
471          "expr": "rate(ollama_tokens_processed_total[$__rate_interval])",
472          "instant": false,
473          "legendFormat": "Input Tokens/s - {{model}}",
474          "range": true,
475          "refId": "A"
476        },
477        {
478          "datasource": {
479            "type": "prometheus",
480            "uid": "${DS_PROMETHEUS}"
481          },
482          "editorMode": "code",
483          "expr": "rate(ollama_tokens_generated_total[$__rate_interval])",
484          "instant": false,
485          "legendFormat": "Output Tokens/s - {{model}}",
486          "range": true,
487          "refId": "B"
488        }
489      ],
490      "title": "Token Processing Rate",
491      "type": "timeseries"
492    },
493    {
494      "datasource": {
495        "type": "prometheus",
496        "uid": "${DS_PROMETHEUS}"
497      },
498      "fieldConfig": {
499        "defaults": {
500          "color": {
501            "mode": "palette-classic"
502          },
503          "custom": {
504            "axisBorderShow": false,
505            "axisCenteredZero": false,
506            "axisColorMode": "text",
507            "axisLabel": "",
508            "axisPlacement": "auto",
509            "barAlignment": 0,
510            "drawStyle": "line",
511            "fillOpacity": 10,
512            "gradientMode": "none",
513            "hideFrom": {
514              "legend": false,
515              "tooltip": false,
516              "vis": false,
517              "viz": false
518            },
519            "insertNulls": false,
520            "lineInterpolation": "linear",
521            "lineWidth": 1,
522            "pointSize": 5,
523            "scaleDistribution": {
524              "type": "linear"
525            },
526            "showPoints": "never",
527            "spanNulls": false,
528            "stacking": {
529              "group": "A",
530              "mode": "none"
531            },
532            "thresholdsStyle": {
533              "mode": "off"
534            }
535          },
536          "mappings": [],
537          "thresholds": {
538            "mode": "absolute",
539            "steps": [
540              {
541                "color": "green",
542                "value": null
543              },
544              {
545                "color": "red",
546                "value": 80
547              }
548            ]
549          },
550          "unit": "tps"
551        },
552        "overrides": []
553      },
554      "gridPos": {
555        "h": 8,
556        "w": 12,
557        "x": 12,
558        "y": 16
559      },
560      "id": 6,
561      "options": {
562        "legend": {
563          "calcs": [],
564          "displayMode": "list",
565          "placement": "bottom",
566          "showLegend": true
567        },
568        "tooltip": {
569          "mode": "single",
570          "sort": "none"
571        }
572      },
573      "targets": [
574        {
575          "datasource": {
576            "type": "prometheus",
577            "uid": "${DS_PROMETHEUS}"
578          },
579          "editorMode": "code",
580          "expr": "rate(ollama_tokens_per_second_sum[$__rate_interval]) / rate(ollama_tokens_per_second_count[$__rate_interval])",
581          "instant": false,
582          "legendFormat": "Average - {{model}}",
583          "range": true,
584          "refId": "A"
585        }
586      ],
587      "title": "Average Generation Speed (Tokens/Second)",
588      "type": "timeseries"
589    },
590    {
591      "datasource": {
592        "type": "prometheus",
593        "uid": "${DS_PROMETHEUS}"
594      },
595      "fieldConfig": {
596        "defaults": {
597          "color": {
598            "mode": "palette-classic"
599          },
600          "custom": {
601            "axisBorderShow": false,
602            "axisCenteredZero": false,
603            "axisColorMode": "text",
604            "axisLabel": "",
605            "axisPlacement": "auto",
606            "barAlignment": 0,
607            "drawStyle": "line",
608            "fillOpacity": 10,
609            "gradientMode": "none",
610            "hideFrom": {
611              "legend": false,
612              "tooltip": false,
613              "vis": false,
614              "viz": false
615            },
616            "insertNulls": false,
617            "lineInterpolation": "linear",
618            "lineWidth": 1,
619            "pointSize": 5,
620            "scaleDistribution": {
621              "type": "linear"
622            },
623            "showPoints": "never",
624            "spanNulls": false,
625            "stacking": {
626              "group": "A",
627              "mode": "none"
628            },
629            "thresholdsStyle": {
630              "mode": "off"
631            }
632          },
633          "mappings": [],
634          "thresholds": {
635            "mode": "absolute",
636            "steps": [
637              {
638                "color": "green",
639                "value": null
640              },
641              {
642                "color": "red",
643                "value": 80
644              }
645            ]
646          },
647          "unit": "s"
648        },
649        "overrides": []
650      },
651      "gridPos": {
652        "h": 8,
653        "w": 12,
654        "x": 0,
655        "y": 24
656      },
657      "id": 7,
658      "options": {
659        "legend": {
660          "calcs": [],
661          "displayMode": "list",
662          "placement": "bottom",
663          "showLegend": true
664        },
665        "tooltip": {
666          "mode": "single",
667          "sort": "none"
668        }
669      },
670      "targets": [
671        {
672          "datasource": {
673            "type": "prometheus",
674            "uid": "${DS_PROMETHEUS}"
675          },
676          "editorMode": "code",
677          "expr": "rate(ollama_prompt_eval_duration_seconds_sum[$__rate_interval]) / rate(ollama_prompt_eval_duration_seconds_count[$__rate_interval])",
678          "instant": false,
679          "legendFormat": "Avg Prompt Eval - {{model}}",
680          "range": true,
681          "refId": "A"
682        },
683        {
684          "datasource": {
685            "type": "prometheus",
686            "uid": "${DS_PROMETHEUS}"
687          },
688          "editorMode": "code",
689          "expr": "rate(ollama_eval_duration_seconds_sum[$__rate_interval]) / rate(ollama_eval_duration_seconds_count[$__rate_interval])",
690          "instant": false,
691          "legendFormat": "Avg Response Gen - {{model}}",
692          "range": true,
693          "refId": "B"
694        }
695      ],
696      "title": "Average Processing Time Breakdown",
697      "type": "timeseries"
698    },
699    {
700      "datasource": {
701        "type": "prometheus",
702        "uid": "${DS_PROMETHEUS}"
703      },
704      "fieldConfig": {
705        "defaults": {
706          "color": {
707            "mode": "thresholds"
708          },
709          "custom": {
710            "align": "auto",
711            "cellOptions": {
712              "type": "auto"
713            },
714            "inspect": false
715          },
716          "mappings": [],
717          "thresholds": {
718            "mode": "absolute",
719            "steps": [
720              {
721                "color": "green",
722                "value": null
723              },
724              {
725                "color": "red",
726                "value": 80
727              }
728            ]
729          }
730        },
731        "overrides": [
732          {
733            "matcher": {
734              "id": "byName",
735              "options": "Avg Response Time"
736            },
737            "properties": [
738              {
739                "id": "unit",
740                "value": "s"
741              }
742            ]
743          },
744          {
745            "matcher": {
746              "id": "byName",
747              "options": "Avg Tokens/Second"
748            },
749            "properties": [
750              {
751                "id": "unit",
752                "value": "tps"
753              }
754            ]
755          }
756        ]
757      },
758      "gridPos": {
759        "h": 8,
760        "w": 12,
761        "x": 12,
762        "y": 24
763      },
764      "id": 8,
765      "options": {
766        "cellHeight": "sm",
767        "footer": {
768          "countRows": false,
769          "fields": "",
770          "reducer": [
771            "sum"
772          ],
773          "show": false
774        },
775        "showHeader": true
776      },
777      "pluginVersion": "10.2.6",
778      "targets": [
779        {
780          "datasource": {
781            "type": "prometheus",
782            "uid": "${DS_PROMETHEUS}"
783          },
784          "editorMode": "code",
785          "expr": "sum by (model) (ollama_requests_total)",
786          "format": "table",
787          "instant": true,
788          "legendFormat": "__auto",
789          "range": false,
790          "refId": "A"
791        },
792        {
793          "datasource": {
794            "type": "prometheus",
795            "uid": "${DS_PROMETHEUS}"
796          },
797          "editorMode": "code",
798          "expr": "sum by (model) (ollama_response_seconds_sum) / sum by (model) (ollama_response_seconds_count)",
799          "format": "table",
800          "instant": true,
801          "legendFormat": "__auto",
802          "range": false,
803          "refId": "B"
804        },
805        {
806          "datasource": {
807            "type": "prometheus",
808            "uid": "${DS_PROMETHEUS}"
809          },
810          "editorMode": "code",
811          "expr": "sum by (model) (ollama_tokens_per_second_sum) / sum by (model) (ollama_tokens_per_second_count)",
812          "format": "table",
813          "instant": true,
814          "legendFormat": "__auto",
815          "range": false,
816          "refId": "C"
817        }
818      ],
819      "title": "Model Performance Summary",
820      "transformations": [
821        {
822          "id": "merge",
823          "options": {}
824        },
825        {
826          "id": "organize",
827          "options": {
828            "excludeByName": {
829              "Time": true
830            },
831            "indexByName": {},
832            "renameByName": {
833              "Value #A": "Total Requests",
834              "Value #B": "Avg Response Time",
835              "Value #C": "Avg Tokens/Second",
836              "model": "Model"
837            }
838          }
839        }
840      ],
841      "type": "table"
842    }
843  ],
844  "refresh": "5s",
845  "schemaVersion": 39,
846  "tags": [
847    "ollama",
848    "ai",
849    "llm"
850  ],
851  "templating": {
852    "list": [
853      {
854        "current": {
855          "selected": false,
856          "text": "prometheus",
857          "value": "c09d1a89-4ff3-4c52-b8d5-dba793da5d90"
858        },
859        "hide": 0,
860        "includeAll": false,
861        "multi": false,
862        "name": "DS_PROMETHEUS",
863        "options": [],
864        "query": "prometheus",
865        "refresh": 1,
866        "regex": "",
867        "skipUrlSync": false,
868        "type": "datasource"
869      }
870    ]
871  },
872  "time": {
873    "from": "now-1h",
874    "to": "now"
875  },
876  "timepicker": {},
877  "timezone": "",
878  "title": "Ollama Performance Monitoring",
879  "uid": "ollama-dashboard",
880  "version": 1,
881  "weekStart": ""
882}