flake-update-20260201
1{
2 "annotations": {
3 "list": [
4 {
5 "builtIn": 1,
6 "datasource": {
7 "type": "grafana",
8 "uid": "-- Grafana --"
9 },
10 "enable": true,
11 "hide": true,
12 "iconColor": "rgba(0, 211, 255, 1)",
13 "name": "Annotations & Alerts",
14 "type": "dashboard"
15 }
16 ]
17 },
18 "editable": true,
19 "fiscalYearStartMonth": 0,
20 "graphTooltip": 0,
21 "id": 15,
22 "links": [],
23 "panels": [
24 {
25 "datasource": {
26 "type": "prometheus"
27 },
28 "fieldConfig": {
29 "defaults": {
30 "mappings": [],
31 "thresholds": {
32 "mode": "absolute",
33 "steps": [
34 {
35 "color": "green"
36 },
37 {
38 "color": "red",
39 "value": 80
40 }
41 ]
42 }
43 },
44 "overrides": []
45 },
46 "gridPos": {
47 "h": 3,
48 "w": 6,
49 "x": 0,
50 "y": 0
51 },
52 "id": 1,
53 "options": {
54 "colorMode": "value",
55 "graphMode": "area",
56 "justifyMode": "auto",
57 "orientation": "auto",
58 "percentChangeColorMode": "standard",
59 "reduceOptions": {
60 "calcs": [
61 "lastNotNull"
62 ],
63 "fields": "",
64 "values": false
65 },
66 "showPercentChange": false,
67 "textMode": "auto",
68 "wideLayout": true
69 },
70 "pluginVersion": "12.0.1",
71 "targets": [
72 {
73 "datasource": {
74 "type": "prometheus"
75 },
76 "expr": "sum by (model) (ollama_requests_total)",
77 "format": "time_series",
78 "refId": "A"
79 }
80 ],
81 "title": "Total Requests Per Model",
82 "type": "stat"
83 },
84 {
85 "datasource": {
86 "type": "prometheus"
87 },
88 "fieldConfig": {
89 "defaults": {
90 "custom": {
91 "hideFrom": {
92 "legend": false,
93 "tooltip": false,
94 "viz": false
95 },
96 "scaleDistribution": {
97 "type": "linear"
98 }
99 }
100 },
101 "overrides": []
102 },
103 "gridPos": {
104 "h": 15,
105 "w": 18,
106 "x": 6,
107 "y": 0
108 },
109 "id": 6,
110 "options": {
111 "calculate": false,
112 "cellGap": 1,
113 "color": {
114 "exponent": 0.5,
115 "fill": "dark-orange",
116 "mode": "scheme",
117 "reverse": true,
118 "scale": "exponential",
119 "scheme": "Oranges",
120 "steps": 64
121 },
122 "exemplars": {
123 "color": "rgba(255,0,255,0.7)"
124 },
125 "filterValues": {
126 "le": 1e-9
127 },
128 "legend": {
129 "show": true
130 },
131 "rowsFrame": {
132 "layout": "auto"
133 },
134 "tooltip": {
135 "mode": "single",
136 "showColorScale": false,
137 "yHistogram": false
138 },
139 "yAxis": {
140 "axisPlacement": "left",
141 "reverse": false,
142 "unit": "Tokens/s"
143 }
144 },
145 "pluginVersion": "12.0.1",
146 "targets": [
147 {
148 "datasource": {
149 "type": "prometheus"
150 },
151 "editorMode": "code",
152 "expr": "ollama_tokens_per_second_bucket",
153 "format": "heatmap",
154 "hide": false,
155 "instant": false,
156 "legendFormat": "__auto",
157 "range": true,
158 "refId": "A"
159 }
160 ],
161 "title": "Count of Responses by Tokens/s",
162 "type": "heatmap"
163 },
164 {
165 "datasource": {
166 "type": "prometheus"
167 },
168 "fieldConfig": {
169 "defaults": {
170 "color": {
171 "mode": "palette-classic"
172 },
173 "custom": {
174 "axisBorderShow": false,
175 "axisCenteredZero": false,
176 "axisColorMode": "text",
177 "axisLabel": "",
178 "axisPlacement": "auto",
179 "barAlignment": 0,
180 "barWidthFactor": 0.6,
181 "drawStyle": "points",
182 "fillOpacity": 0,
183 "gradientMode": "none",
184 "hideFrom": {
185 "legend": false,
186 "tooltip": false,
187 "viz": false
188 },
189 "insertNulls": false,
190 "lineInterpolation": "linear",
191 "lineWidth": 1,
192 "pointSize": 5,
193 "scaleDistribution": {
194 "type": "linear"
195 },
196 "showPoints": "auto",
197 "spanNulls": false,
198 "stacking": {
199 "group": "A",
200 "mode": "none"
201 },
202 "thresholdsStyle": {
203 "mode": "off"
204 }
205 },
206 "mappings": [],
207 "thresholds": {
208 "mode": "absolute",
209 "steps": [
210 {
211 "color": "green"
212 },
213 {
214 "color": "red",
215 "value": 80
216 }
217 ]
218 }
219 },
220 "overrides": []
221 },
222 "gridPos": {
223 "h": 3,
224 "w": 6,
225 "x": 0,
226 "y": 3
227 },
228 "id": 2,
229 "options": {
230 "legend": {
231 "calcs": [],
232 "displayMode": "list",
233 "placement": "bottom",
234 "showLegend": true
235 },
236 "tooltip": {
237 "hideZeros": false,
238 "mode": "single",
239 "sort": "none"
240 }
241 },
242 "pluginVersion": "12.0.1",
243 "targets": [
244 {
245 "datasource": {
246 "type": "prometheus"
247 },
248 "expr": "histogram_quantile(0.95, sum(rate(ollama_response_seconds_bucket[5m])) by (le, model))",
249 "format": "time_series",
250 "refId": "A"
251 }
252 ],
253 "title": "Response Time (Seconds)",
254 "type": "timeseries"
255 },
256 {
257 "datasource": {
258 "type": "prometheus"
259 },
260 "fieldConfig": {
261 "defaults": {
262 "mappings": [],
263 "thresholds": {
264 "mode": "absolute",
265 "steps": [
266 {
267 "color": "green"
268 },
269 {
270 "color": "red",
271 "value": 80
272 }
273 ]
274 }
275 },
276 "overrides": []
277 },
278 "gridPos": {
279 "h": 3,
280 "w": 6,
281 "x": 0,
282 "y": 6
283 },
284 "id": 3,
285 "options": {
286 "colorMode": "value",
287 "graphMode": "area",
288 "justifyMode": "auto",
289 "orientation": "auto",
290 "percentChangeColorMode": "standard",
291 "reduceOptions": {
292 "calcs": [
293 "lastNotNull"
294 ],
295 "fields": "",
296 "values": false
297 },
298 "showPercentChange": false,
299 "textMode": "auto",
300 "wideLayout": true
301 },
302 "pluginVersion": "12.0.1",
303 "targets": [
304 {
305 "datasource": {
306 "type": "prometheus"
307 },
308 "expr": "sum by (model) (rate(ollama_tokens_generated_total[5m]))",
309 "format": "time_series",
310 "refId": "A"
311 }
312 ],
313 "title": "Token Generation Rate Per Model (Tokens/s)",
314 "type": "stat"
315 },
316 {
317 "datasource": {
318 "type": "prometheus"
319 },
320 "fieldConfig": {
321 "defaults": {
322 "color": {
323 "mode": "palette-classic"
324 },
325 "custom": {
326 "axisBorderShow": false,
327 "axisCenteredZero": false,
328 "axisColorMode": "text",
329 "axisLabel": "",
330 "axisPlacement": "auto",
331 "barAlignment": 0,
332 "barWidthFactor": 0.6,
333 "drawStyle": "points",
334 "fillOpacity": 0,
335 "gradientMode": "none",
336 "hideFrom": {
337 "legend": false,
338 "tooltip": false,
339 "viz": false
340 },
341 "insertNulls": false,
342 "lineInterpolation": "linear",
343 "lineWidth": 1,
344 "pointSize": 5,
345 "scaleDistribution": {
346 "type": "linear"
347 },
348 "showPoints": "auto",
349 "spanNulls": false,
350 "stacking": {
351 "group": "A",
352 "mode": "none"
353 },
354 "thresholdsStyle": {
355 "mode": "off"
356 }
357 },
358 "mappings": [],
359 "thresholds": {
360 "mode": "absolute",
361 "steps": [
362 {
363 "color": "green"
364 },
365 {
366 "color": "red",
367 "value": 80
368 }
369 ]
370 }
371 },
372 "overrides": []
373 },
374 "gridPos": {
375 "h": 3,
376 "w": 6,
377 "x": 0,
378 "y": 9
379 },
380 "id": 4,
381 "options": {
382 "legend": {
383 "calcs": [],
384 "displayMode": "list",
385 "placement": "bottom",
386 "showLegend": true
387 },
388 "tooltip": {
389 "hideZeros": false,
390 "mode": "single",
391 "sort": "none"
392 }
393 },
394 "pluginVersion": "12.0.1",
395 "targets": [
396 {
397 "datasource": {
398 "type": "prometheus"
399 },
400 "expr": "sum by (model) (rate(ollama_eval_total[5m]))",
401 "format": "time_series",
402 "refId": "A"
403 }
404 ],
405 "title": "Evaluation Steps",
406 "type": "timeseries"
407 },
408 {
409 "datasource": {
410 "type": "prometheus",
411 "uid": "fenqsyb8rfke8c"
412 },
413 "fieldConfig": {
414 "defaults": {
415 "color": {
416 "mode": "palette-classic"
417 },
418 "custom": {
419 "axisBorderShow": false,
420 "axisCenteredZero": false,
421 "axisColorMode": "text",
422 "axisLabel": "",
423 "axisPlacement": "auto",
424 "barAlignment": 0,
425 "barWidthFactor": 0.6,
426 "drawStyle": "points",
427 "fillOpacity": 0,
428 "gradientMode": "none",
429 "hideFrom": {
430 "legend": false,
431 "tooltip": false,
432 "viz": false
433 },
434 "insertNulls": false,
435 "lineInterpolation": "linear",
436 "lineWidth": 1,
437 "pointSize": 5,
438 "scaleDistribution": {
439 "type": "linear"
440 },
441 "showPoints": "auto",
442 "spanNulls": false,
443 "stacking": {
444 "group": "A",
445 "mode": "none"
446 },
447 "thresholdsStyle": {
448 "mode": "off"
449 }
450 },
451 "mappings": [],
452 "thresholds": {
453 "mode": "absolute",
454 "steps": [
455 {
456 "color": "green"
457 },
458 {
459 "color": "red",
460 "value": 80
461 }
462 ]
463 }
464 },
465 "overrides": []
466 },
467 "gridPos": {
468 "h": 3,
469 "w": 6,
470 "x": 0,
471 "y": 12
472 },
473 "id": 5,
474 "options": {
475 "legend": {
476 "calcs": [],
477 "displayMode": "list",
478 "placement": "bottom",
479 "showLegend": true
480 },
481 "tooltip": {
482 "hideZeros": false,
483 "mode": "single",
484 "sort": "none"
485 }
486 },
487 "pluginVersion": "12.0.1",
488 "targets": [
489 {
490 "datasource": {
491 "type": "prometheus"
492 },
493 "expr": "histogram_quantile(0.95, sum(rate(ollama_load_time_seconds_bucket[5m])) by (le, model))",
494 "format": "time_series",
495 "refId": "A"
496 }
497 ],
498 "title": "Model Load Time (Seconds)",
499 "type": "timeseries"
500 }
501 ],
502 "preload": false,
503 "refresh": "5s",
504 "schemaVersion": 41,
505 "tags": [],
506 "templating": {
507 "list": []
508 },
509 "time": {
510 "from": "now-30m",
511 "to": "now"
512 },
513 "timepicker": {},
514 "timezone": "",
515 "title": "Ollama Metrics Dashboard",
516 "version": 2
517}