]> git.proxmox.com Git - ceph.git/blob - ceph/monitoring/ceph-mixin/dashboards_out/osds-overview.json
import quincy 17.2.0
[ceph.git] / ceph / monitoring / ceph-mixin / dashboards_out / osds-overview.json
1 {
2 "__inputs": [ ],
3 "__requires": [
4 {
5 "id": "grafana",
6 "name": "Grafana",
7 "type": "grafana",
8 "version": "5.0.0"
9 },
10 {
11 "id": "grafana-piechart-panel",
12 "name": "Pie Chart",
13 "type": "panel",
14 "version": "1.3.3"
15 },
16 {
17 "id": "graph",
18 "name": "Graph",
19 "type": "panel",
20 "version": "5.0.0"
21 },
22 {
23 "id": "table",
24 "name": "Table",
25 "type": "panel",
26 "version": "5.0.0"
27 }
28 ],
29 "annotations": {
30 "list": [
31 {
32 "builtIn": 1,
33 "datasource": "-- Grafana --",
34 "enable": true,
35 "hide": true,
36 "iconColor": "rgba(0, 211, 255, 1)",
37 "name": "Annotations & Alerts",
38 "showIn": 0,
39 "tags": [ ],
40 "type": "dashboard"
41 }
42 ]
43 },
44 "description": "",
45 "editable": false,
46 "gnetId": null,
47 "graphTooltip": 0,
48 "hideControls": false,
49 "id": null,
50 "links": [ ],
51 "panels": [
52 {
53 "aliasColors": {
54 "@95%ile": "#e0752d"
55 },
56 "bars": false,
57 "dashLength": 10,
58 "dashes": false,
59 "datasource": "$datasource",
60 "description": "",
61 "fill": 1,
62 "fillGradient": 0,
63 "gridPos": {
64 "h": 8,
65 "w": 8,
66 "x": 0,
67 "y": 0
68 },
69 "id": 2,
70 "legend": {
71 "alignAsTable": false,
72 "avg": false,
73 "current": false,
74 "max": false,
75 "min": false,
76 "rightSide": false,
77 "show": true,
78 "sideWidth": null,
79 "total": false,
80 "values": false
81 },
82 "lines": true,
83 "linewidth": 1,
84 "links": [ ],
85 "nullPointMode": "null",
86 "percentage": false,
87 "pointradius": 5,
88 "points": false,
89 "renderer": "flot",
90 "repeat": null,
91 "seriesOverrides": [ ],
92 "spaceLength": 10,
93 "stack": false,
94 "steppedLine": false,
95 "targets": [
96 {
97 "expr": "avg (irate(ceph_osd_op_r_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_r_latency_count[1m]) * 1000)",
98 "format": "time_series",
99 "intervalFactor": 1,
100 "legendFormat": "AVG read",
101 "refId": "A"
102 },
103 {
104 "expr": "max (irate(ceph_osd_op_r_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_r_latency_count[1m]) * 1000)",
105 "format": "time_series",
106 "intervalFactor": 1,
107 "legendFormat": "MAX read",
108 "refId": "B"
109 },
110 {
111 "expr": "quantile(0.95,\n (irate(ceph_osd_op_r_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_r_latency_count[1m]) * 1000)\n)",
112 "format": "time_series",
113 "intervalFactor": 1,
114 "legendFormat": "@95%ile",
115 "refId": "C"
116 }
117 ],
118 "thresholds": [ ],
119 "timeFrom": null,
120 "timeShift": null,
121 "title": "OSD Read Latencies",
122 "tooltip": {
123 "shared": true,
124 "sort": 0,
125 "value_type": "individual"
126 },
127 "type": "graph",
128 "xaxis": {
129 "buckets": null,
130 "mode": "time",
131 "name": null,
132 "show": true,
133 "values": [ ]
134 },
135 "yaxes": [
136 {
137 "format": "ms",
138 "label": null,
139 "logBase": 1,
140 "max": null,
141 "min": "0",
142 "show": true
143 },
144 {
145 "format": "short",
146 "label": null,
147 "logBase": 1,
148 "max": null,
149 "min": "0",
150 "show": true
151 }
152 ]
153 },
154 {
155 "columns": [ ],
156 "datasource": "$datasource",
157 "description": "This table shows the 10 OSDs with the highest read latencies in the cluster",
158 "gridPos": {
159 "h": 8,
160 "w": 4,
161 "x": 8,
162 "y": 0
163 },
164 "id": 3,
165 "links": [ ],
166 "sort": {
167 "col": 2,
168 "desc": true
169 },
170 "styles": [
171 {
172 "alias": "OSD ID",
173 "colorMode": null,
174 "colors": [
175 "rgba(245, 54, 54, 0.9)",
176 "rgba(237, 129, 40, 0.89)",
177 "rgba(50, 172, 45, 0.97)"
178 ],
179 "dateFormat": "YYYY-MM-DD HH:mm:ss",
180 "decimals": 2,
181 "mappingType": 1,
182 "pattern": "ceph_daemon",
183 "thresholds": [ ],
184 "type": "string",
185 "unit": "short",
186 "valueMaps": [ ]
187 },
188 {
189 "alias": "Latency (ms)",
190 "colorMode": null,
191 "colors": [
192 "rgba(245, 54, 54, 0.9)",
193 "rgba(237, 129, 40, 0.89)",
194 "rgba(50, 172, 45, 0.97)"
195 ],
196 "dateFormat": "YYYY-MM-DD HH:mm:ss",
197 "decimals": 2,
198 "mappingType": 1,
199 "pattern": "Value",
200 "thresholds": [ ],
201 "type": "number",
202 "unit": "none",
203 "valueMaps": [ ]
204 },
205 {
206 "alias": "",
207 "colorMode": null,
208 "colors": [
209 "rgba(245, 54, 54, 0.9)",
210 "rgba(237, 129, 40, 0.89)",
211 "rgba(50, 172, 45, 0.97)"
212 ],
213 "dateFormat": "YYYY-MM-DD HH:mm:ss",
214 "decimals": 2,
215 "mappingType": 1,
216 "pattern": "/.*/",
217 "thresholds": [ ],
218 "type": "hidden",
219 "unit": "short",
220 "valueMaps": [ ]
221 }
222 ],
223 "targets": [
224 {
225 "expr": "topk(10,\n (sort(\n (irate(ceph_osd_op_r_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_r_latency_count[1m]) * 1000)\n ))\n)\n\n",
226 "format": "table",
227 "instant": true,
228 "intervalFactor": 1,
229 "legendFormat": "",
230 "refId": "A"
231 }
232 ],
233 "timeFrom": null,
234 "timeShift": null,
235 "title": "Highest READ Latencies",
236 "transform": "table",
237 "type": "table"
238 },
239 {
240 "aliasColors": {
241 "@95%ile write": "#e0752d"
242 },
243 "bars": false,
244 "dashLength": 10,
245 "dashes": false,
246 "datasource": "$datasource",
247 "description": "",
248 "fill": 1,
249 "fillGradient": 0,
250 "gridPos": {
251 "h": 8,
252 "w": 8,
253 "x": 12,
254 "y": 0
255 },
256 "id": 4,
257 "legend": {
258 "alignAsTable": false,
259 "avg": false,
260 "current": false,
261 "max": false,
262 "min": false,
263 "rightSide": false,
264 "show": true,
265 "sideWidth": null,
266 "total": false,
267 "values": false
268 },
269 "lines": true,
270 "linewidth": 1,
271 "links": [ ],
272 "nullPointMode": "null",
273 "percentage": false,
274 "pointradius": 5,
275 "points": false,
276 "renderer": "flot",
277 "repeat": null,
278 "seriesOverrides": [ ],
279 "spaceLength": 10,
280 "stack": false,
281 "steppedLine": false,
282 "targets": [
283 {
284 "expr": "avg (irate(ceph_osd_op_w_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_w_latency_count[1m]) * 1000)",
285 "format": "time_series",
286 "intervalFactor": 1,
287 "legendFormat": "AVG write",
288 "refId": "A"
289 },
290 {
291 "expr": "max (irate(ceph_osd_op_w_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_w_latency_count[1m]) * 1000)",
292 "format": "time_series",
293 "intervalFactor": 1,
294 "legendFormat": "MAX write",
295 "refId": "B"
296 },
297 {
298 "expr": "quantile(0.95,\n (irate(ceph_osd_op_w_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_w_latency_count[1m]) * 1000)\n)",
299 "format": "time_series",
300 "intervalFactor": 1,
301 "legendFormat": "@95%ile write",
302 "refId": "C"
303 }
304 ],
305 "thresholds": [ ],
306 "timeFrom": null,
307 "timeShift": null,
308 "title": "OSD Write Latencies",
309 "tooltip": {
310 "shared": true,
311 "sort": 0,
312 "value_type": "individual"
313 },
314 "type": "graph",
315 "xaxis": {
316 "buckets": null,
317 "mode": "time",
318 "name": null,
319 "show": true,
320 "values": [ ]
321 },
322 "yaxes": [
323 {
324 "format": "ms",
325 "label": null,
326 "logBase": 1,
327 "max": null,
328 "min": "0",
329 "show": true
330 },
331 {
332 "format": "short",
333 "label": null,
334 "logBase": 1,
335 "max": null,
336 "min": "0",
337 "show": true
338 }
339 ]
340 },
341 {
342 "columns": [ ],
343 "datasource": "$datasource",
344 "description": "This table shows the 10 OSDs with the highest write latencies in the cluster",
345 "gridPos": {
346 "h": 8,
347 "w": 4,
348 "x": 20,
349 "y": 0
350 },
351 "id": 5,
352 "links": [ ],
353 "sort": {
354 "col": 2,
355 "desc": true
356 },
357 "styles": [
358 {
359 "alias": "OSD ID",
360 "colorMode": null,
361 "colors": [
362 "rgba(245, 54, 54, 0.9)",
363 "rgba(237, 129, 40, 0.89)",
364 "rgba(50, 172, 45, 0.97)"
365 ],
366 "dateFormat": "YYYY-MM-DD HH:mm:ss",
367 "decimals": 2,
368 "mappingType": 1,
369 "pattern": "ceph_daemon",
370 "thresholds": [ ],
371 "type": "string",
372 "unit": "short",
373 "valueMaps": [ ]
374 },
375 {
376 "alias": "Latency (ms)",
377 "colorMode": null,
378 "colors": [
379 "rgba(245, 54, 54, 0.9)",
380 "rgba(237, 129, 40, 0.89)",
381 "rgba(50, 172, 45, 0.97)"
382 ],
383 "dateFormat": "YYYY-MM-DD HH:mm:ss",
384 "decimals": 2,
385 "mappingType": 1,
386 "pattern": "Value",
387 "thresholds": [ ],
388 "type": "number",
389 "unit": "none",
390 "valueMaps": [ ]
391 },
392 {
393 "alias": "",
394 "colorMode": null,
395 "colors": [
396 "rgba(245, 54, 54, 0.9)",
397 "rgba(237, 129, 40, 0.89)",
398 "rgba(50, 172, 45, 0.97)"
399 ],
400 "dateFormat": "YYYY-MM-DD HH:mm:ss",
401 "decimals": 2,
402 "mappingType": 1,
403 "pattern": "/.*/",
404 "thresholds": [ ],
405 "type": "hidden",
406 "unit": "short",
407 "valueMaps": [ ]
408 }
409 ],
410 "targets": [
411 {
412 "expr": "topk(10,\n (sort(\n (irate(ceph_osd_op_w_latency_sum[1m]) / on (ceph_daemon) irate(ceph_osd_op_w_latency_count[1m]) * 1000)\n ))\n)\n\n",
413 "format": "table",
414 "instant": true,
415 "intervalFactor": 1,
416 "legendFormat": "",
417 "refId": "A"
418 }
419 ],
420 "timeFrom": null,
421 "timeShift": null,
422 "title": "Highest WRITE Latencies",
423 "transform": "table",
424 "type": "table"
425 },
426 {
427 "aliasColors": { },
428 "datasource": "$datasource",
429 "description": "",
430 "gridPos": {
431 "h": 8,
432 "w": 4,
433 "x": 0,
434 "y": 8
435 },
436 "id": 6,
437 "legend": {
438 "percentage": true,
439 "show": true,
440 "values": true
441 },
442 "legendType": "Under graph",
443 "pieType": "pie",
444 "targets": [
445 {
446 "expr": "count by (device_class) (ceph_osd_metadata)",
447 "format": "time_series",
448 "intervalFactor": 1,
449 "legendFormat": "{{device_class}}",
450 "refId": "A"
451 }
452 ],
453 "title": "OSD Types Summary",
454 "type": "grafana-piechart-panel",
455 "valueName": "current"
456 },
457 {
458 "aliasColors": {
459 "Non-Encrypted": "#E5AC0E"
460 },
461 "datasource": "$datasource",
462 "description": "",
463 "gridPos": {
464 "h": 8,
465 "w": 4,
466 "x": 4,
467 "y": 8
468 },
469 "id": 7,
470 "legend": {
471 "percentage": true,
472 "show": true,
473 "values": true
474 },
475 "legendType": "Under graph",
476 "pieType": "pie",
477 "targets": [
478 {
479 "expr": "count(ceph_bluefs_wal_total_bytes)",
480 "format": "time_series",
481 "intervalFactor": 2,
482 "legendFormat": "bluestore",
483 "refId": "A"
484 },
485 {
486 "expr": "absent(ceph_bluefs_wal_total_bytes)*count(ceph_osd_metadata)",
487 "format": "time_series",
488 "intervalFactor": 2,
489 "legendFormat": "filestore",
490 "refId": "B"
491 }
492 ],
493 "title": "OSD Objectstore Types",
494 "type": "grafana-piechart-panel",
495 "valueName": "current"
496 },
497 {
498 "aliasColors": { },
499 "datasource": "$datasource",
500 "description": "The pie chart shows the various OSD sizes used within the cluster",
501 "gridPos": {
502 "h": 8,
503 "w": 4,
504 "x": 8,
505 "y": 8
506 },
507 "id": 8,
508 "legend": {
509 "percentage": true,
510 "show": true,
511 "values": true
512 },
513 "legendType": "Under graph",
514 "pieType": "pie",
515 "targets": [
516 {
517 "expr": "count(ceph_osd_stat_bytes < 1099511627776)",
518 "format": "time_series",
519 "intervalFactor": 2,
520 "legendFormat": "<1TB",
521 "refId": "A"
522 },
523 {
524 "expr": "count(ceph_osd_stat_bytes >= 1099511627776 < 2199023255552)",
525 "format": "time_series",
526 "intervalFactor": 2,
527 "legendFormat": "<2TB",
528 "refId": "B"
529 },
530 {
531 "expr": "count(ceph_osd_stat_bytes >= 2199023255552 < 3298534883328)",
532 "format": "time_series",
533 "intervalFactor": 2,
534 "legendFormat": "<3TB",
535 "refId": "C"
536 },
537 {
538 "expr": "count(ceph_osd_stat_bytes >= 3298534883328 < 4398046511104)",
539 "format": "time_series",
540 "intervalFactor": 2,
541 "legendFormat": "<4TB",
542 "refId": "D"
543 },
544 {
545 "expr": "count(ceph_osd_stat_bytes >= 4398046511104 < 6597069766656)",
546 "format": "time_series",
547 "intervalFactor": 2,
548 "legendFormat": "<6TB",
549 "refId": "E"
550 },
551 {
552 "expr": "count(ceph_osd_stat_bytes >= 6597069766656 < 8796093022208)",
553 "format": "time_series",
554 "intervalFactor": 2,
555 "legendFormat": "<8TB",
556 "refId": "F"
557 },
558 {
559 "expr": "count(ceph_osd_stat_bytes >= 8796093022208 < 10995116277760)",
560 "format": "time_series",
561 "intervalFactor": 2,
562 "legendFormat": "<10TB",
563 "refId": "G"
564 },
565 {
566 "expr": "count(ceph_osd_stat_bytes >= 10995116277760 < 13194139533312)",
567 "format": "time_series",
568 "intervalFactor": 2,
569 "legendFormat": "<12TB",
570 "refId": "H"
571 },
572 {
573 "expr": "count(ceph_osd_stat_bytes >= 13194139533312)",
574 "format": "time_series",
575 "intervalFactor": 2,
576 "legendFormat": "12TB+",
577 "refId": "I"
578 }
579 ],
580 "title": "OSD Size Summary",
581 "type": "grafana-piechart-panel",
582 "valueName": "current"
583 },
584 {
585 "aliasColors": { },
586 "bars": true,
587 "dashLength": 10,
588 "dashes": false,
589 "datasource": "$datasource",
590 "fill": 1,
591 "fillGradient": 0,
592 "gridPos": {
593 "h": 8,
594 "w": 8,
595 "x": 12,
596 "y": 8
597 },
598 "id": 9,
599 "legend": {
600 "alignAsTable": false,
601 "avg": false,
602 "current": false,
603 "max": false,
604 "min": false,
605 "rightSide": false,
606 "show": true,
607 "sideWidth": null,
608 "total": false,
609 "values": false
610 },
611 "lines": true,
612 "linewidth": 1,
613 "links": [ ],
614 "nullPointMode": "null",
615 "percentage": false,
616 "pointradius": 5,
617 "points": false,
618 "renderer": "flot",
619 "repeat": null,
620 "seriesOverrides": [ ],
621 "spaceLength": 10,
622 "stack": false,
623 "steppedLine": false,
624 "targets": [
625 {
626 "expr": "ceph_osd_numpg\n",
627 "format": "time_series",
628 "instant": true,
629 "intervalFactor": 1,
630 "legendFormat": "PGs per OSD",
631 "refId": "A"
632 }
633 ],
634 "thresholds": [ ],
635 "timeFrom": null,
636 "timeShift": null,
637 "title": "Distribution of PGs per OSD",
638 "tooltip": {
639 "shared": true,
640 "sort": 0,
641 "value_type": "individual"
642 },
643 "type": "graph",
644 "xaxis": {
645 "buckets": 20,
646 "mode": "histogram",
647 "name": null,
648 "show": true,
649 "values": [ ]
650 },
651 "yaxes": [
652 {
653 "format": "short",
654 "label": "# of OSDs",
655 "logBase": 1,
656 "max": null,
657 "min": "0",
658 "show": true
659 },
660 {
661 "format": "short",
662 "label": null,
663 "logBase": 1,
664 "max": null,
665 "min": "0",
666 "show": true
667 }
668 ]
669 },
670 {
671 "cacheTimeout": null,
672 "colorBackground": false,
673 "colorValue": true,
674 "colors": [
675 "#d44a3a",
676 "#299c46"
677 ],
678 "datasource": "$datasource",
679 "description": "This gauge panel shows the onode hit ratio, which helps determine whether increasing RAM per OSD could improve the performance of the cluster",
680 "format": "percentunit",
681 "gauge": {
682 "maxValue": 1,
683 "minValue": 0,
684 "show": true,
685 "thresholdLabels": false,
686 "thresholdMarkers": true
687 },
688 "gridPos": {
689 "h": 8,
690 "w": 4,
691 "x": 20,
692 "y": 8
693 },
694 "id": 10,
695 "interval": null,
696 "links": [ ],
697 "mappingType": 1,
698 "mappingTypes": [
699 {
700 "name": "value to text",
701 "value": 1
702 },
703 {
704 "name": "range to text",
705 "value": 2
706 }
707 ],
708 "maxDataPoints": 100,
709 "nullPointMode": "connected",
710 "nullText": null,
711 "postfix": "",
712 "postfixFontSize": "50%",
713 "prefix": "",
714 "prefixFontSize": "50%",
715 "rangeMaps": [
716 {
717 "from": "null",
718 "text": "N/A",
719 "to": "null"
720 }
721 ],
722 "sparkline": {
723 "fillColor": "rgba(31, 118, 189, 0.18)",
724 "full": false,
725 "lineColor": "rgb(31, 120, 193)",
726 "show": false
727 },
728 "tableColumn": "",
729 "targets": [
730 {
731 "expr": "sum(ceph_bluestore_onode_hits)/(sum(ceph_bluestore_onode_hits) + sum(ceph_bluestore_onode_misses))",
732 "format": "time_series",
733 "intervalFactor": 1,
734 "legendFormat": "",
735 "refId": "A"
736 }
737 ],
738 "thresholds": ".75",
739 "title": "OSD onode Hits Ratio",
740 "type": "singlestat",
741 "valueFontSize": "80%",
742 "valueMaps": [
743 {
744 "op": "=",
745 "text": "N/A",
746 "value": "null"
747 }
748 ],
749 "valueName": "current"
750 },
751 {
752 "collapse": false,
753 "collapsed": false,
754 "gridPos": {
755 "h": 1,
756 "w": 24,
757 "x": 0,
758 "y": 16
759 },
760 "id": 11,
761 "panels": [ ],
762 "repeat": null,
763 "repeatIteration": null,
764 "repeatRowId": null,
765 "showTitle": true,
766 "title": "R/W Profile",
767 "titleSize": "h6",
768 "type": "row"
769 },
770 {
771 "aliasColors": { },
772 "bars": false,
773 "dashLength": 10,
774 "dashes": false,
775 "datasource": "$datasource",
776 "description": "Shows the read/write workload profile over time",
777 "fill": 1,
778 "fillGradient": 0,
779 "gridPos": {
780 "h": 8,
781 "w": 24,
782 "x": 0,
783 "y": 17
784 },
785 "id": 12,
786 "legend": {
787 "alignAsTable": false,
788 "avg": false,
789 "current": false,
790 "max": false,
791 "min": false,
792 "rightSide": false,
793 "show": true,
794 "sideWidth": null,
795 "total": false,
796 "values": false
797 },
798 "lines": true,
799 "linewidth": 1,
800 "links": [ ],
801 "nullPointMode": "null",
802 "percentage": false,
803 "pointradius": 5,
804 "points": false,
805 "renderer": "flot",
806 "repeat": null,
807 "seriesOverrides": [ ],
808 "spaceLength": 10,
809 "stack": false,
810 "steppedLine": false,
811 "targets": [
812 {
813 "expr": "round(sum(irate(ceph_pool_rd[30s])))",
814 "format": "time_series",
815 "intervalFactor": 1,
816 "legendFormat": "Reads",
817 "refId": "A"
818 },
819 {
820 "expr": "round(sum(irate(ceph_pool_wr[30s])))",
821 "format": "time_series",
822 "intervalFactor": 1,
823 "legendFormat": "Writes",
824 "refId": "B"
825 }
826 ],
827 "thresholds": [ ],
828 "timeFrom": null,
829 "timeShift": null,
830 "title": "Read/Write Profile",
831 "tooltip": {
832 "shared": true,
833 "sort": 0,
834 "value_type": "individual"
835 },
836 "type": "graph",
837 "xaxis": {
838 "buckets": null,
839 "mode": "time",
840 "name": null,
841 "show": true,
842 "values": [ ]
843 },
844 "yaxes": [
845 {
846 "format": "short",
847 "label": null,
848 "logBase": 1,
849 "max": null,
850 "min": null,
851 "show": true
852 },
853 {
854 "format": "short",
855 "label": null,
856 "logBase": 1,
857 "max": null,
858 "min": null,
859 "show": true
860 }
861 ]
862 }
863 ],
864 "refresh": "10s",
865 "rows": [ ],
866 "schemaVersion": 16,
867 "style": "dark",
868 "tags": [ ],
869 "templating": {
870 "list": [
871 {
872 "current": {
873 "text": "default",
874 "value": "default"
875 },
876 "hide": 0,
877 "label": "Data Source",
878 "name": "datasource",
879 "options": [ ],
880 "query": "prometheus",
881 "refresh": 1,
882 "regex": "",
883 "type": "datasource"
884 }
885 ]
886 },
887 "time": {
888 "from": "now-1h",
889 "to": "now"
890 },
891 "timepicker": {
892 "refresh_intervals": [
893 "5s",
894 "10s",
895 "30s",
896 "1m",
897 "5m",
898 "15m",
899 "30m",
900 "1h",
901 "2h",
902 "1d"
903 ],
904 "time_options": [
905 "5m",
906 "15m",
907 "1h",
908 "6h",
909 "12h",
910 "24h",
911 "2d",
912 "7d",
913 "30d"
914 ]
915 },
916 "timezone": "",
917 "title": "OSD Overview",
918 "uid": "lo02I1Aiz",
919 "version": 0
920 }