12 "iconColor": "rgba(0, 211, 255, 1)",
13 "name": "Annotations & Alerts",
24 "description": "Kafka resource usage and throughput",
26 "fiscalYearStartMonth": 0,
55 "title": "Healthcheck",
61 "uid": "PBFA97CFB590B2093"
63 "description": "Number of Brokers Online",
88 "color": "rgba(237, 129, 40, 0.89)",
109 "maxDataPoints": 100,
111 "colorMode": "value",
113 "justifyMode": "auto",
114 "orientation": "horizontal",
125 "pluginVersion": "10.0.3",
126 "repeatDirection": "h",
130 "type": "prometheus",
131 "uid": "PBFA97CFB590B2093"
133 "expr": "count(kafka_server_replicamanager_leadercount{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
134 "format": "time_series",
142 "title": "Brokers Online",
147 "type": "prometheus",
148 "uid": "PBFA97CFB590B2093"
150 "description": "Number of active controllers in the cluster.",
192 "maxDataPoints": 100,
194 "colorMode": "value",
196 "justifyMode": "auto",
197 "orientation": "vertical",
206 "textMode": "value_and_name"
208 "pluginVersion": "10.0.3",
212 "type": "prometheus",
213 "uid": "PBFA97CFB590B2093"
215 "expr": "kafka_controller_kafkacontroller_activecontrollercount{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"} > 0",
216 "format": "time_series",
220 "legendFormat": "{{instance}}",
224 "title": "Active Controllers",
229 "type": "prometheus",
230 "uid": "PBFA97CFB590B2093"
232 "description": "Partitions that are online",
257 "color": "rgba(237, 129, 40, 0.89)",
278 "maxDataPoints": 100,
280 "colorMode": "value",
282 "justifyMode": "auto",
283 "orientation": "horizontal",
294 "pluginVersion": "10.0.3",
298 "type": "prometheus",
299 "uid": "PBFA97CFB590B2093"
301 "expr": "sum(kafka_server_replicamanager_partitioncount{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
302 "format": "time_series",
310 "title": "Online Partitions",
315 "type": "prometheus",
316 "uid": "PBFA97CFB590B2093"
343 "color": "rgba(237, 129, 40, 0.89)",
363 "maxDataPoints": 100,
365 "colorMode": "value",
367 "justifyMode": "auto",
368 "orientation": "horizontal",
379 "pluginVersion": "10.0.3",
383 "type": "prometheus",
384 "uid": "PBFA97CFB590B2093"
386 "expr": "sum(kafka_controller_kafkacontroller_preferredreplicaimbalancecount{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
387 "format": "time_series",
395 "title": "Preferred Replica Imbalance",
400 "type": "prometheus",
401 "uid": "PBFA97CFB590B2093"
403 "description": "Unclean leader election rate",
428 "color": "rgba(237, 129, 40, 0.89)",
448 "maxDataPoints": 100,
450 "colorMode": "value",
452 "justifyMode": "auto",
453 "orientation": "horizontal",
464 "pluginVersion": "10.0.3",
468 "type": "prometheus",
469 "uid": "PBFA97CFB590B2093"
471 "expr": "sum(kafka_controller_controllerstats_uncleanleaderelectionspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
472 "format": "time_series",
480 "title": "Unclean Leader Election Rate",
485 "type": "prometheus",
486 "uid": "PBFA97CFB590B2093"
488 "description": "Number of under-replicated partitions (| ISR | < | all replicas |).",
513 "color": "rgba(237, 129, 40, 0.89)",
534 "maxDataPoints": 100,
536 "colorMode": "value",
538 "justifyMode": "auto",
539 "orientation": "horizontal",
550 "pluginVersion": "10.0.3",
554 "type": "prometheus",
555 "uid": "PBFA97CFB590B2093"
557 "editorMode": "code",
559 "expr": "sum(kafka_server_replicamanager_underreplicatedpartitions{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
560 "format": "time_series",
570 "title": "Under Replicated Partitions",
575 "type": "prometheus",
576 "uid": "PBFA97CFB590B2093"
582 "mode": "palette-classic"
585 "axisCenteredZero": false,
586 "axisColorMode": "text",
588 "axisPlacement": "auto",
592 "gradientMode": "none",
598 "lineInterpolation": "linear",
601 "scaleDistribution": {
604 "showPoints": "never",
658 "displayMode": "table",
659 "placement": "bottom",
667 "pluginVersion": "8.1.3",
671 "type": "prometheus",
672 "uid": "PBFA97CFB590B2093"
674 "editorMode": "code",
676 "expr": "kafka_server_replicamanager_underreplicatedpartitions{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}",
679 "legendFormat": "{{instance}}",
684 "title": "Underreplicated Partitions",
689 "type": "prometheus",
690 "uid": "PBFA97CFB590B2093"
696 "mode": "palette-classic"
735 "displayMode": "list",
736 "placement": "right",
755 "pluginVersion": "8.1.3",
759 "type": "prometheus",
760 "uid": "PBFA97CFB590B2093"
762 "editorMode": "code",
764 "expr": "kafka_server_replicamanager_leadercount{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}",
767 "legendFormat": "{{instance}}",
772 "title": "Leader Count",
777 "type": "prometheus",
778 "uid": "PBFA97CFB590B2093"
780 "description": "Number of partitions under min insync replicas.",
805 "color": "rgba(237, 129, 40, 0.89)",
826 "maxDataPoints": 100,
828 "colorMode": "value",
830 "justifyMode": "auto",
831 "orientation": "horizontal",
842 "pluginVersion": "10.0.3",
846 "type": "prometheus",
847 "uid": "PBFA97CFB590B2093"
849 "editorMode": "code",
850 "expr": "sum(kafka_cluster_partition_underminisr{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
851 "format": "time_series",
861 "title": "Under Min ISR Partitions",
866 "type": "prometheus",
867 "uid": "PBFA97CFB590B2093"
869 "description": "Number of partitions that don't have an active leader and are hence not writable or readable.",
915 "maxDataPoints": 100,
917 "colorMode": "value",
919 "justifyMode": "auto",
920 "orientation": "horizontal",
931 "pluginVersion": "10.0.3",
935 "type": "prometheus",
936 "uid": "PBFA97CFB590B2093"
938 "editorMode": "code",
939 "expr": "sum(kafka_controller_kafkacontroller_offlinepartitionscount{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
940 "format": "time_series",
949 "title": "Offline Partitions Count",
955 "type": "datasource",
968 "type": "prometheus",
969 "uid": "PBFA97CFB590B2093"
974 "mode": "palette-classic"
977 "axisCenteredZero": false,
978 "axisColorMode": "text",
979 "axisLabel": "Cores",
980 "axisPlacement": "auto",
984 "gradientMode": "none",
990 "lineInterpolation": "linear",
993 "scaleDistribution": {
996 "showPoints": "never",
1002 "thresholdsStyle": {
1026 "options": "localhost:7071"
1032 "fixedColor": "#629E51",
1055 "displayMode": "table",
1056 "placement": "bottom",
1064 "pluginVersion": "8.1.3",
1068 "type": "prometheus",
1069 "uid": "PBFA97CFB590B2093"
1071 "expr": "irate(process_cpu_seconds_total{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}[5m])*100",
1072 "format": "time_series",
1074 "intervalFactor": 2,
1075 "legendFormat": "{{instance}}",
1076 "metric": "process_cpu_secondspersec",
1081 "title": "CPU Usage",
1082 "type": "timeseries"
1086 "type": "prometheus",
1087 "uid": "PBFA97CFB590B2093"
1092 "mode": "palette-classic"
1095 "axisCenteredZero": false,
1096 "axisColorMode": "text",
1097 "axisLabel": "Memory",
1098 "axisPlacement": "auto",
1100 "drawStyle": "line",
1102 "gradientMode": "none",
1108 "lineInterpolation": "linear",
1111 "scaleDistribution": {
1114 "showPoints": "never",
1120 "thresholdsStyle": {
1144 "options": "localhost:7071"
1150 "fixedColor": "#BA43A9",
1157 "__systemRef": "hideSeriesFrom",
1165 "prefix": "All except:",
1171 "id": "custom.hideFrom",
1197 "displayMode": "table",
1198 "placement": "bottom",
1206 "pluginVersion": "8.1.3",
1210 "type": "prometheus",
1211 "uid": "PBFA97CFB590B2093"
1213 "expr": "sum without(area)(jvm_memory_bytes_used{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
1215 "intervalFactor": 2,
1216 "legendFormat": "{{instance}}",
1217 "metric": "jvm_memory_bytes_used",
1223 "type": "prometheus",
1224 "uid": "PBFA97CFB590B2093"
1226 "expr": "jvm_memory_bytes_max{job=\"kafka-broker\",area=\"heap\",env=\"$env\",instance=~\"$instance\"}",
1228 "legendFormat": "{{instance}}",
1232 "title": "JVM Memory Used",
1233 "type": "timeseries"
1237 "type": "prometheus",
1238 "uid": "PBFA97CFB590B2093"
1243 "mode": "palette-classic"
1246 "axisCenteredZero": false,
1247 "axisColorMode": "text",
1248 "axisLabel": "% time in GC",
1249 "axisPlacement": "auto",
1251 "drawStyle": "line",
1253 "gradientMode": "none",
1259 "lineInterpolation": "linear",
1262 "scaleDistribution": {
1265 "showPoints": "never",
1271 "thresholdsStyle": {
1289 "unit": "percentunit"
1295 "options": "localhost:7071"
1301 "fixedColor": "#890F02",
1324 "displayMode": "table",
1325 "placement": "bottom",
1333 "pluginVersion": "8.1.3",
1337 "type": "prometheus",
1338 "uid": "PBFA97CFB590B2093"
1340 "expr": "sum without(gc)(rate(jvm_gc_collection_seconds_sum{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}[5m]))",
1342 "intervalFactor": 2,
1343 "legendFormat": "{{instance}}",
1344 "metric": "jvm_gc_collection_seconds_sum",
1349 "title": "Time spent in GC",
1350 "type": "timeseries"
1356 "type": "datasource",
1368 "type": "datasource",
1382 "type": "datasource",
1388 "title": "Throughput & Request rate",
1393 "type": "prometheus",
1394 "uid": "PBFA97CFB590B2093"
1399 "mode": "palette-classic"
1402 "axisCenteredZero": false,
1403 "axisColorMode": "text",
1404 "axisLabel": "Bytes/s",
1405 "axisPlacement": "auto",
1407 "drawStyle": "line",
1409 "gradientMode": "none",
1415 "lineInterpolation": "linear",
1418 "scaleDistribution": {
1421 "showPoints": "never",
1427 "thresholdsStyle": {
1465 "displayMode": "list",
1466 "placement": "bottom",
1474 "pluginVersion": "8.1.3",
1478 "type": "prometheus",
1479 "uid": "PBFA97CFB590B2093"
1481 "expr": "sum(rate(kafka_server_brokertopicmetrics_bytesinpersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",topic!=\"\"}[5m]))",
1482 "format": "time_series",
1484 "intervalFactor": 2,
1485 "legendFormat": "Bytes in",
1486 "metric": "kafka_server_brokertopicmetrics_bytesinpersec",
1492 "type": "prometheus",
1493 "uid": "PBFA97CFB590B2093"
1495 "expr": "sum(rate(kafka_server_brokertopicmetrics_bytesoutpersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",topic!=\"\"}[5m]))",
1496 "format": "time_series",
1499 "intervalFactor": 2,
1500 "legendFormat": "Bytes out",
1501 "metric": "kafka_server_brokertopicmetrics_bytesoutpersec",
1506 "title": "Broker network throughput",
1507 "type": "timeseries"
1511 "type": "prometheus",
1512 "uid": "PBFA97CFB590B2093"
1514 "description": "Total request rate across all request types.",
1549 "maxDataPoints": 100,
1551 "colorMode": "value",
1552 "graphMode": "area",
1553 "justifyMode": "auto",
1554 "orientation": "horizontal",
1565 "pluginVersion": "10.0.3",
1569 "type": "prometheus",
1570 "uid": "PBFA97CFB590B2093"
1572 "expr": "sum(rate(kafka_network_requestmetrics_requestspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}[5m]))",
1578 "title": "All Request Per Sec",
1583 "type": "prometheus",
1584 "uid": "PBFA97CFB590B2093"
1586 "description": "Fetch request rate.",
1621 "maxDataPoints": 100,
1623 "colorMode": "value",
1624 "graphMode": "area",
1625 "justifyMode": "auto",
1626 "orientation": "horizontal",
1637 "pluginVersion": "10.0.3",
1641 "type": "prometheus",
1642 "uid": "PBFA97CFB590B2093"
1644 "expr": "sum(rate(kafka_network_requestmetrics_requestspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",request=\"FetchConsumer\"}[5m]))",
1650 "title": "Consumer Fetch Request Per Sec",
1655 "type": "prometheus",
1656 "uid": "PBFA97CFB590B2093"
1658 "description": "Produce request rate.",
1693 "maxDataPoints": 100,
1695 "colorMode": "value",
1696 "graphMode": "area",
1697 "justifyMode": "auto",
1698 "orientation": "horizontal",
1709 "pluginVersion": "10.0.3",
1713 "type": "prometheus",
1714 "uid": "PBFA97CFB590B2093"
1716 "expr": "sum(rate(kafka_network_requestmetrics_requestspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",request=\"Produce\"}[5m]))",
1722 "title": "Produce Request Per Sec",
1727 "type": "prometheus",
1728 "uid": "PBFA97CFB590B2093"
1730 "description": "Metadata request rate.",
1765 "maxDataPoints": 100,
1767 "colorMode": "value",
1768 "graphMode": "area",
1769 "justifyMode": "auto",
1770 "orientation": "horizontal",
1781 "pluginVersion": "10.0.3",
1785 "type": "prometheus",
1786 "uid": "PBFA97CFB590B2093"
1788 "expr": "sum(rate(kafka_network_requestmetrics_requestspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",request=\"Metadata\"}[5m]))",
1794 "title": "Metadata Request Per Sec",
1799 "type": "prometheus",
1800 "uid": "PBFA97CFB590B2093"
1802 "description": "Offset Commit request rate.",
1837 "maxDataPoints": 100,
1839 "colorMode": "value",
1840 "graphMode": "area",
1841 "justifyMode": "auto",
1842 "orientation": "horizontal",
1853 "pluginVersion": "10.0.3",
1857 "type": "prometheus",
1858 "uid": "PBFA97CFB590B2093"
1860 "expr": "sum(rate(kafka_network_requestmetrics_requestspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",request=\"OffsetCommit\"}[5m]))",
1866 "title": "Offset Commit Request Per Sec",
1871 "type": "prometheus",
1872 "uid": "PBFA97CFB590B2093"
1874 "description": "Fetch request rate.",
1909 "maxDataPoints": 100,
1911 "colorMode": "value",
1912 "graphMode": "area",
1913 "justifyMode": "auto",
1914 "orientation": "horizontal",
1925 "pluginVersion": "10.0.3",
1929 "type": "prometheus",
1930 "uid": "PBFA97CFB590B2093"
1932 "expr": "sum(rate(kafka_network_requestmetrics_requestspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",request=\"Fetch\"}[5m]))",
1938 "title": "Broker Fetch Request Per Sec",
1944 "type": "datasource",
1958 "type": "datasource",
1964 "title": "Throughput In/Out",
1969 "type": "prometheus",
1970 "uid": "PBFA97CFB590B2093"
1975 "mode": "palette-classic"
1978 "axisCenteredZero": false,
1979 "axisColorMode": "text",
1980 "axisLabel": "Messages/s",
1981 "axisPlacement": "auto",
1983 "drawStyle": "line",
1985 "gradientMode": "none",
1991 "lineInterpolation": "linear",
1994 "scaleDistribution": {
1997 "showPoints": "never",
2003 "thresholdsStyle": {
2038 "displayMode": "table",
2039 "placement": "bottom",
2047 "pluginVersion": "8.1.3",
2051 "type": "prometheus",
2052 "uid": "PBFA97CFB590B2093"
2055 "expr": "sum without(instance,topic)(rate(kafka_server_brokertopicmetrics_messagesinpersec{job=\"kafka-broker\",env=\"$env\",topic!=\"\"}[5m]))",
2057 "intervalFactor": 2,
2058 "legendFormat": "messages/sec",
2059 "metric": "kafka_server_brokertopicmetrics_messagesinpersec",
2064 "title": "Messages In",
2065 "type": "timeseries"
2069 "type": "prometheus",
2070 "uid": "PBFA97CFB590B2093"
2075 "mode": "palette-classic"
2078 "axisCenteredZero": false,
2079 "axisColorMode": "text",
2080 "axisLabel": "Bytes/s",
2081 "axisPlacement": "auto",
2083 "drawStyle": "line",
2085 "gradientMode": "none",
2091 "lineInterpolation": "linear",
2094 "scaleDistribution": {
2097 "showPoints": "never",
2103 "thresholdsStyle": {
2142 "displayMode": "table",
2143 "placement": "bottom",
2151 "pluginVersion": "8.1.3",
2155 "type": "prometheus",
2156 "uid": "PBFA97CFB590B2093"
2159 "expr": "sum without(instance,topic)(rate(kafka_server_brokertopicmetrics_bytesinpersec{job=\"kafka-broker\",env=\"$env\",topic!=\"\"}[5m]))",
2160 "format": "time_series",
2162 "intervalFactor": 2,
2163 "legendFormat": "bytes/sec",
2164 "metric": "kafka_server_brokertopicmetrics_bytesinpersec",
2169 "title": "Bytes In",
2170 "type": "timeseries"
2174 "type": "prometheus",
2175 "uid": "PBFA97CFB590B2093"
2180 "mode": "palette-classic"
2183 "axisCenteredZero": false,
2184 "axisColorMode": "text",
2185 "axisLabel": "Bytes/s",
2186 "axisPlacement": "auto",
2188 "drawStyle": "line",
2190 "gradientMode": "none",
2196 "lineInterpolation": "linear",
2199 "scaleDistribution": {
2202 "showPoints": "never",
2208 "thresholdsStyle": {
2247 "displayMode": "table",
2248 "placement": "bottom",
2256 "pluginVersion": "8.1.3",
2260 "type": "prometheus",
2261 "uid": "PBFA97CFB590B2093"
2264 "expr": "sum without(instance,topic)(rate(kafka_server_brokertopicmetrics_bytesoutpersec{job=\"kafka-broker\",env=\"$env\",topic!=\"\"}[5m]))",
2266 "intervalFactor": 2,
2267 "legendFormat": "bytes/sec",
2268 "metric": "kafka_server_brokertopicmetrics_bytesoutpersec",
2273 "title": "Bytes Out",
2274 "type": "timeseries"
2278 "type": "prometheus",
2279 "uid": "PBFA97CFB590B2093"
2284 "mode": "palette-classic"
2287 "axisCenteredZero": false,
2288 "axisColorMode": "text",
2289 "axisLabel": "Messages/s",
2290 "axisPlacement": "auto",
2292 "drawStyle": "line",
2294 "gradientMode": "none",
2300 "lineInterpolation": "linear",
2303 "scaleDistribution": {
2306 "showPoints": "never",
2312 "thresholdsStyle": {
2350 "displayMode": "table",
2351 "placement": "bottom",
2359 "pluginVersion": "8.1.3",
2363 "type": "prometheus",
2364 "uid": "PBFA97CFB590B2093"
2366 "expr": "sum without(topic)(rate(kafka_server_brokertopicmetrics_messagesinpersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",topic!=\"\"}[5m]))",
2367 "format": "time_series",
2369 "intervalFactor": 2,
2370 "legendFormat": "{{instance}}",
2371 "metric": "kafka_server_brokertopicmetrics_messagesinpersec",
2376 "title": "Messages In Per Broker",
2377 "type": "timeseries"
2381 "type": "prometheus",
2382 "uid": "PBFA97CFB590B2093"
2387 "mode": "palette-classic"
2390 "axisCenteredZero": false,
2391 "axisColorMode": "text",
2392 "axisLabel": "Bytes/s",
2393 "axisPlacement": "auto",
2395 "drawStyle": "line",
2397 "gradientMode": "none",
2403 "lineInterpolation": "linear",
2406 "scaleDistribution": {
2409 "showPoints": "never",
2415 "thresholdsStyle": {
2453 "displayMode": "table",
2454 "placement": "bottom",
2462 "pluginVersion": "8.1.3",
2466 "type": "prometheus",
2467 "uid": "PBFA97CFB590B2093"
2469 "expr": "sum without(topic)(rate(kafka_server_brokertopicmetrics_bytesinpersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",topic!=\"\"}[5m]))",
2470 "format": "time_series",
2472 "intervalFactor": 2,
2473 "legendFormat": "{{instance}}",
2474 "metric": "kafka_server_brokertopicmetrics_bytesinpersec",
2479 "title": "Bytes In Per Broker",
2480 "type": "timeseries"
2484 "type": "prometheus",
2485 "uid": "PBFA97CFB590B2093"
2490 "mode": "palette-classic"
2493 "axisCenteredZero": false,
2494 "axisColorMode": "text",
2496 "axisPlacement": "auto",
2498 "drawStyle": "line",
2500 "gradientMode": "none",
2506 "lineInterpolation": "linear",
2509 "scaleDistribution": {
2512 "showPoints": "never",
2518 "thresholdsStyle": {
2557 "displayMode": "table",
2558 "placement": "bottom",
2566 "pluginVersion": "8.1.3",
2570 "type": "prometheus",
2571 "uid": "PBFA97CFB590B2093"
2573 "expr": "sum without(topic)(rate(kafka_server_brokertopicmetrics_bytesoutpersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",topic!=\"\"}[5m]))",
2574 "format": "time_series",
2576 "intervalFactor": 1,
2577 "legendFormat": "{{instance}}",
2581 "title": "Bytes Out Per Broker",
2582 "type": "timeseries"
2587 "type": "datasource",
2601 "type": "datasource",
2607 "title": "Thread utilization",
2612 "type": "prometheus",
2613 "uid": "PBFA97CFB590B2093"
2615 "description": "Average fraction of time the network processor threads are busy, computed as 1 minus the average idle fraction. Values are between 0 (all resources are available) and 1 (all resources are used), displayed as a percentage.\n",
2619 "mode": "palette-classic"
2622 "axisCenteredZero": false,
2623 "axisColorMode": "text",
2625 "axisPlacement": "auto",
2627 "drawStyle": "line",
2629 "gradientMode": "none",
2635 "lineInterpolation": "linear",
2638 "scaleDistribution": {
2641 "showPoints": "never",
2647 "thresholdsStyle": {
2666 "unit": "percentunit"
2684 "displayMode": "table",
2685 "placement": "bottom",
2693 "pluginVersion": "8.1.3",
2697 "type": "prometheus",
2698 "uid": "PBFA97CFB590B2093"
2700 "expr": "1-kafka_network_socketserver_networkprocessoravgidlepercent{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}",
2702 "legendFormat": "{{instance}}",
2706 "title": "Network Processor Avg Usage Percent",
2707 "type": "timeseries"
2711 "type": "prometheus",
2712 "uid": "PBFA97CFB590B2093"
2714 "description": "Average fraction of time the request handler threads are busy, computed as 1 minus the average idle fraction. Values are between 0 (all resources are available) and 1 (all resources are used), displayed as a percentage.\n",
2718 "mode": "palette-classic"
2721 "axisCenteredZero": false,
2722 "axisColorMode": "text",
2724 "axisPlacement": "auto",
2726 "drawStyle": "line",
2728 "gradientMode": "none",
2734 "lineInterpolation": "linear",
2737 "scaleDistribution": {
2740 "showPoints": "never",
2746 "thresholdsStyle": {
2766 "unit": "percentunit"
2784 "displayMode": "table",
2785 "placement": "bottom",
2793 "pluginVersion": "8.1.3",
2797 "type": "prometheus",
2798 "uid": "PBFA97CFB590B2093"
2800 "expr": "1 - kafka_server_kafkarequesthandlerpool_requesthandleravgidlepercent_total{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}",
2802 "legendFormat": "{{instance}}",
2806 "title": "Request Handler Avg Percent",
2807 "type": "timeseries"
2812 "type": "datasource",
2826 "type": "datasource",
2832 "title": "Isr Shrinks / Expands",
2837 "type": "prometheus",
2838 "uid": "PBFA97CFB590B2093"
2840 "description": "The number of in-sync replicas (ISRs) for a particular partition should remain fairly static; the only exceptions are when you are expanding your broker cluster or removing partitions. In order to maintain high availability, a healthy Kafka cluster requires a minimum number of ISRs for failover. A replica could be removed from the ISR pool for a couple of reasons: it is too far behind the leader's offset (user-configurable by setting the replica.lag.max.messages configuration parameter), or it has not contacted the leader for some time (configurable with the replica.socket.timeout.ms parameter). No matter the reason, an increase in IsrShrinksPerSec without a corresponding increase in IsrExpandsPerSec shortly thereafter is cause for concern and requires user intervention. The Kafka documentation provides a wealth of information on the user-configurable parameters for brokers.",
2844 "mode": "palette-classic"
2847 "axisCenteredZero": false,
2848 "axisColorMode": "text",
2850 "axisPlacement": "auto",
2852 "drawStyle": "line",
2854 "gradientMode": "none",
2860 "lineInterpolation": "linear",
2863 "scaleDistribution": {
2866 "showPoints": "never",
2872 "thresholdsStyle": {
2896 "__systemRef": "hideSeriesFrom",
2904 "prefix": "All except:",
2910 "id": "custom.hideFrom",
2935 "displayMode": "table",
2936 "placement": "bottom",
2944 "pluginVersion": "8.1.3",
2948 "type": "prometheus",
2949 "uid": "PBFA97CFB590B2093"
2951 "expr": "rate(kafka_server_replicamanager_isrshrinkspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}[5m])",
2953 "legendFormat": "{{instance}}",
2957 "title": "IsrShrinks per Sec",
2958 "type": "timeseries"
2962 "type": "prometheus",
2963 "uid": "PBFA97CFB590B2093"
2965 "description": "The number of in-sync replicas (ISRs) for a particular partition should remain fairly static; the only exceptions are when you are expanding your broker cluster or removing partitions. In order to maintain high availability, a healthy Kafka cluster requires a minimum number of ISRs for failover. A replica could be removed from the ISR pool for a couple of reasons: it is too far behind the leader's offset (user-configurable by setting the replica.lag.max.messages configuration parameter), or it has not contacted the leader for some time (configurable with the replica.socket.timeout.ms parameter). No matter the reason, an increase in IsrShrinksPerSec without a corresponding increase in IsrExpandsPerSec shortly thereafter is cause for concern and requires user intervention. The Kafka documentation provides a wealth of information on the user-configurable parameters for brokers.",
2969 "mode": "palette-classic"
2972 "axisCenteredZero": false,
2973 "axisColorMode": "text",
2975 "axisPlacement": "auto",
2977 "drawStyle": "line",
2979 "gradientMode": "none",
2985 "lineInterpolation": "linear",
2988 "scaleDistribution": {
2991 "showPoints": "never",
2997 "thresholdsStyle": {
3021 "__systemRef": "hideSeriesFrom",
3029 "prefix": "All except:",
3035 "id": "custom.hideFrom",
3060 "displayMode": "table",
3061 "placement": "bottom",
3069 "pluginVersion": "8.1.3",
3073 "type": "prometheus",
3074 "uid": "PBFA97CFB590B2093"
3076 "expr": "rate(kafka_server_replicamanager_isrexpandspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}[5m])",
3079 "legendFormat": "{{instance}}",
3083 "title": "IsrExpands per Sec",
3084 "type": "timeseries"
3089 "type": "datasource",
3103 "type": "datasource",
3109 "title": "Logs size",
3114 "type": "prometheus",
3115 "uid": "PBFA97CFB590B2093"
3120 "mode": "palette-classic"
3123 "axisCenteredZero": false,
3124 "axisColorMode": "text",
3126 "axisPlacement": "auto",
3128 "drawStyle": "line",
3130 "gradientMode": "none",
3136 "lineInterpolation": "linear",
3139 "scaleDistribution": {
3142 "showPoints": "never",
3148 "thresholdsStyle": {
3185 "displayMode": "table",
3186 "placement": "bottom",
3194 "pluginVersion": "8.1.3",
3198 "type": "prometheus",
3199 "uid": "PBFA97CFB590B2093"
3201 "expr": "sum(kafka_log_log_size{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}) by (topic)",
3202 "legendFormat": "{{topic}}",
3206 "title": "Log size per Topic",
3207 "type": "timeseries"
3211 "type": "prometheus",
3212 "uid": "PBFA97CFB590B2093"
3217 "mode": "palette-classic"
3220 "axisCenteredZero": false,
3221 "axisColorMode": "text",
3223 "axisPlacement": "auto",
3225 "drawStyle": "line",
3227 "gradientMode": "none",
3233 "lineInterpolation": "linear",
3236 "scaleDistribution": {
3239 "showPoints": "never",
3245 "thresholdsStyle": {
3282 "displayMode": "table",
3283 "placement": "bottom",
3291 "pluginVersion": "8.1.3",
3295 "type": "prometheus",
3296 "uid": "PBFA97CFB590B2093"
3298 "expr": "sum(kafka_log_log_size{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"}) by (instance)",
3299 "legendFormat": "{{instance}}",
3303 "title": "Log size per Broker",
3304 "type": "timeseries"
3309 "type": "datasource",
3323 "type": "datasource",
3329 "title": "Producer Performance",
3334 "type": "prometheus",
3335 "uid": "PBFA97CFB590B2093"
3337 "description": "A high value can imply there aren't enough IO threads or the CPU is a bottleneck, or the request queue isn't large enough. The request queue size should match the number of connections.",
3341 "mode": "palette-classic"
3344 "axisCenteredZero": false,
3345 "axisColorMode": "text",
3347 "axisPlacement": "auto",
3349 "drawStyle": "line",
3351 "gradientMode": "none",
3357 "lineInterpolation": "linear",
3360 "scaleDistribution": {
3363 "showPoints": "never",
3369 "thresholdsStyle": {
3406 "displayMode": "list",
3407 "placement": "bottom",
3415 "pluginVersion": "8.1.3",
3419 "type": "prometheus",
3420 "uid": "PBFA97CFB590B2093"
3422 "expr": "kafka_network_requestmetrics_requestqueuetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Produce\"}",
3424 "legendFormat": "{{instance}} - {{quantile}}",
3428 "title": "Producer - RequestQueueTimeMs",
3429 "type": "timeseries"
3433 "type": "prometheus",
3434 "uid": "PBFA97CFB590B2093"
3436 "description": "In most cases, a high value can imply slow local storage or the storage is a bottleneck. One should also investigate LogFlushRateAndTimeMs to know how long page flushes are taking, which will also indicate a slow disk. In the case of FetchFollower requests, time spent in LocalTimeMs can be the result of a ZooKeeper write to change the ISR.",
3440 "mode": "palette-classic"
3443 "axisCenteredZero": false,
3444 "axisColorMode": "text",
3446 "axisPlacement": "auto",
3448 "drawStyle": "line",
3450 "gradientMode": "none",
3456 "lineInterpolation": "linear",
3459 "scaleDistribution": {
3462 "showPoints": "never",
3468 "thresholdsStyle": {
3505 "displayMode": "list",
3506 "placement": "bottom",
3514 "pluginVersion": "8.1.3",
3518 "type": "prometheus",
3519 "uid": "PBFA97CFB590B2093"
3521 "expr": "kafka_network_requestmetrics_localtimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Produce\"}",
3523 "legendFormat": "{{instance}} - {{quantile}}",
3527 "title": "Producer - LocalTimeMs",
3528 "type": "timeseries"
3532 "type": "prometheus",
3533 "uid": "PBFA97CFB590B2093"
3535 "description": "A high value can imply a slow network connection. For fetch request, if the remote time is high, it could be that there is not enough data to give in a fetch response. This can happen when the consumer or replica is caught up and there is no new incoming data. If this is the case, remote time will be close to the max wait time, which is normal. Max wait time is configured via replica.fetch.wait.max.ms and fetch.max.wait.ms.\n",
3539 "mode": "palette-classic"
3542 "axisCenteredZero": false,
3543 "axisColorMode": "text",
3545 "axisPlacement": "auto",
3547 "drawStyle": "line",
3549 "gradientMode": "none",
3555 "lineInterpolation": "linear",
3558 "scaleDistribution": {
3561 "showPoints": "never",
3567 "thresholdsStyle": {
3604 "displayMode": "table",
3605 "placement": "bottom",
3613 "pluginVersion": "8.1.3",
3617 "type": "prometheus",
3618 "uid": "PBFA97CFB590B2093"
3620 "expr": "kafka_network_requestmetrics_remotetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Produce\"}",
3622 "legendFormat": "{{instance}} - {{quantile}}",
3626 "title": "Producer - RemoteTimeMs",
3627 "type": "timeseries"
3631 "type": "prometheus",
3632 "uid": "PBFA97CFB590B2093"
3634 "description": "A high value can imply there aren't enough network threads or the network can't dequeue responses quickly enough, causing back pressure in the response queue.\n",
3638 "mode": "palette-classic"
3641 "axisCenteredZero": false,
3642 "axisColorMode": "text",
3644 "axisPlacement": "auto",
3646 "drawStyle": "line",
3648 "gradientMode": "none",
3654 "lineInterpolation": "linear",
3657 "scaleDistribution": {
3660 "showPoints": "never",
3666 "thresholdsStyle": {
3703 "displayMode": "table",
3704 "placement": "bottom",
3712 "pluginVersion": "8.1.3",
3716 "type": "prometheus",
3717 "uid": "PBFA97CFB590B2093"
3719 "expr": "kafka_network_requestmetrics_responsequeuetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Produce\"}",
3721 "legendFormat": "{{instance}} - {{quantile}}",
3725 "title": "Producer - ResponseQueueTimeMs",
3726 "type": "timeseries"
3730 "type": "prometheus",
3731 "uid": "PBFA97CFB590B2093"
3733 "description": "A high value can imply the zero-copy from disk to the network is slow, or the network is the bottleneck because the network can't dequeue responses of the TCP socket as quickly as they're being created. If the network buffer gets full, Kafka will block.\n",
3737 "mode": "palette-classic"
3740 "axisCenteredZero": false,
3741 "axisColorMode": "text",
3743 "axisPlacement": "auto",
3745 "drawStyle": "line",
3747 "gradientMode": "none",
3753 "lineInterpolation": "linear",
3756 "scaleDistribution": {
3759 "showPoints": "never",
3765 "thresholdsStyle": {
3803 "displayMode": "table",
3804 "placement": "bottom",
3812 "pluginVersion": "8.1.3",
3816 "type": "prometheus",
3817 "uid": "PBFA97CFB590B2093"
3819 "expr": "kafka_network_requestmetrics_responsesendtimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Produce\"}",
3821 "legendFormat": "{{instance}} - {{quantile}}",
3825 "title": "Producer - ResponseSendTimeMs",
3826 "type": "timeseries"
3831 "type": "datasource",
3844 "type": "prometheus",
3845 "uid": "PBFA97CFB590B2093"
3847 "description": "A high value can imply there aren't enough IO threads or the CPU is a bottleneck, or the request queue isn't large enough. The request queue size should match the number of connections.",
3851 "mode": "palette-classic"
3855 "axisPlacement": "auto",
3857 "drawStyle": "line",
3859 "gradientMode": "none",
3865 "lineInterpolation": "linear",
3868 "scaleDistribution": {
3871 "showPoints": "never",
3877 "thresholdsStyle": {
3914 "displayMode": "list",
3915 "placement": "bottom",
3922 "pluginVersion": "8.1.3",
3926 "type": "prometheus",
3927 "uid": "PBFA97CFB590B2093"
3929 "expr": "kafka_network_requestmetrics_requestqueuetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Fetch\"}",
3931 "legendFormat": "{{instance}} - {{quantile}}",
3935 "title": "Consumer - RequestQueueTimeMs",
3936 "type": "timeseries"
3940 "type": "prometheus",
3941 "uid": "PBFA97CFB590B2093"
3943 "description": "In most cases, a high value can imply slow local storage or the storage is a bottleneck. One should also investigate LogFlushRateAndTimeMs to know how long page flushes are taking, which will also indicate a slow disk. In the case of FetchFollower requests, time spent in LocalTimeMs can be the result of a ZooKeeper write to change the ISR.",
3947 "mode": "palette-classic"
3951 "axisPlacement": "auto",
3953 "drawStyle": "line",
3955 "gradientMode": "none",
3961 "lineInterpolation": "linear",
3964 "scaleDistribution": {
3967 "showPoints": "never",
3973 "thresholdsStyle": {
4009 "displayMode": "list",
4010 "placement": "bottom",
4017 "pluginVersion": "8.1.3",
4021 "type": "prometheus",
4022 "uid": "PBFA97CFB590B2093"
4024 "expr": "kafka_network_requestmetrics_localtimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Fetch\"}",
4026 "legendFormat": "{{instance}} - {{quantile}}",
4030 "title": "Consumer - LocalTimeMs",
4031 "type": "timeseries"
4035 "type": "prometheus",
4036 "uid": "PBFA97CFB590B2093"
4038 "description": "A high value can imply a slow network connection. For fetch requests, if the remote time is high, it could be that there is not enough data to give in a fetch response. This can happen when the consumer or replica is caught up and there is no new incoming data. If this is the case, remote time will be close to the max wait time, which is normal. Max wait time is configured via replica.fetch.wait.max.ms and fetch.max.wait.ms.\n",
4042 "mode": "palette-classic"
4046 "axisPlacement": "auto",
4048 "drawStyle": "line",
4050 "gradientMode": "none",
4056 "lineInterpolation": "linear",
4059 "scaleDistribution": {
4062 "showPoints": "never",
4068 "thresholdsStyle": {
4104 "displayMode": "table",
4105 "placement": "bottom",
4112 "pluginVersion": "8.1.3",
4116 "type": "prometheus",
4117 "uid": "PBFA97CFB590B2093"
4119 "expr": "kafka_network_requestmetrics_remotetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Fetch\"}",
4121 "legendFormat": "{{instance}} - {{quantile}}",
4125 "title": "Consumer - RemoteTimeMs",
4126 "type": "timeseries"
4130 "type": "prometheus",
4131 "uid": "PBFA97CFB590B2093"
4133 "description": "A high value can imply there aren't enough network threads or the network can't dequeue responses quickly enough, causing back pressure in the response queue.\n",
4137 "mode": "palette-classic"
4141 "axisPlacement": "auto",
4143 "drawStyle": "line",
4145 "gradientMode": "none",
4151 "lineInterpolation": "linear",
4154 "scaleDistribution": {
4157 "showPoints": "never",
4163 "thresholdsStyle": {
4200 "displayMode": "table",
4201 "placement": "bottom",
4208 "pluginVersion": "8.1.3",
4212 "type": "prometheus",
4213 "uid": "PBFA97CFB590B2093"
4215 "expr": "kafka_network_requestmetrics_responsequeuetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Fetch\"}",
4217 "legendFormat": "{{instance}} - {{quantile}}",
4221 "title": "Consumer - ResponseQueueTimeMs",
4222 "type": "timeseries"
4226 "type": "prometheus",
4227 "uid": "PBFA97CFB590B2093"
4229 "description": "A high value can imply the zero-copy from disk to the network is slow, or the network is the bottleneck because the network can't dequeue responses of the TCP socket as quickly as they're being created. If the network buffer gets full, Kafka will block.\n",
4233 "mode": "palette-classic"
4237 "axisPlacement": "auto",
4239 "drawStyle": "line",
4241 "gradientMode": "none",
4247 "lineInterpolation": "linear",
4250 "scaleDistribution": {
4253 "showPoints": "never",
4259 "thresholdsStyle": {
4296 "displayMode": "table",
4297 "placement": "bottom",
4304 "pluginVersion": "8.1.3",
4308 "type": "prometheus",
4309 "uid": "PBFA97CFB590B2093"
4311 "expr": "kafka_network_requestmetrics_responsesendtimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"Fetch\"}",
4313 "legendFormat": "{{instance}} - {{quantile}}",
4317 "title": "Consumer - ResponseSendTimeMs",
4318 "type": "timeseries"
4324 "type": "datasource",
4330 "title": "Consumer Performance",
4336 "type": "datasource",
4350 "type": "datasource",
4356 "title": "Fetch Follower Performance",
4361 "type": "prometheus",
4362 "uid": "PBFA97CFB590B2093"
4364 "description": "A high value can imply there aren't enough IO threads or the CPU is a bottleneck, or the request queue isn't large enough. The request queue size should match the number of connections.",
4368 "mode": "palette-classic"
4371 "axisCenteredZero": false,
4372 "axisColorMode": "text",
4374 "axisPlacement": "auto",
4376 "drawStyle": "line",
4378 "gradientMode": "none",
4384 "lineInterpolation": "linear",
4387 "scaleDistribution": {
4390 "showPoints": "never",
4396 "thresholdsStyle": {
4434 "displayMode": "list",
4435 "placement": "bottom",
4443 "pluginVersion": "8.1.3",
4447 "type": "prometheus",
4448 "uid": "PBFA97CFB590B2093"
4450 "expr": "kafka_network_requestmetrics_requestqueuetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"FetchFollower\"}",
4452 "legendFormat": "{{instance}} - {{quantile}}",
4456 "title": "FetchFollower - RequestQueueTimeMs",
4457 "type": "timeseries"
4461 "type": "prometheus",
4462 "uid": "PBFA97CFB590B2093"
4464 "description": "In most cases, a high value can imply slow local storage or the storage is a bottleneck. One should also investigate LogFlushRateAndTimeMs to know how long page flushes are taking, which will also indicate a slow disk. In the case of FetchFollower requests, time spent in LocalTimeMs can be the result of a ZooKeeper write to change the ISR.",
4468 "mode": "palette-classic"
4471 "axisCenteredZero": false,
4472 "axisColorMode": "text",
4474 "axisPlacement": "auto",
4476 "drawStyle": "line",
4478 "gradientMode": "none",
4484 "lineInterpolation": "linear",
4487 "scaleDistribution": {
4490 "showPoints": "never",
4496 "thresholdsStyle": {
4534 "displayMode": "list",
4535 "placement": "bottom",
4543 "pluginVersion": "8.1.3",
4547 "type": "prometheus",
4548 "uid": "PBFA97CFB590B2093"
4550 "expr": "kafka_network_requestmetrics_localtimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"FetchFollower\"}",
4552 "legendFormat": "{{instance}} - {{quantile}}",
4556 "title": "FetchFollower - LocalTimeMs",
4557 "type": "timeseries"
4561 "type": "prometheus",
4562 "uid": "PBFA97CFB590B2093"
4564 "description": "A high value can imply a slow network connection. For fetch requests, if the remote time is high, it could be that there is not enough data to give in a fetch response. This can happen when the consumer or replica is caught up and there is no new incoming data. If this is the case, remote time will be close to the max wait time, which is normal. Max wait time is configured via replica.fetch.wait.max.ms and fetch.max.wait.ms.\n",
4568 "mode": "palette-classic"
4571 "axisCenteredZero": false,
4572 "axisColorMode": "text",
4574 "axisPlacement": "auto",
4576 "drawStyle": "line",
4578 "gradientMode": "none",
4584 "lineInterpolation": "linear",
4587 "scaleDistribution": {
4590 "showPoints": "never",
4596 "thresholdsStyle": {
4633 "displayMode": "table",
4634 "placement": "bottom",
4642 "pluginVersion": "8.1.3",
4646 "type": "prometheus",
4647 "uid": "PBFA97CFB590B2093"
4649 "expr": "kafka_network_requestmetrics_remotetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"FetchFollower\"}",
4651 "legendFormat": "{{instance}} - {{quantile}}",
4655 "title": "FetchFollower - RemoteTimeMs",
4656 "type": "timeseries"
4660 "type": "prometheus",
4661 "uid": "PBFA97CFB590B2093"
4663 "description": "A high value can imply there aren't enough network threads or the network can't dequeue responses quickly enough, causing back pressure in the response queue.\n",
4667 "mode": "palette-classic"
4670 "axisCenteredZero": false,
4671 "axisColorMode": "text",
4673 "axisPlacement": "auto",
4675 "drawStyle": "line",
4677 "gradientMode": "none",
4683 "lineInterpolation": "linear",
4686 "scaleDistribution": {
4689 "showPoints": "never",
4695 "thresholdsStyle": {
4732 "displayMode": "table",
4733 "placement": "bottom",
4741 "pluginVersion": "8.1.3",
4745 "type": "prometheus",
4746 "uid": "PBFA97CFB590B2093"
4748 "expr": "kafka_network_requestmetrics_responsequeuetimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"FetchFollower\"}",
4750 "legendFormat": "{{instance}} - {{quantile}}",
4754 "title": "FetchFollower - ResponseQueueTimeMs",
4755 "type": "timeseries"
4759 "type": "prometheus",
4760 "uid": "PBFA97CFB590B2093"
4762 "description": "A high value can imply the zero-copy from disk to the network is slow, or the network is the bottleneck because the network can't dequeue responses of the TCP socket as quickly as they're being created. If the network buffer gets full, Kafka will block.\n",
4766 "mode": "palette-classic"
4769 "axisCenteredZero": false,
4770 "axisColorMode": "text",
4772 "axisPlacement": "auto",
4774 "drawStyle": "line",
4776 "gradientMode": "none",
4782 "lineInterpolation": "linear",
4785 "scaleDistribution": {
4788 "showPoints": "never",
4794 "thresholdsStyle": {
4832 "displayMode": "table",
4833 "placement": "bottom",
4841 "pluginVersion": "8.1.3",
4845 "type": "prometheus",
4846 "uid": "PBFA97CFB590B2093"
4848 "expr": "kafka_network_requestmetrics_responsesendtimems{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\",quantile=~\"$percentile\",request=\"FetchFollower\"}",
4850 "legendFormat": "{{instance}} - {{quantile}}",
4854 "title": "FetchFollower - ResponseSendTimeMs",
4855 "type": "timeseries"
4860 "type": "datasource",
4874 "type": "datasource",
4880 "title": "Connections",
4885 "type": "prometheus",
4886 "uid": "PBFA97CFB590B2093"
4891 "mode": "palette-classic"
4894 "axisCenteredZero": false,
4895 "axisColorMode": "text",
4897 "axisPlacement": "auto",
4899 "drawStyle": "line",
4901 "gradientMode": "none",
4907 "lineInterpolation": "linear",
4910 "scaleDistribution": {
4913 "showPoints": "never",
4919 "thresholdsStyle": {
4956 "displayMode": "table",
4957 "placement": "bottom",
4965 "pluginVersion": "8.1.3",
4969 "type": "prometheus",
4970 "uid": "PBFA97CFB590B2093"
4972 "expr": "sum(kafka_server_socketservermetrics_connection_count{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (listener)",
4974 "legendFormat": "{{listener}}",
4978 "title": "Connections count per listener",
4979 "type": "timeseries"
4983 "type": "prometheus",
4984 "uid": "PBFA97CFB590B2093"
4989 "mode": "palette-classic"
4992 "axisCenteredZero": false,
4993 "axisColorMode": "text",
4995 "axisPlacement": "auto",
4997 "drawStyle": "line",
4999 "gradientMode": "none",
5005 "lineInterpolation": "linear",
5008 "scaleDistribution": {
5011 "showPoints": "never",
5017 "thresholdsStyle": {
5054 "displayMode": "table",
5055 "placement": "bottom",
5063 "pluginVersion": "8.1.3",
5067 "type": "prometheus",
5068 "uid": "PBFA97CFB590B2093"
5070 "expr": "sum(kafka_server_socketservermetrics_connection_count{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (instance)",
5072 "legendFormat": "{{instance}}",
5076 "title": "Connections count per broker",
5077 "type": "timeseries"
5081 "type": "prometheus",
5082 "uid": "PBFA97CFB590B2093"
5087 "mode": "palette-classic"
5090 "axisCenteredZero": false,
5091 "axisColorMode": "text",
5093 "axisPlacement": "auto",
5095 "drawStyle": "line",
5097 "gradientMode": "none",
5103 "lineInterpolation": "linear",
5106 "scaleDistribution": {
5109 "showPoints": "never",
5115 "thresholdsStyle": {
5152 "displayMode": "table",
5153 "placement": "bottom",
5161 "pluginVersion": "8.1.3",
5165 "type": "prometheus",
5166 "uid": "PBFA97CFB590B2093"
5168 "expr": "sum(kafka_server_socketservermetrics_connection_creation_rate{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (listener)",
5170 "legendFormat": "{{listener}}",
5174 "title": "Connections creation rate per listener",
5175 "type": "timeseries"
5179 "type": "prometheus",
5180 "uid": "PBFA97CFB590B2093"
5185 "mode": "palette-classic"
5188 "axisCenteredZero": false,
5189 "axisColorMode": "text",
5191 "axisPlacement": "auto",
5193 "drawStyle": "line",
5195 "gradientMode": "none",
5201 "lineInterpolation": "linear",
5204 "scaleDistribution": {
5207 "showPoints": "never",
5213 "thresholdsStyle": {
5250 "displayMode": "table",
5251 "placement": "bottom",
5259 "pluginVersion": "8.1.3",
5263 "type": "prometheus",
5264 "uid": "PBFA97CFB590B2093"
5266 "expr": "sum(kafka_server_socketservermetrics_connection_creation_rate{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (instance)",
5268 "legendFormat": "{{instance}}",
5272 "title": "Connections creation rate per instance",
5273 "type": "timeseries"
5277 "type": "prometheus",
5278 "uid": "PBFA97CFB590B2093"
5283 "mode": "palette-classic"
5286 "axisCenteredZero": false,
5287 "axisColorMode": "text",
5289 "axisPlacement": "auto",
5291 "drawStyle": "line",
5293 "gradientMode": "none",
5299 "lineInterpolation": "linear",
5302 "scaleDistribution": {
5305 "showPoints": "never",
5311 "thresholdsStyle": {
5348 "displayMode": "table",
5349 "placement": "bottom",
5357 "pluginVersion": "8.1.3",
5361 "type": "prometheus",
5362 "uid": "PBFA97CFB590B2093"
5364 "expr": "sum(kafka_server_socketservermetrics_connection_close_rate{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (listener)",
5366 "legendFormat": "{{listener}}",
5370 "title": "Connections close rate per listener",
5371 "type": "timeseries"
5375 "type": "prometheus",
5376 "uid": "PBFA97CFB590B2093"
5381 "mode": "palette-classic"
5384 "axisCenteredZero": false,
5385 "axisColorMode": "text",
5387 "axisPlacement": "auto",
5389 "drawStyle": "line",
5391 "gradientMode": "none",
5397 "lineInterpolation": "linear",
5400 "scaleDistribution": {
5403 "showPoints": "never",
5409 "thresholdsStyle": {
5446 "displayMode": "table",
5447 "placement": "bottom",
5455 "pluginVersion": "8.1.3",
5459 "type": "prometheus",
5460 "uid": "PBFA97CFB590B2093"
5462 "expr": "sum(kafka_server_socketservermetrics_connection_close_rate{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (instance)",
5464 "legendFormat": "{{instance}}",
5468 "title": "Connections close rate per instance",
5469 "type": "timeseries"
5473 "type": "prometheus",
5474 "uid": "PBFA97CFB590B2093"
5476 "description": "Tracks the amount of time Acceptor is blocked from accepting connections. See KIP-402 for more details.",
5480 "mode": "palette-classic"
5483 "axisCenteredZero": false,
5484 "axisColorMode": "text",
5486 "axisPlacement": "auto",
5488 "drawStyle": "line",
5490 "gradientMode": "none",
5496 "lineInterpolation": "linear",
5499 "scaleDistribution": {
5502 "showPoints": "never",
5508 "thresholdsStyle": {
5546 "displayMode": "table",
5547 "placement": "bottom",
5555 "pluginVersion": "8.1.3",
5559 "type": "prometheus",
5560 "uid": "PBFA97CFB590B2093"
5562 "expr": "kafka_network_acceptor_acceptorblockedpercent{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}",
5564 "legendFormat": "{{instance}} - {{listener}}",
5568 "title": "Acceptor Blocked Percentage",
5569 "type": "timeseries"
5573 "type": "prometheus",
5574 "uid": "PBFA97CFB590B2093"
5579 "mode": "palette-classic"
5582 "axisCenteredZero": false,
5583 "axisColorMode": "text",
5585 "axisPlacement": "auto",
5587 "drawStyle": "line",
5589 "gradientMode": "none",
5595 "lineInterpolation": "linear",
5598 "scaleDistribution": {
5601 "showPoints": "never",
5607 "thresholdsStyle": {
5644 "displayMode": "table",
5645 "placement": "bottom",
5653 "pluginVersion": "8.1.3",
5657 "type": "prometheus",
5658 "uid": "PBFA97CFB590B2093"
5660 "expr": "sum(kafka_server_socketservermetrics_connections{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (client_software_name, client_software_version)",
5662 "legendFormat": "{{client_software_name}} {{client_software_version}}",
5666 "title": "Connections per client version",
5667 "type": "timeseries"
5672 "type": "datasource",
5686 "type": "datasource",
5692 "title": "Group Coordinator",
5697 "type": "prometheus",
5698 "uid": "PBFA97CFB590B2093"
5700 "description": "Number of consumer groups per group coordinator",
5704 "mode": "palette-classic"
5707 "axisCenteredZero": false,
5708 "axisColorMode": "text",
5710 "axisPlacement": "auto",
5712 "drawStyle": "line",
5714 "gradientMode": "none",
5720 "lineInterpolation": "linear",
5723 "scaleDistribution": {
5726 "showPoints": "never",
5732 "thresholdsStyle": {
5769 "displayMode": "table",
5770 "placement": "bottom",
5778 "pluginVersion": "8.1.3",
5782 "type": "prometheus",
5783 "uid": "PBFA97CFB590B2093"
5785 "expr": "kafka_coordinator_group_groupmetadatamanager_numgroups{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}",
5788 "legendFormat": "{{instance}}",
5792 "title": "Consumer groups number per coordinator",
5793 "type": "timeseries"
5797 "type": "prometheus",
5798 "uid": "PBFA97CFB590B2093"
5800 "description": "Number of consumer groups per state",
5804 "mode": "palette-classic"
5807 "axisCenteredZero": false,
5808 "axisColorMode": "text",
5810 "axisPlacement": "auto",
5812 "drawStyle": "line",
5814 "gradientMode": "none",
5820 "lineInterpolation": "linear",
5823 "scaleDistribution": {
5826 "showPoints": "never",
5832 "thresholdsStyle": {
5869 "displayMode": "table",
5870 "placement": "bottom",
5878 "pluginVersion": "8.1.3",
5882 "type": "prometheus",
5883 "uid": "PBFA97CFB590B2093"
5885 "expr": "sum(kafka_coordinator_group_groupmetadatamanager_numgroupsstable{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"})",
5888 "legendFormat": "stable",
5893 "type": "prometheus",
5894 "uid": "PBFA97CFB590B2093"
5896 "expr": "sum(kafka_coordinator_group_groupmetadatamanager_numgroupspreparingrebalance{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"})",
5898 "legendFormat": "preparing-rebalance",
5903 "type": "prometheus",
5904 "uid": "PBFA97CFB590B2093"
5906 "expr": "sum(kafka_coordinator_group_groupmetadatamanager_numgroupsdead{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"})",
5908 "legendFormat": "dead",
5913 "type": "prometheus",
5914 "uid": "PBFA97CFB590B2093"
5916 "expr": "sum(kafka_coordinator_group_groupmetadatamanager_numgroupscompletingrebalance{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"})",
5918 "legendFormat": "completing-rebalance",
5923 "type": "prometheus",
5924 "uid": "PBFA97CFB590B2093"
5926 "expr": "sum(kafka_coordinator_group_groupmetadatamanager_numgroupsempty{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"})",
5928 "legendFormat": "empty",
5932 "title": "Number of consumer groups per state",
5933 "type": "timeseries"
5938 "type": "datasource",
5952 "type": "datasource",
5958 "title": "Message Conversion",
5963 "type": "prometheus",
5964 "uid": "PBFA97CFB590B2093"
5966 "description": "The number of messages produced converted to match the log.message.format.version.",
5970 "mode": "palette-classic"
5973 "axisCenteredZero": false,
5974 "axisColorMode": "text",
5976 "axisPlacement": "auto",
5978 "drawStyle": "line",
5980 "gradientMode": "none",
5986 "lineInterpolation": "linear",
5989 "scaleDistribution": {
5992 "showPoints": "never",
5998 "thresholdsStyle": {
6036 "displayMode": "list",
6037 "placement": "bottom",
6045 "pluginVersion": "8.1.3",
6049 "type": "prometheus",
6050 "uid": "PBFA97CFB590B2093"
6052 "expr": "sum(kafka_server_brokertopicmetrics_producemessageconversionspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
6055 "legendFormat": "{{topic}}",
6059 "title": "Number of produced message conversion",
6060 "type": "timeseries"
6064 "type": "prometheus",
6065 "uid": "PBFA97CFB590B2093"
6067 "description": "The number of messages consumed converted at consumer to match the log.message.format.version.",
6071 "mode": "palette-classic"
6074 "axisCenteredZero": false,
6075 "axisColorMode": "text",
6077 "axisPlacement": "auto",
6079 "drawStyle": "line",
6081 "gradientMode": "none",
6087 "lineInterpolation": "linear",
6090 "scaleDistribution": {
6093 "showPoints": "never",
6099 "thresholdsStyle": {
6137 "displayMode": "list",
6138 "placement": "bottom",
6146 "pluginVersion": "8.1.3",
6150 "type": "prometheus",
6151 "uid": "PBFA97CFB590B2093"
6153 "expr": "sum(kafka_server_brokertopicmetrics_fetchmessageconversionspersec{job=\"kafka-broker\",env=\"$env\",instance=~\"$instance\"})",
6156 "legendFormat": "{{topic}}",
6160 "title": "Number of consumed message conversion",
6161 "type": "timeseries"
6165 "type": "datasource",
6168 "description": "Number of connections per client version",
6172 "mode": "palette-classic"
6198 "displayMode": "table",
6199 "placement": "bottom",
6221 "type": "datasource",
6224 "expr": "sum(kafka_server_socketservermetrics_connections{job=\"kafka-broker\", env=\"$env\", instance=~\"$instance\"}) by (client_software_name, client_software_version) ",
6226 "legendFormat": "{{client_software_name}} - {{client_software_version}}",
6230 "title": "Client version repartition",
6235 "schemaVersion": 38,
6247 "type": "prometheus",
6248 "uid": "PBFA97CFB590B2093"
6250 "definition": "label_values(env)",
6252 "includeAll": false,
6253 "label": "Environment",
6258 "query": "label_values(env)",
6259 "refId": "Prometheus-env-Variable-Query"
6263 "skipUrlSync": false,
6265 "tagValuesQuery": "",
6281 "type": "prometheus",
6282 "uid": "PBFA97CFB590B2093"
6284 "definition": "label_values(kafka_server_kafkaserver_brokerstate{env=\"${env}\"}, instance)",
6287 "label": "Instance",
6292 "query": "label_values(kafka_server_kafkaserver_brokerstate{env=\"${env}\"}, instance)",
6293 "refId": "Prometheus-instance-Variable-Query"
6297 "skipUrlSync": false,
6299 "tagValuesQuery": "",
6316 "type": "prometheus",
6317 "uid": "PBFA97CFB590B2093"
6319 "definition": "label_values(quantile)",
6322 "label": "Percentile",
6324 "name": "percentile",
6327 "query": "label_values(quantile)",
6328 "refId": "Prometheus-percentile-Variable-Query"
6332 "skipUrlSync": false,
6334 "tagValuesQuery": "",
6346 "refresh_intervals": [
6370 "timezone": "browser",
6371 "title": "Kafka cluster",