From: Amos Kong <am...@scylladb.com>
Committer: Amos Kong <am...@scylladb.com>
Branch: master
data_dir: update master dashboard
Signed-off-by: Amos Kong <am...@scylladb.com>
---
diff --git a/data_dir/scylla-dash-io-per-server.master.json b/data_dir/scylla-dash-io-per-server.master.json
--- a/data_dir/scylla-dash-io-per-server.master.json
+++ b/data_dir/scylla-dash-io-per-server.master.json
@@ -101,7 +101,7 @@
{
"expr": "count(up{job=\"scylla\"})",
"intervalFactor": 1,
- "legendFormat": "",
+ "legendFormat": "Total Nodes",
"refId": "A",
"step": 240
}
@@ -180,14 +180,15 @@
},
"targets": [
{
- "expr": "count(up{job=\"scylla\"})-count(scylla_memory_free_operations{shard=\"0\"})",
+ "expr": "count(scrape_samples_scraped{job=\"scylla\"}==0) OR vector(0)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Unreachable Nodes",
"step": 120
}
],
"thresholds": "1,2",
- "title": "Dead Nodes",
+ "title": "Unreachable Nodes",
"transparent": true,
"type": "singlestat",
"valueFontSize": "150%",
@@ -267,6 +268,7 @@
"expr": "sum(irate(scylla_transport_requests_served{}[30s])) + sum(irate(scylla_thrift_served{}[30s]))",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Total Requests",
"step": 30
}
],
@@ -379,6 +381,7 @@
"expr": "avg(scylla_reactor_utilization{} ) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Load per Server",
"step": 30
}
],
@@ -461,6 +464,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Requests Served per Server",
"step": 30
}
],
@@ -625,7 +629,7 @@
{
"expr": "irate(node_disk_writes_completed{device=\"$monitor_disk\"}[30s])",
"intervalFactor": 1,
- "legendFormat": "",
+ "legendFormat": "Disk Writes per Server per Second",
"metric": "",
"refId": "A",
"step": 20
@@ -708,6 +712,7 @@
"expr": "irate(node_disk_reads_completed{device=\"$monitor_disk\"}[30s])",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Disk Reads per Server per Second",
"step": 20
}
],
@@ -797,6 +802,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Disk Writes Bps per Server",
"step": 20
}
],
@@ -877,6 +883,7 @@
"expr": "irate(node_disk_bytes_read{device=\"$monitor_disk\"}[30s])",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Disk Read Bps per Server",
"step": 20
}
],
@@ -993,6 +1000,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Compactions I/O Queue delay",
"step": 30
}
],
@@ -1075,6 +1083,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Compactions I/O Queue bandwidth",
"step": 30
}
],
@@ -1157,6 +1166,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Compactions I/O Queue IOPS",
"step": 30
}
],
@@ -1239,6 +1249,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Query I/O Queue delay",
"step": 30
}
],
@@ -1321,6 +1332,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Query I/O Queue bandwidth",
"step": 30
}
],
@@ -1403,6 +1415,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Query I/O Queue IOPS",
"step": 30
}
],
@@ -1486,6 +1499,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Commitlog I/O Queue delay",
"step": 30
}
],
@@ -1568,6 +1582,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Commitlog I/O Queue bandwidth",
"step": 30
}
],
@@ -1650,6 +1665,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Commitlog I/O Queue IOPS",
"step": 30
}
],
@@ -1732,6 +1748,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Memtable Flush I/O Queue delay",
"step": 30
}
],
@@ -1814,6 +1831,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Memtable Flush I/O Queue bandwidth",
"step": 30
}
],
@@ -1896,6 +1914,7 @@
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Memtable Flush I/O Queue IOPS",
"step": 30
}
],
@@ -1974,10 +1993,11 @@
"steppedLine": false,
"targets": [
{
- "expr": "1000000*max(scylla_io_queue_delay_streaming_read{}) by (instance)",
+ "expr": "1000000*max(scylla_io_queue_streaming_read_delay{}) by (instance)",
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Streaming Reads I/O Queue delay",
"step": 30
}
],
@@ -2056,10 +2076,11 @@
"steppedLine": false,
"targets": [
{
- "expr": "sum(irate(scylla_io_queue_derive_streaming_read{}[30s])) by (instance)",
+ "expr": "sum(irate(scylla_io_queue_streaming_read_delay{}[30s])) by (instance)",
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Streaming Reads I/O Queue bandwidth",
"step": 30
}
],
@@ -2138,10 +2159,11 @@
"steppedLine": false,
"targets": [
{
- "expr": "sum(irate(scylla_io_queue_total_operations_streaming_read{}[30s])) by (instance)",
+ "expr": "sum(irate(scylla_io_queue_streaming_read_total_operations{}[30s])) by (instance)",
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Streaming Reads I/O Queue IOPS",
"step": 30
}
],
@@ -2220,10 +2242,11 @@
"steppedLine": false,
"targets": [
{
- "expr": "1000000*max(scylla_io_queue_delay_streaming_write{}) by (instance)",
+ "expr": "1000000*max(scylla_io_queue_streaming_write_delay{}) by (instance)",
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Streaming Writes I/O Queue delay",
"step": 30
}
],
@@ -2302,10 +2325,11 @@
"steppedLine": false,
"targets": [
{
- "expr": "sum(irate(scylla_io_queue_derive_streaming_write{}[30s])) by (instance)",
+ "expr": "sum(irate(scylla_io_queue_streaming_write_delay{}[30s])) by (instance)",
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Streaming Writes I/O Queue bandwidth",
"step": 30
}
],
@@ -2384,10 +2408,11 @@
"steppedLine": false,
"targets": [
{
- "expr": "sum(irate(scylla_io_queue_total_operations_streaming_write{}[30s])) by (instance)",
+ "expr": "sum(irate(scylla_io_queue_streaming_write_total_operations{}[30s])) by (instance)",
"intervalFactor": 1,
"metric": "seastar_io_queue_delay",
"refId": "A",
+ "legendFormat": "Streaming Writes I/O Queue IOPS",
"step": 30
}
],
diff --git a/data_dir/scylla-dash-per-server.master.json b/data_dir/scylla-dash-per-server.master.json
--- a/data_dir/scylla-dash-per-server.master.json
+++ b/data_dir/scylla-dash-per-server.master.json
@@ -101,7 +101,7 @@
{
"expr": "count(up{job=\"scylla\"})",
"intervalFactor": 1,
- "legendFormat": "",
+ "legendFormat": "Total Nodes",
"refId": "A",
"step": 1
}
@@ -180,14 +180,15 @@
},
"targets": [
{
- "expr": "count(up{job=\"scylla\"})-count(scylla_memory_free_operations{shard=\"0\"})",
+ "legendFormat": "Unreachable Nodes",
+ "expr": "count(scrape_samples_scraped{job=\"scylla\"}==0) OR vector(0)",
"intervalFactor": 1,
"refId": "A",
"step": 1
}
],
"thresholds": "1,2",
- "title": "Dead Nodes",
+ "title": "Unreachable Nodes",
"transparent": true,
"type": "singlestat",
"valueFontSize": "150%",
@@ -267,6 +268,7 @@
"expr": "sum(irate(scylla_transport_requests_served{}[30s])) + sum(irate(scylla_thrift_served{}[30s]))",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Total Requests",
"step": 1
}
],
@@ -379,6 +381,7 @@
"expr": "avg(scylla_reactor_utilization{} ) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Load per Server",
"step": 1
}
],
@@ -461,6 +464,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Requests Served per Server",
"step": 1
}
],
@@ -649,6 +653,7 @@
"expr": "sum(scylla_storage_proxy_coordinator_foreground_writes{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Foreground Writes per Server",
"step": 1
}
],
@@ -730,6 +735,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Foreground Reads per Server",
"step": 1
}
],
@@ -810,6 +816,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_write_timeouts{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Write Timeouts per Second per Server",
"step": 1
}
],
@@ -890,6 +897,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_write_unavailable{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Write Unavailable per Second per Server",
"step": 1
}
],
@@ -978,6 +986,7 @@
"expr": "sum(scylla_storage_proxy_coordinator_background_writes{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Background Writes per Server",
"step": 1
}
],
@@ -1058,6 +1067,7 @@
"expr": "sum(scylla_storage_proxy_coordinator_background_reads{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Background Reads per Server",
"step": 4
}
],
@@ -1138,6 +1148,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_read_timeouts{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Read Timeouts per Second per Server",
"step": 1
}
],
@@ -1218,6 +1229,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_read_unavailable{}[30s])) by (instance)",
"intervalFactor": 1,
"metric": "",
+ "legendFormat": "Read Unavailable per Second per Server",
"refId": "A",
"step": 4
}
@@ -1326,6 +1338,7 @@
"expr": "sum(irate(scylla_database_total_reads{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Reads",
"step": 1
}
],
@@ -1407,6 +1420,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Writes",
"step": 1
}
],
@@ -1487,6 +1501,7 @@
"expr": "sum(scylla_database_active_reads{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Active sstable reads",
"step": 1
}
],
@@ -1567,6 +1582,7 @@
"expr": "sum(scylla_database_queued_reads{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Queued sstable reads",
"step": 1
}
],
@@ -1647,6 +1663,7 @@
"expr": "sum(scylla_database_requests_blocked_memory{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Writes currently blocked on dirty",
"step": 1
}
],
@@ -1727,6 +1744,7 @@
"expr": "sum(scylla_commitlog_pending_allocations{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Writes currently blocked on commitlog",
"step": 1
}
],
@@ -1822,6 +1840,7 @@
"expr": "sum(irate(scylla_database_total_reads_failed{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Reads failed",
"step": 1
}
],
@@ -1902,6 +1921,7 @@
"expr": "sum(irate(scylla_database_requests_blocked_memory{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Writes blocked on dirty",
"step": 1
}
],
@@ -1982,6 +2002,7 @@
"expr": "sum(irate(scylla_commitlog_requests_blocked_memory{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Writes blocked on commitlog",
"step": 1
}
],
@@ -2092,6 +2113,7 @@
"expr": "sum(irate(scylla_database_total_writes_failed{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Writes failed",
"step": 1
}
],
@@ -2172,6 +2194,7 @@
"expr": "sum(irate(scylla_database_total_writes_timedout{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Writes timed out",
"step": 1
}
],
@@ -2303,7 +2326,7 @@
{
"expr": "irate(node_disk_writes_completed{device=\"$monitor_disk\"}[30s])",
"intervalFactor": 1,
- "legendFormat": "",
+ "legendFormat": "Disk Writes per Server per Second",
"metric": "",
"refId": "A",
"step": 1
@@ -2386,6 +2409,7 @@
"expr": "irate(node_disk_reads_completed{device=\"$monitor_disk\"}[30s])",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Disk Reads per Server per Second",
"step": 1
}
],
@@ -2466,6 +2490,7 @@
"expr": "sum(irate(scylla_cache_hits{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Hits",
"step": 1
}
],
@@ -2546,6 +2571,7 @@
"expr": "sum(irate(scylla_cache_misses{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Misses",
"step": 1
}
],
@@ -2635,6 +2661,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Disk Writes Bps per Server",
"step": 1
}
],
@@ -2715,6 +2742,7 @@
"expr": "irate(node_disk_bytes_read{device=\"$monitor_disk\"}[30s])",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Disk Read Bps per Server",
"step": 1
}
],
@@ -2795,6 +2823,7 @@
"expr": "sum(irate(scylla_cache_insertions{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Insertions",
"step": 1
}
],
@@ -2875,6 +2904,7 @@
"expr": "sum(irate(scylla_cache_evictions{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Evictions",
"step": 1
}
],
@@ -2970,6 +3000,7 @@
"expr": "sum(irate(scylla_cache_merges{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Merges",
"step": 1
}
],
@@ -3050,6 +3081,7 @@
"expr": "sum(irate(scylla_cache_removals{}[30s])) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Removals",
"step": 1
}
],
@@ -3145,6 +3177,7 @@
"expr": "sum(scylla_cache_partitions{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Partitions",
"step": 1
}
],
@@ -3225,6 +3258,7 @@
"expr": "sum(scylla_cache_total{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Total Bytes",
"step": 1
}
],
@@ -3339,6 +3373,7 @@
"expr": "sum(scylla_lsa_total_space_bytes{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "LSA total memory",
"step": 1
}
],
@@ -3419,6 +3454,7 @@
"expr": "sum(scylla_lsa_non_lsa_used_space_bytes{}) by (instance)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Non-LSA used memory",
"step": 1
}
],
@@ -3534,6 +3570,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Interface Rx Packets",
"step": 1
}
],
@@ -3615,6 +3652,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Interface Tx Packets",
"step": 1
}
],
@@ -3704,6 +3742,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Interface Rx Bps",
"step": 1
}
],
@@ -3785,6 +3824,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Interface Tx Bps",
"step": 1
}
],
@@ -3900,6 +3940,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Running Compactions",
"step": 1
}
],
diff --git a/data_dir/scylla-dash.master.json b/data_dir/scylla-dash.master.json
--- a/data_dir/scylla-dash.master.json
+++ b/data_dir/scylla-dash.master.json
@@ -84,7 +84,7 @@
{
"expr": "count(up{job=\"scylla\"})",
"intervalFactor": 1,
- "legendFormat": "",
+ "legendFormat": "Total Nodes",
"refId": "A",
"step": 40
}
@@ -145,14 +145,15 @@
},
"targets": [
{
- "expr": "count(up{job=\"scylla\"})-count(scylla_memory_free_operations{shard=\"0\"})",
+ "expr": "count(scrape_samples_scraped{job=\"scylla\"}==0) OR vector(0)",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Unreachable Nodes",
"step": 20
}
],
"thresholds": "1,2",
- "title": "Dead Nodes",
+ "title": "Unreachable Nodes",
"transparent": true,
"type": "singlestat",
"valueFontSize": "150%",
@@ -261,6 +262,7 @@
"expr": "avg(scylla_reactor_utilization{} ) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Load",
"step": 4
}
],
@@ -342,6 +344,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Requests Served",
"step": 4
}
],
@@ -407,6 +410,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Total Storage",
"step": 1200
},
{
@@ -519,6 +523,7 @@
"expr": "sum(scylla_storage_proxy_coordinator_foreground_writes{}) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Foreground Writes",
"step": 10
}
],
@@ -599,6 +604,7 @@
"intervalFactor": 1,
"metric": "",
"refId": "A",
+ "legendFormat": "Foreground Reads",
"step": 10
}
],
@@ -678,6 +684,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_write_timeouts{}[30s])) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Write Timeouts per Second",
"step": 10
}
],
@@ -757,6 +764,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_write_unavailable{}[30s])) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Write Unavailable per Second",
"step": 10
}
],
@@ -844,6 +852,7 @@
"expr": "sum(scylla_storage_proxy_coordinator_background_writes{}) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Background Writes",
"step": 10
}
],
@@ -923,6 +932,7 @@
"expr": "sum(scylla_storage_proxy_coordinator_background_reads{}) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Background Reads",
"step": 10
}
],
@@ -1002,6 +1012,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_read_timeouts{}[30s])) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Read Timeouts per Second",
"step": 10
}
],
@@ -1081,6 +1092,7 @@
"expr": "sum(irate(scylla_storage_proxy_coordinator_read_unavailable{}[30s])) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Read Unavailable per Second",
"step": 10
}
],
@@ -1194,6 +1206,7 @@
"expr": "sum(irate(scylla_cache_hits{}[30s])) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Hits",
"step": 10
}
],
@@ -1273,6 +1286,7 @@
"expr": "sum(irate(scylla_cache_misses{}[30s])) ",
"intervalFactor": 1,
"refId": "A",
+ "legendFormat": "Cache Misses",
"step": 10
}
],