From 032a44e6bf195f98b36990d9940ac2aa213abd4e Mon Sep 17 00:00:00 2001 From: pancho horrillo Date: Mon, 8 Apr 2019 16:12:00 +0200 Subject: [PATCH] AWS deploy: organize RocksDB dashboard a bit better MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: Álvaro Alda --- .../files/grafana/dashboards/RocksDB.json | 481 ++++++------------ 1 file changed, 166 insertions(+), 315 deletions(-) diff --git a/deploy/aws/provision/files/grafana/dashboards/RocksDB.json b/deploy/aws/provision/files/grafana/dashboards/RocksDB.json index 1f26639ef..3a564386d 100644 --- a/deploy/aws/provision/files/grafana/dashboards/RocksDB.json +++ b/deploy/aws/provision/files/grafana/dashboards/RocksDB.json @@ -15,111 +15,21 @@ "editable": true, "gnetId": null, "graphTooltip": 2, - "id": 7, - "iteration": 1554727786862, + "iteration": 1554731702959, "links": [], "panels": [ { - "aliasColors": {}, - "bars": false, - "dashLength": 10, - "dashes": false, - "fill": 1, + "collapsed": false, "gridPos": { - "h": 9, - "w": 12, + "h": 1, + "w": 24, "x": 0, "y": 0 }, - "id": 3, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [ - { - "dashboard": "Cache Data, Filter, Index", - "includeVars": true, - "params": "", - "targetBlank": true, - "title": "Cache Data, Filter, Index", - "type": "dashboard", - "url": "/d/gD89ti6mZ/cache-data-filter-index" - } - ], - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 2, - "points": false, - "renderer": "flot", - "seriesOverrides": [], - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(qed_[[instance]]_block_cache_hit) by (job)", - "format": "time_series", - "interval": "", - "intervalFactor": 1, - "legendFormat": "hit_{{job}}", - "refId": "A" - }, - { - "expr": "sum(qed_[[instance]]_block_cache_miss) by (job)", - "format": 
"time_series", - "intervalFactor": 1, - "legendFormat": "miss_{{job}}", - "refId": "B" - } - ], - "thresholds": [], - "timeFrom": null, - "timeRegions": [], - "timeShift": null, - "title": "Block cache hits and misses", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": "time", - "name": null, - "show": true, - "values": [] - }, - "yaxes": [ - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": "0", - "show": true - }, - { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ], - "yaxis": { - "align": false, - "alignLevel": null - } + "id": 26, + "panels": [], + "title": "Block cache", + "type": "row" }, { "aliasColors": {}, @@ -130,10 +40,10 @@ "gridPos": { "h": 9, "w": 12, - "x": 12, - "y": 0 + "x": 6, + "y": 1 }, - "id": 6, + "id": 11, "legend": { "avg": false, "current": false, @@ -159,38 +69,29 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_filter_useful) by (job)", + "expr": "sum(qed_[[instance]]_block_cache_memory_usage) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "useful{{job}}", + "legendFormat": "bytes{{job}}", "refId": "A" }, { - "expr": "sum(qed_[[instance]]_filter_full_positive) by (job)", + "expr": "sum(qed_[[instance]]_block_cache_pinned_memory_usage) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "full_positive{job}}", + "legendFormat": "bytes_pinned{{job}}", "refId": "B" - }, - { - "expr": "sum(qed_[[instance]]_filter_full_true_positive) by (job)", - "format": "time_series", - "hide": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "full_true_positive{job}}", - "refId": "C" } ], "thresholds": [], "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "Block cache bloom filter effectiveness", + "title": 
"Block cache memory usage", "tooltip": { "shared": true, "sort": 0, @@ -237,14 +138,12 @@ "h": 9, "w": 12, "x": 0, - "y": 9 + "y": 10 }, - "id": 4, + "id": 3, "legend": { "avg": false, "current": false, - "hideEmpty": true, - "hideZero": true, "max": false, "min": false, "show": true, @@ -253,7 +152,17 @@ }, "lines": true, "linewidth": 1, - "links": [], + "links": [ + { + "dashboard": "Cache Data, Filter, Index", + "includeVars": true, + "params": "", + "targetBlank": true, + "title": "Cache Data, Filter, Index", + "type": "dashboard", + "url": "/d/gD89ti6mZ/cache-data-filter-index" + } + ], "nullPointMode": "null", "paceLength": 10, "percentage": false, @@ -265,18 +174,16 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_block_cache_add) by (job)", + "expr": "sum(qed_[[instance]]_block_cache_hit) by (job)", "format": "time_series", - "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "add_{{job}}", + "legendFormat": "hit_{{job}}", "refId": "A" }, { - "expr": "sum(qed_[[instance]]_block_cache_add_failures) by (job)", + "expr": "sum(qed_[[instance]]_block_cache_miss) by (job)", "format": "time_series", - "hide": false, "intervalFactor": 1, "legendFormat": "miss_{{job}}", "refId": "B" @@ -286,7 +193,7 @@ "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "Block cache add and add failures", + "title": "Block cache hits and misses", "tooltip": { "shared": true, "sort": 0, @@ -333,9 +240,9 @@ "h": 9, "w": 12, "x": 12, - "y": 9 + "y": 10 }, - "id": 11, + "id": 4, "legend": { "avg": false, "current": false, @@ -361,21 +268,20 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_block_cache_memory_usage) by (job)", + "expr": "sum(qed_[[instance]]_block_cache_add) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "bytes{{job}}", + "legendFormat": "add_{{job}}", "refId": "A" }, { - "expr": "sum(qed_[[instance]]_block_cache_pinned_memory_usage) 
by (job)", + "expr": "sum(qed_[[instance]]_block_cache_add_failures) by (job)", "format": "time_series", "hide": false, - "interval": "", "intervalFactor": 1, - "legendFormat": "bytes_pinned{{job}}", + "legendFormat": "add_failures_{{job}}", "refId": "B" } ], @@ -383,7 +289,7 @@ "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "Block cache memory usage", + "title": "Block cache add and add failures", "tooltip": { "shared": true, "sort": 0, @@ -430,7 +336,7 @@ "h": 9, "w": 12, "x": 0, - "y": 18 + "y": 19 }, "id": 5, "legend": { @@ -527,9 +433,9 @@ "h": 9, "w": 12, "x": 12, - "y": 18 + "y": 19 }, - "id": 7, + "id": 6, "legend": { "avg": false, "current": false, @@ -555,29 +461,38 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_memtable_hit) by (job)", + "expr": "sum(qed_[[instance]]_filter_useful) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "hit{{job}}", + "legendFormat": "useful{{job}}", "refId": "A" }, { - "expr": "sum(qed_[[instance]]_memtable_miss) by (job)", + "expr": "sum(qed_[[instance]]_filter_full_positive) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "miss{{job}}", + "legendFormat": "full_positive{{job}}", "refId": "B" + }, + { + "expr": "sum(qed_[[instance]]_filter_full_true_positive) by (job)", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "full_true_positive{{job}}", + "refId": "C" } ], "thresholds": [], "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "Memtable hits and misses", + "title": "Block cache bloom filter effectiveness", "tooltip": { "shared": true, "sort": 0, @@ -614,6 +529,19 @@ "alignLevel": null } }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 28 + }, + "id": 24, + "panels": [], + "title": "Read/Write Activity", + "type": "row" + }, { "aliasColors": {}, "bars": false, @@ -624,7
+552,7 @@ "h": 9, "w": 12, "x": 0, - "y": 27 + "y": 29 }, "id": 9, "legend": { @@ -730,9 +658,9 @@ "h": 9, "w": 12, "x": 12, - "y": 27 + "y": 29 }, - "id": 8, + "id": 7, "legend": { "avg": false, "current": false, @@ -758,38 +686,29 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_get_hits_l0) by (job)", + "expr": "sum(qed_[[instance]]_memtable_hit) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "hit_l0{{job}}", + "legendFormat": "hit{{job}}", "refId": "A" }, { - "expr": "sum(qed_[[instance]]_get_hits_l1) by (job)", + "expr": "sum(qed_[[instance]]_memtable_miss) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "hit_l1{{job}}", + "legendFormat": "miss{{job}}", "refId": "B" - }, - { - "expr": "sum(qed_[[instance]]_get_hits_l2_up) by (job)", - "format": "time_series", - "hide": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "hit_l2_and_up{{job}}", - "refId": "C" } ], "thresholds": [], "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "Get hits per level", + "title": "Memtable hits and misses", "tooltip": { "shared": true, "sort": 0, @@ -835,10 +754,10 @@ "gridPos": { "h": 9, "w": 12, - "x": 0, - "y": 36 + "x": 6, + "y": 38 }, - "id": 10, + "id": 8, "legend": { "avg": false, "current": false, @@ -864,112 +783,38 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_io_stall_micros) by (job)", + "expr": "sum(qed_[[instance]]_get_hits_l0) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "bytes_read{{job}}", + "legendFormat": "hit_l0{{job}}", "refId": "A" - } - ], - "thresholds": [], - "timeFrom": null, - "timeRegions": [], - "timeShift": null, - "title": "IO wait in compaction or flush", - "tooltip": { - "shared": true, - "sort": 0, - "value_type": "individual" - }, - "type": "graph", - "xaxis": { - "buckets": null, - "mode": 
"time", - "name": null, - "show": true, - "values": [] - }, - "yaxes": [ - { - "format": "µs", - "label": null, - "logBase": 1, - "max": null, - "min": "0", - "show": true }, { - "format": "short", - "label": null, - "logBase": 1, - "max": null, - "min": null, - "show": false - } - ], - "yaxis": { - "align": false, - "alignLevel": null - } - }, - { - "aliasColors": {}, - "bars": false, - "dashLength": 10, - "dashes": false, - "fill": 1, - "gridPos": { - "h": 9, - "w": 12, - "x": 12, - "y": 36 - }, - "id": 2, - "legend": { - "avg": false, - "current": false, - "max": false, - "min": false, - "show": true, - "total": false, - "values": false - }, - "lines": true, - "linewidth": 1, - "links": [], - "nullPointMode": "null", - "paceLength": 10, - "percentage": false, - "pointradius": 2, - "points": false, - "renderer": "flot", - "seriesOverrides": [], - "stack": false, - "steppedLine": false, - "targets": [ - { - "expr": "sum(qed_[[instance]]_io_bytes_read) by (job)", + "expr": "sum(qed_[[instance]]_get_hits_l1) by (job)", "format": "time_series", + "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "read_{{job}}", - "refId": "A" + "legendFormat": "hit_l1{{job}}", + "refId": "B" }, { - "expr": "sum(qed_[[instance]]_io_bytes_written) by (job)", + "expr": "sum(qed_[[instance]]_get_hits_l2_up) by (job)", "format": "time_series", + "hide": false, + "interval": "", "intervalFactor": 1, - "legendFormat": "write_{{job}}", - "refId": "B" + "legendFormat": "hit_l2_and_up{{job}}", + "refId": "C" } ], "thresholds": [], "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "IO bytes read and written", + "title": "Get hits per level", "tooltip": { "shared": true, "sort": 0, @@ -985,7 +830,7 @@ }, "yaxes": [ { - "format": "decbytes", + "format": "short", "label": null, "logBase": 1, "max": null, @@ -1006,6 +851,19 @@ "alignLevel": null } }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 47 + }, + "id": 22, + "panels": 
[], + "title": "IO", + "type": "row" + }, { "aliasColors": {}, "bars": false, @@ -1016,9 +874,9 @@ "h": 9, "w": 12, "x": 0, - "y": 45 + "y": 48 }, - "id": 12, + "id": 13, "legend": { "avg": false, "current": false, @@ -1044,12 +902,12 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_io_wal_files_synced) by (job)", + "expr": "sum(qed_[[instance]]_io_wal_file_bytes) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "files_synced{{job}}", + "legendFormat": "bytes{{job}}", "refId": "A" } ], @@ -1057,7 +915,7 @@ "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "WAL files synced", + "title": "WAL bytes written", "tooltip": { "shared": true, "sort": 0, @@ -1073,7 +931,7 @@ }, "yaxes": [ { - "format": "short", + "format": "decbytes", "label": null, "logBase": 1, "max": null, @@ -1104,14 +962,12 @@ "h": 9, "w": 12, "x": 12, - "y": 45 + "y": 48 }, - "id": 13, + "id": 2, "legend": { "avg": false, "current": false, - "hideEmpty": true, - "hideZero": true, "max": false, "min": false, "show": true, @@ -1132,20 +988,26 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_io_wal_file_bytes) by (job)", + "expr": "sum(qed_[[instance]]_io_bytes_read) by (job)", "format": "time_series", - "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "bytes{{job}}", + "legendFormat": "read_{{job}}", "refId": "A" + }, + { + "expr": "sum(qed_[[instance]]_io_bytes_written) by (job)", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "write_{{job}}", + "refId": "B" } ], "thresholds": [], "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "WAL bytes written", + "title": "IO bytes read and written", "tooltip": { "shared": true, "sort": 0, @@ -1192,7 +1054,7 @@ "h": 9, "w": 12, "x": 0, - "y": 54 + "y": 57 }, "id": 15, "legend": { @@ -1298,9 +1160,9 @@ "h": 9, "w": 12, "x": 12, - "y": 54 + "y": 57 }, - "id": 16, + "id": 10, "legend": {
"avg": false, "current": false, @@ -1326,38 +1188,20 @@ "steppedLine": false, "targets": [ { - "expr": "sum(qed_[[instance]]_compress_block_compressed) by (job)", + "expr": "sum(qed_[[instance]]_io_stall_micros) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "compressed{{job}}", + "legendFormat": "stall_micros{{job}}", "refId": "A" - }, - { - "expr": "sum(qed_[[instance]]_compress_block_decompressed) by (job)", - "format": "time_series", - "hide": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "decompressed{{job}}", - "refId": "B" - }, - { - "expr": "sum(qed_[[instance]]_compress_block_not_compressed) by (job)", - "format": "time_series", - "hide": false, - "interval": "", - "intervalFactor": 1, - "legendFormat": "not_compressed{{job}}", - "refId": "C" } ], "thresholds": [], "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "Block compression", + "title": "Stall time for compaction or flush", "tooltip": { "shared": true, "sort": 0, @@ -1373,7 +1217,7 @@ }, "yaxes": [ { - "format": "short", + "format": "µs", "label": null, "logBase": 1, "max": null, @@ -1399,15 +1243,14 @@ "bars": false, "dashLength": 10, "dashes": false, - "description": "", "fill": 1, "gridPos": { "h": 9, "w": 12, "x": 0, - "y": 63 + "y": 66 }, - "id": 17, + "id": 16, "legend": { "avg": false, "current": false, @@ -1433,12 +1276,30 @@ "steppedLine": false, "targets": [ { - "expr": "sum(node_disk_io_now) by (job,device)", + "expr": "sum(qed_[[instance]]_compress_block_compressed) by (job)", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "compressed{{job}}", + "refId": "A" + }, + { + "expr": "sum(qed_[[instance]]_compress_block_decompressed) by (job)", + "format": "time_series", + "hide": false, + "interval": "", + "intervalFactor": 1, + "legendFormat": "decompressed{{job}}", + "refId": "B" + }, + { + "expr":
"sum(qed_[[instance]]_compress_block_not_compressed) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "ops{{job}}@{{device}}", + "legendFormat": "not_compressed{{job}}", "refId": "C" } ], @@ -1446,7 +1307,7 @@ "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "IO ops", + "title": "Block compression", "tooltip": { "shared": true, "sort": 0, @@ -1488,15 +1349,14 @@ "bars": false, "dashLength": 10, "dashes": false, - "description": "", "fill": 1, "gridPos": { "h": 9, "w": 12, "x": 12, - "y": 63 + "y": 66 }, - "id": 18, + "id": 12, "legend": { "avg": false, "current": false, @@ -1522,21 +1382,12 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(node_disk_writes_completed_total[30s])) by (job,device)", - "format": "time_series", - "hide": true, - "interval": "", - "intervalFactor": 1, - "legendFormat": "writes{{job}}@{{device}}", - "refId": "C" - }, - { - "expr": "sum(rate(node_disk_reads_completed_total[30s])) by (job,device)", + "expr": "sum(qed_[[instance]]_io_wal_files_synced) by (job)", "format": "time_series", "hide": false, "interval": "", "intervalFactor": 1, - "legendFormat": "reads{{job}}@{{device}}", + "legendFormat": "files_synced{{job}}", "refId": "A" } ], @@ -1544,7 +1395,7 @@ "timeFrom": null, "timeRegions": [], "timeShift": null, - "title": "IO reads and writes", + "title": "WAL files synced", "tooltip": { "shared": true, "sort": 0, @@ -1560,7 +1411,7 @@ }, "yaxes": [ { - "format": "Bps", + "format": "short", "label": null, "logBase": 1, "max": null, @@ -1592,8 +1443,8 @@ "allValue": null, "current": { "tags": [], - "text": "storage", - "value": "storage" + "text": "wal", + "value": "wal" }, "hide": 0, "includeAll": false, @@ -1602,12 +1453,12 @@ "name": "instance", "options": [ { - "selected": true, + "selected": false, "text": "storage", "value": "storage" }, { - "selected": false, + "selected": true, "text": "wal", "value": "wal" } @@ -1650,5 +1501,5 @@ "timezone": "", 
"title": "RocksDB", "uid": "j3KzCD6iz", - "version": 2 + "version": 3 } \ No newline at end of file