Skip to content

Commit

Permalink
[dashboards] sync grafana dashboards (aptos-labs#4835)
Browse files Browse the repository at this point in the history
Co-authored-by: rustielin <[email protected]>
  • Loading branch information
github-actions[bot] and rustielin authored Oct 7, 2022
1 parent a0f03a6 commit 8c59034
Show file tree
Hide file tree
Showing 14 changed files with 5,614 additions and 5,238 deletions.
157 changes: 106 additions & 51 deletions dashboards/blockchain-health.json
Original file line number Diff line number Diff line change
Expand Up @@ -90,18 +90,19 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 8, "y": 1 },
"id": 45,
"id": 57,
"isNew": false,
"span": 0,
"title": "Current Round",
"description": "The round that consensus is currently at; its rate of change is roughly the committed blocks per sec.",
"title": "Transactions per block",
"description": "The average number of transactions per block; this can impact execution time and overall latency.",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "aptos_consensus_current_round{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}",
"expr": "rate(aptos_consensus_num_txns_per_block_sum{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval]) / rate(aptos_consensus_num_txns_per_block_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"format": "time_series"
}
Expand All @@ -122,7 +123,7 @@
]
},
"custom": {
"axisLabel": "round #",
"axisLabel": "# transactions / block",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -147,18 +148,19 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 16, "y": 1 },
"id": 60,
"id": 2,
"isNew": false,
"span": 0,
"title": "Current Epoch",
"description": "The current epoch number the node is in; the number is bumped by reconfiguration events such as key rotation or validator set changes.",
"title": "Committed blocks per sec",
"description": "The rate of the committed round number.",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "aptos_consensus_epoch{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}",
"expr": "rate(aptos_consensus_last_committed_round{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"format": "time_series"
}
Expand All @@ -179,7 +181,7 @@
]
},
"custom": {
"axisLabel": "Epoch #",
"axisLabel": "blocks / s",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -200,34 +202,32 @@
}
},
{
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"datasource": { "type": "prometheus", "uid": "MJnqIFmVk" },
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 0, "y": 9 },
"id": 6,
"id": 146,
"isNew": false,
"span": 0,
"title": "Committed successful txns per sec",
"description": "The rate of the committed transaction version.",
"title": "Synced version",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_last_committed_version{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"refId": "B",
"datasource": { "type": "prometheus", "uid": "MJnqIFmVk" },
"expr": "aptos_state_sync_version{type=\"synced\", role=\"validator\", kubernetes_pod_name=~\".*\", chain_name=~\"3\", namespace=~\"telemetry-service\"}",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"format": "time_series"
}
],
"options": {
"legend": { "calcs": [], "displayMode": "list", "placement": "bottom" },
"tooltip": { "mode": "multi" }
"tooltip": { "mode": "single" }
},
"fieldConfig": {
"defaults": {
"unit": "short",
"unit": "",
"color": { "mode": "palette-classic" },
"thresholds": {
"mode": "absolute",
Expand All @@ -237,7 +237,6 @@
]
},
"custom": {
"axisLabel": "transactions / s",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -246,7 +245,7 @@
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"showPoints": "auto",
"spanNulls": false,
"hideFrom": { "legend": false, "tooltip": false, "viz": false },
"lineStyle": { "fill": "" },
Expand All @@ -262,20 +261,19 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 8, "y": 9 },
"id": 127,
"id": 45,
"isNew": false,
"span": 0,
"title": "Transaction execution failed per sec",
"description": "",
"title": "Current Round",
"description": "The round that consensus is currently at; its rate of change is roughly the committed blocks per sec.",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_committed_txns_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\",state=\"failed\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{state}}",
"expr": "aptos_consensus_current_round{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}",
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"format": "time_series"
}
],
Expand All @@ -295,7 +293,7 @@
]
},
"custom": {
"axisLabel": "transactions / s",
"axisLabel": "round #",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -320,20 +318,19 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 16, "y": 9 },
"id": 128,
"id": 60,
"isNew": false,
"span": 0,
"title": "Transaction execution retry per sec",
"description": "",
"title": "Current Epoch",
"description": "The current epoch number the node is in; the number is bumped by reconfiguration events such as key rotation or validator set changes.",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_committed_txns_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\",state=\"retry\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{state}}",
"expr": "aptos_consensus_epoch{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}",
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"format": "time_series"
}
],
Expand All @@ -353,7 +350,7 @@
]
},
"custom": {
"axisLabel": "transactions / s",
"axisLabel": "Epoch #",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -378,18 +375,18 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 0, "y": 17 },
"id": 2,
"id": 6,
"isNew": false,
"span": 0,
"title": "Committed blocks per sec",
"description": "The rate of the committed round number.",
"title": "Committed successful txns per sec",
"description": "The rate of the committed transaction version.",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_last_committed_round{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"expr": "rate(aptos_consensus_last_committed_version{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"format": "time_series"
Expand All @@ -411,7 +408,7 @@
]
},
"custom": {
"axisLabel": "blocks / s",
"axisLabel": "transactions / s",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -436,20 +433,20 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 8, "y": 17 },
"id": 57,
"id": 127,
"isNew": false,
"span": 0,
"title": "Transactions per block",
"description": "The average number of transactions per block; this can impact execution time and overall latency.",
"title": "Transaction execution failed per sec",
"description": "",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_num_txns_per_block_sum{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval]) / rate(aptos_consensus_num_txns_per_block_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"expr": "rate(aptos_consensus_committed_txns_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\",state=\"failed\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{role}}",
"legendFormat": "{{kubernetes_pod_name}}-{{state}}",
"format": "time_series"
}
],
Expand All @@ -469,7 +466,7 @@
]
},
"custom": {
"axisLabel": "# transactions / block",
"axisLabel": "transactions / s",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
Expand All @@ -494,18 +491,18 @@
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 16, "y": 17 },
"id": 140,
"id": 128,
"isNew": false,
"span": 0,
"title": "Round manager error rate",
"title": "Transaction execution retry per sec",
"description": "",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_error_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"expr": "rate(aptos_consensus_committed_txns_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\",state=\"retry\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{state}}",
"format": "time_series"
Expand Down Expand Up @@ -699,6 +696,64 @@
}
}
},
{
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"editable": false,
"error": false,
"gridPos": { "h": 8, "w": 8, "x": 16, "y": 25 },
"id": 140,
"isNew": false,
"span": 0,
"title": "Round manager error rate",
"description": "",
"transparent": false,
"type": "timeseries",
"targets": [
{
"refId": "A",
"datasource": { "type": "prometheus", "uid": "${Datasource}" },
"expr": "rate(aptos_consensus_error_count{chain_name=~\"$chain_name\", namespace=~\"$namespace\", kubernetes_pod_name=~\"$kubernetes_pod_name\", role=~\"$role\"}[$interval])",
"intervalFactor": 1,
"legendFormat": "{{kubernetes_pod_name}}-{{state}}",
"format": "time_series"
}
],
"options": {
"legend": { "calcs": [], "displayMode": "list", "placement": "bottom" },
"tooltip": { "mode": "multi" }
},
"fieldConfig": {
"defaults": {
"unit": "short",
"color": { "mode": "palette-classic" },
"thresholds": {
"mode": "absolute",
"steps": [
{ "color": "green", "value": null },
{ "color": "red", "value": 80 }
]
},
"custom": {
"axisLabel": "errors / s",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 0,
"gradientMode": "none",
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"hideFrom": { "legend": false, "tooltip": false, "viz": false },
"lineStyle": { "fill": "" },
"scaleDistribution": { "type": "linear" },
"stacking": { "group": "A", "mode": "none" },
"thresholdsStyle": { "mode": "off" }
}
}
}
},
{
"editable": false,
"error": false,
Expand Down Expand Up @@ -1854,7 +1909,7 @@
},
"refresh": false,
"schemaVersion": 37,
"version": 4,
"version": 5,
"links": [
{
"title": "aptos-core",
Expand Down
Binary file modified dashboards/blockchain-health.json.gz
Binary file not shown.
Loading

0 comments on commit 8c59034

Please sign in to comment.