[arvados] created: 2.7.0-5081-g6280dbe8a3
git repository hosting
git at public.arvados.org
Wed Oct 25 20:26:29 UTC 2023
at 6280dbe8a31b9fe9afcf28041cecd29382bfa437 (commit)
commit 6280dbe8a31b9fe9afcf28041cecd29382bfa437
Author: Lucas Di Pentima <lucas.dipentima at curii.com>
Date: Wed Oct 25 17:17:25 2023 -0300
20953: Adds TLS certificate expiration red/yellow/green light on main dashboard
Arvados-DCO-1.1-Signed-off-by: Lucas Di Pentima <lucas.dipentima at curii.com>
diff --git a/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json b/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json
index 36f24c2c4d..daf8f2f0a7 100644
--- a/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json
+++ b/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json
@@ -9,6 +9,33 @@
"pluginName": "Prometheus"
}
],
+ "__elements": {},
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "10.2.0"
+ },
+ {
+ "type": "panel",
+ "id": "graph",
+ "name": "Graph (old)",
+ "version": ""
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "table",
+ "name": "Table",
+ "version": ""
+ }
+ ],
"annotations": {
"list": [
{
@@ -34,10 +61,132 @@
"editable": true,
"fiscalYearStartMonth": 0,
"graphTooltip": 0,
- "id": 6,
+ "id": null,
"links": [],
"liveNow": false,
"panels": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fieldConfig": {
+ "defaults": {
+ "color": {
+ "mode": "thresholds"
+ },
+ "custom": {
+ "align": "center",
+ "cellOptions": {
+ "type": "auto"
+ },
+ "inspect": false
+ },
+ "decimals": 2,
+ "mappings": [],
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ }
+ ]
+ },
+ "unit": "dtdurations"
+ },
+ "overrides": [
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Earliest SSL cert expiration"
+ },
+ "properties": [
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "red",
+ "value": null
+ },
+ {
+ "color": "yellow",
+ "value": __TLS_EXPIRATION_YELLOW__
+ },
+ {
+ "color": "green",
+ "value": __TLS_EXPIRATION_GREEN__
+ }
+ ]
+ }
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "type": "color-background"
+ }
+ }
+ ]
+ }
+ ]
+ },
+ "gridPos": {
+ "h": 3,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 35,
+ "links": [],
+ "options": {
+ "cellHeight": "sm",
+ "footer": {
+ "countRows": false,
+ "fields": "",
+ "reducer": [
+ "sum"
+ ],
+ "show": false
+ },
+ "showHeader": false
+ },
+ "pluginVersion": "10.2.0",
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "editorMode": "code",
+ "exemplar": false,
+ "expr": "min(probe_ssl_earliest_cert_expiry)-time()",
+ "format": "time_series",
+ "instant": true,
+ "legendFormat": "__auto",
+ "range": false,
+ "refId": "A"
+ }
+ ],
+ "title": "Earliest SSL certificate expiration",
+ "transformations": [
+ {
+ "id": "organize",
+ "options": {
+ "excludeByName": {
+ "Time": true
+ },
+ "indexByName": {},
+ "renameByName": {
+ "Time": "",
+ "min(probe_ssl_earliest_cert_expiry)-time()": "Earliest SSL cert expiration"
+ }
+ }
+ }
+ ],
+ "type": "table"
+ },
{
"aliasColors": {},
"bars": false,
@@ -53,7 +202,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 0
+ "y": 3
},
"hiddenSeries": false,
"id": 34,
@@ -73,7 +222,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -153,7 +302,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 0
+ "y": 3
},
"hiddenSeries": false,
"id": 14,
@@ -173,7 +322,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -248,7 +397,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 8
+ "y": 11
},
"hiddenSeries": false,
"id": 8,
@@ -268,7 +417,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -342,7 +491,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 8
+ "y": 11
},
"hiddenSeries": false,
"id": 12,
@@ -362,7 +511,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -456,7 +605,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 16
+ "y": 19
},
"hiddenSeries": false,
"id": 10,
@@ -476,7 +625,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -544,7 +693,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 16
+ "y": 19
},
"hiddenSeries": false,
"id": 24,
@@ -564,7 +713,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -648,7 +797,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 24
+ "y": 27
},
"hiddenSeries": false,
"id": 6,
@@ -668,7 +817,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -768,7 +917,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 24
+ "y": 27
},
"hiddenSeries": false,
"id": 22,
@@ -788,7 +937,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -867,7 +1016,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 32
+ "y": 35
},
"hiddenSeries": false,
"id": 32,
@@ -887,7 +1036,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -961,7 +1110,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 32
+ "y": 35
},
"hiddenSeries": false,
"id": 2,
@@ -981,7 +1130,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1055,7 +1204,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 40
+ "y": 43
},
"hiddenSeries": false,
"id": 16,
@@ -1075,7 +1224,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1151,7 +1300,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 40
+ "y": 43
},
"hiddenSeries": false,
"id": 4,
@@ -1171,7 +1320,7 @@
"alertThreshold": true
},
"percentage": false,
- "pluginVersion": "9.4.3",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1245,7 +1394,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 48
+ "y": 51
},
"hiddenSeries": false,
"id": 18,
@@ -1261,8 +1410,11 @@
"lines": true,
"linewidth": 1,
"nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
"percentage": false,
- "pluginVersion": "8.4.5",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1332,7 +1484,7 @@
"h": 8,
"w": 12,
"x": 12,
- "y": 48
+ "y": 51
},
"hiddenSeries": false,
"id": 26,
@@ -1348,8 +1500,11 @@
"lines": true,
"linewidth": 1,
"nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
"percentage": false,
- "pluginVersion": "8.4.5",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1423,7 +1578,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 56
+ "y": 59
},
"hiddenSeries": false,
"id": 20,
@@ -1439,8 +1594,11 @@
"lines": true,
"linewidth": 1,
"nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
"percentage": false,
- "pluginVersion": "8.4.5",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1518,7 +1676,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 64
+ "y": 67
},
"hiddenSeries": false,
"id": 28,
@@ -1534,8 +1692,11 @@
"lines": true,
"linewidth": 1,
"nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
"percentage": false,
- "pluginVersion": "8.4.5",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1603,7 +1764,7 @@
"h": 8,
"w": 12,
"x": 0,
- "y": 72
+ "y": 75
},
"hiddenSeries": false,
"id": 30,
@@ -1619,8 +1780,11 @@
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
"percentage": false,
- "pluginVersion": "8.4.5",
+ "pluginVersion": "10.2.0",
"pointradius": 2,
"points": false,
"renderer": "flot",
@@ -1678,7 +1842,6 @@
"refresh": "10s",
"revision": 1,
"schemaVersion": 38,
- "style": "dark",
"tags": [],
"templating": {
"list": []
@@ -1703,6 +1866,6 @@
"timezone": "",
"title": "Arvados cluster overview",
"uid": "ArvadosClusterOverviewDashboard",
- "version": 6,
+ "version": 1,
"weekStart": ""
}
\ No newline at end of file
commit 382460d9b5614598bfc6a28f93a1e140df45ab4a
Author: Lucas Di Pentima <lucas.dipentima at curii.com>
Date: Wed Oct 25 17:15:59 2023 -0300
20953: Fixes indentation on dashboard JSON file.
Arvados-DCO-1.1-Signed-off-by: Lucas Di Pentima <lucas.dipentima at curii.com>
diff --git a/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json b/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json
index c1278967bb..36f24c2c4d 100644
--- a/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json
+++ b/tools/salt-install/config_examples/multi_host/aws/dashboards/arvados_overview.json
@@ -1,1708 +1,1708 @@
{
- "__inputs": [
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "Prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "annotations": {
+ "list": [
{
- "name": "DS_PROMETHEUS",
- "label": "Prometheus",
- "description": "",
- "type": "datasource",
- "pluginId": "prometheus",
- "pluginName": "Prometheus"
+ "builtIn": 1,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "target": {
+ "limit": 100,
+ "matchAny": false,
+ "tags": [],
+ "type": "dashboard"
+ },
+ "type": "dashboard"
}
- ],
- "annotations": {
- "list": [
+ ]
+ },
+ "editable": true,
+ "fiscalYearStartMonth": 0,
+ "graphTooltip": 0,
+ "id": 6,
+ "links": [],
+ "liveNow": false,
+ "panels": [
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fill": 4,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 0
+ },
+ "hiddenSeries": false,
+ "id": 34,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [
+ {
+ "$$hashKey": "object:424",
+ "alias": "/out/",
+ "stack": "B",
+ "transform": "negative-Y"
+ }
+ ],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
{
- "builtIn": 1,
"datasource": {
"type": "prometheus",
"uid": "${DS_PROMETHEUS}"
},
- "enable": true,
- "hide": true,
- "iconColor": "rgba(0, 211, 255, 1)",
- "name": "Annotations & Alerts",
- "target": {
- "limit": 100,
- "matchAny": false,
- "tags": [],
- "type": "dashboard"
- },
- "type": "dashboard"
+ "expr": "sum(rate(arvados_keepstore_volume_io_bytes{}[1m])) without (operation,device_id)",
+ "interval": "",
+ "legendFormat": "{{ instance }} {{ direction }}",
+ "refId": "A"
}
- ]
- },
- "editable": true,
- "fiscalYearStartMonth": 0,
- "graphTooltip": 0,
- "id": 6,
- "links": [],
- "liveNow": false,
- "panels": [
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 4,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 0
- },
- "hiddenSeries": false,
- "id": 34,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [
- {
- "$$hashKey": "object:424",
- "alias": "/out/",
- "stack": "B",
- "transform": "negative-Y"
- }
- ],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "sum(rate(arvados_keepstore_volume_io_bytes{}[1m])) without (operation,device_id)",
- "interval": "",
- "legendFormat": "{{ instance }} {{ direction }}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Keepstore bandwidth [1m]",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Keepstore bandwidth [1m]",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:159",
+ "format": "Bps",
+ "logBase": 1,
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:159",
- "format": "Bps",
- "logBase": 1,
- "show": true
- },
- {
- "$$hashKey": "object:160",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:160",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 0
+ },
+ "hiddenSeries": false,
+ "id": 14,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 0
- },
- "hiddenSeries": false,
- "id": 14,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_containers_running{}",
- "interval": "",
- "legendFormat": "# containers",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Containers running",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "expr": "arvados_dispatchcloud_containers_running{}",
+ "interval": "",
+ "legendFormat": "# containers",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Containers running",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:973",
+ "format": "short",
+ "label": "",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:973",
- "format": "short",
- "label": "",
- "logBase": 1,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:974",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:974",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ "overrides": []
+ },
+ "fill": 8,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 8
+ },
+ "hiddenSeries": false,
+ "id": 8,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 8,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 8
- },
- "hiddenSeries": false,
- "id": 8,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "sum(rate(arvados_keepstore_volume_operations{}[1m])) without (operation,device_id)",
- "interval": "",
- "legendFormat": "{{instance}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Keepstore volume operations rate/second",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "expr": "sum(rate(arvados_keepstore_volume_operations{}[1m])) without (operation,device_id)",
+ "interval": "",
+ "legendFormat": "{{instance}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Keepstore volume operations rate/second",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:982",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:982",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:983",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:983",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ "overrides": []
+ },
+ "fill": 6,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 8
+ },
+ "hiddenSeries": false,
+ "id": 12,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 6,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 8
+ "expr": "arvados_dispatchcloud_queue_entries{}",
+ "interval": "",
+ "legendFormat": "{{instance_type}} {{state}}",
+ "refId": "A"
},
- "hiddenSeries": false,
- "id": 12,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_queue_entries{}",
- "interval": "",
- "legendFormat": "{{instance_type}} {{state}}",
- "refId": "A"
- },
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_containers_allocated_not_started{}",
- "interval": "",
- "legendFormat": "allocated, not started",
- "refId": "B"
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_containers_not_allocated_over_quota{}",
- "interval": "",
- "legendFormat": "not allocated, over quota",
- "refId": "C"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Queue: # containers per {state, instance type}",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
+ "expr": "arvados_dispatchcloud_containers_allocated_not_started{}",
+ "interval": "",
+ "legendFormat": "allocated, not started",
+ "refId": "B"
},
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
- },
- "yaxes": [
- {
- "$$hashKey": "object:4306",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:4307",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "arvados_dispatchcloud_containers_not_allocated_over_quota{}",
+ "interval": "",
+ "legendFormat": "not allocated, over quota",
+ "refId": "C"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Queue: # containers per {state, instance type}",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fieldConfig": {
- "defaults": {
- "links": []
- },
- "overrides": []
- },
- "fill": 8,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 16
- },
- "hiddenSeries": false,
- "id": 10,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_keepstore_bufferpool_inuse_buffers{}",
- "interval": "",
- "legendFormat": "{{instance}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Keepstore buffers in use",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:4306",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:929",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:930",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:4307",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 16
- },
- "hiddenSeries": false,
- "id": 24,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_containers_longest_wait_time_seconds{}",
- "interval": "",
- "legendFormat": "Longest wait time",
- "refId": "A"
- },
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "rate(arvados_dispatchcloud_containers_time_from_queue_to_crunch_run_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_containers_time_from_queue_to_crunch_run_seconds_count{}[10m])",
- "interval": "",
- "legendFormat": "avg wait time [10m]",
- "refId": "B"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Container wait times",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "yaxes": [
- {
- "$$hashKey": "object:138",
- "format": "s",
- "logBase": 1,
- "min": "0",
- "show": true
+ "overrides": []
+ },
+ "fill": 8,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 16
+ },
+ "hiddenSeries": false,
+ "id": 10,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:139",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "arvados_keepstore_bufferpool_inuse_buffers{}",
+ "interval": "",
+ "legendFormat": "{{instance}}",
+ "refId": "A"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Keepstore buffers in use",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fieldConfig": {
- "defaults": {
- "links": []
- },
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 24
- },
- "hiddenSeries": false,
- "id": 6,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null",
- "options": {
- "alertThreshold": true
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:929",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_keep_total_bytes{}",
- "interval": "",
- "legendFormat": "Total stored",
- "refId": "A"
- },
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_keep_overreplicated_bytes{}",
- "interval": "",
- "legendFormat": "Overreplicated",
- "refId": "B"
- },
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_keep_underreplicated_bytes{}",
- "interval": "",
- "legendFormat": "Underreplicated",
- "refId": "C"
+ {
+ "$$hashKey": "object:930",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 16
+ },
+ "hiddenSeries": false,
+ "id": 24,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_keep_lost_bytes{}",
- "interval": "",
- "legendFormat": "Lost",
- "refId": "D"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Total bytes by type",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "expr": "arvados_dispatchcloud_containers_longest_wait_time_seconds{}",
+ "interval": "",
+ "legendFormat": "Longest wait time",
+ "refId": "A"
},
- "yaxes": [
- {
- "$$hashKey": "object:304",
- "decimals": 2,
- "format": "decbytes",
- "label": "",
- "logBase": 1,
- "min": "0",
- "show": true
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:305",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "rate(arvados_dispatchcloud_containers_time_from_queue_to_crunch_run_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_containers_time_from_queue_to_crunch_run_seconds_count{}[10m])",
+ "interval": "",
+ "legendFormat": "avg wait time [10m]",
+ "refId": "B"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Container wait times",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": true,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 24
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:138",
+ "format": "s",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "hiddenSeries": false,
- "id": 22,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
+ {
+ "$$hashKey": "object:139",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 24
+ },
+ "hiddenSeries": false,
+ "id": 6,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "arvados_keep_total_bytes{}",
+ "interval": "",
+ "legendFormat": "Total stored",
+ "refId": "A"
},
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "rate(arvados_dispatchcloud_instances_time_to_ssh_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_time_to_ssh_seconds_count{}[10m])",
- "hide": false,
- "interval": "",
- "legendFormat": "ssh",
- "refId": "A"
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "rate(arvados_dispatchcloud_instances_time_to_ready_for_container_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_time_to_ready_for_container_seconds_count{}[10m])",
- "interval": "",
- "legendFormat": "ready",
- "refId": "B"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Instance time to ... avg [10m]",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
+ "expr": "arvados_keep_overreplicated_bytes{}",
+ "interval": "",
+ "legendFormat": "Overreplicated",
+ "refId": "B"
},
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "arvados_keep_underreplicated_bytes{}",
+ "interval": "",
+ "legendFormat": "Underreplicated",
+ "refId": "C"
},
- "yaxes": [
- {
- "$$hashKey": "object:113",
- "format": "s",
- "logBase": 1,
- "min": "0",
- "show": true
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:114",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "arvados_keep_lost_bytes{}",
+ "interval": "",
+ "legendFormat": "Lost",
+ "refId": "D"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Total bytes by type",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 32
- },
- "hiddenSeries": false,
- "id": 32,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_concurrent_requests{}",
- "interval": "",
- "legendFormat": "{{instance}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Concurrent requests",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:304",
+ "decimals": 2,
+ "format": "decbytes",
+ "label": "",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:109",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:110",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:305",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": true,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fieldConfig": {
- "defaults": {
- "links": []
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 24
+ },
+ "hiddenSeries": false,
+ "id": 22,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 32
- },
- "hiddenSeries": false,
- "id": 2,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
+ "expr": "rate(arvados_dispatchcloud_instances_time_to_ssh_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_time_to_ssh_seconds_count{}[10m])",
+ "hide": false,
+ "interval": "",
+ "legendFormat": "ssh",
+ "refId": "A"
},
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_boot_outcomes{}",
- "interval": "",
- "legendFormat": "{{outcome}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Boot outcomes",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
- },
- "yaxes": [
- {
- "$$hashKey": "object:921",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:922",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "rate(arvados_dispatchcloud_instances_time_to_ready_for_container_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_time_to_ready_for_container_seconds_count{}[10m])",
+ "interval": "",
+ "legendFormat": "ready",
+ "refId": "B"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Instance time to ... avg [10m]",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:113",
+ "format": "s",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ {
+ "$$hashKey": "object:114",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 32
+ },
+ "hiddenSeries": false,
+ "id": 32,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 40
- },
- "hiddenSeries": false,
- "id": 16,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "sum(arvados_dispatchcloud_instances_price{})",
- "interval": "",
- "intervalFactor": 10,
- "legendFormat": "cost ($)",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Cost",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "expr": "arvados_concurrent_requests{}",
+ "interval": "",
+ "legendFormat": "{{instance}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Concurrent requests",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:109",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:623",
- "format": "short",
- "label": "$ / hour",
- "logBase": 1,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:624",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:110",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 32
+ },
+ "hiddenSeries": false,
+ "id": 2,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 40
- },
- "hiddenSeries": false,
- "id": 4,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "options": {
- "alertThreshold": true
- },
- "percentage": false,
- "pluginVersion": "9.4.3",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_instances_disappeared{}",
- "interval": "",
- "legendFormat": "{{state}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "instance state before disappearance",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "expr": "arvados_dispatchcloud_boot_outcomes{}",
+ "interval": "",
+ "legendFormat": "{{outcome}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Boot outcomes",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:921",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:1025",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:1026",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:922",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 40
+ },
+ "hiddenSeries": false,
+ "id": 16,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 48
- },
- "hiddenSeries": false,
- "id": 18,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "percentage": false,
- "pluginVersion": "8.4.5",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_instances_price{}",
- "interval": "",
- "intervalFactor": 10,
- "legendFormat": "{{category}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Cost by node state",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
+ "expr": "sum(arvados_dispatchcloud_instances_price{})",
+ "interval": "",
+ "intervalFactor": 10,
+ "legendFormat": "cost ($)",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Cost",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:623",
+ "format": "short",
+ "label": "$ / hour",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ {
+ "$$hashKey": "object:624",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "yaxes": [
- {
- "$$hashKey": "object:574",
- "format": "short",
- "label": "$ / hour",
- "logBase": 1,
- "min": "0",
- "show": true
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 40
+ },
+ "hiddenSeries": false,
+ "id": 4,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "options": {
+ "alertThreshold": true
+ },
+ "percentage": false,
+ "pluginVersion": "9.4.3",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:575",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "arvados_dispatchcloud_instances_disappeared{}",
+ "interval": "",
+ "legendFormat": "{{state}}",
+ "refId": "A"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "instance state before disappearance",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 12,
- "y": 48
- },
- "hiddenSeries": false,
- "id": 26,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "percentage": false,
- "pluginVersion": "8.4.5",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "rate(arvados_dispatchcloud_instances_time_from_shutdown_request_to_disappearance_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_time_from_shutdown_request_to_disappearance_seconds_count{}[10m])",
- "interval": "",
- "legendFormat": "shutdown to disappearance",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "Instances time from shutdown to disappearance avg[10m]",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:1025",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ {
+ "$$hashKey": "object:1026",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "yaxes": [
- {
- "$$hashKey": "object:450",
- "format": "s",
- "logBase": 1,
- "min": "0",
- "show": true
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 48
+ },
+ "hiddenSeries": false,
+ "id": 18,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "percentage": false,
+ "pluginVersion": "8.4.5",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:451",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "arvados_dispatchcloud_instances_price{}",
+ "interval": "",
+ "intervalFactor": 10,
+ "legendFormat": "{{category}}",
+ "refId": "A"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Cost by node state",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:574",
+ "format": "short",
+ "label": "$ / hour",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "fieldConfig": {
- "defaults": {
- "links": []
+ {
+ "$$hashKey": "object:575",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 12,
+ "y": 48
+ },
+ "hiddenSeries": false,
+ "id": 26,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "percentage": false,
+ "pluginVersion": "8.4.5",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- "overrides": []
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 56
- },
- "hiddenSeries": false,
- "id": 20,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "percentage": false,
- "pluginVersion": "8.4.5",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": true,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "arvados_dispatchcloud_instances_total{}",
- "instant": false,
- "interval": "",
- "legendFormat": "{{instance_type}} : {{category}}",
- "refId": "A"
- }
- ],
- "thresholds": [
- {
- "$$hashKey": "object:540",
- "colorMode": "critical",
- "fill": true,
- "line": true,
- "op": "gt",
- "yaxis": "left"
- }
- ],
- "timeRegions": [],
- "title": "Nodes by state",
- "tooltip": {
- "shared": true,
- "sort": 2,
- "value_type": "individual"
+ "expr": "rate(arvados_dispatchcloud_instances_time_from_shutdown_request_to_disappearance_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_time_from_shutdown_request_to_disappearance_seconds_count{}[10m])",
+ "interval": "",
+ "legendFormat": "shutdown to disappearance",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "Instances time from shutdown to disappearance avg[10m]",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:450",
+ "format": "s",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ {
+ "$$hashKey": "object:451",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fieldConfig": {
+ "defaults": {
+ "links": []
},
- "yaxes": [
- {
- "$$hashKey": "object:723",
- "format": "short",
- "logBase": 1,
- "min": "0",
- "show": true
+ "overrides": []
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 56
+ },
+ "hiddenSeries": false,
+ "id": 20,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "percentage": false,
+ "pluginVersion": "8.4.5",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": true,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:724",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "arvados_dispatchcloud_instances_total{}",
+ "instant": false,
+ "interval": "",
+ "legendFormat": "{{instance_type}} : {{category}}",
+ "refId": "A"
+ }
+ ],
+ "thresholds": [
+ {
+ "$$hashKey": "object:540",
+ "colorMode": "critical",
+ "fill": true,
+ "line": true,
+ "op": "gt",
+ "yaxis": "left"
}
+ ],
+ "timeRegions": [],
+ "title": "Nodes by state",
+ "tooltip": {
+ "shared": true,
+ "sort": 2,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 64
- },
- "hiddenSeries": false,
- "id": 28,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null as zero",
- "percentage": false,
- "pluginVersion": "8.4.5",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "rate(arvados_dispatchcloud_instances_run_probe_duration_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_run_probe_duration_seconds_count{}[10m])",
- "interval": "",
- "legendFormat": "{{outcome}}",
- "refId": "A"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "run probe duration avg[10m]",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:723",
+ "format": "short",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:125",
- "format": "s",
- "logBase": 1,
- "min": "0",
- "show": true
+ {
+ "$$hashKey": "object:724",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ },
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 64
+ },
+ "hiddenSeries": false,
+ "id": 28,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null as zero",
+ "percentage": false,
+ "pluginVersion": "8.4.5",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
},
- {
- "$$hashKey": "object:126",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ "expr": "rate(arvados_dispatchcloud_instances_run_probe_duration_seconds_sum{}[10m]) / rate(arvados_dispatchcloud_instances_run_probe_duration_seconds_count{}[10m])",
+ "interval": "",
+ "legendFormat": "{{outcome}}",
+ "refId": "A"
}
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "run probe duration avg[10m]",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
},
- {
- "aliasColors": {},
- "bars": false,
- "dashLength": 10,
- "dashes": false,
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "fill": 1,
- "fillGradient": 0,
- "gridPos": {
- "h": 8,
- "w": 12,
- "x": 0,
- "y": 72
- },
- "hiddenSeries": false,
- "id": 30,
- "legend": {
- "avg": false,
- "current": false,
- "max": false,
- "min": false,
- "show": true,
- "total": false,
- "values": false
- },
- "lines": true,
- "linewidth": 1,
- "nullPointMode": "null",
- "percentage": false,
- "pluginVersion": "8.4.5",
- "pointradius": 2,
- "points": false,
- "renderer": "flot",
- "seriesOverrides": [],
- "spaceLength": 10,
- "stack": false,
- "steppedLine": false,
- "targets": [
- {
- "datasource": {
- "type": "prometheus",
- "uid": "${DS_PROMETHEUS}"
- },
- "expr": "delta(arvados_dispatchcloud_instances_run_probe_duration_seconds_count{}[1m])",
- "instant": false,
- "interval": "",
- "legendFormat": "{{outcome}}",
- "refId": "B"
- }
- ],
- "thresholds": [],
- "timeRegions": [],
- "title": "run probe count by outcome -- delta[1m]",
- "tooltip": {
- "shared": true,
- "sort": 0,
- "value_type": "individual"
- },
- "type": "graph",
- "xaxis": {
- "mode": "time",
- "show": true,
- "values": []
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:125",
+ "format": "s",
+ "logBase": 1,
+ "min": "0",
+ "show": true
},
- "yaxes": [
- {
- "$$hashKey": "object:149",
- "format": "short",
- "logBase": 10,
- "min": "0",
- "show": true
- },
- {
- "$$hashKey": "object:150",
- "format": "short",
- "logBase": 1,
- "show": true
- }
- ],
- "yaxis": {
- "align": false
+ {
+ "$$hashKey": "object:126",
+ "format": "short",
+ "logBase": 1,
+ "show": true
}
+ ],
+ "yaxis": {
+ "align": false
}
- ],
- "refresh": "10s",
- "revision": 1,
- "schemaVersion": 38,
- "style": "dark",
- "tags": [],
- "templating": {
- "list": []
- },
- "time": {
- "from": "now-1h",
- "to": "now"
- },
- "timepicker": {
- "refresh_intervals": [
- "10s",
- "30s",
- "1m",
- "5m",
- "15m",
- "30m",
- "1h",
- "2h",
- "1d"
- ]
},
- "timezone": "",
- "title": "Arvados cluster overview",
- "uid": "ArvadosClusterOverviewDashboard",
- "version": 6,
- "weekStart": ""
- }
\ No newline at end of file
+ {
+ "aliasColors": {},
+ "bars": false,
+ "dashLength": 10,
+ "dashes": false,
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "fill": 1,
+ "fillGradient": 0,
+ "gridPos": {
+ "h": 8,
+ "w": 12,
+ "x": 0,
+ "y": 72
+ },
+ "hiddenSeries": false,
+ "id": 30,
+ "legend": {
+ "avg": false,
+ "current": false,
+ "max": false,
+ "min": false,
+ "show": true,
+ "total": false,
+ "values": false
+ },
+ "lines": true,
+ "linewidth": 1,
+ "nullPointMode": "null",
+ "percentage": false,
+ "pluginVersion": "8.4.5",
+ "pointradius": 2,
+ "points": false,
+ "renderer": "flot",
+ "seriesOverrides": [],
+ "spaceLength": 10,
+ "stack": false,
+ "steppedLine": false,
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "delta(arvados_dispatchcloud_instances_run_probe_duration_seconds_count{}[1m])",
+ "instant": false,
+ "interval": "",
+ "legendFormat": "{{outcome}}",
+ "refId": "B"
+ }
+ ],
+ "thresholds": [],
+ "timeRegions": [],
+ "title": "run probe count by outcome -- delta[1m]",
+ "tooltip": {
+ "shared": true,
+ "sort": 0,
+ "value_type": "individual"
+ },
+ "type": "graph",
+ "xaxis": {
+ "mode": "time",
+ "show": true,
+ "values": []
+ },
+ "yaxes": [
+ {
+ "$$hashKey": "object:149",
+ "format": "short",
+ "logBase": 10,
+ "min": "0",
+ "show": true
+ },
+ {
+ "$$hashKey": "object:150",
+ "format": "short",
+ "logBase": 1,
+ "show": true
+ }
+ ],
+ "yaxis": {
+ "align": false
+ }
+ }
+ ],
+ "refresh": "10s",
+ "revision": 1,
+ "schemaVersion": 38,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": []
+ },
+ "time": {
+ "from": "now-1h",
+ "to": "now"
+ },
+ "timepicker": {
+ "refresh_intervals": [
+ "10s",
+ "30s",
+ "1m",
+ "5m",
+ "15m",
+ "30m",
+ "1h",
+ "2h",
+ "1d"
+ ]
+ },
+ "timezone": "",
+ "title": "Arvados cluster overview",
+ "uid": "ArvadosClusterOverviewDashboard",
+ "version": 6,
+ "weekStart": ""
+}
\ No newline at end of file
commit f361686b04e978c652f4d7442f12511fdfd06719
Author: Lucas Di Pentima <lucas.dipentima at curii.com>
Date: Wed Oct 25 17:07:31 2023 -0300
20953: Sets sensible coloring thresholds on cert expire dates.
If using Let's Encrypt certificates, the max lifetime is 3 months, so it'll
show green if the expiration is >2 months out, yellow if it's >1.
Arvados-DCO-1.1-Signed-off-by: Lucas Di Pentima <lucas.dipentima at curii.com>
diff --git a/tools/salt-install/common.sh b/tools/salt-install/common.sh
index 5d9dba14cd..360c2c7cc3 100644
--- a/tools/salt-install/common.sh
+++ b/tools/salt-install/common.sh
@@ -48,6 +48,14 @@ for node in "${!NODES[@]}"; do
done
done
+# Sets TLS certificate expiration thresholds
+TLS_EXPIRATION_YELLOW=5184000 # > 2 months
+TLS_EXPIRATION_GREEN=15552000 # > 6 months
+if [[ "${SSL_MODE}" == "lets-encrypt" ]]; then
+ TLS_EXPIRATION_YELLOW=2592000 # > 1 months
+ TLS_EXPIRATION_GREEN=5184000 # > 2 months
+fi
+
# Auto-detects load-balancing mode
if [ -z "${ROLE2NODES['balancer']:-}" ]; then
ENABLE_BALANCER="no"
diff --git a/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json b/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json
index 92eb5391a7..fc4f8c6679 100644
--- a/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json
+++ b/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json
@@ -171,11 +171,11 @@
},
{
"color": "semi-dark-yellow",
- "value": 12096000
+ "value": __TLS_EXPIRATION_YELLOW__
},
{
"color": "semi-dark-green",
- "value": 25920000
+ "value": __TLS_EXPIRATION_GREEN__
}
]
}
diff --git a/tools/salt-install/provision.sh b/tools/salt-install/provision.sh
index a93899a61a..9b69bbffec 100755
--- a/tools/salt-install/provision.sh
+++ b/tools/salt-install/provision.sh
@@ -722,7 +722,9 @@ else
# "ArvadosPromDataSource" is the hardcoded UID for Prometheus' datasource
# in Grafana.
for f in $(ls "${GRAFANA_DASHBOARDS_DIR}"/*.json); do
- sed 's#${DS_PROMETHEUS}#ArvadosPromDataSource#g' \
+ sed "s#__TLS_EXPIRATION_YELLOW__#${TLS_EXPIRATION_YELLOW}#g;
+ s#__TLS_EXPIRATION_GREEN__#${TLS_EXPIRATION_GREEN}#g;
+ s#\${DS_PROMETHEUS}#ArvadosPromDataSource#g" \
"${f}" > "${GRAFANA_DASHBOARDS_DEST_DIR}"/$(basename "${f}")
done
commit a9435ce3d745bef944e739d672efc9108253a296
Author: Lucas Di Pentima <lucas.dipentima at curii.com>
Date: Wed Oct 25 16:24:01 2023 -0300
20953: Properly pass auth data to HTTPS endpoints that need it.
This makes all HTTP responses green (200) on the grafana dashboard.
Arvados-DCO-1.1-Signed-off-by: Lucas Di Pentima <lucas.dipentima at curii.com>
diff --git a/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls b/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls
index 143097b4a4..e6714ae8a7 100644
--- a/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls
+++ b/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls
@@ -28,9 +28,38 @@ prometheus:
timeout: 5s
http:
valid_http_versions: [HTTP/1.1, HTTP/2]
- valid_status_codes: [] # Default is [200]
+ valid_status_codes: [200]
+ method: GET
+ tls_config:
+ insecure_skip_verify: true # Avoid failures on self-signed certs
fail_if_ssl: false
- fail_if_not_ssl: false
+ fail_if_not_ssl: true
+ http_2xx_mngmt_token:
+ prober: http
+ timeout: 5s
+ http:
+ valid_http_versions: [HTTP/1.1, HTTP/2]
+ valid_status_codes: [200]
+ method: GET
+ bearer_token: __MANAGEMENT_TOKEN__
+ tls_config:
+ insecure_skip_verify: true # Avoid failures on self-signed certs
+ fail_if_ssl: false
+ fail_if_not_ssl: true
+ http_2xx_basic_auth:
+ prober: http
+ timeout: 5s
+ http:
+ valid_http_versions: [HTTP/1.1, HTTP/2]
+ valid_status_codes: [200]
+ method: GET
+ basic_auth:
+ username: "__MONITORING_USERNAME__"
+ password: "__MONITORING_PASSWORD__"
+ tls_config:
+ insecure_skip_verify: true # Avoid failures on self-signed certs
+ fail_if_ssl: false
+ fail_if_not_ssl: true
prometheus:
service:
args:
@@ -57,30 +86,56 @@ prometheus:
params:
module: [http_2xx]
static_configs:
- - targets: ['https://__DOMAIN__']
- labels:
- instance: controller.__CLUSTER__
- targets: ['https://workbench.__DOMAIN__']
labels:
instance: workbench.__CLUSTER__
- targets: ['https://workbench2.__DOMAIN__']
labels:
instance: workbench2.__CLUSTER__
- - targets: ['https://download.__DOMAIN__']
+ - targets: ['https://webshell.__DOMAIN__']
+ labels:
+ instance: webshell.__CLUSTER__
+ relabel_configs:
+ - source_labels: [__address__]
+ target_label: __param_target
+ - source_labels: [__param_target]
+ target_label: instance
+ - target_label: __address__
+ replacement: 127.0.0.1:9115 # blackbox exporter.
+
+ - job_name: http_probe_mngmt_token
+ metrics_path: /probe
+ params:
+ module: [http_2xx_mngmt_token]
+ static_configs:
+ - targets: ['https://__DOMAIN__/_health/ping']
+ labels:
+ instance: controller.__CLUSTER__
+ - targets: ['https://download.__DOMAIN__/_health/ping']
labels:
instance: download.__CLUSTER__
+ - targets: ['https://ws.__DOMAIN__/_health/ping']
+ labels:
+ instance: ws.__CLUSTER__
+ relabel_configs:
+ - source_labels: [__address__]
+ target_label: __param_target
+ - source_labels: [__param_target]
+ target_label: instance
+ - target_label: __address__
+ replacement: 127.0.0.1:9115 # blackbox exporter.
+
+ - job_name: http_probe_basic_auth
+ metrics_path: /probe
+ params:
+ module: [http_2xx_basic_auth]
+ static_configs:
- targets: ['https://grafana.__DOMAIN__']
labels:
instance: grafana.__CLUSTER__
- targets: ['https://prometheus.__DOMAIN__']
labels:
instance: prometheus.__CLUSTER__
- - targets: ['https://webshell.__DOMAIN__']
- labels:
- instance: webshell.__CLUSTER__
- - targets: ['https://ws.__DOMAIN__']
- labels:
- instance: ws.__CLUSTER__
relabel_configs:
- source_labels: [__address__]
target_label: __param_target
commit 85d79eb901f52a2fb10fae4bc64b8f9a18dff781
Author: Lucas Di Pentima <lucas.dipentima at curii.com>
Date: Tue Oct 24 20:29:11 2023 -0300
20953: Adds blackbox-exporter HTTP probes and SSL Monitor grafana dashboard.
Arvados-DCO-1.1-Signed-off-by: Lucas Di Pentima <lucas.dipentima at curii.com>
diff --git a/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json b/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json
new file mode 100644
index 0000000000..92eb5391a7
--- /dev/null
+++ b/tools/salt-install/config_examples/multi_host/aws/dashboards/ssl-certificate-monitor.json
@@ -0,0 +1,606 @@
+{
+ "__inputs": [
+ {
+ "name": "DS_PROMETHEUS",
+ "label": "Prometheus",
+ "description": "",
+ "type": "datasource",
+ "pluginId": "prometheus",
+ "pluginName": "Prometheus"
+ }
+ ],
+ "__elements": {},
+ "__requires": [
+ {
+ "type": "grafana",
+ "id": "grafana",
+ "name": "Grafana",
+ "version": "10.1.5"
+ },
+ {
+ "type": "datasource",
+ "id": "prometheus",
+ "name": "Prometheus",
+ "version": "1.0.0"
+ },
+ {
+ "type": "panel",
+ "id": "table",
+ "name": "Table",
+ "version": ""
+ }
+ ],
+ "annotations": {
+ "list": [
+ {
+ "builtIn": 1,
+ "datasource": {
+ "type": "datasource",
+ "uid": "grafana"
+ },
+ "enable": true,
+ "hide": true,
+ "iconColor": "rgba(0, 211, 255, 1)",
+ "name": "Annotations & Alerts",
+ "type": "dashboard"
+ }
+ ]
+ },
+ "description": "",
+ "editable": true,
+ "fiscalYearStartMonth": 0,
+ "gnetId": 13230,
+ "graphTooltip": 0,
+ "id": null,
+ "links": [],
+ "liveNow": false,
+ "panels": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "description": "",
+ "fieldConfig": {
+ "defaults": {
+ "custom": {
+ "align": "auto",
+ "cellOptions": {
+ "type": "auto"
+ },
+ "filterable": false,
+ "inspect": false
+ },
+ "mappings": [],
+ "thresholds": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "red",
+ "value": 80
+ }
+ ]
+ }
+ },
+ "overrides": [
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "instance"
+ },
+ "properties": [
+ {
+ "id": "custom.width",
+ "value": 500
+ },
+ {
+ "id": "displayName",
+ "value": "Instance"
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #B"
+ },
+ "properties": [
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "lcd",
+ "type": "gauge"
+ }
+ },
+ {
+ "id": "max",
+ "value": 0.5
+ },
+ {
+ "id": "displayName",
+ "value": "Connect Time"
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "#EAB839",
+ "value": 0.2
+ },
+ {
+ "color": "red",
+ "value": 0.4
+ }
+ ]
+ }
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #A"
+ },
+ "properties": [
+ {
+ "id": "decimals",
+ "value": 2
+ },
+ {
+ "id": "displayName",
+ "value": "Certificate expires in"
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "semi-dark-red",
+ "value": null
+ },
+ {
+ "color": "semi-dark-yellow",
+ "value": 12096000
+ },
+ {
+ "color": "semi-dark-green",
+ "value": 25920000
+ }
+ ]
+ }
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "gradient",
+ "type": "color-background"
+ }
+ },
+ {
+ "id": "custom.width",
+ "value": 220
+ },
+ {
+ "id": "custom.align",
+ "value": "left"
+ },
+ {
+ "id": "unit",
+ "value": "dtdurations"
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #D"
+ },
+ "properties": [
+ {
+ "id": "displayName",
+ "value": "HTTP Response"
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "#EAB839",
+ "value": 300
+ },
+ {
+ "color": "red",
+ "value": 400
+ }
+ ]
+ }
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "gradient",
+ "type": "color-background"
+ }
+ },
+ {
+ "id": "custom.align",
+ "value": "center"
+ },
+ {
+ "id": "custom.width",
+ "value": 150
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #C"
+ },
+ "properties": [
+ {
+ "id": "displayName",
+ "value": "Transfer Time"
+ },
+ {
+ "id": "max",
+ "value": 0.5
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "lcd",
+ "type": "gauge"
+ }
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "#EAB839",
+ "value": 0.125
+ },
+ {
+ "color": "red",
+ "value": 0.3
+ }
+ ]
+ }
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #E"
+ },
+ "properties": [
+ {
+ "id": "displayName",
+ "value": "TLS Time"
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "lcd",
+ "type": "gauge"
+ }
+ },
+ {
+ "id": "max",
+ "value": 1
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "#EAB839",
+ "value": 0.5
+ },
+ {
+ "color": "red",
+ "value": 0.9
+ }
+ ]
+ }
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #F"
+ },
+ "properties": [
+ {
+ "id": "displayName",
+ "value": "Processing Time"
+ },
+ {
+ "id": "max",
+ "value": 0.5
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "lcd",
+ "type": "gauge"
+ }
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "#EAB839",
+ "value": 0.25
+ },
+ {
+ "color": "red",
+ "value": 0.4
+ }
+ ]
+ }
+ }
+ ]
+ },
+ {
+ "matcher": {
+ "id": "byName",
+ "options": "Value #G"
+ },
+ "properties": [
+ {
+ "id": "displayName",
+ "value": "Resolve Time"
+ },
+ {
+ "id": "custom.cellOptions",
+ "value": {
+ "mode": "lcd",
+ "type": "gauge"
+ }
+ },
+ {
+ "id": "max",
+ "value": 0.01
+ },
+ {
+ "id": "thresholds",
+ "value": {
+ "mode": "absolute",
+ "steps": [
+ {
+ "color": "green",
+ "value": null
+ },
+ {
+ "color": "#EAB839",
+ "value": 0.005
+ },
+ {
+ "color": "red",
+ "value": 0.009
+ }
+ ]
+ }
+ }
+ ]
+ }
+ ]
+ },
+ "gridPos": {
+ "h": 22,
+ "w": 24,
+ "x": 0,
+ "y": 0
+ },
+ "id": 2,
+ "options": {
+ "cellHeight": "sm",
+ "footer": {
+ "countRows": false,
+ "fields": "",
+ "reducer": [
+ "sum"
+ ],
+ "show": false
+ },
+ "frameIndex": 1,
+ "showHeader": true,
+ "sortBy": [
+ {
+ "desc": false,
+ "displayName": "Certificate expires in"
+ }
+ ]
+ },
+ "pluginVersion": "10.1.5",
+ "targets": [
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_ssl_earliest_cert_expiry-time()",
+ "format": "table",
+ "hide": false,
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "A"
+ },
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_http_status_code",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "D"
+ },
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_http_duration_seconds{phase=\"resolve\"}",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "G"
+ },
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_http_duration_seconds{phase=\"connect\"}",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "B"
+ },
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_http_duration_seconds{phase=\"tls\"}",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "E"
+ },
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_http_duration_seconds{phase=\"processing\"}",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "F"
+ },
+ {
+ "datasource": {
+ "type": "prometheus",
+ "uid": "${DS_PROMETHEUS}"
+ },
+ "expr": "probe_http_duration_seconds{phase=\"transfer\"}",
+ "format": "table",
+ "instant": true,
+ "interval": "",
+ "legendFormat": "",
+ "refId": "C"
+ }
+ ],
+ "title": "Certificate & Connection Monitoring",
+ "transformations": [
+ {
+ "id": "seriesToColumns",
+ "options": {
+ "byField": "instance"
+ }
+ },
+ {
+ "id": "organize",
+ "options": {
+ "excludeByName": {
+ "Time": true,
+ "Time 1": true,
+ "Time 2": true,
+ "Time 3": true,
+ "Time 4": true,
+ "Time 5": true,
+ "Time 6": true,
+ "Time 7": true,
+ "__name__": true,
+ "__name__ 1": true,
+ "__name__ 2": true,
+ "__name__ 3": true,
+ "__name__ 4": true,
+ "__name__ 5": true,
+ "__name__ 6": true,
+ "job": true,
+ "job 1": true,
+ "job 2": true,
+ "job 3": true,
+ "job 4": true,
+ "job 5": true,
+ "job 6": true,
+ "job 7": true,
+ "phase": true,
+ "phase 1": true,
+ "phase 2": true,
+ "phase 3": true,
+ "phase 4": true,
+ "phase 5": true
+ },
+ "indexByName": {},
+ "renameByName": {}
+ }
+ }
+ ],
+ "type": "table"
+ }
+ ],
+ "refresh": "",
+ "schemaVersion": 38,
+ "style": "dark",
+ "tags": [],
+ "templating": {
+ "list": []
+ },
+ "time": {
+ "from": "now-6h",
+ "to": "now"
+ },
+ "timepicker": {},
+ "timezone": "",
+ "title": "SSL Certificate Monitor",
+ "uid": "r8eWoHpGz",
+ "version": 4,
+ "weekStart": ""
+ }
\ No newline at end of file
diff --git a/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls b/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls
index 26877f35df..143097b4a4 100644
--- a/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls
+++ b/tools/salt-install/config_examples/multi_host/aws/pillars/prometheus_server.sls
@@ -14,10 +14,23 @@ prometheus:
- prometheus
- alertmanager
- node_exporter
+ - blackbox_exporter
pkg:
use_upstream_repo: false
use_upstream_archive: true
component:
+ blackbox_exporter:
+ config_file: /etc/prometheus/blackbox_exporter.yml
+ config:
+ modules:
+ http_2xx:
+ prober: http
+ timeout: 5s
+ http:
+ valid_http_versions: [HTTP/1.1, HTTP/2]
+ valid_status_codes: [] # Default is [200]
+ fail_if_ssl: false
+ fail_if_not_ssl: false
prometheus:
service:
args:
@@ -39,6 +52,43 @@ prometheus:
instance: mon.__CLUSTER__
cluster: __CLUSTER__
+ - job_name: http_probe
+ metrics_path: /probe
+ params:
+ module: [http_2xx]
+ static_configs:
+ - targets: ['https://__DOMAIN__']
+ labels:
+ instance: controller.__CLUSTER__
+ - targets: ['https://workbench.__DOMAIN__']
+ labels:
+ instance: workbench.__CLUSTER__
+ - targets: ['https://workbench2.__DOMAIN__']
+ labels:
+ instance: workbench2.__CLUSTER__
+ - targets: ['https://download.__DOMAIN__']
+ labels:
+ instance: download.__CLUSTER__
+ - targets: ['https://grafana.__DOMAIN__']
+ labels:
+ instance: grafana.__CLUSTER__
+ - targets: ['https://prometheus.__DOMAIN__']
+ labels:
+ instance: prometheus.__CLUSTER__
+ - targets: ['https://webshell.__DOMAIN__']
+ labels:
+ instance: webshell.__CLUSTER__
+ - targets: ['https://ws.__DOMAIN__']
+ labels:
+ instance: ws.__CLUSTER__
+ relabel_configs:
+ - source_labels: [__address__]
+ target_label: __param_target
+ - source_labels: [__param_target]
+ target_label: instance
+ - target_label: __address__
+ replacement: 127.0.0.1:9115 # blackbox exporter.
+
## Arvados unique jobs
- job_name: arvados_ws
bearer_token: __MANAGEMENT_TOKEN__
-----------------------------------------------------------------------
hooks/post-receive
--
More information about the arvados-commits
mailing list