From 8cc06e30578ed595edd075792c44a98eecdf530a Mon Sep 17 00:00:00 2001 From: Stefan Benz Date: Wed, 29 Jan 2020 16:14:55 +0100 Subject: [PATCH 1/2] fix(loki): added default retention of chuncks for loki --- .../applications/loki/helm/default.go | 12 +++++++---- .../applications/loki/helm/values.go | 21 ++++++++++++------- 2 files changed, 21 insertions(+), 12 deletions(-) diff --git a/internal/bundle/application/applications/loki/helm/default.go b/internal/bundle/application/applications/loki/helm/default.go index 49e92d0..d89ba97 100644 --- a/internal/bundle/application/applications/loki/helm/default.go +++ b/internal/bundle/application/applications/loki/helm/default.go @@ -27,13 +27,17 @@ func DefaultValues(imageTags map[string]string) *Values { SchemaConfig: &SchemaConfigs{ Configs: []*SchemaConfig{ &SchemaConfig{ - From: "2018-04-15", + From: "2000-01-01", Store: "boltdb", ObjectStore: "filesystem", Schema: "v9", Index: &Index{ Prefix: "index_", - Period: "168h", + Period: "24h", + }, + Chunks: &Chunks{ + Prefix: "chunk_", + Period: "24h", }, }, }, @@ -50,11 +54,11 @@ func DefaultValues(imageTags map[string]string) *Values { }, }, ChunkStoreConfig: &ChunkStoreConfig{ - MaxLookBackPeriod: 0, + MaxLookBackPeriod: "168h", }, TableManager: &TableManager{ RetentionDeletesEnabled: false, - RetentionPeriod: 0, + RetentionPeriod: "336h", }, }, Image: &Image{ diff --git a/internal/bundle/application/applications/loki/helm/values.go b/internal/bundle/application/applications/loki/helm/values.go index d36835d..8bd6a30 100644 --- a/internal/bundle/application/applications/loki/helm/values.go +++ b/internal/bundle/application/applications/loki/helm/values.go @@ -28,12 +28,17 @@ type Index struct { Prefix string `yaml:"prefix"` Period string `yaml:"period"` } +type Chunks struct { + Prefix string `yaml:"prefix"` + Period string `yaml:"period"` +} type SchemaConfig struct { - From string `yaml:"from"` - Store string `yaml:"store"` - ObjectStore string `yaml:"object_store"` - Schema string `yaml:"schema"` - Index *Index `yaml:"index"` + From string `yaml:"from"` + Store string `yaml:"store"` + ObjectStore string `yaml:"object_store"` + Schema string `yaml:"schema"` + Index *Index `yaml:"index"` + Chunks *Chunks `yaml:"chunks"` } type SchemaConfigs struct { Configs []*SchemaConfig `yaml:"configs"` @@ -52,11 +57,11 @@ type StorageConfig struct { Filesystem *Filesystem `yaml:"filesystem"` } type ChunkStoreConfig struct { - MaxLookBackPeriod int `yaml:"max_look_back_period"` + MaxLookBackPeriod string `yaml:"max_look_back_period"` } type TableManager struct { - RetentionDeletesEnabled bool `yaml:"retention_deletes_enabled"` - RetentionPeriod int `yaml:"retention_period"` + RetentionDeletesEnabled bool `yaml:"retention_deletes_enabled"` + RetentionPeriod string `yaml:"retention_period"` } type Config struct { AuthEnabled bool `yaml:"auth_enabled"` From 15933f75828ba5bf304691da1f22bd99bdb6c271 Mon Sep 17 00:00:00 2001 From: Stefan Benz Date: Wed, 29 Jan 2020 17:28:44 +0100 Subject: [PATCH 2/2] fix(grafana): fixed dashboards and added necessary plugin --- dashboards/kubelet/json/kubelet.json | 108 ++-- .../json/persistentvolumesusage.json | 490 ++++++++++++++++++ .../persistentvolumesusage/kustomization.yaml | 12 + .../applications/grafana/config/dashboards.go | 22 +- .../applications/grafana/helm/default.go | 1 + .../applications/grafana/helm/values.go | 1 + 6 files changed, 573 insertions(+), 61 deletions(-) create mode 100644 dashboards/persistentvolumesusage/json/persistentvolumesusage.json create mode 100644 dashboards/persistentvolumesusage/kustomization.yaml diff --git a/dashboards/kubelet/json/kubelet.json b/dashboards/kubelet/json/kubelet.json index 2726a93..25a99f4 100644 --- a/dashboards/kubelet/json/kubelet.json +++ b/dashboards/kubelet/json/kubelet.json @@ -73,7 +73,7 @@ "tableColumn": "", "targets": [ { - "expr": "sum(up{cluster=\"$cluster\", job=\"kubelet\"})", + "expr": "sum(up{cluster=\"$cluster\", job=\"kubernetes-nodes\"})", "format": "time_series", "intervalFactor": 2, "legendFormat": "", @@ -153,10 +153,10 @@ "tableColumn": "", "targets": [ { - "expr": "sum(kubelet_running_pod_count{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"})", + "expr": "sum(kubelet_running_pod_count{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"})", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -233,10 +233,10 @@ "tableColumn": "", "targets": [ { - "expr": "sum(kubelet_running_container_count{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"})", + "expr": "sum(kubelet_running_container_count{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"})", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -313,10 +313,10 @@ "tableColumn": "", "targets": [ { - "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\", state=\"actual_state_of_world\"})", + "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\", state=\"actual_state_of_world\"})", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -393,10 +393,10 @@ "tableColumn": "", "targets": [ { - "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\",state=\"desired_state_of_world\"})", + "expr": "sum(volume_manager_total_volumes{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\",state=\"desired_state_of_world\"})", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -473,10 +473,10 @@ "tableColumn": "", "targets": [ { - "expr": "sum(rate(kubelet_node_config_error{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"}[5m]))", + "expr": "sum(rate(kubelet_node_config_error{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"}[5m]))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -545,10 +545,10 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(kubelet_runtime_operations_total{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (operation_type, instance)", + "expr": "sum(rate(kubelet_runtime_operations_total{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (operation_type, instance)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_type}}`}}", + "legendFormat": "{{instance}} {{operation_type}}", "refId": "A" } ], @@ -624,10 +624,10 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(kubelet_runtime_operations_errors_total{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, operation_type)", + "expr": "sum(rate(kubelet_runtime_operations_errors_total{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, operation_type)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_type}}`}}", + "legendFormat": "{{instance}} {{operation_type}}", "refId": "A" } ], @@ -716,10 +716,10 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(kubelet_runtime_operations_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, operation_type, le))", + "expr": "histogram_quantile(0.99, sum(rate(kubelet_runtime_operations_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, operation_type, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_type}}`}}", + "legendFormat": "{{instance}} {{operation_type}}", "refId": "A" } ], @@ -808,17 +808,17 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(kubelet_pod_start_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance)", + "expr": "sum(rate(kubelet_pod_start_duration_seconds_count{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} pod", + "legendFormat": "{{instance}} pod", "refId": "A" }, { - "expr": "sum(rate(kubelet_pod_worker_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance)", + "expr": "sum(rate(kubelet_pod_worker_duration_seconds_count{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} worker", + "legendFormat": "{{instance}} worker", "refId": "B" } ], @@ -894,17 +894,17 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_start_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, le))", + "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_start_duration_seconds_count{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} pod", + "legendFormat": "{{instance}} pod", "refId": "A" }, { - "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_worker_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, le))", + "expr": "histogram_quantile(0.99, sum(rate(kubelet_pod_worker_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} worker", + "legendFormat": "{{instance}} worker", "refId": "B" } ], @@ -995,10 +995,10 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(storage_operation_duration_seconds_count{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin)", + "expr": "sum(rate(storage_operation_duration_seconds_count{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_name}}`}} {{`{{volume_plugin}}`}}", + "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}", "refId": "A" } ], @@ -1076,10 +1076,10 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(storage_operation_errors_total{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin)", + "expr": "sum(rate(storage_operation_errors_total{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_name}}`}} {{`{{volume_plugin}}`}}", + "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}", "refId": "A" } ], @@ -1170,10 +1170,10 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(storage_operation_duration_seconds_bucket{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin, le))", + "expr": "histogram_quantile(0.99, sum(rate(storage_operation_duration_seconds_bucket{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"}[5m])) by (instance, operation_name, volume_plugin, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_name}}`}} {{`{{volume_plugin}}`}}", + "legendFormat": "{{instance}} {{operation_name}} {{volume_plugin}}", "refId": "A" } ], @@ -1262,10 +1262,10 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(kubelet_cgroup_manager_duration_seconds_count{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"}[5m])) by (instance, operation_type)", + "expr": "sum(rate(kubelet_cgroup_manager_duration_seconds_count{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"}[5m])) by (instance, operation_type)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{operation_type}}`}}", + "legendFormat": "{{operation_type}}", "refId": "A" } ], @@ -1341,10 +1341,10 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(kubelet_cgroup_manager_duration_seconds_bucket{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"}[5m])) by (instance, operation_type, le))", + "expr": "histogram_quantile(0.99, sum(rate(kubelet_cgroup_manager_duration_seconds_bucket{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"}[5m])) by (instance, operation_type, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{operation_type}}`}}", + "legendFormat": "{{instance}} {{operation_type}}", "refId": "A" } ], @@ -1434,10 +1434,10 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(kubelet_pleg_relist_duration_seconds_count{cluster=\"$cluster\", job=\"kubelet\", instance=~\"$instance\"}[5m])) by (instance)", + "expr": "sum(rate(kubelet_pleg_relist_duration_seconds_count{cluster=\"$cluster\", job=\"kubernetes-nodes\", instance=~\"$instance\"}[5m])) by (instance)", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -1513,10 +1513,10 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_interval_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, le))", + "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_interval_seconds_bucket{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -1605,10 +1605,10 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])) by (instance, le))", + "expr": "histogram_quantile(0.99, sum(rate(kubelet_pleg_relist_duration_seconds_bucket{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])) by (instance, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -1697,28 +1697,28 @@ "steppedLine": false, "targets": [ { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", instance=~\"$instance\",code=~\"2..\"}[5m]))", + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubernetes-nodes\", instance=~\"$instance\",code=~\"2..\"}[5m]))", "format": "time_series", "intervalFactor": 2, "legendFormat": "2xx", "refId": "A" }, { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", instance=~\"$instance\",code=~\"3..\"}[5m]))", + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubernetes-nodes\", instance=~\"$instance\",code=~\"3..\"}[5m]))", "format": "time_series", "intervalFactor": 2, "legendFormat": "3xx", "refId": "B" }, { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", instance=~\"$instance\",code=~\"4..\"}[5m]))", + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubernetes-nodes\", instance=~\"$instance\",code=~\"4..\"}[5m]))", "format": "time_series", "intervalFactor": 2, "legendFormat": "4xx", "refId": "C" }, { - "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubelet\", instance=~\"$instance\",code=~\"5..\"}[5m]))", + "expr": "sum(rate(rest_client_requests_total{cluster=\"$cluster\",job=\"kubernetes-nodes\", instance=~\"$instance\",code=~\"5..\"}[5m]))", "format": "time_series", "intervalFactor": 2, "legendFormat": "5xx", @@ -1810,10 +1810,10 @@ "steppedLine": false, "targets": [ { - "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_latency_seconds_bucket{cluster=\"$cluster\",job=\"kubelet\", instance=~\"$instance\"}[5m])) by (instance, verb, url, le))", + "expr": "histogram_quantile(0.99, sum(rate(rest_client_request_latency_seconds_bucket{cluster=\"$cluster\",job=\"kubernetes-nodes\", instance=~\"$instance\"}[5m])) by (instance, verb, url, le))", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}} {{`{{verb}}`}} {{`{{url}}`}}", + "legendFormat": "{{instance}} {{verb}} {{url}}", "refId": "A" } ], @@ -1902,10 +1902,10 @@ "steppedLine": false, "targets": [ { - "expr": "process_resident_memory_bytes{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}", + "expr": "process_resident_memory_bytes{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -1981,10 +1981,10 @@ "steppedLine": false, "targets": [ { - "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}[5m])", + "expr": "rate(process_cpu_seconds_total{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}[5m])", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -2060,10 +2060,10 @@ "steppedLine": false, "targets": [ { - "expr": "go_goroutines{cluster=\"$cluster\",job=\"kubelet\",instance=~\"$instance\"}", + "expr": "go_goroutines{cluster=\"$cluster\",job=\"kubernetes-nodes\",instance=~\"$instance\"}", "format": "time_series", "intervalFactor": 2, - "legendFormat": "{{`{{instance}}`}}", + "legendFormat": "{{instance}}", "refId": "A" } ], @@ -2164,7 +2164,7 @@ "multi": false, "name": "instance", "options": [], - "query": "label_values(kubelet_runtime_operations{cluster=\"$cluster\", job=\"kubelet\"}, instance)", + "query": "label_values(kubelet_runtime_operations{cluster=\"$cluster\", job=\"kubernetes-nodes\"}, instance)", "refresh": 2, "regex": "", "sort": 1, diff --git a/dashboards/persistentvolumesusage/json/persistentvolumesusage.json b/dashboards/persistentvolumesusage/json/persistentvolumesusage.json new file mode 100644 index 0000000..64db342 --- /dev/null +++ b/dashboards/persistentvolumesusage/json/persistentvolumesusage.json @@ -0,0 +1,490 @@ +{ + "__inputs": [], + "__requires": [], + "annotations": { + "list": [] + }, + "editable": false, + "gnetId": null, + "graphTooltip": 0, + "hideControls": false, + "id": null, + "links": [], + "refresh": "", + "rows": [ + { + "collapse": false, + "collapsed": false, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$datasource", + "fill": 1, + "gridPos": {}, + "id": 2, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "repeat": null, + "seriesOverrides": [], + "spaceLength": 10, + "span": 9, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "(\n sum without(instance, node) (kubelet_volume_stats_capacity_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n -\n sum without(instance, node) (kubelet_volume_stats_available_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n)\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Used Space", + "refId": "A" + }, + { + "expr": "sum without(instance, node) (kubelet_volume_stats_available_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Free Space", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Volume Space Usage", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "bytes", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ] + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "$datasource", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": {}, + "id": 3, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "span": 3, + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "(\n kubelet_volume_stats_capacity_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n -\n kubelet_volume_stats_available_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n)\n/\nkubelet_volume_stats_capacity_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n* 100\n", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "80, 90", + "title": "Volume Space Usage", + "tooltip": { + "shared": false + }, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + } + ], + "repeat": null, + "repeatIteration": null, + "repeatRowId": null, + "showTitle": false, + "title": "Dashboard Row", + "titleSize": "h6", + "type": "row" + }, + { + "collapse": false, + "collapsed": false, + "panels": [ + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": "$datasource", + "fill": 1, + "gridPos": {}, + "id": 4, + "legend": { + "alignAsTable": true, + "avg": true, + "current": true, + "max": true, + "min": true, + "rightSide": false, + "show": true, + "total": false, + "values": true + }, + "lines": true, + "linewidth": 1, + "links": [], + "nullPointMode": "null", + "percentage": false, + "pointradius": 5, + "points": false, + "renderer": "flot", + "repeat": null, + "seriesOverrides": [], + "spaceLength": 10, + "span": 9, + "stack": true, + "steppedLine": false, + "targets": [ + { + "expr": "sum without(instance, node) (kubelet_volume_stats_inodes_used{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": "Used inodes", + "refId": "A" + }, + { + "expr": "(\n sum without(instance, node) (kubelet_volume_stats_inodes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n -\n sum without(instance, node) (kubelet_volume_stats_inodes_used{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"})\n)\n", + "format": "time_series", + "intervalFactor": 1, + "legendFormat": " Free inodes", + "refId": "B" + } + ], + "thresholds": [], + "timeFrom": null, + "timeShift": null, + "title": "Volume inodes Usage", + "tooltip": { + "shared": false, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "buckets": null, + "mode": "time", + "name": null, + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + }, + { + "format": "none", + "label": null, + "logBase": 1, + "max": null, + "min": 0, + "show": true + } + ] + }, + { + "cacheTimeout": null, + "colorBackground": false, + "colorValue": false, + "colors": [ + "rgba(50, 172, 45, 0.97)", + "rgba(237, 129, 40, 0.89)", + "rgba(245, 54, 54, 0.9)" + ], + "datasource": "$datasource", + "format": "percent", + "gauge": { + "maxValue": 100, + "minValue": 0, + "show": true, + "thresholdLabels": false, + "thresholdMarkers": true + }, + "gridPos": {}, + "id": 5, + "interval": null, + "links": [], + "mappingType": 1, + "mappingTypes": [ + { + "name": "value to text", + "value": 1 + }, + { + "name": "range to text", + "value": 2 + } + ], + "maxDataPoints": 100, + "nullPointMode": "connected", + "nullText": null, + "postfix": "", + "postfixFontSize": "50%", + "prefix": "", + "prefixFontSize": "50%", + "rangeMaps": [ + { + "from": "null", + "text": "N/A", + "to": "null" + } + ], + "span": 3, + "sparkline": { + "fillColor": "rgba(31, 118, 189, 0.18)", + "full": false, + "lineColor": "rgb(31, 120, 193)", + "show": false + }, + "tableColumn": "", + "targets": [ + { + "expr": "kubelet_volume_stats_inodes_used{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n/\nkubelet_volume_stats_inodes{job=\"kubernetes-nodes\", namespace=\"$namespace\", persistentvolumeclaim=\"$volume\"}\n* 100\n", + "format": "time_series", + "intervalFactor": 2, + "legendFormat": "", + "refId": "A" + } + ], + "thresholds": "80, 90", + "title": "Volume inodes Usage", + "tooltip": { + "shared": false + }, + "type": "singlestat", + "valueFontSize": "80%", + "valueMaps": [ + { + "op": "=", + "text": "N/A", + "value": "null" + } + ], + "valueName": "current" + } + ], + "repeat": null, + "repeatIteration": null, + "repeatRowId": null, + "showTitle": false, + "title": "Dashboard Row", + "titleSize": "h6", + "type": "row" + } + ], + "schemaVersion": 14, + "style": "dark", + "tags": [ + "kubernetes-mixin" + ], + "templating": { + "list": [ + { + "current": { + "text": "Prometheus", + "value": "Prometheus" + }, + "hide": 0, + "label": null, + "name": "datasource", + "options": [], + "query": "prometheus", + "refresh": 1, + "regex": "", + "type": "datasource" + }, + { + "allValue": null, + "current": {}, + "datasource": "$datasource", + "hide": 2, + "includeAll": false, + "label": "cluster", + "multi": false, + "name": "cluster", + "options": [], + "query": "label_values(kubelet_volume_stats_capacity_bytes, cluster)", + "refresh": 2, + "regex": "", + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$datasource", + "hide": 0, + "includeAll": false, + "label": "Namespace", + "multi": false, + "name": "namespace", + "options": [], + "query": "label_values(kubelet_volume_stats_capacity_bytes{job=\"kubernetes-nodes\"}, namespace)", + "refresh": 2, + "regex": "", + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": null, + "current": {}, + "datasource": "$datasource", + "hide": 0, + "includeAll": false, + "label": "PersistentVolumeClaim", + "multi": false, + "name": "volume", + "options": [], + "query": "label_values(kubelet_volume_stats_capacity_bytes{job=\"kubernetes-nodes\", namespace=\"$namespace\"}, persistentvolumeclaim)", + "refresh": 2, + "regex": "", + "sort": 1, + "tagValuesQuery": "", + "tags": [], + "tagsQuery": "", + "type": "query", + "useTags": false + } + ] + }, + "time": { + "from": "now-7d", + "to": "now" + }, + "timepicker": { + "refresh_intervals": [ + "5s", + "10s", + "30s", + "1m", + "5m", + "15m", + "30m", + "1h", + "2h", + "1d" + ], + "time_options": [ + "5m", + "15m", + "1h", + "6h", + "12h", + "24h", + "2d", + "7d", + "30d" + ] + }, + "timezone": "", + "title": "Kubernetes / Persistent Volumes", + "uid": "919b92a8e8041bd567af9edab12c840c", + "version": 0 +} \ No newline at end of file diff --git a/dashboards/persistentvolumesusage/kustomization.yaml b/dashboards/persistentvolumesusage/kustomization.yaml new file mode 100644 index 0000000..1e549d9 --- /dev/null +++ b/dashboards/persistentvolumesusage/kustomization.yaml @@ -0,0 +1,12 @@ +apiVersion: kustomize.config.k8s.io/v1beta1 +kind: Kustomization + +namespace: caos-system + +configMapGenerator: +- name: grafana-persistentvolumesusage + files: + - json/persistentvolumesusage.json + +generatorOptions: + disableNameSuffixHash: true diff --git a/internal/bundle/application/applications/grafana/config/dashboards.go b/internal/bundle/application/applications/grafana/config/dashboards.go index b109793..6ceb69d 100644 --- a/internal/bundle/application/applications/grafana/config/dashboards.go +++ b/internal/bundle/application/applications/grafana/config/dashboards.go @@ -57,12 +57,20 @@ func getGrafanaDashboards(dashboardsfolder string, toolsetCRDSpec *toolsetsv1bet providers = append(providers, provider) } - // provider := &ConfigProvider{ - // ConfigMaps: []string{ - // "grafana-dashboard-kubelet", - // }, - // Folder: filepath.Join(dashboardsfolder, "kubelet"), - // } - // providers = append(providers, provider) + provider := &Provider{ + ConfigMaps: []string{ + "grafana-dashboard-kubelet", + }, + Folder: filepath.Join(dashboardsfolder, "kubelet"), + } + providers = append(providers, provider) + + provider = &Provider{ + ConfigMaps: []string{ + "grafana-persistentvolumesusage", + }, + Folder: filepath.Join(dashboardsfolder, "persistentvolumesusage"), + } + providers = append(providers, provider) return providers } diff --git a/internal/bundle/application/applications/grafana/helm/default.go b/internal/bundle/application/applications/grafana/helm/default.go index 7124871..f6aab85 100644 --- a/internal/bundle/application/applications/grafana/helm/default.go +++ b/internal/bundle/application/applications/grafana/helm/default.go @@ -24,6 +24,7 @@ func DefaultValues(imageTags map[string]string) *Values { ServiceMonitor: &ServiceMonitor{ SelfMonitor: false, }, + Plugins: []string{"grafana-piechart-panel"}, } return &Values{ diff --git a/internal/bundle/application/applications/grafana/helm/values.go b/internal/bundle/application/applications/grafana/helm/values.go index 2c4c435..730ecbd 100644 --- a/internal/bundle/application/applications/grafana/helm/values.go +++ b/internal/bundle/application/applications/grafana/helm/values.go @@ -74,6 +74,7 @@ type GrafanaValues struct { ServiceMonitor *ServiceMonitor `yaml:"serviceMonitor"` DashboardProviders *DashboardProviders `yaml:"dashboardProviders,omitempty"` DashboardsConfigMaps map[string]string `yaml:"dashboardsConfigMaps,omitempty"` + Plugins []string `yaml:"plugins,omitempty"` } type Rules struct {