diff --git a/caas/kubernetes/node/README.md b/caas/kubernetes/node/README.md index bf18a5b3..540c7a1f 100644 --- a/caas/kubernetes/node/README.md +++ b/caas/kubernetes/node/README.md @@ -17,15 +17,15 @@ module "datadog-monitors-caas-kubernetes-node" { Creates DataDog monitors with the following checks: -- Kubernetes Node Disk pressure -- Kubernetes Node Frequent unregister net device -- Kubernetes Node Kubelet API does not respond -- Kubernetes Node Kubelet sync loop that updates containers does not work -- Kubernetes Node Memory pressure -- Kubernetes Node not ready -- Kubernetes Node unschedulable -- Kubernetes Node volume inodes usage -- Kubernetes Node volume space usage +- Kubernetes Node {{kube_node}} disk pressure on {{kube_cluster_name}} +- Kubernetes Node {{kube_node}} frequent unregister net device +- Kubernetes Node {{kube_node}} Kubelet API does not respond on {{kube_cluster_name}} +- Kubernetes Node {{kube_node}} Kubelet sync loop that updates containers does not work on {{kube_cluster_name}} +- Kubernetes Node {{kube_node}} memory pressure on {{kube_cluster_name}} +- Kubernetes Node {{kube_node}} not ready on {{kube_cluster_name}} +- Kubernetes Node {{kube_node}} unschedulable on {{kube_cluster_name}} +- Kubernetes Node volume {{persistentvolumeclaim}} inodes usage +- Kubernetes Node volume {{persistentvolumeclaim}} space usage ## Requirements diff --git a/caas/kubernetes/node/monitors-k8s-node.tf b/caas/kubernetes/node/monitors-k8s-node.tf index 804ea2f7..d5584127 100644 --- a/caas/kubernetes/node/monitors-k8s-node.tf +++ b/caas/kubernetes/node/monitors-k8s-node.tf @@ -1,6 +1,6 @@ resource "datadog_monitor" "disk_pressure" { count = var.disk_pressure_enabled == "true" ? 1 : 0 - name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node Disk pressure" + name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node {{kube_node}} disk pressure on {{kube_cluster_name}}" message = coalesce(var.disk_pressure_message, var.message) type = "service check" @@ -27,7 +27,7 @@ EOQ resource "datadog_monitor" "memory_pressure" { count = var.memory_pressure_enabled == "true" ? 1 : 0 - name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node Memory pressure" + name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node {{kube_node}} memory pressure on {{kube_cluster_name}}" message = coalesce(var.memory_pressure_message, var.message) type = "service check" @@ -54,7 +54,7 @@ EOQ resource "datadog_monitor" "ready" { count = var.ready_enabled == "true" ? 1 : 0 - name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node not ready" + name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node {{kube_node}} not ready on {{kube_cluster_name}}" message = coalesce(var.ready_message, var.message) type = "service check" @@ -81,12 +81,12 @@ EOQ resource "datadog_monitor" "kubelet_ping" { count = var.kubelet_ping_enabled == "true" ? 1 : 0 - name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node Kubelet API does not respond" + name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Node {{kube_node}} Kubelet API does not respond on {{kube_cluster_name}}" message = coalesce(var.kubelet_ping_message, var.message) type = "service check" query = < ## Requirements diff --git a/caas/kubernetes/pod/monitors-k8s-pod.tf b/caas/kubernetes/pod/monitors-k8s-pod.tf index 16f8383f..960d0bd3 100644 --- a/caas/kubernetes/pod/monitors-k8s-pod.tf +++ b/caas/kubernetes/pod/monitors-k8s-pod.tf @@ -119,7 +119,7 @@ EOQ resource "datadog_monitor" "pod_frequently_restarted" { count = var.pod_frequently_restarted_enabled == "true" ? 1 : 0 - name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes pods in {{kube_replica_set}} frequently restarted on {{kube_cluster_name}}" + name = "${var.prefix_slug == "" ? "" : "[${var.prefix_slug}]"}[${var.environment}] Kubernetes Pods in {{kube_replica_set}} frequently restarted on {{kube_cluster_name}}" message = coalesce(var.pod_frequently_restarted_message, var.message) type = "metric alert"