Skip to content

Commit 1dedbb9

Browse files
authored
Merge pull request #1 from kabisa/kubernetes-alert-updates
updating alerts to v0.5 and replicaset unavailable fix for replicaset…
2 parents a7ac6bb + b39d80b commit 1dedbb9

17 files changed

+210
-20
lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
.terraform

daemonset-incomplete-variables.tf

Lines changed: 27 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,8 @@ variable "daemonset_incomplete_enabled" {
44
}
55

66
variable "daemonset_incomplete_critical" {
7-
type = number
8-
default = 0
7+
type = number
8+
default = 0
99
description = "alert is raised when (desired - running) > daemonset_incomplete_critical"
1010
}
1111

@@ -38,3 +38,28 @@ variable "daemonset_incomplete_alerting_enabled" {
3838
type = bool
3939
default = true
4040
}
41+
42+
variable "daemonset_incomplete_no_data_timeframe" {
43+
type = number
44+
default = null
45+
}
46+
47+
variable "daemonset_incomplete_notify_no_data" {
48+
type = bool
49+
default = false
50+
}
51+
52+
variable "daemonset_incomplete_ok_threshold" {
53+
type = number
54+
default = null
55+
}
56+
57+
variable "daemonset_incomplete_name_prefix" {
58+
type = string
59+
default = ""
60+
}
61+
62+
variable "daemonset_incomplete_name_suffix" {
63+
type = string
64+
default = ""
65+
}

daemonset-incomplete.tf

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ locals {
66
}
77

88
module "daemonset_incomplete" {
9-
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.2"
9+
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.5"
1010

1111
name = "Daemonset Incomplete"
1212
query = "min(${var.daemonset_incomplete_evaluation_period}):max:kubernetes_state.daemonset.scheduled{${local.daemonset_incomplete_filter}} by {daemonset,cluster_name} - min:kubernetes_state.daemonset.ready{${local.daemonset_incomplete_filter}} by {daemonset,cluster_name} > 0"
@@ -29,4 +29,5 @@ module "daemonset_incomplete" {
2929
require_full_window = true
3030

3131
critical_threshold = var.daemonset_incomplete_critical
32+
locked = var.locked
3233
}

hpa-status-variables.tf

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,3 +32,28 @@ variable "hpa_status_alerting_enabled" {
3232
type = bool
3333
default = true
3434
}
35+
36+
variable "hpa_status_no_data_timeframe" {
37+
type = number
38+
default = null
39+
}
40+
41+
variable "hpa_status_notify_no_data" {
42+
type = bool
43+
default = false
44+
}
45+
46+
variable "hpa_status_ok_threshold" {
47+
type = number
48+
default = null
49+
}
50+
51+
variable "hpa_status_name_prefix" {
52+
type = string
53+
default = ""
54+
}
55+
56+
variable "hpa_status_name_suffix" {
57+
type = string
58+
default = ""
59+
}

hpa-status.tf

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,13 +1,13 @@
11
locals {
22
hpa_status_filter = (
33
var.hpa_status_filter_override != ""
4-
? var.hpa_status_filter_override
5-
: var.filter_str
4+
? var.hpa_status_filter_override
5+
: var.filter_str
66
)
77
}
88

99
module "hpa_status" {
10-
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.2"
10+
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.5"
1111

1212
name = "HPA Status not OK"
1313
query = "avg(${var.hpa_status_evaluation_period}):avg:kubernetes_state.hpa.condition{${local.hpa_status_filter}} by {hpa,kube_namespace,status,condition} < 1"
@@ -30,4 +30,5 @@ module "hpa_status" {
3030
require_full_window = false
3131

3232
critical_threshold = 1
33+
locked = var.locked
3334
}

node-memory-used-percent-variables.tf

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -44,3 +44,28 @@ variable "node_memory_used_percent_alerting_enabled" {
4444
type = bool
4545
default = true
4646
}
47+
48+
variable "node_memory_used_percent_no_data_timeframe" {
49+
type = number
50+
default = null
51+
}
52+
53+
variable "node_memory_used_percent_notify_no_data" {
54+
type = bool
55+
default = false
56+
}
57+
58+
variable "node_memory_used_percent_ok_threshold" {
59+
type = number
60+
default = null
61+
}
62+
63+
variable "node_memory_used_percent_name_prefix" {
64+
type = string
65+
default = ""
66+
}
67+
68+
variable "node_memory_used_percent_name_suffix" {
69+
type = string
70+
default = ""
71+
}

node-memory-used-percent.tf

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ locals {
66
}
77

88
module "node_memory_used_percent" {
9-
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.2"
9+
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.5"
1010

1111
name = "Memory Used Percent"
1212
query = "avg(${var.node_memory_used_percent_evaluation_period}):( 100 * max:kubernetes.memory.usage{${local.node_memory_used_percent_filter}} by {host,cluster_name} ) / max:kubernetes.memory.capacity{${local.node_memory_used_percent_filter}} by {host,cluster_name} > ${var.node_memory_used_percent_critical}"
@@ -30,4 +30,5 @@ module "node_memory_used_percent" {
3030

3131
critical_threshold = var.node_memory_used_percent_critical
3232
warning_threshold = var.node_memory_used_percent_warning
33+
locked = var.locked
3334
}

node-status-variables.tf

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,3 +32,28 @@ variable "node_status_alerting_enabled" {
3232
type = bool
3333
default = true
3434
}
35+
36+
variable "node_status_no_data_timeframe" {
37+
type = number
38+
default = null
39+
}
40+
41+
variable "node_status_notify_no_data" {
42+
type = bool
43+
default = false
44+
}
45+
46+
variable "node_status_ok_threshold" {
47+
type = number
48+
default = null
49+
}
50+
51+
variable "node_status_name_prefix" {
52+
type = string
53+
default = ""
54+
}
55+
56+
variable "node_status_name_suffix" {
57+
type = string
58+
default = ""
59+
}

node-status.tf

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ locals {
66
}
77

88
module "node_status" {
9-
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.2"
9+
source = "git@github.com:kabisa/terraform-datadog-generic-monitor.git?ref=0.5"
1010

1111
name = "Node Status not OK"
1212
query = "avg(${var.node_status_evaluation_period}):avg:kubernetes_state.node.status{${local.node_status_filter}} by {cluster_name,node} < 1"
@@ -29,4 +29,5 @@ module "node_status" {
2929
require_full_window = false
3030

3131
critical_threshold = 1
32+
locked = var.locked
3233
}

pod-ready-variables.tf

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,3 +32,28 @@ variable "pod_ready_alerting_enabled" {
3232
type = bool
3333
default = true
3434
}
35+
36+
variable "pod_ready_no_data_timeframe" {
37+
type = number
38+
default = null
39+
}
40+
41+
variable "pod_ready_notify_no_data" {
42+
type = bool
43+
default = false
44+
}
45+
46+
variable "pod_ready_ok_threshold" {
47+
type = number
48+
default = null
49+
}
50+
51+
variable "pod_ready_name_prefix" {
52+
type = string
53+
default = ""
54+
}
55+
56+
variable "pod_ready_name_suffix" {
57+
type = string
58+
default = ""
59+
}

0 commit comments

Comments
 (0)