File tree Expand file tree Collapse file tree 16 files changed +64
-64
lines changed Expand file tree Collapse file tree 16 files changed +64
-64
lines changed Original file line number Diff line number Diff line change @@ -71,10 +71,10 @@ policy_types:
71
71
description : pre-define alerts for container CPU
72
72
default :
73
73
- alert : service_overloaded
74
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
74
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
75
75
for : 30s
76
76
- alert : service_underloaded
77
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
77
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
78
78
for : 30s
79
79
required : true
80
80
scaling_rule :
@@ -99,10 +99,10 @@ policy_types:
99
99
description : pre-define alerts for VM CPU
100
100
default :
101
101
- alert : node_overloaded
102
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
102
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
103
103
for : 1m
104
104
- alert : node_underloaded
105
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
105
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
106
106
for : 1m
107
107
required : true
108
108
scaling_rule :
Original file line number Diff line number Diff line change @@ -70,10 +70,10 @@ policy_types:
70
70
description : pre-define alerts for container CPU
71
71
default :
72
72
- alert : service_overloaded
73
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
73
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
74
74
for : 30s
75
75
- alert : service_underloaded
76
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
76
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
77
77
for : 30s
78
78
required : true
79
79
scaling_rule :
@@ -98,10 +98,10 @@ policy_types:
98
98
description : pre-define alerts for VM CPU
99
99
default :
100
100
- alert : node_overloaded
101
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
101
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
102
102
for : 1m
103
103
- alert : node_underloaded
104
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
104
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
105
105
for : 1m
106
106
required : true
107
107
scaling_rule :
Original file line number Diff line number Diff line change @@ -73,10 +73,10 @@ policy_types:
73
73
description : pre-define alerts for container CPU
74
74
default :
75
75
- alert : service_overloaded
76
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
76
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
77
77
for : 30s
78
78
- alert : service_underloaded
79
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
79
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
80
80
for : 30s
81
81
required : true
82
82
scaling_rule :
@@ -101,10 +101,10 @@ policy_types:
101
101
description : pre-define alerts for VM CPU
102
102
default :
103
103
- alert : node_overloaded
104
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
104
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
105
105
for : 1m
106
106
- alert : node_underloaded
107
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
107
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
108
108
for : 1m
109
109
required : true
110
110
scaling_rule :
Original file line number Diff line number Diff line change @@ -73,10 +73,10 @@ policy_types:
73
73
description : pre-define alerts for container CPU
74
74
default :
75
75
- alert : service_overloaded
76
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
76
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
77
77
for : 30s
78
78
- alert : service_underloaded
79
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
79
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
80
80
for : 30s
81
81
required : true
82
82
scaling_rule :
@@ -101,10 +101,10 @@ policy_types:
101
101
description : pre-define alerts for VM CPU
102
102
default :
103
103
- alert : node_overloaded
104
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
104
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
105
105
for : 1m
106
106
- alert : node_underloaded
107
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
107
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
108
108
for : 1m
109
109
required : true
110
110
scaling_rule :
Original file line number Diff line number Diff line change @@ -73,10 +73,10 @@ policy_types:
73
73
description : pre-define alerts for container CPU
74
74
default :
75
75
- alert : service_overloaded
76
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
76
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
77
77
for : 30s
78
78
- alert : service_underloaded
79
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
79
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
80
80
for : 30s
81
81
required : true
82
82
scaling_rule :
@@ -101,10 +101,10 @@ policy_types:
101
101
description : pre-define alerts for VM CPU
102
102
default :
103
103
- alert : node_overloaded
104
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
104
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
105
105
for : 1m
106
106
- alert : node_underloaded
107
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
107
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
108
108
for : 1m
109
109
required : true
110
110
scaling_rule :
Original file line number Diff line number Diff line change @@ -71,10 +71,10 @@ policy_types:
71
71
description : pre-define alerts for container CPU
72
72
default :
73
73
- alert : service_overloaded
74
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
74
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
75
75
for : 30s
76
76
- alert : service_underloaded
77
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
77
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
78
78
for : 30s
79
79
required : true
80
80
scaling_rule :
@@ -99,10 +99,10 @@ policy_types:
99
99
description : pre-define alerts for VM CPU
100
100
default :
101
101
- alert : node_overloaded
102
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
102
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
103
103
for : 1m
104
104
- alert : node_underloaded
105
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
105
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
106
106
for : 1m
107
107
required : true
108
108
scaling_rule :
Original file line number Diff line number Diff line change @@ -75,10 +75,10 @@ policy_types:
75
75
description : pre-define alerts for container CPU
76
76
default :
77
77
- alert : service_overloaded
78
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
78
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
79
79
for : 30s
80
80
- alert : service_underloaded
81
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
81
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
82
82
for : 30s
83
83
required : true
84
84
scaling_rule :
@@ -103,10 +103,10 @@ policy_types:
103
103
description : pre-define alerts for VM CPU
104
104
default :
105
105
- alert : node_overloaded
106
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
106
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
107
107
for : 1m
108
108
- alert : node_underloaded
109
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
109
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
110
110
for : 1m
111
111
required : true
112
112
scaling_rule :
Original file line number Diff line number Diff line change @@ -78,10 +78,10 @@ policy_types:
78
78
description : pre-define alerts for container CPU
79
79
default :
80
80
- alert : service_overloaded
81
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 > {{SERVICE_TH_MAX}}'
81
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 > {{SERVICE_TH_MAX}}'
82
82
for : 30s
83
83
- alert : service_underloaded
84
- expr : ' avg(rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name= "{{SERVICE_FULL_NAME}}"}[60s]))*100 < {{SERVICE_TH_MIN}}'
84
+ expr : ' avg(rate(container_cpu_usage_seconds_total{image!~"docker.io/rancher.*", pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))*100 < {{SERVICE_TH_MIN}}'
85
85
for : 30s
86
86
required : true
87
87
scaling_rule :
@@ -106,10 +106,10 @@ policy_types:
106
106
description : pre-define alerts for VM CPU
107
107
default :
108
108
- alert : node_overloaded
109
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) > {{NODE_TH_MAX}}'
109
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 > {{NODE_TH_MAX}}'
110
110
for : 1m
111
111
- alert : node_underloaded
112
- expr : ' (100-( avg(rate(node_cpu_seconds_total{node= "{{ NODE_NAME }}", mode="idle "}[60s]))*100)) < {{NODE_TH_MIN}}'
112
+ expr : ' avg(rate(container_cpu_usage_seconds_total{instance=~"{{ NODE_NAME }}.*", id="/"}[60s]))*100 < {{NODE_TH_MIN}}'
113
113
for : 1m
114
114
required : true
115
115
scaling_rule :
Original file line number Diff line number Diff line change @@ -150,10 +150,10 @@ policy_types:
150
150
description : pre-define alerts for container Net
151
151
default :
152
152
- alert : service_overloaded
153
- expr : ' avg(rate(container_network_receive_bytes_total{container_label_io_kubernetes_pod_name =~"{{SERVICE_FULL_NAME}}-[^-]*-[^-] *"}[60s]))/1000 > {{SERVICE_TH_MAX}}'
153
+ expr : ' avg(rate(container_network_receive_bytes_total{pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))/1000 > {{SERVICE_TH_MAX}}'
154
154
for : 30s
155
155
- alert : service_underloaded
156
- expr : ' avg(rate(container_network_receive_bytes_total{container_label_io_kubernetes_pod_name =~"{{SERVICE_FULL_NAME}}-[^-]*-[^-] *"}[60s]))/1000 < {{SERVICE_TH_MIN}}'
156
+ expr : ' avg(rate(container_network_receive_bytes_total{pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))/1000 < {{SERVICE_TH_MIN}}'
157
157
for : 30s
158
158
required : true
159
159
scaling_rule :
@@ -178,10 +178,10 @@ policy_types:
178
178
description : pre-define alerts for node Net
179
179
default :
180
180
- alert : node_overloaded
181
- expr : ' avg(rate(container_network_receive_bytes_total{node ="{{ NODE_NAME }}", container_label_io_kubernetes_pod_name=~"{{SERVICE_FULL_NAME}}-[^-]*-[^-]* "}[60s]))/1000 > {{SERVICE_TH_MAX}}'
181
+ expr : ' avg(rate(container_network_receive_bytes_total{instance ="{{ NODE_NAME }}"}[60s]))/1000 > {{SERVICE_TH_MAX}}'
182
182
for : 1m
183
183
- alert : node_underloaded
184
- expr : ' avg(rate(container_network_receive_bytes_total{node ="{{ NODE_NAME }}", container_label_io_kubernetes_pod_name=~"{{SERVICE_FULL_NAME}}-[^-]*-[^-]* "}[60s]))/1000 < {{SERVICE_TH_MIN}}'
184
+ expr : ' avg(rate(container_network_receive_bytes_total{instance ="{{ NODE_NAME }}"}[60s]))/1000 < {{SERVICE_TH_MIN}}'
185
185
for : 1m
186
186
required : true
187
187
scaling_rule :
Original file line number Diff line number Diff line change @@ -152,10 +152,10 @@ policy_types:
152
152
description : pre-define alerts for container Net
153
153
default :
154
154
- alert : service_overloaded
155
- expr : ' avg(rate(container_network_receive_bytes_total{container_label_io_kubernetes_pod_name =~"{{SERVICE_FULL_NAME}}-[^-]*-[^-] *"}[60s]))/1000 > {{SERVICE_TH_MAX}}'
155
+ expr : ' avg(rate(container_network_receive_bytes_total{pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))/1000 > {{SERVICE_TH_MAX}}'
156
156
for : 30s
157
157
- alert : service_underloaded
158
- expr : ' avg(rate(container_network_receive_bytes_total{container_label_io_kubernetes_pod_name =~"{{SERVICE_FULL_NAME}}-[^-]*-[^-] *"}[60s]))/1000 < {{SERVICE_TH_MIN}}'
158
+ expr : ' avg(rate(container_network_receive_bytes_total{pod=~"{{SERVICE_FULL_NAME}}.*"}[60s]))/1000 < {{SERVICE_TH_MIN}}'
159
159
for : 30s
160
160
required : true
161
161
scaling_rule :
@@ -180,10 +180,10 @@ policy_types:
180
180
description : pre-define alerts for node Net
181
181
default :
182
182
- alert : node_overloaded
183
- expr : ' avg(rate(container_network_receive_bytes_total{node ="{{ NODE_NAME }}", container_label_io_kubernetes_pod_name=~"{{SERVICE_FULL_NAME}}-[^-]*-[^-]* "}[60s]))/1000 > {{SERVICE_TH_MAX}}'
183
+ expr : ' avg(rate(container_network_receive_bytes_total{instance ="{{ NODE_NAME }}"}[60s]))/1000 > {{SERVICE_TH_MAX}}'
184
184
for : 1m
185
185
- alert : node_underloaded
186
- expr : ' avg(rate(container_network_receive_bytes_total{node ="{{ NODE_NAME }}", container_label_io_kubernetes_pod_name=~"{{SERVICE_FULL_NAME}}-[^-]*-[^-]* "}[60s]))/1000 < {{SERVICE_TH_MIN}}'
186
+ expr : ' avg(rate(container_network_receive_bytes_total{instance ="{{ NODE_NAME }}"}[60s]))/1000 < {{SERVICE_TH_MIN}}'
187
187
for : 1m
188
188
required : true
189
189
scaling_rule :
You can’t perform that action at this time.
0 commit comments