29 lines
1.3 KiB
YAML
29 lines
1.3 KiB
YAML
namespace: riju
|
|
groups:
|
|
- name: riju
|
|
rules:
|
|
- alert: NodeCPUHigh
|
|
annotations:
|
|
message: "Instance {{ $labels.node }} is running close to max CPU"
|
|
expr: |
|
|
sum(1 - rate(node_cpu_seconds_total{mode="idle"}[1m])) by (node) / count(sum(node_cpu_seconds_total{mode="idle"}) by (node, cpu)) by (node) * 100 >= 80
|
|
for: 30m
|
|
- alert: NodeMemoryHigh
|
|
annotations:
|
|
message: "Instance {{ $labels.node }} is running close to max memory"
|
|
expr: |
|
|
sum(1 - node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes) by (node) * 100 >= 80
|
|
for: 30m
|
|
- alert: RootVolumeFilling
|
|
annotations:
|
|
message: "Root volume on instance {{ $labels.node }} is close to full"
|
|
expr: |
|
|
(1 - sum (node_filesystem_free_bytes{mountpoint="/"}) by (node) / sum (node_filesystem_size_bytes{mountpoint="/"}) by (node)) * 100 >= 80
|
|
for: 30m
|
|
- alert: DataVolumeFilling
|
|
annotations:
|
|
message: "Data volume on instance {{ $labels.node }} is close to full"
|
|
expr: |
|
|
(1 - sum (node_filesystem_free_bytes{mountpoint="/mnt/riju"}) by (node) / sum (node_filesystem_size_bytes{mountpoint="/mnt/riju"}) by (node)) * 100 >= 80
|
|
for: 30m
|