# 15 lines, 522 B, YAML
---
# Log-based alerting rules for SMART disk health.
groups:
  - name: smart
    rules:
      # Raises a critical alert, per hostname, when log lines attributed to
      # smartmontools.service mention "error" or "fail" (case-insensitive).
      # Lines matching "previous self-test completed without error" or
      # "Prefailure" are excluded because they would otherwise match the
      # error/fail pattern without indicating a failure.
      #
      # The range window must be longer than `for` plus one evaluation
      # interval: with a window equal to `for`, a single log line leaves the
      # window before the alert has been continuously active long enough, so
      # it would stay pending and never fire.
      #
      # Line filters are placed before `| json` so that only matching lines
      # are parsed; the selected lines are the same as with the filters last.
      - alert: SMARTFailure
        expr: |
          sum by (hostname) (
            count_over_time(
              {hostname=~".+"}
                |~ "(?i)(error|fail)"
                !~ "(?i)previous self-test completed without error"
                !~ "(?i)Prefailure"
                | json
                | _SYSTEMD_UNIT = "smartmontools.service" [5m]
            )
          ) > 0
        for: 2m
        labels:
          severity: critical
          category: logs
        annotations:
          hostname: "{{ $labels.hostname }}"
          summary: "{{ $labels.hostname }} has reported SMART failures"