Verified Commit 016af2f5 authored by Quentin Duchemin
Browse files

Alerts based on SMART values only for physical machines

parent 7fa2bb33
......@@ -78,12 +78,12 @@ services:
# Where to read metrics
- "-datasource.url=http://victoria-metrics:8428"
# Where to write and read alert states, to keep
# state during restart, as vmagent stores states in memory
# state during restart, as vmalert stores states in memory
- "-remoteWrite.url=http://victoria-metrics:8428"
- "-remoteRead.url=http://victoria-metrics:8428"
# Where to send alerts when they must be triggered
- "-notifier.url=http://alertmanager:9093"
# HTTP server for vmagent's own metrics
# HTTP server for vmalert's own metrics
- "-httpListenAddr=:8880"
# By default, evaluate rules every 1 minute
- "-evaluationInterval=1m"
......
......@@ -68,7 +68,10 @@ groups:
summary: Proxmox HDD volume 90% full
description: Proxmox HDD volume ({{ $labels.storage }}) on {{ $labels.instance }} is {{ $value }}% full
- alert: DiskDamaged
expr: smartmon_device_smart_healthy != 1
# Only get values from real disks, i.e. ignore VMs
# The node list is hardcoded because VMs do not have a specific prefix, and I cannot see another way to do this
# New physical machines must be added here
expr: smartmon_device_smart_healthy{node=~"alice|bob"} != 1
labels:
severity: critical
annotations:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment