0
0
Fork 0
mirror of https://github.com/alerta/alerta.git synced 2025-01-30 03:33:59 +00:00
alerta_alerta/etc/alerta/alert-ganglia.yaml
2013-04-05 09:38:46 +01:00

49 lines
1.4 KiB
YAML

---
# Server reboots within last 2 hours
# The rule compares `$now - $boottime` against 7200 (the "2 hours" in the text).
# thresholdInfo entries appear to be 'severity:operator:threshold' -- confirm
# against the consumer of this file.
- event: ServerReboot
  filter: null  # all (no filter expression set)
  value: $now - $boottime
  thresholdInfo:
    - 'informational:<:7200'
  text:
    - 'Server rebooted less than 2 hours ago'
  resource: $host
  group: Hardware
  graphs: []
  tags:
    - 'owner:websys'
# Puppet Last Run alert
# The rule compares `$now - $pup_last_run` against 7200 (the "2 hours" in the
# text). The two `text` entries presumably pair positionally with the two
# `thresholdInfo` entries -- confirm against the consumer of this file.
# NOTE(review): a value of exactly 7200 satisfies neither '>' nor '<';
# confirm whether that boundary gap is intended.
- event: PuppetLastRun
  filter: null  # all (no filter expression set)
  value: $now - $pup_last_run
  thresholdInfo:
    - 'major:>:7200'
    - 'normal:<:7200'
  text:
    - 'Puppet agent has not run for at least 2 hours (last puppet run at $pup_last_run)'
    - 'Puppet agent is OK (last puppet run at $pup_last_run).'
  resource: $host
  group: Puppet
  count: 2
  repeat: 10
  graphs: []
  tags:
    - 'owner:websys'
# Puppet Resource alert
# The rule compares `$pup_res_failed` against 0: above zero is 'warning',
# equal to zero is 'normal'. The two `text` entries presumably pair
# positionally with the two `thresholdInfo` entries -- confirm against the
# consumer of this file.
- event: PuppetResFailed
  filter: null  # all (no filter expression set)
  value: $pup_res_failed
  thresholdInfo:
    - 'warning:>:0'
    - 'normal:==:0'
  text:
    - 'Puppet agent failed to update $pup_res_failed out of $pup_res_total resources'
    - 'Puppet is updating all $pup_res_total resources'
  resource: $host
  group: Puppet
  count: 2
  repeat: 10
  graphs:
    - 'pup_res_failed'
  tags:
    - 'owner:websys'
# Ganglia Heartbeat alert
# The rule compares `$heartbeat` against 90 (the "90 seconds" in the text).
# The two `text` entries presumably pair positionally with the two
# `thresholdInfo` entries -- confirm against the consumer of this file.
# NOTE(review): a value of exactly 90 satisfies neither '>' nor '<';
# confirm whether that boundary gap is intended.
- event: GangliaHeartbeat
  filter: null  # all (no filter expression set)
  value: $heartbeat
  thresholdInfo:
    - 'critical:>:90'
    - 'normal:<:90'
  text:
    - 'No heartbeat from Ganglia agent for at least 90 seconds'
    - 'Heartbeat from Ganglia agent OK'
  resource: $host
  group: Ganglia
  repeat: 10
  graphs: []
  tags:
    - 'owner:websys'