description:"This is an alert meant to ensure that the entire alerting pipeline is functional.\nThis alert is always firing, therefore it should always be firing in Alertmanager\nand always fire against a receiver. There are integrations with various notification\nmechanisms that send a notification when this alert is not firing. For example the\n\"DeadMansSnitch\" integration in PagerDuty."
summary:'Ensure entire alerting pipeline is functional'
# InstanceDown: critical alert raised once the expression `up == 0` has held
# continuously for 5 minutes (the `for` hold period below).
- alert: InstanceDown
  expr: 'up == 0'
  for: 5m
  labels:
    severity: critical
  annotations:
    # The raw/endraw markers wrap the double-brace placeholders; presumably this
    # file passes through a Jinja-style templating step first and the markers
    # keep the placeholders intact for Prometheus to expand - TODO confirm.
    description: '{% raw %}{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 5 minutes.{% endraw %}'
    summary: '{% raw %}Instance {{ $labels.instance }} down{% endraw %}'
# RebootRequired: warning alert for any series where `node_reboot_required > 0`.
# No `for` clause is set, so no hold period applies before the alert fires.
- alert: RebootRequired
  expr: 'node_reboot_required > 0'
  labels:
    severity: warning
  annotations:
    # The raw/endraw markers wrap the double-brace placeholder; presumably this
    # file passes through a Jinja-style templating step first and the markers
    # keep the placeholder intact for Prometheus to expand - TODO confirm.
    description: '{% raw %}{{ $labels.instance }} requires a reboot.{% endraw %}'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left and is filling up.{% endraw %}'
summary:'Filesystem is predicted to run out of space within the next 24 hours.'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left and is filling up fast.{% endraw %}'
summary:'Filesystem is predicted to run out of space within the next 4 hours.'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left.{% endraw %}'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available space left.{% endraw %}'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left and is filling up.{% endraw %}'
summary:'Filesystem is predicted to run out of inodes within the next 24 hours.'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left and is filling up fast.{% endraw %}'
summary:'Filesystem is predicted to run out of inodes within the next 4 hours.'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left.{% endraw %}'
summary:'Filesystem has less than 5% inodes left.'
description:'{% raw %}Filesystem on {{ $labels.device }} at {{ $labels.instance }} has only {{ printf "%.2f" $value }}% available inodes left.{% endraw %}'
summary:'Filesystem has less than 3% inodes left.'
description:'{% raw %}{{ $labels.instance }} interface {{ $labels.device }} has encountered {{ printf "%.0f" $value }} receive errors in the last two minutes.{% endraw %}'
summary:'Network interface is reporting many receive errors.'
description:'{% raw %}{{ $labels.instance }} interface {{ $labels.device }} has encountered {{ printf "%.0f" $value }} transmit errors in the last two minutes.{% endraw %}'
summary:'Network interface is reporting many transmit errors.'