123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142 |
- ## Check if the are any systemd units in the failed state (crashed).
- ## States: 1 - active, 2 - inactive, 3 - activating, 4 - deactivating, 5 - failed.
- ## Service units
- template: systemd_service_units_state
- on: systemd.service_units_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd service units are in the failed state
- to: sysadmin
- ## Socket units
- template: systemd_socket_units_state
- on: systemd.socket_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd socket units are in the failed state
- to: sysadmin
- ## Target units
- template: systemd_target_units_state
- on: systemd.target_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd target units are in the failed state
- to: sysadmin
- ## Path units
- template: systemd_path_units_state
- on: systemd.path_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd path units are in the failed state
- to: sysadmin
- ## Device units
- template: systemd_device_units_state
- on: systemd.device_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more the systemd device units are in the failed state
- to: sysadmin
- ## Mount units
- template: systemd_mount_units_state
- on: systemd.mount_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more the systemd mount units are in the failed state
- to: sysadmin
- ## Automount units
- template: systemd_automount_units_state
- on: systemd.automount_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd automount units are in the failed state
- to: sysadmin
- ## Swap units
- template: systemd_swap_units_state
- on: systemd.swap_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd swap units are in the failed state
- to: sysadmin
- ## Scope units
- template: systemd_scope_units_state
- on: systemd.scope_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd scope units are in the failed state
- to: sysadmin
- ## Slice units
- template: systemd_slice_units_state
- on: systemd.slice_unit_state
- class: Errors
- type: Linux
- component: Systemd units
- lookup: max -1s min2max
- units: ok/failed
- every: 10s
- warn: $this != nan AND $this == 5
- delay: down 5m multiplier 1.5 max 1h
- info: one or more systemd slice units are in the failed state
- to: sysadmin
|