cpu.conf 1.9 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667
  1. # you can disable an alarm notification by setting the 'to' line to: silent
  # Alarm template: average CPU utilization over the last 10 minutes, Linux only (os: linux), any host.
  # Defined on system.cpu; the lookup averages the user, system, softirq, irq and guest
  # dimensions, so iowait, nice and steal are not counted (as the info line states).
  2. template: 10min_cpu_usage
  3. on: system.cpu
  4. class: Utilization
  5. type: System
  6. component: CPU
  7. os: linux
  8. hosts: *
  9. lookup: average -10m unaligned of user,system,softirq,irq,guest
  10. units: %
  11. every: 1m
  # Hysteresis: the warning threshold is 85 while the alarm is below WARNING, and drops to 75
  # once the status is already WARNING or higher (presumably to avoid flapping around one value).
  12. warn: $this > (($status >= $WARNING) ? (75) : (85))
  # Same pattern for critical: 95 to enter CRITICAL, 85 while the status is already CRITICAL.
  13. crit: $this > (($status == $CRITICAL) ? (85) : (95))
  # NOTE(review): per the Netdata health reference this should hold back notifications when the
  # status goes down (15m, x1.5 per repeat, capped at 1h) - confirm against the installed version.
  14. delay: down 15m multiplier 1.5 max 1h
  15. info: average CPU utilization over the last 10 minutes (excluding iowait, nice and steal)
  # Notification recipient role; the file header notes that 'silent' here disables notifications.
  16. to: sysadmin
  # Alarm template: average CPU iowait over the last 10 minutes, Linux only (os: linux), any host.
  # Defined on system.cpu; the lookup uses only the iowait dimension.
  17. template: 10min_cpu_iowait
  18. on: system.cpu
  19. class: Utilization
  20. type: System
  21. component: CPU
  22. os: linux
  23. hosts: *
  24. lookup: average -10m unaligned of iowait
  25. units: %
  26. every: 1m
  # Hysteresis: the warning threshold is 40 while the alarm is below WARNING, and drops to 20
  # once the status is already WARNING or higher.
  27. warn: $this > (($status >= $WARNING) ? (20) : (40))
  # Critical threshold is 50 to enter CRITICAL, 40 while the status is already CRITICAL.
  28. crit: $this > (($status == $CRITICAL) ? (40) : (50))
  # NOTE(review): per the Netdata health reference this should hold back notifications when the
  # status goes down (15m, x1.5 per repeat, capped at 1h) - confirm against the installed version.
  29. delay: down 15m multiplier 1.5 max 1h
  30. info: average CPU iowait time over the last 10 minutes
  # Notification recipient role; the file header notes that 'silent' here disables notifications.
  31. to: sysadmin
  # Alarm template: average CPU steal time over the last 20 minutes, Linux only (os: linux), any host.
  # Defined on system.cpu; the lookup uses only the steal dimension. Unlike the 10-minute CPU
  # alarms in this file, it uses a 20m window, a 5m 'every' interval and is classed as Latency.
  32. template: 20min_steal_cpu
  33. on: system.cpu
  34. class: Latency
  35. type: System
  36. component: CPU
  37. os: linux
  38. hosts: *
  39. lookup: average -20m unaligned of steal
  40. units: %
  41. every: 5m
  # Hysteresis: the warning threshold is 10 while the alarm is below WARNING, and drops to 5
  # once the status is already WARNING or higher.
  42. warn: $this > (($status >= $WARNING) ? (5) : (10))
  # Critical threshold is 30 to enter CRITICAL, 20 while the status is already CRITICAL.
  43. crit: $this > (($status == $CRITICAL) ? (20) : (30))
  # NOTE(review): per the Netdata health reference this should hold back notifications when the
  # status goes down (1h, x1.5 per repeat, capped at 2h) - confirm against the installed version.
  44. delay: down 1h multiplier 1.5 max 2h
  45. info: average CPU steal time over the last 20 minutes
  # Notification recipient role; the file header notes that 'silent' here disables notifications.
  46. to: sysadmin
  47. ## FreeBSD
  # Alarm template: average CPU utilization over the last 10 minutes, FreeBSD only (os: freebsd), any host.
  # Defined on system.cpu; the lookup averages the user, system and interrupt dimensions,
  # so nice is not counted (as the info line states).
  48. template: 10min_cpu_usage
  49. on: system.cpu
  50. class: Utilization
  51. type: System
  52. component: CPU
  53. os: freebsd
  54. hosts: *
  55. lookup: average -10m unaligned of user,system,interrupt
  56. units: %
  57. every: 1m
  # Hysteresis: the warning threshold is 85 while the alarm is below WARNING, and drops to 75
  # once the status is already WARNING or higher.
  58. warn: $this > (($status >= $WARNING) ? (75) : (85))
  # Critical threshold is 95 to enter CRITICAL, 85 while the status is already CRITICAL.
  59. crit: $this > (($status == $CRITICAL) ? (85) : (95))
  # NOTE(review): per the Netdata health reference this should hold back notifications when the
  # status goes down (15m, x1.5 per repeat, capped at 1h) - confirm against the installed version.
  60. delay: down 15m multiplier 1.5 max 1h
  61. info: average CPU utilization over the last 10 minutes (excluding nice)
  # Notification recipient role; the file header notes that 'silent' here disables notifications.
  62. to: sysadmin