boinc.conf 1.8 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374
  1. # Alarms for various BOINC issues.
  2. # Compute errors: averages the `comperror` dimension of the boinc.states chart over the last 10 minutes, re-evaluated every minute. Raises WARNING when that average is above 0 and CRITICAL when it is above 1; notifications go to the `sysadmin` role.
  3. template: boinc_compute_errors
  4. on: boinc.states
  5. class: Errors
  6. type: Computing
  7. component: BOINC
  8. os: *
  9. hosts: *
  10. families: *
  11. lookup: average -10m unaligned of comperror
  12. units: tasks
  13. every: 1m
  14. warn: $this > 0
  15. crit: $this > 1
  16. delay: up 1m down 5m multiplier 1.5 max 1h
  17. info: average number of compute errors over the last 10 minutes
  18. to: sysadmin
  19. # Upload errors: averages the `upload_failed` dimension of the boinc.states chart over the last 10 minutes, re-evaluated every minute. Raises WARNING on any non-zero average (not only on "lots" of failures) and CRITICAL when the average is above 1; notifications go to the `sysadmin` role.
  20. template: boinc_upload_errors
  21. on: boinc.states
  22. class: Errors
  23. type: Computing
  24. component: BOINC
  25. os: *
  26. hosts: *
  27. families: *
  28. lookup: average -10m unaligned of upload_failed
  29. units: tasks
  30. every: 1m
  31. warn: $this > 0
  32. crit: $this > 1
  33. delay: up 1m down 5m multiplier 1.5 max 1h
  34. info: average number of failed uploads over the last 10 minutes
  35. to: sysadmin
  36. # Empty task queue: averages the `total` dimension of the boinc.tasks chart over the last 10 minutes, re-evaluated every minute. Raises WARNING when that average drops below 1 and CRITICAL when it drops below 0.1; uses a longer notification delay (up 5m / down 10m) than the error alarms in this file.
  37. template: boinc_total_tasks
  38. on: boinc.tasks
  39. class: Utilization
  40. type: Computing
  41. component: BOINC
  42. os: *
  43. hosts: *
  44. families: *
  45. lookup: average -10m unaligned of total
  46. units: tasks
  47. every: 1m
  48. warn: $this < 1
  49. crit: $this < 0.1
  50. delay: up 5m down 10m multiplier 1.5 max 1h
  51. info: average number of total tasks over the last 10 minutes
  52. to: sysadmin
  53. # Idle client with queued work: averages the `active` dimension of the boinc.tasks chart over the last 10 minutes. The `calc` line keeps that average only while $boinc_total_tasks (presumably the value of the boinc_total_tasks alarm on the same chart - confirm against Netdata's alarm-variable rules) is at least 1, and substitutes `inf` otherwise, so the `<` thresholds below cannot fire when the queue itself is empty.
  54. template: boinc_active_tasks
  55. on: boinc.tasks
  56. class: Utilization
  57. type: Computing
  58. component: BOINC
  59. os: *
  60. hosts: *
  61. families: *
  62. lookup: average -10m unaligned of active
  63. calc: ($boinc_total_tasks >= 1) ? ($this) : (inf)
  64. units: tasks
  65. every: 1m
  66. warn: $this < 1
  67. crit: $this < 0.1
  68. delay: up 5m down 10m multiplier 1.5 max 1h
  69. info: average number of active tasks over the last 10 minutes
  70. to: sysadmin