1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374 |
- # This is a fast-reacting no-notification alarm ideal for custom dashboards or badges
- template: httpcheck_web_service_up
- families: *
- on: httpcheck.status
- class: Utilization
- type: Web Server
- component: HTTP endpoint
- lookup: average -1m unaligned percentage of success
- calc: ($this < 75) ? (0) : ($this)
- every: 5s
- units: up/down
- info: HTTP endpoint ${label:url} liveness status
- to: silent
- template: httpcheck_web_service_bad_content
- families: *
- on: httpcheck.status
- class: Workload
- type: Web Server
- component: HTTP endpoint
- lookup: average -5m unaligned percentage of bad_content
- every: 10s
- units: %
- warn: $this >= 10 AND $this < 40
- crit: $this >= 40
- delay: down 5m multiplier 1.5 max 1h
- info: percentage of HTTP responses from ${label:url} with unexpected content in the last 5 minutes
- to: webmaster
- template: httpcheck_web_service_bad_status
- families: *
- on: httpcheck.status
- class: Workload
- type: Web Server
- component: HTTP endpoint
- lookup: average -5m unaligned percentage of bad_status
- every: 10s
- units: %
- warn: $this >= 10 AND $this < 40
- crit: $this >= 40
- delay: down 5m multiplier 1.5 max 1h
- info: percentage of HTTP responses from ${label:url} with unexpected status in the last 5 minutes
- to: webmaster
- template: httpcheck_web_service_timeouts
- families: *
- on: httpcheck.status
- class: Latency
- type: Web Server
- component: HTTP endpoint
- lookup: average -5m unaligned percentage of timeout
- every: 10s
- units: %
- warn: $this >= 10 AND $this < 40
- crit: $this >= 40
- delay: down 5m multiplier 1.5 max 1h
- info: percentage of timed-out HTTP requests to ${label:url} in the last 5 minutes
- to: webmaster
- template: httpcheck_web_service_no_connection
- families: *
- on: httpcheck.status
- class: Errors
- type: Other
- component: HTTP endpoint
- lookup: average -5m unaligned percentage of no_connection
- every: 10s
- units: %
- warn: $this >= 10 AND $this < 40
- crit: $this >= 40
- delay: down 5m multiplier 1.5 max 1h
- info: percentage of failed HTTP requests to ${label:url} in the last 5 minutes
- to: webmaster
|