metadata.yaml 35 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022
  1. plugin_name: cgroups.plugin
  2. modules:
  3. - &module
  4. meta: &meta
  5. plugin_name: cgroups.plugin
  6. module_name: /sys/fs/cgroup
  7. monitored_instance:
  8. name: Containers
  9. link: ""
  10. categories:
  11. - data-collection.containers-and-vms
  12. icon_filename: container.svg
  13. related_resources:
  14. integrations:
  15. list: []
  16. info_provided_to_referring_integrations:
  17. description: ""
  18. keywords:
  19. - containers
  20. most_popular: true
  21. overview: &overview
  22. data_collection: &data_collection
  23. metrics_description: "Monitor Containers for performance, resource usage, and health status."
  24. method_description: ""
  25. supported_platforms:
  26. include: []
  27. exclude: []
  28. multi_instance: true
  29. additional_permissions:
  30. description: ""
  31. default_behavior:
  32. auto_detection:
  33. description: ""
  34. limits:
  35. description: ""
  36. performance_impact:
  37. description: ""
  38. setup:
  39. prerequisites:
  40. list: []
  41. configuration:
  42. file:
  43. name: ""
  44. description: ""
  45. options:
  46. description: ""
  47. folding:
  48. title: ""
  49. enabled: true
  50. list: []
  51. examples:
  52. folding:
  53. enabled: true
  54. title: ""
  55. list: []
  56. troubleshooting:
  57. problems:
  58. list: []
  59. alerts:
  60. - name: cgroup_10min_cpu_usage
  61. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  62. metric: cgroup.cpu_limit
  63. info: average cgroup CPU utilization over the last 10 minutes
  64. - name: cgroup_ram_in_use
  65. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  66. metric: cgroup.mem_usage
  67. info: cgroup memory utilization
  68. - name: cgroup_1m_received_packets_rate
  69. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  70. metric: cgroup.net_packets
  71. info: average number of packets received by the network interface ${label:device} over the last minute
  72. - name: cgroup_10s_received_packets_storm
  73. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  74. metric: cgroup.net_packets
  75. info:
  76. ratio of average number of received packets for the network interface ${label:device} over the last 10 seconds, compared to the rate over
  77. the last minute
  78. metrics:
  79. folding:
  80. title: Metrics
  81. enabled: false
  82. description: ""
  83. availability: []
  84. scopes:
  85. - name: cgroup
  86. description: ""
  87. labels:
  88. - name: container_name
  89. description: The container name or group path if name resolution fails.
  90. - name: image
  91. description: Docker/Podman container image name.
  92. metrics:
  93. - name: cgroup.cpu_limit
  94. description: CPU Usage within the limits
  95. unit: "percentage"
  96. chart_type: line
  97. dimensions:
  98. - name: used
  99. - name: cgroup.cpu
  100. description: CPU Usage (100% = 1 core)
  101. unit: "percentage"
  102. chart_type: stacked
  103. dimensions:
  104. - name: user
  105. - name: system
  106. - name: cgroup.cpu_per_core
  107. description: CPU Usage (100% = 1 core) Per Core
  108. unit: "percentage"
  109. chart_type: line
  110. dimensions:
  111. - name: a dimension per core
  112. - name: cgroup.throttled
  113. description: CPU Throttled Runnable Periods
  114. unit: "percentage"
  115. chart_type: line
  116. dimensions:
  117. - name: throttled
  118. - name: cgroup.throttled_duration
  119. description: CPU Throttled Time Duration
  120. unit: "ms"
  121. chart_type: line
  122. dimensions:
  123. - name: duration
  124. - name: cgroup.cpu_shares
  125. description: CPU Time Relative Share
  126. unit: "shares"
  127. chart_type: line
  128. dimensions:
  129. - name: shares
  130. - name: cgroup.mem
  131. description: Memory Usage
  132. unit: "MiB"
  133. chart_type: stacked
  134. dimensions:
  135. - name: cache
  136. - name: rss
  137. - name: swap
  138. - name: rss_huge
  139. - name: mapped_file
  140. - name: cgroup.writeback
  141. description: Writeback Memory
  142. unit: "MiB"
  143. chart_type: area
  144. dimensions:
  145. - name: dirty
  146. - name: writeback
  147. - name: cgroup.mem_activity
  148. description: Memory Activity
  149. unit: "MiB/s"
  150. chart_type: line
  151. dimensions:
  152. - name: in
  153. - name: out
  154. - name: cgroup.pgfaults
  155. description: Memory Page Faults
  156. unit: "MiB/s"
  157. chart_type: line
  158. dimensions:
  159. - name: pgfault
  160. - name: swap
  161. - name: cgroup.mem_usage
  162. description: Used Memory
  163. unit: "MiB"
  164. chart_type: stacked
  165. dimensions:
  166. - name: ram
  167. - name: swap
  168. - name: cgroup.mem_usage_limit
  169. description: Used RAM within the limits
  170. unit: "MiB"
  171. chart_type: stacked
  172. dimensions:
  173. - name: available
  174. - name: used
  175. - name: cgroup.mem_utilization
  176. description: Memory Utilization
  177. unit: "percentage"
  178. chart_type: line
  179. dimensions:
  180. - name: utilization
  181. - name: cgroup.mem_failcnt
  182. description: Memory Limit Failures
  183. unit: "count"
  184. chart_type: line
  185. dimensions:
  186. - name: failures
  187. - name: cgroup.io
  188. description: I/O Bandwidth (all disks)
  189. unit: "KiB/s"
  190. chart_type: area
  191. dimensions:
  192. - name: read
  193. - name: write
  194. - name: cgroup.serviced_ops
  195. description: Serviced I/O Operations (all disks)
  196. unit: "operations/s"
  197. chart_type: line
  198. dimensions:
  199. - name: read
  200. - name: write
  201. - name: cgroup.throttle_io
  202. description: Throttle I/O Bandwidth (all disks)
  203. unit: "KiB/s"
  204. chart_type: area
  205. dimensions:
  206. - name: read
  207. - name: write
  208. - name: cgroup.throttle_serviced_ops
  209. description: Throttle Serviced I/O Operations (all disks)
  210. unit: "operations/s"
  211. chart_type: line
  212. dimensions:
  213. - name: read
  214. - name: write
  215. - name: cgroup.queued_ops
  216. description: Queued I/O Operations (all disks)
  217. unit: "operations"
  218. chart_type: line
  219. dimensions:
  220. - name: read
  221. - name: write
  222. - name: cgroup.merged_ops
  223. description: Merged I/O Operations (all disks)
  224. unit: "operations/s"
  225. chart_type: line
  226. dimensions:
  227. - name: read
  228. - name: write
  229. - name: cgroup.cpu_some_pressure
  230. description: CPU some pressure
  231. unit: "percentage"
  232. chart_type: line
  233. dimensions:
  234. - name: some10
  235. - name: some60
  236. - name: some300
  237. - name: cgroup.cpu_some_pressure_stall_time
  238. description: CPU some pressure stall time
  239. unit: "ms"
  240. chart_type: line
  241. dimensions:
  242. - name: time
  243. - name: cgroup.cpu_full_pressure
  244. description: CPU full pressure
  245. unit: "percentage"
  246. chart_type: line
  247. dimensions:
  248. - name: some10
  249. - name: some60
  250. - name: some300
  251. - name: cgroup.cpu_full_pressure_stall_time
  252. description: CPU full pressure stall time
  253. unit: "ms"
  254. chart_type: line
  255. dimensions:
  256. - name: time
  257. - name: cgroup.memory_some_pressure
  258. description: Memory some pressure
  259. unit: "percentage"
  260. chart_type: line
  261. dimensions:
  262. - name: some10
  263. - name: some60
  264. - name: some300
  265. - name: cgroup.memory_some_pressure_stall_time
  266. description: Memory some pressure stall time
  267. unit: "ms"
  268. chart_type: line
  269. dimensions:
  270. - name: time
  271. - name: cgroup.memory_full_pressure
  272. description: Memory full pressure
  273. unit: "percentage"
  274. chart_type: line
  275. dimensions:
  276. - name: some10
  277. - name: some60
  278. - name: some300
  279. - name: cgroup.memory_full_pressure_stall_time
  280. description: Memory full pressure stall time
  281. unit: "ms"
  282. chart_type: line
  283. dimensions:
  284. - name: time
  285. - name: cgroup.io_some_pressure
  286. description: I/O some pressure
  287. unit: "percentage"
  288. chart_type: line
  289. dimensions:
  290. - name: some10
  291. - name: some60
  292. - name: some300
  293. - name: cgroup.io_some_pressure_stall_time
  294. description: I/O some pressure stall time
  295. unit: "ms"
  296. chart_type: line
  297. dimensions:
  298. - name: time
  299. - name: cgroup.io_full_pressure
  300. description: I/O full pressure
  301. unit: "percentage"
  302. chart_type: line
  303. dimensions:
  304. - name: some10
  305. - name: some60
  306. - name: some300
  307. - name: cgroup.io_full_pressure_stall_time
  308. description: I/O full pressure stall time
  309. unit: "ms"
  310. chart_type: line
  311. dimensions:
  312. - name: time
  313. - name: cgroup.pids_current
  314. description: Number of processes
  315. unit: "pids"
  316. chart_type: line
  317. dimensions:
  318. - name: pids
  319. - name: cgroup network device
  320. description: ""
  321. labels:
  322. - name: container_name
  323. description: The container name or group path if name resolution fails.
  324. - name: image
  325. description: Docker/Podman container image name.
  326. - name: device
  327. description: "The name of the host network interface linked to the container's network interface."
  328. - name: container_device
  329. description: Container network interface name.
  330. - name: interface_type
  331. description: 'Network interface type. Always "virtual" for the containers.'
  332. metrics:
  333. - name: cgroup.net_net
  334. description: Bandwidth
  335. unit: "kilobits/s"
  336. chart_type: area
  337. dimensions:
  338. - name: received
  339. - name: sent
  340. - name: cgroup.net_packets
  341. description: Packets
  342. unit: "pps"
  343. chart_type: line
  344. dimensions:
  345. - name: received
  346. - name: sent
  347. - name: multicast
  348. - name: cgroup.net_errors
  349. description: Interface Errors
  350. unit: "errors/s"
  351. chart_type: line
  352. dimensions:
  353. - name: inbound
  354. - name: outbound
  355. - name: cgroup.net_drops
  356. description: Interface Drops
  357. unit: "errors/s"
  358. chart_type: line
  359. dimensions:
  360. - name: inbound
  361. - name: outbound
  362. - name: cgroup.net_fifo
  363. description: Interface FIFO Buffer Errors
  364. unit: "errors/s"
  365. chart_type: line
  366. dimensions:
  367. - name: receive
  368. - name: transmit
  369. - name: cgroup.net_compressed
  370. description: Compressed Packets
  371. unit: "pps"
  372. chart_type: line
  373. dimensions:
  374. - name: receive
  375. - name: sent
  376. - name: cgroup.net_events
  377. description: Network Interface Events
  378. unit: "events/s"
  379. chart_type: line
  380. dimensions:
  381. - name: frames
  382. - name: collisions
  383. - name: carrier
  384. - name: cgroup.net_operstate
  385. description: Interface Operational State
  386. unit: "state"
  387. chart_type: line
  388. dimensions:
  389. - name: up
  390. - name: down
  391. - name: notpresent
  392. - name: lowerlayerdown
  393. - name: testing
  394. - name: dormant
  395. - name: unknown
  396. - name: cgroup.net_carrier
  397. description: Interface Physical Link State
  398. unit: "state"
  399. chart_type: line
  400. dimensions:
  401. - name: up
  402. - name: down
  403. - name: cgroup.net_mtu
  404. description: Interface MTU
  405. unit: "octets"
  406. chart_type: line
  407. dimensions:
  408. - name: mtu
  409. - <<: *module
  410. meta:
  411. <<: *meta
  412. monitored_instance:
  413. name: Kubernetes Containers
  414. link: https://kubernetes.io/
  415. icon_filename: kubernetes.svg
  416. categories:
  417. #- data-collection.containers-and-vms
  418. - data-collection.kubernetes
  419. keywords:
  420. - k8s
  421. - kubernetes
  422. - pods
  423. - containers
  424. overview:
  425. <<: *overview
  426. data_collection:
  427. <<: *data_collection
  428. metrics_description: Monitor Kubernetes Clusters for performance, resource usage, and health status.
  429. alerts:
  430. - name: k8s_cgroup_10min_cpu_usage
  431. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  432. metric: k8s.cgroup.cpu_limit
  433. info: average cgroup CPU utilization over the last 10 minutes
  434. - name: k8s_cgroup_ram_in_use
  435. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  436. metric: k8s.cgroup.mem_usage
  437. info: cgroup memory utilization
  438. - name: k8s_cgroup_1m_received_packets_rate
  439. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  440. metric: k8s.cgroup.net_packets
  441. info: average number of packets received by the network interface ${label:device} over the last minute
  442. - name: k8s_cgroup_10s_received_packets_storm
  443. link: https://github.com/netdata/netdata/blob/master/health/health.d/cgroups.conf
  444. metric: k8s.cgroup.net_packets
  445. info:
  446. ratio of average number of received packets for the network interface ${label:device} over the last 10 seconds, compared to the rate over
  447. the last minute
  448. metrics:
  449. folding:
  450. title: Metrics
  451. enabled: false
  452. description: ""
  453. availability: []
  454. scopes:
  455. - name: k8s cgroup
  456. description: These metrics refer to the Pod container.
  457. labels:
  458. - name: k8s_node_name
  459. description: 'Node name. The value of _pod.spec.nodeName_.'
  460. - name: k8s_namespace
  461. description: 'Namespace name. The value of _pod.metadata.namespace_.'
  462. - name: k8s_controller_kind
  463. description: 'Controller kind (ReplicaSet, DaemonSet, StatefulSet, Job, etc.). The value of _pod.OwnerReferences.Controller.Kind_.'
  464. - name: k8s_controller_name
  465. description: 'Controller name. The value of _pod.OwnerReferences.Controller.Name_.'
  466. - name: k8s_pod_name
  467. description: 'Pod name. The value of _pod.metadata.name_.'
  468. - name: k8s_container_name
  469. description: 'Container name. The value of _pod.spec.containers.name_.'
  470. - name: k8s_kind
  471. description: 'Instance kind: "pod" or "container".'
  472. - name: k8s_qos_class
  473. description: 'QoS class (guaranteed, burstable, besteffort).'
  474. - name: k8s_cluster_id
  475. description: 'Cluster ID. The value of kube-system namespace _namespace.metadata.uid_.'
  476. metrics:
  477. - name: k8s.cgroup.cpu_limit
  478. description: CPU Usage within the limits
  479. unit: "percentage"
  480. chart_type: line
  481. dimensions:
  482. - name: used
  483. - name: k8s.cgroup.cpu
  484. description: CPU Usage (100% = 1000 mCPU)
  485. unit: "percentage"
  486. chart_type: stacked
  487. dimensions:
  488. - name: user
  489. - name: system
  490. - name: k8s.cgroup.cpu_per_core
  491. description: CPU Usage (100% = 1000 mCPU) Per Core
  492. unit: "percentage"
  493. chart_type: line
  494. dimensions:
  495. - name: a dimension per core
  496. - name: k8s.cgroup.throttled
  497. description: CPU Throttled Runnable Periods
  498. unit: "percentage"
  499. chart_type: line
  500. dimensions:
  501. - name: throttled
  502. - name: k8s.cgroup.throttled_duration
  503. description: CPU Throttled Time Duration
  504. unit: "ms"
  505. chart_type: line
  506. dimensions:
  507. - name: duration
  508. - name: k8s.cgroup.cpu_shares
  509. description: CPU Time Relative Share
  510. unit: "shares"
  511. chart_type: line
  512. dimensions:
  513. - name: shares
  514. - name: k8s.cgroup.mem
  515. description: Memory Usage
  516. unit: "MiB"
  517. chart_type: stacked
  518. dimensions:
  519. - name: cache
  520. - name: rss
  521. - name: swap
  522. - name: rss_huge
  523. - name: mapped_file
  524. - name: k8s.cgroup.writeback
  525. description: Writeback Memory
  526. unit: "MiB"
  527. chart_type: area
  528. dimensions:
  529. - name: dirty
  530. - name: writeback
  531. - name: k8s.cgroup.mem_activity
  532. description: Memory Activity
  533. unit: "MiB/s"
  534. chart_type: line
  535. dimensions:
  536. - name: in
  537. - name: out
  538. - name: k8s.cgroup.pgfaults
  539. description: Memory Page Faults
  540. unit: "MiB/s"
  541. chart_type: line
  542. dimensions:
  543. - name: pgfault
  544. - name: swap
  545. - name: k8s.cgroup.mem_usage
  546. description: Used Memory
  547. unit: "MiB"
  548. chart_type: stacked
  549. dimensions:
  550. - name: ram
  551. - name: swap
  552. - name: k8s.cgroup.mem_usage_limit
  553. description: Used RAM within the limits
  554. unit: "MiB"
  555. chart_type: stacked
  556. dimensions:
  557. - name: available
  558. - name: used
  559. - name: k8s.cgroup.mem_utilization
  560. description: Memory Utilization
  561. unit: "percentage"
  562. chart_type: line
  563. dimensions:
  564. - name: utilization
  565. - name: k8s.cgroup.mem_failcnt
  566. description: Memory Limit Failures
  567. unit: "count"
  568. chart_type: line
  569. dimensions:
  570. - name: failures
  571. - name: k8s.cgroup.io
  572. description: I/O Bandwidth (all disks)
  573. unit: "KiB/s"
  574. chart_type: area
  575. dimensions:
  576. - name: read
  577. - name: write
  578. - name: k8s.cgroup.serviced_ops
  579. description: Serviced I/O Operations (all disks)
  580. unit: "operations/s"
  581. chart_type: line
  582. dimensions:
  583. - name: read
  584. - name: write
  585. - name: k8s.cgroup.throttle_io
  586. description: Throttle I/O Bandwidth (all disks)
  587. unit: "KiB/s"
  588. chart_type: area
  589. dimensions:
  590. - name: read
  591. - name: write
  592. - name: k8s.cgroup.throttle_serviced_ops
  593. description: Throttle Serviced I/O Operations (all disks)
  594. unit: "operations/s"
  595. chart_type: line
  596. dimensions:
  597. - name: read
  598. - name: write
  599. - name: k8s.cgroup.queued_ops
  600. description: Queued I/O Operations (all disks)
  601. unit: "operations"
  602. chart_type: line
  603. dimensions:
  604. - name: read
  605. - name: write
  606. - name: k8s.cgroup.merged_ops
  607. description: Merged I/O Operations (all disks)
  608. unit: "operations/s"
  609. chart_type: line
  610. dimensions:
  611. - name: read
  612. - name: write
  613. - name: k8s.cgroup.cpu_some_pressure
  614. description: CPU some pressure
  615. unit: "percentage"
  616. chart_type: line
  617. dimensions:
  618. - name: some10
  619. - name: some60
  620. - name: some300
  621. - name: k8s.cgroup.cpu_some_pressure_stall_time
  622. description: CPU some pressure stall time
  623. unit: "ms"
  624. chart_type: line
  625. dimensions:
  626. - name: time
  627. - name: k8s.cgroup.cpu_full_pressure
  628. description: CPU full pressure
  629. unit: "percentage"
  630. chart_type: line
  631. dimensions:
  632. - name: some10
  633. - name: some60
  634. - name: some300
  635. - name: k8s.cgroup.cpu_full_pressure_stall_time
  636. description: CPU full pressure stall time
  637. unit: "ms"
  638. chart_type: line
  639. dimensions:
  640. - name: time
  641. - name: k8s.cgroup.memory_some_pressure
  642. description: Memory some pressure
  643. unit: "percentage"
  644. chart_type: line
  645. dimensions:
  646. - name: some10
  647. - name: some60
  648. - name: some300
  649. - name: k8s.cgroup.memory_some_pressure_stall_time
  650. description: Memory some pressure stall time
  651. unit: "ms"
  652. chart_type: line
  653. dimensions:
  654. - name: time
  655. - name: k8s.cgroup.memory_full_pressure
  656. description: Memory full pressure
  657. unit: "percentage"
  658. chart_type: line
  659. dimensions:
  660. - name: some10
  661. - name: some60
  662. - name: some300
  663. - name: k8s.cgroup.memory_full_pressure_stall_time
  664. description: Memory full pressure stall time
  665. unit: "ms"
  666. chart_type: line
  667. dimensions:
  668. - name: time
  669. - name: k8s.cgroup.io_some_pressure
  670. description: I/O some pressure
  671. unit: "percentage"
  672. chart_type: line
  673. dimensions:
  674. - name: some10
  675. - name: some60
  676. - name: some300
  677. - name: k8s.cgroup.io_some_pressure_stall_time
  678. description: I/O some pressure stall time
  679. unit: "ms"
  680. chart_type: line
  681. dimensions:
  682. - name: time
  683. - name: k8s.cgroup.io_full_pressure
  684. description: I/O full pressure
  685. unit: "percentage"
  686. chart_type: line
  687. dimensions:
  688. - name: some10
  689. - name: some60
  690. - name: some300
  691. - name: k8s.cgroup.io_full_pressure_stall_time
  692. description: I/O full pressure stall time
  693. unit: "ms"
  694. chart_type: line
  695. dimensions:
  696. - name: time
  697. - name: k8s.cgroup.pids_current
  698. description: Number of processes
  699. unit: "pids"
  700. chart_type: line
  701. dimensions:
  702. - name: pids
  703. - name: k8s cgroup network device
  704. description: These metrics refer to the Pod container network interface.
  705. labels:
  706. - name: device
  707. description: "The name of the host network interface linked to the container's network interface."
  708. - name: container_device
  709. description: Container network interface name.
  710. - name: interface_type
  711. description: 'Network interface type. Always "virtual" for the containers.'
  712. - name: k8s_node_name
  713. description: 'Node name. The value of _pod.spec.nodeName_.'
  714. - name: k8s_namespace
  715. description: 'Namespace name. The value of _pod.metadata.namespace_.'
  716. - name: k8s_controller_kind
  717. description: 'Controller kind (ReplicaSet, DaemonSet, StatefulSet, Job, etc.). The value of _pod.OwnerReferences.Controller.Kind_.'
  718. - name: k8s_controller_name
  719. description: 'Controller name. The value of _pod.OwnerReferences.Controller.Name_.'
  720. - name: k8s_pod_name
  721. description: 'Pod name. The value of _pod.metadata.name_.'
  722. - name: k8s_container_name
  723. description: 'Container name. The value of _pod.spec.containers.name_.'
  724. - name: k8s_kind
  725. description: 'Instance kind: "pod" or "container".'
  726. - name: k8s_qos_class
  727. description: 'QoS class (guaranteed, burstable, besteffort).'
  728. - name: k8s_cluster_id
  729. description: 'Cluster ID. The value of kube-system namespace _namespace.metadata.uid_.'
  730. metrics:
  731. - name: k8s.cgroup.net_net
  732. description: Bandwidth
  733. unit: "kilobits/s"
  734. chart_type: area
  735. dimensions:
  736. - name: received
  737. - name: sent
  738. - name: k8s.cgroup.net_packets
  739. description: Packets
  740. unit: "pps"
  741. chart_type: line
  742. dimensions:
  743. - name: received
  744. - name: sent
  745. - name: multicast
  746. - name: k8s.cgroup.net_errors
  747. description: Interface Errors
  748. unit: "errors/s"
  749. chart_type: line
  750. dimensions:
  751. - name: inbound
  752. - name: outbound
  753. - name: k8s.cgroup.net_drops
  754. description: Interface Drops
  755. unit: "errors/s"
  756. chart_type: line
  757. dimensions:
  758. - name: inbound
  759. - name: outbound
  760. - name: k8s.cgroup.net_fifo
  761. description: Interface FIFO Buffer Errors
  762. unit: "errors/s"
  763. chart_type: line
  764. dimensions:
  765. - name: receive
  766. - name: transmit
  767. - name: k8s.cgroup.net_compressed
  768. description: Compressed Packets
  769. unit: "pps"
  770. chart_type: line
  771. dimensions:
  772. - name: receive
  773. - name: sent
  774. - name: k8s.cgroup.net_events
  775. description: Network Interface Events
  776. unit: "events/s"
  777. chart_type: line
  778. dimensions:
  779. - name: frames
  780. - name: collisions
  781. - name: carrier
  782. - name: k8s.cgroup.net_operstate
  783. description: Interface Operational State
  784. unit: "state"
  785. chart_type: line
  786. dimensions:
  787. - name: up
  788. - name: down
  789. - name: notpresent
  790. - name: lowerlayerdown
  791. - name: testing
  792. - name: dormant
  793. - name: unknown
  794. - name: k8s.cgroup.net_carrier
  795. description: Interface Physical Link State
  796. unit: "state"
  797. chart_type: line
  798. dimensions:
  799. - name: up
  800. - name: down
  801. - name: k8s.cgroup.net_mtu
  802. description: Interface MTU
  803. unit: "octets"
  804. chart_type: line
  805. dimensions:
  806. - name: mtu
  807. - <<: *module
  808. meta:
  809. <<: *meta
  810. monitored_instance:
  811. name: Systemd Services
  812. link: ""
  813. icon_filename: systemd.svg
  814. categories:
  815. - data-collection.systemd
  816. keywords:
  817. - systemd
  818. - services
  819. overview:
  820. <<: *overview
  821. data_collection:
  822. <<: *data_collection
  823. metrics_description: "Monitor Systemd Services for performance, resource usage, and health status."
  824. alerts: []
  825. metrics:
  826. folding:
  827. title: Metrics
  828. enabled: false
  829. description: ""
  830. availability: []
  831. scopes:
  832. - name: systemd service
  833. description: ""
  834. labels:
  835. - name: service_name
  836. description: Service name
  837. metrics:
  838. - name: systemd.service.cpu.utilization
  839. description: Systemd Services CPU utilization (100% = 1 core)
  840. unit: percentage
  841. chart_type: stacked
  842. dimensions:
  843. - name: user
  844. - name: system
  845. - name: systemd.service.memory.usage
  846. description: Systemd Services Used Memory
  847. unit: MiB
  848. chart_type: stacked
  849. dimensions:
  850. - name: ram
  851. - name: swap
  852. - name: systemd.service.memory.failcnt
  853. description: Systemd Services Memory Limit Failures
  854. unit: failures/s
  855. chart_type: line
  856. dimensions:
  857. - name: fail
  858. - name: systemd.service.memory.ram.usage
  859. description: Systemd Services Memory
  860. unit: MiB
  861. chart_type: stacked
  862. dimensions:
  863. - name: rss
  864. - name: cache
  865. - name: mapped_file
  866. - name: rss_huge
  867. - name: systemd.service.memory.writeback
  868. description: Systemd Services Writeback Memory
  869. unit: MiB
  870. chart_type: stacked
  871. dimensions:
  872. - name: writeback
  873. - name: dirty
  874. - name: systemd.service.memory.paging.faults
  875. description: Systemd Services Memory Minor and Major Page Faults
  876. unit: MiB/s
  877. chart_type: area
  878. dimensions:
  879. - name: minor
  880. - name: major
  881. - name: systemd.service.memory.paging.io
  882. description: Systemd Services Memory Paging IO
  883. unit: MiB/s
  884. chart_type: area
  885. dimensions:
  886. - name: in
  887. - name: out
  888. - name: systemd.service.disk.io
  889. description: Systemd Services Disk Read/Write Bandwidth
  890. unit: KiB/s
  891. chart_type: area
  892. dimensions:
  893. - name: read
  894. - name: write
  895. - name: systemd.service.disk.iops
  896. description: Systemd Services Disk Read/Write Operations
  897. unit: operations/s
  898. chart_type: line
  899. dimensions:
  900. - name: read
  901. - name: write
  902. - name: systemd.service.disk.throttle.io
  903. description: Systemd Services Throttle Disk Read/Write Bandwidth
  904. unit: KiB/s
  905. chart_type: area
  906. dimensions:
  907. - name: read
  908. - name: write
  909. - name: systemd.service.disk.throttle.iops
  910. description: Systemd Services Throttle Disk Read/Write Operations
  911. unit: operations/s
  912. chart_type: line
  913. dimensions:
  914. - name: read
  915. - name: write
  916. - name: systemd.service.disk.queued_iops
  917. description: Systemd Services Queued Disk Read/Write Operations
  918. unit: operations/s
  919. chart_type: line
  920. dimensions:
  921. - name: read
  922. - name: write
  923. - name: systemd.service.disk.merged_iops
  924. description: Systemd Services Merged Disk Read/Write Operations
  925. unit: operations/s
  926. chart_type: line
  927. dimensions:
  928. - name: read
  929. - name: write
  930. - name: systemd.service.pids.current
  931. description: Systemd Services Number of Processes
  932. unit: pids
  933. chart_type: line
  934. dimensions:
  935. - name: pids
  936. - <<: *module
  937. meta:
  938. <<: *meta
  939. monitored_instance:
  940. name: Virtual Machines
  941. link: ""
  942. icon_filename: container.svg
  943. categories:
  944. - data-collection.containers-and-vms
  945. keywords:
  946. - vms
  947. - virtualization
  948. - container
  949. overview:
  950. <<: *overview
  951. data_collection:
  952. <<: *data_collection
  953. metrics_description: "Monitor Virtual Machines for performance, resource usage, and health status."
  954. - <<: *module
  955. meta:
  956. <<: *meta
  957. monitored_instance:
  958. name: LXC Containers
  959. link: ""
  960. icon_filename: lxc.png
  961. categories:
  962. - data-collection.containers-and-vms
  963. keywords:
  964. - lxc
  965. - lxd
  966. - container
  967. overview:
  968. <<: *overview
  969. data_collection:
  970. <<: *data_collection
  971. metrics_description: "Monitor LXC Containers for performance, resource usage, and health status."
  972. - <<: *module
  973. meta:
  974. <<: *meta
  975. monitored_instance:
  976. name: Libvirt Containers
  977. link: ""
  978. icon_filename: libvirt.png
  979. categories:
  980. - data-collection.containers-and-vms
  981. keywords:
  982. - libvirt
  983. - container
  984. overview:
  985. <<: *overview
  986. data_collection:
  987. <<: *data_collection
  988. metrics_description: "Monitor Libvirt for performance, resource usage, and health status."
  989. - <<: *module
  990. meta:
  991. <<: *meta
  992. monitored_instance:
  993. name: oVirt Containers
  994. link: ""
  995. icon_filename: ovirt.svg
  996. categories:
  997. - data-collection.containers-and-vms
  998. keywords:
  999. - ovirt
  1000. - container
  1001. overview:
  1002. <<: *overview
  1003. data_collection:
  1004. <<: *data_collection
  1005. metrics_description: "Monitor oVirt for performance, resource usage, and health status."
  1006. - <<: *module
  1007. meta:
  1008. <<: *meta
  1009. monitored_instance:
  1010. name: Proxmox Containers
  1011. link: ""
  1012. icon_filename: proxmox.png
  1013. categories:
  1014. - data-collection.containers-and-vms
  1015. keywords:
  1016. - proxmox
  1017. - container
  1018. overview:
  1019. <<: *overview
  1020. data_collection:
  1021. <<: *data_collection
  1022. metrics_description: "Monitor Proxmox for performance, resource usage, and health status."