proc_vmstat.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "plugin_proc.h"
  3. #define PLUGIN_PROC_MODULE_VMSTAT_NAME "/proc/vmstat"
  4. #define OOM_KILL_STRING "oom_kill"
  5. int do_proc_vmstat(int update_every, usec_t dt) {
  6. (void)dt;
  7. static procfile *ff = NULL;
  8. static int do_swapio = -1, do_io = -1, do_pgfaults = -1, do_oom_kill = -1, do_numa = -1;
  9. static int has_numa = -1;
  10. static ARL_BASE *arl_base = NULL;
  11. static unsigned long long numa_foreign = 0ULL;
  12. static unsigned long long numa_hint_faults = 0ULL;
  13. static unsigned long long numa_hint_faults_local = 0ULL;
  14. static unsigned long long numa_huge_pte_updates = 0ULL;
  15. static unsigned long long numa_interleave = 0ULL;
  16. static unsigned long long numa_local = 0ULL;
  17. static unsigned long long numa_other = 0ULL;
  18. static unsigned long long numa_pages_migrated = 0ULL;
  19. static unsigned long long numa_pte_updates = 0ULL;
  20. static unsigned long long pgfault = 0ULL;
  21. static unsigned long long pgmajfault = 0ULL;
  22. static unsigned long long pgpgin = 0ULL;
  23. static unsigned long long pgpgout = 0ULL;
  24. static unsigned long long pswpin = 0ULL;
  25. static unsigned long long pswpout = 0ULL;
  26. static unsigned long long oom_kill = 0ULL;
  27. if(unlikely(!ff)) {
  28. char filename[FILENAME_MAX + 1];
  29. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, "/proc/vmstat");
  30. ff = procfile_open(config_get("plugin:proc:/proc/vmstat", "filename to monitor", filename), " \t:", PROCFILE_FLAG_DEFAULT);
  31. if(unlikely(!ff)) return 1;
  32. }
  33. ff = procfile_readall(ff);
  34. if(unlikely(!ff)) return 0; // we return 0, so that we will retry to open it next time
  35. size_t lines = procfile_lines(ff), l;
  36. if(unlikely(!arl_base)) {
  37. do_swapio = config_get_boolean_ondemand("plugin:proc:/proc/vmstat", "swap i/o", CONFIG_BOOLEAN_AUTO);
  38. do_io = config_get_boolean("plugin:proc:/proc/vmstat", "disk i/o", CONFIG_BOOLEAN_YES);
  39. do_pgfaults = config_get_boolean("plugin:proc:/proc/vmstat", "memory page faults", CONFIG_BOOLEAN_YES);
  40. do_oom_kill = config_get_boolean("plugin:proc:/proc/vmstat", "out of memory kills", CONFIG_BOOLEAN_AUTO);
  41. do_numa = config_get_boolean_ondemand("plugin:proc:/proc/vmstat", "system-wide numa metric summary", CONFIG_BOOLEAN_AUTO);
  42. arl_base = arl_create("vmstat", NULL, 60);
  43. arl_expect(arl_base, "pgfault", &pgfault);
  44. arl_expect(arl_base, "pgmajfault", &pgmajfault);
  45. arl_expect(arl_base, "pgpgin", &pgpgin);
  46. arl_expect(arl_base, "pgpgout", &pgpgout);
  47. arl_expect(arl_base, "pswpin", &pswpin);
  48. arl_expect(arl_base, "pswpout", &pswpout);
  49. int has_oom_kill = 0;
  50. for (l = 0; l < lines; l++) {
  51. if (!strcmp(procfile_lineword(ff, l, 0), OOM_KILL_STRING)) {
  52. has_oom_kill = 1;
  53. break;
  54. }
  55. }
  56. if (has_oom_kill)
  57. arl_expect(arl_base, OOM_KILL_STRING, &oom_kill);
  58. else
  59. do_oom_kill = CONFIG_BOOLEAN_NO;
  60. if(do_numa == CONFIG_BOOLEAN_YES || (do_numa == CONFIG_BOOLEAN_AUTO &&
  61. (get_numa_node_count() >= 2 ||
  62. netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  63. arl_expect(arl_base, "numa_foreign", &numa_foreign);
  64. arl_expect(arl_base, "numa_hint_faults_local", &numa_hint_faults_local);
  65. arl_expect(arl_base, "numa_hint_faults", &numa_hint_faults);
  66. arl_expect(arl_base, "numa_huge_pte_updates", &numa_huge_pte_updates);
  67. arl_expect(arl_base, "numa_interleave", &numa_interleave);
  68. arl_expect(arl_base, "numa_local", &numa_local);
  69. arl_expect(arl_base, "numa_other", &numa_other);
  70. arl_expect(arl_base, "numa_pages_migrated", &numa_pages_migrated);
  71. arl_expect(arl_base, "numa_pte_updates", &numa_pte_updates);
  72. }
  73. else {
  74. // Do not expect numa metrics when they are not needed.
  75. // By not adding them, the ARL will stop processing the file
  76. // when all the expected metrics are collected.
  77. // Also ARL will not parse their values.
  78. has_numa = 0;
  79. do_numa = CONFIG_BOOLEAN_NO;
  80. }
  81. }
  82. arl_begin(arl_base);
  83. for(l = 0; l < lines ;l++) {
  84. size_t words = procfile_linewords(ff, l);
  85. if(unlikely(words < 2)) {
  86. if(unlikely(words)) collector_error("Cannot read /proc/vmstat line %zu. Expected 2 params, read %zu.", l, words);
  87. continue;
  88. }
  89. if(unlikely(arl_check(arl_base,
  90. procfile_lineword(ff, l, 0),
  91. procfile_lineword(ff, l, 1)))) break;
  92. }
  93. // --------------------------------------------------------------------
  94. if(do_swapio == CONFIG_BOOLEAN_YES || (do_swapio == CONFIG_BOOLEAN_AUTO &&
  95. (pswpin || pswpout ||
  96. netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  97. do_swapio = CONFIG_BOOLEAN_YES;
  98. static RRDSET *st_swapio = NULL;
  99. static RRDDIM *rd_in = NULL, *rd_out = NULL;
  100. if(unlikely(!st_swapio)) {
  101. st_swapio = rrdset_create_localhost(
  102. "system"
  103. , "swapio"
  104. , NULL
  105. , "swap"
  106. , NULL
  107. , "Swap I/O"
  108. , "KiB/s"
  109. , PLUGIN_PROC_NAME
  110. , PLUGIN_PROC_MODULE_VMSTAT_NAME
  111. , NETDATA_CHART_PRIO_SYSTEM_SWAPIO
  112. , update_every
  113. , RRDSET_TYPE_AREA
  114. );
  115. rd_in = rrddim_add(st_swapio, "in", NULL, sysconf(_SC_PAGESIZE), 1024, RRD_ALGORITHM_INCREMENTAL);
  116. rd_out = rrddim_add(st_swapio, "out", NULL, -sysconf(_SC_PAGESIZE), 1024, RRD_ALGORITHM_INCREMENTAL);
  117. }
  118. rrddim_set_by_pointer(st_swapio, rd_in, pswpin);
  119. rrddim_set_by_pointer(st_swapio, rd_out, pswpout);
  120. rrdset_done(st_swapio);
  121. }
  122. // --------------------------------------------------------------------
  123. if(do_io) {
  124. static RRDSET *st_io = NULL;
  125. static RRDDIM *rd_in = NULL, *rd_out = NULL;
  126. if(unlikely(!st_io)) {
  127. st_io = rrdset_create_localhost(
  128. "system"
  129. , "pgpgio"
  130. , NULL
  131. , "disk"
  132. , NULL
  133. , "Memory Paged from/to disk"
  134. , "KiB/s"
  135. , PLUGIN_PROC_NAME
  136. , PLUGIN_PROC_MODULE_VMSTAT_NAME
  137. , NETDATA_CHART_PRIO_SYSTEM_PGPGIO
  138. , update_every
  139. , RRDSET_TYPE_AREA
  140. );
  141. rd_in = rrddim_add(st_io, "in", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  142. rd_out = rrddim_add(st_io, "out", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  143. }
  144. rrddim_set_by_pointer(st_io, rd_in, pgpgin);
  145. rrddim_set_by_pointer(st_io, rd_out, pgpgout);
  146. rrdset_done(st_io);
  147. }
  148. // --------------------------------------------------------------------
  149. if(do_pgfaults) {
  150. static RRDSET *st_pgfaults = NULL;
  151. static RRDDIM *rd_minor = NULL, *rd_major = NULL;
  152. if(unlikely(!st_pgfaults)) {
  153. st_pgfaults = rrdset_create_localhost(
  154. "mem"
  155. , "pgfaults"
  156. , NULL
  157. , "system"
  158. , NULL
  159. , "Memory Page Faults"
  160. , "faults/s"
  161. , PLUGIN_PROC_NAME
  162. , PLUGIN_PROC_MODULE_VMSTAT_NAME
  163. , NETDATA_CHART_PRIO_MEM_SYSTEM_PGFAULTS
  164. , update_every
  165. , RRDSET_TYPE_LINE
  166. );
  167. rrdset_flag_set(st_pgfaults, RRDSET_FLAG_DETAIL);
  168. rd_minor = rrddim_add(st_pgfaults, "minor", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  169. rd_major = rrddim_add(st_pgfaults, "major", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  170. }
  171. rrddim_set_by_pointer(st_pgfaults, rd_minor, pgfault);
  172. rrddim_set_by_pointer(st_pgfaults, rd_major, pgmajfault);
  173. rrdset_done(st_pgfaults);
  174. }
  175. // --------------------------------------------------------------------
  176. if (do_oom_kill == CONFIG_BOOLEAN_YES ||
  177. (do_oom_kill == CONFIG_BOOLEAN_AUTO && (oom_kill || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  178. static RRDSET *st_oom_kill = NULL;
  179. static RRDDIM *rd_oom_kill = NULL;
  180. do_oom_kill = CONFIG_BOOLEAN_YES;
  181. if(unlikely(!st_oom_kill)) {
  182. st_oom_kill = rrdset_create_localhost(
  183. "mem"
  184. , "oom_kill"
  185. , NULL
  186. , "system"
  187. , NULL
  188. , "Out of Memory Kills"
  189. , "kills/s"
  190. , PLUGIN_PROC_NAME
  191. , PLUGIN_PROC_MODULE_VMSTAT_NAME
  192. , NETDATA_CHART_PRIO_MEM_SYSTEM_OOM_KILL
  193. , update_every
  194. , RRDSET_TYPE_LINE
  195. );
  196. rrdset_flag_set(st_oom_kill, RRDSET_FLAG_DETAIL);
  197. rd_oom_kill = rrddim_add(st_oom_kill, "kills", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  198. }
  199. rrddim_set_by_pointer(st_oom_kill, rd_oom_kill, oom_kill);
  200. rrdset_done(st_oom_kill);
  201. }
  202. // --------------------------------------------------------------------
  203. // Ondemand criteria for NUMA. Since this won't change at run time, we
  204. // check it only once. We check whether the node count is >= 2 because
  205. // single-node systems have uninteresting statistics (since all accesses
  206. // are local).
  207. if(unlikely(has_numa == -1))
  208. has_numa = (numa_local || numa_foreign || numa_interleave || numa_other || numa_pte_updates ||
  209. numa_huge_pte_updates || numa_hint_faults || numa_hint_faults_local || numa_pages_migrated) ? 1 : 0;
  210. if(do_numa == CONFIG_BOOLEAN_YES || (do_numa == CONFIG_BOOLEAN_AUTO && has_numa)) {
  211. do_numa = CONFIG_BOOLEAN_YES;
  212. static RRDSET *st_numa = NULL;
  213. static RRDDIM *rd_local = NULL, *rd_foreign = NULL, *rd_interleave = NULL, *rd_other = NULL, *rd_pte_updates = NULL, *rd_huge_pte_updates = NULL, *rd_hint_faults = NULL, *rd_hint_faults_local = NULL, *rd_pages_migrated = NULL;
  214. if(unlikely(!st_numa)) {
  215. st_numa = rrdset_create_localhost(
  216. "mem"
  217. , "numa"
  218. , NULL
  219. , "numa"
  220. , NULL
  221. , "NUMA events"
  222. , "events/s"
  223. , PLUGIN_PROC_NAME
  224. , PLUGIN_PROC_MODULE_VMSTAT_NAME
  225. , NETDATA_CHART_PRIO_MEM_NUMA
  226. , update_every
  227. , RRDSET_TYPE_LINE
  228. );
  229. rrdset_flag_set(st_numa, RRDSET_FLAG_DETAIL);
  230. // These depend on CONFIG_NUMA in the kernel.
  231. rd_local = rrddim_add(st_numa, "local", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  232. rd_foreign = rrddim_add(st_numa, "foreign", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  233. rd_interleave = rrddim_add(st_numa, "interleave", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  234. rd_other = rrddim_add(st_numa, "other", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  235. // The following stats depend on CONFIG_NUMA_BALANCING in the
  236. // kernel.
  237. rd_pte_updates = rrddim_add(st_numa, "pte_updates", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  238. rd_huge_pte_updates = rrddim_add(st_numa, "huge_pte_updates", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  239. rd_hint_faults = rrddim_add(st_numa, "hint_faults", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  240. rd_hint_faults_local = rrddim_add(st_numa, "hint_faults_local", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  241. rd_pages_migrated = rrddim_add(st_numa, "pages_migrated", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  242. }
  243. rrddim_set_by_pointer(st_numa, rd_local, numa_local);
  244. rrddim_set_by_pointer(st_numa, rd_foreign, numa_foreign);
  245. rrddim_set_by_pointer(st_numa, rd_interleave, numa_interleave);
  246. rrddim_set_by_pointer(st_numa, rd_other, numa_other);
  247. rrddim_set_by_pointer(st_numa, rd_pte_updates, numa_pte_updates);
  248. rrddim_set_by_pointer(st_numa, rd_huge_pte_updates, numa_huge_pte_updates);
  249. rrddim_set_by_pointer(st_numa, rd_hint_faults, numa_hint_faults);
  250. rrddim_set_by_pointer(st_numa, rd_hint_faults_local, numa_hint_faults_local);
  251. rrddim_set_by_pointer(st_numa, rd_pages_migrated, numa_pages_migrated);
  252. rrdset_done(st_numa);
  253. }
  254. return 0;
  255. }