plugin_proc.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "plugin_proc.h"
  3. static struct proc_module {
  4. const char *name;
  5. const char *dim;
  6. int enabled;
  7. int (*func)(int update_every, usec_t dt);
  8. usec_t duration;
  9. RRDDIM *rd;
  10. } proc_modules[] = {
  11. // system metrics
  12. {.name = "/proc/stat", .dim = "stat", .func = do_proc_stat},
  13. {.name = "/proc/uptime", .dim = "uptime", .func = do_proc_uptime},
  14. {.name = "/proc/loadavg", .dim = "loadavg", .func = do_proc_loadavg},
  15. {.name = "/proc/sys/kernel/random/entropy_avail", .dim = "entropy", .func = do_proc_sys_kernel_random_entropy_avail},
  16. // pressure metrics
  17. {.name = "/proc/pressure", .dim = "pressure", .func = do_proc_pressure},
  18. // CPU metrics
  19. {.name = "/proc/interrupts", .dim = "interrupts", .func = do_proc_interrupts},
  20. {.name = "/proc/softirqs", .dim = "softirqs", .func = do_proc_softirqs},
  21. // memory metrics
  22. {.name = "/proc/vmstat", .dim = "vmstat", .func = do_proc_vmstat},
  23. {.name = "/proc/meminfo", .dim = "meminfo", .func = do_proc_meminfo},
  24. {.name = "/sys/kernel/mm/ksm", .dim = "ksm", .func = do_sys_kernel_mm_ksm},
  25. {.name = "/sys/block/zram", .dim = "zram", .func = do_sys_block_zram},
  26. {.name = "/sys/devices/system/edac/mc", .dim = "ecc", .func = do_proc_sys_devices_system_edac_mc},
  27. {.name = "/sys/devices/system/node", .dim = "numa", .func = do_proc_sys_devices_system_node},
  28. {.name = "/proc/pagetypeinfo", .dim = "pagetypeinfo", .func = do_proc_pagetypeinfo},
  29. // network metrics
  30. {.name = "/proc/net/dev", .dim = "netdev", .func = do_proc_net_dev},
  31. {.name = "/proc/net/wireless", .dim = "netwireless", .func = do_proc_net_wireless},
  32. {.name = "/proc/net/sockstat", .dim = "sockstat", .func = do_proc_net_sockstat},
  33. {.name = "/proc/net/sockstat6", .dim = "sockstat6", .func = do_proc_net_sockstat6},
  34. {.name = "/proc/net/netstat",
  35. .dim = "netstat",
  36. .func = do_proc_net_netstat}, // this has to be before /proc/net/snmp, because there is a shared metric
  37. {.name = "/proc/net/snmp", .dim = "snmp", .func = do_proc_net_snmp},
  38. {.name = "/proc/net/snmp6", .dim = "snmp6", .func = do_proc_net_snmp6},
  39. {.name = "/proc/net/sctp/snmp", .dim = "sctp", .func = do_proc_net_sctp_snmp},
  40. {.name = "/proc/net/softnet_stat", .dim = "softnet", .func = do_proc_net_softnet_stat},
  41. {.name = "/proc/net/ip_vs/stats", .dim = "ipvs", .func = do_proc_net_ip_vs_stats},
  42. {.name = "/sys/class/infiniband", .dim = "infiniband", .func = do_sys_class_infiniband},
  43. // firewall metrics
  44. {.name = "/proc/net/stat/conntrack", .dim = "conntrack", .func = do_proc_net_stat_conntrack},
  45. {.name = "/proc/net/stat/synproxy", .dim = "synproxy", .func = do_proc_net_stat_synproxy},
  46. // disk metrics
  47. {.name = "/proc/diskstats", .dim = "diskstats", .func = do_proc_diskstats},
  48. {.name = "/proc/mdstat", .dim = "mdstat", .func = do_proc_mdstat},
  49. // NFS metrics
  50. {.name = "/proc/net/rpc/nfsd", .dim = "nfsd", .func = do_proc_net_rpc_nfsd},
  51. {.name = "/proc/net/rpc/nfs", .dim = "nfs", .func = do_proc_net_rpc_nfs},
  52. // ZFS metrics
  53. {.name = "/proc/spl/kstat/zfs/arcstats", .dim = "zfs_arcstats", .func = do_proc_spl_kstat_zfs_arcstats},
  54. {.name = "/proc/spl/kstat/zfs/pool/state",
  55. .dim = "zfs_pool_state",
  56. .func = do_proc_spl_kstat_zfs_pool_state},
  57. // BTRFS metrics
  58. {.name = "/sys/fs/btrfs", .dim = "btrfs", .func = do_sys_fs_btrfs},
  59. // IPC metrics
  60. {.name = "ipc", .dim = "ipc", .func = do_ipc},
  61. {.name = "/sys/class/power_supply", .dim = "power_supply", .func = do_sys_class_power_supply},
  62. // linux power supply metrics
  63. // the terminator of this array
  64. {.name = NULL, .dim = NULL, .func = NULL}
  65. };
  66. static void proc_main_cleanup(void *ptr)
  67. {
  68. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
  69. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  70. info("cleaning up...");
  71. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  72. }
  73. void *proc_main(void *ptr)
  74. {
  75. netdata_thread_cleanup_push(proc_main_cleanup, ptr);
  76. int vdo_cpu_netdata = config_get_boolean("plugin:proc", "netdata server resources", CONFIG_BOOLEAN_YES);
  77. config_get_boolean("plugin:proc", "/proc/pagetypeinfo", CONFIG_BOOLEAN_NO);
  78. // check the enabled status for each module
  79. int i;
  80. for (i = 0; proc_modules[i].name; i++) {
  81. struct proc_module *pm = &proc_modules[i];
  82. pm->enabled = config_get_boolean("plugin:proc", pm->name, CONFIG_BOOLEAN_YES);
  83. pm->duration = 0ULL;
  84. pm->rd = NULL;
  85. }
  86. usec_t step = localhost->rrd_update_every * USEC_PER_SEC;
  87. heartbeat_t hb;
  88. heartbeat_init(&hb);
  89. size_t iterations = 0;
  90. while (!netdata_exit) {
  91. iterations++;
  92. (void)iterations;
  93. usec_t hb_dt = heartbeat_next(&hb, step);
  94. usec_t duration = 0ULL;
  95. if (unlikely(netdata_exit))
  96. break;
  97. // BEGIN -- the job to be done
  98. for (i = 0; proc_modules[i].name; i++) {
  99. struct proc_module *pm = &proc_modules[i];
  100. if (unlikely(!pm->enabled))
  101. continue;
  102. debug(D_PROCNETDEV_LOOP, "PROC calling %s.", pm->name);
  103. //#ifdef NETDATA_LOG_ALLOCATIONS
  104. // if(pm->func == do_proc_interrupts)
  105. // log_thread_memory_allocations = iterations;
  106. //#endif
  107. pm->enabled = !pm->func(localhost->rrd_update_every, hb_dt);
  108. pm->duration = heartbeat_monotonic_dt_to_now_usec(&hb) - duration;
  109. duration += pm->duration;
  110. //#ifdef NETDATA_LOG_ALLOCATIONS
  111. // if(pm->func == do_proc_interrupts)
  112. // log_thread_memory_allocations = 0;
  113. //#endif
  114. if (unlikely(netdata_exit))
  115. break;
  116. }
  117. // END -- the job is done
  118. if (vdo_cpu_netdata) {
  119. static RRDSET *st_cpu_thread = NULL, *st_duration = NULL;
  120. static RRDDIM *rd_user = NULL, *rd_system = NULL;
  121. // ----------------------------------------------------------------
  122. struct rusage thread;
  123. getrusage(RUSAGE_THREAD, &thread);
  124. if (unlikely(!st_cpu_thread)) {
  125. st_cpu_thread = rrdset_create_localhost(
  126. "netdata",
  127. "plugin_proc_cpu",
  128. NULL,
  129. "proc",
  130. NULL,
  131. "Netdata proc plugin CPU usage",
  132. "milliseconds/s",
  133. "proc",
  134. "stats",
  135. 132000,
  136. localhost->rrd_update_every,
  137. RRDSET_TYPE_STACKED);
  138. rd_user = rrddim_add(st_cpu_thread, "user", NULL, 1, USEC_PER_MS, RRD_ALGORITHM_INCREMENTAL);
  139. rd_system = rrddim_add(st_cpu_thread, "system", NULL, 1, USEC_PER_MS, RRD_ALGORITHM_INCREMENTAL);
  140. } else {
  141. rrdset_next(st_cpu_thread);
  142. }
  143. rrddim_set_by_pointer(
  144. st_cpu_thread, rd_user, thread.ru_utime.tv_sec * USEC_PER_SEC + thread.ru_utime.tv_usec);
  145. rrddim_set_by_pointer(
  146. st_cpu_thread, rd_system, thread.ru_stime.tv_sec * USEC_PER_SEC + thread.ru_stime.tv_usec);
  147. rrdset_done(st_cpu_thread);
  148. // ----------------------------------------------------------------
  149. if (unlikely(!st_duration)) {
  150. st_duration = rrdset_find_active_bytype_localhost("netdata", "plugin_proc_modules");
  151. if (!st_duration) {
  152. st_duration = rrdset_create_localhost(
  153. "netdata",
  154. "plugin_proc_modules",
  155. NULL,
  156. "proc",
  157. NULL,
  158. "Netdata proc plugin modules durations",
  159. "milliseconds/run",
  160. "proc",
  161. "stats",
  162. 132001,
  163. localhost->rrd_update_every,
  164. RRDSET_TYPE_STACKED);
  165. for (i = 0; proc_modules[i].name; i++) {
  166. struct proc_module *pm = &proc_modules[i];
  167. if (unlikely(!pm->enabled))
  168. continue;
  169. pm->rd = rrddim_add(st_duration, pm->dim, NULL, 1, USEC_PER_MS, RRD_ALGORITHM_ABSOLUTE);
  170. }
  171. }
  172. } else
  173. rrdset_next(st_duration);
  174. for (i = 0; proc_modules[i].name; i++) {
  175. struct proc_module *pm = &proc_modules[i];
  176. if (unlikely(!pm->enabled))
  177. continue;
  178. rrddim_set_by_pointer(st_duration, pm->rd, pm->duration);
  179. }
  180. rrdset_done(st_duration);
  181. }
  182. }
  183. netdata_thread_cleanup_pop(1);
  184. return NULL;
  185. }
  186. int get_numa_node_count(void)
  187. {
  188. static int numa_node_count = -1;
  189. if (numa_node_count != -1)
  190. return numa_node_count;
  191. numa_node_count = 0;
  192. char name[FILENAME_MAX + 1];
  193. snprintfz(name, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, "/sys/devices/system/node");
  194. char *dirname = config_get("plugin:proc:/sys/devices/system/node", "directory to monitor", name);
  195. DIR *dir = opendir(dirname);
  196. if (dir) {
  197. struct dirent *de = NULL;
  198. while ((de = readdir(dir))) {
  199. if (de->d_type != DT_DIR)
  200. continue;
  201. if (strncmp(de->d_name, "node", 4) != 0)
  202. continue;
  203. if (!isdigit(de->d_name[4]))
  204. continue;
  205. numa_node_count++;
  206. }
  207. closedir(dir);
  208. }
  209. return numa_node_count;
  210. }