plugin_proc.c 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "plugin_proc.h"
  3. static struct proc_module {
  4. const char *name;
  5. const char *dim;
  6. int enabled;
  7. int (*func)(int update_every, usec_t dt);
  8. RRDDIM *rd;
  9. } proc_modules[] = {
  10. // system metrics
  11. {.name = "/proc/stat", .dim = "stat", .func = do_proc_stat},
  12. {.name = "/proc/uptime", .dim = "uptime", .func = do_proc_uptime},
  13. {.name = "/proc/loadavg", .dim = "loadavg", .func = do_proc_loadavg},
  14. {.name = "/proc/sys/fs/file-nr", .dim = "file-nr", .func = do_proc_sys_fs_file_nr},
  15. {.name = "/proc/sys/kernel/random/entropy_avail", .dim = "entropy", .func = do_proc_sys_kernel_random_entropy_avail},
  16. // pressure metrics
  17. {.name = "/proc/pressure", .dim = "pressure", .func = do_proc_pressure},
  18. // CPU metrics
  19. {.name = "/proc/interrupts", .dim = "interrupts", .func = do_proc_interrupts},
  20. {.name = "/proc/softirqs", .dim = "softirqs", .func = do_proc_softirqs},
  21. // memory metrics
  22. {.name = "/proc/vmstat", .dim = "vmstat", .func = do_proc_vmstat},
  23. {.name = "/proc/meminfo", .dim = "meminfo", .func = do_proc_meminfo},
  24. {.name = "/sys/kernel/mm/ksm", .dim = "ksm", .func = do_sys_kernel_mm_ksm},
  25. {.name = "/sys/block/zram", .dim = "zram", .func = do_sys_block_zram},
  26. {.name = "/sys/devices/system/edac/mc", .dim = "edac", .func = do_proc_sys_devices_system_edac_mc},
  27. {.name = "/sys/devices/pci/aer", .dim = "pci_aer", .func = do_proc_sys_devices_pci_aer},
  28. {.name = "/sys/devices/system/node", .dim = "numa", .func = do_proc_sys_devices_system_node},
  29. {.name = "/proc/pagetypeinfo", .dim = "pagetypeinfo", .func = do_proc_pagetypeinfo},
  30. // network metrics
  31. {.name = "/proc/net/wireless", .dim = "netwireless", .func = do_proc_net_wireless},
  32. {.name = "/proc/net/sockstat", .dim = "sockstat", .func = do_proc_net_sockstat},
  33. {.name = "/proc/net/sockstat6", .dim = "sockstat6", .func = do_proc_net_sockstat6},
  34. {.name = "/proc/net/netstat", .dim = "netstat", .func = do_proc_net_netstat},
  35. {.name = "/proc/net/sctp/snmp", .dim = "sctp", .func = do_proc_net_sctp_snmp},
  36. {.name = "/proc/net/softnet_stat", .dim = "softnet", .func = do_proc_net_softnet_stat},
  37. {.name = "/proc/net/ip_vs/stats", .dim = "ipvs", .func = do_proc_net_ip_vs_stats},
  38. {.name = "/sys/class/infiniband", .dim = "infiniband", .func = do_sys_class_infiniband},
  39. // firewall metrics
  40. {.name = "/proc/net/stat/conntrack", .dim = "conntrack", .func = do_proc_net_stat_conntrack},
  41. {.name = "/proc/net/stat/synproxy", .dim = "synproxy", .func = do_proc_net_stat_synproxy},
  42. // disk metrics
  43. {.name = "/proc/diskstats", .dim = "diskstats", .func = do_proc_diskstats},
  44. {.name = "/proc/mdstat", .dim = "mdstat", .func = do_proc_mdstat},
  45. // NFS metrics
  46. {.name = "/proc/net/rpc/nfsd", .dim = "nfsd", .func = do_proc_net_rpc_nfsd},
  47. {.name = "/proc/net/rpc/nfs", .dim = "nfs", .func = do_proc_net_rpc_nfs},
  48. // ZFS metrics
  49. {.name = "/proc/spl/kstat/zfs/arcstats", .dim = "zfs_arcstats", .func = do_proc_spl_kstat_zfs_arcstats},
  50. {.name = "/proc/spl/kstat/zfs/pool/state",.dim = "zfs_pool_state",.func = do_proc_spl_kstat_zfs_pool_state},
  51. // BTRFS metrics
  52. {.name = "/sys/fs/btrfs", .dim = "btrfs", .func = do_sys_fs_btrfs},
  53. // IPC metrics
  54. {.name = "ipc", .dim = "ipc", .func = do_ipc},
  55. // linux power supply metrics
  56. {.name = "/sys/class/power_supply", .dim = "power_supply", .func = do_sys_class_power_supply},
  57. // GPU metrics
  58. {.name = "/sys/class/drm", .dim = "drm", .func = do_sys_class_drm},
  59. // the terminator of this array
  60. {.name = NULL, .dim = NULL, .func = NULL}
  61. };
  62. #if WORKER_UTILIZATION_MAX_JOB_TYPES < 36
  63. #error WORKER_UTILIZATION_MAX_JOB_TYPES has to be at least 36
  64. #endif
  65. static netdata_thread_t *netdev_thread = NULL;
  66. static void proc_main_cleanup(void *ptr)
  67. {
  68. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
  69. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  70. collector_info("cleaning up...");
  71. if (netdev_thread) {
  72. netdata_thread_join(*netdev_thread, NULL);
  73. freez(netdev_thread);
  74. }
  75. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  76. worker_unregister();
  77. }
  78. bool inside_lxc_container = false;
  79. static bool is_lxcfs_proc_mounted() {
  80. procfile *ff = NULL;
  81. if (unlikely(!ff)) {
  82. char filename[FILENAME_MAX + 1];
  83. snprintfz(filename, FILENAME_MAX, "/proc/self/mounts");
  84. ff = procfile_open(filename, " \t", PROCFILE_FLAG_DEFAULT);
  85. if (unlikely(!ff))
  86. return false;
  87. }
  88. ff = procfile_readall(ff);
  89. if (unlikely(!ff))
  90. return false;
  91. unsigned long l, lines = procfile_lines(ff);
  92. for (l = 0; l < lines; l++) {
  93. size_t words = procfile_linewords(ff, l);
  94. if (words < 2) {
  95. continue;
  96. }
  97. if (!strcmp(procfile_lineword(ff, l, 0), "lxcfs") && !strncmp(procfile_lineword(ff, l, 1), "/proc", 5)) {
  98. procfile_close(ff);
  99. return true;
  100. }
  101. }
  102. procfile_close(ff);
  103. return false;
  104. }
  105. static bool log_proc_module(BUFFER *wb, void *data) {
  106. struct proc_module *pm = data;
  107. buffer_sprintf(wb, "proc.plugin[%s]", pm->name);
  108. return true;
  109. }
  110. void *proc_main(void *ptr)
  111. {
  112. worker_register("PROC");
  113. rrd_collector_started();
  114. if (config_get_boolean("plugin:proc", "/proc/net/dev", CONFIG_BOOLEAN_YES)) {
  115. netdev_thread = mallocz(sizeof(netdata_thread_t));
  116. netdata_log_debug(D_SYSTEM, "Starting thread %s.", THREAD_NETDEV_NAME);
  117. netdata_thread_create(
  118. netdev_thread, THREAD_NETDEV_NAME, NETDATA_THREAD_OPTION_JOINABLE, netdev_main, netdev_thread);
  119. }
  120. netdata_thread_cleanup_push(proc_main_cleanup, ptr)
  121. {
  122. config_get_boolean("plugin:proc", "/proc/pagetypeinfo", CONFIG_BOOLEAN_NO);
  123. // check the enabled status for each module
  124. int i;
  125. for(i = 0; proc_modules[i].name; i++) {
  126. struct proc_module *pm = &proc_modules[i];
  127. pm->enabled = config_get_boolean("plugin:proc", pm->name, CONFIG_BOOLEAN_YES);
  128. pm->rd = NULL;
  129. worker_register_job_name(i, proc_modules[i].dim);
  130. }
  131. usec_t step = localhost->rrd_update_every * USEC_PER_SEC;
  132. heartbeat_t hb;
  133. heartbeat_init(&hb);
  134. inside_lxc_container = is_lxcfs_proc_mounted();
  135. #define LGS_MODULE_ID 0
  136. ND_LOG_STACK lgs[] = {
  137. [LGS_MODULE_ID] = ND_LOG_FIELD_TXT(NDF_MODULE, "proc.plugin"),
  138. ND_LOG_FIELD_END(),
  139. };
  140. ND_LOG_STACK_PUSH(lgs);
  141. while(service_running(SERVICE_COLLECTORS)) {
  142. worker_is_idle();
  143. usec_t hb_dt = heartbeat_next(&hb, step);
  144. if(unlikely(!service_running(SERVICE_COLLECTORS)))
  145. break;
  146. for(i = 0; proc_modules[i].name; i++) {
  147. if(unlikely(!service_running(SERVICE_COLLECTORS)))
  148. break;
  149. struct proc_module *pm = &proc_modules[i];
  150. if(unlikely(!pm->enabled))
  151. continue;
  152. worker_is_busy(i);
  153. lgs[LGS_MODULE_ID] = ND_LOG_FIELD_CB(NDF_MODULE, log_proc_module, pm);
  154. pm->enabled = !pm->func(localhost->rrd_update_every, hb_dt);
  155. lgs[LGS_MODULE_ID] = ND_LOG_FIELD_TXT(NDF_MODULE, "proc.plugin");
  156. }
  157. }
  158. }
  159. netdata_thread_cleanup_pop(1);
  160. return NULL;
  161. }
  162. int get_numa_node_count(void)
  163. {
  164. static int numa_node_count = -1;
  165. if (numa_node_count != -1)
  166. return numa_node_count;
  167. numa_node_count = 0;
  168. char name[FILENAME_MAX + 1];
  169. snprintfz(name, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, "/sys/devices/system/node");
  170. char *dirname = config_get("plugin:proc:/sys/devices/system/node", "directory to monitor", name);
  171. DIR *dir = opendir(dirname);
  172. if (dir) {
  173. struct dirent *de = NULL;
  174. while ((de = readdir(dir))) {
  175. if (de->d_type != DT_DIR)
  176. continue;
  177. if (strncmp(de->d_name, "node", 4) != 0)
  178. continue;
  179. if (!isdigit(de->d_name[4]))
  180. continue;
  181. numa_node_count++;
  182. }
  183. closedir(dir);
  184. }
  185. return numa_node_count;
  186. }