ebpf_process.c 48 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include <sys/resource.h>
  3. #include "ebpf.h"
  4. #include "ebpf_process.h"
  5. /*****************************************************************
  6. *
  7. * GLOBAL VARIABLES
  8. *
  9. *****************************************************************/
  10. static char *process_dimension_names[NETDATA_KEY_PUBLISH_PROCESS_END] = { "process", "task", "process", "thread" };
  11. static char *process_id_names[NETDATA_KEY_PUBLISH_PROCESS_END] = { "do_exit", "release_task", "_do_fork", "sys_clone" };
  12. static char *status[] = { "process", "zombie" };
  13. static ebpf_local_maps_t process_maps[] = {{.name = "tbl_pid_stats", .internal_input = ND_EBPF_DEFAULT_PID_SIZE,
  14. .user_input = 0,
  15. .type = NETDATA_EBPF_MAP_RESIZABLE | NETDATA_EBPF_MAP_PID,
  16. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  17. {.name = "tbl_total_stats", .internal_input = NETDATA_KEY_END_VECTOR,
  18. .user_input = 0, .type = NETDATA_EBPF_MAP_STATIC,
  19. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  20. {.name = "process_ctrl", .internal_input = NETDATA_CONTROLLER_END,
  21. .user_input = 0,
  22. .type = NETDATA_EBPF_MAP_CONTROLLER,
  23. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  24. {.name = NULL, .internal_input = 0, .user_input = 0,
  25. .type = NETDATA_EBPF_MAP_CONTROLLER,
  26. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED}};
  27. char *tracepoint_sched_type = { "sched" } ;
  28. char *tracepoint_sched_process_exit = { "sched_process_exit" };
  29. char *tracepoint_sched_process_exec = { "sched_process_exec" };
  30. char *tracepoint_sched_process_fork = { "sched_process_fork" };
  31. static int was_sched_process_exit_enabled = 0;
  32. static int was_sched_process_exec_enabled = 0;
  33. static int was_sched_process_fork_enabled = 0;
  34. static netdata_idx_t *process_hash_values = NULL;
  35. static netdata_syscall_stat_t process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_END];
  36. static netdata_publish_syscall_t process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_END];
  37. ebpf_process_stat_t **global_process_stats = NULL;
  38. ebpf_process_publish_apps_t **current_apps_data = NULL;
  39. int process_enabled = 0;
  40. static struct bpf_object *objects = NULL;
  41. static struct bpf_link **probe_links = NULL;
  42. struct config process_config = { .first_section = NULL,
  43. .last_section = NULL,
  44. .mutex = NETDATA_MUTEX_INITIALIZER,
  45. .index = { .avl_tree = { .root = NULL, .compar = appconfig_section_compare },
  46. .rwlock = AVL_LOCK_INITIALIZER } };
  47. static struct netdata_static_thread cgroup_thread = {"EBPF CGROUP", NULL, NULL,
  48. 1, NULL, NULL, NULL};
  49. static char *threads_stat[NETDATA_EBPF_THREAD_STAT_END] = {"total", "running"};
  50. static char *load_event_stat[NETDATA_EBPF_LOAD_STAT_END] = {"legacy", "co-re"};
  51. /*****************************************************************
  52. *
  53. * PROCESS DATA AND SEND TO NETDATA
  54. *
  55. *****************************************************************/
  56. /**
  57. * Update publish structure before to send data to Netdata.
  58. *
  59. * @param publish the first output structure with independent dimensions
  60. * @param pvc the second output structure with correlated dimensions
  61. * @param input the structure with the input data.
  62. */
  63. static void ebpf_update_global_publish(netdata_publish_syscall_t *publish, netdata_publish_vfs_common_t *pvc,
  64. netdata_syscall_stat_t *input)
  65. {
  66. netdata_publish_syscall_t *move = publish;
  67. int selector = NETDATA_KEY_PUBLISH_PROCESS_EXIT;
  68. while (move) {
  69. move->ncall = (input->call > move->pcall) ? input->call - move->pcall : move->pcall - input->call;
  70. move->nbyte = (input->bytes > move->pbyte) ? input->bytes - move->pbyte : move->pbyte - input->bytes;
  71. move->nerr = (input->ecall > move->nerr) ? input->ecall - move->perr : move->perr - input->ecall;
  72. move->pcall = input->call;
  73. move->pbyte = input->bytes;
  74. move->perr = input->ecall;
  75. input = input->next;
  76. move = move->next;
  77. selector++;
  78. }
  79. pvc->running = (long)publish[NETDATA_KEY_PUBLISH_PROCESS_FORK].ncall -
  80. (long)publish[NETDATA_KEY_PUBLISH_PROCESS_CLONE].ncall;
  81. publish[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].ncall = -publish[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].ncall;
  82. pvc->zombie = (long)publish[NETDATA_KEY_PUBLISH_PROCESS_EXIT].ncall +
  83. (long)publish[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].ncall;
  84. }
  85. /**
  86. * Call the necessary functions to create a chart.
  87. *
  88. * @param family the chart family
  89. * @param move the pointer with the values that will be published
  90. */
  91. static void write_status_chart(char *family, netdata_publish_vfs_common_t *pvc)
  92. {
  93. write_begin_chart(family, NETDATA_PROCESS_STATUS_NAME);
  94. write_chart_dimension(status[0], (long long)pvc->running);
  95. write_chart_dimension(status[1], (long long)pvc->zombie);
  96. write_end_chart();
  97. }
  98. /**
  99. * Send data to Netdata calling auxiliary functions.
  100. *
  101. * @param em the structure with thread information
  102. */
  103. static void ebpf_process_send_data(ebpf_module_t *em)
  104. {
  105. netdata_publish_vfs_common_t pvc;
  106. ebpf_update_global_publish(process_publish_aggregated, &pvc, process_aggregated_data);
  107. write_count_chart(NETDATA_EXIT_SYSCALL, NETDATA_EBPF_SYSTEM_GROUP,
  108. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT], 2);
  109. write_count_chart(NETDATA_PROCESS_SYSCALL, NETDATA_EBPF_SYSTEM_GROUP,
  110. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK], 2);
  111. write_status_chart(NETDATA_EBPF_SYSTEM_GROUP, &pvc);
  112. if (em->mode < MODE_ENTRY) {
  113. write_err_chart(NETDATA_PROCESS_ERROR_NAME, NETDATA_EBPF_SYSTEM_GROUP,
  114. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK], 2);
  115. }
  116. }
  117. /**
  118. * Sum values for pid
  119. *
  120. * @param root the structure with all available PIDs
  121. *
  122. * @param offset the address that we are reading
  123. *
  124. * @return it returns the sum of all PIDs
  125. */
  126. long long ebpf_process_sum_values_for_pids(struct pid_on_target *root, size_t offset)
  127. {
  128. long long ret = 0;
  129. while (root) {
  130. int32_t pid = root->pid;
  131. ebpf_process_publish_apps_t *w = current_apps_data[pid];
  132. if (w) {
  133. ret += get_value_from_structure((char *)w, offset);
  134. }
  135. root = root->next;
  136. }
  137. return ret;
  138. }
  139. /**
  140. * Remove process pid
  141. *
  142. * Remove from PID task table when task_release was called.
  143. */
  144. void ebpf_process_remove_pids()
  145. {
  146. struct pid_stat *pids = root_of_pids;
  147. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  148. while (pids) {
  149. uint32_t pid = pids->pid;
  150. ebpf_process_stat_t *w = global_process_stats[pid];
  151. if (w) {
  152. if (w->removeme) {
  153. freez(w);
  154. global_process_stats[pid] = NULL;
  155. bpf_map_delete_elem(pid_fd, &pid);
  156. }
  157. }
  158. pids = pids->next;
  159. }
  160. }
  161. /**
  162. * Send data to Netdata calling auxiliary functions.
  163. *
  164. * @param root the target list.
  165. */
  166. void ebpf_process_send_apps_data(struct target *root, ebpf_module_t *em)
  167. {
  168. struct target *w;
  169. collected_number value;
  170. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_PROCESS);
  171. for (w = root; w; w = w->next) {
  172. if (unlikely(w->exposed && w->processes)) {
  173. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t, create_process));
  174. write_chart_dimension(w->name, value);
  175. }
  176. }
  177. write_end_chart();
  178. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_THREAD);
  179. for (w = root; w; w = w->next) {
  180. if (unlikely(w->exposed && w->processes)) {
  181. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t, create_thread));
  182. write_chart_dimension(w->name, value);
  183. }
  184. }
  185. write_end_chart();
  186. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_EXIT);
  187. for (w = root; w; w = w->next) {
  188. if (unlikely(w->exposed && w->processes)) {
  189. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t,
  190. call_do_exit));
  191. write_chart_dimension(w->name, value);
  192. }
  193. }
  194. write_end_chart();
  195. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_CLOSE);
  196. for (w = root; w; w = w->next) {
  197. if (unlikely(w->exposed && w->processes)) {
  198. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t,
  199. call_release_task));
  200. write_chart_dimension(w->name, value);
  201. }
  202. }
  203. write_end_chart();
  204. if (em->mode < MODE_ENTRY) {
  205. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_ERROR);
  206. for (w = root; w; w = w->next) {
  207. if (unlikely(w->exposed && w->processes)) {
  208. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t,
  209. task_err));
  210. write_chart_dimension(w->name, value);
  211. }
  212. }
  213. write_end_chart();
  214. }
  215. ebpf_process_remove_pids();
  216. }
  217. /*****************************************************************
  218. *
  219. * READ INFORMATION FROM KERNEL RING
  220. *
  221. *****************************************************************/
  222. /**
  223. * Read the hash table and store data to allocated vectors.
  224. */
  225. static void read_hash_global_tables()
  226. {
  227. uint64_t idx;
  228. netdata_idx_t res[NETDATA_KEY_END_VECTOR];
  229. netdata_idx_t *val = process_hash_values;
  230. int fd = process_maps[NETDATA_PROCESS_GLOBAL_TABLE].map_fd;
  231. for (idx = 0; idx < NETDATA_KEY_END_VECTOR; idx++) {
  232. if (!bpf_map_lookup_elem(fd, &idx, val)) {
  233. uint64_t total = 0;
  234. int i;
  235. int end = ebpf_nprocs;
  236. for (i = 0; i < end; i++)
  237. total += val[i];
  238. res[idx] = total;
  239. } else {
  240. res[idx] = 0;
  241. }
  242. }
  243. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_EXIT].call = res[NETDATA_KEY_CALLS_DO_EXIT];
  244. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].call = res[NETDATA_KEY_CALLS_RELEASE_TASK];
  245. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_FORK].call = res[NETDATA_KEY_CALLS_DO_FORK];
  246. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_CLONE].call = res[NETDATA_KEY_CALLS_SYS_CLONE];
  247. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_FORK].ecall = res[NETDATA_KEY_ERROR_DO_FORK];
  248. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_CLONE].ecall = res[NETDATA_KEY_ERROR_SYS_CLONE];
  249. }
  250. /**
  251. * Read the hash table and store data to allocated vectors.
  252. */
  253. static void ebpf_process_update_apps_data()
  254. {
  255. struct pid_stat *pids = root_of_pids;
  256. while (pids) {
  257. uint32_t current_pid = pids->pid;
  258. ebpf_process_stat_t *ps = global_process_stats[current_pid];
  259. if (!ps) {
  260. pids = pids->next;
  261. continue;
  262. }
  263. ebpf_process_publish_apps_t *cad = current_apps_data[current_pid];
  264. if (!cad) {
  265. cad = callocz(1, sizeof(ebpf_process_publish_apps_t));
  266. current_apps_data[current_pid] = cad;
  267. }
  268. //Read data
  269. cad->call_do_exit = ps->exit_call;
  270. cad->call_release_task = ps->release_call;
  271. cad->create_process = ps->create_process;
  272. cad->create_thread = ps->create_thread;
  273. cad->task_err = ps->task_err;
  274. pids = pids->next;
  275. }
  276. }
  277. /**
  278. * Update cgroup
  279. *
  280. * Update cgroup data based in
  281. */
  282. static void ebpf_update_process_cgroup()
  283. {
  284. ebpf_cgroup_target_t *ect ;
  285. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  286. pthread_mutex_lock(&mutex_cgroup_shm);
  287. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  288. struct pid_on_target2 *pids;
  289. for (pids = ect->pids; pids; pids = pids->next) {
  290. int pid = pids->pid;
  291. ebpf_process_stat_t *out = &pids->ps;
  292. if (global_process_stats[pid]) {
  293. ebpf_process_stat_t *in = global_process_stats[pid];
  294. memcpy(out, in, sizeof(ebpf_process_stat_t));
  295. } else {
  296. if (bpf_map_lookup_elem(pid_fd, &pid, out)) {
  297. memset(out, 0, sizeof(ebpf_process_stat_t));
  298. }
  299. }
  300. }
  301. }
  302. pthread_mutex_unlock(&mutex_cgroup_shm);
  303. }
  304. /*****************************************************************
  305. *
  306. * FUNCTIONS TO CREATE CHARTS
  307. *
  308. *****************************************************************/
  309. /**
  310. * Create process status chart
  311. *
  312. * @param family the chart family
  313. * @param name the chart name
  314. * @param axis the axis label
  315. * @param web the group name used to attach the chart on dashboard
  316. * @param order the order number of the specified chart
  317. * @param update_every value to overwrite the update frequency set by the server.
  318. */
  319. static void ebpf_process_status_chart(char *family, char *name, char *axis,
  320. char *web, char *algorithm, int order, int update_every)
  321. {
  322. printf("CHART %s.%s '' 'Process not closed' '%s' '%s' '' line %d %d '' 'ebpf.plugin' 'process'\n",
  323. family,
  324. name,
  325. axis,
  326. web,
  327. order,
  328. update_every);
  329. printf("DIMENSION %s '' %s 1 1\n", status[0], algorithm);
  330. printf("DIMENSION %s '' %s 1 1\n", status[1], algorithm);
  331. }
  332. /**
  333. * Create global charts
  334. *
  335. * Call ebpf_create_chart to create the charts for the collector.
  336. *
  337. * @param em a pointer to the structure with the default values.
  338. */
  339. static void ebpf_create_global_charts(ebpf_module_t *em)
  340. {
  341. ebpf_create_chart(NETDATA_EBPF_SYSTEM_GROUP,
  342. NETDATA_PROCESS_SYSCALL,
  343. "Start process",
  344. EBPF_COMMON_DIMENSION_CALL,
  345. NETDATA_PROCESS_GROUP,
  346. NULL,
  347. NETDATA_EBPF_CHART_TYPE_LINE,
  348. 21002,
  349. ebpf_create_global_dimension,
  350. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK],
  351. 2, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  352. ebpf_create_chart(NETDATA_EBPF_SYSTEM_GROUP,
  353. NETDATA_EXIT_SYSCALL,
  354. "Exit process",
  355. EBPF_COMMON_DIMENSION_CALL,
  356. NETDATA_PROCESS_GROUP,
  357. NULL,
  358. NETDATA_EBPF_CHART_TYPE_LINE,
  359. 21003,
  360. ebpf_create_global_dimension,
  361. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT],
  362. 2, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  363. ebpf_process_status_chart(NETDATA_EBPF_SYSTEM_GROUP,
  364. NETDATA_PROCESS_STATUS_NAME,
  365. EBPF_COMMON_DIMENSION_DIFFERENCE,
  366. NETDATA_PROCESS_GROUP,
  367. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  368. 21004, em->update_every);
  369. if (em->mode < MODE_ENTRY) {
  370. ebpf_create_chart(NETDATA_EBPF_SYSTEM_GROUP,
  371. NETDATA_PROCESS_ERROR_NAME,
  372. "Fails to create process",
  373. EBPF_COMMON_DIMENSION_CALL,
  374. NETDATA_PROCESS_GROUP,
  375. NULL,
  376. NETDATA_EBPF_CHART_TYPE_LINE,
  377. 21005,
  378. ebpf_create_global_dimension,
  379. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK],
  380. 2, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  381. }
  382. }
  383. /**
  384. * Create chart for Statistic Thread
  385. *
  386. * Write to standard output current values for threads.
  387. *
  388. * @param em a pointer to the structure with the default values.
  389. */
  390. static inline void ebpf_create_statistic_thread_chart(ebpf_module_t *em)
  391. {
  392. ebpf_write_chart_cmd(NETDATA_MONITORING_FAMILY,
  393. NETDATA_EBPF_THREADS,
  394. "Threads info.",
  395. "threads",
  396. NETDATA_EBPF_FAMILY,
  397. NETDATA_EBPF_CHART_TYPE_LINE,
  398. NULL,
  399. 140000,
  400. em->update_every,
  401. NETDATA_EBPF_MODULE_NAME_PROCESS);
  402. ebpf_write_global_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_TOTAL],
  403. threads_stat[NETDATA_EBPF_THREAD_STAT_TOTAL],
  404. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  405. ebpf_write_global_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_RUNNING],
  406. threads_stat[NETDATA_EBPF_THREAD_STAT_RUNNING],
  407. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  408. }
  409. /**
  410. * Create chart for Load Thread
  411. *
  412. * Write to standard output current values for load mode.
  413. *
  414. * @param em a pointer to the structure with the default values.
  415. */
  416. static inline void ebpf_create_statistic_load_chart(ebpf_module_t *em)
  417. {
  418. ebpf_write_chart_cmd(NETDATA_MONITORING_FAMILY,
  419. NETDATA_EBPF_LOAD_METHOD,
  420. "Load info.",
  421. "methods",
  422. NETDATA_EBPF_FAMILY,
  423. NETDATA_EBPF_CHART_TYPE_LINE,
  424. NULL,
  425. 140001,
  426. em->update_every,
  427. NETDATA_EBPF_MODULE_NAME_PROCESS);
  428. ebpf_write_global_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_LEGACY],
  429. load_event_stat[NETDATA_EBPF_LOAD_STAT_LEGACY],
  430. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  431. ebpf_write_global_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_CORE],
  432. load_event_stat[NETDATA_EBPF_LOAD_STAT_CORE],
  433. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  434. }
  435. /**
  436. * Create Statistics Charts
  437. *
  438. * Create charts that will show statistics related to eBPF plugin.
  439. *
  440. * @param em a pointer to the structure with the default values.
  441. */
  442. static void ebpf_create_statistic_charts(ebpf_module_t *em)
  443. {
  444. ebpf_create_statistic_thread_chart(em);
  445. ebpf_create_statistic_load_chart(em);
  446. }
  447. /**
  448. * Create process apps charts
  449. *
  450. * Call ebpf_create_chart to create the charts on apps submenu.
  451. *
  452. * @param em a pointer to the structure with the default values.
  453. * @param ptr a pointer for the targets.
  454. */
  455. void ebpf_process_create_apps_charts(struct ebpf_module *em, void *ptr)
  456. {
  457. struct target *root = ptr;
  458. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_PROCESS,
  459. "Process started",
  460. EBPF_COMMON_DIMENSION_CALL,
  461. NETDATA_PROCESS_GROUP,
  462. NETDATA_EBPF_CHART_TYPE_STACKED,
  463. 20065,
  464. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  465. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  466. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_THREAD,
  467. "Threads started",
  468. EBPF_COMMON_DIMENSION_CALL,
  469. NETDATA_PROCESS_GROUP,
  470. NETDATA_EBPF_CHART_TYPE_STACKED,
  471. 20066,
  472. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  473. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  474. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_EXIT,
  475. "Tasks starts exit process.",
  476. EBPF_COMMON_DIMENSION_CALL,
  477. NETDATA_PROCESS_GROUP,
  478. NETDATA_EBPF_CHART_TYPE_STACKED,
  479. 20067,
  480. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  481. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  482. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_CLOSE,
  483. "Tasks closed",
  484. EBPF_COMMON_DIMENSION_CALL,
  485. NETDATA_PROCESS_GROUP,
  486. NETDATA_EBPF_CHART_TYPE_STACKED,
  487. 20068,
  488. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  489. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  490. if (em->mode < MODE_ENTRY) {
  491. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_ERROR,
  492. "Errors to create process or threads.",
  493. EBPF_COMMON_DIMENSION_CALL,
  494. NETDATA_PROCESS_GROUP,
  495. NETDATA_EBPF_CHART_TYPE_STACKED,
  496. 20069,
  497. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  498. root,
  499. em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  500. }
  501. }
  502. /**
  503. * Create apps charts
  504. *
  505. * Call ebpf_create_chart to create the charts on apps submenu.
  506. *
  507. * @param root a pointer for the targets.
  508. */
  509. static void ebpf_create_apps_charts(struct target *root)
  510. {
  511. struct target *w;
  512. int newly_added = 0;
  513. for (w = root; w; w = w->next) {
  514. if (w->target)
  515. continue;
  516. if (unlikely(w->processes && (debug_enabled || w->debug_enabled))) {
  517. struct pid_on_target *pid_on_target;
  518. fprintf(
  519. stderr, "ebpf.plugin: target '%s' has aggregated %u process%s:", w->name, w->processes,
  520. (w->processes == 1) ? "" : "es");
  521. for (pid_on_target = w->root_pid; pid_on_target; pid_on_target = pid_on_target->next) {
  522. fprintf(stderr, " %d", pid_on_target->pid);
  523. }
  524. fputc('\n', stderr);
  525. }
  526. if (!w->exposed && w->processes) {
  527. newly_added++;
  528. w->exposed = 1;
  529. if (debug_enabled || w->debug_enabled)
  530. debug_log_int("%s just added - regenerating charts.", w->name);
  531. }
  532. }
  533. if (!newly_added)
  534. return;
  535. int counter;
  536. for (counter = 0; ebpf_modules[counter].thread_name; counter++) {
  537. ebpf_module_t *current = &ebpf_modules[counter];
  538. if (current->enabled && current->apps_charts && current->apps_routine)
  539. current->apps_routine(current, root);
  540. }
  541. }
  542. /*****************************************************************
  543. *
  544. * FUNCTIONS WITH THE MAIN LOOP
  545. *
  546. *****************************************************************/
  547. /**
  548. * Cgroup update shm
  549. *
  550. * This is the thread callback.
  551. * This thread is necessary, because we cannot freeze the whole plugin to read the data from shared memory.
  552. *
  553. * @param ptr It is a NULL value for this thread.
  554. *
  555. * @return It always returns NULL.
  556. */
  557. void *ebpf_cgroup_update_shm(void *ptr)
  558. {
  559. UNUSED(ptr);
  560. heartbeat_t hb;
  561. heartbeat_init(&hb);
  562. usec_t step = 30 * USEC_PER_SEC;
  563. while (!close_ebpf_plugin) {
  564. usec_t dt = heartbeat_next(&hb, step);
  565. (void)dt;
  566. if (close_ebpf_plugin)
  567. break;
  568. if (!shm_ebpf_cgroup.header)
  569. ebpf_map_cgroup_shared_memory();
  570. ebpf_parse_cgroup_shm_data();
  571. }
  572. return NULL;
  573. }
  574. /**
  575. * Sum PIDs
  576. *
  577. * Sum values for all targets.
  578. *
  579. * @param ps structure used to store data
  580. * @param pids input data
  581. */
  582. static void ebpf_process_sum_cgroup_pids(ebpf_process_stat_t *ps, struct pid_on_target2 *pids)
  583. {
  584. ebpf_process_stat_t accumulator;
  585. memset(&accumulator, 0, sizeof(accumulator));
  586. while (pids) {
  587. ebpf_process_stat_t *ps = &pids->ps;
  588. accumulator.exit_call += ps->exit_call;
  589. accumulator.release_call += ps->release_call;
  590. accumulator.create_process += ps->create_process;
  591. accumulator.create_thread += ps->create_thread;
  592. accumulator.task_err += ps->task_err;
  593. pids = pids->next;
  594. }
  595. ps->exit_call = (accumulator.exit_call >= ps->exit_call) ? accumulator.exit_call : ps->exit_call;
  596. ps->release_call = (accumulator.release_call >= ps->release_call) ? accumulator.release_call : ps->release_call;
  597. ps->create_process = (accumulator.create_process >= ps->create_process) ? accumulator.create_process : ps->create_process;
  598. ps->create_thread = (accumulator.create_thread >= ps->create_thread) ? accumulator.create_thread : ps->create_thread;
  599. ps->task_err = (accumulator.task_err >= ps->task_err) ? accumulator.task_err : ps->task_err;
  600. }
  601. /*
  602. * Send Specific Process data
  603. *
  604. * Send data for specific cgroup/apps.
  605. *
  606. * @param type chart type
  607. * @param values structure with values that will be sent to netdata
  608. * @param em the structure with thread information
  609. */
  610. static void ebpf_send_specific_process_data(char *type, ebpf_process_stat_t *values, ebpf_module_t *em)
  611. {
  612. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_PROCESS);
  613. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK].name,
  614. (long long) values->create_process);
  615. write_end_chart();
  616. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_THREAD);
  617. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_CLONE].name,
  618. (long long) values->create_thread);
  619. write_end_chart();
  620. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_EXIT);
  621. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT].name,
  622. (long long) values->release_call);
  623. write_end_chart();
  624. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_CLOSE);
  625. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].name,
  626. (long long) values->release_call);
  627. write_end_chart();
  628. if (em->mode < MODE_ENTRY) {
  629. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_ERROR);
  630. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT].name,
  631. (long long) values->task_err);
  632. write_end_chart();
  633. }
  634. }
  635. /**
  636. * Create specific process charts
  637. *
  638. * Create charts for cgroup/application
  639. *
  640. * @param type the chart type.
  641. * @param em the structure with thread information
  642. */
  643. static void ebpf_create_specific_process_charts(char *type, ebpf_module_t *em)
  644. {
  645. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_PROCESS, "Process started",
  646. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  647. NETDATA_CGROUP_PROCESS_CREATE_CONTEXT, NETDATA_EBPF_CHART_TYPE_LINE,
  648. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5000,
  649. ebpf_create_global_dimension, &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK],
  650. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  651. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_THREAD, "Threads started",
  652. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  653. NETDATA_CGROUP_THREAD_CREATE_CONTEXT, NETDATA_EBPF_CHART_TYPE_LINE,
  654. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5001,
  655. ebpf_create_global_dimension,
  656. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_CLONE],
  657. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  658. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_EXIT, "Tasks starts exit process.",
  659. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  660. NETDATA_CGROUP_PROCESS_EXIT_CONTEXT,
  661. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5002,
  662. ebpf_create_global_dimension,
  663. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT],
  664. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  665. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_CLOSE, "Tasks closed",
  666. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  667. NETDATA_CGROUP_PROCESS_CLOSE_CONTEXT,
  668. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5003,
  669. ebpf_create_global_dimension,
  670. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK],
  671. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  672. if (em->mode < MODE_ENTRY) {
  673. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_ERROR, "Errors to create process or threads.",
  674. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  675. NETDATA_CGROUP_PROCESS_ERROR_CONTEXT,
  676. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5004,
  677. ebpf_create_global_dimension,
  678. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT],
  679. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  680. }
  681. }
  682. /**
  683. * Obsolete specific process charts
  684. *
  685. * Obsolete charts for cgroup/application
  686. *
  687. * @param type the chart type.
  688. * @param em the structure with thread information
  689. */
  690. static void ebpf_obsolete_specific_process_charts(char *type, ebpf_module_t *em)
  691. {
  692. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_PROCESS, "Process started",
  693. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  694. NETDATA_CGROUP_PROCESS_CREATE_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5000,
  695. em->update_every);
  696. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_THREAD, "Threads started",
  697. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  698. NETDATA_CGROUP_THREAD_CREATE_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5001,
  699. em->update_every);
  700. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_EXIT,"Tasks starts exit process.",
  701. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  702. NETDATA_CGROUP_PROCESS_EXIT_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5002,
  703. em->update_every);
  704. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_CLOSE,"Tasks closed",
  705. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  706. NETDATA_CGROUP_PROCESS_CLOSE_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5003,
  707. em->update_every);
  708. if (em->mode < MODE_ENTRY) {
  709. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_ERROR,"Errors to create process or threads.",
  710. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  711. NETDATA_CGROUP_PROCESS_ERROR_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5004,
  712. em->update_every);
  713. }
  714. }
  715. /**
  716. * Create Systemd process Charts
  717. *
  718. * Create charts when systemd is enabled
  719. *
  720. * @param em the structure with thread information
  721. **/
  722. static void ebpf_create_systemd_process_charts(ebpf_module_t *em)
  723. {
  724. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_PROCESS, "Process started",
  725. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  726. NETDATA_EBPF_CHART_TYPE_STACKED, 20065,
  727. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_CREATE_CONTEXT,
  728. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  729. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_THREAD, "Threads started",
  730. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  731. NETDATA_EBPF_CHART_TYPE_STACKED, 20066,
  732. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_THREAD_CREATE_CONTEXT,
  733. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  734. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_CLOSE, "Tasks starts exit process.",
  735. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  736. NETDATA_EBPF_CHART_TYPE_STACKED, 20067,
  737. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_EXIT_CONTEXT,
  738. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  739. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_EXIT, "Tasks closed",
  740. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  741. NETDATA_EBPF_CHART_TYPE_STACKED, 20068,
  742. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_CLOSE_CONTEXT,
  743. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  744. if (em->mode < MODE_ENTRY) {
  745. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_ERROR, "Errors to create process or threads.",
  746. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  747. NETDATA_EBPF_CHART_TYPE_STACKED, 20069,
  748. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_ERROR_CONTEXT,
  749. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  750. }
  751. }
  752. /**
  753. * Send Systemd charts
  754. *
  755. * Send collected data to Netdata.
  756. *
  757. * @param em the structure with thread information
  758. *
  759. * @return It returns the status for chart creation, if it is necessary to remove a specific dimension, zero is returned
  760. * otherwise function returns 1 to avoid chart recreation
  761. */
  762. static int ebpf_send_systemd_process_charts(ebpf_module_t *em)
  763. {
  764. int ret = 1;
  765. ebpf_cgroup_target_t *ect;
  766. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_PROCESS);
  767. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  768. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  769. write_chart_dimension(ect->name, ect->publish_systemd_ps.create_process);
  770. } else
  771. ret = 0;
  772. }
  773. write_end_chart();
  774. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_THREAD);
  775. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  776. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  777. write_chart_dimension(ect->name, ect->publish_systemd_ps.create_thread);
  778. }
  779. }
  780. write_end_chart();
  781. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_EXIT);
  782. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  783. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  784. write_chart_dimension(ect->name, ect->publish_systemd_ps.exit_call);
  785. }
  786. }
  787. write_end_chart();
  788. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_CLOSE);
  789. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  790. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  791. write_chart_dimension(ect->name, ect->publish_systemd_ps.release_call);
  792. }
  793. }
  794. write_end_chart();
  795. if (em->mode < MODE_ENTRY) {
  796. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_ERROR);
  797. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  798. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  799. write_chart_dimension(ect->name, ect->publish_systemd_ps.task_err);
  800. }
  801. }
  802. write_end_chart();
  803. }
  804. return ret;
  805. }
  806. /**
  807. * Send data to Netdata calling auxiliary functions.
  808. *
  809. * @param em the structure with thread information
  810. */
  811. static void ebpf_process_send_cgroup_data(ebpf_module_t *em)
  812. {
  813. if (!ebpf_cgroup_pids)
  814. return;
  815. pthread_mutex_lock(&mutex_cgroup_shm);
  816. ebpf_cgroup_target_t *ect;
  817. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  818. ebpf_process_sum_cgroup_pids(&ect->publish_systemd_ps, ect->pids);
  819. }
  820. int has_systemd = shm_ebpf_cgroup.header->systemd_enabled;
  821. if (has_systemd) {
  822. static int systemd_chart = 0;
  823. if (!systemd_chart) {
  824. ebpf_create_systemd_process_charts(em);
  825. systemd_chart = 1;
  826. }
  827. systemd_chart = ebpf_send_systemd_process_charts(em);
  828. }
  829. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  830. if (ect->systemd)
  831. continue;
  832. if (!(ect->flags & NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART) && ect->updated) {
  833. ebpf_create_specific_process_charts(ect->name, em);
  834. ect->flags |= NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART;
  835. }
  836. if (ect->flags & NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART) {
  837. if (ect->updated) {
  838. ebpf_send_specific_process_data(ect->name, &ect->publish_systemd_ps, em);
  839. } else {
  840. ebpf_obsolete_specific_process_charts(ect->name, em);
  841. ect->flags &= ~NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART;
  842. }
  843. }
  844. }
  845. pthread_mutex_unlock(&mutex_cgroup_shm);
  846. }
  847. /**
  848. * Update Cgroup algorithm
  849. *
  850. * Change algorithm from absolute to incremental
  851. */
  852. void ebpf_process_update_cgroup_algorithm()
  853. {
  854. int i;
  855. for (i = 0; i < NETDATA_KEY_PUBLISH_PROCESS_END; i++) {
  856. netdata_publish_syscall_t *ptr = &process_publish_aggregated[i];
  857. freez(ptr->algorithm);
  858. ptr->algorithm = strdupz(ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX]);
  859. }
  860. }
  861. /**
  862. * Send Statistic Data
  863. *
  864. * Send statistic information to netdata.
  865. */
  866. void ebpf_send_statistic_data()
  867. {
  868. write_begin_chart(NETDATA_MONITORING_FAMILY, NETDATA_EBPF_THREADS);
  869. write_chart_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_TOTAL], (long long)plugin_statistics.threads);
  870. write_chart_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_RUNNING], (long long)plugin_statistics.running);
  871. write_end_chart();
  872. write_begin_chart(NETDATA_MONITORING_FAMILY, NETDATA_EBPF_LOAD_METHOD);
  873. write_chart_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_LEGACY], (long long)plugin_statistics.legacy);
  874. write_chart_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_CORE], (long long)plugin_statistics.core);
  875. write_end_chart();
  876. }
  877. /**
  878. * Main loop for this collector.
  879. *
  880. * @param em the structure with thread information
  881. */
  882. static void process_collector(ebpf_module_t *em)
  883. {
  884. cgroup_thread.thread = mallocz(sizeof(netdata_thread_t));
  885. cgroup_thread.start_routine = ebpf_cgroup_update_shm;
  886. netdata_thread_create(cgroup_thread.thread, cgroup_thread.name, NETDATA_THREAD_OPTION_JOINABLE,
  887. ebpf_cgroup_update_shm, em);
  888. heartbeat_t hb;
  889. heartbeat_init(&hb);
  890. int publish_global = em->global_charts;
  891. int apps_enabled = em->apps_charts;
  892. int cgroups = em->cgroup_charts;
  893. int thread_enabled = em->enabled;
  894. if (cgroups)
  895. ebpf_process_update_cgroup_algorithm();
  896. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  897. int update_every = em->update_every;
  898. int counter = update_every - 1;
  899. while (!close_ebpf_plugin) {
  900. usec_t dt = heartbeat_next(&hb, USEC_PER_SEC);
  901. (void)dt;
  902. pthread_mutex_lock(&collect_data_mutex);
  903. cleanup_exited_pids();
  904. collect_data_for_all_processes(pid_fd);
  905. ebpf_create_apps_charts(apps_groups_root_target);
  906. pthread_cond_broadcast(&collect_data_cond_var);
  907. pthread_mutex_unlock(&collect_data_mutex);
  908. if (++counter == update_every) {
  909. counter = 0;
  910. read_hash_global_tables();
  911. int publish_apps = 0;
  912. if (all_pids_count > 0) {
  913. if (apps_enabled) {
  914. publish_apps = 1;
  915. ebpf_process_update_apps_data();
  916. }
  917. if (cgroups) {
  918. ebpf_update_process_cgroup();
  919. }
  920. }
  921. pthread_mutex_lock(&lock);
  922. ebpf_send_statistic_data();
  923. if (thread_enabled) {
  924. if (publish_global) {
  925. ebpf_process_send_data(em);
  926. }
  927. if (publish_apps) {
  928. ebpf_process_send_apps_data(apps_groups_root_target, em);
  929. }
  930. if (cgroups) {
  931. ebpf_process_send_cgroup_data(em);
  932. }
  933. }
  934. pthread_mutex_unlock(&lock);
  935. }
  936. fflush(stdout);
  937. }
  938. }
  939. /*****************************************************************
  940. *
  941. * FUNCTIONS TO CLOSE THE THREAD
  942. *
  943. *****************************************************************/
  944. void clean_global_memory() {
  945. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  946. struct pid_stat *pids = root_of_pids;
  947. while (pids) {
  948. uint32_t pid = pids->pid;
  949. freez(global_process_stats[pid]);
  950. bpf_map_delete_elem(pid_fd, &pid);
  951. freez(current_apps_data[pid]);
  952. pids = pids->next;
  953. }
  954. }
  955. /**
  956. * Process disable tracepoints
  957. *
  958. * Disable tracepoints when the plugin was responsible to enable it.
  959. */
  960. static void ebpf_process_disable_tracepoints()
  961. {
  962. char *default_message = { "Cannot disable the tracepoint" };
  963. if (!was_sched_process_exit_enabled) {
  964. if (ebpf_disable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exit))
  965. error("%s %s/%s.", default_message, tracepoint_sched_type, tracepoint_sched_process_exit);
  966. }
  967. if (!was_sched_process_exec_enabled) {
  968. if (ebpf_disable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exec))
  969. error("%s %s/%s.", default_message, tracepoint_sched_type, tracepoint_sched_process_exec);
  970. }
  971. if (!was_sched_process_fork_enabled) {
  972. if (ebpf_disable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_fork))
  973. error("%s %s/%s.", default_message, tracepoint_sched_type, tracepoint_sched_process_fork);
  974. }
  975. }
  976. /**
  977. * Clean up the main thread.
  978. *
  979. * @param ptr thread data.
  980. */
  981. static void ebpf_process_cleanup(void *ptr)
  982. {
  983. UNUSED(ptr);
  984. heartbeat_t hb;
  985. heartbeat_init(&hb);
  986. uint32_t tick = 1 * USEC_PER_SEC;
  987. while (!finalized_threads) {
  988. usec_t dt = heartbeat_next(&hb, tick);
  989. UNUSED(dt);
  990. }
  991. ebpf_cleanup_publish_syscall(process_publish_aggregated);
  992. freez(process_hash_values);
  993. clean_global_memory();
  994. freez(global_process_stats);
  995. freez(current_apps_data);
  996. ebpf_process_disable_tracepoints();
  997. if (probe_links) {
  998. struct bpf_program *prog;
  999. size_t i = 0 ;
  1000. bpf_object__for_each_program(prog, objects) {
  1001. bpf_link__destroy(probe_links[i]);
  1002. i++;
  1003. }
  1004. bpf_object__close(objects);
  1005. }
  1006. freez(cgroup_thread.thread);
  1007. }
  1008. /*****************************************************************
  1009. *
  1010. * FUNCTIONS TO START THREAD
  1011. *
  1012. *****************************************************************/
  1013. /**
  1014. * Allocate vectors used with this thread.
  1015. * We are not testing the return, because callocz does this and shutdown the software
  1016. * case it was not possible to allocate.
  1017. *
  1018. * @param length is the length for the vectors used inside the collector.
  1019. */
  1020. static void ebpf_process_allocate_global_vectors(size_t length)
  1021. {
  1022. memset(process_aggregated_data, 0, length * sizeof(netdata_syscall_stat_t));
  1023. memset(process_publish_aggregated, 0, length * sizeof(netdata_publish_syscall_t));
  1024. process_hash_values = callocz(ebpf_nprocs, sizeof(netdata_idx_t));
  1025. global_process_stats = callocz((size_t)pid_max, sizeof(ebpf_process_stat_t *));
  1026. current_apps_data = callocz((size_t)pid_max, sizeof(ebpf_process_publish_apps_t *));
  1027. }
  1028. static void change_syscalls()
  1029. {
  1030. static char *lfork = { "do_fork" };
  1031. process_id_names[NETDATA_KEY_PUBLISH_PROCESS_FORK] = lfork;
  1032. }
  1033. /**
  1034. * Set local variables
  1035. *
  1036. */
  1037. static void set_local_pointers()
  1038. {
  1039. if (isrh >= NETDATA_MINIMUM_RH_VERSION && isrh < NETDATA_RH_8)
  1040. change_syscalls();
  1041. }
  1042. /*****************************************************************
  1043. *
  1044. * EBPF PROCESS THREAD
  1045. *
  1046. *****************************************************************/
  1047. /**
  1048. *
  1049. */
  1050. static void wait_for_all_threads_die()
  1051. {
  1052. ebpf_modules[EBPF_MODULE_PROCESS_IDX].enabled = 0;
  1053. heartbeat_t hb;
  1054. heartbeat_init(&hb);
  1055. int max = 10;
  1056. int i;
  1057. for (i = 0; i < max; i++) {
  1058. heartbeat_next(&hb, 200000);
  1059. size_t j, counter = 0, compare = 0;
  1060. for (j = 0; ebpf_modules[j].thread_name; j++) {
  1061. if (!ebpf_modules[j].enabled)
  1062. counter++;
  1063. compare++;
  1064. }
  1065. if (counter == compare)
  1066. break;
  1067. }
  1068. }
  1069. /**
  1070. * Enable tracepoints
  1071. *
  1072. * Enable necessary tracepoints for thread.
  1073. *
  1074. * @return It returns 0 on success and -1 otherwise
  1075. */
  1076. static int ebpf_process_enable_tracepoints()
  1077. {
  1078. int test = ebpf_is_tracepoint_enabled(tracepoint_sched_type, tracepoint_sched_process_exit);
  1079. if (test == -1)
  1080. return -1;
  1081. else if (!test) {
  1082. if (ebpf_enable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exit))
  1083. return -1;
  1084. }
  1085. was_sched_process_exit_enabled = test;
  1086. test = ebpf_is_tracepoint_enabled(tracepoint_sched_type, tracepoint_sched_process_exec);
  1087. if (test == -1)
  1088. return -1;
  1089. else if (!test) {
  1090. if (ebpf_enable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exec))
  1091. return -1;
  1092. }
  1093. was_sched_process_exec_enabled = test;
  1094. test = ebpf_is_tracepoint_enabled(tracepoint_sched_type, tracepoint_sched_process_fork);
  1095. if (test == -1)
  1096. return -1;
  1097. else if (!test) {
  1098. if (ebpf_enable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_fork))
  1099. return -1;
  1100. }
  1101. was_sched_process_fork_enabled = test;
  1102. return 0;
  1103. }
  1104. /**
  1105. * Process thread
  1106. *
  1107. * Thread used to generate process charts.
  1108. *
  1109. * @param ptr a pointer to `struct ebpf_module`
  1110. *
  1111. * @return It always return NULL
  1112. */
  1113. void *ebpf_process_thread(void *ptr)
  1114. {
  1115. netdata_thread_cleanup_push(ebpf_process_cleanup, ptr);
  1116. ebpf_module_t *em = (ebpf_module_t *)ptr;
  1117. em->maps = process_maps;
  1118. if (ebpf_process_enable_tracepoints()) {
  1119. em->enabled = em->global_charts = em->apps_charts = em->cgroup_charts = CONFIG_BOOLEAN_NO;
  1120. }
  1121. process_enabled = em->enabled;
  1122. pthread_mutex_lock(&lock);
  1123. ebpf_process_allocate_global_vectors(NETDATA_KEY_PUBLISH_PROCESS_END);
  1124. ebpf_update_pid_table(&process_maps[0], em);
  1125. set_local_pointers();
  1126. probe_links = ebpf_load_program(ebpf_plugin_dir, em, running_on_kernel, isrh, &objects);
  1127. if (!probe_links) {
  1128. em->enabled = CONFIG_BOOLEAN_NO;
  1129. pthread_mutex_unlock(&lock);
  1130. goto endprocess;
  1131. }
  1132. int algorithms[NETDATA_KEY_PUBLISH_PROCESS_END] = {
  1133. NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX
  1134. };
  1135. ebpf_global_labels(
  1136. process_aggregated_data, process_publish_aggregated, process_dimension_names, process_id_names,
  1137. algorithms, NETDATA_KEY_PUBLISH_PROCESS_END);
  1138. if (process_enabled) {
  1139. ebpf_create_global_charts(em);
  1140. }
  1141. ebpf_update_stats(&plugin_statistics, em);
  1142. ebpf_create_statistic_charts(em);
  1143. pthread_mutex_unlock(&lock);
  1144. process_collector(em);
  1145. endprocess:
  1146. if (!em->enabled)
  1147. ebpf_update_disabled_plugin_stats(em);
  1148. wait_for_all_threads_die();
  1149. netdata_thread_cleanup_pop(1);
  1150. return NULL;
  1151. }