ebpf_process.c 48 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include <sys/resource.h>
  3. #include "ebpf.h"
  4. #include "ebpf_process.h"
  5. /*****************************************************************
  6. *
  7. * GLOBAL VARIABLES
  8. *
  9. *****************************************************************/
  10. static char *process_dimension_names[NETDATA_KEY_PUBLISH_PROCESS_END] = { "process", "task", "process", "thread" };
  11. static char *process_id_names[NETDATA_KEY_PUBLISH_PROCESS_END] = { "do_exit", "release_task", "_do_fork", "sys_clone" };
  12. static char *status[] = { "process", "zombie" };
  13. static ebpf_local_maps_t process_maps[] = {{.name = "tbl_pid_stats", .internal_input = ND_EBPF_DEFAULT_PID_SIZE,
  14. .user_input = 0,
  15. .type = NETDATA_EBPF_MAP_RESIZABLE | NETDATA_EBPF_MAP_PID,
  16. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  17. {.name = "tbl_total_stats", .internal_input = NETDATA_KEY_END_VECTOR,
  18. .user_input = 0, .type = NETDATA_EBPF_MAP_STATIC,
  19. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  20. {.name = "process_ctrl", .internal_input = NETDATA_CONTROLLER_END,
  21. .user_input = 0,
  22. .type = NETDATA_EBPF_MAP_CONTROLLER,
  23. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  24. {.name = NULL, .internal_input = 0, .user_input = 0,
  25. .type = NETDATA_EBPF_MAP_CONTROLLER,
  26. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED}};
  27. char *tracepoint_sched_type = { "sched" } ;
  28. char *tracepoint_sched_process_exit = { "sched_process_exit" };
  29. char *tracepoint_sched_process_exec = { "sched_process_exec" };
  30. char *tracepoint_sched_process_fork = { "sched_process_fork" };
  31. static int was_sched_process_exit_enabled = 0;
  32. static int was_sched_process_exec_enabled = 0;
  33. static int was_sched_process_fork_enabled = 0;
  34. static netdata_idx_t *process_hash_values = NULL;
  35. static netdata_syscall_stat_t process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_END];
  36. static netdata_publish_syscall_t process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_END];
  37. ebpf_process_stat_t **global_process_stats = NULL;
  38. ebpf_process_publish_apps_t **current_apps_data = NULL;
  39. int process_enabled = 0;
  40. static struct bpf_object *objects = NULL;
  41. static struct bpf_link **probe_links = NULL;
  42. struct config process_config = { .first_section = NULL,
  43. .last_section = NULL,
  44. .mutex = NETDATA_MUTEX_INITIALIZER,
  45. .index = { .avl_tree = { .root = NULL, .compar = appconfig_section_compare },
  46. .rwlock = AVL_LOCK_INITIALIZER } };
  47. static struct netdata_static_thread cgroup_thread = {"EBPF CGROUP", NULL, NULL,
  48. 1, NULL, NULL, NULL};
  49. static char *threads_stat[NETDATA_EBPF_THREAD_STAT_END] = {"total", "running"};
  50. static char *load_event_stat[NETDATA_EBPF_LOAD_STAT_END] = {"legacy", "co-re"};
  51. /*****************************************************************
  52. *
  53. * PROCESS DATA AND SEND TO NETDATA
  54. *
  55. *****************************************************************/
  56. /**
  57. * Update publish structure before to send data to Netdata.
  58. *
  59. * @param publish the first output structure with independent dimensions
  60. * @param pvc the second output structure with correlated dimensions
  61. * @param input the structure with the input data.
  62. */
  63. static void ebpf_update_global_publish(netdata_publish_syscall_t *publish, netdata_publish_vfs_common_t *pvc,
  64. netdata_syscall_stat_t *input)
  65. {
  66. netdata_publish_syscall_t *move = publish;
  67. int selector = NETDATA_KEY_PUBLISH_PROCESS_EXIT;
  68. while (move) {
  69. move->ncall = (input->call > move->pcall) ? input->call - move->pcall : move->pcall - input->call;
  70. move->nbyte = (input->bytes > move->pbyte) ? input->bytes - move->pbyte : move->pbyte - input->bytes;
  71. move->nerr = (input->ecall > move->nerr) ? input->ecall - move->perr : move->perr - input->ecall;
  72. move->pcall = input->call;
  73. move->pbyte = input->bytes;
  74. move->perr = input->ecall;
  75. input = input->next;
  76. move = move->next;
  77. selector++;
  78. }
  79. pvc->running = (long)publish[NETDATA_KEY_PUBLISH_PROCESS_FORK].ncall -
  80. (long)publish[NETDATA_KEY_PUBLISH_PROCESS_CLONE].ncall;
  81. publish[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].ncall = -publish[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].ncall;
  82. pvc->zombie = (long)publish[NETDATA_KEY_PUBLISH_PROCESS_EXIT].ncall +
  83. (long)publish[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].ncall;
  84. }
  85. /**
  86. * Call the necessary functions to create a chart.
  87. *
  88. * @param family the chart family
  89. * @param move the pointer with the values that will be published
  90. */
  91. static void write_status_chart(char *family, netdata_publish_vfs_common_t *pvc)
  92. {
  93. write_begin_chart(family, NETDATA_PROCESS_STATUS_NAME);
  94. write_chart_dimension(status[0], (long long)pvc->running);
  95. write_chart_dimension(status[1], (long long)pvc->zombie);
  96. write_end_chart();
  97. }
  98. /**
  99. * Send data to Netdata calling auxiliary functions.
  100. *
  101. * @param em the structure with thread information
  102. */
  103. static void ebpf_process_send_data(ebpf_module_t *em)
  104. {
  105. netdata_publish_vfs_common_t pvc;
  106. ebpf_update_global_publish(process_publish_aggregated, &pvc, process_aggregated_data);
  107. write_count_chart(NETDATA_EXIT_SYSCALL, NETDATA_EBPF_SYSTEM_GROUP,
  108. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT], 2);
  109. write_count_chart(NETDATA_PROCESS_SYSCALL, NETDATA_EBPF_SYSTEM_GROUP,
  110. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK], 2);
  111. write_status_chart(NETDATA_EBPF_SYSTEM_GROUP, &pvc);
  112. if (em->mode < MODE_ENTRY) {
  113. write_err_chart(NETDATA_PROCESS_ERROR_NAME, NETDATA_EBPF_SYSTEM_GROUP,
  114. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK], 2);
  115. }
  116. }
  117. /**
  118. * Sum values for pid
  119. *
  120. * @param root the structure with all available PIDs
  121. *
  122. * @param offset the address that we are reading
  123. *
  124. * @return it returns the sum of all PIDs
  125. */
  126. long long ebpf_process_sum_values_for_pids(struct pid_on_target *root, size_t offset)
  127. {
  128. long long ret = 0;
  129. while (root) {
  130. int32_t pid = root->pid;
  131. ebpf_process_publish_apps_t *w = current_apps_data[pid];
  132. if (w) {
  133. ret += get_value_from_structure((char *)w, offset);
  134. }
  135. root = root->next;
  136. }
  137. return ret;
  138. }
  139. /**
  140. * Remove process pid
  141. *
  142. * Remove from PID task table when task_release was called.
  143. */
  144. void ebpf_process_remove_pids()
  145. {
  146. struct pid_stat *pids = root_of_pids;
  147. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  148. while (pids) {
  149. uint32_t pid = pids->pid;
  150. ebpf_process_stat_t *w = global_process_stats[pid];
  151. if (w) {
  152. if (w->removeme) {
  153. freez(w);
  154. global_process_stats[pid] = NULL;
  155. bpf_map_delete_elem(pid_fd, &pid);
  156. }
  157. }
  158. pids = pids->next;
  159. }
  160. }
  161. /**
  162. * Send data to Netdata calling auxiliary functions.
  163. *
  164. * @param root the target list.
  165. */
  166. void ebpf_process_send_apps_data(struct target *root, ebpf_module_t *em)
  167. {
  168. struct target *w;
  169. collected_number value;
  170. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_PROCESS);
  171. for (w = root; w; w = w->next) {
  172. if (unlikely(w->exposed && w->processes)) {
  173. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t, create_process));
  174. write_chart_dimension(w->name, value);
  175. }
  176. }
  177. write_end_chart();
  178. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_THREAD);
  179. for (w = root; w; w = w->next) {
  180. if (unlikely(w->exposed && w->processes)) {
  181. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t, create_thread));
  182. write_chart_dimension(w->name, value);
  183. }
  184. }
  185. write_end_chart();
  186. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_EXIT);
  187. for (w = root; w; w = w->next) {
  188. if (unlikely(w->exposed && w->processes)) {
  189. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t,
  190. call_do_exit));
  191. write_chart_dimension(w->name, value);
  192. }
  193. }
  194. write_end_chart();
  195. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_CLOSE);
  196. for (w = root; w; w = w->next) {
  197. if (unlikely(w->exposed && w->processes)) {
  198. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t,
  199. call_release_task));
  200. write_chart_dimension(w->name, value);
  201. }
  202. }
  203. write_end_chart();
  204. if (em->mode < MODE_ENTRY) {
  205. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_SYSCALL_APPS_TASK_ERROR);
  206. for (w = root; w; w = w->next) {
  207. if (unlikely(w->exposed && w->processes)) {
  208. value = ebpf_process_sum_values_for_pids(w->root_pid, offsetof(ebpf_process_publish_apps_t,
  209. task_err));
  210. write_chart_dimension(w->name, value);
  211. }
  212. }
  213. write_end_chart();
  214. }
  215. ebpf_process_remove_pids();
  216. }
  217. /*****************************************************************
  218. *
  219. * READ INFORMATION FROM KERNEL RING
  220. *
  221. *****************************************************************/
  222. /**
  223. * Read the hash table and store data to allocated vectors.
  224. */
  225. static void read_hash_global_tables()
  226. {
  227. uint64_t idx;
  228. netdata_idx_t res[NETDATA_KEY_END_VECTOR];
  229. netdata_idx_t *val = process_hash_values;
  230. int fd = process_maps[NETDATA_PROCESS_GLOBAL_TABLE].map_fd;
  231. for (idx = 0; idx < NETDATA_KEY_END_VECTOR; idx++) {
  232. if (!bpf_map_lookup_elem(fd, &idx, val)) {
  233. uint64_t total = 0;
  234. int i;
  235. int end = ebpf_nprocs;
  236. for (i = 0; i < end; i++)
  237. total += val[i];
  238. res[idx] = total;
  239. } else {
  240. res[idx] = 0;
  241. }
  242. }
  243. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_EXIT].call = res[NETDATA_KEY_CALLS_DO_EXIT];
  244. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].call = res[NETDATA_KEY_CALLS_RELEASE_TASK];
  245. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_FORK].call = res[NETDATA_KEY_CALLS_DO_FORK];
  246. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_CLONE].call = res[NETDATA_KEY_CALLS_SYS_CLONE];
  247. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_FORK].ecall = res[NETDATA_KEY_ERROR_DO_FORK];
  248. process_aggregated_data[NETDATA_KEY_PUBLISH_PROCESS_CLONE].ecall = res[NETDATA_KEY_ERROR_SYS_CLONE];
  249. }
  250. /**
  251. * Read the hash table and store data to allocated vectors.
  252. */
  253. static void ebpf_process_update_apps_data()
  254. {
  255. struct pid_stat *pids = root_of_pids;
  256. while (pids) {
  257. uint32_t current_pid = pids->pid;
  258. ebpf_process_stat_t *ps = global_process_stats[current_pid];
  259. if (!ps) {
  260. pids = pids->next;
  261. continue;
  262. }
  263. ebpf_process_publish_apps_t *cad = current_apps_data[current_pid];
  264. if (!cad) {
  265. cad = callocz(1, sizeof(ebpf_process_publish_apps_t));
  266. current_apps_data[current_pid] = cad;
  267. }
  268. //Read data
  269. cad->call_do_exit = ps->exit_call;
  270. cad->call_release_task = ps->release_call;
  271. cad->create_process = ps->create_process;
  272. cad->create_thread = ps->create_thread;
  273. cad->task_err = ps->task_err;
  274. pids = pids->next;
  275. }
  276. }
  277. /**
  278. * Update cgroup
  279. *
  280. * Update cgroup data based in
  281. */
  282. static void ebpf_update_process_cgroup()
  283. {
  284. ebpf_cgroup_target_t *ect ;
  285. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  286. pthread_mutex_lock(&mutex_cgroup_shm);
  287. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  288. struct pid_on_target2 *pids;
  289. for (pids = ect->pids; pids; pids = pids->next) {
  290. int pid = pids->pid;
  291. ebpf_process_stat_t *out = &pids->ps;
  292. if (global_process_stats[pid]) {
  293. ebpf_process_stat_t *in = global_process_stats[pid];
  294. memcpy(out, in, sizeof(ebpf_process_stat_t));
  295. } else {
  296. if (bpf_map_lookup_elem(pid_fd, &pid, out)) {
  297. memset(out, 0, sizeof(ebpf_process_stat_t));
  298. }
  299. }
  300. }
  301. }
  302. pthread_mutex_unlock(&mutex_cgroup_shm);
  303. }
  304. /*****************************************************************
  305. *
  306. * FUNCTIONS TO CREATE CHARTS
  307. *
  308. *****************************************************************/
  309. /**
  310. * Create process status chart
  311. *
  312. * @param family the chart family
  313. * @param name the chart name
  314. * @param axis the axis label
  315. * @param web the group name used to attach the chart on dashboard
  316. * @param order the order number of the specified chart
  317. * @param update_every value to overwrite the update frequency set by the server.
  318. */
  319. static void ebpf_process_status_chart(char *family, char *name, char *axis,
  320. char *web, char *algorithm, int order, int update_every)
  321. {
  322. printf("CHART %s.%s '' 'Process not closed' '%s' '%s' '' line %d %d '' 'ebpf.plugin' 'process'\n",
  323. family,
  324. name,
  325. axis,
  326. web,
  327. order,
  328. update_every);
  329. printf("DIMENSION %s '' %s 1 1\n", status[0], algorithm);
  330. printf("DIMENSION %s '' %s 1 1\n", status[1], algorithm);
  331. }
  332. /**
  333. * Create global charts
  334. *
  335. * Call ebpf_create_chart to create the charts for the collector.
  336. *
  337. * @param em a pointer to the structure with the default values.
  338. */
  339. static void ebpf_create_global_charts(ebpf_module_t *em)
  340. {
  341. ebpf_create_chart(NETDATA_EBPF_SYSTEM_GROUP,
  342. NETDATA_PROCESS_SYSCALL,
  343. "Start process",
  344. EBPF_COMMON_DIMENSION_CALL,
  345. NETDATA_PROCESS_GROUP,
  346. NULL,
  347. NETDATA_EBPF_CHART_TYPE_LINE,
  348. 21002,
  349. ebpf_create_global_dimension,
  350. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK],
  351. 2, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  352. ebpf_create_chart(NETDATA_EBPF_SYSTEM_GROUP,
  353. NETDATA_EXIT_SYSCALL,
  354. "Exit process",
  355. EBPF_COMMON_DIMENSION_CALL,
  356. NETDATA_PROCESS_GROUP,
  357. NULL,
  358. NETDATA_EBPF_CHART_TYPE_LINE,
  359. 21003,
  360. ebpf_create_global_dimension,
  361. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT],
  362. 2, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  363. ebpf_process_status_chart(NETDATA_EBPF_SYSTEM_GROUP,
  364. NETDATA_PROCESS_STATUS_NAME,
  365. EBPF_COMMON_DIMENSION_DIFFERENCE,
  366. NETDATA_PROCESS_GROUP,
  367. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  368. 21004, em->update_every);
  369. if (em->mode < MODE_ENTRY) {
  370. ebpf_create_chart(NETDATA_EBPF_SYSTEM_GROUP,
  371. NETDATA_PROCESS_ERROR_NAME,
  372. "Fails to create process",
  373. EBPF_COMMON_DIMENSION_CALL,
  374. NETDATA_PROCESS_GROUP,
  375. NULL,
  376. NETDATA_EBPF_CHART_TYPE_LINE,
  377. 21005,
  378. ebpf_create_global_dimension,
  379. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK],
  380. 2, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  381. }
  382. }
  383. /**
  384. * Create chart for Statistic Thread
  385. *
  386. * Write to standard output current values for threads.
  387. *
  388. * @param em a pointer to the structure with the default values.
  389. */
  390. static inline void ebpf_create_statistic_thread_chart(ebpf_module_t *em)
  391. {
  392. ebpf_write_chart_cmd(NETDATA_MONITORING_FAMILY,
  393. NETDATA_EBPF_THREADS,
  394. "Threads info.",
  395. "threads",
  396. NETDATA_EBPF_FAMILY,
  397. NETDATA_EBPF_CHART_TYPE_LINE,
  398. NULL,
  399. 140000,
  400. em->update_every,
  401. NETDATA_EBPF_MODULE_NAME_PROCESS);
  402. ebpf_write_global_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_TOTAL],
  403. threads_stat[NETDATA_EBPF_THREAD_STAT_TOTAL],
  404. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  405. ebpf_write_global_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_RUNNING],
  406. threads_stat[NETDATA_EBPF_THREAD_STAT_RUNNING],
  407. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  408. }
  409. /**
  410. * Create chart for Load Thread
  411. *
  412. * Write to standard output current values for load mode.
  413. *
  414. * @param em a pointer to the structure with the default values.
  415. */
  416. static inline void ebpf_create_statistic_load_chart(ebpf_module_t *em)
  417. {
  418. ebpf_write_chart_cmd(NETDATA_MONITORING_FAMILY,
  419. NETDATA_EBPF_LOAD_METHOD,
  420. "Load info.",
  421. "methods",
  422. NETDATA_EBPF_FAMILY,
  423. NETDATA_EBPF_CHART_TYPE_LINE,
  424. NULL,
  425. 140001,
  426. em->update_every,
  427. NETDATA_EBPF_MODULE_NAME_PROCESS);
  428. ebpf_write_global_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_LEGACY],
  429. load_event_stat[NETDATA_EBPF_LOAD_STAT_LEGACY],
  430. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  431. ebpf_write_global_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_CORE],
  432. load_event_stat[NETDATA_EBPF_LOAD_STAT_CORE],
  433. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX]);
  434. }
  435. /**
  436. * Create Statistics Charts
  437. *
  438. * Create charts that will show statistics related to eBPF plugin.
  439. *
  440. * @param em a pointer to the structure with the default values.
  441. */
  442. static void ebpf_create_statistic_charts(ebpf_module_t *em)
  443. {
  444. ebpf_create_statistic_thread_chart(em);
  445. ebpf_create_statistic_load_chart(em);
  446. }
  447. /**
  448. * Create process apps charts
  449. *
  450. * Call ebpf_create_chart to create the charts on apps submenu.
  451. *
  452. * @param em a pointer to the structure with the default values.
  453. * @param ptr a pointer for the targets.
  454. */
  455. void ebpf_process_create_apps_charts(struct ebpf_module *em, void *ptr)
  456. {
  457. struct target *root = ptr;
  458. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_PROCESS,
  459. "Process started",
  460. EBPF_COMMON_DIMENSION_CALL,
  461. NETDATA_PROCESS_GROUP,
  462. NETDATA_EBPF_CHART_TYPE_STACKED,
  463. 20065,
  464. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  465. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  466. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_THREAD,
  467. "Threads started",
  468. EBPF_COMMON_DIMENSION_CALL,
  469. NETDATA_PROCESS_GROUP,
  470. NETDATA_EBPF_CHART_TYPE_STACKED,
  471. 20066,
  472. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  473. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  474. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_EXIT,
  475. "Tasks starts exit process.",
  476. EBPF_COMMON_DIMENSION_CALL,
  477. NETDATA_PROCESS_GROUP,
  478. NETDATA_EBPF_CHART_TYPE_STACKED,
  479. 20067,
  480. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  481. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  482. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_CLOSE,
  483. "Tasks closed",
  484. EBPF_COMMON_DIMENSION_CALL,
  485. NETDATA_PROCESS_GROUP,
  486. NETDATA_EBPF_CHART_TYPE_STACKED,
  487. 20068,
  488. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  489. root, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  490. if (em->mode < MODE_ENTRY) {
  491. ebpf_create_charts_on_apps(NETDATA_SYSCALL_APPS_TASK_ERROR,
  492. "Errors to create process or threads.",
  493. EBPF_COMMON_DIMENSION_CALL,
  494. NETDATA_PROCESS_GROUP,
  495. NETDATA_EBPF_CHART_TYPE_STACKED,
  496. 20069,
  497. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  498. root,
  499. em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  500. }
  501. }
  502. /**
  503. * Create apps charts
  504. *
  505. * Call ebpf_create_chart to create the charts on apps submenu.
  506. *
  507. * @param root a pointer for the targets.
  508. */
  509. static void ebpf_create_apps_charts(struct target *root)
  510. {
  511. if (unlikely(!all_pids))
  512. return;
  513. struct target *w;
  514. int newly_added = 0;
  515. for (w = root; w; w = w->next) {
  516. if (w->target)
  517. continue;
  518. if (unlikely(w->processes && (debug_enabled || w->debug_enabled))) {
  519. struct pid_on_target *pid_on_target;
  520. fprintf(
  521. stderr, "ebpf.plugin: target '%s' has aggregated %u process%s:", w->name, w->processes,
  522. (w->processes == 1) ? "" : "es");
  523. for (pid_on_target = w->root_pid; pid_on_target; pid_on_target = pid_on_target->next) {
  524. fprintf(stderr, " %d", pid_on_target->pid);
  525. }
  526. fputc('\n', stderr);
  527. }
  528. if (!w->exposed && w->processes) {
  529. newly_added++;
  530. w->exposed = 1;
  531. if (debug_enabled || w->debug_enabled)
  532. debug_log_int("%s just added - regenerating charts.", w->name);
  533. }
  534. }
  535. if (!newly_added)
  536. return;
  537. int counter;
  538. for (counter = 0; ebpf_modules[counter].thread_name; counter++) {
  539. ebpf_module_t *current = &ebpf_modules[counter];
  540. if (current->enabled && current->apps_charts && current->apps_routine)
  541. current->apps_routine(current, root);
  542. }
  543. }
  544. /*****************************************************************
  545. *
  546. * FUNCTIONS WITH THE MAIN LOOP
  547. *
  548. *****************************************************************/
  549. /**
  550. * Cgroup update shm
  551. *
  552. * This is the thread callback.
  553. * This thread is necessary, because we cannot freeze the whole plugin to read the data from shared memory.
  554. *
  555. * @param ptr It is a NULL value for this thread.
  556. *
  557. * @return It always returns NULL.
  558. */
  559. void *ebpf_cgroup_update_shm(void *ptr)
  560. {
  561. UNUSED(ptr);
  562. heartbeat_t hb;
  563. heartbeat_init(&hb);
  564. usec_t step = 30 * USEC_PER_SEC;
  565. while (!close_ebpf_plugin) {
  566. usec_t dt = heartbeat_next(&hb, step);
  567. (void)dt;
  568. if (close_ebpf_plugin)
  569. break;
  570. if (!shm_ebpf_cgroup.header)
  571. ebpf_map_cgroup_shared_memory();
  572. ebpf_parse_cgroup_shm_data();
  573. }
  574. return NULL;
  575. }
  576. /**
  577. * Sum PIDs
  578. *
  579. * Sum values for all targets.
  580. *
  581. * @param ps structure used to store data
  582. * @param pids input data
  583. */
  584. static void ebpf_process_sum_cgroup_pids(ebpf_process_stat_t *ps, struct pid_on_target2 *pids)
  585. {
  586. ebpf_process_stat_t accumulator;
  587. memset(&accumulator, 0, sizeof(accumulator));
  588. while (pids) {
  589. ebpf_process_stat_t *ps = &pids->ps;
  590. accumulator.exit_call += ps->exit_call;
  591. accumulator.release_call += ps->release_call;
  592. accumulator.create_process += ps->create_process;
  593. accumulator.create_thread += ps->create_thread;
  594. accumulator.task_err += ps->task_err;
  595. pids = pids->next;
  596. }
  597. ps->exit_call = (accumulator.exit_call >= ps->exit_call) ? accumulator.exit_call : ps->exit_call;
  598. ps->release_call = (accumulator.release_call >= ps->release_call) ? accumulator.release_call : ps->release_call;
  599. ps->create_process = (accumulator.create_process >= ps->create_process) ? accumulator.create_process : ps->create_process;
  600. ps->create_thread = (accumulator.create_thread >= ps->create_thread) ? accumulator.create_thread : ps->create_thread;
  601. ps->task_err = (accumulator.task_err >= ps->task_err) ? accumulator.task_err : ps->task_err;
  602. }
  603. /*
  604. * Send Specific Process data
  605. *
  606. * Send data for specific cgroup/apps.
  607. *
  608. * @param type chart type
  609. * @param values structure with values that will be sent to netdata
  610. * @param em the structure with thread information
  611. */
  612. static void ebpf_send_specific_process_data(char *type, ebpf_process_stat_t *values, ebpf_module_t *em)
  613. {
  614. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_PROCESS);
  615. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK].name,
  616. (long long) values->create_process);
  617. write_end_chart();
  618. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_THREAD);
  619. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_CLONE].name,
  620. (long long) values->create_thread);
  621. write_end_chart();
  622. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_EXIT);
  623. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT].name,
  624. (long long) values->release_call);
  625. write_end_chart();
  626. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_CLOSE);
  627. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK].name,
  628. (long long) values->release_call);
  629. write_end_chart();
  630. if (em->mode < MODE_ENTRY) {
  631. write_begin_chart(type, NETDATA_SYSCALL_APPS_TASK_ERROR);
  632. write_chart_dimension(process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT].name,
  633. (long long) values->task_err);
  634. write_end_chart();
  635. }
  636. }
  637. /**
  638. * Create specific process charts
  639. *
  640. * Create charts for cgroup/application
  641. *
  642. * @param type the chart type.
  643. * @param em the structure with thread information
  644. */
  645. static void ebpf_create_specific_process_charts(char *type, ebpf_module_t *em)
  646. {
  647. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_PROCESS, "Process started",
  648. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  649. NETDATA_CGROUP_PROCESS_CREATE_CONTEXT, NETDATA_EBPF_CHART_TYPE_LINE,
  650. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5000,
  651. ebpf_create_global_dimension, &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_FORK],
  652. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  653. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_THREAD, "Threads started",
  654. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  655. NETDATA_CGROUP_THREAD_CREATE_CONTEXT, NETDATA_EBPF_CHART_TYPE_LINE,
  656. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5001,
  657. ebpf_create_global_dimension,
  658. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_CLONE],
  659. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  660. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_EXIT, "Tasks starts exit process.",
  661. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  662. NETDATA_CGROUP_PROCESS_EXIT_CONTEXT,
  663. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5002,
  664. ebpf_create_global_dimension,
  665. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT],
  666. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  667. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_CLOSE, "Tasks closed",
  668. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  669. NETDATA_CGROUP_PROCESS_CLOSE_CONTEXT,
  670. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5003,
  671. ebpf_create_global_dimension,
  672. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_RELEASE_TASK],
  673. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  674. if (em->mode < MODE_ENTRY) {
  675. ebpf_create_chart(type, NETDATA_SYSCALL_APPS_TASK_ERROR, "Errors to create process or threads.",
  676. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_CGROUP_GROUP,
  677. NETDATA_CGROUP_PROCESS_ERROR_CONTEXT,
  678. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5004,
  679. ebpf_create_global_dimension,
  680. &process_publish_aggregated[NETDATA_KEY_PUBLISH_PROCESS_EXIT],
  681. 1, em->update_every, NETDATA_EBPF_MODULE_NAME_PROCESS);
  682. }
  683. }
  684. /**
  685. * Obsolete specific process charts
  686. *
  687. * Obsolete charts for cgroup/application
  688. *
  689. * @param type the chart type.
  690. * @param em the structure with thread information
  691. */
  692. static void ebpf_obsolete_specific_process_charts(char *type, ebpf_module_t *em)
  693. {
  694. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_PROCESS, "Process started",
  695. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  696. NETDATA_CGROUP_PROCESS_CREATE_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5000,
  697. em->update_every);
  698. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_THREAD, "Threads started",
  699. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  700. NETDATA_CGROUP_THREAD_CREATE_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5001,
  701. em->update_every);
  702. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_EXIT,"Tasks starts exit process.",
  703. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  704. NETDATA_CGROUP_PROCESS_EXIT_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5002,
  705. em->update_every);
  706. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_CLOSE,"Tasks closed",
  707. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  708. NETDATA_CGROUP_PROCESS_CLOSE_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5003,
  709. em->update_every);
  710. if (em->mode < MODE_ENTRY) {
  711. ebpf_write_chart_obsolete(type, NETDATA_SYSCALL_APPS_TASK_ERROR,"Errors to create process or threads.",
  712. EBPF_COMMON_DIMENSION_CALL, NETDATA_PROCESS_GROUP, NETDATA_EBPF_CHART_TYPE_LINE,
  713. NETDATA_CGROUP_PROCESS_ERROR_CONTEXT, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5004,
  714. em->update_every);
  715. }
  716. }
  717. /**
  718. * Create Systemd process Charts
  719. *
  720. * Create charts when systemd is enabled
  721. *
  722. * @param em the structure with thread information
  723. **/
  724. static void ebpf_create_systemd_process_charts(ebpf_module_t *em)
  725. {
  726. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_PROCESS, "Process started",
  727. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  728. NETDATA_EBPF_CHART_TYPE_STACKED, 20065,
  729. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_CREATE_CONTEXT,
  730. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  731. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_THREAD, "Threads started",
  732. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  733. NETDATA_EBPF_CHART_TYPE_STACKED, 20066,
  734. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_THREAD_CREATE_CONTEXT,
  735. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  736. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_CLOSE, "Tasks starts exit process.",
  737. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  738. NETDATA_EBPF_CHART_TYPE_STACKED, 20067,
  739. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_EXIT_CONTEXT,
  740. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  741. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_EXIT, "Tasks closed",
  742. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  743. NETDATA_EBPF_CHART_TYPE_STACKED, 20068,
  744. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_CLOSE_CONTEXT,
  745. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  746. if (em->mode < MODE_ENTRY) {
  747. ebpf_create_charts_on_systemd(NETDATA_SYSCALL_APPS_TASK_ERROR, "Errors to create process or threads.",
  748. EBPF_COMMON_DIMENSION_CALL, NETDATA_APPS_PROCESS_GROUP,
  749. NETDATA_EBPF_CHART_TYPE_STACKED, 20069,
  750. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX], NETDATA_SYSTEMD_PROCESS_ERROR_CONTEXT,
  751. NETDATA_EBPF_MODULE_NAME_PROCESS, em->update_every);
  752. }
  753. }
  754. /**
  755. * Send Systemd charts
  756. *
  757. * Send collected data to Netdata.
  758. *
  759. * @param em the structure with thread information
  760. *
  761. * @return It returns the status for chart creation, if it is necessary to remove a specific dimension, zero is returned
  762. * otherwise function returns 1 to avoid chart recreation
  763. */
  764. static int ebpf_send_systemd_process_charts(ebpf_module_t *em)
  765. {
  766. int ret = 1;
  767. ebpf_cgroup_target_t *ect;
  768. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_PROCESS);
  769. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  770. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  771. write_chart_dimension(ect->name, ect->publish_systemd_ps.create_process);
  772. } else
  773. ret = 0;
  774. }
  775. write_end_chart();
  776. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_THREAD);
  777. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  778. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  779. write_chart_dimension(ect->name, ect->publish_systemd_ps.create_thread);
  780. }
  781. }
  782. write_end_chart();
  783. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_EXIT);
  784. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  785. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  786. write_chart_dimension(ect->name, ect->publish_systemd_ps.exit_call);
  787. }
  788. }
  789. write_end_chart();
  790. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_CLOSE);
  791. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  792. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  793. write_chart_dimension(ect->name, ect->publish_systemd_ps.release_call);
  794. }
  795. }
  796. write_end_chart();
  797. if (em->mode < MODE_ENTRY) {
  798. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_SYSCALL_APPS_TASK_ERROR);
  799. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  800. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  801. write_chart_dimension(ect->name, ect->publish_systemd_ps.task_err);
  802. }
  803. }
  804. write_end_chart();
  805. }
  806. return ret;
  807. }
  808. /**
  809. * Send data to Netdata calling auxiliary functions.
  810. *
  811. * @param em the structure with thread information
  812. */
  813. static void ebpf_process_send_cgroup_data(ebpf_module_t *em)
  814. {
  815. if (!ebpf_cgroup_pids)
  816. return;
  817. pthread_mutex_lock(&mutex_cgroup_shm);
  818. ebpf_cgroup_target_t *ect;
  819. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  820. ebpf_process_sum_cgroup_pids(&ect->publish_systemd_ps, ect->pids);
  821. }
  822. int has_systemd = shm_ebpf_cgroup.header->systemd_enabled;
  823. if (has_systemd) {
  824. static int systemd_chart = 0;
  825. if (!systemd_chart) {
  826. ebpf_create_systemd_process_charts(em);
  827. systemd_chart = 1;
  828. }
  829. systemd_chart = ebpf_send_systemd_process_charts(em);
  830. }
  831. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  832. if (ect->systemd)
  833. continue;
  834. if (!(ect->flags & NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART) && ect->updated) {
  835. ebpf_create_specific_process_charts(ect->name, em);
  836. ect->flags |= NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART;
  837. }
  838. if (ect->flags & NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART) {
  839. if (ect->updated) {
  840. ebpf_send_specific_process_data(ect->name, &ect->publish_systemd_ps, em);
  841. } else {
  842. ebpf_obsolete_specific_process_charts(ect->name, em);
  843. ect->flags &= ~NETDATA_EBPF_CGROUP_HAS_PROCESS_CHART;
  844. }
  845. }
  846. }
  847. pthread_mutex_unlock(&mutex_cgroup_shm);
  848. }
  849. /**
  850. * Update Cgroup algorithm
  851. *
  852. * Change algorithm from absolute to incremental
  853. */
  854. void ebpf_process_update_cgroup_algorithm()
  855. {
  856. int i;
  857. for (i = 0; i < NETDATA_KEY_PUBLISH_PROCESS_END; i++) {
  858. netdata_publish_syscall_t *ptr = &process_publish_aggregated[i];
  859. freez(ptr->algorithm);
  860. ptr->algorithm = strdupz(ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX]);
  861. }
  862. }
  863. /**
  864. * Send Statistic Data
  865. *
  866. * Send statistic information to netdata.
  867. */
  868. void ebpf_send_statistic_data()
  869. {
  870. write_begin_chart(NETDATA_MONITORING_FAMILY, NETDATA_EBPF_THREADS);
  871. write_chart_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_TOTAL], (long long)plugin_statistics.threads);
  872. write_chart_dimension(threads_stat[NETDATA_EBPF_THREAD_STAT_RUNNING], (long long)plugin_statistics.running);
  873. write_end_chart();
  874. write_begin_chart(NETDATA_MONITORING_FAMILY, NETDATA_EBPF_LOAD_METHOD);
  875. write_chart_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_LEGACY], (long long)plugin_statistics.legacy);
  876. write_chart_dimension(load_event_stat[NETDATA_EBPF_LOAD_STAT_CORE], (long long)plugin_statistics.core);
  877. write_end_chart();
  878. }
  879. /**
  880. * Main loop for this collector.
  881. *
  882. * @param em the structure with thread information
  883. */
  884. static void process_collector(ebpf_module_t *em)
  885. {
  886. cgroup_thread.thread = mallocz(sizeof(netdata_thread_t));
  887. cgroup_thread.start_routine = ebpf_cgroup_update_shm;
  888. netdata_thread_create(cgroup_thread.thread, cgroup_thread.name, NETDATA_THREAD_OPTION_JOINABLE,
  889. ebpf_cgroup_update_shm, em);
  890. heartbeat_t hb;
  891. heartbeat_init(&hb);
  892. int publish_global = em->global_charts;
  893. int apps_enabled = em->apps_charts;
  894. int cgroups = em->cgroup_charts;
  895. int thread_enabled = em->enabled;
  896. if (cgroups)
  897. ebpf_process_update_cgroup_algorithm();
  898. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  899. int update_every = em->update_every;
  900. int counter = update_every - 1;
  901. while (!close_ebpf_plugin) {
  902. usec_t dt = heartbeat_next(&hb, USEC_PER_SEC);
  903. (void)dt;
  904. pthread_mutex_lock(&collect_data_mutex);
  905. cleanup_exited_pids();
  906. collect_data_for_all_processes(pid_fd);
  907. ebpf_create_apps_charts(apps_groups_root_target);
  908. pthread_cond_broadcast(&collect_data_cond_var);
  909. pthread_mutex_unlock(&collect_data_mutex);
  910. if (++counter == update_every) {
  911. counter = 0;
  912. read_hash_global_tables();
  913. int publish_apps = 0;
  914. if (all_pids_count > 0) {
  915. if (apps_enabled) {
  916. publish_apps = 1;
  917. ebpf_process_update_apps_data();
  918. }
  919. if (cgroups) {
  920. ebpf_update_process_cgroup();
  921. }
  922. }
  923. pthread_mutex_lock(&lock);
  924. ebpf_send_statistic_data();
  925. if (thread_enabled) {
  926. if (publish_global) {
  927. ebpf_process_send_data(em);
  928. }
  929. if (publish_apps) {
  930. ebpf_process_send_apps_data(apps_groups_root_target, em);
  931. }
  932. if (cgroups) {
  933. ebpf_process_send_cgroup_data(em);
  934. }
  935. }
  936. pthread_mutex_unlock(&lock);
  937. }
  938. fflush(stdout);
  939. }
  940. }
  941. /*****************************************************************
  942. *
  943. * FUNCTIONS TO CLOSE THE THREAD
  944. *
  945. *****************************************************************/
  946. void clean_global_memory() {
  947. int pid_fd = process_maps[NETDATA_PROCESS_PID_TABLE].map_fd;
  948. struct pid_stat *pids = root_of_pids;
  949. while (pids) {
  950. uint32_t pid = pids->pid;
  951. freez(global_process_stats[pid]);
  952. bpf_map_delete_elem(pid_fd, &pid);
  953. freez(current_apps_data[pid]);
  954. pids = pids->next;
  955. }
  956. }
  957. /**
  958. * Process disable tracepoints
  959. *
  960. * Disable tracepoints when the plugin was responsible to enable it.
  961. */
  962. static void ebpf_process_disable_tracepoints()
  963. {
  964. char *default_message = { "Cannot disable the tracepoint" };
  965. if (!was_sched_process_exit_enabled) {
  966. if (ebpf_disable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exit))
  967. error("%s %s/%s.", default_message, tracepoint_sched_type, tracepoint_sched_process_exit);
  968. }
  969. if (!was_sched_process_exec_enabled) {
  970. if (ebpf_disable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exec))
  971. error("%s %s/%s.", default_message, tracepoint_sched_type, tracepoint_sched_process_exec);
  972. }
  973. if (!was_sched_process_fork_enabled) {
  974. if (ebpf_disable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_fork))
  975. error("%s %s/%s.", default_message, tracepoint_sched_type, tracepoint_sched_process_fork);
  976. }
  977. }
  978. /**
  979. * Clean up the main thread.
  980. *
  981. * @param ptr thread data.
  982. */
  983. static void ebpf_process_cleanup(void *ptr)
  984. {
  985. UNUSED(ptr);
  986. heartbeat_t hb;
  987. heartbeat_init(&hb);
  988. uint32_t tick = 1 * USEC_PER_SEC;
  989. while (!finalized_threads) {
  990. usec_t dt = heartbeat_next(&hb, tick);
  991. UNUSED(dt);
  992. }
  993. ebpf_cleanup_publish_syscall(process_publish_aggregated);
  994. freez(process_hash_values);
  995. clean_global_memory();
  996. freez(global_process_stats);
  997. freez(current_apps_data);
  998. ebpf_process_disable_tracepoints();
  999. if (probe_links) {
  1000. struct bpf_program *prog;
  1001. size_t i = 0 ;
  1002. bpf_object__for_each_program(prog, objects) {
  1003. bpf_link__destroy(probe_links[i]);
  1004. i++;
  1005. }
  1006. bpf_object__close(objects);
  1007. }
  1008. freez(cgroup_thread.thread);
  1009. }
  1010. /*****************************************************************
  1011. *
  1012. * FUNCTIONS TO START THREAD
  1013. *
  1014. *****************************************************************/
  1015. /**
  1016. * Allocate vectors used with this thread.
  1017. * We are not testing the return, because callocz does this and shutdown the software
  1018. * case it was not possible to allocate.
  1019. *
  1020. * @param length is the length for the vectors used inside the collector.
  1021. */
  1022. static void ebpf_process_allocate_global_vectors(size_t length)
  1023. {
  1024. memset(process_aggregated_data, 0, length * sizeof(netdata_syscall_stat_t));
  1025. memset(process_publish_aggregated, 0, length * sizeof(netdata_publish_syscall_t));
  1026. process_hash_values = callocz(ebpf_nprocs, sizeof(netdata_idx_t));
  1027. global_process_stats = callocz((size_t)pid_max, sizeof(ebpf_process_stat_t *));
  1028. current_apps_data = callocz((size_t)pid_max, sizeof(ebpf_process_publish_apps_t *));
  1029. }
  1030. static void change_syscalls()
  1031. {
  1032. static char *lfork = { "do_fork" };
  1033. process_id_names[NETDATA_KEY_PUBLISH_PROCESS_FORK] = lfork;
  1034. }
  1035. /**
  1036. * Set local variables
  1037. *
  1038. */
  1039. static void set_local_pointers()
  1040. {
  1041. if (isrh >= NETDATA_MINIMUM_RH_VERSION && isrh < NETDATA_RH_8)
  1042. change_syscalls();
  1043. }
  1044. /*****************************************************************
  1045. *
  1046. * EBPF PROCESS THREAD
  1047. *
  1048. *****************************************************************/
  1049. /**
  1050. *
  1051. */
  1052. static void wait_for_all_threads_die()
  1053. {
  1054. ebpf_modules[EBPF_MODULE_PROCESS_IDX].enabled = 0;
  1055. heartbeat_t hb;
  1056. heartbeat_init(&hb);
  1057. int max = 10;
  1058. int i;
  1059. for (i = 0; i < max; i++) {
  1060. heartbeat_next(&hb, 200000);
  1061. size_t j, counter = 0, compare = 0;
  1062. for (j = 0; ebpf_modules[j].thread_name; j++) {
  1063. if (!ebpf_modules[j].enabled)
  1064. counter++;
  1065. compare++;
  1066. }
  1067. if (counter == compare)
  1068. break;
  1069. }
  1070. }
  1071. /**
  1072. * Enable tracepoints
  1073. *
  1074. * Enable necessary tracepoints for thread.
  1075. *
  1076. * @return It returns 0 on success and -1 otherwise
  1077. */
  1078. static int ebpf_process_enable_tracepoints()
  1079. {
  1080. int test = ebpf_is_tracepoint_enabled(tracepoint_sched_type, tracepoint_sched_process_exit);
  1081. if (test == -1)
  1082. return -1;
  1083. else if (!test) {
  1084. if (ebpf_enable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exit))
  1085. return -1;
  1086. }
  1087. was_sched_process_exit_enabled = test;
  1088. test = ebpf_is_tracepoint_enabled(tracepoint_sched_type, tracepoint_sched_process_exec);
  1089. if (test == -1)
  1090. return -1;
  1091. else if (!test) {
  1092. if (ebpf_enable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_exec))
  1093. return -1;
  1094. }
  1095. was_sched_process_exec_enabled = test;
  1096. test = ebpf_is_tracepoint_enabled(tracepoint_sched_type, tracepoint_sched_process_fork);
  1097. if (test == -1)
  1098. return -1;
  1099. else if (!test) {
  1100. if (ebpf_enable_tracing_values(tracepoint_sched_type, tracepoint_sched_process_fork))
  1101. return -1;
  1102. }
  1103. was_sched_process_fork_enabled = test;
  1104. return 0;
  1105. }
  1106. /**
  1107. * Process thread
  1108. *
  1109. * Thread used to generate process charts.
  1110. *
  1111. * @param ptr a pointer to `struct ebpf_module`
  1112. *
  1113. * @return It always return NULL
  1114. */
  1115. void *ebpf_process_thread(void *ptr)
  1116. {
  1117. netdata_thread_cleanup_push(ebpf_process_cleanup, ptr);
  1118. ebpf_module_t *em = (ebpf_module_t *)ptr;
  1119. em->maps = process_maps;
  1120. if (ebpf_process_enable_tracepoints()) {
  1121. em->enabled = em->global_charts = em->apps_charts = em->cgroup_charts = CONFIG_BOOLEAN_NO;
  1122. }
  1123. process_enabled = em->enabled;
  1124. pthread_mutex_lock(&lock);
  1125. ebpf_process_allocate_global_vectors(NETDATA_KEY_PUBLISH_PROCESS_END);
  1126. ebpf_update_pid_table(&process_maps[0], em);
  1127. set_local_pointers();
  1128. probe_links = ebpf_load_program(ebpf_plugin_dir, em, running_on_kernel, isrh, &objects);
  1129. if (!probe_links) {
  1130. em->enabled = CONFIG_BOOLEAN_NO;
  1131. pthread_mutex_unlock(&lock);
  1132. goto endprocess;
  1133. }
  1134. int algorithms[NETDATA_KEY_PUBLISH_PROCESS_END] = {
  1135. NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX
  1136. };
  1137. ebpf_global_labels(
  1138. process_aggregated_data, process_publish_aggregated, process_dimension_names, process_id_names,
  1139. algorithms, NETDATA_KEY_PUBLISH_PROCESS_END);
  1140. if (process_enabled) {
  1141. ebpf_create_global_charts(em);
  1142. }
  1143. ebpf_update_stats(&plugin_statistics, em);
  1144. ebpf_create_statistic_charts(em);
  1145. pthread_mutex_unlock(&lock);
  1146. process_collector(em);
  1147. endprocess:
  1148. if (!em->enabled)
  1149. ebpf_update_disabled_plugin_stats(em);
  1150. wait_for_all_threads_die();
  1151. netdata_thread_cleanup_pop(1);
  1152. return NULL;
  1153. }