ebpf_cachestat.c 37 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "ebpf.h"
  3. #include "ebpf_cachestat.h"
  4. netdata_publish_cachestat_t **cachestat_pid;
  5. static struct bpf_link **probe_links = NULL;
  6. static struct bpf_object *objects = NULL;
  7. static char *cachestat_counter_dimension_name[NETDATA_CACHESTAT_END] = { "ratio", "dirty", "hit",
  8. "miss" };
  9. static netdata_syscall_stat_t cachestat_counter_aggregated_data[NETDATA_CACHESTAT_END];
  10. static netdata_publish_syscall_t cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_END];
  11. netdata_cachestat_pid_t *cachestat_vector = NULL;
  12. static netdata_idx_t cachestat_hash_values[NETDATA_CACHESTAT_END];
  13. static netdata_idx_t *cachestat_values = NULL;
  14. static int read_thread_closed = 1;
  15. struct netdata_static_thread cachestat_threads = {"CACHESTAT KERNEL",
  16. NULL, NULL, 1, NULL,
  17. NULL, NULL};
  18. static ebpf_local_maps_t cachestat_maps[] = {{.name = "cstat_global", .internal_input = NETDATA_CACHESTAT_END,
  19. .user_input = 0, .type = NETDATA_EBPF_MAP_STATIC,
  20. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  21. {.name = "cstat_pid", .internal_input = ND_EBPF_DEFAULT_PID_SIZE,
  22. .user_input = 0,
  23. .type = NETDATA_EBPF_MAP_RESIZABLE | NETDATA_EBPF_MAP_PID,
  24. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  25. {.name = "cstat_ctrl", .internal_input = NETDATA_CONTROLLER_END,
  26. .user_input = 0,
  27. .type = NETDATA_EBPF_MAP_CONTROLLER,
  28. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED},
  29. {.name = NULL, .internal_input = 0, .user_input = 0,
  30. .type = NETDATA_EBPF_MAP_CONTROLLER,
  31. .map_fd = ND_EBPF_MAP_FD_NOT_INITIALIZED}};
  32. struct config cachestat_config = { .first_section = NULL,
  33. .last_section = NULL,
  34. .mutex = NETDATA_MUTEX_INITIALIZER,
  35. .index = { .avl_tree = { .root = NULL, .compar = appconfig_section_compare },
  36. .rwlock = AVL_LOCK_INITIALIZER } };
  37. /*****************************************************************
  38. *
  39. * FUNCTIONS TO CLOSE THE THREAD
  40. *
  41. *****************************************************************/
  42. /**
  43. * Clean PID structures
  44. *
  45. * Clean the allocated structures.
  46. */
  47. void clean_cachestat_pid_structures() {
  48. struct pid_stat *pids = root_of_pids;
  49. while (pids) {
  50. freez(cachestat_pid[pids->pid]);
  51. pids = pids->next;
  52. }
  53. }
  54. /**
  55. * Clean up the main thread.
  56. *
  57. * @param ptr thread data.
  58. */
  59. static void ebpf_cachestat_cleanup(void *ptr)
  60. {
  61. ebpf_module_t *em = (ebpf_module_t *)ptr;
  62. if (!em->enabled)
  63. return;
  64. heartbeat_t hb;
  65. heartbeat_init(&hb);
  66. uint32_t tick = 2*USEC_PER_MS;
  67. while (!read_thread_closed) {
  68. usec_t dt = heartbeat_next(&hb, tick);
  69. UNUSED(dt);
  70. }
  71. ebpf_cleanup_publish_syscall(cachestat_counter_publish_aggregated);
  72. freez(cachestat_vector);
  73. freez(cachestat_values);
  74. if (probe_links) {
  75. struct bpf_program *prog;
  76. size_t i = 0 ;
  77. bpf_object__for_each_program(prog, objects) {
  78. bpf_link__destroy(probe_links[i]);
  79. i++;
  80. }
  81. bpf_object__close(objects);
  82. }
  83. }
  84. /*****************************************************************
  85. *
  86. * COMMON FUNCTIONS
  87. *
  88. *****************************************************************/
  89. /**
  90. * Update publish
  91. *
  92. * Update publish values before to write dimension.
  93. *
  94. * @param out structure that will receive data.
  95. * @param mpa calls for mark_page_accessed during the last second.
  96. * @param mbd calls for mark_buffer_dirty during the last second.
  97. * @param apcl calls for add_to_page_cache_lru during the last second.
  98. * @param apd calls for account_page_dirtied during the last second.
  99. */
  100. void cachestat_update_publish(netdata_publish_cachestat_t *out, uint64_t mpa, uint64_t mbd,
  101. uint64_t apcl, uint64_t apd)
  102. {
  103. // Adapted algorithm from https://github.com/iovisor/bcc/blob/master/tools/cachestat.py#L126-L138
  104. calculated_number total = (calculated_number) (((long long)mpa) - ((long long)mbd));
  105. if (total < 0)
  106. total = 0;
  107. calculated_number misses = (calculated_number) ( ((long long) apcl) - ((long long) apd) );
  108. if (misses < 0)
  109. misses = 0;
  110. // If hits are < 0, then its possible misses are overestimate due to possibly page cache read ahead adding
  111. // more pages than needed. In this case just assume misses as total and reset hits.
  112. calculated_number hits = total - misses;
  113. if (hits < 0 ) {
  114. misses = total;
  115. hits = 0;
  116. }
  117. calculated_number ratio = (total > 0) ? hits/total : 1;
  118. out->ratio = (long long )(ratio*100);
  119. out->hit = (long long)hits;
  120. out->miss = (long long)misses;
  121. }
  122. /**
  123. * Save previous values
  124. *
  125. * Save values used this time.
  126. *
  127. * @param publish
  128. */
  129. static void save_previous_values(netdata_publish_cachestat_t *publish) {
  130. publish->prev.mark_page_accessed = cachestat_hash_values[NETDATA_KEY_CALLS_MARK_PAGE_ACCESSED];
  131. publish->prev.account_page_dirtied = cachestat_hash_values[NETDATA_KEY_CALLS_ACCOUNT_PAGE_DIRTIED];
  132. publish->prev.add_to_page_cache_lru = cachestat_hash_values[NETDATA_KEY_CALLS_ADD_TO_PAGE_CACHE_LRU];
  133. publish->prev.mark_buffer_dirty = cachestat_hash_values[NETDATA_KEY_CALLS_MARK_BUFFER_DIRTY];
  134. }
  135. /**
  136. * Calculate statistics
  137. *
  138. * @param publish the structure where we will store the data.
  139. */
  140. static void calculate_stats(netdata_publish_cachestat_t *publish) {
  141. if (!publish->prev.mark_page_accessed) {
  142. save_previous_values(publish);
  143. return;
  144. }
  145. uint64_t mpa = cachestat_hash_values[NETDATA_KEY_CALLS_MARK_PAGE_ACCESSED] - publish->prev.mark_page_accessed;
  146. uint64_t mbd = cachestat_hash_values[NETDATA_KEY_CALLS_MARK_BUFFER_DIRTY] - publish->prev.mark_buffer_dirty;
  147. uint64_t apcl = cachestat_hash_values[NETDATA_KEY_CALLS_ADD_TO_PAGE_CACHE_LRU] - publish->prev.add_to_page_cache_lru;
  148. uint64_t apd = cachestat_hash_values[NETDATA_KEY_CALLS_ACCOUNT_PAGE_DIRTIED] - publish->prev.account_page_dirtied;
  149. save_previous_values(publish);
  150. // We are changing the original algorithm to have a smooth ratio.
  151. cachestat_update_publish(publish, mpa, mbd, apcl, apd);
  152. }
  153. /*****************************************************************
  154. *
  155. * APPS
  156. *
  157. *****************************************************************/
  158. /**
  159. * Apps Accumulator
  160. *
  161. * Sum all values read from kernel and store in the first address.
  162. *
  163. * @param out the vector with read values.
  164. */
  165. static void cachestat_apps_accumulator(netdata_cachestat_pid_t *out)
  166. {
  167. int i, end = (running_on_kernel >= NETDATA_KERNEL_V4_15) ? ebpf_nprocs : 1;
  168. netdata_cachestat_pid_t *total = &out[0];
  169. for (i = 1; i < end; i++) {
  170. netdata_cachestat_pid_t *w = &out[i];
  171. total->account_page_dirtied += w->account_page_dirtied;
  172. total->add_to_page_cache_lru += w->add_to_page_cache_lru;
  173. total->mark_buffer_dirty += w->mark_buffer_dirty;
  174. total->mark_page_accessed += w->mark_page_accessed;
  175. }
  176. }
  177. /**
  178. * Save Pid values
  179. *
  180. * Save the current values inside the structure
  181. *
  182. * @param out vector used to plot charts
  183. * @param publish vector with values read from hash tables.
  184. */
  185. static inline void cachestat_save_pid_values(netdata_publish_cachestat_t *out, netdata_cachestat_pid_t *publish)
  186. {
  187. if (!out->current.mark_page_accessed) {
  188. memcpy(&out->current, &publish[0], sizeof(netdata_cachestat_pid_t));
  189. return;
  190. }
  191. memcpy(&out->prev, &out->current, sizeof(netdata_cachestat_pid_t));
  192. memcpy(&out->current, &publish[0], sizeof(netdata_cachestat_pid_t));
  193. }
  194. /**
  195. * Fill PID
  196. *
  197. * Fill PID structures
  198. *
  199. * @param current_pid pid that we are collecting data
  200. * @param out values read from hash tables;
  201. */
  202. static void cachestat_fill_pid(uint32_t current_pid, netdata_cachestat_pid_t *publish)
  203. {
  204. netdata_publish_cachestat_t *curr = cachestat_pid[current_pid];
  205. if (!curr) {
  206. curr = callocz(1, sizeof(netdata_publish_cachestat_t));
  207. cachestat_pid[current_pid] = curr;
  208. cachestat_save_pid_values(curr, publish);
  209. return;
  210. }
  211. cachestat_save_pid_values(curr, publish);
  212. }
  213. /**
  214. * Read APPS table
  215. *
  216. * Read the apps table and store data inside the structure.
  217. */
  218. static void read_apps_table()
  219. {
  220. netdata_cachestat_pid_t *cv = cachestat_vector;
  221. uint32_t key;
  222. struct pid_stat *pids = root_of_pids;
  223. int fd = cachestat_maps[NETDATA_CACHESTAT_PID_STATS].map_fd;
  224. size_t length = sizeof(netdata_cachestat_pid_t)*ebpf_nprocs;
  225. while (pids) {
  226. key = pids->pid;
  227. if (bpf_map_lookup_elem(fd, &key, cv)) {
  228. pids = pids->next;
  229. continue;
  230. }
  231. cachestat_apps_accumulator(cv);
  232. cachestat_fill_pid(key, cv);
  233. // We are cleaning to avoid passing data read from one process to other.
  234. memset(cv, 0, length);
  235. pids = pids->next;
  236. }
  237. }
  238. /**
  239. * Update cgroup
  240. *
  241. * Update cgroup data based in
  242. */
  243. static void ebpf_update_cachestat_cgroup()
  244. {
  245. netdata_cachestat_pid_t *cv = cachestat_vector;
  246. int fd = cachestat_maps[NETDATA_CACHESTAT_PID_STATS].map_fd;
  247. size_t length = sizeof(netdata_cachestat_pid_t) * ebpf_nprocs;
  248. ebpf_cgroup_target_t *ect;
  249. pthread_mutex_lock(&mutex_cgroup_shm);
  250. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  251. struct pid_on_target2 *pids;
  252. for (pids = ect->pids; pids; pids = pids->next) {
  253. int pid = pids->pid;
  254. netdata_cachestat_pid_t *out = &pids->cachestat;
  255. if (likely(cachestat_pid) && cachestat_pid[pid]) {
  256. netdata_publish_cachestat_t *in = cachestat_pid[pid];
  257. memcpy(out, &in->current, sizeof(netdata_cachestat_pid_t));
  258. } else {
  259. memset(cv, 0, length);
  260. if (bpf_map_lookup_elem(fd, &pid, cv)) {
  261. continue;
  262. }
  263. cachestat_apps_accumulator(cv);
  264. memcpy(out, cv, sizeof(netdata_cachestat_pid_t));
  265. }
  266. }
  267. }
  268. pthread_mutex_unlock(&mutex_cgroup_shm);
  269. }
  270. /**
  271. * Create apps charts
  272. *
  273. * Call ebpf_create_chart to create the charts on apps submenu.
  274. *
  275. * @param em a pointer to the structure with the default values.
  276. */
  277. void ebpf_cachestat_create_apps_charts(struct ebpf_module *em, void *ptr)
  278. {
  279. struct target *root = ptr;
  280. ebpf_create_charts_on_apps(NETDATA_CACHESTAT_HIT_RATIO_CHART,
  281. "Hit ratio",
  282. EBPF_COMMON_DIMENSION_PERCENTAGE,
  283. NETDATA_CACHESTAT_SUBMENU,
  284. NETDATA_EBPF_CHART_TYPE_LINE,
  285. 20090,
  286. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  287. root, em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  288. ebpf_create_charts_on_apps(NETDATA_CACHESTAT_DIRTY_CHART,
  289. "Number of dirty pages",
  290. EBPF_CACHESTAT_DIMENSION_PAGE,
  291. NETDATA_CACHESTAT_SUBMENU,
  292. NETDATA_EBPF_CHART_TYPE_STACKED,
  293. 20091,
  294. ebpf_algorithms[NETDATA_EBPF_INCREMENTAL_IDX],
  295. root, em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  296. ebpf_create_charts_on_apps(NETDATA_CACHESTAT_HIT_CHART,
  297. "Number of accessed files",
  298. EBPF_CACHESTAT_DIMENSION_HITS,
  299. NETDATA_CACHESTAT_SUBMENU,
  300. NETDATA_EBPF_CHART_TYPE_STACKED,
  301. 20092,
  302. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  303. root, em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  304. ebpf_create_charts_on_apps(NETDATA_CACHESTAT_MISSES_CHART,
  305. "Files out of page cache",
  306. EBPF_CACHESTAT_DIMENSION_MISSES,
  307. NETDATA_CACHESTAT_SUBMENU,
  308. NETDATA_EBPF_CHART_TYPE_STACKED,
  309. 20093,
  310. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  311. root, em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  312. }
  313. /*****************************************************************
  314. *
  315. * MAIN LOOP
  316. *
  317. *****************************************************************/
  318. /**
  319. * Read global counter
  320. *
  321. * Read the table with number of calls for all functions
  322. */
  323. static void read_global_table()
  324. {
  325. uint32_t idx;
  326. netdata_idx_t *val = cachestat_hash_values;
  327. netdata_idx_t *stored = cachestat_values;
  328. int fd = cachestat_maps[NETDATA_CACHESTAT_GLOBAL_STATS].map_fd;
  329. for (idx = NETDATA_KEY_CALLS_ADD_TO_PAGE_CACHE_LRU; idx < NETDATA_CACHESTAT_END; idx++) {
  330. if (!bpf_map_lookup_elem(fd, &idx, stored)) {
  331. int i;
  332. int end = ebpf_nprocs;
  333. netdata_idx_t total = 0;
  334. for (i = 0; i < end; i++)
  335. total += stored[i];
  336. val[idx] = total;
  337. }
  338. }
  339. }
  340. /**
  341. * Socket read hash
  342. *
  343. * This is the thread callback.
  344. * This thread is necessary, because we cannot freeze the whole plugin to read the data on very busy socket.
  345. *
  346. * @param ptr It is a NULL value for this thread.
  347. *
  348. * @return It always returns NULL.
  349. */
  350. void *ebpf_cachestat_read_hash(void *ptr)
  351. {
  352. read_thread_closed = 0;
  353. heartbeat_t hb;
  354. heartbeat_init(&hb);
  355. ebpf_module_t *em = (ebpf_module_t *)ptr;
  356. usec_t step = NETDATA_LATENCY_CACHESTAT_SLEEP_MS * em->update_every;
  357. while (!close_ebpf_plugin) {
  358. usec_t dt = heartbeat_next(&hb, step);
  359. (void)dt;
  360. read_global_table();
  361. }
  362. read_thread_closed = 1;
  363. return NULL;
  364. }
  365. /**
  366. * Send global
  367. *
  368. * Send global charts to Netdata
  369. */
  370. static void cachestat_send_global(netdata_publish_cachestat_t *publish)
  371. {
  372. calculate_stats(publish);
  373. netdata_publish_syscall_t *ptr = cachestat_counter_publish_aggregated;
  374. ebpf_one_dimension_write_charts(
  375. NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_HIT_RATIO_CHART, ptr[NETDATA_CACHESTAT_IDX_RATIO].dimension,
  376. publish->ratio);
  377. ebpf_one_dimension_write_charts(
  378. NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_DIRTY_CHART, ptr[NETDATA_CACHESTAT_IDX_DIRTY].dimension,
  379. cachestat_hash_values[NETDATA_KEY_CALLS_MARK_BUFFER_DIRTY]);
  380. ebpf_one_dimension_write_charts(
  381. NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_HIT_CHART, ptr[NETDATA_CACHESTAT_IDX_HIT].dimension, publish->hit);
  382. ebpf_one_dimension_write_charts(
  383. NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_MISSES_CHART, ptr[NETDATA_CACHESTAT_IDX_MISS].dimension,
  384. publish->miss);
  385. }
  386. /**
  387. * Cachestat sum PIDs
  388. *
  389. * Sum values for all PIDs associated to a group
  390. *
  391. * @param publish output structure.
  392. * @param root structure with listed IPs
  393. */
  394. void ebpf_cachestat_sum_pids(netdata_publish_cachestat_t *publish, struct pid_on_target *root)
  395. {
  396. memcpy(&publish->prev, &publish->current,sizeof(publish->current));
  397. memset(&publish->current, 0, sizeof(publish->current));
  398. netdata_cachestat_pid_t *dst = &publish->current;
  399. while (root) {
  400. int32_t pid = root->pid;
  401. netdata_publish_cachestat_t *w = cachestat_pid[pid];
  402. if (w) {
  403. netdata_cachestat_pid_t *src = &w->current;
  404. dst->account_page_dirtied += src->account_page_dirtied;
  405. dst->add_to_page_cache_lru += src->add_to_page_cache_lru;
  406. dst->mark_buffer_dirty += src->mark_buffer_dirty;
  407. dst->mark_page_accessed += src->mark_page_accessed;
  408. }
  409. root = root->next;
  410. }
  411. }
  412. /**
  413. * Send data to Netdata calling auxiliary functions.
  414. *
  415. * @param root the target list.
  416. */
  417. void ebpf_cache_send_apps_data(struct target *root)
  418. {
  419. struct target *w;
  420. collected_number value;
  421. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_CACHESTAT_HIT_RATIO_CHART);
  422. for (w = root; w; w = w->next) {
  423. if (unlikely(w->exposed && w->processes)) {
  424. ebpf_cachestat_sum_pids(&w->cachestat, w->root_pid);
  425. netdata_cachestat_pid_t *current = &w->cachestat.current;
  426. netdata_cachestat_pid_t *prev = &w->cachestat.prev;
  427. uint64_t mpa = current->mark_page_accessed - prev->mark_page_accessed;
  428. uint64_t mbd = current->mark_buffer_dirty - prev->mark_buffer_dirty;
  429. w->cachestat.dirty = mbd;
  430. uint64_t apcl = current->add_to_page_cache_lru - prev->add_to_page_cache_lru;
  431. uint64_t apd = current->account_page_dirtied - prev->account_page_dirtied;
  432. cachestat_update_publish(&w->cachestat, mpa, mbd, apcl, apd);
  433. value = (collected_number) w->cachestat.ratio;
  434. // Here we are using different approach to have a chart more smooth
  435. write_chart_dimension(w->name, value);
  436. }
  437. }
  438. write_end_chart();
  439. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_CACHESTAT_DIRTY_CHART);
  440. for (w = root; w; w = w->next) {
  441. if (unlikely(w->exposed && w->processes)) {
  442. value = (collected_number) w->cachestat.dirty;
  443. write_chart_dimension(w->name, value);
  444. }
  445. }
  446. write_end_chart();
  447. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_CACHESTAT_HIT_CHART);
  448. for (w = root; w; w = w->next) {
  449. if (unlikely(w->exposed && w->processes)) {
  450. value = (collected_number) w->cachestat.hit;
  451. write_chart_dimension(w->name, value);
  452. }
  453. }
  454. write_end_chart();
  455. write_begin_chart(NETDATA_APPS_FAMILY, NETDATA_CACHESTAT_MISSES_CHART);
  456. for (w = root; w; w = w->next) {
  457. if (unlikely(w->exposed && w->processes)) {
  458. value = (collected_number) w->cachestat.miss;
  459. write_chart_dimension(w->name, value);
  460. }
  461. }
  462. write_end_chart();
  463. }
  464. /**
  465. * Cachestat sum PIDs
  466. *
  467. * Sum values for all PIDs associated to a group
  468. *
  469. * @param publish output structure.
  470. * @param root structure with listed IPs
  471. */
  472. void ebpf_cachestat_sum_cgroup_pids(netdata_publish_cachestat_t *publish, struct pid_on_target2 *root)
  473. {
  474. memcpy(&publish->prev, &publish->current,sizeof(publish->current));
  475. memset(&publish->current, 0, sizeof(publish->current));
  476. netdata_cachestat_pid_t *dst = &publish->current;
  477. while (root) {
  478. netdata_cachestat_pid_t *src = &root->cachestat;
  479. dst->account_page_dirtied += src->account_page_dirtied;
  480. dst->add_to_page_cache_lru += src->add_to_page_cache_lru;
  481. dst->mark_buffer_dirty += src->mark_buffer_dirty;
  482. dst->mark_page_accessed += src->mark_page_accessed;
  483. root = root->next;
  484. }
  485. }
  486. /**
  487. * Calc chart values
  488. *
  489. * Do necessary math to plot charts.
  490. */
  491. void ebpf_cachestat_calc_chart_values()
  492. {
  493. ebpf_cgroup_target_t *ect;
  494. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  495. ebpf_cachestat_sum_cgroup_pids(&ect->publish_cachestat, ect->pids);
  496. netdata_cachestat_pid_t *current = &ect->publish_cachestat.current;
  497. netdata_cachestat_pid_t *prev = &ect->publish_cachestat.prev;
  498. uint64_t mpa = current->mark_page_accessed - prev->mark_page_accessed;
  499. uint64_t mbd = current->mark_buffer_dirty - prev->mark_buffer_dirty;
  500. ect->publish_cachestat.dirty = mbd;
  501. uint64_t apcl = current->add_to_page_cache_lru - prev->add_to_page_cache_lru;
  502. uint64_t apd = current->account_page_dirtied - prev->account_page_dirtied;
  503. cachestat_update_publish(&ect->publish_cachestat, mpa, mbd, apcl, apd);
  504. }
  505. }
  506. /**
  507. * Create Systemd cachestat Charts
  508. *
  509. * Create charts when systemd is enabled
  510. *
  511. * @param update_every value to overwrite the update frequency set by the server.
  512. **/
  513. static void ebpf_create_systemd_cachestat_charts(int update_every)
  514. {
  515. ebpf_create_charts_on_systemd(NETDATA_CACHESTAT_HIT_RATIO_CHART,
  516. "Hit ratio",
  517. EBPF_COMMON_DIMENSION_PERCENTAGE, NETDATA_CACHESTAT_SUBMENU,
  518. NETDATA_EBPF_CHART_TYPE_LINE, 21100,
  519. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  520. NETDATA_SYSTEMD_CACHESTAT_HIT_RATIO_CONTEXT, NETDATA_EBPF_MODULE_NAME_CACHESTAT,
  521. update_every);
  522. ebpf_create_charts_on_systemd(NETDATA_CACHESTAT_DIRTY_CHART,
  523. "Number of dirty pages",
  524. EBPF_CACHESTAT_DIMENSION_PAGE, NETDATA_CACHESTAT_SUBMENU,
  525. NETDATA_EBPF_CHART_TYPE_LINE, 21101,
  526. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  527. NETDATA_SYSTEMD_CACHESTAT_MODIFIED_CACHE_CONTEXT, NETDATA_EBPF_MODULE_NAME_CACHESTAT,
  528. update_every);
  529. ebpf_create_charts_on_systemd(NETDATA_CACHESTAT_HIT_CHART, "Number of accessed files",
  530. EBPF_CACHESTAT_DIMENSION_HITS, NETDATA_CACHESTAT_SUBMENU,
  531. NETDATA_EBPF_CHART_TYPE_LINE, 21102,
  532. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  533. NETDATA_SYSTEMD_CACHESTAT_HIT_FILE_CONTEXT, NETDATA_EBPF_MODULE_NAME_CACHESTAT,
  534. update_every);
  535. ebpf_create_charts_on_systemd(NETDATA_CACHESTAT_MISSES_CHART, "Files out of page cache",
  536. EBPF_CACHESTAT_DIMENSION_MISSES, NETDATA_CACHESTAT_SUBMENU,
  537. NETDATA_EBPF_CHART_TYPE_LINE, 21103,
  538. ebpf_algorithms[NETDATA_EBPF_ABSOLUTE_IDX],
  539. NETDATA_SYSTEMD_CACHESTAT_MISS_FILES_CONTEXT, NETDATA_EBPF_MODULE_NAME_CACHESTAT,
  540. update_every);
  541. }
  542. /**
  543. * Send Cache Stat charts
  544. *
  545. * Send collected data to Netdata.
  546. *
  547. * @return It returns the status for chart creation, if it is necessary to remove a specific dimension, zero is returned
  548. * otherwise function returns 1 to avoid chart recreation
  549. */
  550. static int ebpf_send_systemd_cachestat_charts()
  551. {
  552. int ret = 1;
  553. ebpf_cgroup_target_t *ect;
  554. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_CACHESTAT_HIT_RATIO_CHART);
  555. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  556. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  557. write_chart_dimension(ect->name, (long long)ect->publish_cachestat.ratio);
  558. } else
  559. ret = 0;
  560. }
  561. write_end_chart();
  562. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_CACHESTAT_DIRTY_CHART);
  563. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  564. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  565. write_chart_dimension(ect->name, (long long)ect->publish_cachestat.dirty);
  566. }
  567. }
  568. write_end_chart();
  569. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_CACHESTAT_HIT_CHART);
  570. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  571. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  572. write_chart_dimension(ect->name, (long long)ect->publish_cachestat.hit);
  573. }
  574. }
  575. write_end_chart();
  576. write_begin_chart(NETDATA_SERVICE_FAMILY, NETDATA_CACHESTAT_MISSES_CHART);
  577. for (ect = ebpf_cgroup_pids; ect; ect = ect->next) {
  578. if (unlikely(ect->systemd) && unlikely(ect->updated)) {
  579. write_chart_dimension(ect->name, (long long)ect->publish_cachestat.miss);
  580. }
  581. }
  582. write_end_chart();
  583. return ret;
  584. }
  585. /**
  586. * Send Directory Cache charts
  587. *
  588. * Send collected data to Netdata.
  589. */
  590. static void ebpf_send_specific_cachestat_data(char *type, netdata_publish_cachestat_t *npc)
  591. {
  592. write_begin_chart(type, NETDATA_CACHESTAT_HIT_RATIO_CHART);
  593. write_chart_dimension(cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_RATIO].name, (long long)npc->ratio);
  594. write_end_chart();
  595. write_begin_chart(type, NETDATA_CACHESTAT_DIRTY_CHART);
  596. write_chart_dimension(cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_DIRTY].name, (long long)npc->dirty);
  597. write_end_chart();
  598. write_begin_chart(type, NETDATA_CACHESTAT_HIT_CHART);
  599. write_chart_dimension(cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_HIT].name, (long long)npc->hit);
  600. write_end_chart();
  601. write_begin_chart(type, NETDATA_CACHESTAT_MISSES_CHART);
  602. write_chart_dimension(cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_MISS].name, (long long)npc->miss);
  603. write_end_chart();
  604. }
  605. /**
  606. * Create specific cache Stat charts
  607. *
  608. * Create charts for cgroup/application.
  609. *
  610. * @param type the chart type.
  611. * @param update_every value to overwrite the update frequency set by the server.
  612. */
  613. static void ebpf_create_specific_cachestat_charts(char *type, int update_every)
  614. {
  615. ebpf_create_chart(type, NETDATA_CACHESTAT_HIT_RATIO_CHART,
  616. "Hit ratio",
  617. EBPF_COMMON_DIMENSION_PERCENTAGE, NETDATA_CACHESTAT_CGROUP_SUBMENU,
  618. NETDATA_CGROUP_CACHESTAT_HIT_RATIO_CONTEXT,
  619. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5200,
  620. ebpf_create_global_dimension,
  621. cachestat_counter_publish_aggregated, 1, update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  622. ebpf_create_chart(type, NETDATA_CACHESTAT_DIRTY_CHART,
  623. "Number of dirty pages",
  624. EBPF_CACHESTAT_DIMENSION_PAGE, NETDATA_CACHESTAT_CGROUP_SUBMENU,
  625. NETDATA_CGROUP_CACHESTAT_MODIFIED_CACHE_CONTEXT,
  626. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5201,
  627. ebpf_create_global_dimension,
  628. &cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_DIRTY], 1,
  629. update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  630. ebpf_create_chart(type, NETDATA_CACHESTAT_HIT_CHART,
  631. "Number of accessed files",
  632. EBPF_CACHESTAT_DIMENSION_HITS, NETDATA_CACHESTAT_CGROUP_SUBMENU,
  633. NETDATA_CGROUP_CACHESTAT_HIT_FILES_CONTEXT,
  634. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5202,
  635. ebpf_create_global_dimension,
  636. &cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_HIT], 1,
  637. update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  638. ebpf_create_chart(type, NETDATA_CACHESTAT_MISSES_CHART,
  639. "Files out of page cache",
  640. EBPF_CACHESTAT_DIMENSION_MISSES, NETDATA_CACHESTAT_CGROUP_SUBMENU,
  641. NETDATA_CGROUP_CACHESTAT_MISS_FILES_CONTEXT,
  642. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5203,
  643. ebpf_create_global_dimension,
  644. &cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_MISS], 1,
  645. update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  646. }
  647. /**
  648. * Obsolete specific cache stat charts
  649. *
  650. * Obsolete charts for cgroup/application.
  651. *
  652. * @param type the chart type.
  653. * @param update_every value to overwrite the update frequency set by the server.
  654. */
  655. static void ebpf_obsolete_specific_cachestat_charts(char *type, int update_every)
  656. {
  657. ebpf_write_chart_obsolete(type, NETDATA_CACHESTAT_HIT_RATIO_CHART,
  658. "Hit ratio",
  659. EBPF_COMMON_DIMENSION_PERCENTAGE, NETDATA_CACHESTAT_SUBMENU,
  660. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CGROUP_CACHESTAT_HIT_RATIO_CONTEXT,
  661. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5200, update_every);
  662. ebpf_write_chart_obsolete(type, NETDATA_CACHESTAT_DIRTY_CHART,
  663. "Number of dirty pages",
  664. EBPF_CACHESTAT_DIMENSION_PAGE, NETDATA_CACHESTAT_SUBMENU,
  665. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CGROUP_CACHESTAT_MODIFIED_CACHE_CONTEXT,
  666. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5201, update_every);
  667. ebpf_write_chart_obsolete(type, NETDATA_CACHESTAT_HIT_CHART,
  668. "Number of accessed files",
  669. EBPF_CACHESTAT_DIMENSION_HITS, NETDATA_CACHESTAT_SUBMENU,
  670. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CGROUP_CACHESTAT_HIT_FILES_CONTEXT,
  671. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5202, update_every);
  672. ebpf_write_chart_obsolete(type, NETDATA_CACHESTAT_MISSES_CHART,
  673. "Files out of page cache",
  674. EBPF_CACHESTAT_DIMENSION_MISSES, NETDATA_CACHESTAT_SUBMENU,
  675. NETDATA_EBPF_CHART_TYPE_LINE, NETDATA_CGROUP_CACHESTAT_MISS_FILES_CONTEXT,
  676. NETDATA_CHART_PRIO_CGROUPS_CONTAINERS + 5203, update_every);
  677. }
  678. /**
  679. * Send data to Netdata calling auxiliary functions.
  680. *
  681. * @param update_every value to overwrite the update frequency set by the server.
  682. */
  683. void ebpf_cachestat_send_cgroup_data(int update_every)
  684. {
  685. if (!ebpf_cgroup_pids)
  686. return;
  687. pthread_mutex_lock(&mutex_cgroup_shm);
  688. ebpf_cgroup_target_t *ect;
  689. ebpf_cachestat_calc_chart_values();
  690. int has_systemd = shm_ebpf_cgroup.header->systemd_enabled;
  691. if (has_systemd) {
  692. static int systemd_charts = 0;
  693. if (!systemd_charts) {
  694. ebpf_create_systemd_cachestat_charts(update_every);
  695. systemd_charts = 1;
  696. }
  697. systemd_charts = ebpf_send_systemd_cachestat_charts();
  698. }
  699. for (ect = ebpf_cgroup_pids; ect ; ect = ect->next) {
  700. if (ect->systemd)
  701. continue;
  702. if (!(ect->flags & NETDATA_EBPF_CGROUP_HAS_CACHESTAT_CHART) && ect->updated) {
  703. ebpf_create_specific_cachestat_charts(ect->name, update_every);
  704. ect->flags |= NETDATA_EBPF_CGROUP_HAS_CACHESTAT_CHART;
  705. }
  706. if (ect->flags & NETDATA_EBPF_CGROUP_HAS_CACHESTAT_CHART) {
  707. if (ect->updated) {
  708. ebpf_send_specific_cachestat_data(ect->name, &ect->publish_cachestat);
  709. } else {
  710. ebpf_obsolete_specific_cachestat_charts(ect->name, update_every);
  711. ect->flags &= ~NETDATA_EBPF_CGROUP_HAS_CACHESTAT_CHART;
  712. }
  713. }
  714. }
  715. pthread_mutex_unlock(&mutex_cgroup_shm);
  716. }
  717. /**
  718. * Main loop for this collector.
  719. */
  720. static void cachestat_collector(ebpf_module_t *em)
  721. {
  722. cachestat_threads.thread = mallocz(sizeof(netdata_thread_t));
  723. cachestat_threads.start_routine = ebpf_cachestat_read_hash;
  724. netdata_thread_create(cachestat_threads.thread, cachestat_threads.name, NETDATA_THREAD_OPTION_JOINABLE,
  725. ebpf_cachestat_read_hash, em);
  726. netdata_publish_cachestat_t publish;
  727. memset(&publish, 0, sizeof(publish));
  728. int apps = em->apps_charts;
  729. int cgroups = em->cgroup_charts;
  730. int update_every = em->update_every;
  731. int counter = update_every - 1;
  732. while (!close_ebpf_plugin) {
  733. pthread_mutex_lock(&collect_data_mutex);
  734. pthread_cond_wait(&collect_data_cond_var, &collect_data_mutex);
  735. if (++counter == update_every) {
  736. counter = 0;
  737. if (apps)
  738. read_apps_table();
  739. if (cgroups)
  740. ebpf_update_cachestat_cgroup();
  741. pthread_mutex_lock(&lock);
  742. cachestat_send_global(&publish);
  743. if (apps)
  744. ebpf_cache_send_apps_data(apps_groups_root_target);
  745. if (cgroups)
  746. ebpf_cachestat_send_cgroup_data(update_every);
  747. pthread_mutex_unlock(&lock);
  748. }
  749. pthread_mutex_unlock(&collect_data_mutex);
  750. }
  751. }
  752. /*****************************************************************
  753. *
  754. * INITIALIZE THREAD
  755. *
  756. *****************************************************************/
  757. /**
  758. * Create global charts
  759. *
  760. * Call ebpf_create_chart to create the charts for the collector.
  761. *
  762. * @param em a pointer to `struct ebpf_module`
  763. */
  764. static void ebpf_create_memory_charts(ebpf_module_t *em)
  765. {
  766. ebpf_create_chart(NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_HIT_RATIO_CHART,
  767. "Hit ratio",
  768. EBPF_COMMON_DIMENSION_PERCENTAGE, NETDATA_CACHESTAT_SUBMENU,
  769. NULL,
  770. NETDATA_EBPF_CHART_TYPE_LINE,
  771. 21100,
  772. ebpf_create_global_dimension,
  773. cachestat_counter_publish_aggregated, 1, em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  774. ebpf_create_chart(NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_DIRTY_CHART,
  775. "Number of dirty pages",
  776. EBPF_CACHESTAT_DIMENSION_PAGE, NETDATA_CACHESTAT_SUBMENU,
  777. NULL,
  778. NETDATA_EBPF_CHART_TYPE_LINE,
  779. 21101,
  780. ebpf_create_global_dimension,
  781. &cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_DIRTY], 1,
  782. em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  783. ebpf_create_chart(NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_HIT_CHART,
  784. "Number of accessed files",
  785. EBPF_CACHESTAT_DIMENSION_HITS, NETDATA_CACHESTAT_SUBMENU,
  786. NULL,
  787. NETDATA_EBPF_CHART_TYPE_LINE,
  788. 21102,
  789. ebpf_create_global_dimension,
  790. &cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_HIT], 1,
  791. em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  792. ebpf_create_chart(NETDATA_EBPF_MEMORY_GROUP, NETDATA_CACHESTAT_MISSES_CHART,
  793. "Files out of page cache",
  794. EBPF_CACHESTAT_DIMENSION_MISSES, NETDATA_CACHESTAT_SUBMENU,
  795. NULL,
  796. NETDATA_EBPF_CHART_TYPE_LINE,
  797. 21103,
  798. ebpf_create_global_dimension,
  799. &cachestat_counter_publish_aggregated[NETDATA_CACHESTAT_IDX_MISS], 1,
  800. em->update_every, NETDATA_EBPF_MODULE_NAME_CACHESTAT);
  801. fflush(stdout);
  802. }
  803. /**
  804. * Allocate vectors used with this thread.
  805. *
  806. * We are not testing the return, because callocz does this and shutdown the software
  807. * case it was not possible to allocate.
  808. *
  809. * @param apps is apps enabled?
  810. */
  811. static void ebpf_cachestat_allocate_global_vectors(int apps)
  812. {
  813. if (apps)
  814. cachestat_pid = callocz((size_t)pid_max, sizeof(netdata_publish_cachestat_t *));
  815. cachestat_vector = callocz((size_t)ebpf_nprocs, sizeof(netdata_cachestat_pid_t));
  816. cachestat_values = callocz((size_t)ebpf_nprocs, sizeof(netdata_idx_t));
  817. memset(cachestat_hash_values, 0, NETDATA_CACHESTAT_END * sizeof(netdata_idx_t));
  818. memset(cachestat_counter_aggregated_data, 0, NETDATA_CACHESTAT_END * sizeof(netdata_syscall_stat_t));
  819. memset(cachestat_counter_publish_aggregated, 0, NETDATA_CACHESTAT_END * sizeof(netdata_publish_syscall_t));
  820. }
  821. /*****************************************************************
  822. *
  823. * MAIN THREAD
  824. *
  825. *****************************************************************/
  826. /**
  827. * Cachestat thread
  828. *
  829. * Thread used to make cachestat thread
  830. *
  831. * @param ptr a pointer to `struct ebpf_module`
  832. *
  833. * @return It always return NULL
  834. */
  835. void *ebpf_cachestat_thread(void *ptr)
  836. {
  837. netdata_thread_cleanup_push(ebpf_cachestat_cleanup, ptr);
  838. ebpf_module_t *em = (ebpf_module_t *)ptr;
  839. em->maps = cachestat_maps;
  840. ebpf_update_pid_table(&cachestat_maps[NETDATA_CACHESTAT_PID_STATS], em);
  841. if (!em->enabled)
  842. goto endcachestat;
  843. pthread_mutex_lock(&lock);
  844. ebpf_cachestat_allocate_global_vectors(em->apps_charts);
  845. probe_links = ebpf_load_program(ebpf_plugin_dir, em, running_on_kernel, isrh, &objects);
  846. if (!probe_links) {
  847. pthread_mutex_unlock(&lock);
  848. em->enabled = CONFIG_BOOLEAN_NO;
  849. goto endcachestat;
  850. }
  851. ebpf_update_stats(&plugin_statistics, em);
  852. int algorithms[NETDATA_CACHESTAT_END] = {
  853. NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_INCREMENTAL_IDX, NETDATA_EBPF_ABSOLUTE_IDX, NETDATA_EBPF_ABSOLUTE_IDX
  854. };
  855. ebpf_global_labels(cachestat_counter_aggregated_data, cachestat_counter_publish_aggregated,
  856. cachestat_counter_dimension_name, cachestat_counter_dimension_name,
  857. algorithms, NETDATA_CACHESTAT_END);
  858. ebpf_create_memory_charts(em);
  859. pthread_mutex_unlock(&lock);
  860. cachestat_collector(em);
  861. endcachestat:
  862. if (!em->enabled)
  863. ebpf_update_disabled_plugin_stats(em);
  864. netdata_thread_cleanup_pop(1);
  865. return NULL;
  866. }