plugin_diskspace.c 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "../proc.plugin/plugin_proc.h"
  // Plugin name passed to rrdset_create_localhost() for the charts created in this file.
  #define PLUGIN_DISKSPACE_NAME "diskspace.plugin"
  // Default value of the "exclude space metrics on paths" option (patterns matched against mount points).
  #define DEFAULT_EXCLUDED_PATHS "/proc/* /sys/* /var/run/user/* /run/user/* /snap/* /var/lib/docker/*"
  // Default value of the "exclude space metrics on filesystems" option (patterns matched against the filesystem type).
  #define DEFAULT_EXCLUDED_FILESYSTEMS "*gvfs *gluster* *s3fs *ipfs *davfs2 *httpfs *sshfs *gdfs *moosefs fusectl autofs"
  // Default value of the "exclude inode metrics on filesystems" option; a match disables only the inodes chart.
  #define DEFAULT_EXCLUDED_FILESYSTEMS_INODES "msdosfs msdos vfat overlayfs aufs* *unionfs"
  // Configuration section that holds the global options of this collector.
  #define CONFIG_SECTION_DISKSPACE "plugin:proc:diskspace"
  // Help text emitted in the JSON response of the mount points function.
  #define RRDFUNCTIONS_DISKSPACE_HELP "View mount point statistics"
  // Multiplied by update_every to obtain the stat()/statvfs() duration, in microseconds,
  // above which a mount point is flagged as slow.
  #define MAX_STAT_USEC 10000LU
  // Lower bound, in seconds, of the update interval used by the slow worker thread.
  #define SLOW_UPDATE_EVERY 5
  // Handle of the slow worker thread; joined and freed by diskspace_main_cleanup().
  static netdata_thread_t *diskspace_slow_thread = NULL;
  // Most recently loaded mount list; replaced by mountinfo_reload().
  static struct mountinfo *disk_mountinfo_root = NULL;
  // Minimum number of seconds between two non-forced reloads of the mount list.
  static int check_for_new_mountpoints_every = 15;
  // When non-zero, mount_point_cleanup() releases the charts of mount points that were not updated.
  static int cleanup_mount_points = 1;
  15. static inline void mountinfo_reload(int force) {
  16. static time_t last_loaded = 0;
  17. time_t now = now_realtime_sec();
  18. if(force || now - last_loaded >= check_for_new_mountpoints_every) {
  19. // mountinfo_free_all() can be called with NULL disk_mountinfo_root
  20. mountinfo_free_all(disk_mountinfo_root);
  21. // re-read mountinfo in case something changed
  22. disk_mountinfo_root = mountinfo_read(0);
  23. last_loaded = now;
  24. }
  25. }
  // Data to be stored in DICTIONARY dict_mountpoints used by do_disk_space_stats().
  // This DICTIONARY is used to lookup the settings of the mount point on each iteration.
  struct mount_point_metadata {
      int do_space;       // CONFIG_BOOLEAN_YES / NO / AUTO: whether the space chart is collected
      int do_inodes;      // CONFIG_BOOLEAN_YES / NO / AUTO: whether the inodes chart is collected
      int shown_error;    // set once a statvfs() failure has been logged, cleared on the next success
      int updated;        // set when the mount point was seen in the current iteration; cleared by mount_point_cleanup()
      int slow;           // non-zero when the mount point is handled by the slow worker thread
      bool function_ready; // true when the last collection rendered at least one chart; the mount points function skips entries without it
      STRING *filesystem; // copy of the filesystem reported by mountinfo
      STRING *mountroot;  // copy of the root reported by mountinfo
      RRDLABELS *chart_labels; // labels (mount_point, filesystem, mount_root) applied to both charts
      size_t collected; // the number of times this has been collected
      RRDSET *st_space;           // "disk_space" chart and its dimensions
      RRDDIM *rd_space_used;
      RRDDIM *rd_space_avail;
      RRDDIM *rd_space_reserved;
      RRDSET *st_inodes;          // "disk_inodes" chart and its dimensions
      RRDDIM *rd_inodes_used;
      RRDDIM *rd_inodes_avail;
      RRDDIM *rd_inodes_reserved;
  };
  // Mount point path -> struct mount_point_metadata; created lazily by do_disk_space_stats().
  static DICTIONARY *dict_mountpoints = NULL;
  // Mark the chart `st` as obsolete (when it is set) and reset the caller's pointer to NULL.
  // `st` must be a modifiable pointer lvalue; nothing happens when it is already NULL.
  // The body is wrapped in the usual do { ... } while(0) so that it runs exactly once
  // and the macro behaves like a single statement.
  #define rrdset_obsolete_and_pointer_null(st) do { if(st) { rrdset_is_obsolete___safe_from_collector_thread(st); (st) = NULL; } } while(0)
  50. int mount_point_cleanup(const char *name, void *entry, int slow) {
  51. (void)name;
  52. struct mount_point_metadata *mp = (struct mount_point_metadata *)entry;
  53. if(!mp) return 0;
  54. if (slow != mp->slow)
  55. return 0;
  56. if(likely(mp->updated)) {
  57. mp->updated = 0;
  58. return 0;
  59. }
  60. if(likely(cleanup_mount_points && mp->collected)) {
  61. mp->function_ready = false;
  62. mp->collected = 0;
  63. mp->updated = 0;
  64. mp->shown_error = 0;
  65. string_freez(mp->filesystem);
  66. string_freez(mp->mountroot);
  67. rrdset_obsolete_and_pointer_null(mp->st_space);
  68. rrdset_obsolete_and_pointer_null(mp->st_inodes);
  69. mp->rd_space_avail = NULL;
  70. mp->rd_space_used = NULL;
  71. mp->rd_space_reserved = NULL;
  72. mp->rd_inodes_avail = NULL;
  73. mp->rd_inodes_used = NULL;
  74. mp->rd_inodes_reserved = NULL;
  75. }
  76. return 0;
  77. }
  78. int mount_point_cleanup_cb(const DICTIONARY_ITEM *item, void *entry, void *data __maybe_unused) {
  79. const char *name = dictionary_acquired_item_name(item);
  80. return mount_point_cleanup(name, (struct mount_point_metadata *)entry, 0);
  81. }
  // a copy of basic mountinfo fields
  // Each node owns its strings (duplicated by basic_mountinfo_create_and_copy(),
  // released by free_basic_mountinfo()) and links to the next node of a singly linked list.
  struct basic_mountinfo {
      char *persistent_id;
      char *root;
      char *mount_point;
      char *filesystem;
      struct basic_mountinfo *next;
  };
  // Mount points queued by do_disk_space_stats() for the slow worker, which takes the list over.
  static struct basic_mountinfo *slow_mountinfo_tmp_root = NULL;
  // Held by the slow worker while it takes over slow_mountinfo_tmp_root.
  static netdata_mutex_t slow_mountinfo_mutex;
  92. static struct basic_mountinfo *basic_mountinfo_create_and_copy(struct mountinfo* mi)
  93. {
  94. struct basic_mountinfo *bmi = callocz(1, sizeof(struct basic_mountinfo));
  95. if (mi) {
  96. bmi->persistent_id = strdupz(mi->persistent_id);
  97. bmi->root = strdupz(mi->root);
  98. bmi->mount_point = strdupz(mi->mount_point);
  99. bmi->filesystem = strdupz(mi->filesystem);
  100. }
  101. return bmi;
  102. }
  103. static void add_basic_mountinfo(struct basic_mountinfo **root, struct mountinfo *mi)
  104. {
  105. if (!root)
  106. return;
  107. struct basic_mountinfo *bmi = basic_mountinfo_create_and_copy(mi);
  108. bmi->next = *root;
  109. *root = bmi;
  110. };
  111. static void free_basic_mountinfo(struct basic_mountinfo *bmi)
  112. {
  113. if (bmi) {
  114. freez(bmi->persistent_id);
  115. freez(bmi->root);
  116. freez(bmi->mount_point);
  117. freez(bmi->filesystem);
  118. freez(bmi);
  119. }
  120. };
  121. static void free_basic_mountinfo_list(struct basic_mountinfo *root)
  122. {
  123. struct basic_mountinfo *bmi = root, *next;
  124. while (bmi) {
  125. next = bmi->next;
  126. free_basic_mountinfo(bmi);
  127. bmi = next;
  128. }
  129. }
  130. static void calculate_values_and_show_charts(
  131. struct basic_mountinfo *mi,
  132. struct mount_point_metadata *m,
  133. struct statvfs *buff_statvfs,
  134. int update_every)
  135. {
  136. const char *family = mi->mount_point;
  137. const char *disk = mi->persistent_id;
  138. // logic found at get_fs_usage() in coreutils
  139. unsigned long bsize = (buff_statvfs->f_frsize) ? buff_statvfs->f_frsize : buff_statvfs->f_bsize;
  140. fsblkcnt_t bavail = buff_statvfs->f_bavail;
  141. fsblkcnt_t btotal = buff_statvfs->f_blocks;
  142. fsblkcnt_t bavail_root = buff_statvfs->f_bfree;
  143. fsblkcnt_t breserved_root = bavail_root - bavail;
  144. fsblkcnt_t bused = likely(btotal >= bavail_root) ? btotal - bavail_root : bavail_root - btotal;
  145. #ifdef NETDATA_INTERNAL_CHECKS
  146. if(unlikely(btotal != bavail + breserved_root + bused))
  147. collector_error("DISKSPACE: disk block statistics for '%s' (disk '%s') do not sum up: total = %llu, available = %llu, reserved = %llu, used = %llu", mi->mount_point, disk, (unsigned long long)btotal, (unsigned long long)bavail, (unsigned long long)breserved_root, (unsigned long long)bused);
  148. #endif
  149. // --------------------------------------------------------------------------
  150. fsfilcnt_t favail = buff_statvfs->f_favail;
  151. fsfilcnt_t ftotal = buff_statvfs->f_files;
  152. fsfilcnt_t favail_root = buff_statvfs->f_ffree;
  153. fsfilcnt_t freserved_root = favail_root - favail;
  154. fsfilcnt_t fused = ftotal - favail_root;
  155. if(m->do_inodes == CONFIG_BOOLEAN_AUTO && favail == (fsfilcnt_t)-1) {
  156. // this file system does not support inodes reporting
  157. // eg. cephfs
  158. m->do_inodes = CONFIG_BOOLEAN_NO;
  159. }
  160. #ifdef NETDATA_INTERNAL_CHECKS
  161. if(unlikely(btotal != bavail + breserved_root + bused))
  162. collector_error("DISKSPACE: disk inode statistics for '%s' (disk '%s') do not sum up: total = %llu, available = %llu, reserved = %llu, used = %llu", mi->mount_point, disk, (unsigned long long)ftotal, (unsigned long long)favail, (unsigned long long)freserved_root, (unsigned long long)fused);
  163. #endif
  164. int rendered = 0;
  165. if(m->do_space == CONFIG_BOOLEAN_YES || (m->do_space == CONFIG_BOOLEAN_AUTO &&
  166. (bavail || breserved_root || bused ||
  167. netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  168. if(unlikely(!m->st_space) || m->st_space->update_every != update_every) {
  169. m->do_space = CONFIG_BOOLEAN_YES;
  170. m->st_space = rrdset_find_active_bytype_localhost("disk_space", disk);
  171. if(unlikely(!m->st_space || m->st_space->update_every != update_every)) {
  172. char title[4096 + 1];
  173. snprintfz(title, sizeof(title) - 1, "Disk Space Usage");
  174. m->st_space = rrdset_create_localhost(
  175. "disk_space"
  176. , disk
  177. , NULL
  178. , family
  179. , "disk.space"
  180. , title
  181. , "GiB"
  182. , PLUGIN_DISKSPACE_NAME
  183. , NULL
  184. , NETDATA_CHART_PRIO_DISKSPACE_SPACE
  185. , update_every
  186. , RRDSET_TYPE_STACKED
  187. );
  188. }
  189. rrdset_update_rrdlabels(m->st_space, m->chart_labels);
  190. m->rd_space_avail = rrddim_add(m->st_space, "avail", NULL, (collected_number)bsize, 1024 * 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  191. m->rd_space_used = rrddim_add(m->st_space, "used", NULL, (collected_number)bsize, 1024 * 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  192. m->rd_space_reserved = rrddim_add(m->st_space, "reserved_for_root", "reserved for root", (collected_number)bsize, 1024 * 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  193. }
  194. rrddim_set_by_pointer(m->st_space, m->rd_space_avail, (collected_number)bavail);
  195. rrddim_set_by_pointer(m->st_space, m->rd_space_used, (collected_number)bused);
  196. rrddim_set_by_pointer(m->st_space, m->rd_space_reserved, (collected_number)breserved_root);
  197. rrdset_done(m->st_space);
  198. rendered++;
  199. }
  200. if(m->do_inodes == CONFIG_BOOLEAN_YES || (m->do_inodes == CONFIG_BOOLEAN_AUTO &&
  201. (favail || freserved_root || fused ||
  202. netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  203. if(unlikely(!m->st_inodes) || m->st_inodes->update_every != update_every) {
  204. m->do_inodes = CONFIG_BOOLEAN_YES;
  205. m->st_inodes = rrdset_find_active_bytype_localhost("disk_inodes", disk);
  206. if(unlikely(!m->st_inodes) || m->st_inodes->update_every != update_every) {
  207. char title[4096 + 1];
  208. snprintfz(title, sizeof(title) - 1, "Disk Files (inodes) Usage");
  209. m->st_inodes = rrdset_create_localhost(
  210. "disk_inodes"
  211. , disk
  212. , NULL
  213. , family
  214. , "disk.inodes"
  215. , title
  216. , "inodes"
  217. , PLUGIN_DISKSPACE_NAME
  218. , NULL
  219. , NETDATA_CHART_PRIO_DISKSPACE_INODES
  220. , update_every
  221. , RRDSET_TYPE_STACKED
  222. );
  223. }
  224. rrdset_update_rrdlabels(m->st_inodes, m->chart_labels);
  225. m->rd_inodes_avail = rrddim_add(m->st_inodes, "avail", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  226. m->rd_inodes_used = rrddim_add(m->st_inodes, "used", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  227. m->rd_inodes_reserved = rrddim_add(m->st_inodes, "reserved_for_root", "reserved for root", 1, 1, RRD_ALGORITHM_ABSOLUTE);
  228. }
  229. rrddim_set_by_pointer(m->st_inodes, m->rd_inodes_avail, (collected_number)favail);
  230. rrddim_set_by_pointer(m->st_inodes, m->rd_inodes_used, (collected_number)fused);
  231. rrddim_set_by_pointer(m->st_inodes, m->rd_inodes_reserved, (collected_number)freserved_root);
  232. rrdset_done(m->st_inodes);
  233. rendered++;
  234. }
  235. m->function_ready = rendered > 0;
  236. if(likely(rendered))
  237. m->collected++;
  238. }
  // Collect space and inode statistics for one mount point from the regular collection path.
  //
  // mi            the mount point to process
  // update_every  update frequency of the charts; also scales the "slow" threshold
  //
  // The first call builds the exclusion patterns and the dict_mountpoints dictionary.
  // The first time a mount point is seen its settings are resolved from the configuration
  // and stored in dict_mountpoints; later calls reuse the stored entry.
  // Mount points flagged as slow are not measured here: a copy is queued on
  // slow_mountinfo_tmp_root and the function returns.
  static inline void do_disk_space_stats(struct mountinfo *mi, int update_every) {
      const char *disk = mi->persistent_id;

      static SIMPLE_PATTERN *excluded_mountpoints = NULL;
      static SIMPLE_PATTERN *excluded_filesystems = NULL;
      static SIMPLE_PATTERN *excluded_filesystems_inodes = NULL;

      // a stat()/statvfs() call taking longer than this marks the mount point as slow
      usec_t slow_timeout = MAX_STAT_USEC * update_every;

      int do_space, do_inodes;

      // one-time initialisation, keyed on the dictionary not existing yet
      if(unlikely(!dict_mountpoints)) {
          SIMPLE_PREFIX_MODE mode = SIMPLE_PATTERN_EXACT;

          if(config_move("plugin:proc:/proc/diskstats", "exclude space metrics on paths", CONFIG_SECTION_DISKSPACE, "exclude space metrics on paths") != -1) {
              // old configuration, enable backwards compatibility
              mode = SIMPLE_PATTERN_PREFIX;
          }

          excluded_mountpoints = simple_pattern_create(
              config_get(CONFIG_SECTION_DISKSPACE, "exclude space metrics on paths", DEFAULT_EXCLUDED_PATHS),
              NULL,
              mode,
              true);

          excluded_filesystems = simple_pattern_create(
              config_get(CONFIG_SECTION_DISKSPACE, "exclude space metrics on filesystems", DEFAULT_EXCLUDED_FILESYSTEMS),
              NULL,
              SIMPLE_PATTERN_EXACT,
              true);

          excluded_filesystems_inodes = simple_pattern_create(
              config_get(CONFIG_SECTION_DISKSPACE, "exclude inode metrics on filesystems", DEFAULT_EXCLUDED_FILESYSTEMS_INODES),
              NULL,
              SIMPLE_PATTERN_EXACT,
              true);

          dict_mountpoints = dictionary_create_advanced(DICT_OPTION_NONE, &dictionary_stats_category_collectors, 0);
      }

      struct mount_point_metadata *m = dictionary_get(dict_mountpoints, mi->mount_point);
      if(unlikely(!m)) {
          // first time this mount point is seen: resolve its settings
          int slow = 0;

          int def_space = config_get_boolean_ondemand(CONFIG_SECTION_DISKSPACE, "space usage for all disks", CONFIG_BOOLEAN_AUTO);
          int def_inodes = config_get_boolean_ondemand(CONFIG_SECTION_DISKSPACE, "inodes usage for all disks", CONFIG_BOOLEAN_AUTO);

          // an excluded path or filesystem disables both charts by default
          if(unlikely(simple_pattern_matches(excluded_mountpoints, mi->mount_point))) {
              def_space = CONFIG_BOOLEAN_NO;
              def_inodes = CONFIG_BOOLEAN_NO;
          }

          if(unlikely(simple_pattern_matches(excluded_filesystems, mi->filesystem))) {
              def_space = CONFIG_BOOLEAN_NO;
              def_inodes = CONFIG_BOOLEAN_NO;
          }

          // this list disables only the inodes chart
          if (unlikely(simple_pattern_matches(excluded_filesystems_inodes, mi->filesystem))) {
              def_inodes = CONFIG_BOOLEAN_NO;
          }

          // check if the mount point is a directory #2407
          // but only when it is enabled by default #4491
          if(def_space != CONFIG_BOOLEAN_NO || def_inodes != CONFIG_BOOLEAN_NO) {
              usec_t start_time = now_monotonic_high_precision_usec();
              struct stat bs;

              if(stat(mi->mount_point, &bs) == -1) {
                  collector_error("DISKSPACE: Cannot stat() mount point '%s' (disk '%s', filesystem '%s', root '%s')."
                                  , mi->mount_point
                                  , disk
                                  , mi->filesystem?mi->filesystem:""
                                  , mi->root?mi->root:""
                  );
                  def_space = CONFIG_BOOLEAN_NO;
                  def_inodes = CONFIG_BOOLEAN_NO;
              }
              else {
                  if((bs.st_mode & S_IFMT) != S_IFDIR) {
                      collector_error("DISKSPACE: Mount point '%s' (disk '%s', filesystem '%s', root '%s') is not a directory."
                                      , mi->mount_point
                                      , disk
                                      , mi->filesystem?mi->filesystem:""
                                      , mi->root?mi->root:""
                      );
                      def_space = CONFIG_BOOLEAN_NO;
                      def_inodes = CONFIG_BOOLEAN_NO;
                  }
              }

              // the duration of the stat() call decides whether this mount point starts as slow
              if ((now_monotonic_high_precision_usec() - start_time) > slow_timeout)
                  slow = 1;
          }

          // per mount point overrides live in their own section and are read only when present
          char var_name[4096 + 1];
          snprintfz(var_name, 4096, "plugin:proc:diskspace:%s", mi->mount_point);

          do_space = def_space;
          do_inodes = def_inodes;

          if (config_exists(var_name, "space usage"))
              do_space = config_get_boolean_ondemand(var_name, "space usage", def_space);
          if (config_exists(var_name, "inodes usage"))
              do_inodes = config_get_boolean_ondemand(var_name, "inodes usage", def_inodes);

          struct mount_point_metadata mp = {
              .do_space = do_space,
              .do_inodes = do_inodes,
              .shown_error = 0,
              .updated = 0,
              .slow = 0,

              .collected = 0,

              .st_space = NULL,
              .rd_space_avail = NULL,
              .rd_space_used = NULL,
              .rd_space_reserved = NULL,

              .st_inodes = NULL,
              .rd_inodes_avail = NULL,
              .rd_inodes_used = NULL,
              .rd_inodes_reserved = NULL
          };

          mp.filesystem = string_strdupz(mi->filesystem);
          mp.mountroot = string_strdupz(mi->root);

          mp.chart_labels = rrdlabels_create();
          rrdlabels_add(mp.chart_labels, "mount_point", mi->mount_point, RRDLABEL_SRC_AUTO);
          rrdlabels_add(mp.chart_labels, "filesystem", mi->filesystem, RRDLABEL_SRC_AUTO);
          rrdlabels_add(mp.chart_labels, "mount_root", mi->root, RRDLABEL_SRC_AUTO);

          // from here on `m` refers to the entry returned by the dictionary
          m = dictionary_set(dict_mountpoints, mi->mount_point, &mp, sizeof(struct mount_point_metadata));

          m->slow = slow;
      }

      // slow mount points are handed over to the slow worker
      if (m->slow) {
          add_basic_mountinfo(&slow_mountinfo_tmp_root, mi);
          return;
      }

      m->updated = 1;

      if(unlikely(m->do_space == CONFIG_BOOLEAN_NO && m->do_inodes == CONFIG_BOOLEAN_NO))
          return;

      // skip read-only mount points that are not in the protected list, were never
      // collected, and have neither chart explicitly enabled
      if (unlikely(
              mi->flags & MOUNTINFO_READONLY &&
              !(mi->flags & MOUNTINFO_IS_IN_SYSD_PROTECTED_LIST) &&
              !m->collected &&
              m->do_space != CONFIG_BOOLEAN_YES &&
              m->do_inodes != CONFIG_BOOLEAN_YES))
          return;

      usec_t start_time = now_monotonic_high_precision_usec();
      struct statvfs buff_statvfs;

      if (statvfs(mi->mount_point, &buff_statvfs) < 0) {
          // log the failure once, until statvfs() succeeds again
          if(!m->shown_error) {
              collector_error("DISKSPACE: failed to statvfs() mount point '%s' (disk '%s', filesystem '%s', root '%s')"
                              , mi->mount_point
                              , disk
                              , mi->filesystem?mi->filesystem:""
                              , mi->root?mi->root:""
              );
              m->shown_error = 1;
          }
          return;
      }

      // this sample is still published below; the slow flag takes effect on the next call
      if ((now_monotonic_high_precision_usec() - start_time) > slow_timeout)
          m->slow = 1;

      m->shown_error = 0;

      // temporary view borrowing the strings of `mi`; nothing is copied or freed
      struct basic_mountinfo bmi;
      bmi.mount_point = mi->mount_point;
      bmi.persistent_id = mi->persistent_id;
      bmi.filesystem = mi->filesystem;
      bmi.root = mi->root;

      calculate_values_and_show_charts(&bmi, m, &buff_statvfs, update_every);
  }
  386. static inline void do_slow_disk_space_stats(struct basic_mountinfo *mi, int update_every) {
  387. struct mount_point_metadata *m = dictionary_get(dict_mountpoints, mi->mount_point);
  388. m->updated = 1;
  389. struct statvfs buff_statvfs;
  390. if (statvfs(mi->mount_point, &buff_statvfs) < 0) {
  391. if(!m->shown_error) {
  392. collector_error("DISKSPACE: failed to statvfs() mount point '%s' (disk '%s', filesystem '%s', root '%s')"
  393. , mi->mount_point
  394. , mi->persistent_id
  395. , mi->filesystem?mi->filesystem:""
  396. , mi->root?mi->root:""
  397. );
  398. m->shown_error = 1;
  399. }
  400. return;
  401. }
  402. m->shown_error = 0;
  403. calculate_values_and_show_charts(mi, m, &buff_statvfs, update_every);
  404. }
  // Cleanup handler installed by diskspace_slow_worker(): logs the shutdown and
  // unregisters the worker. The argument is not used.
  static void diskspace_slow_worker_cleanup(void *ptr)
  {
      (void)ptr;

      collector_info("cleaning up...");

      worker_unregister();
  }
  // Job ids reported by the slow worker thread: collecting mount points, and cleaning them up.
  #define WORKER_JOB_SLOW_MOUNTPOINT 0
  #define WORKER_JOB_SLOW_CLEANUP 1

  // Argument handed to diskspace_slow_worker().
  struct slow_worker_data {
      netdata_thread_t *slow_thread; // passed as the argument of the thread's cleanup handler
      int update_every;              // requested update frequency; the worker never goes below SLOW_UPDATE_EVERY
  };
  417. void *diskspace_slow_worker(void *ptr)
  418. {
  419. struct slow_worker_data *data = (struct slow_worker_data *)ptr;
  420. worker_register("DISKSPACE_SLOW");
  421. worker_register_job_name(WORKER_JOB_SLOW_MOUNTPOINT, "mountpoint");
  422. worker_register_job_name(WORKER_JOB_SLOW_CLEANUP, "cleanup");
  423. struct basic_mountinfo *slow_mountinfo_root = NULL;
  424. int slow_update_every = data->update_every > SLOW_UPDATE_EVERY ? data->update_every : SLOW_UPDATE_EVERY;
  425. netdata_thread_cleanup_push(diskspace_slow_worker_cleanup, data->slow_thread);
  426. usec_t step = slow_update_every * USEC_PER_SEC;
  427. usec_t real_step = USEC_PER_SEC;
  428. heartbeat_t hb;
  429. heartbeat_init(&hb);
  430. while(service_running(SERVICE_COLLECTORS)) {
  431. worker_is_idle();
  432. heartbeat_next(&hb, USEC_PER_SEC);
  433. if (real_step < step) {
  434. real_step += USEC_PER_SEC;
  435. continue;
  436. }
  437. real_step = USEC_PER_SEC;
  438. usec_t start_time = now_monotonic_high_precision_usec();
  439. if (!dict_mountpoints)
  440. continue;
  441. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  442. // --------------------------------------------------------------------------
  443. // disk space metrics
  444. worker_is_busy(WORKER_JOB_SLOW_MOUNTPOINT);
  445. netdata_mutex_lock(&slow_mountinfo_mutex);
  446. free_basic_mountinfo_list(slow_mountinfo_root);
  447. slow_mountinfo_root = slow_mountinfo_tmp_root;
  448. slow_mountinfo_tmp_root = NULL;
  449. netdata_mutex_unlock(&slow_mountinfo_mutex);
  450. struct basic_mountinfo *bmi;
  451. for(bmi = slow_mountinfo_root; bmi; bmi = bmi->next) {
  452. do_slow_disk_space_stats(bmi, slow_update_every);
  453. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  454. }
  455. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  456. worker_is_busy(WORKER_JOB_SLOW_CLEANUP);
  457. for(bmi = slow_mountinfo_root; bmi; bmi = bmi->next) {
  458. struct mount_point_metadata *m = dictionary_get(dict_mountpoints, bmi->mount_point);
  459. if (m)
  460. mount_point_cleanup(bmi->mount_point, m, 1);
  461. }
  462. usec_t dt = now_monotonic_high_precision_usec() - start_time;
  463. if (dt > step) {
  464. slow_update_every = (dt / USEC_PER_SEC) * 3 / 2;
  465. if (slow_update_every % SLOW_UPDATE_EVERY)
  466. slow_update_every += SLOW_UPDATE_EVERY - slow_update_every % SLOW_UPDATE_EVERY;
  467. step = slow_update_every * USEC_PER_SEC;
  468. }
  469. }
  470. netdata_thread_cleanup_pop(1);
  471. free_basic_mountinfo_list(slow_mountinfo_root);
  472. return NULL;
  473. }
  474. static void diskspace_main_cleanup(void *ptr) {
  475. rrd_collector_finished();
  476. worker_unregister();
  477. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
  478. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  479. collector_info("cleaning up...");
  480. if (diskspace_slow_thread) {
  481. netdata_thread_join(*diskspace_slow_thread, NULL);
  482. freez(diskspace_slow_thread);
  483. }
  484. free_basic_mountinfo_list(slow_mountinfo_tmp_root);
  485. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  486. }
  // Worker job ids; presumably reported by the main collection loop, which is not
  // visible in this part of the file - TODO confirm.
  #define WORKER_JOB_MOUNTINFO 0
  #define WORKER_JOB_MOUNTPOINT 1
  #define WORKER_JOB_CLEANUP 2

  // compile-time guard: the worker utilization limit must leave room for the three job ids above
  #if WORKER_UTILIZATION_MAX_JOB_TYPES < 3
  #error WORKER_UTILIZATION_MAX_JOB_TYPES has to be at least 3
  #endif
  493. int diskspace_function_mount_points(BUFFER *wb, int timeout __maybe_unused, const char *function __maybe_unused,
  494. void *collector_data __maybe_unused,
  495. rrd_function_result_callback_t result_cb, void *result_cb_data,
  496. rrd_function_is_cancelled_cb_t is_cancelled_cb, void *is_cancelled_cb_data,
  497. rrd_function_register_canceller_cb_t register_canceller_cb __maybe_unused,
  498. void *register_canceller_cb_data __maybe_unused) {
  499. buffer_flush(wb);
  500. wb->content_type = CT_APPLICATION_JSON;
  501. buffer_json_initialize(wb, "\"", "\"", 0, true, BUFFER_JSON_OPTIONS_DEFAULT);
  502. buffer_json_member_add_string(wb, "hostname", rrdhost_hostname(localhost));
  503. buffer_json_member_add_uint64(wb, "status", HTTP_RESP_OK);
  504. buffer_json_member_add_string(wb, "type", "table");
  505. buffer_json_member_add_time_t(wb, "update_every", 1);
  506. buffer_json_member_add_string(wb, "help", RRDFUNCTIONS_DISKSPACE_HELP);
  507. buffer_json_member_add_array(wb, "data");
  508. double max_space_util = 0.0;
  509. double max_space_avail = 0.0;
  510. double max_space_used = 0.0;
  511. double max_space_reserved = 0.0;
  512. double max_inodes_util = 0.0;
  513. double max_inodes_avail = 0.0;
  514. double max_inodes_used = 0.0;
  515. double max_inodes_reserved = 0.0;
  516. struct mount_point_metadata *mp;
  517. dfe_start_write(dict_mountpoints, mp) {
  518. if (!mp->function_ready)
  519. continue;
  520. buffer_json_add_array_item_array(wb);
  521. buffer_json_add_array_item_string(wb, mp_dfe.name);
  522. buffer_json_add_array_item_string(wb, string2str(mp->filesystem));
  523. buffer_json_add_array_item_string(wb, string2str(mp->mountroot));
  524. double space_avail = rrddim_get_last_stored_value(mp->rd_space_avail, &max_space_avail, 1.0);
  525. double space_used = rrddim_get_last_stored_value(mp->rd_space_used, &max_space_used, 1.0);
  526. double space_reserved = rrddim_get_last_stored_value(mp->rd_space_reserved, &max_space_reserved, 1.0);
  527. double inodes_avail = rrddim_get_last_stored_value(mp->rd_inodes_avail, &max_inodes_avail, 1.0);
  528. double inodes_used = rrddim_get_last_stored_value(mp->rd_inodes_used, &max_inodes_used, 1.0);
  529. double inodes_reserved = rrddim_get_last_stored_value(mp->rd_inodes_reserved, &max_inodes_reserved, 1.0);
  530. double space_util = NAN;
  531. if (!isnan(space_avail) && !isnan(space_used)) {
  532. space_util = space_avail + space_used > 0 ? space_used * 100.0 / (space_avail + space_used) : 0;
  533. max_space_util = MAX(max_space_util, space_util);
  534. }
  535. double inodes_util = NAN;
  536. if (!isnan(inodes_avail) && !isnan(inodes_used)) {
  537. inodes_util = inodes_avail + inodes_used > 0 ? inodes_used * 100.0 / (inodes_avail + inodes_used) : 0;
  538. max_inodes_util = MAX(max_inodes_util, inodes_util);
  539. }
  540. buffer_json_add_array_item_double(wb, space_util);
  541. buffer_json_add_array_item_double(wb, space_avail);
  542. buffer_json_add_array_item_double(wb, space_used);
  543. buffer_json_add_array_item_double(wb, space_reserved);
  544. buffer_json_add_array_item_double(wb, inodes_util);
  545. buffer_json_add_array_item_double(wb, inodes_avail);
  546. buffer_json_add_array_item_double(wb, inodes_used);
  547. buffer_json_add_array_item_double(wb, inodes_reserved);
  548. buffer_json_array_close(wb);
  549. }
  550. dfe_done(mp);
  551. buffer_json_array_close(wb); // data
  552. buffer_json_member_add_object(wb, "columns");
  553. {
  554. size_t field_id = 0;
  555. buffer_rrdf_table_add_field(wb, field_id++, "Mountpoint", "Mountpoint Name",
  556. RRDF_FIELD_TYPE_STRING, RRDF_FIELD_VISUAL_VALUE, RRDF_FIELD_TRANSFORM_NONE,
  557. 0, NULL, NAN, RRDF_FIELD_SORT_ASCENDING, NULL,
  558. RRDF_FIELD_SUMMARY_COUNT, RRDF_FIELD_FILTER_MULTISELECT,
  559. RRDF_FIELD_OPTS_VISIBLE | RRDF_FIELD_OPTS_UNIQUE_KEY | RRDF_FIELD_OPTS_STICKY | RRDF_FIELD_OPTS_FULL_WIDTH,
  560. NULL);
  561. buffer_rrdf_table_add_field(wb, field_id++, "Filesystem", "Mountpoint Filesystem",
  562. RRDF_FIELD_TYPE_STRING, RRDF_FIELD_VISUAL_VALUE, RRDF_FIELD_TRANSFORM_NONE,
  563. 0, NULL, NAN, RRDF_FIELD_SORT_ASCENDING, NULL,
  564. RRDF_FIELD_SUMMARY_COUNT, RRDF_FIELD_FILTER_MULTISELECT,
  565. RRDF_FIELD_OPTS_VISIBLE | RRDF_FIELD_OPTS_UNIQUE_KEY,
  566. NULL);
  567. buffer_rrdf_table_add_field(wb, field_id++, "Root", "Mountpoint Root",
  568. RRDF_FIELD_TYPE_STRING, RRDF_FIELD_VISUAL_VALUE, RRDF_FIELD_TRANSFORM_NONE,
  569. 0, NULL, NAN, RRDF_FIELD_SORT_ASCENDING, NULL,
  570. RRDF_FIELD_SUMMARY_COUNT, RRDF_FIELD_FILTER_MULTISELECT,
  571. RRDF_FIELD_OPTS_UNIQUE_KEY,
  572. NULL);
  573. buffer_rrdf_table_add_field(wb, field_id++, "Used%", "Space Utilization",
  574. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  575. 2, "%", max_space_util, RRDF_FIELD_SORT_DESCENDING, NULL,
  576. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  577. RRDF_FIELD_OPTS_VISIBLE,
  578. NULL);
  579. buffer_rrdf_table_add_field(wb, field_id++, "Avail", "Space Avail",
  580. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  581. 2, "GiB", max_space_avail, RRDF_FIELD_SORT_DESCENDING, NULL,
  582. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  583. RRDF_FIELD_OPTS_VISIBLE,
  584. NULL);
  585. buffer_rrdf_table_add_field(wb, field_id++, "Used", "Space Used",
  586. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  587. 2, "GiB", max_space_used, RRDF_FIELD_SORT_DESCENDING, NULL,
  588. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  589. RRDF_FIELD_OPTS_VISIBLE,
  590. NULL);
  591. buffer_rrdf_table_add_field(wb, field_id++, "Reserved", "Space Reserved for root",
  592. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  593. 2, "GiB", max_space_reserved, RRDF_FIELD_SORT_DESCENDING, NULL,
  594. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  595. RRDF_FIELD_OPTS_VISIBLE,
  596. NULL);
  597. buffer_rrdf_table_add_field(wb, field_id++, "iUsed%", "Inodes Utilization",
  598. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  599. 2, "%", max_inodes_util, RRDF_FIELD_SORT_DESCENDING, NULL,
  600. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  601. RRDF_FIELD_OPTS_NONE,
  602. NULL);
  603. buffer_rrdf_table_add_field(wb, field_id++, "iAvail", "Inodes Avail",
  604. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  605. 2, "inodes", max_inodes_avail, RRDF_FIELD_SORT_DESCENDING, NULL,
  606. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  607. RRDF_FIELD_OPTS_NONE,
  608. NULL);
  609. buffer_rrdf_table_add_field(wb, field_id++, "iUsed", "Inodes Used",
  610. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  611. 2, "inodes", max_inodes_used, RRDF_FIELD_SORT_DESCENDING, NULL,
  612. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  613. RRDF_FIELD_OPTS_NONE,
  614. NULL);
  615. buffer_rrdf_table_add_field(wb, field_id++, "iReserved", "Inodes Reserved for root",
  616. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  617. 2, "inodes", max_inodes_reserved, RRDF_FIELD_SORT_DESCENDING, NULL,
  618. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  619. RRDF_FIELD_OPTS_NONE,
  620. NULL);
  621. }
  622. buffer_json_object_close(wb); // columns
  623. buffer_json_member_add_string(wb, "default_sort_column", "Used%");
  624. buffer_json_member_add_object(wb, "charts");
  625. {
  626. buffer_json_member_add_object(wb, "Utilization");
  627. {
  628. buffer_json_member_add_string(wb, "name", "Utilization");
  629. buffer_json_member_add_string(wb, "type", "stacked-bar");
  630. buffer_json_member_add_array(wb, "columns");
  631. {
  632. buffer_json_add_array_item_string(wb, "Used%");
  633. }
  634. buffer_json_array_close(wb);
  635. }
  636. buffer_json_object_close(wb);
  637. buffer_json_member_add_object(wb, "Usage");
  638. {
  639. buffer_json_member_add_string(wb, "name", "Usage");
  640. buffer_json_member_add_string(wb, "type", "stacked-bar");
  641. buffer_json_member_add_array(wb, "columns");
  642. {
  643. buffer_json_add_array_item_string(wb, "Avail");
  644. buffer_json_add_array_item_string(wb, "Used");
  645. buffer_json_add_array_item_string(wb, "Reserved");
  646. }
  647. buffer_json_array_close(wb);
  648. }
  649. buffer_json_object_close(wb);
  650. buffer_json_member_add_object(wb, "Inodes");
  651. {
  652. buffer_json_member_add_string(wb, "name", "Inodes");
  653. buffer_json_member_add_string(wb, "type", "stacked-bar");
  654. buffer_json_member_add_array(wb, "columns");
  655. {
  656. buffer_json_add_array_item_string(wb, "iAvail");
  657. buffer_json_add_array_item_string(wb, "iUsed");
  658. buffer_json_add_array_item_string(wb, "iReserved");
  659. }
  660. buffer_json_array_close(wb);
  661. }
  662. buffer_json_object_close(wb);
  663. }
  664. buffer_json_object_close(wb); // charts
  665. buffer_json_member_add_array(wb, "default_charts");
  666. {
  667. buffer_json_add_array_item_array(wb);
  668. buffer_json_add_array_item_string(wb, "Utilization");
  669. buffer_json_add_array_item_string(wb, "Mountpoint");
  670. buffer_json_array_close(wb);
  671. buffer_json_add_array_item_array(wb);
  672. buffer_json_add_array_item_string(wb, "Usage");
  673. buffer_json_add_array_item_string(wb, "Mountpoint");
  674. buffer_json_array_close(wb);
  675. }
  676. buffer_json_array_close(wb);
  677. buffer_json_member_add_time_t(wb, "expires", now_realtime_sec() + 1);
  678. buffer_json_finalize(wb);
  679. int response = HTTP_RESP_OK;
  680. if(is_cancelled_cb && is_cancelled_cb(is_cancelled_cb_data)) {
  681. buffer_flush(wb);
  682. response = HTTP_RESP_CLIENT_CLOSED_REQUEST;
  683. }
  684. if(result_cb)
  685. result_cb(wb, response, result_cb_data);
  686. return response;
  687. }
  688. void *diskspace_main(void *ptr) {
  689. worker_register("DISKSPACE");
  690. worker_register_job_name(WORKER_JOB_MOUNTINFO, "mountinfo");
  691. worker_register_job_name(WORKER_JOB_MOUNTPOINT, "mountpoint");
  692. worker_register_job_name(WORKER_JOB_CLEANUP, "cleanup");
  693. rrd_collector_started();
  694. rrd_function_add(localhost, NULL, "mount-points", 10, RRDFUNCTIONS_DISKSPACE_HELP, true, diskspace_function_mount_points, NULL);
  695. netdata_thread_cleanup_push(diskspace_main_cleanup, ptr);
  696. cleanup_mount_points = config_get_boolean(CONFIG_SECTION_DISKSPACE, "remove charts of unmounted disks" , cleanup_mount_points);
  697. int update_every = (int)config_get_number(CONFIG_SECTION_DISKSPACE, "update every", localhost->rrd_update_every);
  698. if(update_every < localhost->rrd_update_every)
  699. update_every = localhost->rrd_update_every;
  700. check_for_new_mountpoints_every = (int)config_get_number(CONFIG_SECTION_DISKSPACE, "check for new mount points every", check_for_new_mountpoints_every);
  701. if(check_for_new_mountpoints_every < update_every)
  702. check_for_new_mountpoints_every = update_every;
  703. netdata_mutex_init(&slow_mountinfo_mutex);
  704. diskspace_slow_thread = mallocz(sizeof(netdata_thread_t));
  705. struct slow_worker_data slow_worker_data = {.slow_thread = diskspace_slow_thread, .update_every = update_every};
  706. netdata_thread_create(
  707. diskspace_slow_thread,
  708. "P[diskspace slow]",
  709. NETDATA_THREAD_OPTION_JOINABLE,
  710. diskspace_slow_worker,
  711. &slow_worker_data);
  712. usec_t step = update_every * USEC_PER_SEC;
  713. heartbeat_t hb;
  714. heartbeat_init(&hb);
  715. while(service_running(SERVICE_COLLECTORS)) {
  716. worker_is_idle();
  717. /* usec_t hb_dt = */ heartbeat_next(&hb, step);
  718. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  719. // --------------------------------------------------------------------------
  720. // this is smart enough not to reload it every time
  721. worker_is_busy(WORKER_JOB_MOUNTINFO);
  722. mountinfo_reload(0);
  723. // --------------------------------------------------------------------------
  724. // disk space metrics
  725. netdata_mutex_lock(&slow_mountinfo_mutex);
  726. free_basic_mountinfo_list(slow_mountinfo_tmp_root);
  727. slow_mountinfo_tmp_root = NULL;
  728. struct mountinfo *mi;
  729. for(mi = disk_mountinfo_root; mi; mi = mi->next) {
  730. if(unlikely(mi->flags & (MOUNTINFO_IS_DUMMY | MOUNTINFO_IS_BIND)))
  731. continue;
  732. // exclude mounts made by ProtectHome and ProtectSystem systemd hardening options
  733. // https://github.com/netdata/netdata/issues/11498#issuecomment-950982878
  734. if(mi->flags & MOUNTINFO_READONLY && mi->flags & MOUNTINFO_IS_IN_SYSD_PROTECTED_LIST && !strcmp(mi->root, mi->mount_point))
  735. continue;
  736. worker_is_busy(WORKER_JOB_MOUNTPOINT);
  737. do_disk_space_stats(mi, update_every);
  738. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  739. }
  740. netdata_mutex_unlock(&slow_mountinfo_mutex);
  741. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  742. if(dict_mountpoints) {
  743. worker_is_busy(WORKER_JOB_CLEANUP);
  744. dictionary_walkthrough_read(dict_mountpoints, mount_point_cleanup_cb, NULL);
  745. }
  746. }
  747. worker_unregister();
  748. netdata_thread_cleanup_pop(1);
  749. return NULL;
  750. }