plugin_diskspace.c 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "../proc.plugin/plugin_proc.h"
  /* Plugin name handed to rrdset_create_localhost() for every chart created here. */
  #define PLUGIN_DISKSPACE_NAME "diskspace.plugin"

  /* Configuration section that holds the options of this collector. */
  #define CONFIG_SECTION_DISKSPACE "plugin:proc:diskspace"

  /* Default value of the "exclude space metrics on paths" option. */
  #define DEFAULT_EXCLUDED_PATHS "/proc/* /sys/* /var/run/user/* /run/user/* /snap/* /var/lib/docker/*"

  /* Default value of the "exclude space metrics on filesystems" option. */
  #define DEFAULT_EXCLUDED_FILESYSTEMS "*gvfs *gluster* *s3fs *ipfs *davfs2 *httpfs *sshfs *gdfs *moosefs fusectl autofs"

  /* Default value of the "exclude inode metrics on filesystems" option. */
  #define DEFAULT_EXCLUDED_FILESYSTEMS_INODES "msdosfs msdos vfat overlayfs aufs* *unionfs"

  /* "help" text emitted by diskspace_function_mount_points(). */
  #define RRDFUNCTIONS_DISKSPACE_HELP "View mount point statistics"

  /* Multiplied by update_every to get the duration above which a stat()/statvfs()
   * call makes a mount point "slow". */
  #define MAX_STAT_USEC 10000LU

  /* Lower bound of the slow worker's update interval, and the multiple that
   * interval is rounded up to when it has to grow. */
  #define SLOW_UPDATE_EVERY 5
  11. static netdata_thread_t *diskspace_slow_thread = NULL;
  12. static struct mountinfo *disk_mountinfo_root = NULL;
  13. static int check_for_new_mountpoints_every = 15;
  14. static int cleanup_mount_points = 1;
  15. static inline void mountinfo_reload(int force) {
  16. static time_t last_loaded = 0;
  17. time_t now = now_realtime_sec();
  18. if(force || now - last_loaded >= check_for_new_mountpoints_every) {
  19. // mountinfo_free_all() can be called with NULL disk_mountinfo_root
  20. mountinfo_free_all(disk_mountinfo_root);
  21. // re-read mountinfo in case something changed
  22. disk_mountinfo_root = mountinfo_read(0);
  23. last_loaded = now;
  24. }
  25. }
  26. // Data to be stored in DICTIONARY dict_mountpoints used by do_disk_space_stats().
  27. // This DICTIONARY is used to lookup the settings of the mount point on each iteration.
  28. struct mount_point_metadata {
  29. int do_space;
  30. int do_inodes;
  31. bool shown_error;
  32. bool updated;
  33. bool slow;
  34. STRING *filesystem;
  35. STRING *mountroot;
  36. RRDLABELS *chart_labels;
  37. size_t collected; // the number of times this has been collected
  38. RRDSET *st_space;
  39. RRDDIM *rd_space_used;
  40. RRDDIM *rd_space_avail;
  41. RRDDIM *rd_space_reserved;
  42. RRDSET *st_inodes;
  43. RRDDIM *rd_inodes_used;
  44. RRDDIM *rd_inodes_avail;
  45. RRDDIM *rd_inodes_reserved;
  46. };
  47. static DICTIONARY *dict_mountpoints = NULL;
  /*
   * Mark the chart `st` as obsolete and set the caller's pointer to NULL.
   * Nothing happens when `st` is already NULL.
   *
   * `st` must be a modifiable lvalue, because it is assigned to.
   *
   * The body is wrapped in the conventional do { ... } while(0), so the macro
   * acts as a single statement and never re-evaluates its argument as a loop
   * condition.
   */
  #define rrdset_obsolete_and_pointer_null(st)                        \
      do {                                                            \
          if(st) {                                                    \
              rrdset_is_obsolete___safe_from_collector_thread(st);    \
              (st) = NULL;                                            \
          }                                                           \
      } while(0)
  49. static void mount_points_cleanup(bool slow) {
  50. struct mount_point_metadata *mp;
  51. dfe_start_write(dict_mountpoints, mp) {
  52. if(mp->slow != slow) continue;
  53. if(mp->updated)
  54. mp->updated = false;
  55. else if(cleanup_mount_points)
  56. dictionary_del(dict_mountpoints, mp_dfe.name);
  57. }
  58. dfe_done(mp);
  59. dictionary_garbage_collect(dict_mountpoints);
  60. }
  61. void mountpoint_delete_cb(const DICTIONARY_ITEM *item __maybe_unused, void *entry, void *data __maybe_unused) {
  62. struct mount_point_metadata *mp = (struct mount_point_metadata *)entry;
  63. mp->collected = 0;
  64. mp->updated = false;
  65. mp->shown_error = false;
  66. string_freez(mp->filesystem);
  67. mp->filesystem = NULL;
  68. string_freez(mp->mountroot);
  69. mp->mountroot = NULL;
  70. rrdset_obsolete_and_pointer_null(mp->st_space);
  71. rrdset_obsolete_and_pointer_null(mp->st_inodes);
  72. mp->rd_space_avail = NULL;
  73. mp->rd_space_used = NULL;
  74. mp->rd_space_reserved = NULL;
  75. mp->rd_inodes_avail = NULL;
  76. mp->rd_inodes_used = NULL;
  77. mp->rd_inodes_reserved = NULL;
  78. }
  79. // a copy of basic mountinfo fields
  80. struct basic_mountinfo {
  81. char *persistent_id;
  82. char *root;
  83. char *mount_point;
  84. char *filesystem;
  85. struct basic_mountinfo *next;
  86. };
  87. static struct basic_mountinfo *slow_mountinfo_tmp_root = NULL;
  88. static netdata_mutex_t slow_mountinfo_mutex;
  89. static struct basic_mountinfo *basic_mountinfo_create_and_copy(struct mountinfo* mi)
  90. {
  91. struct basic_mountinfo *bmi = callocz(1, sizeof(struct basic_mountinfo));
  92. if (mi) {
  93. bmi->persistent_id = strdupz(mi->persistent_id);
  94. bmi->root = strdupz(mi->root);
  95. bmi->mount_point = strdupz(mi->mount_point);
  96. bmi->filesystem = strdupz(mi->filesystem);
  97. }
  98. return bmi;
  99. }
  100. static void add_basic_mountinfo(struct basic_mountinfo **root, struct mountinfo *mi)
  101. {
  102. if (!root)
  103. return;
  104. struct basic_mountinfo *bmi = basic_mountinfo_create_and_copy(mi);
  105. bmi->next = *root;
  106. *root = bmi;
  107. }
  108. static void free_basic_mountinfo(struct basic_mountinfo *bmi)
  109. {
  110. if (bmi) {
  111. freez(bmi->persistent_id);
  112. freez(bmi->root);
  113. freez(bmi->mount_point);
  114. freez(bmi->filesystem);
  115. freez(bmi);
  116. }
  117. }
  118. static void free_basic_mountinfo_list(struct basic_mountinfo *root)
  119. {
  120. struct basic_mountinfo *bmi = root, *next;
  121. while (bmi) {
  122. next = bmi->next;
  123. free_basic_mountinfo(bmi);
  124. bmi = next;
  125. }
  126. }
  127. static void calculate_values_and_show_charts(
  128. struct basic_mountinfo *mi,
  129. struct mount_point_metadata *m,
  130. struct statvfs *buff_statvfs,
  131. int update_every)
  132. {
  133. const char *family = mi->mount_point;
  134. const char *disk = mi->persistent_id;
  135. // logic found at get_fs_usage() in coreutils
  136. unsigned long bsize = (buff_statvfs->f_frsize) ? buff_statvfs->f_frsize : buff_statvfs->f_bsize;
  137. fsblkcnt_t bavail = buff_statvfs->f_bavail;
  138. fsblkcnt_t btotal = buff_statvfs->f_blocks;
  139. fsblkcnt_t bavail_root = buff_statvfs->f_bfree;
  140. fsblkcnt_t breserved_root = bavail_root - bavail;
  141. fsblkcnt_t bused = likely(btotal >= bavail_root) ? btotal - bavail_root : bavail_root - btotal;
  142. #ifdef NETDATA_INTERNAL_CHECKS
  143. if(unlikely(btotal != bavail + breserved_root + bused))
  144. collector_error("DISKSPACE: disk block statistics for '%s' (disk '%s') do not sum up: total = %llu, available = %llu, reserved = %llu, used = %llu", mi->mount_point, disk, (unsigned long long)btotal, (unsigned long long)bavail, (unsigned long long)breserved_root, (unsigned long long)bused);
  145. #endif
  146. // --------------------------------------------------------------------------
  147. fsfilcnt_t favail = buff_statvfs->f_favail;
  148. fsfilcnt_t ftotal = buff_statvfs->f_files;
  149. fsfilcnt_t favail_root = buff_statvfs->f_ffree;
  150. fsfilcnt_t freserved_root = favail_root - favail;
  151. fsfilcnt_t fused = ftotal - favail_root;
  152. if(m->do_inodes == CONFIG_BOOLEAN_AUTO && favail == (fsfilcnt_t)-1) {
  153. // this file system does not support inodes reporting
  154. // eg. cephfs
  155. m->do_inodes = CONFIG_BOOLEAN_NO;
  156. }
  157. #ifdef NETDATA_INTERNAL_CHECKS
  158. if(unlikely(btotal != bavail + breserved_root + bused))
  159. collector_error("DISKSPACE: disk inode statistics for '%s' (disk '%s') do not sum up: total = %llu, available = %llu, reserved = %llu, used = %llu", mi->mount_point, disk, (unsigned long long)ftotal, (unsigned long long)favail, (unsigned long long)freserved_root, (unsigned long long)fused);
  160. #endif
  161. int rendered = 0;
  162. if(m->do_space == CONFIG_BOOLEAN_YES || (m->do_space == CONFIG_BOOLEAN_AUTO &&
  163. (bavail || breserved_root || bused ||
  164. netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  165. if(unlikely(!m->st_space) || m->st_space->update_every != update_every) {
  166. m->do_space = CONFIG_BOOLEAN_YES;
  167. m->st_space = rrdset_find_active_bytype_localhost("disk_space", disk);
  168. if(unlikely(!m->st_space || m->st_space->update_every != update_every)) {
  169. char title[4096 + 1];
  170. snprintfz(title, sizeof(title) - 1, "Disk Space Usage");
  171. m->st_space = rrdset_create_localhost(
  172. "disk_space"
  173. , disk
  174. , NULL
  175. , family
  176. , "disk.space"
  177. , title
  178. , "GiB"
  179. , PLUGIN_DISKSPACE_NAME
  180. , NULL
  181. , NETDATA_CHART_PRIO_DISKSPACE_SPACE
  182. , update_every
  183. , RRDSET_TYPE_STACKED
  184. );
  185. }
  186. rrdset_update_rrdlabels(m->st_space, m->chart_labels);
  187. m->rd_space_avail = rrddim_add(m->st_space, "avail", NULL, (collected_number)bsize, 1024 * 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  188. m->rd_space_used = rrddim_add(m->st_space, "used", NULL, (collected_number)bsize, 1024 * 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  189. m->rd_space_reserved = rrddim_add(m->st_space, "reserved_for_root", "reserved for root", (collected_number)bsize, 1024 * 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  190. }
  191. rrddim_set_by_pointer(m->st_space, m->rd_space_avail, (collected_number)bavail);
  192. rrddim_set_by_pointer(m->st_space, m->rd_space_used, (collected_number)bused);
  193. rrddim_set_by_pointer(m->st_space, m->rd_space_reserved, (collected_number)breserved_root);
  194. rrdset_done(m->st_space);
  195. rendered++;
  196. }
  197. if(m->do_inodes == CONFIG_BOOLEAN_YES || (m->do_inodes == CONFIG_BOOLEAN_AUTO &&
  198. (favail || freserved_root || fused ||
  199. netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))) {
  200. if(unlikely(!m->st_inodes) || m->st_inodes->update_every != update_every) {
  201. m->do_inodes = CONFIG_BOOLEAN_YES;
  202. m->st_inodes = rrdset_find_active_bytype_localhost("disk_inodes", disk);
  203. if(unlikely(!m->st_inodes) || m->st_inodes->update_every != update_every) {
  204. char title[4096 + 1];
  205. snprintfz(title, sizeof(title) - 1, "Disk Files (inodes) Usage");
  206. m->st_inodes = rrdset_create_localhost(
  207. "disk_inodes"
  208. , disk
  209. , NULL
  210. , family
  211. , "disk.inodes"
  212. , title
  213. , "inodes"
  214. , PLUGIN_DISKSPACE_NAME
  215. , NULL
  216. , NETDATA_CHART_PRIO_DISKSPACE_INODES
  217. , update_every
  218. , RRDSET_TYPE_STACKED
  219. );
  220. }
  221. rrdset_update_rrdlabels(m->st_inodes, m->chart_labels);
  222. m->rd_inodes_avail = rrddim_add(m->st_inodes, "avail", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  223. m->rd_inodes_used = rrddim_add(m->st_inodes, "used", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  224. m->rd_inodes_reserved = rrddim_add(m->st_inodes, "reserved_for_root", "reserved for root", 1, 1, RRD_ALGORITHM_ABSOLUTE);
  225. }
  226. rrddim_set_by_pointer(m->st_inodes, m->rd_inodes_avail, (collected_number)favail);
  227. rrddim_set_by_pointer(m->st_inodes, m->rd_inodes_used, (collected_number)fused);
  228. rrddim_set_by_pointer(m->st_inodes, m->rd_inodes_reserved, (collected_number)freserved_root);
  229. rrdset_done(m->st_inodes);
  230. rendered++;
  231. }
  232. if(likely(rendered))
  233. m->collected++;
  234. }
  235. static inline void do_disk_space_stats(struct mountinfo *mi, int update_every) {
  236. const char *disk = mi->persistent_id;
  237. static SIMPLE_PATTERN *excluded_mountpoints = NULL;
  238. static SIMPLE_PATTERN *excluded_filesystems = NULL;
  239. static SIMPLE_PATTERN *excluded_filesystems_inodes = NULL;
  240. usec_t slow_timeout = MAX_STAT_USEC * update_every;
  241. int do_space, do_inodes;
  242. if(unlikely(!dict_mountpoints)) {
  243. SIMPLE_PREFIX_MODE mode = SIMPLE_PATTERN_EXACT;
  244. if(config_move("plugin:proc:/proc/diskstats", "exclude space metrics on paths", CONFIG_SECTION_DISKSPACE, "exclude space metrics on paths") != -1) {
  245. // old configuration, enable backwards compatibility
  246. mode = SIMPLE_PATTERN_PREFIX;
  247. }
  248. excluded_mountpoints = simple_pattern_create(
  249. config_get(CONFIG_SECTION_DISKSPACE, "exclude space metrics on paths", DEFAULT_EXCLUDED_PATHS),
  250. NULL,
  251. mode,
  252. true);
  253. excluded_filesystems = simple_pattern_create(
  254. config_get(CONFIG_SECTION_DISKSPACE, "exclude space metrics on filesystems", DEFAULT_EXCLUDED_FILESYSTEMS),
  255. NULL,
  256. SIMPLE_PATTERN_EXACT,
  257. true);
  258. excluded_filesystems_inodes = simple_pattern_create(
  259. config_get(CONFIG_SECTION_DISKSPACE, "exclude inode metrics on filesystems", DEFAULT_EXCLUDED_FILESYSTEMS_INODES),
  260. NULL,
  261. SIMPLE_PATTERN_EXACT,
  262. true);
  263. dict_mountpoints = dictionary_create_advanced(DICT_OPTION_NONE, &dictionary_stats_category_collectors, 0);
  264. dictionary_register_delete_callback(dict_mountpoints, mountpoint_delete_cb, NULL);
  265. }
  266. const DICTIONARY_ITEM *item = dictionary_get_and_acquire_item(dict_mountpoints, mi->mount_point);
  267. if(unlikely(!item)) {
  268. bool slow = false;
  269. int def_space = config_get_boolean_ondemand(CONFIG_SECTION_DISKSPACE, "space usage for all disks", CONFIG_BOOLEAN_AUTO);
  270. int def_inodes = config_get_boolean_ondemand(CONFIG_SECTION_DISKSPACE, "inodes usage for all disks", CONFIG_BOOLEAN_AUTO);
  271. if(unlikely(simple_pattern_matches(excluded_mountpoints, mi->mount_point))) {
  272. def_space = CONFIG_BOOLEAN_NO;
  273. def_inodes = CONFIG_BOOLEAN_NO;
  274. }
  275. if(unlikely(simple_pattern_matches(excluded_filesystems, mi->filesystem))) {
  276. def_space = CONFIG_BOOLEAN_NO;
  277. def_inodes = CONFIG_BOOLEAN_NO;
  278. }
  279. if (unlikely(simple_pattern_matches(excluded_filesystems_inodes, mi->filesystem))) {
  280. def_inodes = CONFIG_BOOLEAN_NO;
  281. }
  282. // check if the mount point is a directory #2407
  283. // but only when it is enabled by default #4491
  284. if(def_space != CONFIG_BOOLEAN_NO || def_inodes != CONFIG_BOOLEAN_NO) {
  285. usec_t start_time = now_monotonic_high_precision_usec();
  286. struct stat bs;
  287. if(stat(mi->mount_point, &bs) == -1) {
  288. collector_error("DISKSPACE: Cannot stat() mount point '%s' (disk '%s', filesystem '%s', root '%s')."
  289. , mi->mount_point
  290. , disk
  291. , mi->filesystem?mi->filesystem:""
  292. , mi->root?mi->root:""
  293. );
  294. def_space = CONFIG_BOOLEAN_NO;
  295. def_inodes = CONFIG_BOOLEAN_NO;
  296. }
  297. else {
  298. if((bs.st_mode & S_IFMT) != S_IFDIR) {
  299. collector_error("DISKSPACE: Mount point '%s' (disk '%s', filesystem '%s', root '%s') is not a directory."
  300. , mi->mount_point
  301. , disk
  302. , mi->filesystem?mi->filesystem:""
  303. , mi->root?mi->root:""
  304. );
  305. def_space = CONFIG_BOOLEAN_NO;
  306. def_inodes = CONFIG_BOOLEAN_NO;
  307. }
  308. }
  309. if ((now_monotonic_high_precision_usec() - start_time) > slow_timeout)
  310. slow = true;
  311. }
  312. char var_name[4096 + 1];
  313. snprintfz(var_name, 4096, "plugin:proc:diskspace:%s", mi->mount_point);
  314. do_space = def_space;
  315. do_inodes = def_inodes;
  316. if (config_exists(var_name, "space usage"))
  317. do_space = config_get_boolean_ondemand(var_name, "space usage", def_space);
  318. if (config_exists(var_name, "inodes usage"))
  319. do_inodes = config_get_boolean_ondemand(var_name, "inodes usage", def_inodes);
  320. struct mount_point_metadata mp = {
  321. .do_space = do_space,
  322. .do_inodes = do_inodes,
  323. .shown_error = false,
  324. .updated = false,
  325. .slow = slow,
  326. .collected = 0,
  327. .filesystem = string_strdupz(mi->filesystem),
  328. .mountroot = string_strdupz(mi->root),
  329. .chart_labels = rrdlabels_create(),
  330. .st_space = NULL,
  331. .rd_space_avail = NULL,
  332. .rd_space_used = NULL,
  333. .rd_space_reserved = NULL,
  334. .st_inodes = NULL,
  335. .rd_inodes_avail = NULL,
  336. .rd_inodes_used = NULL,
  337. .rd_inodes_reserved = NULL
  338. };
  339. rrdlabels_add(mp.chart_labels, "mount_point", mi->mount_point, RRDLABEL_SRC_AUTO);
  340. rrdlabels_add(mp.chart_labels, "filesystem", mi->filesystem, RRDLABEL_SRC_AUTO);
  341. rrdlabels_add(mp.chart_labels, "mount_root", mi->root, RRDLABEL_SRC_AUTO);
  342. item = dictionary_set_and_acquire_item(dict_mountpoints, mi->mount_point, &mp, sizeof(struct mount_point_metadata));
  343. }
  344. struct mount_point_metadata *m = dictionary_acquired_item_value(item);
  345. if (m->slow) {
  346. add_basic_mountinfo(&slow_mountinfo_tmp_root, mi);
  347. goto cleanup;
  348. }
  349. m->updated = true;
  350. if(unlikely(m->do_space == CONFIG_BOOLEAN_NO && m->do_inodes == CONFIG_BOOLEAN_NO)) {
  351. goto cleanup;
  352. }
  353. if (unlikely(
  354. mi->flags & MOUNTINFO_READONLY &&
  355. !(mi->flags & MOUNTINFO_IS_IN_SYSD_PROTECTED_LIST) &&
  356. !m->collected &&
  357. m->do_space != CONFIG_BOOLEAN_YES &&
  358. m->do_inodes != CONFIG_BOOLEAN_YES)) {
  359. goto cleanup;
  360. }
  361. usec_t start_time = now_monotonic_high_precision_usec();
  362. struct statvfs buff_statvfs;
  363. if (statvfs(mi->mount_point, &buff_statvfs) < 0) {
  364. if(!m->shown_error) {
  365. collector_error("DISKSPACE: failed to statvfs() mount point '%s' (disk '%s', filesystem '%s', root '%s')"
  366. , mi->mount_point
  367. , disk
  368. , mi->filesystem?mi->filesystem:""
  369. , mi->root?mi->root:""
  370. );
  371. m->shown_error = true;
  372. }
  373. goto cleanup;
  374. }
  375. if ((now_monotonic_high_precision_usec() - start_time) > slow_timeout)
  376. m->slow = true;
  377. m->shown_error = false;
  378. struct basic_mountinfo bmi;
  379. bmi.mount_point = mi->mount_point;
  380. bmi.persistent_id = mi->persistent_id;
  381. bmi.filesystem = mi->filesystem;
  382. bmi.root = mi->root;
  383. calculate_values_and_show_charts(&bmi, m, &buff_statvfs, update_every);
  384. cleanup:
  385. dictionary_acquired_item_release(dict_mountpoints, item);
  386. }
  387. static inline void do_slow_disk_space_stats(struct basic_mountinfo *mi, int update_every) {
  388. const DICTIONARY_ITEM *item = dictionary_get_and_acquire_item(dict_mountpoints, mi->mount_point);
  389. if(!item) return;
  390. struct mount_point_metadata *m = dictionary_acquired_item_value(item);
  391. m->updated = true;
  392. struct statvfs buff_statvfs;
  393. if (statvfs(mi->mount_point, &buff_statvfs) < 0) {
  394. if(!m->shown_error) {
  395. collector_error("DISKSPACE: failed to statvfs() mount point '%s' (disk '%s', filesystem '%s', root '%s')"
  396. , mi->mount_point
  397. , mi->persistent_id
  398. , mi->filesystem?mi->filesystem:""
  399. , mi->root?mi->root:""
  400. );
  401. m->shown_error = true;
  402. }
  403. goto cleanup;
  404. }
  405. m->shown_error = false;
  406. calculate_values_and_show_charts(mi, m, &buff_statvfs, update_every);
  407. cleanup:
  408. dictionary_acquired_item_release(dict_mountpoints, item);
  409. }
  /*
   * Cleanup handler installed by diskspace_slow_worker(): logs a message and
   * unregisters the worker. The argument is not used.
   */
  static void diskspace_slow_worker_cleanup(void *ptr)
  {
      UNUSED(ptr);

      collector_info("cleaning up...");

      worker_unregister();
  }
  416. #define WORKER_JOB_SLOW_MOUNTPOINT 0
  417. #define WORKER_JOB_SLOW_CLEANUP 1
  418. struct slow_worker_data {
  419. netdata_thread_t *slow_thread;
  420. int update_every;
  421. };
  422. void *diskspace_slow_worker(void *ptr)
  423. {
  424. struct slow_worker_data *data = (struct slow_worker_data *)ptr;
  425. worker_register("DISKSPACE_SLOW");
  426. worker_register_job_name(WORKER_JOB_SLOW_MOUNTPOINT, "mountpoint");
  427. worker_register_job_name(WORKER_JOB_SLOW_CLEANUP, "cleanup");
  428. struct basic_mountinfo *slow_mountinfo_root = NULL;
  429. int slow_update_every = data->update_every > SLOW_UPDATE_EVERY ? data->update_every : SLOW_UPDATE_EVERY;
  430. netdata_thread_cleanup_push(diskspace_slow_worker_cleanup, data->slow_thread);
  431. usec_t step = slow_update_every * USEC_PER_SEC;
  432. usec_t real_step = USEC_PER_SEC;
  433. heartbeat_t hb;
  434. heartbeat_init(&hb);
  435. while(service_running(SERVICE_COLLECTORS)) {
  436. worker_is_idle();
  437. heartbeat_next(&hb, USEC_PER_SEC);
  438. if (real_step < step) {
  439. real_step += USEC_PER_SEC;
  440. continue;
  441. }
  442. real_step = USEC_PER_SEC;
  443. usec_t start_time = now_monotonic_high_precision_usec();
  444. if (!dict_mountpoints)
  445. continue;
  446. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  447. // --------------------------------------------------------------------------
  448. // disk space metrics
  449. worker_is_busy(WORKER_JOB_SLOW_MOUNTPOINT);
  450. netdata_mutex_lock(&slow_mountinfo_mutex);
  451. free_basic_mountinfo_list(slow_mountinfo_root);
  452. slow_mountinfo_root = slow_mountinfo_tmp_root;
  453. slow_mountinfo_tmp_root = NULL;
  454. netdata_mutex_unlock(&slow_mountinfo_mutex);
  455. struct basic_mountinfo *bmi;
  456. for(bmi = slow_mountinfo_root; bmi; bmi = bmi->next) {
  457. do_slow_disk_space_stats(bmi, slow_update_every);
  458. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  459. }
  460. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  461. if(dict_mountpoints) {
  462. worker_is_busy(WORKER_JOB_SLOW_CLEANUP);
  463. mount_points_cleanup(true);
  464. }
  465. usec_t dt = now_monotonic_high_precision_usec() - start_time;
  466. if (dt > step) {
  467. slow_update_every = (dt / USEC_PER_SEC) * 3 / 2;
  468. if (slow_update_every % SLOW_UPDATE_EVERY)
  469. slow_update_every += SLOW_UPDATE_EVERY - slow_update_every % SLOW_UPDATE_EVERY;
  470. step = slow_update_every * USEC_PER_SEC;
  471. }
  472. }
  473. netdata_thread_cleanup_pop(1);
  474. free_basic_mountinfo_list(slow_mountinfo_root);
  475. return NULL;
  476. }
  477. static void diskspace_main_cleanup(void *ptr) {
  478. rrd_collector_finished();
  479. worker_unregister();
  480. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
  481. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  482. collector_info("cleaning up...");
  483. if (diskspace_slow_thread) {
  484. netdata_thread_join(*diskspace_slow_thread, NULL);
  485. freez(diskspace_slow_thread);
  486. }
  487. free_basic_mountinfo_list(slow_mountinfo_tmp_root);
  488. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  489. }
  490. #define WORKER_JOB_MOUNTINFO 0
  491. #define WORKER_JOB_MOUNTPOINT 1
  492. #define WORKER_JOB_CLEANUP 2
  493. #if WORKER_UTILIZATION_MAX_JOB_TYPES < 3
  494. #error WORKER_UTILIZATION_MAX_JOB_TYPES has to be at least 3
  495. #endif
  496. int diskspace_function_mount_points(BUFFER *wb, const char *function __maybe_unused) {
  497. netdata_mutex_lock(&slow_mountinfo_mutex);
  498. buffer_flush(wb);
  499. wb->content_type = CT_APPLICATION_JSON;
  500. buffer_json_initialize(wb, "\"", "\"", 0, true, BUFFER_JSON_OPTIONS_DEFAULT);
  501. buffer_json_member_add_string(wb, "hostname", rrdhost_hostname(localhost));
  502. buffer_json_member_add_uint64(wb, "status", HTTP_RESP_OK);
  503. buffer_json_member_add_string(wb, "type", "table");
  504. buffer_json_member_add_time_t(wb, "update_every", 1);
  505. buffer_json_member_add_string(wb, "help", RRDFUNCTIONS_DISKSPACE_HELP);
  506. buffer_json_member_add_array(wb, "data");
  507. double max_space_util = 0.0;
  508. double max_space_avail = 0.0;
  509. double max_space_used = 0.0;
  510. double max_space_reserved = 0.0;
  511. double max_inodes_util = 0.0;
  512. double max_inodes_avail = 0.0;
  513. double max_inodes_used = 0.0;
  514. double max_inodes_reserved = 0.0;
  515. struct mount_point_metadata *mp;
  516. dfe_start_read(dict_mountpoints, mp) {
  517. if (!mp->collected)
  518. continue;
  519. buffer_json_add_array_item_array(wb);
  520. buffer_json_add_array_item_string(wb, mp_dfe.name);
  521. buffer_json_add_array_item_string(wb, string2str(mp->filesystem));
  522. buffer_json_add_array_item_string(wb, string2str(mp->mountroot));
  523. double space_avail = rrddim_get_last_stored_value(mp->rd_space_avail, &max_space_avail, 1.0);
  524. double space_used = rrddim_get_last_stored_value(mp->rd_space_used, &max_space_used, 1.0);
  525. double space_reserved = rrddim_get_last_stored_value(mp->rd_space_reserved, &max_space_reserved, 1.0);
  526. double inodes_avail = rrddim_get_last_stored_value(mp->rd_inodes_avail, &max_inodes_avail, 1.0);
  527. double inodes_used = rrddim_get_last_stored_value(mp->rd_inodes_used, &max_inodes_used, 1.0);
  528. double inodes_reserved = rrddim_get_last_stored_value(mp->rd_inodes_reserved, &max_inodes_reserved, 1.0);
  529. double space_util = NAN;
  530. if (!isnan(space_avail) && !isnan(space_used)) {
  531. space_util = space_avail + space_used > 0 ? space_used * 100.0 / (space_avail + space_used) : 0;
  532. max_space_util = MAX(max_space_util, space_util);
  533. }
  534. double inodes_util = NAN;
  535. if (!isnan(inodes_avail) && !isnan(inodes_used)) {
  536. inodes_util = inodes_avail + inodes_used > 0 ? inodes_used * 100.0 / (inodes_avail + inodes_used) : 0;
  537. max_inodes_util = MAX(max_inodes_util, inodes_util);
  538. }
  539. buffer_json_add_array_item_double(wb, space_util);
  540. buffer_json_add_array_item_double(wb, space_avail);
  541. buffer_json_add_array_item_double(wb, space_used);
  542. buffer_json_add_array_item_double(wb, space_reserved);
  543. buffer_json_add_array_item_double(wb, inodes_util);
  544. buffer_json_add_array_item_double(wb, inodes_avail);
  545. buffer_json_add_array_item_double(wb, inodes_used);
  546. buffer_json_add_array_item_double(wb, inodes_reserved);
  547. buffer_json_array_close(wb);
  548. }
  549. dfe_done(mp);
  550. buffer_json_array_close(wb); // data
  551. buffer_json_member_add_object(wb, "columns");
  552. {
  553. size_t field_id = 0;
  554. buffer_rrdf_table_add_field(wb, field_id++, "Mountpoint", "Mountpoint Name",
  555. RRDF_FIELD_TYPE_STRING, RRDF_FIELD_VISUAL_VALUE, RRDF_FIELD_TRANSFORM_NONE,
  556. 0, NULL, NAN, RRDF_FIELD_SORT_ASCENDING, NULL,
  557. RRDF_FIELD_SUMMARY_COUNT, RRDF_FIELD_FILTER_MULTISELECT,
  558. RRDF_FIELD_OPTS_VISIBLE | RRDF_FIELD_OPTS_UNIQUE_KEY | RRDF_FIELD_OPTS_STICKY | RRDF_FIELD_OPTS_FULL_WIDTH,
  559. NULL);
  560. buffer_rrdf_table_add_field(wb, field_id++, "Filesystem", "Mountpoint Filesystem",
  561. RRDF_FIELD_TYPE_STRING, RRDF_FIELD_VISUAL_VALUE, RRDF_FIELD_TRANSFORM_NONE,
  562. 0, NULL, NAN, RRDF_FIELD_SORT_ASCENDING, NULL,
  563. RRDF_FIELD_SUMMARY_COUNT, RRDF_FIELD_FILTER_MULTISELECT,
  564. RRDF_FIELD_OPTS_VISIBLE | RRDF_FIELD_OPTS_UNIQUE_KEY,
  565. NULL);
  566. buffer_rrdf_table_add_field(wb, field_id++, "Root", "Mountpoint Root",
  567. RRDF_FIELD_TYPE_STRING, RRDF_FIELD_VISUAL_VALUE, RRDF_FIELD_TRANSFORM_NONE,
  568. 0, NULL, NAN, RRDF_FIELD_SORT_ASCENDING, NULL,
  569. RRDF_FIELD_SUMMARY_COUNT, RRDF_FIELD_FILTER_MULTISELECT,
  570. RRDF_FIELD_OPTS_UNIQUE_KEY,
  571. NULL);
  572. buffer_rrdf_table_add_field(wb, field_id++, "Used%", "Space Utilization",
  573. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  574. 2, "%", max_space_util, RRDF_FIELD_SORT_DESCENDING, NULL,
  575. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  576. RRDF_FIELD_OPTS_VISIBLE,
  577. NULL);
  578. buffer_rrdf_table_add_field(wb, field_id++, "Avail", "Space Avail",
  579. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  580. 2, "GiB", max_space_avail, RRDF_FIELD_SORT_DESCENDING, NULL,
  581. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  582. RRDF_FIELD_OPTS_VISIBLE,
  583. NULL);
  584. buffer_rrdf_table_add_field(wb, field_id++, "Used", "Space Used",
  585. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  586. 2, "GiB", max_space_used, RRDF_FIELD_SORT_DESCENDING, NULL,
  587. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  588. RRDF_FIELD_OPTS_VISIBLE,
  589. NULL);
  590. buffer_rrdf_table_add_field(wb, field_id++, "Reserved", "Space Reserved for root",
  591. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  592. 2, "GiB", max_space_reserved, RRDF_FIELD_SORT_DESCENDING, NULL,
  593. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  594. RRDF_FIELD_OPTS_VISIBLE,
  595. NULL);
  596. buffer_rrdf_table_add_field(wb, field_id++, "iUsed%", "Inodes Utilization",
  597. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  598. 2, "%", max_inodes_util, RRDF_FIELD_SORT_DESCENDING, NULL,
  599. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  600. RRDF_FIELD_OPTS_NONE,
  601. NULL);
  602. buffer_rrdf_table_add_field(wb, field_id++, "iAvail", "Inodes Avail",
  603. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  604. 2, "inodes", max_inodes_avail, RRDF_FIELD_SORT_DESCENDING, NULL,
  605. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  606. RRDF_FIELD_OPTS_NONE,
  607. NULL);
  608. buffer_rrdf_table_add_field(wb, field_id++, "iUsed", "Inodes Used",
  609. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  610. 2, "inodes", max_inodes_used, RRDF_FIELD_SORT_DESCENDING, NULL,
  611. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  612. RRDF_FIELD_OPTS_NONE,
  613. NULL);
  614. buffer_rrdf_table_add_field(wb, field_id++, "iReserved", "Inodes Reserved for root",
  615. RRDF_FIELD_TYPE_BAR_WITH_INTEGER, RRDF_FIELD_VISUAL_BAR, RRDF_FIELD_TRANSFORM_NUMBER,
  616. 2, "inodes", max_inodes_reserved, RRDF_FIELD_SORT_DESCENDING, NULL,
  617. RRDF_FIELD_SUMMARY_SUM, RRDF_FIELD_FILTER_NONE,
  618. RRDF_FIELD_OPTS_NONE,
  619. NULL);
  620. }
  621. buffer_json_object_close(wb); // columns
  622. buffer_json_member_add_string(wb, "default_sort_column", "Used%");
  623. buffer_json_member_add_object(wb, "charts");
  624. {
  625. buffer_json_member_add_object(wb, "Utilization");
  626. {
  627. buffer_json_member_add_string(wb, "name", "Utilization");
  628. buffer_json_member_add_string(wb, "type", "stacked-bar");
  629. buffer_json_member_add_array(wb, "columns");
  630. {
  631. buffer_json_add_array_item_string(wb, "Used%");
  632. }
  633. buffer_json_array_close(wb);
  634. }
  635. buffer_json_object_close(wb);
  636. buffer_json_member_add_object(wb, "Usage");
  637. {
  638. buffer_json_member_add_string(wb, "name", "Usage");
  639. buffer_json_member_add_string(wb, "type", "stacked-bar");
  640. buffer_json_member_add_array(wb, "columns");
  641. {
  642. buffer_json_add_array_item_string(wb, "Avail");
  643. buffer_json_add_array_item_string(wb, "Used");
  644. buffer_json_add_array_item_string(wb, "Reserved");
  645. }
  646. buffer_json_array_close(wb);
  647. }
  648. buffer_json_object_close(wb);
  649. buffer_json_member_add_object(wb, "Inodes");
  650. {
  651. buffer_json_member_add_string(wb, "name", "Inodes");
  652. buffer_json_member_add_string(wb, "type", "stacked-bar");
  653. buffer_json_member_add_array(wb, "columns");
  654. {
  655. buffer_json_add_array_item_string(wb, "iAvail");
  656. buffer_json_add_array_item_string(wb, "iUsed");
  657. buffer_json_add_array_item_string(wb, "iReserved");
  658. }
  659. buffer_json_array_close(wb);
  660. }
  661. buffer_json_object_close(wb);
  662. }
  663. buffer_json_object_close(wb); // charts
  664. buffer_json_member_add_array(wb, "default_charts");
  665. {
  666. buffer_json_add_array_item_array(wb);
  667. buffer_json_add_array_item_string(wb, "Utilization");
  668. buffer_json_add_array_item_string(wb, "Mountpoint");
  669. buffer_json_array_close(wb);
  670. buffer_json_add_array_item_array(wb);
  671. buffer_json_add_array_item_string(wb, "Usage");
  672. buffer_json_add_array_item_string(wb, "Mountpoint");
  673. buffer_json_array_close(wb);
  674. }
  675. buffer_json_array_close(wb);
  676. buffer_json_member_add_time_t(wb, "expires", now_realtime_sec() + 1);
  677. buffer_json_finalize(wb);
  678. netdata_mutex_unlock(&slow_mountinfo_mutex);
  679. return HTTP_RESP_OK;
  680. }
  681. void *diskspace_main(void *ptr) {
  682. worker_register("DISKSPACE");
  683. worker_register_job_name(WORKER_JOB_MOUNTINFO, "mountinfo");
  684. worker_register_job_name(WORKER_JOB_MOUNTPOINT, "mountpoint");
  685. worker_register_job_name(WORKER_JOB_CLEANUP, "cleanup");
  686. rrd_function_add_inline(localhost, NULL, "mount-points", 10,
  687. RRDFUNCTIONS_PRIORITY_DEFAULT, RRDFUNCTIONS_DISKSPACE_HELP,
  688. "top", HTTP_ACCESS_ANY, diskspace_function_mount_points);
  689. netdata_thread_cleanup_push(diskspace_main_cleanup, ptr);
  690. cleanup_mount_points = config_get_boolean(CONFIG_SECTION_DISKSPACE, "remove charts of unmounted disks" , cleanup_mount_points);
  691. int update_every = (int)config_get_number(CONFIG_SECTION_DISKSPACE, "update every", localhost->rrd_update_every);
  692. if(update_every < localhost->rrd_update_every)
  693. update_every = localhost->rrd_update_every;
  694. check_for_new_mountpoints_every = (int)config_get_number(CONFIG_SECTION_DISKSPACE, "check for new mount points every", check_for_new_mountpoints_every);
  695. if(check_for_new_mountpoints_every < update_every)
  696. check_for_new_mountpoints_every = update_every;
  697. netdata_mutex_init(&slow_mountinfo_mutex);
  698. diskspace_slow_thread = mallocz(sizeof(netdata_thread_t));
  699. struct slow_worker_data slow_worker_data = {.slow_thread = diskspace_slow_thread, .update_every = update_every};
  700. netdata_thread_create(
  701. diskspace_slow_thread,
  702. "P[diskspace slow]",
  703. NETDATA_THREAD_OPTION_JOINABLE,
  704. diskspace_slow_worker,
  705. &slow_worker_data);
  706. usec_t step = update_every * USEC_PER_SEC;
  707. heartbeat_t hb;
  708. heartbeat_init(&hb);
  709. while(service_running(SERVICE_COLLECTORS)) {
  710. worker_is_idle();
  711. /* usec_t hb_dt = */ heartbeat_next(&hb, step);
  712. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  713. // --------------------------------------------------------------------------
  714. // this is smart enough not to reload it every time
  715. worker_is_busy(WORKER_JOB_MOUNTINFO);
  716. mountinfo_reload(0);
  717. // --------------------------------------------------------------------------
  718. // disk space metrics
  719. netdata_mutex_lock(&slow_mountinfo_mutex);
  720. free_basic_mountinfo_list(slow_mountinfo_tmp_root);
  721. slow_mountinfo_tmp_root = NULL;
  722. struct mountinfo *mi;
  723. for(mi = disk_mountinfo_root; mi; mi = mi->next) {
  724. if(unlikely(mi->flags & (MOUNTINFO_IS_DUMMY | MOUNTINFO_IS_BIND)))
  725. continue;
  726. // exclude mounts made by ProtectHome and ProtectSystem systemd hardening options
  727. // https://github.com/netdata/netdata/issues/11498#issuecomment-950982878
  728. if(mi->flags & MOUNTINFO_READONLY && mi->flags & MOUNTINFO_IS_IN_SYSD_PROTECTED_LIST && !strcmp(mi->root, mi->mount_point))
  729. continue;
  730. worker_is_busy(WORKER_JOB_MOUNTPOINT);
  731. do_disk_space_stats(mi, update_every);
  732. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  733. }
  734. netdata_mutex_unlock(&slow_mountinfo_mutex);
  735. if(unlikely(!service_running(SERVICE_COLLECTORS))) break;
  736. if(dict_mountpoints) {
  737. worker_is_busy(WORKER_JOB_CLEANUP);
  738. mount_points_cleanup(false);
  739. }
  740. }
  741. worker_unregister();
  742. netdata_thread_cleanup_pop(1);
  743. return NULL;
  744. }