// SPDX-License-Identifier: GPL-3.0-or-later
// sys_fs_cgroup.c
  2. #include "sys_fs_cgroup.h"
  3. #define PLUGIN_CGROUPS_NAME "cgroups.plugin"
  4. #define PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME "systemd"
  5. #define PLUGIN_CGROUPS_MODULE_CGROUPS_NAME "/sys/fs/cgroup"
  6. // ----------------------------------------------------------------------------
  7. // cgroup globals
  8. static long system_page_size = 4096; // system will be queried via sysconf() in configuration()
  9. static int cgroup_enable_cpuacct_stat = CONFIG_BOOLEAN_AUTO;
  10. static int cgroup_enable_cpuacct_usage = CONFIG_BOOLEAN_AUTO;
  11. static int cgroup_enable_memory = CONFIG_BOOLEAN_AUTO;
  12. static int cgroup_enable_detailed_memory = CONFIG_BOOLEAN_AUTO;
  13. static int cgroup_enable_memory_failcnt = CONFIG_BOOLEAN_AUTO;
  14. static int cgroup_enable_swap = CONFIG_BOOLEAN_AUTO;
  15. static int cgroup_enable_blkio_io = CONFIG_BOOLEAN_AUTO;
  16. static int cgroup_enable_blkio_ops = CONFIG_BOOLEAN_AUTO;
  17. static int cgroup_enable_blkio_throttle_io = CONFIG_BOOLEAN_AUTO;
  18. static int cgroup_enable_blkio_throttle_ops = CONFIG_BOOLEAN_AUTO;
  19. static int cgroup_enable_blkio_merged_ops = CONFIG_BOOLEAN_AUTO;
  20. static int cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_AUTO;
  21. static int cgroup_enable_pressure_cpu = CONFIG_BOOLEAN_AUTO;
  22. static int cgroup_enable_pressure_io_some = CONFIG_BOOLEAN_AUTO;
  23. static int cgroup_enable_pressure_io_full = CONFIG_BOOLEAN_AUTO;
  24. static int cgroup_enable_pressure_memory_some = CONFIG_BOOLEAN_AUTO;
  25. static int cgroup_enable_pressure_memory_full = CONFIG_BOOLEAN_AUTO;
  26. static int cgroup_enable_systemd_services = CONFIG_BOOLEAN_YES;
  27. static int cgroup_enable_systemd_services_detailed_memory = CONFIG_BOOLEAN_NO;
  28. static int cgroup_used_memory = CONFIG_BOOLEAN_YES;
  29. static int cgroup_use_unified_cgroups = CONFIG_BOOLEAN_NO;
  30. static int cgroup_unified_exist = CONFIG_BOOLEAN_AUTO;
  31. static int cgroup_search_in_devices = 1;
  32. static int cgroup_enable_new_cgroups_detected_at_runtime = 1;
  33. static int cgroup_check_for_new_every = 10;
  34. static int cgroup_update_every = 1;
  35. static int cgroup_containers_chart_priority = NETDATA_CHART_PRIO_CGROUPS_CONTAINERS;
  36. static int cgroup_recheck_zero_blkio_every_iterations = 10;
  37. static int cgroup_recheck_zero_mem_failcnt_every_iterations = 10;
  38. static int cgroup_recheck_zero_mem_detailed_every_iterations = 10;
  39. static char *cgroup_cpuacct_base = NULL;
  40. static char *cgroup_cpuset_base = NULL;
  41. static char *cgroup_blkio_base = NULL;
  42. static char *cgroup_memory_base = NULL;
  43. static char *cgroup_devices_base = NULL;
  44. static char *cgroup_unified_base = NULL;
  45. static int cgroup_root_count = 0;
  46. static int cgroup_root_max = 1000;
  47. static int cgroup_max_depth = 0;
  48. static SIMPLE_PATTERN *enabled_cgroup_patterns = NULL;
  49. static SIMPLE_PATTERN *enabled_cgroup_paths = NULL;
  50. static SIMPLE_PATTERN *enabled_cgroup_renames = NULL;
  51. static SIMPLE_PATTERN *systemd_services_cgroups = NULL;
  52. static char *cgroups_rename_script = NULL;
  53. static char *cgroups_network_interface_script = NULL;
  54. static int cgroups_check = 0;
  55. static uint32_t Read_hash = 0;
  56. static uint32_t Write_hash = 0;
  57. static uint32_t user_hash = 0;
  58. static uint32_t system_hash = 0;
  59. enum cgroups_type { CGROUPS_AUTODETECT_FAIL, CGROUPS_V1, CGROUPS_V2 };
  60. enum cgroups_systemd_setting {
  61. SYSTEMD_CGROUP_ERR,
  62. SYSTEMD_CGROUP_LEGACY,
  63. SYSTEMD_CGROUP_HYBRID,
  64. SYSTEMD_CGROUP_UNIFIED
  65. };
  66. struct cgroups_systemd_config_setting {
  67. char *name;
  68. enum cgroups_systemd_setting setting;
  69. };
  70. static struct cgroups_systemd_config_setting cgroups_systemd_options[] = {
  71. { .name = "legacy", .setting = SYSTEMD_CGROUP_LEGACY },
  72. { .name = "hybrid", .setting = SYSTEMD_CGROUP_HYBRID },
  73. { .name = "unified", .setting = SYSTEMD_CGROUP_UNIFIED },
  74. { .name = NULL, .setting = SYSTEMD_CGROUP_ERR },
  75. };
  76. /* on Fed systemd is not in PATH for some reason */
  77. #define SYSTEMD_CMD_RHEL "/usr/lib/systemd/systemd --version"
  78. #define SYSTEMD_HIERARCHY_STRING "default-hierarchy="
  79. #define MAXSIZE_PROC_CMDLINE 4096
  80. static enum cgroups_systemd_setting cgroups_detect_systemd(const char *exec)
  81. {
  82. pid_t command_pid;
  83. enum cgroups_systemd_setting retval = SYSTEMD_CGROUP_ERR;
  84. char buf[MAXSIZE_PROC_CMDLINE];
  85. char *begin, *end;
  86. FILE *f = mypopen(exec, &command_pid);
  87. if (!f)
  88. return retval;
  89. while (fgets(buf, MAXSIZE_PROC_CMDLINE, f) != NULL) {
  90. if ((begin = strstr(buf, SYSTEMD_HIERARCHY_STRING))) {
  91. end = begin = begin + strlen(SYSTEMD_HIERARCHY_STRING);
  92. if (!*begin)
  93. break;
  94. while (isalpha(*end))
  95. end++;
  96. *end = 0;
  97. for (int i = 0; cgroups_systemd_options[i].name; i++) {
  98. if (!strcmp(begin, cgroups_systemd_options[i].name)) {
  99. retval = cgroups_systemd_options[i].setting;
  100. break;
  101. }
  102. }
  103. break;
  104. }
  105. }
  106. if (mypclose(f, command_pid))
  107. return SYSTEMD_CGROUP_ERR;
  108. return retval;
  109. }
  110. static enum cgroups_type cgroups_try_detect_version()
  111. {
  112. pid_t command_pid;
  113. char buf[MAXSIZE_PROC_CMDLINE];
  114. enum cgroups_systemd_setting systemd_setting;
  115. int cgroups2_available = 0;
  116. // 1. check if cgroups2 available on system at all
  117. FILE *f = mypopen("grep cgroup /proc/filesystems", &command_pid);
  118. if (!f) {
  119. error("popen failed");
  120. return CGROUPS_AUTODETECT_FAIL;
  121. }
  122. while (fgets(buf, MAXSIZE_PROC_CMDLINE, f) != NULL) {
  123. if (strstr(buf, "cgroup2")) {
  124. cgroups2_available = 1;
  125. break;
  126. }
  127. }
  128. if(mypclose(f, command_pid))
  129. return CGROUPS_AUTODETECT_FAIL;
  130. if(!cgroups2_available)
  131. return CGROUPS_V1;
  132. // 2. check systemd compiletime setting
  133. if ((systemd_setting = cgroups_detect_systemd("systemd --version")) == SYSTEMD_CGROUP_ERR)
  134. systemd_setting = cgroups_detect_systemd(SYSTEMD_CMD_RHEL);
  135. if(systemd_setting == SYSTEMD_CGROUP_ERR)
  136. return CGROUPS_AUTODETECT_FAIL;
  137. if(systemd_setting == SYSTEMD_CGROUP_LEGACY || systemd_setting == SYSTEMD_CGROUP_HYBRID) {
  138. // currently we prefer V1 if HYBRID is set as it seems to be more feature complete
  139. // in the future we might want to continue here if SYSTEMD_CGROUP_HYBRID
  140. // and go ahead with V2
  141. return CGROUPS_V1;
  142. }
  143. // 3. if we are unified as on Fedora (default cgroups2 only mode)
  144. // check kernel command line flag that can override that setting
  145. f = fopen("/proc/cmdline", "r");
  146. if (!f) {
  147. error("Error reading kernel boot commandline parameters");
  148. return CGROUPS_AUTODETECT_FAIL;
  149. }
  150. if (!fgets(buf, MAXSIZE_PROC_CMDLINE, f)) {
  151. error("couldn't read all cmdline params into buffer");
  152. fclose(f);
  153. return CGROUPS_AUTODETECT_FAIL;
  154. }
  155. fclose(f);
  156. if (strstr(buf, "systemd.unified_cgroup_hierarchy=0")) {
  157. info("cgroups v2 (unified cgroups) is available but are disabled on this system.");
  158. return CGROUPS_V1;
  159. }
  160. return CGROUPS_V2;
  161. }
  162. void read_cgroup_plugin_configuration() {
  163. system_page_size = sysconf(_SC_PAGESIZE);
  164. Read_hash = simple_hash("Read");
  165. Write_hash = simple_hash("Write");
  166. user_hash = simple_hash("user");
  167. system_hash = simple_hash("system");
  168. cgroup_update_every = (int)config_get_number("plugin:cgroups", "update every", localhost->rrd_update_every);
  169. if(cgroup_update_every < localhost->rrd_update_every)
  170. cgroup_update_every = localhost->rrd_update_every;
  171. cgroup_check_for_new_every = (int)config_get_number("plugin:cgroups", "check for new cgroups every", (long long)cgroup_check_for_new_every * (long long)cgroup_update_every);
  172. if(cgroup_check_for_new_every < cgroup_update_every)
  173. cgroup_check_for_new_every = cgroup_update_every;
  174. cgroup_use_unified_cgroups = config_get_boolean_ondemand("plugin:cgroups", "use unified cgroups", CONFIG_BOOLEAN_AUTO);
  175. if(cgroup_use_unified_cgroups == CONFIG_BOOLEAN_AUTO)
  176. cgroup_use_unified_cgroups = (cgroups_try_detect_version() == CGROUPS_V2);
  177. info("use unified cgroups %s", cgroup_use_unified_cgroups ? "true" : "false");
  178. cgroup_containers_chart_priority = (int)config_get_number("plugin:cgroups", "containers priority", cgroup_containers_chart_priority);
  179. if(cgroup_containers_chart_priority < 1)
  180. cgroup_containers_chart_priority = NETDATA_CHART_PRIO_CGROUPS_CONTAINERS;
  181. cgroup_enable_cpuacct_stat = config_get_boolean_ondemand("plugin:cgroups", "enable cpuacct stat (total CPU)", cgroup_enable_cpuacct_stat);
  182. cgroup_enable_cpuacct_usage = config_get_boolean_ondemand("plugin:cgroups", "enable cpuacct usage (per core CPU)", cgroup_enable_cpuacct_usage);
  183. cgroup_enable_memory = config_get_boolean_ondemand("plugin:cgroups", "enable memory", cgroup_enable_memory);
  184. cgroup_enable_detailed_memory = config_get_boolean_ondemand("plugin:cgroups", "enable detailed memory", cgroup_enable_detailed_memory);
  185. cgroup_enable_memory_failcnt = config_get_boolean_ondemand("plugin:cgroups", "enable memory limits fail count", cgroup_enable_memory_failcnt);
  186. cgroup_enable_swap = config_get_boolean_ondemand("plugin:cgroups", "enable swap memory", cgroup_enable_swap);
  187. cgroup_enable_blkio_io = config_get_boolean_ondemand("plugin:cgroups", "enable blkio bandwidth", cgroup_enable_blkio_io);
  188. cgroup_enable_blkio_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio operations", cgroup_enable_blkio_ops);
  189. cgroup_enable_blkio_throttle_io = config_get_boolean_ondemand("plugin:cgroups", "enable blkio throttle bandwidth", cgroup_enable_blkio_throttle_io);
  190. cgroup_enable_blkio_throttle_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio throttle operations", cgroup_enable_blkio_throttle_ops);
  191. cgroup_enable_blkio_queued_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio queued operations", cgroup_enable_blkio_queued_ops);
  192. cgroup_enable_blkio_merged_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio merged operations", cgroup_enable_blkio_merged_ops);
  193. cgroup_enable_pressure_cpu = config_get_boolean_ondemand("plugin:cgroups", "enable cpu pressure", cgroup_enable_pressure_cpu);
  194. cgroup_enable_pressure_io_some = config_get_boolean_ondemand("plugin:cgroups", "enable io some pressure", cgroup_enable_pressure_io_some);
  195. cgroup_enable_pressure_io_full = config_get_boolean_ondemand("plugin:cgroups", "enable io full pressure", cgroup_enable_pressure_io_full);
  196. cgroup_enable_pressure_memory_some = config_get_boolean_ondemand("plugin:cgroups", "enable memory some pressure", cgroup_enable_pressure_memory_some);
  197. cgroup_enable_pressure_memory_full = config_get_boolean_ondemand("plugin:cgroups", "enable memory full pressure", cgroup_enable_pressure_memory_full);
  198. cgroup_recheck_zero_blkio_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero blkio every iterations", cgroup_recheck_zero_blkio_every_iterations);
  199. cgroup_recheck_zero_mem_failcnt_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero memory failcnt every iterations", cgroup_recheck_zero_mem_failcnt_every_iterations);
  200. cgroup_recheck_zero_mem_detailed_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero detailed memory every iterations", cgroup_recheck_zero_mem_detailed_every_iterations);
  201. cgroup_enable_systemd_services = config_get_boolean("plugin:cgroups", "enable systemd services", cgroup_enable_systemd_services);
  202. cgroup_enable_systemd_services_detailed_memory = config_get_boolean("plugin:cgroups", "enable systemd services detailed memory", cgroup_enable_systemd_services_detailed_memory);
  203. cgroup_used_memory = config_get_boolean("plugin:cgroups", "report used memory", cgroup_used_memory);
  204. char filename[FILENAME_MAX + 1], *s;
  205. struct mountinfo *mi, *root = mountinfo_read(0);
  206. if(!cgroup_use_unified_cgroups) {
  207. // cgroup v1 does not have pressure metrics
  208. cgroup_enable_pressure_cpu =
  209. cgroup_enable_pressure_io_some =
  210. cgroup_enable_pressure_io_full =
  211. cgroup_enable_pressure_memory_some =
  212. cgroup_enable_pressure_memory_full = CONFIG_BOOLEAN_NO;
  213. mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "cpuacct");
  214. if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "cpuacct");
  215. if(!mi) {
  216. error("CGROUP: cannot find cpuacct mountinfo. Assuming default: /sys/fs/cgroup/cpuacct");
  217. s = "/sys/fs/cgroup/cpuacct";
  218. }
  219. else s = mi->mount_point;
  220. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
  221. cgroup_cpuacct_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/cpuacct", filename);
  222. mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "cpuset");
  223. if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "cpuset");
  224. if(!mi) {
  225. error("CGROUP: cannot find cpuset mountinfo. Assuming default: /sys/fs/cgroup/cpuset");
  226. s = "/sys/fs/cgroup/cpuset";
  227. }
  228. else s = mi->mount_point;
  229. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
  230. cgroup_cpuset_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/cpuset", filename);
  231. mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "blkio");
  232. if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "blkio");
  233. if(!mi) {
  234. error("CGROUP: cannot find blkio mountinfo. Assuming default: /sys/fs/cgroup/blkio");
  235. s = "/sys/fs/cgroup/blkio";
  236. }
  237. else s = mi->mount_point;
  238. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
  239. cgroup_blkio_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/blkio", filename);
  240. mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "memory");
  241. if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "memory");
  242. if(!mi) {
  243. error("CGROUP: cannot find memory mountinfo. Assuming default: /sys/fs/cgroup/memory");
  244. s = "/sys/fs/cgroup/memory";
  245. }
  246. else s = mi->mount_point;
  247. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
  248. cgroup_memory_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/memory", filename);
  249. mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "devices");
  250. if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "devices");
  251. if(!mi) {
  252. error("CGROUP: cannot find devices mountinfo. Assuming default: /sys/fs/cgroup/devices");
  253. s = "/sys/fs/cgroup/devices";
  254. }
  255. else s = mi->mount_point;
  256. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
  257. cgroup_devices_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/devices", filename);
  258. }
  259. else {
  260. //cgroup_enable_cpuacct_stat =
  261. cgroup_enable_cpuacct_usage =
  262. //cgroup_enable_memory =
  263. //cgroup_enable_detailed_memory =
  264. cgroup_enable_memory_failcnt =
  265. //cgroup_enable_swap =
  266. //cgroup_enable_blkio_io =
  267. //cgroup_enable_blkio_ops =
  268. cgroup_enable_blkio_throttle_io =
  269. cgroup_enable_blkio_throttle_ops =
  270. cgroup_enable_blkio_merged_ops =
  271. cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_NO;
  272. cgroup_search_in_devices = 0;
  273. cgroup_enable_systemd_services_detailed_memory = CONFIG_BOOLEAN_NO;
  274. cgroup_used_memory = CONFIG_BOOLEAN_NO; //unified cgroups use different values
  275. //TODO: can there be more than 1 cgroup2 mount point?
  276. mi = mountinfo_find_by_filesystem_super_option(root, "cgroup2", "rw"); //there is no cgroup2 specific super option - for now use 'rw' option
  277. if(mi) debug(D_CGROUP, "found unified cgroup root using super options, with path: '%s'", mi->mount_point);
  278. if(!mi) {
  279. mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup2", "cgroup");
  280. if(mi) debug(D_CGROUP, "found unified cgroup root using mountsource info, with path: '%s'", mi->mount_point);
  281. }
  282. if(!mi) {
  283. error("CGROUP: cannot find cgroup2 mountinfo. Assuming default: /sys/fs/cgroup");
  284. s = "/sys/fs/cgroup";
  285. }
  286. else s = mi->mount_point;
  287. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
  288. cgroup_unified_base = config_get("plugin:cgroups", "path to unified cgroups", filename);
  289. debug(D_CGROUP, "using cgroup root: '%s'", cgroup_unified_base);
  290. }
  291. cgroup_root_max = (int)config_get_number("plugin:cgroups", "max cgroups to allow", cgroup_root_max);
  292. cgroup_max_depth = (int)config_get_number("plugin:cgroups", "max cgroups depth to monitor", cgroup_max_depth);
  293. cgroup_enable_new_cgroups_detected_at_runtime = config_get_boolean("plugin:cgroups", "enable new cgroups detected at run time", cgroup_enable_new_cgroups_detected_at_runtime);
  294. enabled_cgroup_patterns = simple_pattern_create(
  295. config_get("plugin:cgroups", "enable by default cgroups matching",
  296. // ----------------------------------------------------------------
  297. " !*/init.scope " // ignore init.scope
  298. " !/system.slice/run-*.scope " // ignore system.slice/run-XXXX.scope
  299. " *.scope " // we need all other *.scope for sure
  300. // ----------------------------------------------------------------
  301. " /machine.slice/*.service " // #3367 systemd-nspawn
  302. " /kubepods/pod*/* " // k8s containers
  303. " /kubepods/*/pod*/* " // k8s containers
  304. // ----------------------------------------------------------------
  305. " !/kubepods* " // all other k8s cgroups
  306. " !*/vcpu* " // libvirtd adds these sub-cgroups
  307. " !*/emulator " // libvirtd adds these sub-cgroups
  308. " !*.mount "
  309. " !*.partition "
  310. " !*.service "
  311. " !*.socket "
  312. " !*.slice "
  313. " !*.swap "
  314. " !*.user "
  315. " !/ "
  316. " !/docker "
  317. " !/libvirt "
  318. " !/lxc "
  319. " !/lxc/*/* " // #1397 #2649
  320. " !/lxc.monitor* "
  321. " !/lxc.pivot "
  322. " !/lxc.payload "
  323. " !/machine "
  324. " !/qemu "
  325. " !/system "
  326. " !/systemd "
  327. " !/user "
  328. " * " // enable anything else
  329. ), NULL, SIMPLE_PATTERN_EXACT);
  330. enabled_cgroup_paths = simple_pattern_create(
  331. config_get("plugin:cgroups", "search for cgroups in subpaths matching",
  332. " !*/init.scope " // ignore init.scope
  333. " !*-qemu " // #345
  334. " !*.libvirt-qemu " // #3010
  335. " !/init.scope "
  336. " !/system "
  337. " !/systemd "
  338. " !/user "
  339. " !/user.slice "
  340. " !/lxc/*/* " // #2161 #2649
  341. " !/lxc.monitor "
  342. " !/lxc.payload/*/* "
  343. " !/lxc.payload.* "
  344. " * "
  345. ), NULL, SIMPLE_PATTERN_EXACT);
  346. snprintfz(filename, FILENAME_MAX, "%s/cgroup-name.sh", netdata_configured_primary_plugins_dir);
  347. cgroups_rename_script = config_get("plugin:cgroups", "script to get cgroup names", filename);
  348. snprintfz(filename, FILENAME_MAX, "%s/cgroup-network", netdata_configured_primary_plugins_dir);
  349. cgroups_network_interface_script = config_get("plugin:cgroups", "script to get cgroup network interfaces", filename);
  350. enabled_cgroup_renames = simple_pattern_create(
  351. config_get("plugin:cgroups", "run script to rename cgroups matching",
  352. " !/ "
  353. " !*.mount "
  354. " !*.socket "
  355. " !*.partition "
  356. " /machine.slice/*.service " // #3367 systemd-nspawn
  357. " !*.service "
  358. " !*.slice "
  359. " !*.swap "
  360. " !*.user "
  361. " !init.scope "
  362. " !*.scope/vcpu* " // libvirtd adds these sub-cgroups
  363. " !*.scope/emulator " // libvirtd adds these sub-cgroups
  364. " *.scope "
  365. " *docker* "
  366. " *lxc* "
  367. " *qemu* "
  368. " *kubepods* " // #3396 kubernetes
  369. " *.libvirt-qemu " // #3010
  370. " * "
  371. ), NULL, SIMPLE_PATTERN_EXACT);
  372. if(cgroup_enable_systemd_services) {
  373. systemd_services_cgroups = simple_pattern_create(
  374. config_get("plugin:cgroups", "cgroups to match as systemd services",
  375. " !/system.slice/*/*.service "
  376. " /system.slice/*.service "
  377. ), NULL, SIMPLE_PATTERN_EXACT);
  378. }
  379. mountinfo_free_all(root);
  380. }
  381. // ----------------------------------------------------------------------------
  382. // cgroup objects
  // Read/Write totals collected from one block I/O statistics file of a cgroup.
  struct blkio {
      int updated;          // 1 when the last read parsed the file, 0 when it failed
      int enabled;          // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
      int delay_counter;    // while AUTO: reads still to be skipped before checking the file again

      char *filename;       // file to read; the readers do nothing when it is NULL

      // totals, summed over all the lines of the file
      unsigned long long Read;
      unsigned long long Write;

      // Sync, Async and Total are intentionally not collected
  };
  396. // https://www.kernel.org/doc/Documentation/cgroup-v1/memory.txt
  397. struct memory {
  398. ARL_BASE *arl_base;
  399. ARL_ENTRY *arl_dirty;
  400. ARL_ENTRY *arl_swap;
  401. int updated_detailed;
  402. int updated_usage_in_bytes;
  403. int updated_msw_usage_in_bytes;
  404. int updated_failcnt;
  405. int enabled_detailed; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
  406. int enabled_usage_in_bytes; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
  407. int enabled_msw_usage_in_bytes; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
  408. int enabled_failcnt; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
  409. int delay_counter_detailed;
  410. int delay_counter_failcnt;
  411. char *filename_detailed;
  412. char *filename_usage_in_bytes;
  413. char *filename_msw_usage_in_bytes;
  414. char *filename_failcnt;
  415. int detailed_has_dirty;
  416. int detailed_has_swap;
  417. // detailed metrics
  418. /*
  419. unsigned long long cache;
  420. unsigned long long rss;
  421. unsigned long long rss_huge;
  422. unsigned long long mapped_file;
  423. unsigned long long writeback;
  424. unsigned long long dirty;
  425. unsigned long long swap;
  426. unsigned long long pgpgin;
  427. unsigned long long pgpgout;
  428. unsigned long long pgfault;
  429. unsigned long long pgmajfault;
  430. unsigned long long inactive_anon;
  431. unsigned long long active_anon;
  432. unsigned long long inactive_file;
  433. unsigned long long active_file;
  434. unsigned long long unevictable;
  435. unsigned long long hierarchical_memory_limit;
  436. */
  437. //unified cgroups metrics
  438. unsigned long long anon;
  439. unsigned long long kernel_stack;
  440. unsigned long long slab;
  441. unsigned long long sock;
  442. unsigned long long shmem;
  443. unsigned long long anon_thp;
  444. //unsigned long long file_writeback;
  445. //unsigned long long file_dirty;
  446. //unsigned long long file;
  447. unsigned long long total_cache;
  448. unsigned long long total_rss;
  449. unsigned long long total_rss_huge;
  450. unsigned long long total_mapped_file;
  451. unsigned long long total_writeback;
  452. unsigned long long total_dirty;
  453. unsigned long long total_swap;
  454. unsigned long long total_pgpgin;
  455. unsigned long long total_pgpgout;
  456. unsigned long long total_pgfault;
  457. unsigned long long total_pgmajfault;
  458. /*
  459. unsigned long long total_inactive_anon;
  460. unsigned long long total_active_anon;
  461. */
  462. unsigned long long total_inactive_file;
  463. /*
  464. unsigned long long total_active_file;
  465. unsigned long long total_unevictable;
  466. */
  467. // single file metrics
  468. unsigned long long usage_in_bytes;
  469. unsigned long long msw_usage_in_bytes;
  470. unsigned long long failcnt;
  471. };
  472. // https://www.kernel.org/doc/Documentation/cgroup-v1/cpuacct.txt
  // User and system CPU counters of one cgroup.
  struct cpuacct_stat {
      int updated;      // 1 when the last read parsed the file, 0 when it failed
      int enabled;      // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

      char *filename;   // file to read; the readers do nothing when it is NULL

      // values as found in the file
      unsigned long long user;
      unsigned long long system;
  };
  480. // https://www.kernel.org/doc/Documentation/cgroup-v1/cpuacct.txt
  // Per-CPU usage counters of one cgroup.
  struct cpuacct_usage {
      int updated;      // 1 when the last read parsed the file, 0 when it failed
      int enabled;      // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

      char *filename;   // file to read; the reader does nothing when it is NULL

      unsigned int cpus;                // number of entries in cpu_percpu
      unsigned long long *cpu_percpu;   // one value per CPU; re-allocated when the count changes
  };
  // A network interface that belongs to a cgroup (node of a singly linked list).
  struct cgroup_network_interface {
      const char *host_device;                  // interface name as seen on the host (heap copy)
      const char *container_device;             // interface name as seen inside the cgroup (heap copy)

      struct cgroup_network_interface *next;    // next interface of the same cgroup, or NULL
  };
  493. #define CGROUP_OPTIONS_DISABLED_DUPLICATE 0x00000001
  494. #define CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE 0x00000002
  495. #define CGROUP_OPTIONS_IS_UNIFIED 0x00000004
  496. // *** WARNING *** The fields are not thread safe. Take care of safe usage.
  497. struct cgroup {
  498. uint32_t options;
  499. char available; // found in the filesystem
  500. char enabled; // enabled in the config
  501. char pending_renames;
  502. char *id;
  503. uint32_t hash;
  504. char *chart_id;
  505. uint32_t hash_chart;
  506. char *chart_title;
  507. struct label *chart_labels;
  508. struct cpuacct_stat cpuacct_stat;
  509. struct cpuacct_usage cpuacct_usage;
  510. struct memory memory;
  511. struct blkio io_service_bytes; // bytes
  512. struct blkio io_serviced; // operations
  513. struct blkio throttle_io_service_bytes; // bytes
  514. struct blkio throttle_io_serviced; // operations
  515. struct blkio io_merged; // operations
  516. struct blkio io_queued; // operations
  517. struct cgroup_network_interface *interfaces;
  518. struct pressure cpu_pressure;
  519. struct pressure io_pressure;
  520. struct pressure memory_pressure;
  521. // per cgroup charts
  522. RRDSET *st_cpu;
  523. RRDSET *st_cpu_limit;
  524. RRDSET *st_cpu_per_core;
  525. RRDSET *st_mem;
  526. RRDSET *st_mem_utilization;
  527. RRDSET *st_writeback;
  528. RRDSET *st_mem_activity;
  529. RRDSET *st_pgfaults;
  530. RRDSET *st_mem_usage;
  531. RRDSET *st_mem_usage_limit;
  532. RRDSET *st_mem_failcnt;
  533. RRDSET *st_io;
  534. RRDSET *st_serviced_ops;
  535. RRDSET *st_throttle_io;
  536. RRDSET *st_throttle_serviced_ops;
  537. RRDSET *st_queued_ops;
  538. RRDSET *st_merged_ops;
  539. // per cgroup chart variables
  540. char *filename_cpuset_cpus;
  541. unsigned long long cpuset_cpus;
  542. char *filename_cpu_cfs_period;
  543. unsigned long long cpu_cfs_period;
  544. char *filename_cpu_cfs_quota;
  545. unsigned long long cpu_cfs_quota;
  546. RRDSETVAR *chart_var_cpu_limit;
  547. calculated_number prev_cpu_usage;
  548. char *filename_memory_limit;
  549. unsigned long long memory_limit;
  550. RRDSETVAR *chart_var_memory_limit;
  551. char *filename_memoryswap_limit;
  552. unsigned long long memoryswap_limit;
  553. RRDSETVAR *chart_var_memoryswap_limit;
  554. // services
  555. RRDDIM *rd_cpu;
  556. RRDDIM *rd_mem_usage;
  557. RRDDIM *rd_mem_failcnt;
  558. RRDDIM *rd_swap_usage;
  559. RRDDIM *rd_mem_detailed_cache;
  560. RRDDIM *rd_mem_detailed_rss;
  561. RRDDIM *rd_mem_detailed_mapped;
  562. RRDDIM *rd_mem_detailed_writeback;
  563. RRDDIM *rd_mem_detailed_pgpgin;
  564. RRDDIM *rd_mem_detailed_pgpgout;
  565. RRDDIM *rd_mem_detailed_pgfault;
  566. RRDDIM *rd_mem_detailed_pgmajfault;
  567. RRDDIM *rd_io_service_bytes_read;
  568. RRDDIM *rd_io_serviced_read;
  569. RRDDIM *rd_throttle_io_read;
  570. RRDDIM *rd_throttle_io_serviced_read;
  571. RRDDIM *rd_io_queued_read;
  572. RRDDIM *rd_io_merged_read;
  573. RRDDIM *rd_io_service_bytes_write;
  574. RRDDIM *rd_io_serviced_write;
  575. RRDDIM *rd_throttle_io_write;
  576. RRDDIM *rd_throttle_io_serviced_write;
  577. RRDDIM *rd_io_queued_write;
  578. RRDDIM *rd_io_merged_write;
  579. struct cgroup *next;
  580. struct cgroup *discovered_next;
  581. } *cgroup_root = NULL;
  582. uv_mutex_t cgroup_root_mutex;
  583. struct cgroup *discovered_cgroup_root = NULL;
  584. struct discovery_thread {
  585. uv_thread_t thread;
  586. uv_mutex_t mutex;
  587. uv_cond_t cond_var;
  588. int start_discovery;
  589. int exited;
  590. } discovery_thread;
  591. // ----------------------------------------------------------------------------
  592. // read values from /sys
  593. static inline void cgroup_read_cpuacct_stat(struct cpuacct_stat *cp) {
  594. static procfile *ff = NULL;
  595. if(likely(cp->filename)) {
  596. ff = procfile_reopen(ff, cp->filename, NULL, PROCFILE_FLAG_DEFAULT);
  597. if(unlikely(!ff)) {
  598. cp->updated = 0;
  599. cgroups_check = 1;
  600. return;
  601. }
  602. ff = procfile_readall(ff);
  603. if(unlikely(!ff)) {
  604. cp->updated = 0;
  605. cgroups_check = 1;
  606. return;
  607. }
  608. unsigned long i, lines = procfile_lines(ff);
  609. if(unlikely(lines < 1)) {
  610. error("CGROUP: file '%s' should have 1+ lines.", cp->filename);
  611. cp->updated = 0;
  612. return;
  613. }
  614. for(i = 0; i < lines ; i++) {
  615. char *s = procfile_lineword(ff, i, 0);
  616. uint32_t hash = simple_hash(s);
  617. if(unlikely(hash == user_hash && !strcmp(s, "user")))
  618. cp->user = str2ull(procfile_lineword(ff, i, 1));
  619. else if(unlikely(hash == system_hash && !strcmp(s, "system")))
  620. cp->system = str2ull(procfile_lineword(ff, i, 1));
  621. }
  622. cp->updated = 1;
  623. if(unlikely(cp->enabled == CONFIG_BOOLEAN_AUTO &&
  624. (cp->user || cp->system || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES)))
  625. cp->enabled = CONFIG_BOOLEAN_YES;
  626. }
  627. }
  628. static inline void cgroup2_read_cpuacct_stat(struct cpuacct_stat *cp) {
  629. static procfile *ff = NULL;
  630. if(likely(cp->filename)) {
  631. ff = procfile_reopen(ff, cp->filename, NULL, PROCFILE_FLAG_DEFAULT);
  632. if(unlikely(!ff)) {
  633. cp->updated = 0;
  634. cgroups_check = 1;
  635. return;
  636. }
  637. ff = procfile_readall(ff);
  638. if(unlikely(!ff)) {
  639. cp->updated = 0;
  640. cgroups_check = 1;
  641. return;
  642. }
  643. unsigned long lines = procfile_lines(ff);
  644. if(unlikely(lines < 3)) {
  645. error("CGROUP: file '%s' should have 3+ lines.", cp->filename);
  646. cp->updated = 0;
  647. return;
  648. }
  649. cp->user = str2ull(procfile_lineword(ff, 1, 1));
  650. cp->system = str2ull(procfile_lineword(ff, 2, 1));
  651. cp->updated = 1;
  652. if(unlikely(cp->enabled == CONFIG_BOOLEAN_AUTO &&
  653. (cp->user || cp->system || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES)))
  654. cp->enabled = CONFIG_BOOLEAN_YES;
  655. }
  656. }
  657. static inline void cgroup_read_cpuacct_usage(struct cpuacct_usage *ca) {
  658. static procfile *ff = NULL;
  659. if(likely(ca->filename)) {
  660. ff = procfile_reopen(ff, ca->filename, NULL, PROCFILE_FLAG_DEFAULT);
  661. if(unlikely(!ff)) {
  662. ca->updated = 0;
  663. cgroups_check = 1;
  664. return;
  665. }
  666. ff = procfile_readall(ff);
  667. if(unlikely(!ff)) {
  668. ca->updated = 0;
  669. cgroups_check = 1;
  670. return;
  671. }
  672. if(unlikely(procfile_lines(ff) < 1)) {
  673. error("CGROUP: file '%s' should have 1+ lines but has %zu.", ca->filename, procfile_lines(ff));
  674. ca->updated = 0;
  675. return;
  676. }
  677. unsigned long i = procfile_linewords(ff, 0);
  678. if(unlikely(i == 0)) {
  679. ca->updated = 0;
  680. return;
  681. }
  682. // we may have 1 more CPU reported
  683. while(i > 0) {
  684. char *s = procfile_lineword(ff, 0, i - 1);
  685. if(!*s) i--;
  686. else break;
  687. }
  688. if(unlikely(i != ca->cpus)) {
  689. freez(ca->cpu_percpu);
  690. ca->cpu_percpu = mallocz(sizeof(unsigned long long) * i);
  691. ca->cpus = (unsigned int)i;
  692. }
  693. unsigned long long total = 0;
  694. for(i = 0; i < ca->cpus ;i++) {
  695. unsigned long long n = str2ull(procfile_lineword(ff, 0, i));
  696. ca->cpu_percpu[i] = n;
  697. total += n;
  698. }
  699. ca->updated = 1;
  700. if(unlikely(ca->enabled == CONFIG_BOOLEAN_AUTO &&
  701. (total || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES)))
  702. ca->enabled = CONFIG_BOOLEAN_YES;
  703. }
  704. }
  705. static inline void cgroup_read_blkio(struct blkio *io) {
  706. if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO && io->delay_counter > 0)) {
  707. io->delay_counter--;
  708. return;
  709. }
  710. if(likely(io->filename)) {
  711. static procfile *ff = NULL;
  712. ff = procfile_reopen(ff, io->filename, NULL, PROCFILE_FLAG_DEFAULT);
  713. if(unlikely(!ff)) {
  714. io->updated = 0;
  715. cgroups_check = 1;
  716. return;
  717. }
  718. ff = procfile_readall(ff);
  719. if(unlikely(!ff)) {
  720. io->updated = 0;
  721. cgroups_check = 1;
  722. return;
  723. }
  724. unsigned long i, lines = procfile_lines(ff);
  725. if(unlikely(lines < 1)) {
  726. error("CGROUP: file '%s' should have 1+ lines.", io->filename);
  727. io->updated = 0;
  728. return;
  729. }
  730. io->Read = 0;
  731. io->Write = 0;
  732. /*
  733. io->Sync = 0;
  734. io->Async = 0;
  735. io->Total = 0;
  736. */
  737. for(i = 0; i < lines ; i++) {
  738. char *s = procfile_lineword(ff, i, 1);
  739. uint32_t hash = simple_hash(s);
  740. if(unlikely(hash == Read_hash && !strcmp(s, "Read")))
  741. io->Read += str2ull(procfile_lineword(ff, i, 2));
  742. else if(unlikely(hash == Write_hash && !strcmp(s, "Write")))
  743. io->Write += str2ull(procfile_lineword(ff, i, 2));
  744. /*
  745. else if(unlikely(hash == Sync_hash && !strcmp(s, "Sync")))
  746. io->Sync += str2ull(procfile_lineword(ff, i, 2));
  747. else if(unlikely(hash == Async_hash && !strcmp(s, "Async")))
  748. io->Async += str2ull(procfile_lineword(ff, i, 2));
  749. else if(unlikely(hash == Total_hash && !strcmp(s, "Total")))
  750. io->Total += str2ull(procfile_lineword(ff, i, 2));
  751. */
  752. }
  753. io->updated = 1;
  754. if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO)) {
  755. if(unlikely(io->Read || io->Write || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))
  756. io->enabled = CONFIG_BOOLEAN_YES;
  757. else
  758. io->delay_counter = cgroup_recheck_zero_blkio_every_iterations;
  759. }
  760. }
  761. }
  762. static inline void cgroup2_read_blkio(struct blkio *io, unsigned int word_offset) {
  763. if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO && io->delay_counter > 0)) {
  764. io->delay_counter--;
  765. return;
  766. }
  767. if(likely(io->filename)) {
  768. static procfile *ff = NULL;
  769. ff = procfile_reopen(ff, io->filename, NULL, PROCFILE_FLAG_DEFAULT);
  770. if(unlikely(!ff)) {
  771. io->updated = 0;
  772. cgroups_check = 1;
  773. return;
  774. }
  775. ff = procfile_readall(ff);
  776. if(unlikely(!ff)) {
  777. io->updated = 0;
  778. cgroups_check = 1;
  779. return;
  780. }
  781. unsigned long i, lines = procfile_lines(ff);
  782. if (unlikely(lines < 1)) {
  783. error("CGROUP: file '%s' should have 1+ lines.", io->filename);
  784. io->updated = 0;
  785. return;
  786. }
  787. io->Read = 0;
  788. io->Write = 0;
  789. for (i = 0; i < lines; i++) {
  790. io->Read += str2ull(procfile_lineword(ff, i, 2 + word_offset));
  791. io->Write += str2ull(procfile_lineword(ff, i, 4 + word_offset));
  792. }
  793. io->updated = 1;
  794. if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO)) {
  795. if(unlikely(io->Read || io->Write || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))
  796. io->enabled = CONFIG_BOOLEAN_YES;
  797. else
  798. io->delay_counter = cgroup_recheck_zero_blkio_every_iterations;
  799. }
  800. }
  801. }
  802. static inline void cgroup2_read_pressure(struct pressure *res) {
  803. static procfile *ff = NULL;
  804. if (likely(res->filename)) {
  805. ff = procfile_reopen(ff, res->filename, " =", PROCFILE_FLAG_DEFAULT);
  806. if (unlikely(!ff)) {
  807. res->updated = 0;
  808. cgroups_check = 1;
  809. return;
  810. }
  811. ff = procfile_readall(ff);
  812. if (unlikely(!ff)) {
  813. res->updated = 0;
  814. cgroups_check = 1;
  815. return;
  816. }
  817. size_t lines = procfile_lines(ff);
  818. if (lines < 1) {
  819. error("CGROUP: file '%s' should have 1+ lines.", res->filename);
  820. res->updated = 0;
  821. return;
  822. }
  823. res->some.value10 = strtod(procfile_lineword(ff, 0, 2), NULL);
  824. res->some.value60 = strtod(procfile_lineword(ff, 0, 4), NULL);
  825. res->some.value300 = strtod(procfile_lineword(ff, 0, 6), NULL);
  826. if (lines > 2) {
  827. res->full.value10 = strtod(procfile_lineword(ff, 1, 2), NULL);
  828. res->full.value60 = strtod(procfile_lineword(ff, 1, 4), NULL);
  829. res->full.value300 = strtod(procfile_lineword(ff, 1, 6), NULL);
  830. }
  831. res->updated = 1;
  832. if (unlikely(res->some.enabled == CONFIG_BOOLEAN_AUTO)) {
  833. res->some.enabled = CONFIG_BOOLEAN_YES;
  834. if (lines > 2) {
  835. res->full.enabled = CONFIG_BOOLEAN_YES;
  836. } else {
  837. res->full.enabled = CONFIG_BOOLEAN_NO;
  838. }
  839. }
  840. }
  841. }
  842. static inline void cgroup_read_memory(struct memory *mem, char parent_cg_is_unified) {
  843. static procfile *ff = NULL;
  844. // read detailed ram usage
  845. if(likely(mem->filename_detailed)) {
  846. if(unlikely(mem->enabled_detailed == CONFIG_BOOLEAN_AUTO && mem->delay_counter_detailed > 0)) {
  847. mem->delay_counter_detailed--;
  848. goto memory_next;
  849. }
  850. ff = procfile_reopen(ff, mem->filename_detailed, NULL, PROCFILE_FLAG_DEFAULT);
  851. if(unlikely(!ff)) {
  852. mem->updated_detailed = 0;
  853. cgroups_check = 1;
  854. goto memory_next;
  855. }
  856. ff = procfile_readall(ff);
  857. if(unlikely(!ff)) {
  858. mem->updated_detailed = 0;
  859. cgroups_check = 1;
  860. goto memory_next;
  861. }
  862. unsigned long i, lines = procfile_lines(ff);
  863. if(unlikely(lines < 1)) {
  864. error("CGROUP: file '%s' should have 1+ lines.", mem->filename_detailed);
  865. mem->updated_detailed = 0;
  866. goto memory_next;
  867. }
  868. if(unlikely(!mem->arl_base)) {
  869. if(parent_cg_is_unified == 0){
  870. mem->arl_base = arl_create("cgroup/memory", NULL, 60);
  871. arl_expect(mem->arl_base, "total_cache", &mem->total_cache);
  872. arl_expect(mem->arl_base, "total_rss", &mem->total_rss);
  873. arl_expect(mem->arl_base, "total_rss_huge", &mem->total_rss_huge);
  874. arl_expect(mem->arl_base, "total_mapped_file", &mem->total_mapped_file);
  875. arl_expect(mem->arl_base, "total_writeback", &mem->total_writeback);
  876. mem->arl_dirty = arl_expect(mem->arl_base, "total_dirty", &mem->total_dirty);
  877. mem->arl_swap = arl_expect(mem->arl_base, "total_swap", &mem->total_swap);
  878. arl_expect(mem->arl_base, "total_pgpgin", &mem->total_pgpgin);
  879. arl_expect(mem->arl_base, "total_pgpgout", &mem->total_pgpgout);
  880. arl_expect(mem->arl_base, "total_pgfault", &mem->total_pgfault);
  881. arl_expect(mem->arl_base, "total_pgmajfault", &mem->total_pgmajfault);
  882. arl_expect(mem->arl_base, "total_inactive_file", &mem->total_inactive_file);
  883. } else {
  884. mem->arl_base = arl_create("cgroup/memory", NULL, 60);
  885. arl_expect(mem->arl_base, "anon", &mem->anon);
  886. arl_expect(mem->arl_base, "kernel_stack", &mem->kernel_stack);
  887. arl_expect(mem->arl_base, "slab", &mem->slab);
  888. arl_expect(mem->arl_base, "sock", &mem->sock);
  889. arl_expect(mem->arl_base, "anon_thp", &mem->anon_thp);
  890. arl_expect(mem->arl_base, "file", &mem->total_mapped_file);
  891. arl_expect(mem->arl_base, "file_writeback", &mem->total_writeback);
  892. mem->arl_dirty = arl_expect(mem->arl_base, "file_dirty", &mem->total_dirty);
  893. arl_expect(mem->arl_base, "pgfault", &mem->total_pgfault);
  894. arl_expect(mem->arl_base, "pgmajfault", &mem->total_pgmajfault);
  895. arl_expect(mem->arl_base, "inactive_file", &mem->total_inactive_file);
  896. }
  897. }
  898. arl_begin(mem->arl_base);
  899. for(i = 0; i < lines ; i++) {
  900. if(arl_check(mem->arl_base,
  901. procfile_lineword(ff, i, 0),
  902. procfile_lineword(ff, i, 1))) break;
  903. }
  904. if(unlikely(mem->arl_dirty->flags & ARL_ENTRY_FLAG_FOUND))
  905. mem->detailed_has_dirty = 1;
  906. if(unlikely(parent_cg_is_unified == 0 && mem->arl_swap->flags & ARL_ENTRY_FLAG_FOUND))
  907. mem->detailed_has_swap = 1;
  908. // fprintf(stderr, "READ: '%s', cache: %llu, rss: %llu, rss_huge: %llu, mapped_file: %llu, writeback: %llu, dirty: %llu, swap: %llu, pgpgin: %llu, pgpgout: %llu, pgfault: %llu, pgmajfault: %llu, inactive_anon: %llu, active_anon: %llu, inactive_file: %llu, active_file: %llu, unevictable: %llu, hierarchical_memory_limit: %llu, total_cache: %llu, total_rss: %llu, total_rss_huge: %llu, total_mapped_file: %llu, total_writeback: %llu, total_dirty: %llu, total_swap: %llu, total_pgpgin: %llu, total_pgpgout: %llu, total_pgfault: %llu, total_pgmajfault: %llu, total_inactive_anon: %llu, total_active_anon: %llu, total_inactive_file: %llu, total_active_file: %llu, total_unevictable: %llu\n", mem->filename, mem->cache, mem->rss, mem->rss_huge, mem->mapped_file, mem->writeback, mem->dirty, mem->swap, mem->pgpgin, mem->pgpgout, mem->pgfault, mem->pgmajfault, mem->inactive_anon, mem->active_anon, mem->inactive_file, mem->active_file, mem->unevictable, mem->hierarchical_memory_limit, mem->total_cache, mem->total_rss, mem->total_rss_huge, mem->total_mapped_file, mem->total_writeback, mem->total_dirty, mem->total_swap, mem->total_pgpgin, mem->total_pgpgout, mem->total_pgfault, mem->total_pgmajfault, mem->total_inactive_anon, mem->total_active_anon, mem->total_inactive_file, mem->total_active_file, mem->total_unevictable);
  909. mem->updated_detailed = 1;
  910. if(unlikely(mem->enabled_detailed == CONFIG_BOOLEAN_AUTO)) {
  911. if(( (!parent_cg_is_unified) && ( mem->total_cache || mem->total_dirty || mem->total_rss || mem->total_rss_huge || mem->total_mapped_file || mem->total_writeback
  912. || mem->total_swap || mem->total_pgpgin || mem->total_pgpgout || mem->total_pgfault || mem->total_pgmajfault || mem->total_inactive_file))
  913. || (parent_cg_is_unified && ( mem->anon || mem->total_dirty || mem->kernel_stack || mem->slab || mem->sock || mem->total_writeback
  914. || mem->anon_thp || mem->total_pgfault || mem->total_pgmajfault || mem->total_inactive_file))
  915. || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES)
  916. mem->enabled_detailed = CONFIG_BOOLEAN_YES;
  917. else
  918. mem->delay_counter_detailed = cgroup_recheck_zero_mem_detailed_every_iterations;
  919. }
  920. }
  921. memory_next:
  922. // read usage_in_bytes
  923. if(likely(mem->filename_usage_in_bytes)) {
  924. mem->updated_usage_in_bytes = !read_single_number_file(mem->filename_usage_in_bytes, &mem->usage_in_bytes);
  925. if(unlikely(mem->updated_usage_in_bytes && mem->enabled_usage_in_bytes == CONFIG_BOOLEAN_AUTO &&
  926. (mem->usage_in_bytes || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES)))
  927. mem->enabled_usage_in_bytes = CONFIG_BOOLEAN_YES;
  928. }
  929. if (likely(mem->updated_usage_in_bytes && mem->updated_detailed)) {
  930. mem->usage_in_bytes =
  931. (mem->usage_in_bytes > mem->total_inactive_file) ? (mem->usage_in_bytes - mem->total_inactive_file) : 0;
  932. }
  933. // read msw_usage_in_bytes
  934. if(likely(mem->filename_msw_usage_in_bytes)) {
  935. mem->updated_msw_usage_in_bytes = !read_single_number_file(mem->filename_msw_usage_in_bytes, &mem->msw_usage_in_bytes);
  936. if(unlikely(mem->updated_msw_usage_in_bytes && mem->enabled_msw_usage_in_bytes == CONFIG_BOOLEAN_AUTO &&
  937. (mem->msw_usage_in_bytes || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES)))
  938. mem->enabled_msw_usage_in_bytes = CONFIG_BOOLEAN_YES;
  939. }
  940. // read failcnt
  941. if(likely(mem->filename_failcnt)) {
  942. if(unlikely(mem->enabled_failcnt == CONFIG_BOOLEAN_AUTO && mem->delay_counter_failcnt > 0)) {
  943. mem->updated_failcnt = 0;
  944. mem->delay_counter_failcnt--;
  945. }
  946. else {
  947. mem->updated_failcnt = !read_single_number_file(mem->filename_failcnt, &mem->failcnt);
  948. if(unlikely(mem->updated_failcnt && mem->enabled_failcnt == CONFIG_BOOLEAN_AUTO)) {
  949. if(unlikely(mem->failcnt || netdata_zero_metrics_enabled == CONFIG_BOOLEAN_YES))
  950. mem->enabled_failcnt = CONFIG_BOOLEAN_YES;
  951. else
  952. mem->delay_counter_failcnt = cgroup_recheck_zero_mem_failcnt_every_iterations;
  953. }
  954. }
  955. }
  956. }
  957. static inline void cgroup_read(struct cgroup *cg) {
  958. debug(D_CGROUP, "reading metrics for cgroups '%s'", cg->id);
  959. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  960. cgroup_read_cpuacct_stat(&cg->cpuacct_stat);
  961. cgroup_read_cpuacct_usage(&cg->cpuacct_usage);
  962. cgroup_read_memory(&cg->memory, 0);
  963. cgroup_read_blkio(&cg->io_service_bytes);
  964. cgroup_read_blkio(&cg->io_serviced);
  965. cgroup_read_blkio(&cg->throttle_io_service_bytes);
  966. cgroup_read_blkio(&cg->throttle_io_serviced);
  967. cgroup_read_blkio(&cg->io_merged);
  968. cgroup_read_blkio(&cg->io_queued);
  969. }
  970. else {
  971. //TODO: io_service_bytes and io_serviced use same file merge into 1 function
  972. cgroup2_read_blkio(&cg->io_service_bytes, 0);
  973. cgroup2_read_blkio(&cg->io_serviced, 4);
  974. cgroup2_read_cpuacct_stat(&cg->cpuacct_stat);
  975. cgroup2_read_pressure(&cg->cpu_pressure);
  976. cgroup2_read_pressure(&cg->io_pressure);
  977. cgroup2_read_pressure(&cg->memory_pressure);
  978. cgroup_read_memory(&cg->memory, 1);
  979. }
  980. }
  981. static inline void read_all_cgroups(struct cgroup *root) {
  982. debug(D_CGROUP, "reading metrics for all cgroups");
  983. struct cgroup *cg;
  984. for(cg = root; cg ; cg = cg->next)
  985. if(cg->enabled && !cg->pending_renames)
  986. cgroup_read(cg);
  987. }
  988. // ----------------------------------------------------------------------------
  989. // cgroup network interfaces
  990. #define CGROUP_NETWORK_INTERFACE_MAX_LINE 2048
  991. static inline void read_cgroup_network_interfaces(struct cgroup *cg) {
  992. debug(D_CGROUP, "looking for the network interfaces of cgroup '%s' with chart id '%s' and title '%s'", cg->id, cg->chart_id, cg->chart_title);
  993. pid_t cgroup_pid;
  994. char command[CGROUP_NETWORK_INTERFACE_MAX_LINE + 1];
  995. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  996. snprintfz(command, CGROUP_NETWORK_INTERFACE_MAX_LINE, "exec %s --cgroup '%s%s'", cgroups_network_interface_script, cgroup_cpuacct_base, cg->id);
  997. }
  998. else {
  999. snprintfz(command, CGROUP_NETWORK_INTERFACE_MAX_LINE, "exec %s --cgroup '%s%s'", cgroups_network_interface_script, cgroup_unified_base, cg->id);
  1000. }
  1001. debug(D_CGROUP, "executing command '%s' for cgroup '%s'", command, cg->id);
  1002. FILE *fp = mypopen(command, &cgroup_pid);
  1003. if(!fp) {
  1004. error("CGROUP: cannot popen(\"%s\", \"r\").", command);
  1005. return;
  1006. }
  1007. char *s;
  1008. char buffer[CGROUP_NETWORK_INTERFACE_MAX_LINE + 1];
  1009. while((s = fgets(buffer, CGROUP_NETWORK_INTERFACE_MAX_LINE, fp))) {
  1010. trim(s);
  1011. if(*s && *s != '\n') {
  1012. char *t = s;
  1013. while(*t && *t != ' ') t++;
  1014. if(*t == ' ') {
  1015. *t = '\0';
  1016. t++;
  1017. }
  1018. if(!*s) {
  1019. error("CGROUP: empty host interface returned by script");
  1020. continue;
  1021. }
  1022. if(!*t) {
  1023. error("CGROUP: empty guest interface returned by script");
  1024. continue;
  1025. }
  1026. struct cgroup_network_interface *i = callocz(1, sizeof(struct cgroup_network_interface));
  1027. i->host_device = strdupz(s);
  1028. i->container_device = strdupz(t);
  1029. i->next = cg->interfaces;
  1030. cg->interfaces = i;
  1031. info("CGROUP: cgroup '%s' has network interface '%s' as '%s'", cg->id, i->host_device, i->container_device);
  1032. // register a device rename to proc_net_dev.c
  1033. netdev_rename_device_add(i->host_device, i->container_device, cg->chart_id, cg->chart_labels);
  1034. }
  1035. }
  1036. mypclose(fp, cgroup_pid);
  1037. // debug(D_CGROUP, "closed command for cgroup '%s'", cg->id);
  1038. }
  1039. static inline void free_cgroup_network_interfaces(struct cgroup *cg) {
  1040. while(cg->interfaces) {
  1041. struct cgroup_network_interface *i = cg->interfaces;
  1042. cg->interfaces = i->next;
  1043. // delete the registration of proc_net_dev rename
  1044. netdev_rename_device_del(i->host_device);
  1045. freez((void *)i->host_device);
  1046. freez((void *)i->container_device);
  1047. freez((void *)i);
  1048. }
  1049. }
  1050. // ----------------------------------------------------------------------------
  1051. // add/remove/find cgroup objects
  1052. #define CGROUP_CHARTID_LINE_MAX 1024
  // Build a chart title from a cgroup path.
  // A NULL or empty path is treated as "/"; one leading slash is dropped unless
  // the path is exactly "/". The copy is made with strdupz() and then passed
  // through netdata_fix_chart_name(). The caller owns the returned string.
  static inline char *cgroup_title_strdupz(const char *s) {
      const char *src = (s && *s) ? s : "/";

      if(src[0] == '/' && src[1] != '\0')
          src++;

      char *title = strdupz(src);
      netdata_fix_chart_name(title);

      return title;
  }
  // Build a chart id from a cgroup path.
  // A NULL or empty path is treated as "/"; one leading slash is dropped unless
  // the path is exactly "/". The copy is made with strdupz() and then passed
  // through netdata_fix_chart_id(). The caller owns the returned string.
  static inline char *cgroup_chart_id_strdupz(const char *s) {
      const char *src = (s && *s) ? s : "/";

      if(src[0] == '/' && src[1] != '\0')
          src++;

      char *chart_id = strdupz(src);
      netdata_fix_chart_id(chart_id);

      return chart_id;
  }
  1067. char *parse_k8s_data(struct label **labels, char *data)
  1068. {
  1069. char *name = mystrsep(&data, " ");
  1070. if (!data) {
  1071. return name;
  1072. }
  1073. while (data) {
  1074. char *key = mystrsep(&data, "=");
  1075. char *value;
  1076. if (data && *data == ',') {
  1077. value = "";
  1078. *data++ = '\0';
  1079. } else {
  1080. value = mystrsep(&data, ",");
  1081. }
  1082. value = strip_double_quotes(value, 1);
  1083. if (!key || *key == '\0' || !value || *value == '\0')
  1084. continue;
  1085. *labels = add_label_to_list(*labels, key, value, LABEL_SOURCE_KUBERNETES);
  1086. }
  1087. return name;
  1088. }
  1089. static inline void cgroup_get_chart_name(struct cgroup *cg) {
  1090. debug(D_CGROUP, "looking for the name of cgroup '%s' with chart id '%s' and title '%s'", cg->id, cg->chart_id, cg->chart_title);
  1091. pid_t cgroup_pid;
  1092. char command[CGROUP_CHARTID_LINE_MAX + 1];
  1093. snprintfz(command, CGROUP_CHARTID_LINE_MAX, "exec %s '%s'", cgroups_rename_script, cg->chart_id);
  1094. debug(D_CGROUP, "executing command \"%s\" for cgroup '%s'", command, cg->chart_id);
  1095. FILE *fp = mypopen(command, &cgroup_pid);
  1096. if(fp) {
  1097. // debug(D_CGROUP, "reading from command '%s' for cgroup '%s'", command, cg->id);
  1098. char buffer[CGROUP_CHARTID_LINE_MAX + 1];
  1099. char *s = fgets(buffer, CGROUP_CHARTID_LINE_MAX, fp);
  1100. // debug(D_CGROUP, "closing command for cgroup '%s'", cg->id);
  1101. int name_error = mypclose(fp, cgroup_pid);
  1102. // debug(D_CGROUP, "closed command for cgroup '%s'", cg->id);
  1103. if(s && *s && *s != '\n') {
  1104. debug(D_CGROUP, "cgroup '%s' should be renamed to '%s'", cg->chart_id, s);
  1105. s = trim(s);
  1106. if (s) {
  1107. if(likely(name_error==0))
  1108. cg->pending_renames = 0;
  1109. else if (unlikely(name_error==3)) {
  1110. debug(D_CGROUP, "cgroup '%s' disabled based due to rename command output", cg->chart_id);
  1111. cg->enabled = 0;
  1112. }
  1113. if (likely(cg->pending_renames < 2)) {
  1114. char *name = s;
  1115. if (!strncmp(s, "k8s_", 4)) {
  1116. free_label_list(cg->chart_labels);
  1117. name = parse_k8s_data(&cg->chart_labels, s);
  1118. }
  1119. freez(cg->chart_title);
  1120. cg->chart_title = cgroup_title_strdupz(name);
  1121. freez(cg->chart_id);
  1122. cg->chart_id = cgroup_chart_id_strdupz(name);
  1123. cg->hash_chart = simple_hash(cg->chart_id);
  1124. }
  1125. }
  1126. }
  1127. }
  1128. else
  1129. error("CGROUP: cannot popen(\"%s\", \"r\").", command);
  1130. }
  1131. static inline struct cgroup *cgroup_add(const char *id) {
  1132. if(!id || !*id) id = "/";
  1133. debug(D_CGROUP, "adding to list, cgroup with id '%s'", id);
  1134. if(cgroup_root_count >= cgroup_root_max) {
  1135. info("CGROUP: maximum number of cgroups reached (%d). Not adding cgroup '%s'", cgroup_root_count, id);
  1136. return NULL;
  1137. }
  1138. int def = simple_pattern_matches(enabled_cgroup_patterns, id)?cgroup_enable_new_cgroups_detected_at_runtime:0;
  1139. struct cgroup *cg = callocz(1, sizeof(struct cgroup));
  1140. cg->id = strdupz(id);
  1141. cg->hash = simple_hash(cg->id);
  1142. cg->chart_title = cgroup_title_strdupz(id);
  1143. cg->chart_id = cgroup_chart_id_strdupz(id);
  1144. cg->hash_chart = simple_hash(cg->chart_id);
  1145. if(cgroup_use_unified_cgroups) cg->options |= CGROUP_OPTIONS_IS_UNIFIED;
  1146. if(!discovered_cgroup_root)
  1147. discovered_cgroup_root = cg;
  1148. else {
  1149. // append it
  1150. struct cgroup *e;
  1151. for(e = discovered_cgroup_root; e->discovered_next ;e = e->discovered_next) ;
  1152. e->discovered_next = cg;
  1153. }
  1154. cgroup_root_count++;
  1155. // fix the chart_id and title by calling the external script
  1156. if(simple_pattern_matches(enabled_cgroup_renames, cg->id)) {
  1157. cg->pending_renames = 2;
  1158. cgroup_get_chart_name(cg);
  1159. debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
  1160. }
  1161. else
  1162. debug(D_CGROUP, "cgroup '%s' will not be renamed - it matches the list of disabled cgroup renames (will be shown as '%s')", cg->id, cg->chart_id);
  1163. int user_configurable = 1;
  1164. // check if this cgroup should be a systemd service
  1165. if(cgroup_enable_systemd_services) {
  1166. if(simple_pattern_matches(systemd_services_cgroups, cg->id) ||
  1167. simple_pattern_matches(systemd_services_cgroups, cg->chart_id)) {
  1168. debug(D_CGROUP, "cgroup '%s' with chart id '%s' (title: '%s') matches systemd services cgroups", cg->id, cg->chart_id, cg->chart_title);
  1169. char buffer[CGROUP_CHARTID_LINE_MAX + 1];
  1170. cg->options |= CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE;
  1171. strncpy(buffer, cg->id, CGROUP_CHARTID_LINE_MAX);
  1172. char *s = buffer;
  1173. //freez(cg->chart_id);
  1174. //cg->chart_id = cgroup_chart_id_strdupz(s);
  1175. //cg->hash_chart = simple_hash(cg->chart_id);
  1176. // skip to the last slash
  1177. size_t len = strlen(s);
  1178. while(len--) if(unlikely(s[len] == '/')) break;
  1179. if(len) s = &s[len + 1];
  1180. // remove extension
  1181. len = strlen(s);
  1182. while(len--) if(unlikely(s[len] == '.')) break;
  1183. if(len) s[len] = '\0';
  1184. freez(cg->chart_title);
  1185. cg->chart_title = cgroup_title_strdupz(s);
  1186. cg->enabled = 1;
  1187. user_configurable = 0;
  1188. debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
  1189. }
  1190. else
  1191. debug(D_CGROUP, "cgroup '%s' with chart id '%s' (title: '%s') does not match systemd services groups", cg->id, cg->chart_id, cg->chart_title);
  1192. }
  1193. if(user_configurable) {
  1194. // allow the user to enable/disable this individually
  1195. char option[FILENAME_MAX + 1];
  1196. snprintfz(option, FILENAME_MAX, "enable cgroup %s", cg->chart_title);
  1197. cg->enabled = (char) config_get_boolean("plugin:cgroups", option, def);
  1198. }
  1199. // detect duplicate cgroups
  1200. if(cg->enabled) {
  1201. struct cgroup *t;
  1202. for (t = discovered_cgroup_root; t; t = t->discovered_next) {
  1203. if (t != cg && t->enabled && t->hash_chart == cg->hash_chart && !strcmp(t->chart_id, cg->chart_id)) {
  1204. // TODO: use it after refactoring if system.slice might be scanned before init.scope/system.slice
  1205. //
  1206. // if (!strncmp(t->id, "/system.slice/", 14) && !strncmp(cg->id, "/init.scope/system.slice/", 25)) {
  1207. // error("CGROUP: chart id '%s' already exists with id '%s' and is enabled. Swapping them by enabling cgroup with id '%s' and disabling cgroup with id '%s'.",
  1208. // cg->chart_id, t->id, cg->id, t->id);
  1209. // t->enabled = 0;
  1210. // t->options |= CGROUP_OPTIONS_DISABLED_DUPLICATE;
  1211. // }
  1212. // else {}
  1213. //
  1214. // https://github.com/netdata/netdata/issues/797#issuecomment-241248884
  1215. error("CGROUP: chart id '%s' already exists with id '%s' and is enabled and available. Disabling cgroup with id '%s'.",
  1216. cg->chart_id, t->id, cg->id);
  1217. cg->enabled = 0;
  1218. cg->options |= CGROUP_OPTIONS_DISABLED_DUPLICATE;
  1219. break;
  1220. }
  1221. }
  1222. }
  1223. if(cg->enabled && !cg->pending_renames && !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE))
  1224. read_cgroup_network_interfaces(cg);
  1225. debug(D_CGROUP, "ADDED CGROUP: '%s' with chart id '%s' and title '%s' as %s (default was %s)", cg->id, cg->chart_id, cg->chart_title, (cg->enabled)?"enabled":"disabled", (def)?"enabled":"disabled");
  1226. return cg;
  1227. }
  1228. static inline void free_pressure(struct pressure *res) {
  1229. if (res->some.st) rrdset_is_obsolete(res->some.st);
  1230. if (res->full.st) rrdset_is_obsolete(res->full.st);
  1231. freez(res->filename);
  1232. }
  1233. static inline void cgroup_free(struct cgroup *cg) {
  1234. debug(D_CGROUP, "Removing cgroup '%s' with chart id '%s' (was %s and %s)", cg->id, cg->chart_id, (cg->enabled)?"enabled":"disabled", (cg->available)?"available":"not available");
  1235. if(cg->st_cpu) rrdset_is_obsolete(cg->st_cpu);
  1236. if(cg->st_cpu_limit) rrdset_is_obsolete(cg->st_cpu_limit);
  1237. if(cg->st_cpu_per_core) rrdset_is_obsolete(cg->st_cpu_per_core);
  1238. if(cg->st_mem) rrdset_is_obsolete(cg->st_mem);
  1239. if(cg->st_writeback) rrdset_is_obsolete(cg->st_writeback);
  1240. if(cg->st_mem_activity) rrdset_is_obsolete(cg->st_mem_activity);
  1241. if(cg->st_pgfaults) rrdset_is_obsolete(cg->st_pgfaults);
  1242. if(cg->st_mem_usage) rrdset_is_obsolete(cg->st_mem_usage);
  1243. if(cg->st_mem_usage_limit) rrdset_is_obsolete(cg->st_mem_usage_limit);
  1244. if(cg->st_mem_utilization) rrdset_is_obsolete(cg->st_mem_utilization);
  1245. if(cg->st_mem_failcnt) rrdset_is_obsolete(cg->st_mem_failcnt);
  1246. if(cg->st_io) rrdset_is_obsolete(cg->st_io);
  1247. if(cg->st_serviced_ops) rrdset_is_obsolete(cg->st_serviced_ops);
  1248. if(cg->st_throttle_io) rrdset_is_obsolete(cg->st_throttle_io);
  1249. if(cg->st_throttle_serviced_ops) rrdset_is_obsolete(cg->st_throttle_serviced_ops);
  1250. if(cg->st_queued_ops) rrdset_is_obsolete(cg->st_queued_ops);
  1251. if(cg->st_merged_ops) rrdset_is_obsolete(cg->st_merged_ops);
  1252. freez(cg->filename_cpuset_cpus);
  1253. freez(cg->filename_cpu_cfs_period);
  1254. freez(cg->filename_cpu_cfs_quota);
  1255. freez(cg->filename_memory_limit);
  1256. freez(cg->filename_memoryswap_limit);
  1257. free_cgroup_network_interfaces(cg);
  1258. freez(cg->cpuacct_usage.cpu_percpu);
  1259. freez(cg->cpuacct_stat.filename);
  1260. freez(cg->cpuacct_usage.filename);
  1261. arl_free(cg->memory.arl_base);
  1262. freez(cg->memory.filename_detailed);
  1263. freez(cg->memory.filename_failcnt);
  1264. freez(cg->memory.filename_usage_in_bytes);
  1265. freez(cg->memory.filename_msw_usage_in_bytes);
  1266. freez(cg->io_service_bytes.filename);
  1267. freez(cg->io_serviced.filename);
  1268. freez(cg->throttle_io_service_bytes.filename);
  1269. freez(cg->throttle_io_serviced.filename);
  1270. freez(cg->io_merged.filename);
  1271. freez(cg->io_queued.filename);
  1272. free_pressure(&cg->cpu_pressure);
  1273. free_pressure(&cg->io_pressure);
  1274. free_pressure(&cg->memory_pressure);
  1275. freez(cg->id);
  1276. freez(cg->chart_id);
  1277. freez(cg->chart_title);
  1278. free_label_list(cg->chart_labels);
  1279. freez(cg);
  1280. cgroup_root_count--;
  1281. }
  1282. // find if a given cgroup exists
  1283. static inline struct cgroup *cgroup_find(const char *id) {
  1284. debug(D_CGROUP, "searching for cgroup '%s'", id);
  1285. uint32_t hash = simple_hash(id);
  1286. struct cgroup *cg;
  1287. for(cg = discovered_cgroup_root; cg ; cg = cg->discovered_next) {
  1288. if(hash == cg->hash && strcmp(id, cg->id) == 0)
  1289. break;
  1290. }
  1291. debug(D_CGROUP, "cgroup '%s' %s in memory", id, (cg)?"found":"not found");
  1292. return cg;
  1293. }
  1294. // ----------------------------------------------------------------------------
  1295. // detect running cgroups
  1296. // callback for find_file_in_subdirs()
  1297. static inline void found_subdir_in_dir(const char *dir) {
  1298. debug(D_CGROUP, "examining cgroup dir '%s'", dir);
  1299. struct cgroup *cg = cgroup_find(dir);
  1300. if(!cg) {
  1301. if(*dir && cgroup_max_depth > 0) {
  1302. int depth = 0;
  1303. const char *s;
  1304. for(s = dir; *s ;s++)
  1305. if(unlikely(*s == '/'))
  1306. depth++;
  1307. if(depth > cgroup_max_depth) {
  1308. info("CGROUP: '%s' is too deep (%d, while max is %d)", dir, depth, cgroup_max_depth);
  1309. return;
  1310. }
  1311. }
  1312. // debug(D_CGROUP, "will add dir '%s' as cgroup", dir);
  1313. cg = cgroup_add(dir);
  1314. }
  1315. if(cg) {
  1316. // delay renaming of the cgroup and looking for network interfaces to deal with the docker lag when starting the container
  1317. if(unlikely(cg->pending_renames == 1)) {
  1318. // fix the chart_id and title by calling the external script
  1319. if(simple_pattern_matches(enabled_cgroup_renames, cg->id)) {
  1320. cgroup_get_chart_name(cg);
  1321. cg->pending_renames = 0;
  1322. if(cg->enabled && !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE))
  1323. read_cgroup_network_interfaces(cg);
  1324. debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
  1325. }
  1326. else
  1327. debug(D_CGROUP, "cgroup '%s' will not be renamed - it matches the list of disabled cgroup renames (will be shown as '%s')", cg->id, cg->chart_id);
  1328. }
  1329. cg->available = 1;
  1330. }
  1331. }
  1332. static inline int find_dir_in_subdirs(const char *base, const char *this, void (*callback)(const char *)) {
  1333. if(!this) this = base;
  1334. debug(D_CGROUP, "searching for directories in '%s' (base '%s')", this?this:"", base);
  1335. size_t dirlen = strlen(this), baselen = strlen(base);
  1336. int ret = -1;
  1337. int enabled = -1;
  1338. const char *relative_path = &this[baselen];
  1339. if(!*relative_path) relative_path = "/";
  1340. DIR *dir = opendir(this);
  1341. if(!dir) {
  1342. error("CGROUP: cannot read directory '%s'", base);
  1343. return ret;
  1344. }
  1345. ret = 1;
  1346. callback(relative_path);
  1347. struct dirent *de = NULL;
  1348. while((de = readdir(dir))) {
  1349. if(de->d_type == DT_DIR
  1350. && (
  1351. (de->d_name[0] == '.' && de->d_name[1] == '\0')
  1352. || (de->d_name[0] == '.' && de->d_name[1] == '.' && de->d_name[2] == '\0')
  1353. ))
  1354. continue;
  1355. if(de->d_type == DT_DIR) {
  1356. if(enabled == -1) {
  1357. const char *r = relative_path;
  1358. if(*r == '\0') r = "/";
  1359. // do not decent in directories we are not interested
  1360. int def = simple_pattern_matches(enabled_cgroup_paths, r);
  1361. // we check for this option here
  1362. // so that the config will not have settings
  1363. // for leaf directories
  1364. char option[FILENAME_MAX + 1];
  1365. snprintfz(option, FILENAME_MAX, "search for cgroups under %s", r);
  1366. option[FILENAME_MAX] = '\0';
  1367. enabled = config_get_boolean("plugin:cgroups", option, def);
  1368. }
  1369. if(enabled) {
  1370. char *s = mallocz(dirlen + strlen(de->d_name) + 2);
  1371. strcpy(s, this);
  1372. strcat(s, "/");
  1373. strcat(s, de->d_name);
  1374. int ret2 = find_dir_in_subdirs(base, s, callback);
  1375. if(ret2 > 0) ret += ret2;
  1376. freez(s);
  1377. }
  1378. }
  1379. }
  1380. closedir(dir);
  1381. return ret;
  1382. }
  1383. static inline void mark_all_cgroups_as_not_available() {
  1384. debug(D_CGROUP, "marking all cgroups as not available");
  1385. struct cgroup *cg;
  1386. // mark all as not available
  1387. for(cg = discovered_cgroup_root; cg ; cg = cg->discovered_next) {
  1388. cg->available = 0;
  1389. }
  1390. }
  1391. static inline void update_filenames()
  1392. {
  1393. struct cgroup *cg;
  1394. struct stat buf;
  1395. for(cg = discovered_cgroup_root; cg ; cg = cg->discovered_next) {
  1396. // fprintf(stderr, " >>> CGROUP '%s' (%u - %s) with name '%s'\n", cg->id, cg->hash, cg->available?"available":"stopped", cg->name);
  1397. if(unlikely(cg->pending_renames))
  1398. cg->pending_renames--;
  1399. if(unlikely(!cg->available || cg->pending_renames))
  1400. continue;
  1401. debug(D_CGROUP, "checking paths for cgroup '%s'", cg->id);
  1402. // check for newly added cgroups
  1403. // and update the filenames they read
  1404. char filename[FILENAME_MAX + 1];
  1405. if(!cgroup_use_unified_cgroups) {
  1406. if(unlikely(cgroup_enable_cpuacct_stat && !cg->cpuacct_stat.filename)) {
  1407. snprintfz(filename, FILENAME_MAX, "%s%s/cpuacct.stat", cgroup_cpuacct_base, cg->id);
  1408. if(likely(stat(filename, &buf) != -1)) {
  1409. cg->cpuacct_stat.filename = strdupz(filename);
  1410. cg->cpuacct_stat.enabled = cgroup_enable_cpuacct_stat;
  1411. snprintfz(filename, FILENAME_MAX, "%s%s/cpuset.cpus", cgroup_cpuset_base, cg->id);
  1412. cg->filename_cpuset_cpus = strdupz(filename);
  1413. snprintfz(filename, FILENAME_MAX, "%s%s/cpu.cfs_period_us", cgroup_cpuacct_base, cg->id);
  1414. cg->filename_cpu_cfs_period = strdupz(filename);
  1415. snprintfz(filename, FILENAME_MAX, "%s%s/cpu.cfs_quota_us", cgroup_cpuacct_base, cg->id);
  1416. cg->filename_cpu_cfs_quota = strdupz(filename);
  1417. debug(D_CGROUP, "cpuacct.stat filename for cgroup '%s': '%s'", cg->id, cg->cpuacct_stat.filename);
  1418. }
  1419. else
  1420. debug(D_CGROUP, "cpuacct.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1421. }
  1422. if(unlikely(cgroup_enable_cpuacct_usage && !cg->cpuacct_usage.filename && !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE))) {
  1423. snprintfz(filename, FILENAME_MAX, "%s%s/cpuacct.usage_percpu", cgroup_cpuacct_base, cg->id);
  1424. if(likely(stat(filename, &buf) != -1)) {
  1425. cg->cpuacct_usage.filename = strdupz(filename);
  1426. cg->cpuacct_usage.enabled = cgroup_enable_cpuacct_usage;
  1427. debug(D_CGROUP, "cpuacct.usage_percpu filename for cgroup '%s': '%s'", cg->id, cg->cpuacct_usage.filename);
  1428. }
  1429. else
  1430. debug(D_CGROUP, "cpuacct.usage_percpu file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1431. }
  1432. if(unlikely((cgroup_enable_detailed_memory || cgroup_used_memory) && !cg->memory.filename_detailed && (cgroup_used_memory || cgroup_enable_systemd_services_detailed_memory || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))) {
  1433. snprintfz(filename, FILENAME_MAX, "%s%s/memory.stat", cgroup_memory_base, cg->id);
  1434. if(likely(stat(filename, &buf) != -1)) {
  1435. cg->memory.filename_detailed = strdupz(filename);
  1436. cg->memory.enabled_detailed = (cgroup_enable_detailed_memory == CONFIG_BOOLEAN_YES)?CONFIG_BOOLEAN_YES:CONFIG_BOOLEAN_AUTO;
  1437. debug(D_CGROUP, "memory.stat filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_detailed);
  1438. }
  1439. else
  1440. debug(D_CGROUP, "memory.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1441. }
  1442. if(unlikely(cgroup_enable_memory && !cg->memory.filename_usage_in_bytes)) {
  1443. snprintfz(filename, FILENAME_MAX, "%s%s/memory.usage_in_bytes", cgroup_memory_base, cg->id);
  1444. if(likely(stat(filename, &buf) != -1)) {
  1445. cg->memory.filename_usage_in_bytes = strdupz(filename);
  1446. cg->memory.enabled_usage_in_bytes = cgroup_enable_memory;
  1447. debug(D_CGROUP, "memory.usage_in_bytes filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_usage_in_bytes);
  1448. snprintfz(filename, FILENAME_MAX, "%s%s/memory.limit_in_bytes", cgroup_memory_base, cg->id);
  1449. cg->filename_memory_limit = strdupz(filename);
  1450. }
  1451. else
  1452. debug(D_CGROUP, "memory.usage_in_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1453. }
  1454. if(unlikely(cgroup_enable_swap && !cg->memory.filename_msw_usage_in_bytes)) {
  1455. snprintfz(filename, FILENAME_MAX, "%s%s/memory.memsw.usage_in_bytes", cgroup_memory_base, cg->id);
  1456. if(likely(stat(filename, &buf) != -1)) {
  1457. cg->memory.filename_msw_usage_in_bytes = strdupz(filename);
  1458. cg->memory.enabled_msw_usage_in_bytes = cgroup_enable_swap;
  1459. snprintfz(filename, FILENAME_MAX, "%s%s/memory.memsw.limit_in_bytes", cgroup_memory_base, cg->id);
  1460. cg->filename_memoryswap_limit = strdupz(filename);
  1461. debug(D_CGROUP, "memory.msw_usage_in_bytes filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_msw_usage_in_bytes);
  1462. }
  1463. else
  1464. debug(D_CGROUP, "memory.msw_usage_in_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1465. }
  1466. if(unlikely(cgroup_enable_memory_failcnt && !cg->memory.filename_failcnt)) {
  1467. snprintfz(filename, FILENAME_MAX, "%s%s/memory.failcnt", cgroup_memory_base, cg->id);
  1468. if(likely(stat(filename, &buf) != -1)) {
  1469. cg->memory.filename_failcnt = strdupz(filename);
  1470. cg->memory.enabled_failcnt = cgroup_enable_memory_failcnt;
  1471. debug(D_CGROUP, "memory.failcnt filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_failcnt);
  1472. }
  1473. else
  1474. debug(D_CGROUP, "memory.failcnt file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1475. }
  1476. if(unlikely(cgroup_enable_blkio_io && !cg->io_service_bytes.filename)) {
  1477. snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_service_bytes", cgroup_blkio_base, cg->id);
  1478. if(likely(stat(filename, &buf) != -1)) {
  1479. cg->io_service_bytes.filename = strdupz(filename);
  1480. cg->io_service_bytes.enabled = cgroup_enable_blkio_io;
  1481. debug(D_CGROUP, "io_service_bytes filename for cgroup '%s': '%s'", cg->id, cg->io_service_bytes.filename);
  1482. }
  1483. else
  1484. debug(D_CGROUP, "io_service_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1485. }
  1486. if(unlikely(cgroup_enable_blkio_ops && !cg->io_serviced.filename)) {
  1487. snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_serviced", cgroup_blkio_base, cg->id);
  1488. if(likely(stat(filename, &buf) != -1)) {
  1489. cg->io_serviced.filename = strdupz(filename);
  1490. cg->io_serviced.enabled = cgroup_enable_blkio_ops;
  1491. debug(D_CGROUP, "io_serviced filename for cgroup '%s': '%s'", cg->id, cg->io_serviced.filename);
  1492. }
  1493. else
  1494. debug(D_CGROUP, "io_serviced file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1495. }
  1496. if(unlikely(cgroup_enable_blkio_throttle_io && !cg->throttle_io_service_bytes.filename)) {
  1497. snprintfz(filename, FILENAME_MAX, "%s%s/blkio.throttle.io_service_bytes", cgroup_blkio_base, cg->id);
  1498. if(likely(stat(filename, &buf) != -1)) {
  1499. cg->throttle_io_service_bytes.filename = strdupz(filename);
  1500. cg->throttle_io_service_bytes.enabled = cgroup_enable_blkio_throttle_io;
  1501. debug(D_CGROUP, "throttle_io_service_bytes filename for cgroup '%s': '%s'", cg->id, cg->throttle_io_service_bytes.filename);
  1502. }
  1503. else
  1504. debug(D_CGROUP, "throttle_io_service_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1505. }
  1506. if(unlikely(cgroup_enable_blkio_throttle_ops && !cg->throttle_io_serviced.filename)) {
  1507. snprintfz(filename, FILENAME_MAX, "%s%s/blkio.throttle.io_serviced", cgroup_blkio_base, cg->id);
  1508. if(likely(stat(filename, &buf) != -1)) {
  1509. cg->throttle_io_serviced.filename = strdupz(filename);
  1510. cg->throttle_io_serviced.enabled = cgroup_enable_blkio_throttle_ops;
  1511. debug(D_CGROUP, "throttle_io_serviced filename for cgroup '%s': '%s'", cg->id, cg->throttle_io_serviced.filename);
  1512. }
  1513. else
  1514. debug(D_CGROUP, "throttle_io_serviced file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1515. }
  1516. if(unlikely(cgroup_enable_blkio_merged_ops && !cg->io_merged.filename)) {
  1517. snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_merged", cgroup_blkio_base, cg->id);
  1518. if(likely(stat(filename, &buf) != -1)) {
  1519. cg->io_merged.filename = strdupz(filename);
  1520. cg->io_merged.enabled = cgroup_enable_blkio_merged_ops;
  1521. debug(D_CGROUP, "io_merged filename for cgroup '%s': '%s'", cg->id, cg->io_merged.filename);
  1522. }
  1523. else
  1524. debug(D_CGROUP, "io_merged file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1525. }
  1526. if(unlikely(cgroup_enable_blkio_queued_ops && !cg->io_queued.filename)) {
  1527. snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_queued", cgroup_blkio_base, cg->id);
  1528. if(likely(stat(filename, &buf) != -1)) {
  1529. cg->io_queued.filename = strdupz(filename);
  1530. cg->io_queued.enabled = cgroup_enable_blkio_queued_ops;
  1531. debug(D_CGROUP, "io_queued filename for cgroup '%s': '%s'", cg->id, cg->io_queued.filename);
  1532. }
  1533. else
  1534. debug(D_CGROUP, "io_queued file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1535. }
  1536. }
  1537. else if(likely(cgroup_unified_exist)) {
  1538. if(unlikely(cgroup_enable_blkio_io && !cg->io_service_bytes.filename)) {
  1539. snprintfz(filename, FILENAME_MAX, "%s%s/io.stat", cgroup_unified_base, cg->id);
  1540. if(likely(stat(filename, &buf) != -1)) {
  1541. cg->io_service_bytes.filename = strdupz(filename);
  1542. cg->io_service_bytes.enabled = cgroup_enable_blkio_io;
  1543. debug(D_CGROUP, "io.stat filename for unified cgroup '%s': '%s'", cg->id, cg->io_service_bytes.filename);
  1544. } else
  1545. debug(D_CGROUP, "io.stat file for unified cgroup '%s': '%s' does not exist.", cg->id, filename);
  1546. }
  1547. if (unlikely(cgroup_enable_blkio_ops && !cg->io_serviced.filename)) {
  1548. snprintfz(filename, FILENAME_MAX, "%s%s/io.stat", cgroup_unified_base, cg->id);
  1549. if (likely(stat(filename, &buf) != -1)) {
  1550. cg->io_serviced.filename = strdupz(filename);
  1551. cg->io_serviced.enabled = cgroup_enable_blkio_ops;
  1552. debug(D_CGROUP, "io.stat filename for unified cgroup '%s': '%s'", cg->id, cg->io_service_bytes.filename);
  1553. } else
  1554. debug(D_CGROUP, "io.stat file for unified cgroup '%s': '%s' does not exist.", cg->id, filename);
  1555. }
  1556. if(unlikely(cgroup_enable_cpuacct_stat && !cg->cpuacct_stat.filename)) {
  1557. snprintfz(filename, FILENAME_MAX, "%s%s/cpu.stat", cgroup_unified_base, cg->id);
  1558. if(likely(stat(filename, &buf) != -1)) {
  1559. cg->cpuacct_stat.filename = strdupz(filename);
  1560. cg->cpuacct_stat.enabled = cgroup_enable_cpuacct_stat;
  1561. cg->filename_cpuset_cpus = NULL;
  1562. cg->filename_cpu_cfs_period = NULL;
  1563. snprintfz(filename, FILENAME_MAX, "%s%s/cpu.max", cgroup_unified_base, cg->id);
  1564. cg->filename_cpu_cfs_quota = strdupz(filename);
  1565. debug(D_CGROUP, "cpu.stat filename for unified cgroup '%s': '%s'", cg->id, cg->cpuacct_stat.filename);
  1566. }
  1567. else
  1568. debug(D_CGROUP, "cpu.stat file for unified cgroup '%s': '%s' does not exist.", cg->id, filename);
  1569. }
  1570. if(unlikely((cgroup_enable_detailed_memory || cgroup_used_memory) && !cg->memory.filename_detailed && (cgroup_used_memory || cgroup_enable_systemd_services_detailed_memory || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))) {
  1571. snprintfz(filename, FILENAME_MAX, "%s%s/memory.stat", cgroup_unified_base, cg->id);
  1572. if(likely(stat(filename, &buf) != -1)) {
  1573. cg->memory.filename_detailed = strdupz(filename);
  1574. cg->memory.enabled_detailed = (cgroup_enable_detailed_memory == CONFIG_BOOLEAN_YES)?CONFIG_BOOLEAN_YES:CONFIG_BOOLEAN_AUTO;
  1575. debug(D_CGROUP, "memory.stat filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_detailed);
  1576. }
  1577. else
  1578. debug(D_CGROUP, "memory.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1579. }
  1580. if(unlikely(cgroup_enable_memory && !cg->memory.filename_usage_in_bytes)) {
  1581. snprintfz(filename, FILENAME_MAX, "%s%s/memory.current", cgroup_unified_base, cg->id);
  1582. if(likely(stat(filename, &buf) != -1)) {
  1583. cg->memory.filename_usage_in_bytes = strdupz(filename);
  1584. cg->memory.enabled_usage_in_bytes = cgroup_enable_memory;
  1585. debug(D_CGROUP, "memory.current filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_usage_in_bytes);
  1586. snprintfz(filename, FILENAME_MAX, "%s%s/memory.max", cgroup_unified_base, cg->id);
  1587. cg->filename_memory_limit = strdupz(filename);
  1588. }
  1589. else
  1590. debug(D_CGROUP, "memory.current file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1591. }
  1592. if(unlikely(cgroup_enable_swap && !cg->memory.filename_msw_usage_in_bytes)) {
  1593. snprintfz(filename, FILENAME_MAX, "%s%s/memory.swap.current", cgroup_unified_base, cg->id);
  1594. if(likely(stat(filename, &buf) != -1)) {
  1595. cg->memory.filename_msw_usage_in_bytes = strdupz(filename);
  1596. cg->memory.enabled_msw_usage_in_bytes = cgroup_enable_swap;
  1597. snprintfz(filename, FILENAME_MAX, "%s%s/memory.swap.max", cgroup_unified_base, cg->id);
  1598. cg->filename_memoryswap_limit = strdupz(filename);
  1599. debug(D_CGROUP, "memory.swap.current filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_msw_usage_in_bytes);
  1600. }
  1601. else
  1602. debug(D_CGROUP, "memory.swap file for cgroup '%s': '%s' does not exist.", cg->id, filename);
  1603. }
  1604. if (unlikely(cgroup_enable_pressure_cpu && !cg->cpu_pressure.filename)) {
  1605. snprintfz(filename, FILENAME_MAX, "%s%s/cpu.pressure", cgroup_unified_base, cg->id);
  1606. if (likely(stat(filename, &buf) != -1)) {
  1607. cg->cpu_pressure.filename = strdupz(filename);
  1608. cg->cpu_pressure.some.enabled = cgroup_enable_pressure_cpu;
  1609. cg->cpu_pressure.full.enabled = CONFIG_BOOLEAN_NO;
  1610. debug(D_CGROUP, "cpu.pressure filename for cgroup '%s': '%s'", cg->id, cg->cpu_pressure.filename);
  1611. } else {
  1612. debug(D_CGROUP, "cpu.pressure file for cgroup '%s': '%s' does not exist", cg->id, filename);
  1613. }
  1614. }
  1615. if (unlikely((cgroup_enable_pressure_io_some || cgroup_enable_pressure_io_full) && !cg->io_pressure.filename)) {
  1616. snprintfz(filename, FILENAME_MAX, "%s%s/io.pressure", cgroup_unified_base, cg->id);
  1617. if (likely(stat(filename, &buf) != -1)) {
  1618. cg->io_pressure.filename = strdupz(filename);
  1619. cg->io_pressure.some.enabled = cgroup_enable_pressure_io_some;
  1620. cg->io_pressure.full.enabled = cgroup_enable_pressure_io_full;
  1621. debug(D_CGROUP, "io.pressure filename for cgroup '%s': '%s'", cg->id, cg->io_pressure.filename);
  1622. } else {
  1623. debug(D_CGROUP, "io.pressure file for cgroup '%s': '%s' does not exist", cg->id, filename);
  1624. }
  1625. }
  1626. if (unlikely((cgroup_enable_pressure_memory_some || cgroup_enable_pressure_memory_full) && !cg->memory_pressure.filename)) {
  1627. snprintfz(filename, FILENAME_MAX, "%s%s/memory.pressure", cgroup_unified_base, cg->id);
  1628. if (likely(stat(filename, &buf) != -1)) {
  1629. cg->memory_pressure.filename = strdupz(filename);
  1630. cg->memory_pressure.some.enabled = cgroup_enable_pressure_memory_some;
  1631. cg->memory_pressure.full.enabled = cgroup_enable_pressure_memory_full;
  1632. debug(D_CGROUP, "memory.pressure filename for cgroup '%s': '%s'", cg->id, cg->memory_pressure.filename);
  1633. } else {
  1634. debug(D_CGROUP, "memory.pressure file for cgroup '%s': '%s' does not exist", cg->id, filename);
  1635. }
  1636. }
  1637. }
  1638. }
  1639. }
  1640. static inline void cleanup_all_cgroups() {
  1641. struct cgroup *cg = discovered_cgroup_root, *last = NULL;
  1642. for(; cg ;) {
  1643. if(!cg->available) {
  1644. // enable the first duplicate cgroup
  1645. {
  1646. struct cgroup *t;
  1647. for(t = discovered_cgroup_root; t ; t = t->discovered_next) {
  1648. if(t != cg && t->available && !t->enabled && t->options & CGROUP_OPTIONS_DISABLED_DUPLICATE && t->hash_chart == cg->hash_chart && !strcmp(t->chart_id, cg->chart_id)) {
  1649. debug(D_CGROUP, "Enabling duplicate of cgroup '%s' with id '%s', because the original with id '%s' stopped.", t->chart_id, t->id, cg->id);
  1650. t->enabled = 1;
  1651. t->options &= ~CGROUP_OPTIONS_DISABLED_DUPLICATE;
  1652. break;
  1653. }
  1654. }
  1655. }
  1656. if(!last)
  1657. discovered_cgroup_root = cg->discovered_next;
  1658. else
  1659. last->discovered_next = cg->discovered_next;
  1660. cgroup_free(cg);
  1661. if(!last)
  1662. cg = discovered_cgroup_root;
  1663. else
  1664. cg = last->discovered_next;
  1665. }
  1666. else {
  1667. last = cg;
  1668. cg = cg->discovered_next;
  1669. }
  1670. }
  1671. }
  1672. static inline void copy_discovered_cgroups()
  1673. {
  1674. debug(D_CGROUP, "copy discovered cgroups to the main group list");
  1675. struct cgroup *cg;
  1676. for(cg = discovered_cgroup_root; cg ; cg = cg->discovered_next) {
  1677. cg->next = cg->discovered_next;
  1678. }
  1679. cgroup_root = discovered_cgroup_root;
  1680. }
  1681. static inline void find_all_cgroups() {
  1682. debug(D_CGROUP, "searching for cgroups");
  1683. mark_all_cgroups_as_not_available();
  1684. if(!cgroup_use_unified_cgroups) {
  1685. if(cgroup_enable_cpuacct_stat || cgroup_enable_cpuacct_usage) {
  1686. if(find_dir_in_subdirs(cgroup_cpuacct_base, NULL, found_subdir_in_dir) == -1) {
  1687. cgroup_enable_cpuacct_stat =
  1688. cgroup_enable_cpuacct_usage = CONFIG_BOOLEAN_NO;
  1689. error("CGROUP: disabled cpu statistics.");
  1690. }
  1691. }
  1692. if(cgroup_enable_blkio_io || cgroup_enable_blkio_ops || cgroup_enable_blkio_throttle_io || cgroup_enable_blkio_throttle_ops || cgroup_enable_blkio_merged_ops || cgroup_enable_blkio_queued_ops) {
  1693. if(find_dir_in_subdirs(cgroup_blkio_base, NULL, found_subdir_in_dir) == -1) {
  1694. cgroup_enable_blkio_io =
  1695. cgroup_enable_blkio_ops =
  1696. cgroup_enable_blkio_throttle_io =
  1697. cgroup_enable_blkio_throttle_ops =
  1698. cgroup_enable_blkio_merged_ops =
  1699. cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_NO;
  1700. error("CGROUP: disabled blkio statistics.");
  1701. }
  1702. }
  1703. if(cgroup_enable_memory || cgroup_enable_detailed_memory || cgroup_enable_swap || cgroup_enable_memory_failcnt) {
  1704. if(find_dir_in_subdirs(cgroup_memory_base, NULL, found_subdir_in_dir) == -1) {
  1705. cgroup_enable_memory =
  1706. cgroup_enable_detailed_memory =
  1707. cgroup_enable_swap =
  1708. cgroup_enable_memory_failcnt = CONFIG_BOOLEAN_NO;
  1709. error("CGROUP: disabled memory statistics.");
  1710. }
  1711. }
  1712. if(cgroup_search_in_devices) {
  1713. if(find_dir_in_subdirs(cgroup_devices_base, NULL, found_subdir_in_dir) == -1) {
  1714. cgroup_search_in_devices = 0;
  1715. error("CGROUP: disabled devices statistics.");
  1716. }
  1717. }
  1718. }
  1719. else {
  1720. if (find_dir_in_subdirs(cgroup_unified_base, NULL, found_subdir_in_dir) == -1) {
  1721. cgroup_unified_exist = CONFIG_BOOLEAN_NO;
  1722. error("CGROUP: disabled unified cgroups statistics.");
  1723. }
  1724. }
  1725. update_filenames();
  1726. uv_mutex_lock(&cgroup_root_mutex);
  1727. cleanup_all_cgroups();
  1728. copy_discovered_cgroups();
  1729. uv_mutex_unlock(&cgroup_root_mutex);
  1730. debug(D_CGROUP, "done searching for cgroups");
  1731. }
  1732. void cgroup_discovery_worker(void *ptr)
  1733. {
  1734. UNUSED(ptr);
  1735. while (!netdata_exit) {
  1736. uv_mutex_lock(&discovery_thread.mutex);
  1737. while (!discovery_thread.start_discovery)
  1738. uv_cond_wait(&discovery_thread.cond_var, &discovery_thread.mutex);
  1739. discovery_thread.start_discovery = 0;
  1740. uv_mutex_unlock(&discovery_thread.mutex);
  1741. if (unlikely(netdata_exit))
  1742. break;
  1743. find_all_cgroups();
  1744. }
  1745. discovery_thread.exited = 1;
  1746. }
  1747. // ----------------------------------------------------------------------------
  1748. // generate charts
  1749. #define CHART_TITLE_MAX 300
  1750. void update_systemd_services_charts(
  1751. int update_every
  1752. , int do_cpu
  1753. , int do_mem_usage
  1754. , int do_mem_detailed
  1755. , int do_mem_failcnt
  1756. , int do_swap_usage
  1757. , int do_io
  1758. , int do_io_ops
  1759. , int do_throttle_io
  1760. , int do_throttle_ops
  1761. , int do_queued_ops
  1762. , int do_merged_ops
  1763. ) {
  1764. static RRDSET
  1765. *st_cpu = NULL,
  1766. *st_mem_usage = NULL,
  1767. *st_mem_failcnt = NULL,
  1768. *st_swap_usage = NULL,
  1769. *st_mem_detailed_cache = NULL,
  1770. *st_mem_detailed_rss = NULL,
  1771. *st_mem_detailed_mapped = NULL,
  1772. *st_mem_detailed_writeback = NULL,
  1773. *st_mem_detailed_pgfault = NULL,
  1774. *st_mem_detailed_pgmajfault = NULL,
  1775. *st_mem_detailed_pgpgin = NULL,
  1776. *st_mem_detailed_pgpgout = NULL,
  1777. *st_io_read = NULL,
  1778. *st_io_serviced_read = NULL,
  1779. *st_throttle_io_read = NULL,
  1780. *st_throttle_ops_read = NULL,
  1781. *st_queued_ops_read = NULL,
  1782. *st_merged_ops_read = NULL,
  1783. *st_io_write = NULL,
  1784. *st_io_serviced_write = NULL,
  1785. *st_throttle_io_write = NULL,
  1786. *st_throttle_ops_write = NULL,
  1787. *st_queued_ops_write = NULL,
  1788. *st_merged_ops_write = NULL;
  1789. // create the charts
  1790. if(likely(do_cpu)) {
  1791. if(unlikely(!st_cpu)) {
  1792. char title[CHART_TITLE_MAX + 1];
  1793. snprintfz(title, CHART_TITLE_MAX, "Systemd Services CPU utilization (100%% = 1 core)");
  1794. st_cpu = rrdset_create_localhost(
  1795. "services"
  1796. , "cpu"
  1797. , NULL
  1798. , "cpu"
  1799. , "services.cpu"
  1800. , title
  1801. , "percentage"
  1802. , PLUGIN_CGROUPS_NAME
  1803. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1804. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD
  1805. , update_every
  1806. , RRDSET_TYPE_STACKED
  1807. );
  1808. }
  1809. else
  1810. rrdset_next(st_cpu);
  1811. }
  1812. if(likely(do_mem_usage)) {
  1813. if(unlikely(!st_mem_usage)) {
  1814. st_mem_usage = rrdset_create_localhost(
  1815. "services"
  1816. , "mem_usage"
  1817. , NULL
  1818. , "mem"
  1819. , "services.mem_usage"
  1820. , "Systemd Services Used Memory"
  1821. , "MiB"
  1822. , PLUGIN_CGROUPS_NAME
  1823. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1824. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 10
  1825. , update_every
  1826. , RRDSET_TYPE_STACKED
  1827. );
  1828. }
  1829. else
  1830. rrdset_next(st_mem_usage);
  1831. }
  1832. if(likely(do_mem_detailed)) {
  1833. if(unlikely(!st_mem_detailed_rss)) {
  1834. st_mem_detailed_rss = rrdset_create_localhost(
  1835. "services"
  1836. , "mem_rss"
  1837. , NULL
  1838. , "mem"
  1839. , "services.mem_rss"
  1840. , "Systemd Services RSS Memory"
  1841. , "MiB"
  1842. , PLUGIN_CGROUPS_NAME
  1843. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1844. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 20
  1845. , update_every
  1846. , RRDSET_TYPE_STACKED
  1847. );
  1848. }
  1849. else
  1850. rrdset_next(st_mem_detailed_rss);
  1851. if(unlikely(!st_mem_detailed_mapped)) {
  1852. st_mem_detailed_mapped = rrdset_create_localhost(
  1853. "services"
  1854. , "mem_mapped"
  1855. , NULL
  1856. , "mem"
  1857. , "services.mem_mapped"
  1858. , "Systemd Services Mapped Memory"
  1859. , "MiB"
  1860. , PLUGIN_CGROUPS_NAME
  1861. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1862. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 30
  1863. , update_every
  1864. , RRDSET_TYPE_STACKED
  1865. );
  1866. }
  1867. else
  1868. rrdset_next(st_mem_detailed_mapped);
  1869. if(unlikely(!st_mem_detailed_cache)) {
  1870. st_mem_detailed_cache = rrdset_create_localhost(
  1871. "services"
  1872. , "mem_cache"
  1873. , NULL
  1874. , "mem"
  1875. , "services.mem_cache"
  1876. , "Systemd Services Cache Memory"
  1877. , "MiB"
  1878. , PLUGIN_CGROUPS_NAME
  1879. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1880. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 40
  1881. , update_every
  1882. , RRDSET_TYPE_STACKED
  1883. );
  1884. }
  1885. else
  1886. rrdset_next(st_mem_detailed_cache);
  1887. if(unlikely(!st_mem_detailed_writeback)) {
  1888. st_mem_detailed_writeback = rrdset_create_localhost(
  1889. "services"
  1890. , "mem_writeback"
  1891. , NULL
  1892. , "mem"
  1893. , "services.mem_writeback"
  1894. , "Systemd Services Writeback Memory"
  1895. , "MiB"
  1896. , PLUGIN_CGROUPS_NAME
  1897. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1898. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 50
  1899. , update_every
  1900. , RRDSET_TYPE_STACKED
  1901. );
  1902. }
  1903. else
  1904. rrdset_next(st_mem_detailed_writeback);
  1905. if(unlikely(!st_mem_detailed_pgfault)) {
  1906. st_mem_detailed_pgfault = rrdset_create_localhost(
  1907. "services"
  1908. , "mem_pgfault"
  1909. , NULL
  1910. , "mem"
  1911. , "services.mem_pgfault"
  1912. , "Systemd Services Memory Minor Page Faults"
  1913. , "MiB/s"
  1914. , PLUGIN_CGROUPS_NAME
  1915. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1916. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 60
  1917. , update_every
  1918. , RRDSET_TYPE_STACKED
  1919. );
  1920. }
  1921. else
  1922. rrdset_next(st_mem_detailed_pgfault);
  1923. if(unlikely(!st_mem_detailed_pgmajfault)) {
  1924. st_mem_detailed_pgmajfault = rrdset_create_localhost(
  1925. "services"
  1926. , "mem_pgmajfault"
  1927. , NULL
  1928. , "mem"
  1929. , "services.mem_pgmajfault"
  1930. , "Systemd Services Memory Major Page Faults"
  1931. , "MiB/s"
  1932. , PLUGIN_CGROUPS_NAME
  1933. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1934. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 70
  1935. , update_every
  1936. , RRDSET_TYPE_STACKED
  1937. );
  1938. }
  1939. else
  1940. rrdset_next(st_mem_detailed_pgmajfault);
  1941. if(unlikely(!st_mem_detailed_pgpgin)) {
  1942. st_mem_detailed_pgpgin = rrdset_create_localhost(
  1943. "services"
  1944. , "mem_pgpgin"
  1945. , NULL
  1946. , "mem"
  1947. , "services.mem_pgpgin"
  1948. , "Systemd Services Memory Charging Activity"
  1949. , "MiB/s"
  1950. , PLUGIN_CGROUPS_NAME
  1951. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1952. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 80
  1953. , update_every
  1954. , RRDSET_TYPE_STACKED
  1955. );
  1956. }
  1957. else
  1958. rrdset_next(st_mem_detailed_pgpgin);
  1959. if(unlikely(!st_mem_detailed_pgpgout)) {
  1960. st_mem_detailed_pgpgout = rrdset_create_localhost(
  1961. "services"
  1962. , "mem_pgpgout"
  1963. , NULL
  1964. , "mem"
  1965. , "services.mem_pgpgout"
  1966. , "Systemd Services Memory Uncharging Activity"
  1967. , "MiB/s"
  1968. , PLUGIN_CGROUPS_NAME
  1969. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1970. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 90
  1971. , update_every
  1972. , RRDSET_TYPE_STACKED
  1973. );
  1974. }
  1975. else
  1976. rrdset_next(st_mem_detailed_pgpgout);
  1977. }
  1978. if(likely(do_mem_failcnt)) {
  1979. if(unlikely(!st_mem_failcnt)) {
  1980. st_mem_failcnt = rrdset_create_localhost(
  1981. "services"
  1982. , "mem_failcnt"
  1983. , NULL
  1984. , "mem"
  1985. , "services.mem_failcnt"
  1986. , "Systemd Services Memory Limit Failures"
  1987. , "failures"
  1988. , PLUGIN_CGROUPS_NAME
  1989. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  1990. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 110
  1991. , update_every
  1992. , RRDSET_TYPE_STACKED
  1993. );
  1994. }
  1995. else
  1996. rrdset_next(st_mem_failcnt);
  1997. }
  1998. if(likely(do_swap_usage)) {
  1999. if(unlikely(!st_swap_usage)) {
  2000. st_swap_usage = rrdset_create_localhost(
  2001. "services"
  2002. , "swap_usage"
  2003. , NULL
  2004. , "swap"
  2005. , "services.swap_usage"
  2006. , "Systemd Services Swap Memory Used"
  2007. , "MiB"
  2008. , PLUGIN_CGROUPS_NAME
  2009. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2010. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 100
  2011. , update_every
  2012. , RRDSET_TYPE_STACKED
  2013. );
  2014. }
  2015. else
  2016. rrdset_next(st_swap_usage);
  2017. }
  2018. if(likely(do_io)) {
  2019. if(unlikely(!st_io_read)) {
  2020. st_io_read = rrdset_create_localhost(
  2021. "services"
  2022. , "io_read"
  2023. , NULL
  2024. , "disk"
  2025. , "services.io_read"
  2026. , "Systemd Services Disk Read Bandwidth"
  2027. , "KiB/s"
  2028. , PLUGIN_CGROUPS_NAME
  2029. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2030. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 120
  2031. , update_every
  2032. , RRDSET_TYPE_STACKED
  2033. );
  2034. }
  2035. else
  2036. rrdset_next(st_io_read);
  2037. if(unlikely(!st_io_write)) {
  2038. st_io_write = rrdset_create_localhost(
  2039. "services"
  2040. , "io_write"
  2041. , NULL
  2042. , "disk"
  2043. , "services.io_write"
  2044. , "Systemd Services Disk Write Bandwidth"
  2045. , "KiB/s"
  2046. , PLUGIN_CGROUPS_NAME
  2047. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2048. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 130
  2049. , update_every
  2050. , RRDSET_TYPE_STACKED
  2051. );
  2052. }
  2053. else
  2054. rrdset_next(st_io_write);
  2055. }
  2056. if(likely(do_io_ops)) {
  2057. if(unlikely(!st_io_serviced_read)) {
  2058. st_io_serviced_read = rrdset_create_localhost(
  2059. "services"
  2060. , "io_ops_read"
  2061. , NULL
  2062. , "disk"
  2063. , "services.io_ops_read"
  2064. , "Systemd Services Disk Read Operations"
  2065. , "operations/s"
  2066. , PLUGIN_CGROUPS_NAME
  2067. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2068. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 140
  2069. , update_every
  2070. , RRDSET_TYPE_STACKED
  2071. );
  2072. }
  2073. else
  2074. rrdset_next(st_io_serviced_read);
  2075. if(unlikely(!st_io_serviced_write)) {
  2076. st_io_serviced_write = rrdset_create_localhost(
  2077. "services"
  2078. , "io_ops_write"
  2079. , NULL
  2080. , "disk"
  2081. , "services.io_ops_write"
  2082. , "Systemd Services Disk Write Operations"
  2083. , "operations/s"
  2084. , PLUGIN_CGROUPS_NAME
  2085. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2086. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 150
  2087. , update_every
  2088. , RRDSET_TYPE_STACKED
  2089. );
  2090. }
  2091. else
  2092. rrdset_next(st_io_serviced_write);
  2093. }
  2094. if(likely(do_throttle_io)) {
  2095. if(unlikely(!st_throttle_io_read)) {
  2096. st_throttle_io_read = rrdset_create_localhost(
  2097. "services"
  2098. , "throttle_io_read"
  2099. , NULL
  2100. , "disk"
  2101. , "services.throttle_io_read"
  2102. , "Systemd Services Throttle Disk Read Bandwidth"
  2103. , "KiB/s"
  2104. , PLUGIN_CGROUPS_NAME
  2105. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2106. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 160
  2107. , update_every
  2108. , RRDSET_TYPE_STACKED
  2109. );
  2110. }
  2111. else
  2112. rrdset_next(st_throttle_io_read);
  2113. if(unlikely(!st_throttle_io_write)) {
  2114. st_throttle_io_write = rrdset_create_localhost(
  2115. "services"
  2116. , "throttle_io_write"
  2117. , NULL
  2118. , "disk"
  2119. , "services.throttle_io_write"
  2120. , "Systemd Services Throttle Disk Write Bandwidth"
  2121. , "KiB/s"
  2122. , PLUGIN_CGROUPS_NAME
  2123. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2124. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 170
  2125. , update_every
  2126. , RRDSET_TYPE_STACKED
  2127. );
  2128. }
  2129. else
  2130. rrdset_next(st_throttle_io_write);
  2131. }
  2132. if(likely(do_throttle_ops)) {
  2133. if(unlikely(!st_throttle_ops_read)) {
  2134. st_throttle_ops_read = rrdset_create_localhost(
  2135. "services"
  2136. , "throttle_io_ops_read"
  2137. , NULL
  2138. , "disk"
  2139. , "services.throttle_io_ops_read"
  2140. , "Systemd Services Throttle Disk Read Operations"
  2141. , "operations/s"
  2142. , PLUGIN_CGROUPS_NAME
  2143. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2144. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 180
  2145. , update_every
  2146. , RRDSET_TYPE_STACKED
  2147. );
  2148. }
  2149. else
  2150. rrdset_next(st_throttle_ops_read);
  2151. if(unlikely(!st_throttle_ops_write)) {
  2152. st_throttle_ops_write = rrdset_create_localhost(
  2153. "services"
  2154. , "throttle_io_ops_write"
  2155. , NULL
  2156. , "disk"
  2157. , "services.throttle_io_ops_write"
  2158. , "Systemd Services Throttle Disk Write Operations"
  2159. , "operations/s"
  2160. , PLUGIN_CGROUPS_NAME
  2161. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2162. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 190
  2163. , update_every
  2164. , RRDSET_TYPE_STACKED
  2165. );
  2166. }
  2167. else
  2168. rrdset_next(st_throttle_ops_write);
  2169. }
  2170. if(likely(do_queued_ops)) {
  2171. if(unlikely(!st_queued_ops_read)) {
  2172. st_queued_ops_read = rrdset_create_localhost(
  2173. "services"
  2174. , "queued_io_ops_read"
  2175. , NULL
  2176. , "disk"
  2177. , "services.queued_io_ops_read"
  2178. , "Systemd Services Queued Disk Read Operations"
  2179. , "operations/s"
  2180. , PLUGIN_CGROUPS_NAME
  2181. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2182. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 200
  2183. , update_every
  2184. , RRDSET_TYPE_STACKED
  2185. );
  2186. }
  2187. else
  2188. rrdset_next(st_queued_ops_read);
  2189. if(unlikely(!st_queued_ops_write)) {
  2190. st_queued_ops_write = rrdset_create_localhost(
  2191. "services"
  2192. , "queued_io_ops_write"
  2193. , NULL
  2194. , "disk"
  2195. , "services.queued_io_ops_write"
  2196. , "Systemd Services Queued Disk Write Operations"
  2197. , "operations/s"
  2198. , PLUGIN_CGROUPS_NAME
  2199. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2200. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 210
  2201. , update_every
  2202. , RRDSET_TYPE_STACKED
  2203. );
  2204. }
  2205. else
  2206. rrdset_next(st_queued_ops_write);
  2207. }
  2208. if(likely(do_merged_ops)) {
  2209. if(unlikely(!st_merged_ops_read)) {
  2210. st_merged_ops_read = rrdset_create_localhost(
  2211. "services"
  2212. , "merged_io_ops_read"
  2213. , NULL
  2214. , "disk"
  2215. , "services.merged_io_ops_read"
  2216. , "Systemd Services Merged Disk Read Operations"
  2217. , "operations/s"
  2218. , PLUGIN_CGROUPS_NAME
  2219. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2220. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 220
  2221. , update_every
  2222. , RRDSET_TYPE_STACKED
  2223. );
  2224. }
  2225. else
  2226. rrdset_next(st_merged_ops_read);
  2227. if(unlikely(!st_merged_ops_write)) {
  2228. st_merged_ops_write = rrdset_create_localhost(
  2229. "services"
  2230. , "merged_io_ops_write"
  2231. , NULL
  2232. , "disk"
  2233. , "services.merged_io_ops_write"
  2234. , "Systemd Services Merged Disk Write Operations"
  2235. , "operations/s"
  2236. , PLUGIN_CGROUPS_NAME
  2237. , PLUGIN_CGROUPS_MODULE_SYSTEMD_NAME
  2238. , NETDATA_CHART_PRIO_CGROUPS_SYSTEMD + 230
  2239. , update_every
  2240. , RRDSET_TYPE_STACKED
  2241. );
  2242. }
  2243. else
  2244. rrdset_next(st_merged_ops_write);
  2245. }
  2246. // update the values
  2247. struct cgroup *cg;
  2248. for(cg = cgroup_root; cg ; cg = cg->next) {
  2249. if(unlikely(!cg->enabled || cg->pending_renames || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))
  2250. continue;
  2251. if(likely(do_cpu && cg->cpuacct_stat.updated)) {
  2252. if(unlikely(!cg->rd_cpu)){
  2253. if (!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2254. cg->rd_cpu = rrddim_add(st_cpu, cg->chart_id, cg->chart_title, 100, system_hz, RRD_ALGORITHM_INCREMENTAL);
  2255. } else {
  2256. cg->rd_cpu = rrddim_add(st_cpu, cg->chart_id, cg->chart_title, 100, 1000000, RRD_ALGORITHM_INCREMENTAL);
  2257. }
  2258. }
  2259. rrddim_set_by_pointer(st_cpu, cg->rd_cpu, cg->cpuacct_stat.user + cg->cpuacct_stat.system);
  2260. }
  2261. if(likely(do_mem_usage && cg->memory.updated_usage_in_bytes)) {
  2262. if(unlikely(!cg->rd_mem_usage))
  2263. cg->rd_mem_usage = rrddim_add(st_mem_usage, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2264. rrddim_set_by_pointer(st_mem_usage, cg->rd_mem_usage, cg->memory.usage_in_bytes);
  2265. }
  2266. if(likely(do_mem_detailed && cg->memory.updated_detailed)) {
  2267. if(unlikely(!cg->rd_mem_detailed_rss))
  2268. cg->rd_mem_detailed_rss = rrddim_add(st_mem_detailed_rss, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2269. rrddim_set_by_pointer(st_mem_detailed_rss, cg->rd_mem_detailed_rss, cg->memory.total_rss + cg->memory.total_rss_huge);
  2270. if(unlikely(!cg->rd_mem_detailed_mapped))
  2271. cg->rd_mem_detailed_mapped = rrddim_add(st_mem_detailed_mapped, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2272. rrddim_set_by_pointer(st_mem_detailed_mapped, cg->rd_mem_detailed_mapped, cg->memory.total_mapped_file);
  2273. if(unlikely(!cg->rd_mem_detailed_cache))
  2274. cg->rd_mem_detailed_cache = rrddim_add(st_mem_detailed_cache, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2275. rrddim_set_by_pointer(st_mem_detailed_cache, cg->rd_mem_detailed_cache, cg->memory.total_cache);
  2276. if(unlikely(!cg->rd_mem_detailed_writeback))
  2277. cg->rd_mem_detailed_writeback = rrddim_add(st_mem_detailed_writeback, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2278. rrddim_set_by_pointer(st_mem_detailed_writeback, cg->rd_mem_detailed_writeback, cg->memory.total_writeback);
  2279. if(unlikely(!cg->rd_mem_detailed_pgfault))
  2280. cg->rd_mem_detailed_pgfault = rrddim_add(st_mem_detailed_pgfault, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2281. rrddim_set_by_pointer(st_mem_detailed_pgfault, cg->rd_mem_detailed_pgfault, cg->memory.total_pgfault);
  2282. if(unlikely(!cg->rd_mem_detailed_pgmajfault))
  2283. cg->rd_mem_detailed_pgmajfault = rrddim_add(st_mem_detailed_pgmajfault, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2284. rrddim_set_by_pointer(st_mem_detailed_pgmajfault, cg->rd_mem_detailed_pgmajfault, cg->memory.total_pgmajfault);
  2285. if(unlikely(!cg->rd_mem_detailed_pgpgin))
  2286. cg->rd_mem_detailed_pgpgin = rrddim_add(st_mem_detailed_pgpgin, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2287. rrddim_set_by_pointer(st_mem_detailed_pgpgin, cg->rd_mem_detailed_pgpgin, cg->memory.total_pgpgin);
  2288. if(unlikely(!cg->rd_mem_detailed_pgpgout))
  2289. cg->rd_mem_detailed_pgpgout = rrddim_add(st_mem_detailed_pgpgout, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2290. rrddim_set_by_pointer(st_mem_detailed_pgpgout, cg->rd_mem_detailed_pgpgout, cg->memory.total_pgpgout);
  2291. }
  2292. if(likely(do_mem_failcnt && cg->memory.updated_failcnt)) {
  2293. if(unlikely(!cg->rd_mem_failcnt))
  2294. cg->rd_mem_failcnt = rrddim_add(st_mem_failcnt, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2295. rrddim_set_by_pointer(st_mem_failcnt, cg->rd_mem_failcnt, cg->memory.failcnt);
  2296. }
  2297. if(likely(do_swap_usage && cg->memory.updated_msw_usage_in_bytes)) {
  2298. if(unlikely(!cg->rd_swap_usage))
  2299. cg->rd_swap_usage = rrddim_add(st_swap_usage, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2300. rrddim_set_by_pointer(st_swap_usage, cg->rd_swap_usage, cg->memory.msw_usage_in_bytes);
  2301. }
  2302. if(likely(do_io && cg->io_service_bytes.updated)) {
  2303. if(unlikely(!cg->rd_io_service_bytes_read))
  2304. cg->rd_io_service_bytes_read = rrddim_add(st_io_read, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  2305. rrddim_set_by_pointer(st_io_read, cg->rd_io_service_bytes_read, cg->io_service_bytes.Read);
  2306. if(unlikely(!cg->rd_io_service_bytes_write))
  2307. cg->rd_io_service_bytes_write = rrddim_add(st_io_write, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  2308. rrddim_set_by_pointer(st_io_write, cg->rd_io_service_bytes_write, cg->io_service_bytes.Write);
  2309. }
  2310. if(likely(do_io_ops && cg->io_serviced.updated)) {
  2311. if(unlikely(!cg->rd_io_serviced_read))
  2312. cg->rd_io_serviced_read = rrddim_add(st_io_serviced_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2313. rrddim_set_by_pointer(st_io_serviced_read, cg->rd_io_serviced_read, cg->io_serviced.Read);
  2314. if(unlikely(!cg->rd_io_serviced_write))
  2315. cg->rd_io_serviced_write = rrddim_add(st_io_serviced_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2316. rrddim_set_by_pointer(st_io_serviced_write, cg->rd_io_serviced_write, cg->io_serviced.Write);
  2317. }
  2318. if(likely(do_throttle_io && cg->throttle_io_service_bytes.updated)) {
  2319. if(unlikely(!cg->rd_throttle_io_read))
  2320. cg->rd_throttle_io_read = rrddim_add(st_throttle_io_read, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  2321. rrddim_set_by_pointer(st_throttle_io_read, cg->rd_throttle_io_read, cg->throttle_io_service_bytes.Read);
  2322. if(unlikely(!cg->rd_throttle_io_write))
  2323. cg->rd_throttle_io_write = rrddim_add(st_throttle_io_write, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  2324. rrddim_set_by_pointer(st_throttle_io_write, cg->rd_throttle_io_write, cg->throttle_io_service_bytes.Write);
  2325. }
  2326. if(likely(do_throttle_ops && cg->throttle_io_serviced.updated)) {
  2327. if(unlikely(!cg->rd_throttle_io_serviced_read))
  2328. cg->rd_throttle_io_serviced_read = rrddim_add(st_throttle_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2329. rrddim_set_by_pointer(st_throttle_ops_read, cg->rd_throttle_io_serviced_read, cg->throttle_io_serviced.Read);
  2330. if(unlikely(!cg->rd_throttle_io_serviced_write))
  2331. cg->rd_throttle_io_serviced_write = rrddim_add(st_throttle_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2332. rrddim_set_by_pointer(st_throttle_ops_write, cg->rd_throttle_io_serviced_write, cg->throttle_io_serviced.Write);
  2333. }
  2334. if(likely(do_queued_ops && cg->io_queued.updated)) {
  2335. if(unlikely(!cg->rd_io_queued_read))
  2336. cg->rd_io_queued_read = rrddim_add(st_queued_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2337. rrddim_set_by_pointer(st_queued_ops_read, cg->rd_io_queued_read, cg->io_queued.Read);
  2338. if(unlikely(!cg->rd_io_queued_write))
  2339. cg->rd_io_queued_write = rrddim_add(st_queued_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2340. rrddim_set_by_pointer(st_queued_ops_write, cg->rd_io_queued_write, cg->io_queued.Write);
  2341. }
  2342. if(likely(do_merged_ops && cg->io_merged.updated)) {
  2343. if(unlikely(!cg->rd_io_merged_read))
  2344. cg->rd_io_merged_read = rrddim_add(st_merged_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2345. rrddim_set_by_pointer(st_merged_ops_read, cg->rd_io_merged_read, cg->io_merged.Read);
  2346. if(unlikely(!cg->rd_io_merged_write))
  2347. cg->rd_io_merged_write = rrddim_add(st_merged_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2348. rrddim_set_by_pointer(st_merged_ops_write, cg->rd_io_merged_write, cg->io_merged.Write);
  2349. }
  2350. }
  2351. // complete the iteration
  2352. if(likely(do_cpu))
  2353. rrdset_done(st_cpu);
  2354. if(likely(do_mem_usage))
  2355. rrdset_done(st_mem_usage);
  2356. if(unlikely(do_mem_detailed)) {
  2357. rrdset_done(st_mem_detailed_cache);
  2358. rrdset_done(st_mem_detailed_rss);
  2359. rrdset_done(st_mem_detailed_mapped);
  2360. rrdset_done(st_mem_detailed_writeback);
  2361. rrdset_done(st_mem_detailed_pgfault);
  2362. rrdset_done(st_mem_detailed_pgmajfault);
  2363. rrdset_done(st_mem_detailed_pgpgin);
  2364. rrdset_done(st_mem_detailed_pgpgout);
  2365. }
  2366. if(likely(do_mem_failcnt))
  2367. rrdset_done(st_mem_failcnt);
  2368. if(likely(do_swap_usage))
  2369. rrdset_done(st_swap_usage);
  2370. if(likely(do_io)) {
  2371. rrdset_done(st_io_read);
  2372. rrdset_done(st_io_write);
  2373. }
  2374. if(likely(do_io_ops)) {
  2375. rrdset_done(st_io_serviced_read);
  2376. rrdset_done(st_io_serviced_write);
  2377. }
  2378. if(likely(do_throttle_io)) {
  2379. rrdset_done(st_throttle_io_read);
  2380. rrdset_done(st_throttle_io_write);
  2381. }
  2382. if(likely(do_throttle_ops)) {
  2383. rrdset_done(st_throttle_ops_read);
  2384. rrdset_done(st_throttle_ops_write);
  2385. }
  2386. if(likely(do_queued_ops)) {
  2387. rrdset_done(st_queued_ops_read);
  2388. rrdset_done(st_queued_ops_write);
  2389. }
  2390. if(likely(do_merged_ops)) {
  2391. rrdset_done(st_merged_ops_read);
  2392. rrdset_done(st_merged_ops_write);
  2393. }
  2394. }
  2395. static inline char *cgroup_chart_type(char *buffer, const char *id, size_t len) {
  2396. if(buffer[0]) return buffer;
  2397. if(id[0] == '\0' || (id[0] == '/' && id[1] == '\0'))
  2398. strncpy(buffer, "cgroup_root", len);
  2399. else
  2400. snprintfz(buffer, len, "cgroup_%s", id);
  2401. netdata_fix_chart_id(buffer);
  2402. return buffer;
  2403. }
  2404. static inline unsigned long long cpuset_str2ull(char **s) {
  2405. unsigned long long n = 0;
  2406. char c;
  2407. for(c = **s; c >= '0' && c <= '9' ; c = *(++*s)) {
  2408. n *= 10;
  2409. n += c - '0';
  2410. }
  2411. return n;
  2412. }
  2413. static inline void update_cpu_limits(char **filename, unsigned long long *value, struct cgroup *cg) {
  2414. if(*filename) {
  2415. int ret = -1;
  2416. if(value == &cg->cpuset_cpus) {
  2417. static char *buf = NULL;
  2418. static size_t buf_size = 0;
  2419. if(!buf) {
  2420. buf_size = 100U + 6 * get_system_cpus(); // taken from kernel/cgroup/cpuset.c
  2421. buf = mallocz(buf_size + 1);
  2422. }
  2423. ret = read_file(*filename, buf, buf_size);
  2424. if(!ret) {
  2425. char *s = buf;
  2426. unsigned long long ncpus = 0;
  2427. // parse the cpuset string and calculate the number of cpus the cgroup is allowed to use
  2428. while(*s) {
  2429. unsigned long long n = cpuset_str2ull(&s);
  2430. ncpus++;
  2431. if(*s == ',') {
  2432. s++;
  2433. continue;
  2434. }
  2435. if(*s == '-') {
  2436. s++;
  2437. unsigned long long m = cpuset_str2ull(&s);
  2438. ncpus += m - n; // calculate the number of cpus in the region
  2439. }
  2440. s++;
  2441. }
  2442. if(likely(ncpus)) *value = ncpus;
  2443. }
  2444. }
  2445. else if(value == &cg->cpu_cfs_period) {
  2446. ret = read_single_number_file(*filename, value);
  2447. }
  2448. else if(value == &cg->cpu_cfs_quota) {
  2449. ret = read_single_number_file(*filename, value);
  2450. }
  2451. else ret = -1;
  2452. if(ret) {
  2453. error("Cannot refresh cgroup %s cpu limit by reading '%s'. Will not update its limit anymore.", cg->id, *filename);
  2454. freez(*filename);
  2455. *filename = NULL;
  2456. }
  2457. }
  2458. }
  2459. static inline void update_cpu_limits2(struct cgroup *cg) {
  2460. if(cg->filename_cpu_cfs_quota){
  2461. static procfile *ff = NULL;
  2462. ff = procfile_reopen(ff, cg->filename_cpu_cfs_quota, NULL, PROCFILE_FLAG_DEFAULT);
  2463. if(unlikely(!ff)) {
  2464. goto cpu_limits2_err;
  2465. }
  2466. ff = procfile_readall(ff);
  2467. if(unlikely(!ff)) {
  2468. goto cpu_limits2_err;
  2469. }
  2470. unsigned long lines = procfile_lines(ff);
  2471. if (unlikely(lines < 1)) {
  2472. error("CGROUP: file '%s' should have 1 lines.", cg->filename_cpu_cfs_quota);
  2473. return;
  2474. }
  2475. cg->cpu_cfs_period = str2ull(procfile_lineword(ff, 0, 1));
  2476. cg->cpuset_cpus = get_system_cpus();
  2477. char *s = "max\n\0";
  2478. if(strsame(s, procfile_lineword(ff, 0, 0)) == 0){
  2479. cg->cpu_cfs_quota = cg->cpu_cfs_period * cg->cpuset_cpus;
  2480. } else {
  2481. cg->cpu_cfs_quota = str2ull(procfile_lineword(ff, 0, 0));
  2482. }
  2483. debug(D_CGROUP, "CPU limits values: %llu %llu %llu", cg->cpu_cfs_period, cg->cpuset_cpus, cg->cpu_cfs_quota);
  2484. return;
  2485. cpu_limits2_err:
  2486. error("Cannot refresh cgroup %s cpu limit by reading '%s'. Will not update its limit anymore.", cg->id, cg->filename_cpu_cfs_quota);
  2487. freez(cg->filename_cpu_cfs_quota);
  2488. cg->filename_cpu_cfs_quota = NULL;
  2489. }
  2490. }
  2491. static inline int update_memory_limits(char **filename, RRDSETVAR **chart_var, unsigned long long *value, const char *chart_var_name, struct cgroup *cg) {
  2492. if(*filename) {
  2493. if(unlikely(!*chart_var)) {
  2494. *chart_var = rrdsetvar_custom_chart_variable_create(cg->st_mem_usage, chart_var_name);
  2495. if(!*chart_var) {
  2496. error("Cannot create cgroup %s chart variable '%s'. Will not update its limit anymore.", cg->id, chart_var_name);
  2497. freez(*filename);
  2498. *filename = NULL;
  2499. }
  2500. }
  2501. if(*filename && *chart_var) {
  2502. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2503. if(read_single_number_file(*filename, value)) {
  2504. error("Cannot refresh cgroup %s memory limit by reading '%s'. Will not update its limit anymore.", cg->id, *filename);
  2505. freez(*filename);
  2506. *filename = NULL;
  2507. }
  2508. else {
  2509. rrdsetvar_custom_chart_variable_set(*chart_var, (calculated_number)(*value / (1024 * 1024)));
  2510. return 1;
  2511. }
  2512. } else {
  2513. char buffer[30 + 1];
  2514. int ret = read_file(*filename, buffer, 30);
  2515. if(ret) {
  2516. error("Cannot refresh cgroup %s memory limit by reading '%s'. Will not update its limit anymore.", cg->id, *filename);
  2517. freez(*filename);
  2518. *filename = NULL;
  2519. return 0;
  2520. }
  2521. char *s = "max\n\0";
  2522. if(strsame(s, buffer) == 0){
  2523. *value = UINT64_MAX;
  2524. rrdsetvar_custom_chart_variable_set(*chart_var, (calculated_number)(*value / (1024 * 1024)));
  2525. return 1;
  2526. }
  2527. *value = str2ull(buffer);
  2528. rrdsetvar_custom_chart_variable_set(*chart_var, (calculated_number)(*value / (1024 * 1024)));
  2529. return 1;
  2530. }
  2531. }
  2532. }
  2533. return 0;
  2534. }
  2535. void update_cgroup_charts(int update_every) {
  2536. debug(D_CGROUP, "updating cgroups charts");
  2537. char type[RRD_ID_LENGTH_MAX + 1];
  2538. char title[CHART_TITLE_MAX + 1];
  2539. int services_do_cpu = 0,
  2540. services_do_mem_usage = 0,
  2541. services_do_mem_detailed = 0,
  2542. services_do_mem_failcnt = 0,
  2543. services_do_swap_usage = 0,
  2544. services_do_io = 0,
  2545. services_do_io_ops = 0,
  2546. services_do_throttle_io = 0,
  2547. services_do_throttle_ops = 0,
  2548. services_do_queued_ops = 0,
  2549. services_do_merged_ops = 0;
  2550. struct cgroup *cg;
  2551. for(cg = cgroup_root; cg ; cg = cg->next) {
  2552. if(unlikely(!cg->enabled || cg->pending_renames))
  2553. continue;
  2554. if(likely(cgroup_enable_systemd_services && cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)) {
  2555. if(cg->cpuacct_stat.updated && cg->cpuacct_stat.enabled == CONFIG_BOOLEAN_YES) services_do_cpu++;
  2556. if(cgroup_enable_systemd_services_detailed_memory && cg->memory.updated_detailed && cg->memory.enabled_detailed) services_do_mem_detailed++;
  2557. if(cg->memory.updated_usage_in_bytes && cg->memory.enabled_usage_in_bytes == CONFIG_BOOLEAN_YES) services_do_mem_usage++;
  2558. if(cg->memory.updated_failcnt && cg->memory.enabled_failcnt == CONFIG_BOOLEAN_YES) services_do_mem_failcnt++;
  2559. if(cg->memory.updated_msw_usage_in_bytes && cg->memory.enabled_msw_usage_in_bytes == CONFIG_BOOLEAN_YES) services_do_swap_usage++;
  2560. if(cg->io_service_bytes.updated && cg->io_service_bytes.enabled == CONFIG_BOOLEAN_YES) services_do_io++;
  2561. if(cg->io_serviced.updated && cg->io_serviced.enabled == CONFIG_BOOLEAN_YES) services_do_io_ops++;
  2562. if(cg->throttle_io_service_bytes.updated && cg->throttle_io_service_bytes.enabled == CONFIG_BOOLEAN_YES) services_do_throttle_io++;
  2563. if(cg->throttle_io_serviced.updated && cg->throttle_io_serviced.enabled == CONFIG_BOOLEAN_YES) services_do_throttle_ops++;
  2564. if(cg->io_queued.updated && cg->io_queued.enabled == CONFIG_BOOLEAN_YES) services_do_queued_ops++;
  2565. if(cg->io_merged.updated && cg->io_merged.enabled == CONFIG_BOOLEAN_YES) services_do_merged_ops++;
  2566. continue;
  2567. }
  2568. type[0] = '\0';
  2569. if(likely(cg->cpuacct_stat.updated && cg->cpuacct_stat.enabled == CONFIG_BOOLEAN_YES)) {
  2570. if(unlikely(!cg->st_cpu)) {
  2571. snprintfz(title, CHART_TITLE_MAX, "CPU Usage (100%% = 1 core)");
  2572. cg->st_cpu = rrdset_create_localhost(
  2573. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2574. , "cpu"
  2575. , NULL
  2576. , "cpu"
  2577. , "cgroup.cpu"
  2578. , title
  2579. , "percentage"
  2580. , PLUGIN_CGROUPS_NAME
  2581. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2582. , cgroup_containers_chart_priority
  2583. , update_every
  2584. , RRDSET_TYPE_STACKED
  2585. );
  2586. rrdset_update_labels(cg->st_cpu, cg->chart_labels);
  2587. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2588. rrddim_add(cg->st_cpu, "user", NULL, 100, system_hz, RRD_ALGORITHM_INCREMENTAL);
  2589. rrddim_add(cg->st_cpu, "system", NULL, 100, system_hz, RRD_ALGORITHM_INCREMENTAL);
  2590. }
  2591. else {
  2592. rrddim_add(cg->st_cpu, "user", NULL, 100, 1000000, RRD_ALGORITHM_INCREMENTAL);
  2593. rrddim_add(cg->st_cpu, "system", NULL, 100, 1000000, RRD_ALGORITHM_INCREMENTAL);
  2594. }
  2595. }
  2596. else
  2597. rrdset_next(cg->st_cpu);
  2598. rrddim_set(cg->st_cpu, "user", cg->cpuacct_stat.user);
  2599. rrddim_set(cg->st_cpu, "system", cg->cpuacct_stat.system);
  2600. rrdset_done(cg->st_cpu);
  2601. if(likely(cg->filename_cpuset_cpus || cg->filename_cpu_cfs_period || cg->filename_cpu_cfs_quota)) {
  2602. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2603. update_cpu_limits(&cg->filename_cpuset_cpus, &cg->cpuset_cpus, cg);
  2604. update_cpu_limits(&cg->filename_cpu_cfs_period, &cg->cpu_cfs_period, cg);
  2605. update_cpu_limits(&cg->filename_cpu_cfs_quota, &cg->cpu_cfs_quota, cg);
  2606. } else {
  2607. update_cpu_limits2(cg);
  2608. }
  2609. if(unlikely(!cg->chart_var_cpu_limit)) {
  2610. cg->chart_var_cpu_limit = rrdsetvar_custom_chart_variable_create(cg->st_cpu, "cpu_limit");
  2611. if(!cg->chart_var_cpu_limit) {
  2612. error("Cannot create cgroup %s chart variable 'cpu_limit'. Will not update its limit anymore.", cg->id);
  2613. if(cg->filename_cpuset_cpus) freez(cg->filename_cpuset_cpus);
  2614. cg->filename_cpuset_cpus = NULL;
  2615. if(cg->filename_cpu_cfs_period) freez(cg->filename_cpu_cfs_period);
  2616. cg->filename_cpu_cfs_period = NULL;
  2617. if(cg->filename_cpu_cfs_quota) freez(cg->filename_cpu_cfs_quota);
  2618. cg->filename_cpu_cfs_quota = NULL;
  2619. }
  2620. }
  2621. else {
  2622. calculated_number value = 0, quota = 0;
  2623. if(likely( ((!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) && (cg->filename_cpuset_cpus || (cg->filename_cpu_cfs_period && cg->filename_cpu_cfs_quota)))
  2624. || ((cg->options & CGROUP_OPTIONS_IS_UNIFIED) && cg->filename_cpu_cfs_quota))) {
  2625. if(unlikely(cg->cpu_cfs_quota > 0))
  2626. quota = (calculated_number)cg->cpu_cfs_quota / (calculated_number)cg->cpu_cfs_period;
  2627. if(unlikely(quota > 0 && quota < cg->cpuset_cpus))
  2628. value = quota * 100;
  2629. else
  2630. value = (calculated_number)cg->cpuset_cpus * 100;
  2631. }
  2632. if(likely(value)) {
  2633. rrdsetvar_custom_chart_variable_set(cg->chart_var_cpu_limit, value);
  2634. if(unlikely(!cg->st_cpu_limit)) {
  2635. snprintfz(title, CHART_TITLE_MAX, "CPU Usage within the limits");
  2636. cg->st_cpu_limit = rrdset_create_localhost(
  2637. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2638. , "cpu_limit"
  2639. , NULL
  2640. , "cpu"
  2641. , "cgroup.cpu_limit"
  2642. , title
  2643. , "percentage"
  2644. , PLUGIN_CGROUPS_NAME
  2645. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2646. , cgroup_containers_chart_priority - 1
  2647. , update_every
  2648. , RRDSET_TYPE_LINE
  2649. );
  2650. rrdset_update_labels(cg->st_cpu_limit, cg->chart_labels);
  2651. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED))
  2652. rrddim_add(cg->st_cpu_limit, "used", NULL, 1, system_hz, RRD_ALGORITHM_ABSOLUTE);
  2653. else
  2654. rrddim_add(cg->st_cpu_limit, "used", NULL, 1, 1000000, RRD_ALGORITHM_ABSOLUTE);
  2655. }
  2656. else
  2657. rrdset_next(cg->st_cpu_limit);
  2658. calculated_number cpu_usage = 0;
  2659. cpu_usage = (calculated_number)(cg->cpuacct_stat.user + cg->cpuacct_stat.system) * 100;
  2660. calculated_number cpu_used = 100 * (cpu_usage - cg->prev_cpu_usage) / (value * update_every);
  2661. rrdset_isnot_obsolete(cg->st_cpu_limit);
  2662. rrddim_set(cg->st_cpu_limit, "used", (cpu_used > 0)?cpu_used:0);
  2663. cg->prev_cpu_usage = cpu_usage;
  2664. rrdset_done(cg->st_cpu_limit);
  2665. }
  2666. else {
  2667. rrdsetvar_custom_chart_variable_set(cg->chart_var_cpu_limit, NAN);
  2668. if(unlikely(cg->st_cpu_limit)) {
  2669. rrdset_is_obsolete(cg->st_cpu_limit);
  2670. cg->st_cpu_limit = NULL;
  2671. }
  2672. }
  2673. }
  2674. }
  2675. }
  2676. if(likely(cg->cpuacct_usage.updated && cg->cpuacct_usage.enabled == CONFIG_BOOLEAN_YES)) {
  2677. char id[RRD_ID_LENGTH_MAX + 1];
  2678. unsigned int i;
  2679. if(unlikely(!cg->st_cpu_per_core)) {
  2680. snprintfz(title, CHART_TITLE_MAX, "CPU Usage (100%% = 1 core) Per Core");
  2681. cg->st_cpu_per_core = rrdset_create_localhost(
  2682. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2683. , "cpu_per_core"
  2684. , NULL
  2685. , "cpu"
  2686. , "cgroup.cpu_per_core"
  2687. , title
  2688. , "percentage"
  2689. , PLUGIN_CGROUPS_NAME
  2690. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2691. , cgroup_containers_chart_priority + 100
  2692. , update_every
  2693. , RRDSET_TYPE_STACKED
  2694. );
  2695. rrdset_update_labels(cg->st_cpu_per_core, cg->chart_labels);
  2696. for(i = 0; i < cg->cpuacct_usage.cpus; i++) {
  2697. snprintfz(id, RRD_ID_LENGTH_MAX, "cpu%u", i);
  2698. rrddim_add(cg->st_cpu_per_core, id, NULL, 100, 1000000000, RRD_ALGORITHM_INCREMENTAL);
  2699. }
  2700. }
  2701. else
  2702. rrdset_next(cg->st_cpu_per_core);
  2703. for(i = 0; i < cg->cpuacct_usage.cpus ;i++) {
  2704. snprintfz(id, RRD_ID_LENGTH_MAX, "cpu%u", i);
  2705. rrddim_set(cg->st_cpu_per_core, id, cg->cpuacct_usage.cpu_percpu[i]);
  2706. }
  2707. rrdset_done(cg->st_cpu_per_core);
  2708. }
  2709. if(likely(cg->memory.updated_detailed && cg->memory.enabled_detailed == CONFIG_BOOLEAN_YES)) {
  2710. if(unlikely(!cg->st_mem)) {
  2711. snprintfz(title, CHART_TITLE_MAX, "Memory Usage");
  2712. cg->st_mem = rrdset_create_localhost(
  2713. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2714. , "mem"
  2715. , NULL
  2716. , "mem"
  2717. , "cgroup.mem"
  2718. , title
  2719. , "MiB"
  2720. , PLUGIN_CGROUPS_NAME
  2721. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2722. , cgroup_containers_chart_priority + 220
  2723. , update_every
  2724. , RRDSET_TYPE_STACKED
  2725. );
  2726. rrdset_update_labels(cg->st_mem, cg->chart_labels);
  2727. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2728. rrddim_add(cg->st_mem, "cache", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2729. rrddim_add(cg->st_mem, "rss", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2730. if(cg->memory.detailed_has_swap)
  2731. rrddim_add(cg->st_mem, "swap", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2732. rrddim_add(cg->st_mem, "rss_huge", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2733. rrddim_add(cg->st_mem, "mapped_file", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2734. } else {
  2735. rrddim_add(cg->st_mem, "anon", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2736. rrddim_add(cg->st_mem, "kernel_stack", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2737. rrddim_add(cg->st_mem, "slab", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2738. rrddim_add(cg->st_mem, "sock", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2739. rrddim_add(cg->st_mem, "anon_thp", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2740. rrddim_add(cg->st_mem, "file", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2741. }
  2742. }
  2743. else
  2744. rrdset_next(cg->st_mem);
  2745. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2746. rrddim_set(cg->st_mem, "cache", cg->memory.total_cache);
  2747. rrddim_set(cg->st_mem, "rss", (cg->memory.total_rss > cg->memory.total_rss_huge)?(cg->memory.total_rss - cg->memory.total_rss_huge):0);
  2748. if(cg->memory.detailed_has_swap)
  2749. rrddim_set(cg->st_mem, "swap", cg->memory.total_swap);
  2750. rrddim_set(cg->st_mem, "rss_huge", cg->memory.total_rss_huge);
  2751. rrddim_set(cg->st_mem, "mapped_file", cg->memory.total_mapped_file);
  2752. } else {
  2753. rrddim_set(cg->st_mem, "anon", cg->memory.anon);
  2754. rrddim_set(cg->st_mem, "kernel_stack", cg->memory.kernel_stack);
  2755. rrddim_set(cg->st_mem, "slab", cg->memory.slab);
  2756. rrddim_set(cg->st_mem, "sock", cg->memory.sock);
  2757. rrddim_set(cg->st_mem, "anon_thp", cg->memory.anon_thp);
  2758. rrddim_set(cg->st_mem, "file", cg->memory.total_mapped_file);
  2759. }
  2760. rrdset_done(cg->st_mem);
  2761. if(unlikely(!cg->st_writeback)) {
  2762. snprintfz(title, CHART_TITLE_MAX, "Writeback Memory");
  2763. cg->st_writeback = rrdset_create_localhost(
  2764. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2765. , "writeback"
  2766. , NULL
  2767. , "mem"
  2768. , "cgroup.writeback"
  2769. , title
  2770. , "MiB"
  2771. , PLUGIN_CGROUPS_NAME
  2772. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2773. , cgroup_containers_chart_priority + 300
  2774. , update_every
  2775. , RRDSET_TYPE_AREA
  2776. );
  2777. rrdset_update_labels(cg->st_writeback, cg->chart_labels);
  2778. if(cg->memory.detailed_has_dirty)
  2779. rrddim_add(cg->st_writeback, "dirty", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2780. rrddim_add(cg->st_writeback, "writeback", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2781. }
  2782. else
  2783. rrdset_next(cg->st_writeback);
  2784. if(cg->memory.detailed_has_dirty)
  2785. rrddim_set(cg->st_writeback, "dirty", cg->memory.total_dirty);
  2786. rrddim_set(cg->st_writeback, "writeback", cg->memory.total_writeback);
  2787. rrdset_done(cg->st_writeback);
  2788. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2789. if(unlikely(!cg->st_mem_activity)) {
  2790. snprintfz(title, CHART_TITLE_MAX, "Memory Activity");
  2791. cg->st_mem_activity = rrdset_create_localhost(
  2792. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2793. , "mem_activity"
  2794. , NULL
  2795. , "mem"
  2796. , "cgroup.mem_activity"
  2797. , title
  2798. , "MiB/s"
  2799. , PLUGIN_CGROUPS_NAME
  2800. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2801. , cgroup_containers_chart_priority + 400
  2802. , update_every
  2803. , RRDSET_TYPE_LINE
  2804. );
  2805. rrdset_update_labels(cg->st_mem_activity, cg->chart_labels);
  2806. rrddim_add(cg->st_mem_activity, "pgpgin", "in", system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2807. rrddim_add(cg->st_mem_activity, "pgpgout", "out", -system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2808. }
  2809. else
  2810. rrdset_next(cg->st_mem_activity);
  2811. rrddim_set(cg->st_mem_activity, "pgpgin", cg->memory.total_pgpgin);
  2812. rrddim_set(cg->st_mem_activity, "pgpgout", cg->memory.total_pgpgout);
  2813. rrdset_done(cg->st_mem_activity);
  2814. }
  2815. if(unlikely(!cg->st_pgfaults)) {
  2816. snprintfz(title, CHART_TITLE_MAX, "Memory Page Faults");
  2817. cg->st_pgfaults = rrdset_create_localhost(
  2818. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2819. , "pgfaults"
  2820. , NULL
  2821. , "mem"
  2822. , "cgroup.pgfaults"
  2823. , title
  2824. , "MiB/s"
  2825. , PLUGIN_CGROUPS_NAME
  2826. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2827. , cgroup_containers_chart_priority + 500
  2828. , update_every
  2829. , RRDSET_TYPE_LINE
  2830. );
  2831. rrdset_update_labels(cg->st_pgfaults, cg->chart_labels);
  2832. rrddim_add(cg->st_pgfaults, "pgfault", NULL, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2833. rrddim_add(cg->st_pgfaults, "pgmajfault", "swap", -system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
  2834. }
  2835. else
  2836. rrdset_next(cg->st_pgfaults);
  2837. rrddim_set(cg->st_pgfaults, "pgfault", cg->memory.total_pgfault);
  2838. rrddim_set(cg->st_pgfaults, "pgmajfault", cg->memory.total_pgmajfault);
  2839. rrdset_done(cg->st_pgfaults);
  2840. }
  2841. if(likely(cg->memory.updated_usage_in_bytes && cg->memory.enabled_usage_in_bytes == CONFIG_BOOLEAN_YES)) {
  2842. if(unlikely(!cg->st_mem_usage)) {
  2843. snprintfz(title, CHART_TITLE_MAX, "Used Memory");
  2844. cg->st_mem_usage = rrdset_create_localhost(
  2845. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2846. , "mem_usage"
  2847. , NULL
  2848. , "mem"
  2849. , "cgroup.mem_usage"
  2850. , title
  2851. , "MiB"
  2852. , PLUGIN_CGROUPS_NAME
  2853. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2854. , cgroup_containers_chart_priority + 210
  2855. , update_every
  2856. , RRDSET_TYPE_STACKED
  2857. );
  2858. rrdset_update_labels(cg->st_mem_usage, cg->chart_labels);
  2859. rrddim_add(cg->st_mem_usage, "ram", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2860. rrddim_add(cg->st_mem_usage, "swap", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2861. }
  2862. else
  2863. rrdset_next(cg->st_mem_usage);
  2864. rrddim_set(cg->st_mem_usage, "ram", cg->memory.usage_in_bytes);
  2865. if(!(cg->options & CGROUP_OPTIONS_IS_UNIFIED)) {
  2866. rrddim_set(
  2867. cg->st_mem_usage,
  2868. "swap",
  2869. (cg->memory.msw_usage_in_bytes > cg->memory.usage_in_bytes) ?
  2870. cg->memory.msw_usage_in_bytes - cg->memory.usage_in_bytes : 0);
  2871. } else {
  2872. rrddim_set(cg->st_mem_usage, "swap", cg->memory.msw_usage_in_bytes);
  2873. }
  2874. rrdset_done(cg->st_mem_usage);
  2875. if (likely(update_memory_limits(&cg->filename_memory_limit, &cg->chart_var_memory_limit, &cg->memory_limit, "memory_limit", cg))) {
  2876. static unsigned long long ram_total = 0;
  2877. if(unlikely(!ram_total)) {
  2878. procfile *ff = NULL;
  2879. char filename[FILENAME_MAX + 1];
  2880. snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, "/proc/meminfo");
  2881. ff = procfile_open(config_get("plugin:cgroups", "meminfo filename to monitor", filename), " \t:", PROCFILE_FLAG_DEFAULT);
  2882. if(likely(ff))
  2883. ff = procfile_readall(ff);
  2884. if(likely(ff && procfile_lines(ff) && !strncmp(procfile_word(ff, 0), "MemTotal", 8)))
  2885. ram_total = str2ull(procfile_word(ff, 1)) * 1024;
  2886. else {
  2887. error("Cannot read file %s. Will not update cgroup %s RAM limit anymore.", filename, cg->id);
  2888. freez(cg->filename_memory_limit);
  2889. cg->filename_memory_limit = NULL;
  2890. }
  2891. procfile_close(ff);
  2892. }
  2893. if(likely(ram_total)) {
  2894. unsigned long long memory_limit = ram_total;
  2895. if(unlikely(cg->memory_limit < ram_total))
  2896. memory_limit = cg->memory_limit;
  2897. if(unlikely(!cg->st_mem_usage_limit)) {
  2898. snprintfz(title, CHART_TITLE_MAX, "Used RAM within the limits");
  2899. cg->st_mem_usage_limit = rrdset_create_localhost(
  2900. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2901. , "mem_usage_limit"
  2902. , NULL
  2903. , "mem"
  2904. , "cgroup.mem_usage_limit"
  2905. , title
  2906. , "MiB"
  2907. , PLUGIN_CGROUPS_NAME
  2908. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2909. , cgroup_containers_chart_priority + 200
  2910. , update_every
  2911. , RRDSET_TYPE_STACKED
  2912. );
  2913. rrdset_update_labels(cg->st_mem_usage_limit, cg->chart_labels);
  2914. rrddim_add(cg->st_mem_usage_limit, "available", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2915. rrddim_add(cg->st_mem_usage_limit, "used", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
  2916. }
  2917. else
  2918. rrdset_next(cg->st_mem_usage_limit);
  2919. rrdset_isnot_obsolete(cg->st_mem_usage_limit);
  2920. rrddim_set(cg->st_mem_usage_limit, "available", memory_limit - cg->memory.usage_in_bytes);
  2921. rrddim_set(cg->st_mem_usage_limit, "used", cg->memory.usage_in_bytes);
  2922. rrdset_done(cg->st_mem_usage_limit);
  2923. if (unlikely(!cg->st_mem_utilization)) {
  2924. snprintfz(title, CHART_TITLE_MAX, "Memory Utilization");
  2925. cg->st_mem_utilization = rrdset_create_localhost(
  2926. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2927. , "mem_utilization"
  2928. , NULL
  2929. , "mem"
  2930. , "cgroup.mem_utilization"
  2931. , title
  2932. , "percentage"
  2933. , PLUGIN_CGROUPS_NAME
  2934. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2935. , cgroup_containers_chart_priority + 199
  2936. , update_every
  2937. , RRDSET_TYPE_AREA
  2938. );
  2939. rrdset_update_labels(cg->st_mem_utilization, cg->chart_labels);
  2940. rrddim_add(cg->st_mem_utilization, "utilization", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2941. } else
  2942. rrdset_next(cg->st_mem_utilization);
  2943. if (memory_limit) {
  2944. rrdset_isnot_obsolete(cg->st_mem_utilization);
  2945. rrddim_set(
  2946. cg->st_mem_utilization, "utilization", cg->memory.usage_in_bytes * 100 / memory_limit);
  2947. rrdset_done(cg->st_mem_utilization);
  2948. }
  2949. }
  2950. }
  2951. else {
  2952. if(unlikely(cg->st_mem_usage_limit)) {
  2953. rrdset_is_obsolete(cg->st_mem_usage_limit);
  2954. cg->st_mem_usage_limit = NULL;
  2955. }
  2956. if(unlikely(cg->st_mem_utilization)) {
  2957. rrdset_is_obsolete(cg->st_mem_utilization);
  2958. cg->st_mem_utilization = NULL;
  2959. }
  2960. }
  2961. update_memory_limits(&cg->filename_memoryswap_limit, &cg->chart_var_memoryswap_limit, &cg->memoryswap_limit, "memory_and_swap_limit", cg);
  2962. }
  2963. if(likely(cg->memory.updated_failcnt && cg->memory.enabled_failcnt == CONFIG_BOOLEAN_YES)) {
  2964. if(unlikely(!cg->st_mem_failcnt)) {
  2965. snprintfz(title, CHART_TITLE_MAX, "Memory Limit Failures");
  2966. cg->st_mem_failcnt = rrdset_create_localhost(
  2967. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2968. , "mem_failcnt"
  2969. , NULL
  2970. , "mem"
  2971. , "cgroup.mem_failcnt"
  2972. , title
  2973. , "count"
  2974. , PLUGIN_CGROUPS_NAME
  2975. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  2976. , cgroup_containers_chart_priority + 250
  2977. , update_every
  2978. , RRDSET_TYPE_LINE
  2979. );
  2980. rrdset_update_labels(cg->st_mem_failcnt, cg->chart_labels);
  2981. rrddim_add(cg->st_mem_failcnt, "failures", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2982. }
  2983. else
  2984. rrdset_next(cg->st_mem_failcnt);
  2985. rrddim_set(cg->st_mem_failcnt, "failures", cg->memory.failcnt);
  2986. rrdset_done(cg->st_mem_failcnt);
  2987. }
  2988. if(likely(cg->io_service_bytes.updated && cg->io_service_bytes.enabled == CONFIG_BOOLEAN_YES)) {
  2989. if(unlikely(!cg->st_io)) {
  2990. snprintfz(title, CHART_TITLE_MAX, "I/O Bandwidth (all disks)");
  2991. cg->st_io = rrdset_create_localhost(
  2992. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  2993. , "io"
  2994. , NULL
  2995. , "disk"
  2996. , "cgroup.io"
  2997. , title
  2998. , "KiB/s"
  2999. , PLUGIN_CGROUPS_NAME
  3000. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3001. , cgroup_containers_chart_priority + 1200
  3002. , update_every
  3003. , RRDSET_TYPE_AREA
  3004. );
  3005. rrdset_update_labels(cg->st_io, cg->chart_labels);
  3006. rrddim_add(cg->st_io, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  3007. rrddim_add(cg->st_io, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
  3008. }
  3009. else
  3010. rrdset_next(cg->st_io);
  3011. rrddim_set(cg->st_io, "read", cg->io_service_bytes.Read);
  3012. rrddim_set(cg->st_io, "write", cg->io_service_bytes.Write);
  3013. rrdset_done(cg->st_io);
  3014. }
  3015. if(likely(cg->io_serviced.updated && cg->io_serviced.enabled == CONFIG_BOOLEAN_YES)) {
  3016. if(unlikely(!cg->st_serviced_ops)) {
  3017. snprintfz(title, CHART_TITLE_MAX, "Serviced I/O Operations (all disks)");
  3018. cg->st_serviced_ops = rrdset_create_localhost(
  3019. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3020. , "serviced_ops"
  3021. , NULL
  3022. , "disk"
  3023. , "cgroup.serviced_ops"
  3024. , title
  3025. , "operations/s"
  3026. , PLUGIN_CGROUPS_NAME
  3027. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3028. , cgroup_containers_chart_priority + 1200
  3029. , update_every
  3030. , RRDSET_TYPE_LINE
  3031. );
  3032. rrdset_update_labels(cg->st_serviced_ops, cg->chart_labels);
  3033. rrddim_add(cg->st_serviced_ops, "read", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  3034. rrddim_add(cg->st_serviced_ops, "write", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  3035. }
  3036. else
  3037. rrdset_next(cg->st_serviced_ops);
  3038. rrddim_set(cg->st_serviced_ops, "read", cg->io_serviced.Read);
  3039. rrddim_set(cg->st_serviced_ops, "write", cg->io_serviced.Write);
  3040. rrdset_done(cg->st_serviced_ops);
  3041. }
  3042. if(likely(cg->throttle_io_service_bytes.updated && cg->throttle_io_service_bytes.enabled == CONFIG_BOOLEAN_YES)) {
  3043. if(unlikely(!cg->st_throttle_io)) {
  3044. snprintfz(title, CHART_TITLE_MAX, "Throttle I/O Bandwidth (all disks)");
  3045. cg->st_throttle_io = rrdset_create_localhost(
  3046. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3047. , "throttle_io"
  3048. , NULL
  3049. , "disk"
  3050. , "cgroup.throttle_io"
  3051. , title
  3052. , "KiB/s"
  3053. , PLUGIN_CGROUPS_NAME
  3054. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3055. , cgroup_containers_chart_priority + 1200
  3056. , update_every
  3057. , RRDSET_TYPE_AREA
  3058. );
  3059. rrdset_update_labels(cg->st_throttle_io, cg->chart_labels);
  3060. rrddim_add(cg->st_throttle_io, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  3061. rrddim_add(cg->st_throttle_io, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
  3062. }
  3063. else
  3064. rrdset_next(cg->st_throttle_io);
  3065. rrddim_set(cg->st_throttle_io, "read", cg->throttle_io_service_bytes.Read);
  3066. rrddim_set(cg->st_throttle_io, "write", cg->throttle_io_service_bytes.Write);
  3067. rrdset_done(cg->st_throttle_io);
  3068. }
  3069. if(likely(cg->throttle_io_serviced.updated && cg->throttle_io_serviced.enabled == CONFIG_BOOLEAN_YES)) {
  3070. if(unlikely(!cg->st_throttle_serviced_ops)) {
  3071. snprintfz(title, CHART_TITLE_MAX, "Throttle Serviced I/O Operations (all disks)");
  3072. cg->st_throttle_serviced_ops = rrdset_create_localhost(
  3073. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3074. , "throttle_serviced_ops"
  3075. , NULL
  3076. , "disk"
  3077. , "cgroup.throttle_serviced_ops"
  3078. , title
  3079. , "operations/s"
  3080. , PLUGIN_CGROUPS_NAME
  3081. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3082. , cgroup_containers_chart_priority + 1200
  3083. , update_every
  3084. , RRDSET_TYPE_LINE
  3085. );
  3086. rrdset_update_labels(cg->st_throttle_serviced_ops, cg->chart_labels);
  3087. rrddim_add(cg->st_throttle_serviced_ops, "read", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  3088. rrddim_add(cg->st_throttle_serviced_ops, "write", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  3089. }
  3090. else
  3091. rrdset_next(cg->st_throttle_serviced_ops);
  3092. rrddim_set(cg->st_throttle_serviced_ops, "read", cg->throttle_io_serviced.Read);
  3093. rrddim_set(cg->st_throttle_serviced_ops, "write", cg->throttle_io_serviced.Write);
  3094. rrdset_done(cg->st_throttle_serviced_ops);
  3095. }
  3096. if(likely(cg->io_queued.updated && cg->io_queued.enabled == CONFIG_BOOLEAN_YES)) {
  3097. if(unlikely(!cg->st_queued_ops)) {
  3098. snprintfz(title, CHART_TITLE_MAX, "Queued I/O Operations (all disks)");
  3099. cg->st_queued_ops = rrdset_create_localhost(
  3100. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3101. , "queued_ops"
  3102. , NULL
  3103. , "disk"
  3104. , "cgroup.queued_ops"
  3105. , title
  3106. , "operations"
  3107. , PLUGIN_CGROUPS_NAME
  3108. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3109. , cgroup_containers_chart_priority + 2000
  3110. , update_every
  3111. , RRDSET_TYPE_LINE
  3112. );
  3113. rrdset_update_labels(cg->st_queued_ops, cg->chart_labels);
  3114. rrddim_add(cg->st_queued_ops, "read", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  3115. rrddim_add(cg->st_queued_ops, "write", NULL, -1, 1, RRD_ALGORITHM_ABSOLUTE);
  3116. }
  3117. else
  3118. rrdset_next(cg->st_queued_ops);
  3119. rrddim_set(cg->st_queued_ops, "read", cg->io_queued.Read);
  3120. rrddim_set(cg->st_queued_ops, "write", cg->io_queued.Write);
  3121. rrdset_done(cg->st_queued_ops);
  3122. }
  3123. if(likely(cg->io_merged.updated && cg->io_merged.enabled == CONFIG_BOOLEAN_YES)) {
  3124. if(unlikely(!cg->st_merged_ops)) {
  3125. snprintfz(title, CHART_TITLE_MAX, "Merged I/O Operations (all disks)");
  3126. cg->st_merged_ops = rrdset_create_localhost(
  3127. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3128. , "merged_ops"
  3129. , NULL
  3130. , "disk"
  3131. , "cgroup.merged_ops"
  3132. , title
  3133. , "operations/s"
  3134. , PLUGIN_CGROUPS_NAME
  3135. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3136. , cgroup_containers_chart_priority + 2100
  3137. , update_every
  3138. , RRDSET_TYPE_LINE
  3139. );
  3140. rrdset_update_labels(cg->st_merged_ops, cg->chart_labels);
  3141. rrddim_add(cg->st_merged_ops, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
  3142. rrddim_add(cg->st_merged_ops, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
  3143. }
  3144. else
  3145. rrdset_next(cg->st_merged_ops);
  3146. rrddim_set(cg->st_merged_ops, "read", cg->io_merged.Read);
  3147. rrddim_set(cg->st_merged_ops, "write", cg->io_merged.Write);
  3148. rrdset_done(cg->st_merged_ops);
  3149. }
  3150. if (cg->options & CGROUP_OPTIONS_IS_UNIFIED) {
  3151. struct pressure *res = &cg->cpu_pressure;
  3152. if (likely(res->updated && res->some.enabled)) {
  3153. if (unlikely(!res->some.st)) {
  3154. RRDSET *chart;
  3155. snprintfz(title, CHART_TITLE_MAX, "CPU pressure");
  3156. chart = res->some.st = rrdset_create_localhost(
  3157. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3158. , "cpu_pressure"
  3159. , NULL
  3160. , "cpu"
  3161. , "cgroup.cpu_pressure"
  3162. , title
  3163. , "percentage"
  3164. , PLUGIN_CGROUPS_NAME
  3165. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3166. , cgroup_containers_chart_priority + 2200
  3167. , update_every
  3168. , RRDSET_TYPE_LINE
  3169. );
  3170. rrdset_update_labels(chart = res->some.st, cg->chart_labels);
  3171. res->some.rd10 = rrddim_add(chart, "some 10", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3172. res->some.rd60 = rrddim_add(chart, "some 60", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3173. res->some.rd300 = rrddim_add(chart, "some 300", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3174. } else {
  3175. rrdset_next(res->some.st);
  3176. }
  3177. update_pressure_chart(&res->some);
  3178. }
  3179. res = &cg->memory_pressure;
  3180. if (likely(res->updated && res->some.enabled)) {
  3181. if (unlikely(!res->some.st)) {
  3182. RRDSET *chart;
  3183. snprintfz(title, CHART_TITLE_MAX, "Memory pressure");
  3184. chart = res->some.st = rrdset_create_localhost(
  3185. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3186. , "mem_pressure"
  3187. , NULL
  3188. , "mem"
  3189. , "cgroup.memory_pressure"
  3190. , title
  3191. , "percentage"
  3192. , PLUGIN_CGROUPS_NAME
  3193. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3194. , cgroup_containers_chart_priority + 2300
  3195. , update_every
  3196. , RRDSET_TYPE_LINE
  3197. );
  3198. rrdset_update_labels(chart = res->some.st, cg->chart_labels);
  3199. res->some.rd10 = rrddim_add(chart, "some 10", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3200. res->some.rd60 = rrddim_add(chart, "some 60", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3201. res->some.rd300 = rrddim_add(chart, "some 300", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3202. } else {
  3203. rrdset_next(res->some.st);
  3204. }
  3205. update_pressure_chart(&res->some);
  3206. }
  3207. if (likely(res->updated && res->full.enabled)) {
  3208. if (unlikely(!res->full.st)) {
  3209. RRDSET *chart;
  3210. snprintfz(title, CHART_TITLE_MAX, "Memory full pressure");
  3211. chart = res->full.st = rrdset_create_localhost(
  3212. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3213. , "mem_full_pressure"
  3214. , NULL
  3215. , "mem"
  3216. , "cgroup.memory_full_pressure"
  3217. , title
  3218. , "percentage"
  3219. , PLUGIN_CGROUPS_NAME
  3220. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3221. , cgroup_containers_chart_priority + 2350
  3222. , update_every
  3223. , RRDSET_TYPE_LINE
  3224. );
  3225. rrdset_update_labels(chart = res->full.st, cg->chart_labels);
  3226. res->full.rd10 = rrddim_add(chart, "full 10", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3227. res->full.rd60 = rrddim_add(chart, "full 60", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3228. res->full.rd300 = rrddim_add(chart, "full 300", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3229. } else {
  3230. rrdset_next(res->full.st);
  3231. }
  3232. update_pressure_chart(&res->full);
  3233. }
  3234. res = &cg->io_pressure;
  3235. if (likely(res->updated && res->some.enabled)) {
  3236. if (unlikely(!res->some.st)) {
  3237. RRDSET *chart;
  3238. snprintfz(title, CHART_TITLE_MAX, "I/O pressure");
  3239. chart = res->some.st = rrdset_create_localhost(
  3240. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3241. , "io_pressure"
  3242. , NULL
  3243. , "disk"
  3244. , "cgroup.io_pressure"
  3245. , title
  3246. , "percentage"
  3247. , PLUGIN_CGROUPS_NAME
  3248. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3249. , cgroup_containers_chart_priority + 2400
  3250. , update_every
  3251. , RRDSET_TYPE_LINE
  3252. );
  3253. rrdset_update_labels(chart = res->some.st, cg->chart_labels);
  3254. res->some.rd10 = rrddim_add(chart, "some 10", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3255. res->some.rd60 = rrddim_add(chart, "some 60", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3256. res->some.rd300 = rrddim_add(chart, "some 300", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3257. } else {
  3258. rrdset_next(res->some.st);
  3259. }
  3260. update_pressure_chart(&res->some);
  3261. }
  3262. if (likely(res->updated && res->full.enabled)) {
  3263. if (unlikely(!res->full.st)) {
  3264. RRDSET *chart;
  3265. snprintfz(title, CHART_TITLE_MAX, "I/O full pressure");
  3266. chart = res->full.st = rrdset_create_localhost(
  3267. cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
  3268. , "io_full_pressure"
  3269. , NULL
  3270. , "disk"
  3271. , "cgroup.io_full_pressure"
  3272. , title
  3273. , "percentage"
  3274. , PLUGIN_CGROUPS_NAME
  3275. , PLUGIN_CGROUPS_MODULE_CGROUPS_NAME
  3276. , cgroup_containers_chart_priority + 2450
  3277. , update_every
  3278. , RRDSET_TYPE_LINE
  3279. );
  3280. rrdset_update_labels(chart = res->full.st, cg->chart_labels);
  3281. res->full.rd10 = rrddim_add(chart, "full 10", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3282. res->full.rd60 = rrddim_add(chart, "full 60", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3283. res->full.rd300 = rrddim_add(chart, "full 300", NULL, 1, 100, RRD_ALGORITHM_ABSOLUTE);
  3284. } else {
  3285. rrdset_next(res->full.st);
  3286. }
  3287. update_pressure_chart(&res->full);
  3288. }
  3289. }
  3290. }
  3291. if(likely(cgroup_enable_systemd_services))
  3292. update_systemd_services_charts(update_every, services_do_cpu, services_do_mem_usage, services_do_mem_detailed
  3293. , services_do_mem_failcnt, services_do_swap_usage, services_do_io
  3294. , services_do_io_ops, services_do_throttle_io, services_do_throttle_ops
  3295. , services_do_queued_ops, services_do_merged_ops
  3296. );
  3297. debug(D_CGROUP, "done updating cgroups charts");
  3298. }
  3299. // ----------------------------------------------------------------------------
  3300. // cgroups main
  3301. static void cgroup_main_cleanup(void *ptr) {
  3302. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
  3303. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  3304. info("cleaning up...");
  3305. usec_t max = 2 * USEC_PER_SEC, step = 50000;
  3306. if (!discovery_thread.exited) {
  3307. info("stopping discovery thread worker");
  3308. uv_mutex_lock(&discovery_thread.mutex);
  3309. discovery_thread.start_discovery = 1;
  3310. uv_cond_signal(&discovery_thread.cond_var);
  3311. uv_mutex_unlock(&discovery_thread.mutex);
  3312. }
  3313. while (!discovery_thread.exited && max > 0) {
  3314. max -= step;
  3315. info("waiting for discovery thread to finish...");
  3316. sleep_usec(step);
  3317. }
  3318. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  3319. }
  3320. void *cgroups_main(void *ptr) {
  3321. netdata_thread_cleanup_push(cgroup_main_cleanup, ptr);
  3322. struct rusage thread;
  3323. // when ZERO, attempt to do it
  3324. int vdo_cpu_netdata = config_get_boolean("plugin:cgroups", "cgroups plugin resource charts", 1);
  3325. read_cgroup_plugin_configuration();
  3326. RRDSET *stcpu_thread = NULL;
  3327. if (uv_mutex_init(&cgroup_root_mutex)) {
  3328. error("CGROUP: cannot initialize mutex for the main cgroup list");
  3329. goto exit;
  3330. }
  3331. // dispatch a discovery worker thread
  3332. discovery_thread.start_discovery = 0;
  3333. discovery_thread.exited = 0;
  3334. if (uv_mutex_init(&discovery_thread.mutex)) {
  3335. error("CGROUP: cannot initialize mutex for discovery thread");
  3336. goto exit;
  3337. }
  3338. if (uv_cond_init(&discovery_thread.cond_var)) {
  3339. error("CGROUP: cannot initialize conditional variable for discovery thread");
  3340. goto exit;
  3341. }
  3342. int error = uv_thread_create(&discovery_thread.thread, cgroup_discovery_worker, NULL);
  3343. if (error) {
  3344. error("CGROUP: cannot create tread worker. uv_thread_create(): %s", uv_strerror(error));
  3345. goto exit;
  3346. }
  3347. uv_thread_set_name_np(discovery_thread.thread, "PLUGIN[cgroups]");
  3348. heartbeat_t hb;
  3349. heartbeat_init(&hb);
  3350. usec_t step = cgroup_update_every * USEC_PER_SEC;
  3351. usec_t find_every = cgroup_check_for_new_every * USEC_PER_SEC, find_dt = 0;
  3352. while(!netdata_exit) {
  3353. usec_t hb_dt = heartbeat_next(&hb, step);
  3354. if(unlikely(netdata_exit)) break;
  3355. find_dt += hb_dt;
  3356. if(unlikely(find_dt >= find_every || cgroups_check)) {
  3357. uv_cond_signal(&discovery_thread.cond_var);
  3358. discovery_thread.start_discovery = 1;
  3359. find_dt = 0;
  3360. cgroups_check = 0;
  3361. }
  3362. uv_mutex_lock(&cgroup_root_mutex);
  3363. read_all_cgroups(cgroup_root);
  3364. update_cgroup_charts(cgroup_update_every);
  3365. uv_mutex_unlock(&cgroup_root_mutex);
  3366. // --------------------------------------------------------------------
  3367. if(vdo_cpu_netdata) {
  3368. getrusage(RUSAGE_THREAD, &thread);
  3369. if(unlikely(!stcpu_thread)) {
  3370. stcpu_thread = rrdset_create_localhost(
  3371. "netdata"
  3372. , "plugin_cgroups_cpu"
  3373. , NULL
  3374. , "cgroups"
  3375. , NULL
  3376. , "Netdata CGroups Plugin CPU usage"
  3377. , "milliseconds/s"
  3378. , PLUGIN_CGROUPS_NAME
  3379. , "stats"
  3380. , 132000
  3381. , cgroup_update_every
  3382. , RRDSET_TYPE_STACKED
  3383. );
  3384. rrddim_add(stcpu_thread, "user", NULL, 1, 1000, RRD_ALGORITHM_INCREMENTAL);
  3385. rrddim_add(stcpu_thread, "system", NULL, 1, 1000, RRD_ALGORITHM_INCREMENTAL);
  3386. }
  3387. else
  3388. rrdset_next(stcpu_thread);
  3389. rrddim_set(stcpu_thread, "user" , thread.ru_utime.tv_sec * 1000000ULL + thread.ru_utime.tv_usec);
  3390. rrddim_set(stcpu_thread, "system", thread.ru_stime.tv_sec * 1000000ULL + thread.ru_stime.tv_usec);
  3391. rrdset_done(stcpu_thread);
  3392. }
  3393. }
  3394. exit:
  3395. netdata_thread_cleanup_pop(1);
  3396. return NULL;
  3397. }