dashboard_info.js 260 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412341334143415341634173418341934203421342234233424342534263427342834293430343134323433343434353436343734383439344034413442344334443445344634473448344934503451345234533454345534563457345834593460346134623463346434653466346734683469347034713472347334743475347634773478347934803481348234833484348534863487348834893490349134923493349434953496349734983499350035013502350335043505350635073508350935103511351235133514351535163517351835193520352135223523352435253526352735283529353035313532353335343535353635373538353935403541354235433544354535463547354835493550355135523553355435553556355735583559356035613562356335643565356635673568356935703571357235733574357535763577357835793580358135823583358435853586358735883589359035913592359335943595359635973598359936003601360236033604360536063607360836093610361136123613361436153616361736183619362036213622362336243625362636273628362936303631363236333634363536363637363836393640364136423643364436453646364736483649365036513652365336543655365636573658365936603661366236633664366536663667366836693670367136723673367436753676367736783679368036813682368336843685368636873688368936903691369236933694369536963697369836993700370137023703370437053706370737083709371037113712371337143715371637173718371937203721372237233724372537263727372837293730373137323733373437353736373737383739374037413742374337443745374637473748374937503751375237533754375537563757375837593760376137623763376437653766376737683769377037713772377337743775377637773778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427742784279428042814282428342844285428642874288428942904291429242934294429542964297429842994300430143024303430443054306430743084309431043114312431343144315431643174318431943204321432243234324432543264327432843294330433143324333433443354336433743384339434043414342434343444345434643474348434943504351435243534354435543564357435843594360436143624363436443654366436743684369437043714372437343744375437643774378437943804381438243834384438543864387438843894390439143924393439443954396439743984399440044014402440344044405440644074408440944104411441244134414441544164417441844194420442144224423442444254426442744284429443044314432443344344435443644374438443944404441444244434444444544464447444844494450445144524453445444554456445744584459446044614462446344644465446644674468446944704471447244734474447544764477447844794480448144824483448444854486448744884489449044914492449344944495449644974498449945004501450245034504450545064507450845094510451145124513451445154516451745184519452045214522452345244525452645274528452945304531453245334534453545364537453845394540454145424543454445454546454745484549455045514552455345544555455645574558455945604561456245634564456545664567456845694570457145724573457445754576457745784579458045814582458345844585458645874588458945904591459245934594459545964597459845994600460146024603460446054606460746084609461046114612461346144615461646174618461946204621462246234624462546264627462846294630463146324633463446354636463746384639464046414642464346444645464646474648464946504651465246534654465546564657465846594660466146624663466446654666466746684669467046714672467346744675467646774678467946804681468246834684468546864687468846894690469146924693469446954696469746984699470047014702470347044705470647074708470947104711471247134714471547164717471847194720472147224723472447254726472747284729473047314732473347344735473647374738473947404741474247434744474547464747474847494750475147524753475447554756475747584759476047614762476347644765476647674768476947704771477247734774477547764777477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. // Codacy declarations
  3. /* global NETDATA */
  4. var netdataDashboard = window.netdataDashboard || {};
  5. // Informational content for the various sections of the GUI (menus, sections, charts, etc.)
  6. // ----------------------------------------------------------------------------
  7. // Menus
  8. netdataDashboard.menu = {
  9. 'system': {
  10. title: 'System Overview',
  11. icon: '<i class="fas fa-bookmark"></i>',
  12. info: 'Overview of the key system metrics.'
  13. },
  14. 'services': {
  15. title: 'systemd Services',
  16. icon: '<i class="fas fa-cogs"></i>',
  17. info: 'Resources utilization of systemd services. netdata monitors all systemd services via CGROUPS ' +
  18. '(the resources accounting used by containers). '
  19. },
  20. 'ap': {
  21. title: 'Access Points',
  22. icon: '<i class="fas fa-wifi"></i>',
  23. info: 'Performance metrics for the access points (i.e. wireless interfaces in AP mode) found on the system.'
  24. },
  25. 'tc': {
  26. title: 'Quality of Service',
  27. icon: '<i class="fas fa-globe"></i>',
  28. info: 'Netdata collects and visualizes <code>tc</code> class utilization using its ' +
  29. '<a href="https://github.com/netdata/netdata/blob/master/collectors/tc.plugin/tc-qos-helper.sh.in" target="_blank">tc-helper plugin</a>. ' +
  30. 'If you also use <a href="http://firehol.org/#fireqos" target="_blank">FireQOS</a> for setting up QoS, ' +
  31. 'netdata automatically collects interface and class names. If your QoS configuration includes overheads ' +
  32. 'calculation, the values shown here will include these overheads (the total bandwidth for the same ' +
  33. 'interface as reported in the Network Interfaces section, will be lower than the total bandwidth ' +
  34. 'reported here). QoS data collection may have a slight time difference compared to the interface ' +
  35. '(QoS data collection uses a BASH script, so a shift in data collection of a few milliseconds ' +
  36. 'should be justified).'
  37. },
  38. 'net': {
  39. title: 'Network Interfaces',
  40. icon: '<i class="fas fa-sitemap"></i>',
  41. info: '<p>Performance <a href="https://www.kernel.org/doc/html/latest/networking/statistics.html" target="_blank">metrics for network interfaces</a>.</p>'+
  42. '<p>Netdata retrieves this data reading the <code>/proc/net/dev</code> file and <code>/sys/class/net/</code> directory.</p>'
  43. },
  44. 'wireless': {
  45. title: 'Wireless Interfaces',
  46. icon: '<i class="fas fa-wifi"></i>',
  47. info: 'Performance metrics for wireless interfaces.'
  48. },
  49. 'ip': {
  50. title: 'Networking Stack',
  51. icon: '<i class="fas fa-cloud"></i>',
  52. info: function (os) {
  53. if (os === "linux")
  54. return 'Metrics for the networking stack of the system. These metrics are collected from <code>/proc/net/netstat</code> or attaching <code>kprobes</code> to kernel functions, apply to both IPv4 and IPv6 traffic and are related to operation of the kernel networking stack.';
  55. else
  56. return 'Metrics for the networking stack of the system.';
  57. }
  58. },
  59. 'ipv4': {
  60. title: 'IPv4 Networking',
  61. icon: '<i class="fas fa-cloud"></i>',
  62. info: 'Metrics for the IPv4 stack of the system. ' +
  63. '<a href="https://en.wikipedia.org/wiki/IPv4" target="_blank">Internet Protocol version 4 (IPv4)</a> is ' +
  64. 'the fourth version of the Internet Protocol (IP). It is one of the core protocols of standards-based ' +
  65. 'internetworking methods in the Internet. IPv4 is a connectionless protocol for use on packet-switched ' +
  66. 'networks. It operates on a best effort delivery model, in that it does not guarantee delivery, nor does ' +
  67. 'it assure proper sequencing or avoidance of duplicate delivery. These aspects, including data integrity, ' +
  68. 'are addressed by an upper layer transport protocol, such as the Transmission Control Protocol (TCP).'
  69. },
  70. 'ipv6': {
  71. title: 'IPv6 Networking',
  72. icon: '<i class="fas fa-cloud"></i>',
  73. info: 'Metrics for the IPv6 stack of the system. <a href="https://en.wikipedia.org/wiki/IPv6" target="_blank">Internet Protocol version 6 (IPv6)</a> is the most recent version of the Internet Protocol (IP), the communications protocol that provides an identification and location system for computers on networks and routes traffic across the Internet. IPv6 was developed by the Internet Engineering Task Force (IETF) to deal with the long-anticipated problem of IPv4 address exhaustion. IPv6 is intended to replace IPv4.'
  74. },
  75. 'sctp': {
  76. title: 'SCTP Networking',
  77. icon: '<i class="fas fa-cloud"></i>',
  78. info: '<p><a href="https://en.wikipedia.org/wiki/Stream_Control_Transmission_Protocol" target="_blank">Stream Control Transmission Protocol (SCTP)</a> '+
  79. 'is a computer network protocol which operates at the transport layer and serves a role similar to the popular '+
  80. 'protocols TCP and UDP. SCTP provides some of the features of both UDP and TCP: it is message-oriented like UDP '+
  81. 'and ensures reliable, in-sequence transport of messages with congestion control like TCP. '+
  82. 'It differs from those protocols by providing multi-homing and redundant paths to increase resilience and reliability.</p>'+
  83. '<p>Netdata collects SCTP metrics reading the <code>/proc/net/sctp/snmp</code> file.</p>'
  84. },
  85. 'ipvs': {
  86. title: 'IP Virtual Server',
  87. icon: '<i class="fas fa-eye"></i>',
  88. info: '<p><a href="http://www.linuxvirtualserver.org/software/ipvs.html" target="_blank">IPVS (IP Virtual Server)</a> '+
  89. 'implements transport-layer load balancing inside the Linux kernel, so called Layer-4 switching. '+
  90. 'IPVS running on a host acts as a load balancer at the front of a cluster of real servers, '+
  91. 'it can direct requests for TCP/UDP based services to the real servers, '+
  92. 'and makes services of the real servers to appear as a virtual service on a single IP address.</p>'+
  93. '<p>Netdata collects summary statistics, reading <code>/proc/net/ip_vs_stats</code>. '+
  94. 'To display the statistics information of services and their servers, run <code>ipvsadm -Ln --stats</code> '+
  95. 'or <code>ipvsadm -Ln --rate</code> for the rate statistics. '+
  96. 'For details, see <a href="https://linux.die.net/man/8/ipvsadm" target="_blank">ipvsadm(8)</a>.</p>'
  97. },
  98. 'netfilter': {
  99. title: 'Firewall (netfilter)',
  100. icon: '<i class="fas fa-shield-alt"></i>',
  101. info: 'Performance metrics of the netfilter components.'
  102. },
  103. 'ipfw': {
  104. title: 'Firewall (ipfw)',
  105. icon: '<i class="fas fa-shield-alt"></i>',
  106. info: 'Counters and memory usage for the ipfw rules.'
  107. },
  108. 'cpu': {
  109. title: 'CPUs',
  110. icon: '<i class="fas fa-bolt"></i>',
  111. info: 'Detailed information for each CPU of the system. A summary of the system for all CPUs can be found at the <a href="#menu_system">System Overview</a> section.'
  112. },
  113. 'mem': {
  114. title: 'Memory',
  115. icon: '<i class="fas fa-microchip"></i>',
  116. info: 'Detailed information about the memory management of the system.'
  117. },
  118. 'disk': {
  119. title: 'Disks',
  120. icon: '<i class="fas fa-hdd"></i>',
  121. info: 'Charts with performance information for all the system disks. Special care has been given to present disk performance metrics in a way compatible with <code>iostat -x</code>. netdata by default prevents rendering performance charts for individual partitions and unmounted virtual disks. Disabled charts can still be enabled by configuring the relative settings in the netdata configuration file.'
  122. },
  123. 'mount': {
  124. title: 'Mount Points',
  125. icon: '<i class="fas fa-hdd"></i>',
  126. info: ''
  127. },
  128. 'mdstat': {
  129. title: 'MD arrays',
  130. icon: '<i class="fas fa-hdd"></i>',
  131. info: '<p>RAID devices are virtual devices created from two or more real block devices. '+
  132. '<a href="https://man7.org/linux/man-pages/man4/md.4.html" target="_blank">Linux Software RAID</a> devices are '+
  133. 'implemented through the md (Multiple Devices) device driver.</p>'+
  134. '<p>Netdata monitors the current status of MD arrays reading <a href="https://raid.wiki.kernel.org/index.php/Mdstat" target="_blank">/proc/mdstat</a> and '+
  135. '<code>/sys/block/%s/md/mismatch_cnt</code> files.</p>'
  136. },
  137. 'sensors': {
  138. title: 'Sensors',
  139. icon: '<i class="fas fa-leaf"></i>',
  140. info: 'Readings of the configured system sensors.'
  141. },
  142. 'ipmi': {
  143. title: 'IPMI',
  144. icon: '<i class="fas fa-leaf"></i>',
  145. info: 'The Intelligent Platform Management Interface (IPMI) is a set of computer interface specifications for an autonomous computer subsystem that provides management and monitoring capabilities independently of the host system\'s CPU, firmware (BIOS or UEFI) and operating system.'
  146. },
  147. 'samba': {
  148. title: 'Samba',
  149. icon: '<i class="fas fa-folder-open"></i>',
  150. info: 'Performance metrics of the Samba file share operations of this system. Samba is a implementation of Windows services, including Windows SMB protocol file shares.'
  151. },
  152. 'nfsd': {
  153. title: 'NFS Server',
  154. icon: '<i class="fas fa-folder-open"></i>',
  155. info: 'Performance metrics of the Network File Server. NFS is a distributed file system protocol, allowing a user on a client computer to access files over a network, much like local storage is accessed. NFS, like many other protocols, builds on the Open Network Computing Remote Procedure Call (ONC RPC) system. The NFS is an open standard defined in Request for Comments (RFC).'
  156. },
  157. 'nfs': {
  158. title: 'NFS Client',
  159. icon: '<i class="fas fa-folder-open"></i>',
  160. info: 'Performance metrics of the NFS operations of this system, acting as an NFS client.'
  161. },
  162. 'zfs': {
  163. title: 'ZFS filesystem',
  164. icon: '<i class="fas fa-folder-open"></i>',
  165. info: 'Performance metrics of the ZFS filesystem. The following charts visualize all metrics reported by <a href="https://github.com/zfsonlinux/zfs/blob/master/cmd/arcstat/arcstat" target="_blank">arcstat.py</a> and <a href="https://github.com/zfsonlinux/zfs/blob/master/cmd/arc_summary/arc_summary3" target="_blank">arc_summary.py</a>.'
  166. },
  167. 'zfspool': {
  168. title: 'ZFS pools',
  169. icon: '<i class="fas fa-database"></i>',
  170. info: 'State of ZFS pools.'
  171. },
  172. 'btrfs': {
  173. title: 'BTRFS filesystem',
  174. icon: '<i class="fas fa-folder-open"></i>',
  175. info: 'Disk space metrics for the BTRFS filesystem.'
  176. },
  177. 'apps': {
  178. title: 'Applications',
  179. icon: '<i class="fas fa-heartbeat"></i>',
  180. info: 'Per application statistics are collected using netdata\'s <code>apps.plugin</code>. This plugin walks through all processes and aggregates statistics for applications of interest, defined in <code>/etc/netdata/apps_groups.conf</code>, which can be edited by running <code>$ /etc/netdata/edit-config apps_groups.conf</code> (the default is <a href="https://github.com/netdata/netdata/blob/master/collectors/apps.plugin/apps_groups.conf" target="_blank">here</a>). The plugin internally builds a process tree (much like <code>ps fax</code> does), and groups processes together (evaluating both child and parent processes) so that the result is always a chart with a predefined set of dimensions (of course, only application groups found running are reported). The reported values are compatible with <code>top</code>, although the netdata plugin counts also the resources of exited children (unlike <code>top</code> which shows only the resources of the currently running processes). So for processes like shell scripts, the reported values include the resources used by the commands these scripts run within each timeframe.',
  181. height: 1.5
  182. },
  183. 'users': {
  184. title: 'Users',
  185. icon: '<i class="fas fa-user"></i>',
  186. info: 'Per user statistics are collected using netdata\'s <code>apps.plugin</code>. This plugin walks through all processes and aggregates statistics per user. The reported values are compatible with <code>top</code>, although the netdata plugin counts also the resources of exited children (unlike <code>top</code> which shows only the resources of the currently running processes). So for processes like shell scripts, the reported values include the resources used by the commands these scripts run within each timeframe.',
  187. height: 1.5
  188. },
  189. 'groups': {
  190. title: 'User Groups',
  191. icon: '<i class="fas fa-users"></i>',
  192. info: 'Per user group statistics are collected using netdata\'s <code>apps.plugin</code>. This plugin walks through all processes and aggregates statistics per user group. The reported values are compatible with <code>top</code>, although the netdata plugin counts also the resources of exited children (unlike <code>top</code> which shows only the resources of the currently running processes). So for processes like shell scripts, the reported values include the resources used by the commands these scripts run within each timeframe.',
  193. height: 1.5
  194. },
  195. 'netdata': {
  196. title: 'Netdata Monitoring',
  197. icon: '<i class="fas fa-chart-bar"></i>',
  198. info: 'Performance metrics for the operation of netdata itself and its plugins.'
  199. },
  200. 'aclk_test': {
  201. title: 'ACLK Test Generator',
  202. info: 'For internal use to perform integration testing.'
  203. },
  204. 'example': {
  205. title: 'Example Charts',
  206. info: 'Example charts, demonstrating the external plugin architecture.'
  207. },
  208. 'cgroup': {
  209. title: '',
  210. icon: '<i class="fas fa-th"></i>',
  211. info: 'Container resource utilization metrics. Netdata reads this information from <b>cgroups</b> (abbreviated from <b>control groups</b>), a Linux kernel feature that limits and accounts resource usage (CPU, memory, disk I/O, network, etc.) of a collection of processes. <b>cgroups</b> together with <b>namespaces</b> (that offer isolation between processes) provide what we usually call: <b>containers</b>.'
  212. },
  213. 'cgqemu': {
  214. title: '',
  215. icon: '<i class="fas fa-th-large"></i>',
  216. info: 'QEMU virtual machine resource utilization metrics. QEMU (short for Quick Emulator) is a free and open-source hosted hypervisor that performs hardware virtualization.'
  217. },
  218. 'fping': {
  219. title: 'fping',
  220. icon: '<i class="fas fa-exchange-alt"></i>',
  221. info: 'Network latency statistics, via <b>fping</b>. <b>fping</b> is a program to send ICMP echo probes to network hosts, similar to <code>ping</code>, but much better performing when pinging multiple hosts. fping versions after 3.15 can be directly used as netdata plugins.'
  222. },
  223. 'gearman': {
  224. title: 'Gearman',
  225. icon: '<i class="fas fa-tasks"></i>',
  226. info: 'Gearman is a job server that allows you to do work in parallel, to load balance processing, and to call functions between languages.'
  227. },
  228. 'ioping': {
  229. title: 'ioping',
  230. icon: '<i class="fas fa-exchange-alt"></i>',
  231. info: 'Disk latency statistics, via <b>ioping</b>. <b>ioping</b> is a program to read/write data probes from/to a disk.'
  232. },
  233. 'httpcheck': {
  234. title: 'Http Check',
  235. icon: '<i class="fas fa-heartbeat"></i>',
  236. info: 'Web Service availability and latency monitoring using HTTP checks. This plugin is a specialized version of the port check plugin.'
  237. },
  238. 'memcached': {
  239. title: 'memcached',
  240. icon: '<i class="fas fa-database"></i>',
  241. info: 'Performance metrics for <b>memcached</b>. Memcached is a general-purpose distributed memory caching system. It is often used to speed up dynamic database-driven websites by caching data and objects in RAM to reduce the number of times an external data source (such as a database or API) must be read.'
  242. },
  243. 'monit': {
  244. title: 'monit',
  245. icon: '<i class="fas fa-database"></i>',
  246. info: 'Statuses of checks in <b>monit</b>. Monit is a utility for managing and monitoring processes, programs, files, directories and filesystems on a Unix system. Monit conducts automatic maintenance and repair and can execute meaningful causal actions in error situations.'
  247. },
  248. 'mysql': {
  249. title: 'MySQL',
  250. icon: '<i class="fas fa-database"></i>',
  251. info: 'Performance metrics for <b>mysql</b>, the open-source relational database management system (RDBMS).'
  252. },
  253. 'postgres': {
  254. title: 'Postgres',
  255. icon: '<i class="fas fa-database"></i>',
  256. info: 'Performance metrics for <b>PostgresSQL</b>, the object-relational database (ORDBMS).'
  257. },
  258. 'redis': {
  259. title: 'Redis',
  260. icon: '<i class="fas fa-database"></i>',
  261. info: 'Performance metrics for <b>redis</b>. Redis (REmote DIctionary Server) is a software project that implements data structure servers. It is open-source, networked, in-memory, and stores keys with optional durability.'
  262. },
  263. 'rethinkdbs': {
  264. title: 'RethinkDB',
  265. icon: '<i class="fas fa-database"></i>',
  266. info: 'Performance metrics for <b>rethinkdb</b>. RethinkDB is the first open-source scalable database built for realtime applications'
  267. },
  268. 'retroshare': {
  269. title: 'RetroShare',
  270. icon: '<i class="fas fa-share-alt"></i>',
  271. info: 'Performance metrics for <b>RetroShare</b>. RetroShare is open source software for encrypted filesharing, serverless email, instant messaging, online chat, and BBS, based on a friend-to-friend network built on GNU Privacy Guard (GPG).'
  272. },
  273. 'riakkv': {
  274. title: 'Riak KV',
  275. icon: '<i class="fas fa-database"></i>',
  276. info: 'Metrics for <b>Riak KV</b>, the distributed key-value store.'
  277. },
  278. 'ipfs': {
  279. title: 'IPFS',
  280. icon: '<i class="fas fa-folder-open"></i>',
  281. info: 'Performance metrics for the InterPlanetary File System (IPFS), a content-addressable, peer-to-peer hypermedia distribution protocol.'
  282. },
  283. 'phpfpm': {
  284. title: 'PHP-FPM',
  285. icon: '<i class="fas fa-eye"></i>',
  286. info: 'Performance metrics for <b>PHP-FPM</b>, an alternative FastCGI implementation for PHP.'
  287. },
  288. 'pihole': {
  289. title: 'Pi-hole',
  290. icon: '<i class="fas fa-ban"></i>',
  291. info: 'Metrics for <a href="https://pi-hole.net/" target="_blank">Pi-hole</a>, a black hole for Internet advertisements.' +
  292. ' The metrics returned by Pi-Hole API is all from the last 24 hours.'
  293. },
  294. 'portcheck': {
  295. title: 'Port Check',
  296. icon: '<i class="fas fa-heartbeat"></i>',
  297. info: 'Service availability and latency monitoring using port checks.'
  298. },
  299. 'postfix': {
  300. title: 'postfix',
  301. icon: '<i class="fas fa-envelope"></i>',
  302. info: undefined
  303. },
  304. 'dovecot': {
  305. title: 'Dovecot',
  306. icon: '<i class="fas fa-envelope"></i>',
  307. info: undefined
  308. },
  309. 'hddtemp': {
  310. title: 'HDD Temp',
  311. icon: '<i class="fas fa-thermometer-half"></i>',
  312. info: undefined
  313. },
  314. 'nginx': {
  315. title: 'nginx',
  316. icon: '<i class="fas fa-eye"></i>',
  317. info: undefined
  318. },
  319. 'apache': {
  320. title: 'Apache',
  321. icon: '<i class="fas fa-eye"></i>',
  322. info: undefined
  323. },
  324. 'lighttpd': {
  325. title: 'Lighttpd',
  326. icon: '<i class="fas fa-eye"></i>',
  327. info: undefined
  328. },
  329. 'web_log': {
  330. title: undefined,
  331. icon: '<i class="fas fa-file-alt"></i>',
  332. info: 'Information extracted from a server log file. <code>web_log</code> plugin incrementally parses the server log file to provide, in real-time, a break down of key server performance metrics. For web servers, an extended log file format may optionally be used (for <code>nginx</code> and <code>apache</code>) offering timing information and bandwidth for both requests and responses. <code>web_log</code> plugin may also be configured to provide a break down of requests per URL pattern (check <a href="https://github.com/netdata/netdata/blob/master/collectors/python.d.plugin/web_log/web_log.conf" target="_blank"><code>/etc/netdata/python.d/web_log.conf</code></a>).'
  333. },
  334. 'named': {
  335. title: 'named',
  336. icon: '<i class="fas fa-tag"></i>',
  337. info: undefined
  338. },
  339. 'squid': {
  340. title: 'squid',
  341. icon: '<i class="fas fa-exchange-alt"></i>',
  342. info: undefined
  343. },
  344. 'nut': {
  345. title: 'UPS',
  346. icon: '<i class="fas fa-battery-half"></i>',
  347. info: undefined
  348. },
  349. 'apcupsd': {
  350. title: 'UPS',
  351. icon: '<i class="fas fa-battery-half"></i>',
  352. info: undefined
  353. },
  354. 'smawebbox': {
  355. title: 'Solar Power',
  356. icon: '<i class="fas fa-sun"></i>',
  357. info: undefined
  358. },
  359. 'fronius': {
  360. title: 'Fronius',
  361. icon: '<i class="fas fa-sun"></i>',
  362. info: undefined
  363. },
  364. 'stiebeleltron': {
  365. title: 'Stiebel Eltron',
  366. icon: '<i class="fas fa-thermometer-half"></i>',
  367. info: undefined
  368. },
  369. 'snmp': {
  370. title: 'SNMP',
  371. icon: '<i class="fas fa-random"></i>',
  372. info: undefined
  373. },
  374. 'go_expvar': {
  375. title: 'Go - expvars',
  376. icon: '<i class="fas fa-eye"></i>',
  377. info: 'Statistics about running Go applications exposed by the <a href="https://golang.org/pkg/expvar/" target="_blank">expvar package</a>.'
  378. },
  379. 'chrony': {
  380. icon: '<i class="fas fa-clock"></i>',
  381. info: 'chronyd parameters about the system’s clock performance.'
  382. },
  383. 'couchdb': {
  384. icon: '<i class="fas fa-database"></i>',
  385. info: 'Performance metrics for <b><a href="https://couchdb.apache.org/">CouchDB</a></b>, the open-source, JSON document-based database with an HTTP API and multi-master replication.'
  386. },
  387. 'beanstalk': {
  388. title: 'Beanstalkd',
  389. icon: '<i class="fas fa-tasks"></i>',
  390. info: 'Provides statistics on the <b><a href="http://kr.github.io/beanstalkd/">beanstalkd</a></b> server and any tubes available on that server using data pulled from beanstalkc'
  391. },
  392. 'rabbitmq': {
  393. title: 'RabbitMQ',
  394. icon: '<i class="fas fa-comments"></i>',
  395. info: 'Performance data for the <b><a href="https://www.rabbitmq.com/">RabbitMQ</a></b> open-source message broker.'
  396. },
  397. 'ceph': {
  398. title: 'Ceph',
  399. icon: '<i class="fas fa-database"></i>',
  400. info: 'Provides statistics on the <b><a href="http://ceph.com/">ceph</a></b> cluster server, the open-source distributed storage system.'
  401. },
  402. 'ntpd': {
  403. title: 'ntpd',
  404. icon: '<i class="fas fa-clock"></i>',
  405. info: 'Provides statistics for the internal variables of the Network Time Protocol daemon <b><a href="http://www.ntp.org/">ntpd</a></b> and optional including the configured peers (if enabled in the module configuration). The module presents the performance metrics as shown by <b><a href="http://doc.ntp.org/current-stable/ntpq.html">ntpq</a></b> (the standard NTP query program) using NTP mode 6 UDP packets to communicate with the NTP server.'
  406. },
  407. 'spigotmc': {
  408. title: 'Spigot MC',
  409. icon: '<i class="fas fa-eye"></i>',
  410. info: 'Provides basic performance statistics for the <b><a href="https://www.spigotmc.org/">Spigot Minecraft</a></b> server.'
  411. },
  412. 'unbound': {
  413. title: 'Unbound',
  414. icon: '<i class="fas fa-tag"></i>',
  415. info: undefined
  416. },
  417. 'boinc': {
  418. title: 'BOINC',
  419. icon: '<i class="fas fa-microchip"></i>',
  420. info: 'Provides task counts for <b><a href="http://boinc.berkeley.edu/">BOINC</a></b> distributed computing clients.'
  421. },
  422. 'w1sensor': {
  423. title: '1-Wire Sensors',
  424. icon: '<i class="fas fa-thermometer-half"></i>',
  425. info: 'Data derived from <a href="https://en.wikipedia.org/wiki/1-Wire">1-Wire</a> sensors. Currently temperature sensors are automatically detected.'
  426. },
  427. 'logind': {
  428. title: 'Logind',
  429. icon: '<i class="fas fa-user"></i>',
  430. info: undefined
  431. },
  432. 'powersupply': {
  433. title: 'Power Supply',
  434. icon: '<i class="fas fa-battery-half"></i>',
  435. info: 'Statistics for the various system power supplies. Data collected from <a href="https://www.kernel.org/doc/Documentation/power/power_supply_class.txt">Linux power supply class</a>.'
  436. },
  437. 'xenstat': {
  438. title: 'Xen Node',
  439. icon: '<i class="fas fa-server"></i>',
  440. info: 'General statistics for the Xen node. Data collected using <b>xenstat</b> library</a>.'
  441. },
  442. 'xendomain': {
  443. title: '',
  444. icon: '<i class="fas fa-th-large"></i>',
  445. info: 'Xen domain resource utilization metrics. Netdata reads this information using <b>xenstat</b> library which gives access to the resource usage information (CPU, memory, disk I/O, network) for a virtual machine.'
  446. },
  447. 'wmi': {
  448. title: 'wmi',
  449. icon: '<i class="fas fa-server"></i>',
  450. info: undefined
  451. },
  452. 'perf': {
  453. title: 'Perf Counters',
  454. icon: '<i class="fas fa-tachometer-alt"></i>',
  455. info: 'Performance Monitoring Counters (PMC). Data collected using <b>perf_event_open()</b> system call which utilises Hardware Performance Monitoring Units (PMU).'
  456. },
  457. 'vsphere': {
  458. title: 'vSphere',
  459. icon: '<i class="fas fa-server"></i>',
  460. info: 'Performance statistics for ESXI hosts and virtual machines. Data collected from <a href="https://www.vmware.com/products/vcenter-server.html">VMware vCenter Server</a> using <code><a href="https://github.com/vmware/govmomi"> govmomi</a></code> library.'
  461. },
  462. 'vcsa': {
  463. title: 'VCSA',
  464. icon: '<i class="fas fa-server"></i>',
  465. info: 'vCenter Server Appliance health statistics. Data collected from <a href="https://vmware.github.io/vsphere-automation-sdk-rest/vsphere/index.html#SVC_com.vmware.appliance.health">Health API</a>.'
  466. },
  467. 'zookeeper': {
  468. title: 'Zookeeper',
  469. icon: '<i class="fas fa-database"></i>',
  470. info: 'Provides health statistics for <b><a href="https://zookeeper.apache.org/">Zookeeper</a></b> server. Data collected through the command port using <code><a href="https://zookeeper.apache.org/doc/r3.5.5/zookeeperAdmin.html#sc_zkCommands">mntr</a></code> command.'
  471. },
  472. 'hdfs': {
  473. title: 'HDFS',
  474. icon: '<i class="fas fa-folder-open"></i>',
  475. info: 'Provides <b><a href="https://hadoop.apache.org/docs/r3.2.0/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html">Hadoop Distributed File System</a></b> performance statistics. Module collects metrics over <code>Java Management Extensions</code> through the web interface of an <code>HDFS</code> daemon.'
  476. },
  477. 'am2320': {
  478. title: 'AM2320 Sensor',
  479. icon: '<i class="fas fa-thermometer-half"></i>',
  480. info: 'Readings from the external AM2320 Sensor.'
  481. },
  482. 'scaleio': {
  483. title: 'ScaleIO',
  484. icon: '<i class="fas fa-database"></i>',
  485. info: 'Performance and health statistics for various ScaleIO components. Data collected via VxFlex OS Gateway REST API.'
  486. },
  487. 'squidlog': {
  488. title: 'Squid log',
  489. icon: '<i class="fas fa-file-alt"></i>',
  490. info: undefined
  491. },
  492. 'cockroachdb': {
  493. title: 'CockroachDB',
  494. icon: '<i class="fas fa-database"></i>',
  495. info: 'Performance and health statistics for various <code>CockroachDB</code> components.'
  496. },
  497. 'ebpf': {
  498. title: 'eBPF',
  499. icon: '<i class="fas fa-heartbeat"></i>',
  500. info: 'Monitor system calls, internal functions, bytes read, bytes written and errors using <code>eBPF</code>.'
  501. },
  502. 'filesystem': {
  503. title: 'Filesystem',
  504. icon: '<i class="fas fa-hdd"></i>',
  505. },
  506. 'vernemq': {
  507. title: 'VerneMQ',
  508. icon: '<i class="fas fa-comments"></i>',
  509. info: 'Performance data for the <b><a href="https://vernemq.com/">VerneMQ</a></b> open-source MQTT broker.'
  510. },
  511. 'pulsar': {
  512. title: 'Pulsar',
  513. icon: '<i class="fas fa-comments"></i>',
  514. info: 'Summary, namespaces and topics performance data for the <b><a href="http://pulsar.apache.org/">Apache Pulsar</a></b> pub-sub messaging system.'
  515. },
  516. 'anomalies': {
  517. title: 'Anomalies',
  518. icon: '<i class="fas fa-flask"></i>',
  519. info: 'Anomaly scores relating to key system metrics. A high anomaly probability indicates strange behaviour and may trigger an anomaly prediction from the trained models. Read the <a href="https://github.com/netdata/netdata/tree/master/collectors/python.d.plugin/anomalies" target="_blank">anomalies collector docs</a> for more details.'
  520. },
  521. 'alarms': {
  522. title: 'Alarms',
  523. icon: '<i class="fas fa-bell"></i>',
  524. info: 'Charts showing alarm status over time. More details <a href="https://github.com/netdata/netdata/blob/master/collectors/python.d.plugin/alarms/README.md" target="_blank">here</a>.'
  525. },
  526. 'statsd': {
  527. title: 'StatsD',
  528. icon: '<i class="fas fa-chart-line"></i>',
  529. info:'StatsD is an industry-standard technology stack for monitoring applications and instrumenting any piece of software to deliver custom metrics. Netdata allows the user to organize the metrics in different charts and visualize any application metric easily. Read more on <a href="https://learn.netdata.cloud/docs/agent/collectors/statsd.plugin">Netdata Learn</a>.'
  530. },
  531. 'supervisord': {
  532. title: 'Supervisord',
  533. icon: '<i class="fas fa-tasks"></i>',
  534. info: 'Detailed statistics for each group of processes controlled by <b><a href="http://supervisord.org/">Supervisor</a></b>. ' +
  535. 'Netdata collects these metrics using <a href="http://supervisord.org/api.html#supervisor.rpcinterface.SupervisorNamespaceRPCInterface.getAllProcessInfo" target="_blank"><code>getAllProcessInfo</code></a> method.'
  536. },
  537. 'systemdunits': {
  538. title: 'systemd units',
  539. icon: '<i class="fas fa-cogs"></i>',
  540. info: '<b>systemd</b> provides a dependency system between various entities called "units" of 11 different types. ' +
  541. 'Units encapsulate various objects that are relevant for system boot-up and maintenance. ' +
  542. 'Units may be <code>active</code> (meaning started, bound, plugged in, depending on the unit type), ' +
  543. 'or <code>inactive</code> (meaning stopped, unbound, unplugged), ' +
  544. 'as well as in the process of being activated or deactivated, i.e. between the two states (these states are called <code>activating</code>, <code>deactivating</code>). ' +
  545. 'A special <code>failed</code> state is available as well, which is very similar to <code>inactive</code> and is entered when the service failed in some way (process returned error code on exit, or crashed, an operation timed out, or after too many restarts). ' +
  546. 'For detailes, see <a href="https://www.freedesktop.org/software/systemd/man/systemd.html" target="_blank"> systemd(1)</a>.'
  547. },
  548. 'changefinder': {
  549. title: 'ChangeFinder',
  550. icon: '<i class="fas fa-flask"></i>',
  551. info: 'Online changepoint detection using machine learning. More details <a href="https://github.com/netdata/netdata/blob/master/collectors/python.d.plugin/changefinder/README.md" target="_blank">here</a>.'
  552. },
  553. 'zscores': {
  554. title: 'Z-Scores',
  555. icon: '<i class="fas fa-exclamation"></i>',
  556. info: 'Z scores scores relating to key system metrics.'
  557. },
  558. };
  559. // ----------------------------------------------------------------------------
  560. // submenus
  561. // information to be shown, just below each submenu
  562. // information about the submenus
  563. netdataDashboard.submenu = {
  564. 'web_log.squid_bandwidth': {
  565. title: 'bandwidth',
  566. info: 'Bandwidth of responses (<code>sent</code>) by squid. This chart may present unusual spikes, since the bandwidth is accounted at the time the log line is saved by the server, even if the time needed to serve it spans across a longer duration. We suggest to use QoS (e.g. <a href="http://firehol.org/#fireqos" target="_blank">FireQOS</a>) for accurate accounting of the server bandwidth.'
  567. },
  568. 'web_log.squid_responses': {
  569. title: 'responses',
  570. info: 'Information related to the responses sent by squid.'
  571. },
  572. 'web_log.squid_requests': {
  573. title: 'requests',
  574. info: 'Information related to the requests squid has received.'
  575. },
  576. 'web_log.squid_hierarchy': {
  577. title: 'hierarchy',
  578. info: 'Performance metrics for the squid hierarchy used to serve the requests.'
  579. },
  580. 'web_log.squid_squid_transport': {
  581. title: 'transport'
  582. },
  583. 'web_log.squid_squid_cache': {
  584. title: 'cache',
  585. info: 'Performance metrics for the performance of the squid cache.'
  586. },
  587. 'web_log.squid_timings': {
  588. title: 'timings',
  589. info: 'Duration of squid requests. Unrealistic spikes may be reported, since squid logs the total time of the requests, when they complete. Especially for HTTPS, the clients get a tunnel from the proxy and exchange requests directly with the upstream servers, so squid cannot evaluate the individual requests and reports the total time the tunnel was open.'
  590. },
  591. 'web_log.squid_clients': {
  592. title: 'clients'
  593. },
  594. 'web_log.bandwidth': {
  595. info: 'Bandwidth of requests (<code>received</code>) and responses (<code>sent</code>). <code>received</code> requires an extended log format (without it, the web server log does not have this information). This chart may present unusual spikes, since the bandwidth is accounted at the time the log line is saved by the web server, even if the time needed to serve it spans across a longer duration. We suggest to use QoS (e.g. <a href="http://firehol.org/#fireqos" target="_blank">FireQOS</a>) for accurate accounting of the web server bandwidth.'
  596. },
  597. 'web_log.urls': {
  598. info: 'Number of requests for each <code>URL pattern</code> defined in <a href="https://github.com/netdata/netdata/blob/master/collectors/python.d.plugin/web_log/web_log.conf" target="_blank"><code>/etc/netdata/python.d/web_log.conf</code></a>. This chart counts all requests matching the URL patterns defined, independently of the web server response codes (i.e. both successful and unsuccessful).'
  599. },
  600. 'web_log.clients': {
  601. info: 'Charts showing the number of unique client IPs, accessing the web server.'
  602. },
  603. 'web_log.timings': {
  604. info: 'Web server response timings - the time the web server needed to prepare and respond to requests. This requires an extended log format and its meaning is web server specific. For most web servers this accounts the time from the reception of a complete request, to the dispatch of the last byte of the response. So, it includes the network delays of responses, but it does not include the network delays of requests.'
  605. },
  606. 'mem.ksm': {
  607. title: 'deduper (ksm)',
  608. info: 'Kernel Same-page Merging (KSM) performance monitoring, read from several files in <code>/sys/kernel/mm/ksm/</code>. KSM is a memory-saving de-duplication feature in the Linux kernel (since version 2.6.32). The KSM daemon ksmd periodically scans those areas of user memory which have been registered with it, looking for pages of identical content which can be replaced by a single write-protected page (which is automatically copied if a process later wants to update its content). KSM was originally developed for use with KVM (where it was known as Kernel Shared Memory), to fit more virtual machines into physical memory, by sharing the data common between them. But it can be useful to any application which generates many instances of the same data.'
  609. },
  610. 'mem.hugepages': {
  611. info: 'Hugepages is a feature that allows the kernel to utilize the multiple page size capabilities of modern hardware architectures. The kernel creates multiple pages of virtual memory, mapped from both physical RAM and swap. There is a mechanism in the CPU architecture called "Translation Lookaside Buffers" (TLB) to manage the mapping of virtual memory pages to actual physical memory addresses. The TLB is a limited hardware resource, so utilizing a large amount of physical memory with the default page size consumes the TLB and adds processing overhead. By utilizing Huge Pages, the kernel is able to create pages of much larger sizes, each page consuming a single resource in the TLB. Huge Pages are pinned to physical RAM and cannot be swapped/paged out.'
  612. },
  613. 'mem.numa': {
  614. info: 'Non-Uniform Memory Access (NUMA) is a hierarchical memory design the memory access time is dependent on locality. Under NUMA, a processor can access its own local memory faster than non-local memory (memory local to another processor or memory shared between processors). The individual metrics are described in the <a href="https://www.kernel.org/doc/Documentation/numastat.txt" target="_blank">Linux kernel documentation</a>.'
  615. },
  616. 'ip.ecn': {
  617. info: '<a href="https://en.wikipedia.org/wiki/Explicit_Congestion_Notification" target="_blank">Explicit Congestion Notification (ECN)</a> '+
  618. 'is an extension to the IP and to the TCP that allows end-to-end notification of network congestion without dropping packets. '+
  619. 'ECN is an optional feature that may be used between two ECN-enabled endpoints when '+
  620. 'the underlying network infrastructure also supports it.'
  621. },
  622. 'ip.multicast': {
  623. info: '<a href="https://en.wikipedia.org/wiki/Multicast" target="_blank">IP multicast</a> is a technique for '+
  624. 'one-to-many communication over an IP network. '+
  625. 'Multicast uses network infrastructure efficiently by requiring the source to send a packet only once, '+
  626. 'even if it needs to be delivered to a large number of receivers. '+
  627. 'The nodes in the network take care of replicating the packet to reach multiple receivers only when necessary.'
  628. },
  629. 'ip.broadcast': {
  630. info: 'In computer networking, '+
  631. '<a href="https://en.wikipedia.org/wiki/Broadcasting_(networking)" target="_blank">broadcasting</a> refers to transmitting a packet that will be received by every device on the network. '+
  632. 'In practice, the scope of the broadcast is limited to a broadcast domain.'
  633. },
  634. 'netfilter.conntrack': {
  635. title: 'connection tracker',
  636. info: 'Netfilter Connection Tracker performance metrics. The connection tracker keeps track of all connections of the machine, inbound and outbound. It works by keeping a database with all open connections, tracking network and address translation and connection expectations.'
  637. },
  638. 'netfilter.nfacct': {
  639. title: 'bandwidth accounting',
  640. info: 'The following information is read using the <code>nfacct.plugin</code>.'
  641. },
  642. 'netfilter.synproxy': {
  643. title: 'DDoS protection',
  644. info: 'DDoS protection performance metrics. <a href="https://github.com/firehol/firehol/wiki/Working-with-SYNPROXY" target="_blank">SYNPROXY</a> is a TCP SYN packets proxy. It is used to protect any TCP server (like a web server) from SYN floods and similar DDoS attacks. It is a netfilter module, in the Linux kernel (since version 3.12). It is optimized to handle millions of packets per second utilizing all CPUs available without any concurrency locking between the connections. It can be used for any kind of TCP traffic (even encrypted), since it does not interfere with the content itself.'
  645. },
  646. 'ipfw.dynamic_rules': {
  647. title: 'dynamic rules',
  648. info: 'Number of dynamic rules, created by correspondent stateful firewall rules.'
  649. },
  650. 'system.softnet_stat': {
  651. title: 'softnet',
  652. info: function (os) {
  653. if (os === 'linux')
  654. return 'Statistics for CPUs SoftIRQs related to network receive work. Break down per CPU core can be found at <a href="#menu_cpu_submenu_softnet_stat">CPU / softnet statistics</a>. <b>processed</b> states the number of packets processed, <b>dropped</b> is the number packets dropped because the network device backlog was full (to fix them on Linux use <code>sysctl</code> to increase <code>net.core.netdev_max_backlog</code>), <b>squeezed</b> is the number of packets dropped because the network device budget ran out (to fix them on Linux use <code>sysctl</code> to increase <code>net.core.netdev_budget</code> and/or <code>net.core.netdev_budget_usecs</code>). More information about identifying and troubleshooting network driver related issues can be found at <a href="https://access.redhat.com/sites/default/files/attachments/20150325_network_performance_tuning.pdf" target="_blank">Red Hat Enterprise Linux Network Performance Tuning Guide</a>.';
  655. else
  656. return 'Statistics for CPUs SoftIRQs related to network receive work.';
  657. }
  658. },
  659. 'cpu.softnet_stat': {
  660. title: 'softnet',
  661. info: function (os) {
  662. if (os === 'linux')
  663. return 'Statistics for per CPUs core SoftIRQs related to network receive work. Total for all CPU cores can be found at <a href="#menu_system_submenu_softnet_stat">System / softnet statistics</a>. <b>processed</b> states the number of packets processed, <b>dropped</b> is the number packets dropped because the network device backlog was full (to fix them on Linux use <code>sysctl</code> to increase <code>net.core.netdev_max_backlog</code>), <b>squeezed</b> is the number of packets dropped because the network device budget ran out (to fix them on Linux use <code>sysctl</code> to increase <code>net.core.netdev_budget</code> and/or <code>net.core.netdev_budget_usecs</code>). More information about identifying and troubleshooting network driver related issues can be found at <a href="https://access.redhat.com/sites/default/files/attachments/20150325_network_performance_tuning.pdf" target="_blank">Red Hat Enterprise Linux Network Performance Tuning Guide</a>.';
  664. else
  665. return 'Statistics for per CPUs core SoftIRQs related to network receive work. Total for all CPU cores can be found at <a href="#menu_system_submenu_softnet_stat">System / softnet statistics</a>.';
  666. }
  667. },
  668. 'go_expvar.memstats': {
  669. title: 'memory statistics',
  670. info: 'Go runtime memory statistics. See <a href="https://golang.org/pkg/runtime/#MemStats" target="_blank">runtime.MemStats</a> documentation for more info about each chart and the values.'
  671. },
  672. 'couchdb.dbactivity': {
  673. title: 'db activity',
  674. info: 'Overall database reads and writes for the entire server. This includes any external HTTP traffic, as well as internal replication traffic performed in a cluster to ensure node consistency.'
  675. },
  676. 'couchdb.httptraffic': {
  677. title: 'http traffic breakdown',
  678. info: 'All HTTP traffic, broken down by type of request (<tt>GET</tt>, <tt>PUT</tt>, <tt>POST</tt>, etc.) and response status code (<tt>200</tt>, <tt>201</tt>, <tt>4xx</tt>, etc.)<br/><br/>Any <tt>5xx</tt> errors here indicate a likely CouchDB bug; check the logfile for further information.'
  679. },
  680. 'couchdb.ops': {
  681. title: 'server operations'
  682. },
  683. 'couchdb.perdbstats': {
  684. title: 'per db statistics',
  685. info: 'Statistics per database. This includes <a href="http://docs.couchdb.org/en/latest/api/database/common.html#get--db">3 size graphs per database</a>: active (the size of live data in the database), external (the uncompressed size of the database contents), and file (the size of the file on disk, exclusive of any views and indexes). It also includes the number of documents and number of deleted documents per database.'
  686. },
  687. 'couchdb.erlang': {
  688. title: 'erlang statistics',
  689. info: 'Detailed information about the status of the Erlang VM that hosts CouchDB. These are intended for advanced users only. High values of the peak message queue (>10e6) generally indicate an overload condition.'
  690. },
  691. 'ntpd.system': {
  692. title: 'system',
  693. info: 'Statistics of the system variables as shown by the readlist billboard <code>ntpq -c rl</code>. System variables are assigned an association ID of zero and can also be shown in the readvar billboard <code>ntpq -c "rv 0"</code>. These variables are used in the <a href="http://doc.ntp.org/current-stable/discipline.html">Clock Discipline Algorithm</a>, to calculate the lowest and most stable offset.'
  694. },
  695. 'ntpd.peers': {
  696. title: 'peers',
  697. info: 'Statistics of the peer variables for each peer configured in <code>/etc/ntp.conf</code> as shown by the readvar billboard <code>ntpq -c "rv &lt;association&gt;"</code>, while each peer is assigned a nonzero association ID as shown by <code>ntpq -c "apeers"</code>. The module periodically scans for new/changed peers (default: every 60s). <b>ntpd</b> selects the best possible peer from the available peers to synchronize the clock. A minimum of at least 3 peers is required to properly identify the best possible peer.'
  698. },
  699. 'mem.page_cache': {
  700. title: 'page cache (eBPF)',
  701. info: 'Monitor calls to functions used to manipulate <a href="https://en.wikipedia.org/wiki/Page_cache" target="_blank">Linux page cache</a>. When integration with apps is <a href="https://learn.netdata.cloud/guides/troubleshoot/monitor-debug-applications-ebpf" target="_blank">enabled</a>, Netdata also shows page cache manipulation per <a href="#menu_apps_submenu_page_cache">application</a>.'
  702. },
  703. 'apps.page_cache': {
  704. title: 'page cache (eBPF)',
  705. info: 'Netdata also gives a summary for these charts in <a href="#menu_mem_submenu_page_cache">Memory submenu</a>.'
  706. },
  707. 'filesystem.vfs': {
  708. title: 'vfs (eBPF)',
  709. info: 'Monitor calls to functions used to manipulate <a href="https://learn.netdata.cloud/docs/agent/collectors/ebpf.plugin#vfs" target="_blank">File Systems</a>. When integration with apps is <a href="https://learn.netdata.cloud/guides/troubleshoot/monitor-debug-applications-ebpf" target="_blank">enabled</a>, Netdata also shows Virtual File System per <a href="#menu_apps_submenu_vfs">application</a>.'
  710. },
  711. 'apps.vfs': {
  712. title: 'vfs (eBPF)',
  713. info: 'Netdata also gives a summary for these charts in <a href="#menu_filesystem_submenu_vfs">Filesystem submenu</a>.'
  714. },
  715. 'filesystem.ext4_latency': {
  716. info: 'Latency is the time it takes for an event to be completed. We calculate the difference between the calling and return times, this spans disk I/O, file system operations (lock, I/O), run queue latency and all events related to the monitored action. Based on the eBPF <a href="http://www.brendangregg.com/blog/2016-10-06/linux-bcc-ext4dist-ext4slower.html" target="_blank">ext4dist</a> from BCC tools.'
  717. },
  718. 'filesystem.xfs_latency': {
  719. info: 'Latency is the time it takes for an event to be completed. We calculate the difference between the calling and return times, this spans disk I/O, file system operations (lock, I/O), run queue latency and all events related to the monitored action. Based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/xfsdist_example.txt" target="_blank">xfsdist</a> from BCC tools.'
  720. },
  721. 'filesystem.nfs_latency': {
  722. info: 'Latency is the time it takes for an event to be completed. We calculate the difference between the calling and return times, this spans disk I/O, file system operations (lock, I/O), run queue latency and all events related to the monitored action. Based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/nfsdist_example.txt" target="_blank">nfsdist</a> from BCC tools.'
  723. },
  724. 'filesystem.zfs_latency': {
  725. info: 'Latency is the time it takes for an event to be completed. We calculate the difference between the calling and return times, this spans disk I/O, file system operations (lock, I/O), run queue latency and all events related to the monitored action. Based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/zfsdist_example.txt" target="_blank">zfsdist</a> from BCC tools.'
  726. },
  727. 'filesystem.btrfs_latency': {
  728. info: 'Latency is the time it takes for an event to be completed. We calculate the difference between the calling and return times, we get the logarithmic for the final result and we sum one value to the respective bin. Based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/btrfsdist_example.txt" target="_blank">btrfsdist</a> from BCC tools.'
  729. },
  730. 'filesystem.file_access': {
  731. title: 'file access (eBPF)',
  732. info: 'When integration with apps is <a href="https://learn.netdata.cloud/guides/troubleshoot/monitor-debug-applications-ebpf" target="_blank">enabled</a>, Netdata also shows file access per <a href="#menu_apps_submenu_file_access">application</a>.'
  733. },
  734. 'apps.file_access': {
  735. title: 'file access (eBPF)',
  736. info: 'Netdata also gives a summary for this chart on <a href="#menu_filesystem_submenu_file_access">Filesystem submenu</a> (more details on <a href="https://learn.netdata.cloud/docs/agent/collectors/ebpf.plugin#file" target="_blank">eBPF plugin file chart section</a>).'
  737. },
  738. 'ip.kernel': {
  739. title: 'kernel functions',
  740. info: 'Next charts are made when <code>ebpf.plugin</code> is running on your host. When integration with apps is <a href="https://learn.netdata.cloud/guides/troubleshoot/monitor-debug-applications-ebpf" target="_blank">enabled</a>, Netdata also shows calls for kernel functions per <a href="#menu_apps_submenu_net">application</a>.'
  741. },
  742. 'apps.net': {
  743. title: 'network',
  744. info: 'Netdata also gives a summary for eBPF charts in <a href="#menu_ip_submenu_kernel">Networking Stack submenu</a>.'
  745. },
  746. 'system.ipc semaphores': {
  747. info: 'System V semaphores is an inter-process communication (IPC) mechanism. '+
  748. 'It allows processes or threads within a process to synchronize their actions. '+
  749. 'They are often used to monitor and control the availability of system resources such as shared memory segments. ' +
  750. 'For details, see <a href="https://man7.org/linux/man-pages/man7/svipc.7.html" target="_blank">svipc(7)</a>. ' +
  751. 'To see the host IPC semaphore information, run <code>ipcs -us</code>. For limits, run <code>ipcs -ls</code>.'
  752. },
  753. 'system.ipc shared memory': {
  754. info: 'System V shared memory is an inter-process communication (IPC) mechanism. '+
  755. 'It allows processes to communicate information by sharing a region of memory. '+
  756. 'It is the fastest form of inter-process communication available since no kernel involvement occurs when data is passed between the processes (no copying). '+
  757. 'Typically, processes must synchronize their access to a shared memory object, using, for example, POSIX semaphores. '+
  758. 'For details, see <a href="https://man7.org/linux/man-pages/man7/svipc.7.html" target="_blank">svipc(7)</a>. '+
  759. 'To see the host IPC shared memory information, run <code>ipcs -um</code>. For limits, run <code>ipcs -lm</code>.'
  760. },
  761. 'system.ipc message queues': {
  762. info: 'System V message queues is an inter-process communication (IPC) mechanism. '+
  763. 'It allow processes to exchange data in the form of messages. '+
  764. 'For details, see <a href="https://man7.org/linux/man-pages/man7/svipc.7.html" target="_blank">svipc(7)</a>. ' +
  765. 'To see the host IPC messages information, run <code>ipcs -uq</code>. For limits, run <code>ipcs -lq</code>.'
  766. },
  767. 'system.interrupts': {
  768. info: '<a href="https://en.wikipedia.org/wiki/Interrupt" target="_blank"><b>Interrupts</b></a> are signals '+
  769. 'sent to the CPU by external devices (normally I/O devices) or programs (running processes). '+
  770. 'They tell the CPU to stop its current activities and execute the appropriate part of the operating system. '+
  771. 'Interrupt types are '+
  772. '<b>hardware</b> (generated by hardware devices to signal that they need some attention from the OS), '+
  773. '<b>software</b> (generated by programs when they want to request a system call to be performed by the operating system), and '+
  774. '<b>traps</b> (generated by the CPU itself to indicate that some error or condition occurred for which assistance from the operating system is needed).'
  775. },
  776. 'cpu.interrupts': {
  777. info: 'Total number of interrupts per CPU. '+
  778. 'To see the total number for the system check the <a href="#menu_system_submenu_interrupts">interrupts</a> section. '+
  779. 'The last column in <code>/proc/interrupts</code> provides an interrupt description or the device name that registered the handler for that interrupt.'
  780. },
  781. };
  782. // ----------------------------------------------------------------------------
  783. // chart
  784. // information works on the context of a chart
  785. // Its purpose is to set:
  786. //
  787. // info: the text above the charts
  788. // heads: the representation of the chart at the top the subsection (second level menu)
  789. // mainheads: the representation of the chart at the top of the section (first level menu)
  790. // colors: the dimension colors of the chart (the default colors are appended)
  791. // height: the ratio of the chart height relative to the default
  792. //
  793. var cgroupCPULimitIsSet = 0;
  794. var cgroupMemLimitIsSet = 0;
  795. netdataDashboard.context = {
  796. 'system.cpu': {
  797. info: function (os) {
  798. void (os);
  799. return 'Total CPU utilization (all cores). 100% here means there is no CPU idle time at all. You can get per core usage at the <a href="#menu_cpu">CPUs</a> section and per application usage at the <a href="#menu_apps">Applications Monitoring</a> section.'
  800. + netdataDashboard.sparkline('<br/>Keep an eye on <b>iowait</b> ', 'system.cpu', 'iowait', '%', '. If it is constantly high, your disks are a bottleneck and they slow your system down.')
  801. + netdataDashboard.sparkline('<br/>An important metric worth monitoring, is <b>softirq</b> ', 'system.cpu', 'softirq', '%', '. A constantly high percentage of softirq may indicate network driver issues.');
  802. },
  803. valueRange: "[0, 100]"
  804. },
  805. 'system.load': {
  806. info: 'Current system load, i.e. the number of processes using CPU or waiting for system resources (usually CPU and disk). The 3 metrics refer to 1, 5 and 15 minute averages. The system calculates this once every 5 seconds. For more information check <a href="https://en.wikipedia.org/wiki/Load_(computing)" target="_blank">this wikipedia article</a>.',
  807. height: 0.7
  808. },
  809. 'system.cpu_pressure': {
  810. info: '<a href="https://www.kernel.org/doc/html/latest/accounting/psi.html">Pressure Stall Information</a> ' +
  811. 'identifies and quantifies the disruptions caused by resource contentions. ' +
  812. 'The "some" line indicates the share of time in which at least <b>some</b> tasks are stalled on CPU. ' +
  813. 'The ratios (in %) are tracked as recent trends over 10-, 60-, and 300-second windows.'
  814. },
  815. 'system.memory_some_pressure': {
  816. info: '<a href="https://www.kernel.org/doc/html/latest/accounting/psi.html">Pressure Stall Information</a> ' +
  817. 'identifies and quantifies the disruptions caused by resource contentions. ' +
  818. 'The "some" line indicates the share of time in which at least <b>some</b> tasks are stalled on memory. ' +
  819. 'The "full" line indicates the share of time in which <b>all non-idle</b> tasks are stalled on memory simultaneously. ' +
  820. 'In this state actual CPU cycles are going to waste, and a workload that spends extended time in this state is considered to be thrashing. ' +
  821. 'The ratios (in %) are tracked as recent trends over 10-, 60-, and 300-second windows.'
  822. },
  823. 'system.io_some_pressure': {
  824. info: '<a href="https://www.kernel.org/doc/html/latest/accounting/psi.html">Pressure Stall Information</a> ' +
  825. 'identifies and quantifies the disruptions caused by resource contentions. ' +
  826. 'The "some" line indicates the share of time in which at least <b>some</b> tasks are stalled on I/O. ' +
  827. 'The "full" line indicates the share of time in which <b>all non-idle</b> tasks are stalled on I/O simultaneously. ' +
  828. 'In this state actual CPU cycles are going to waste, and a workload that spends extended time in this state is considered to be thrashing. ' +
  829. 'The ratios (in %) are tracked as recent trends over 10-, 60-, and 300-second windows.'
  830. },
  831. 'system.io': {
  832. info: function (os) {
  833. var s = 'Total Disk I/O, for all physical disks. You can get detailed information about each disk at the <a href="#menu_disk">Disks</a> section and per application Disk usage at the <a href="#menu_apps">Applications Monitoring</a> section.';
  834. if (os === 'linux')
  835. return s + ' Physical are all the disks that are listed in <code>/sys/block</code>, but do not exist in <code>/sys/devices/virtual/block</code>.';
  836. else
  837. return s;
  838. }
  839. },
  840. 'system.pgpgio': {
  841. info: 'Memory paged from/to disk. This is usually the total disk I/O of the system.'
  842. },
  843. 'system.swapio': {
  844. info: 'Total Swap I/O. (netdata measures both <code>in</code> and <code>out</code>. If either of the metrics <code>in</code> or <code>out</code> is not shown in the chart, the reason is that the metric is zero. - you can change the page settings to always render all the available dimensions on all charts).'
  845. },
  846. 'system.pgfaults': {
  847. info: 'Total page faults. <b>Major page faults</b> indicates that the system is using its swap. You can find which applications use the swap at the <a href="#menu_apps">Applications Monitoring</a> section.'
  848. },
  849. 'system.entropy': {
  850. colors: '#CC22AA',
  851. info: '<a href="https://en.wikipedia.org/wiki/Entropy_(computing)" target="_blank">Entropy</a>, is a pool of random numbers (<a href="https://en.wikipedia.org/wiki//dev/random" target="_blank">/dev/random</a>) that is mainly used in cryptography. If the pool of entropy gets empty, processes requiring random numbers may run a lot slower (it depends on the interface each program uses), waiting for the pool to be replenished. Ideally a system with high entropy demands should have a hardware device for that purpose (TPM is one such device). There are also several software-only options you may install, like <code>haveged</code>, although these are generally useful only in servers.'
  852. },
  853. 'system.clock_sync_state': {
  854. info: 'State map: 0 - not synchronized, 1 - synchronized'
  855. },
  856. 'system.forks': {
  857. colors: '#5555DD',
  858. info: 'Number of new processes created.'
  859. },
  860. 'system.intr': {
  861. colors: '#DD5555',
  862. info: 'Total number of CPU interrupts. Check <code>system.interrupts</code> that gives more detail about each interrupt and also the <a href="#menu_cpu">CPUs</a> section where interrupts are analyzed <a href="#menu_cpu_submenu_interrupts">per CPU core</a>.'
  863. },
  864. 'system.interrupts': {
  865. info: 'CPU interrupts in detail. At the <a href="#menu_cpu">CPUs</a> section, interrupts are analyzed <a href="#menu_cpu_submenu_interrupts">per CPU core</a>. '+
  866. 'The last column in <code>/proc/interrupts</code> provides an interrupt description or the device name that registered the handler for that interrupt.'
  867. },
  868. 'system.hardirq_latency': {
  869. info: 'Total time spent servicing hardware interrupts. Based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/hardirqs_example.txt" target="_blank">hardirqs</a> from BCC tools.'
  870. },
  871. 'system.softirqs': {
  872. info: 'CPU softirqs in detail. At the <a href="#menu_cpu">CPUs</a> section, softirqs are analyzed per CPU core.'
  873. },
  874. 'system.softirq_latency': {
  875. info: 'Total time spent servicing software interrupts. Based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/softirqs_example.txt" target="_blank">softirqs</a> from BCC tools.'
  876. },
  877. 'system.processes': {
  878. info: 'System processes. <b>Running</b> are the processes in the CPU. <b>Blocked</b> are processes that are willing to enter the CPU, but they cannot, e.g. because they wait for disk activity.'
  879. },
  880. 'system.active_processes': {
  881. info: 'All system processes.'
  882. },
  883. 'system.ctxt': {
  884. info: '<a href="https://en.wikipedia.org/wiki/Context_switch" target="_blank">Context Switches</a>, is the switching of the CPU from one process, task or thread to another. If there are many processes or threads willing to execute and very few CPU cores available to handle them, the system is making more context switching to balance the CPU resources among them. The whole process is computationally intensive. The more the context switches, the slower the system gets.'
  885. },
  886. 'system.idlejitter': {
  887. info: 'Idle jitter is calculated by netdata. A thread is spawned that requests to sleep for a few microseconds. When the system wakes it up, it measures how many microseconds have passed. The difference between the requested and the actual duration of the sleep, is the <b>idle jitter</b>. This number is useful in real-time environments, where CPU jitter can affect the quality of the service (like VoIP media gateways).'
  888. },
  889. 'system.net': {
  890. info: function (os) {
  891. var s = 'Total bandwidth of all physical network interfaces. This does not include <code>lo</code>, VPNs, network bridges, IFB devices, bond interfaces, etc. Only the bandwidth of physical network interfaces is aggregated.';
  892. if (os === 'linux')
  893. return s + ' Physical are all the network interfaces that are listed in <code>/proc/net/dev</code>, but do not exist in <code>/sys/devices/virtual/net</code>.';
  894. else
  895. return s;
  896. }
  897. },
  898. 'system.ip': {
  899. info: 'Total IP traffic in the system.'
  900. },
  901. 'system.ipv4': {
  902. info: 'Total IPv4 Traffic.'
  903. },
  904. 'system.ipv6': {
  905. info: 'Total IPv6 Traffic.'
  906. },
  907. 'system.ram': {
  908. info: 'System Random Access Memory (i.e. physical memory) usage.'
  909. },
  910. 'system.swap': {
  911. info: 'System swap memory usage. Swap space is used when the amount of physical memory (RAM) is full. When the system needs more memory resources and the RAM is full, inactive pages in memory are moved to the swap space (usually a disk, a disk partition or a file).'
  912. },
  913. 'system.swapcalls': {
  914. info: 'Monitor calls to functions <code>swap_readpage</code> and <code>swap_writepage</code>. When integration with apps is <a href="https://learn.netdata.cloud/guides/troubleshoot/monitor-debug-applications-ebpf" target="_blank">enabled</a>, Netdata also shows swap access per <a href="#menu_apps_submenu_swap">application</a>.'
  915. },
  916. 'system.ipc_semaphores': {
  917. info: 'Number of allocated System V IPC semaphores. '+
  918. 'The system-wide limit on the number of semaphores in all semaphore sets is specified in <code>/proc/sys/kernel/sem</code> file (2nd field).'
  919. },
  920. 'system.ipc_semaphore_arrays': {
  921. info: 'Number of used System V IPC semaphore arrays (sets). Semaphores support semaphore sets where each one is a counting semaphore. '+
  922. 'So when an application requests semaphores, the kernel releases them in sets. '+
  923. 'The system-wide limit on the maximum number of semaphore sets is specified in <code>/proc/sys/kernel/sem</code> file (4th field).'
  924. },
  925. 'system.shared_memory_segments': {
  926. info: 'Number of allocated System V IPC memory segments. '+
  927. 'The system-wide maximum number of shared memory segments that can be created is specified in <code>/proc/sys/kernel/shmmni</code> file.'
  928. },
  929. 'system.shared_memory_bytes': {
  930. info: 'Amount of memory currently used by System V IPC memory segments. '+
  931. 'The run-time limit on the maximum shared memory segment size that can be created is specified in <code>/proc/sys/kernel/shmmax</code> file.'
  932. },
  933. 'system.message_queue_messages': {
  934. info: 'Number of messages that are currently present in System V IPC message queues.'
  935. },
  936. 'system.message_queue_bytes': {
  937. info: 'Amount of memory currently used by messages in System V IPC message queues.'
  938. },
  939. 'system.uptime': {
  940. info: 'The amount of time the system has been running, including time spent in suspend.'
  941. },
  942. // ------------------------------------------------------------------------
  943. // CPU charts
  944. 'cpu.cpu': {
  945. commonMin: true,
  946. commonMax: true,
  947. valueRange: "[0, 100]"
  948. },
  949. 'cpu.interrupts': {
  950. commonMin: true,
  951. commonMax: true
  952. },
  953. 'cpu.softirqs': {
  954. commonMin: true,
  955. commonMax: true
  956. },
  957. 'cpu.softnet_stat': {
  958. commonMin: true,
  959. commonMax: true
  960. },
  961. // ------------------------------------------------------------------------
  962. // MEMORY
  963. 'mem.ksm_savings': {
  964. heads: [
  965. netdataDashboard.gaugeChart('Saved', '12%', 'savings', '#0099CC')
  966. ]
  967. },
  968. 'mem.ksm_ratios': {
  969. heads: [
  970. function (os, id) {
  971. void (os);
  972. return '<div data-netdata="' + id + '"'
  973. + ' data-gauge-max-value="100"'
  974. + ' data-chart-library="gauge"'
  975. + ' data-title="Savings"'
  976. + ' data-units="percentage %"'
  977. + ' data-gauge-adjust="width"'
  978. + ' data-width="12%"'
  979. + ' data-before="0"'
  980. + ' data-after="-CHART_DURATION"'
  981. + ' data-points="CHART_DURATION"'
  982. + ' role="application"></div>';
  983. }
  984. ]
  985. },
  986. 'mem.zram_usage': {
  987. info: 'ZRAM total RAM usage metrics. ZRAM uses some memory to store metadata about stored memory pages, thus introducing an overhead which is proportional to disk size. It excludes same-element-filled-pages since no memory is allocated for them.'
  988. },
  989. 'mem.zram_savings': {
  990. info: 'Displays original and compressed memory data sizes.'
  991. },
  992. 'mem.zram_ratio': {
  993. heads: [
  994. netdataDashboard.gaugeChart('Compression Ratio', '12%', 'ratio', '#0099CC')
  995. ],
  996. info: 'Compression ratio, calculated as <code>100 * original_size / compressed_size</code>. More means better compression and more RAM savings.'
  997. },
  998. 'mem.zram_efficiency': {
  999. heads: [
  1000. netdataDashboard.gaugeChart('Efficiency', '12%', 'percent', NETDATA.colors[0])
  1001. ],
  1002. commonMin: true,
  1003. commonMax: true,
  1004. valueRange: "[0, 100]",
  1005. info: 'Memory usage efficiency, calculated as <code>100 * compressed_size / total_mem_used</code>.'
  1006. },
  1007. 'mem.pgfaults': {
  1008. info: 'A <a href="https://en.wikipedia.org/wiki/Page_fault" target="_blank">page fault</a> is a type of interrupt, called trap, raised by computer hardware when a running program accesses a memory page that is mapped into the virtual address space, but not actually loaded into main memory. If the page is loaded in memory at the time the fault is generated, but is not marked in the memory management unit as being loaded in memory, then it is called a <b>minor</b> or soft page fault. A <b>major</b> page fault is generated when the system needs to load the memory page from disk or swap memory.'
  1009. },
  1010. 'mem.committed': {
  1011. colors: NETDATA.colors[3],
  1012. info: 'Committed Memory, is the sum of all memory which has been allocated by processes.'
  1013. },
  1014. 'mem.available': {
  1015. info: 'Available Memory is estimated by the kernel, as the amount of RAM that can be used by userspace processes, without causing swapping.'
  1016. },
  1017. 'mem.writeback': {
  1018. info: '<b>Dirty</b> is the amount of memory waiting to be written to disk. <b>Writeback</b> is how much memory is actively being written to disk.'
  1019. },
  1020. 'mem.kernel': {
  1021. info: 'The total amount of memory being used by the kernel. '+
  1022. '<b>Slab</b> is the memory used by the kernel to cache data structures for its own use. '+
  1023. '<b>KernelStack</b> is the memory allocated for each task done by the kernel. '+
  1024. '<b>PageTables</b> is the memory dedicated to the lowest level of page tables (A page table is used to turn a virtual address into a physical memory address). '+
  1025. '<b>VmallocUsed</b> is the memory being used as virtual address space. '+
  1026. '<b>Percpu</b> is the memory allocated to the per-CPU allocator used to back per-CPU allocations (excludes the cost of metadata). '+
  1027. 'When you create a per-CPU variable, each processor on the system gets its own copy of that variable.'
  1028. },
  1029. 'mem.slab': {
  1030. info: '<b>Reclaimable</b> is the amount of memory which the kernel can reuse. <b>Unreclaimable</b> can not be reused even when the kernel is lacking memory.'
  1031. },
  1032. 'mem.hugepages': {
  1033. info: 'Dedicated (or Direct) HugePages is memory reserved for applications configured to utilize huge pages. Hugepages are <b>used</b> memory, even if there are free hugepages available.'
  1034. },
  1035. 'mem.transparent_hugepages': {
  1036. info: 'Transparent HugePages (THP) is backing virtual memory with huge pages, supporting automatic promotion and demotion of page sizes. It works for all applications for anonymous memory mappings and tmpfs/shmem.'
  1037. },
  1038. 'mem.hwcorrupt': {
  1039. info: 'The amount of memory with physical corruption problems, identified by <a href="https://en.wikipedia.org/wiki/ECC_memory" target="_blank">ECC</a> and set aside by the kernel so it does not get used.'
  1040. },
  1041. 'mem.cachestat_ratio': {
  1042. info: 'When the processor needs to read or write a location in main memory, it checks for a corresponding entry in the page cache. If the entry is there, a page cache hit has occurred and the read is from the cache. If the entry is not there, a page cache miss has occurred and the kernel allocates a new entry and copies in data from the disk. Netdata calculates the percentage of accessed files that are cached on memory. <a href="https://github.com/iovisor/bcc/blob/master/tools/cachestat.py#L126-L138" target="_blank">The ratio</a> is calculated counting the accessed cached pages (without counting dirty pages and pages added because of read misses) divided by total access without dirty pages.'
  1043. },
  1044. 'mem.cachestat_dirties': {
  1045. info: 'Number of <a href="https://en.wikipedia.org/wiki/Page_cache#Memory_conservation" target="_blank">dirty(modified) pages</a> cache. Pages in the page cache modified after being brought in are called dirty pages. Since non-dirty pages in the page cache have identical copies in <a href="https://en.wikipedia.org/wiki/Secondary_storage" target="_blank">secondary storage</a> (e.g. hard disk drive or solid-state drive), discarding and reusing their space is much quicker than paging out application memory, and is often preferred over flushing the dirty pages into secondary storage and reusing their space.'
  1046. },
  1047. 'mem.cachestat_hits': {
  1048. info: 'When the processor needs to read or write a location in main memory, it checks for a corresponding entry in the page cache. If the entry is there, a page cache hit has occurred and the read is from the cache. Hits show pages accessed that were not modified (we are excluding dirty pages), this counting also excludes the recent pages inserted for read.'
  1049. },
  1050. 'mem.cachestat_misses': {
  1051. info: 'When the processor needs to read or write a location in main memory, it checks for a corresponding entry in the page cache. If the entry is not there, a page cache miss has occurred and the cache allocates a new entry and copies in data for the main memory. Misses count page insertions to the memory not related to writing.'
  1052. },
  1053. 'mem.sync': {
  1054. info: 'System calls for <a href="https://man7.org/linux/man-pages/man2/sync.2.html" target="_blank">sync() and syncfs()</a> which flush the file system buffers to storage devices. Performance perturbations might be caused by these calls. The <code>sync()</code> calls are based on the eBPF <a href="https://github.com/iovisor/bcc/blob/master/tools/syncsnoop.py" target="_blank">syncsnoop</a> from BCC tools.'
  1055. },
  1056. 'mem.file_sync': {
  1057. info: 'System calls for <a href="https://man7.org/linux/man-pages/man2/fsync.2.html" target="_blank">fsync() and fdatasync()</a> transfer all modified page caches for the files on disk devices. These calls block until the device reports that the transfer has been completed.'
  1058. },
  1059. 'mem.memory_map': {
  1060. info: 'System calls for <a href="https://man7.org/linux/man-pages/man2/msync.2.html" target="_blank">msync()</a> which flushes changes made to the in-core copy of a file that was mapped.'
  1061. },
  1062. 'mem.file_segment': {
  1063. info: 'System calls for <a href="https://man7.org/linux/man-pages/man2/sync_file_range.2.html" target="_blank">sync_file_range()</a> permits fine control when synchronizing the open file referred to by the file descriptor fd with disk. This system call is extremely dangerous and should not be used in portable programs.'
  1064. },
  1065. 'filesystem.dc_hit_ratio': {
  1066. info: 'Percentage of file accesses that were present in the directory cache. 100% means that every file that was accessed was present in the directory cache. If files are not present in the directory cache 1) they are not present in the file system, 2) the files were not accessed before. Read more about <a href="https://www.kernel.org/doc/htmldocs/filesystems/the_directory_cache.html" target="_blank">directory cache</a>. When integration with apps is <a href="https://learn.netdata.cloud/guides/troubleshoot/monitor-debug-applications-ebpf" target="_blank">enabled</a>, Netdata also shows directory cache per <a href="#menu_apps_submenu_directory_cache__eBPF_">application</a>.'
  1067. },
  1068. 'filesystem.dc_reference': {
  1069. info: 'Counters of file accesses. <code>Reference</code> is when there is a file access and the file is not present in the directory cache. <code>Miss</code> is when there is file access and the file is not found in the filesystem. <code>Slow</code> is when there is a file access and the file is present in the filesystem but not in the directory cache. Read more about <a href="https://www.kernel.org/doc/htmldocs/filesystems/the_directory_cache.html" target="_blank">directory cache</a>.'
  1070. },
  1071. 'md.health': {
  1072. info: 'Number of failed devices per MD array. '+
  1073. 'Netdata retrieves this data from the <b>[n/m]</b> field of the md status line. '+
  1074. 'It means that ideally the array would have <b>n</b> devices however, currently, <b>m</b> devices are in use. '+
  1075. '<code>failed disks</code> is <b>n-m</b>.'
  1076. },
  1077. 'md.disks': {
  1078. info: 'Number of devices in use and in the down state. '+
  1079. 'Netdata retrieves this data from the <b>[n/m]</b> field of the md status line. '+
  1080. 'It means that ideally the array would have <b>n</b> devices however, currently, <b>m</b> devices are in use. '+
  1081. '<code>inuse</code> is <b>m</b>, <code>down</code> is <b>n-m</b>.'
  1082. },
  1083. 'md.status': {
  1084. info: 'Completion progress of the ongoing operation.'
  1085. },
  1086. 'md.expected_time_until_operation_finish': {
  1087. info: 'Estimated time to complete the ongoing operation. '+
  1088. 'The time is only an approximation since the operation speed will vary according to other I/O demands.'
  1089. },
  1090. 'md.operation_speed': {
  1091. info: 'Speed of the ongoing operation. '+
  1092. 'The system-wide rebuild speed limits are specified in <code>/proc/sys/dev/raid/{speed_limit_min,speed_limit_max}</code> files. '+
  1093. 'These options are good for tweaking rebuilt process and may increase overall system load, cpu and memory usage.'
  1094. },
  1095. 'md.mismatch_cnt': {
  1096. info: 'When performing <b>check</b> and <b>repair</b>, and possibly when performing <b>resync</b>, md will count the number of errors that are found. '+
  1097. 'A count of mismatches is recorded in the <code>sysfs</code> file <code>md/mismatch_cnt</code>. '+
  1098. 'This value is the number of sectors that were re-written, or (for <b>check</b>) would have been re-written. '+
  1099. 'It may be larger than the number of actual errors by a factor of the number of sectors in a page. '+
  1100. 'Mismatches can not be interpreted very reliably on RAID1 or RAID10, especially when the device is used for swap. '+
  1101. 'On a truly clean RAID5 or RAID6 array, any mismatches should indicate a hardware problem at some level - '+
  1102. 'software issues should never cause such a mismatch. '+
  1103. 'For details, see <a href="https://man7.org/linux/man-pages/man4/md.4.html" target="_blank">md(4)</a>.'
  1104. },
  1105. // ------------------------------------------------------------------------
  1106. // IP
  1107. 'ip.inerrors': {
  1108. info: 'Errors encountered during the reception of IP packets. ' +
  1109. '<b>noroutes</b> (<code>InNoRoutes</code>) counts packets that were dropped because there was no route to send them. ' +
  1110. '<b>truncated</b> (<code>InTruncatedPkts</code>) counts packets which is being discarded because the datagram frame didn\'t carry enough data. ' +
  1111. '<b>checksum</b> (<code>InCsumErrors</code>) counts packets that were dropped because they had wrong checksum. '
  1112. },
  1113. 'ip.mcast': {
  1114. info: 'Total multicast traffic in the system.'
  1115. },
  1116. 'ip.mcastpkts': {
  1117. info: 'Total transferred multicast packets in the system.'
  1118. },
  1119. 'ip.bcast': {
  1120. info: 'Total broadcast traffic in the system.'
  1121. },
  1122. 'ip.bcastpkts': {
  1123. info: 'Total transferred broadcast packets in the system.'
  1124. },
  1125. 'ip.ecnpkts': {
  1126. info: 'Total number of received IP packets with ECN bits set in the system. '+
  1127. '<b>CEP</b> - congestion encountered. '+
  1128. '<b>NoECTP</b> - non ECN-capable transport. '+
  1129. '<b>ECTP0</b> and <b>ECTP1</b> - ECN capable transport.'
  1130. },
  1131. 'ip.tcpreorders': {
  1132. info: 'TCP prevents out-of-order packets by either sequencing them in the correct order or by requesting the retransmission of out-of-order packets. '+
  1133. '<b>Timestamp</b> - detected re-ordering using the timestamp option. '+
  1134. '<b>SACK</b> - detected re-ordering using Selective Acknowledgment algorithm. '+
  1135. '<b>FACK</b> - detected re-ordering using Forward Acknowledgment algorithm. '+
  1136. '<b>Reno</b> - detected re-ordering using Fast Retransmit algorithm.'
  1137. },
  1138. 'ip.tcpofo': {
  1139. info: 'TCP maintains an out-of-order (OOO) queue to keep the OOO packets in the TCP communication. '+
  1140. '<b>InQueue</b> - the TCP layer receives an OOO packet and has enough memory to queue it. '+
  1141. '<b>Dropped</b> - the TCP layer receives an OOO packet but does not have enough memory, so drops it. '+
  1142. '<b>Merged</b> - the received OOO packet has an overlay with the previous packet. '+
  1143. 'The overlay part will be dropped. All these packets will also be counted into <b>InQueue</b>. '+
  1144. '<b>Pruned</b> - packets dropped from out-of-order queue because of socket buffer overrun.'
  1145. },
  1146. 'ip.tcpsyncookies': {
  1147. info: '<a href="https://en.wikipedia.org/wiki/SYN_cookies" target="_blank">SYN cookies</a> are used to mitigate SYN flood. '+
  1148. '<b>Received</b> - after sending a SYN cookie, it came back to us and passed the check. '+
  1149. '<b>Sent</b> - an application was not able to accept a connection fast enough, so the kernel could not store '+
  1150. 'an entry in the queue for this connection. Instead of dropping it, it sent a SYN cookie to the client. '+
  1151. '<b>Failed</b> - the MSS decoded from the SYN cookie is invalid. When this counter is incremented, '+
  1152. 'the received packet won’t be treated as a SYN cookie.'
  1153. },
  1154. 'ip.tcpmemorypressures': {
  1155. info: 'Number of times a socket was put in <b>memory pressure</b> due to a non fatal memory allocation failure (the kernel attempts to work around this situation by reducing the send buffers, etc).'
  1156. },
  1157. 'ip.tcpconnaborts': {
  1158. info: 'TCP connection aborts. <b>baddata</b> (<code>TCPAbortOnData</code>) happens while the connection is on <code>FIN_WAIT1</code> and the kernel receives a packet with a sequence number beyond the last one for this connection - the kernel responds with <code>RST</code> (closes the connection). <b>userclosed</b> (<code>TCPAbortOnClose</code>) happens when the kernel receives data on an already closed connection and responds with <code>RST</code>. <b>nomemory</b> (<code>TCPAbortOnMemory</code> happens when there are too many orphaned sockets (not attached to an fd) and the kernel has to drop a connection - sometimes it will send an <code>RST</code>, sometimes it won\'t. <b>timeout</b> (<code>TCPAbortOnTimeout</code>) happens when a connection times out. <b>linger</b> (<code>TCPAbortOnLinger</code>) happens when the kernel killed a socket that was already closed by the application and lingered around for long enough. <b>failed</b> (<code>TCPAbortFailed</code>) happens when the kernel attempted to send an <code>RST</code> but failed because there was no memory available.'
  1159. },
  1160. 'ip.tcp_functions': {
  1161. title : 'TCP calls',
  1162. info: 'Successful or failed calls to functions <code>tcp_sendmsg</code>, <code>tcp_cleanup_rbuf</code>, and <code>tcp_close</code>.'
  1163. },
  1164. 'ip.total_tcp_bandwidth': {
  1165. title : 'TCP bandwidth',
  1166. info: 'Bytes sent and received by functions <code>tcp_sendmsg</code> and <code>tcp_cleanup_rbuf</code>. We use <code>tcp_cleanup_rbuf</code> instead of <code>tcp_recvmsg</code>, because the last one misses <code>tcp_read_sock()</code> traffic and we would also need to have more probes to get the socket and package size.'
  1167. },
  1168. 'ip.tcp_error': {
  1169. title : 'TCP errors',
  1170. info: 'Failed calls to functions <code>tcp_sendmsg</code>, <code>tcp_cleanup_rbuf</code>, and <code>tcp_close</code>.'
  1171. },
  1172. 'ip.tcp_retransmit': {
  1173. title : 'TCP retransmit',
  1174. info: 'Number of packets retransmitted by function <code>tcp_retransmit_skb</code>.'
  1175. },
  1176. 'ip.udp_functions': {
  1177. title : 'UDP calls',
  1178. info: 'Successful or failed calls to functions <code>udp_sendmsg</code> and <code>udp_recvmsg</code>.'
  1179. },
  1180. 'ip.total_udp_bandwidth': {
  1181. title : 'UDP bandwidth',
  1182. info: 'Bytes sent and received by functions <code>udp_sendmsg</code> and <code>udp_recvmsg</code>.'
  1183. },
  1184. 'ip.udp_error': {
  1185. title : 'UDP errors',
  1186. info: 'Failed calls to functions <code>udp_sendmsg</code> and <code>udp_recvmsg</code>.'
  1187. },
  1188. 'ip.tcp_syn_queue': {
  1189. info: 'The <b>SYN queue</b> of the kernel tracks TCP handshakes until connections get fully established. ' +
  1190. 'It overflows when too many incoming TCP connection requests hang in the half-open state and the server ' +
  1191. 'is not configured to fall back to SYN cookies*. Overflows are usually caused by SYN flood DoS attacks ' +
  1192. '(i.e. someone sends lots of SYN packets and never completes the handshakes). ' +
  1193. '<b>drops</b> (or <code>TcpExtTCPReqQFullDrop</code>) is the number of connections dropped because the ' +
  1194. 'SYN queue was full and SYN cookies were disabled. ' +
  1195. '<b>cookies</b> (or <code>TcpExtTCPReqQFullDoCookies</code>) is the number of SYN cookies sent because the ' +
  1196. 'SYN queue was full.'
  1197. },
  1198. 'ip.tcp_accept_queue': {
  1199. info: 'The <b>accept queue</b> of the kernel holds the fully established TCP connections, waiting to be handled ' +
  1200. 'by the listening application. <b>overflows</b> (or <code>ListenOverflows</code>) is the number of ' +
  1201. 'established connections that could not be handled because the receive queue of the listening application ' +
  1202. 'was full. <b>drops</b> (or <code>ListenDrops</code>) is the number of incoming ' +
  1203. 'connections that could not be handled, including SYN floods, overflows, out of memory, security issues, ' +
  1204. 'no route to destination, reception of related ICMP messages, socket is broadcast or multicast.'
  1205. },
  1206. // ------------------------------------------------------------------------
  1207. // IPv4
  1208. 'ipv4.packets': {
  1209. info: '<p>IPv4 packets statistics for this host.</p>'+
  1210. '<p><b>Received</b> - packets received by the IP layer. '+
  1211. 'This counter will be increased even if the packet is dropped later. '+
  1212. '<b>Sent</b> - packets sent via IP layer, for both single cast and multicast packets. '+
  1213. 'This counter does not include any packets counted in <b>Forwarded</b>. '+
  1214. '<b>Forwarded</b> - input packets for which this host was not their final IP destination, '+
  1215. 'as a result of which an attempt was made to find a route to forward them to that final destination. '+
  1216. 'In hosts which do not act as IP Gateways, this counter will include only those packets which were '+
  1217. '<a href="https://en.wikipedia.org/wiki/Source_routing" target="_blank">Source-Routed</a> '+
  1218. 'and the Source-Route option processing was successful. '+
  1219. '<b>Delivered</b> - packets delivered to the upper layer protocols, e.g. TCP, UDP, ICMP, and so on.</p>'
  1220. },
  1221. 'ipv4.fragsout': {
  1222. info: '<p><a href="https://en.wikipedia.org/wiki/IPv4#Fragmentation" target="_blank">IPv4 fragmentation</a> '+
  1223. 'statistics for this system.</p>'+
  1224. '<p><b>OK</b> - packets that have been successfully fragmented. '+
  1225. '<b>Failed</b> - packets that have been discarded because they needed to be fragmented '+
  1226. 'but could not be, e.g. due to <i>Don\'t Fragment</i> (DF) flag was set. '+
  1227. '<b>Created</b> - fragments that have been generated as a result of fragmentation.</p>'
  1228. },
  1229. 'ipv4.fragsin': {
  1230. info: '<p><a href="https://en.wikipedia.org/wiki/IPv4#Reassembly" target="_blank">IPv4 reassembly</a> '+
  1231. 'statistics for this system.</p>'+
  1232. '<p><b>OK</b> - packets that have been successfully reassembled. '+
  1233. '<b>Failed</b> - failures detected by the IP reassembly algorithm. '+
  1234. 'This is not necessarily a count of discarded IP fragments since some algorithms '+
  1235. 'can lose track of the number of fragments by combining them as they are received. '+
  1236. '<b>All</b> - received IP fragments which needed to be reassembled.</p>'
  1237. },
  1238. 'ipv4.errors': {
  1239. info: '<p>The number of discarded IPv4 packets.</p>'+
  1240. '<p><b>InDiscards</b>, <b>OutDiscards</b> - inbound and outbound packets which were chosen '+
  1241. 'to be discarded even though no errors had been '+
  1242. 'detected to prevent their being deliverable to a higher-layer protocol. '+
  1243. '<b>InHdrErrors</b> - input packets that have been discarded due to errors in their IP headers, including '+
  1244. 'bad checksums, version number mismatch, other format errors, time-to-live exceeded, '+
  1245. 'errors discovered in processing their IP options, etc. '+
  1246. '<b>OutNoRoutes</b> - packets that have been discarded because no route could be found '+
  1247. 'to transmit them to their destination. This includes any packets which a host cannot route '+
  1248. 'because all of its default gateways are down. '+
  1249. '<b>InAddrErrors</b> - input packets that have been discarded due to invalid IP address or '+
  1250. 'the destination IP address is not a local address and IP forwarding is not enabled. '+
  1251. '<b>InUnknownProtos</b> - input packets which were discarded because of an unknown or unsupported protocol.</p>'
  1252. },
  1253. 'ipv4.icmp': {
  1254. info: '<p>The number of transferred IPv4 ICMP messages.</p>'+
  1255. '<p><b>Received</b>, <b>Sent</b> - ICMP messages which the host received and attempted to send. '+
  1256. 'Both these counters include errors.</p>'
  1257. },
  1258. 'ipv4.icmp_errors': {
  1259. info: '<p>The number of IPv4 ICMP errors.</p>'+
  1260. '<p><b>InErrors</b> - received ICMP messages but determined as having ICMP-specific errors, '+
  1261. 'e.g. bad ICMP checksums, bad length, etc. '+
  1262. '<b>OutErrors</b> - ICMP messages which this host did not send due to '+
  1263. 'problems discovered within ICMP such as a lack of buffers. '+
  1264. 'This counter does not include errors discovered outside the ICMP layer '+
  1265. 'such as the inability of IP to route the resultant datagram. '+
  1266. '<b>InCsumErrors</b> - received ICMP messages with bad checksum.</p>'
  1267. },
  1268. 'ipv4.icmpmsg': {
  1269. info: 'The number of transferred '+
  1270. '<a href="https://www.iana.org/assignments/icmp-parameters/icmp-parameters.xhtml" target="_blank">IPv4 ICMP control messages</a>.'
  1271. },
  1272. 'ipv4.udppackets': {
  1273. info: 'The number of transferred UDP packets.'
  1274. },
  1275. 'ipv4.udperrors': {
  1276. info: '<p>The number of errors encountered during transferring UDP packets.</p>'+
  1277. '<b>RcvbufErrors</b> - receive buffer is full. '+
  1278. '<b>SndbufErrors</b> - send buffer is full, no kernel memory available, or '+
  1279. 'the IP layer reported an error when trying to send the packet and no error queue has been setup. '+
  1280. '<b>InErrors</b> - that is an aggregated counter for all errors, excluding <b>NoPorts</b>. '+
  1281. '<b>NoPorts</b> - no application is listening at the destination port. '+
  1282. '<b>InCsumErrors</b> - a UDP checksum failure is detected. '+
  1283. '<b>IgnoredMulti</b> - ignored multicast packets.'
  1284. },
  1285. 'ipv4.udplite': {
  1286. info: 'The number of transferred UDP-Lite packets.'
  1287. },
  1288. 'ipv4.udplite_errors': {
  1289. info: '<p>The number of errors encountered during transferring UDP-Lite packets.</p>'+
  1290. '<b>RcvbufErrors</b> - receive buffer is full. '+
  1291. '<b>SndbufErrors</b> - send buffer is full, no kernel memory available, or '+
  1292. 'the IP layer reported an error when trying to send the packet and no error queue has been setup. '+
  1293. '<b>InErrors</b> - that is an aggregated counter for all errors, excluding <b>NoPorts</b>. '+
  1294. '<b>NoPorts</b> - no application is listening at the destination port. '+
  1295. '<b>InCsumErrors</b> - a UDP checksum failure is detected. '+
  1296. '<b>IgnoredMulti</b> - ignored multicast packets.'
  1297. },
  1298. 'ipv4.tcppackets': {
  1299. info: '<p>The number of packets transferred by the TCP layer.</p>'+
  1300. '</p><b>Received</b> - received packets, including those received in error, '+
  1301. 'such as checksum error, invalid TCP header, and so on. '+
  1302. '<b>Sent</b> - sent packets, excluding the retransmitted packets. '+
  1303. 'But it includes the SYN, ACK, and RST packets.</p>'
  1304. },
  1305. 'ipv4.tcpsock': {
  1306. info: 'The number of TCP connections for which the current state is either ESTABLISHED or CLOSE-WAIT. '+
  1307. 'This is a snapshot of the established connections at the time of measurement '+
  1308. '(i.e. a connection established and a connection disconnected within the same iteration will not affect this metric).'
  1309. },
  1310. 'ipv4.tcpopens': {
  1311. info: '<b>active</b> or <code>ActiveOpens</code> is the number of outgoing TCP <b>connections attempted</b> by this host.'
  1312. + ' <b>passive</b> or <code>PassiveOpens</code> is the number of incoming TCP <b>connections accepted</b> by this host.'
  1313. },
  1314. 'ipv4.tcperrors': {
  1315. info: '<code>InErrs</code> is the number of TCP segments received in error (including header too small, checksum errors, sequence errors, bad packets - for both IPv4 and IPv6).'
  1316. + ' <code>InCsumErrors</code> is the number of TCP segments received with checksum errors (for both IPv4 and IPv6).'
  1317. + ' <code>RetransSegs</code> is the number of TCP segments retransmitted.'
  1318. },
  1319. 'ipv4.tcphandshake': {
  1320. info: '<code>EstabResets</code> is the number of established connections resets (i.e. connections that made a direct transition from <code>ESTABLISHED</code> or <code>CLOSE_WAIT</code> to <code>CLOSED</code>).'
  1321. + ' <code>OutRsts</code> is the number of TCP segments sent, with the <code>RST</code> flag set (for both IPv4 and IPv6).'
  1322. + ' <code>AttemptFails</code> is the number of times TCP connections made a direct transition from either <code>SYN_SENT</code> or <code>SYN_RECV</code> to <code>CLOSED</code>, plus the number of times TCP connections made a direct transition from the <code>SYN_RECV</code> to <code>LISTEN</code>.'
  1323. + ' <code>TCPSynRetrans</code> shows retries for new outbound TCP connections, which can indicate general connectivity issues or backlog on the remote host.'
  1324. },
  1325. 'ipv4.sockstat_sockets': {
  1326. info: 'The total number of used sockets for all '+
  1327. '<a href="https://man7.org/linux/man-pages/man7/address_families.7.html" target="_blank">address families</a> '+
  1328. 'in this system.'
  1329. },
  1330. 'ipv4.sockstat_tcp_sockets': {
  1331. info: '<p>The number of TCP sockets in the system in certain '+
  1332. '<a href="https://en.wikipedia.org/wiki/Transmission_Control_Protocol#Protocol_operation" target="_blank">states</a>.</p>'+
  1333. '<p><b>Alloc</b> - in any TCP state. '+
  1334. '<b>Orphan</b> - no longer attached to a socket descriptor in any user processes, '+
  1335. 'but for which the kernel is still required to maintain state in order to complete the transport protocol. '+
  1336. '<b>InUse</b> - in any TCP state, excluding TIME-WAIT and CLOSED. '+
  1337. '<b>TimeWait</b> - in the TIME-WAIT state.</p>'
  1338. },
  1339. 'ipv4.sockstat_tcp_mem': {
  1340. info: 'The amount of memory used by allocated TCP sockets.'
  1341. },
  1342. 'ipv4.sockstat_udp_sockets': {
  1343. info: 'The number of used UDP sockets.'
  1344. },
  1345. 'ipv4.sockstat_udp_mem': {
  1346. info: 'The amount of memory used by allocated UDP sockets.'
  1347. },
  1348. 'ipv4.sockstat_udplite_sockets': {
  1349. info: 'The number of used UDP-Lite sockets.'
  1350. },
  1351. 'ipv4.sockstat_raw_sockets': {
  1352. info: 'The number of used <a href="https://en.wikipedia.org/wiki/Network_socket#Types" target="_blank"> raw sockets</a>.'
  1353. },
  1354. 'ipv4.sockstat_frag_sockets': {
  1355. info: 'The number of entries in hash tables that are used for packet reassembly.'
  1356. },
  1357. 'ipv4.sockstat_frag_mem': {
  1358. info: 'The amount of memory used for packet reassembly.'
  1359. },
  1360. // ------------------------------------------------------------------------
  1361. // IPv6
  1362. 'ipv6.packets': {
  1363. info: '<p>IPv6 packet statistics for this host.</p>'+
  1364. '<p><b>Received</b> - packets received by the IP layer. '+
  1365. 'This counter will be increased even if the packet is dropped later. '+
  1366. '<b>Sent</b> - packets sent via IP layer, for both single cast and multicast packets. '+
  1367. 'This counter does not include any packets counted in <b>Forwarded</b>. '+
  1368. '<b>Forwarded</b> - input packets for which this host was not their final IP destination, '+
  1369. 'as a result of which an attempt was made to find a route to forward them to that final destination. '+
  1370. 'In hosts which do not act as IP Gateways, this counter will include only those packets which were '+
  1371. '<a href="https://en.wikipedia.org/wiki/Source_routing" target="_blank">Source-Routed</a> '+
  1372. 'and the Source-Route option processing was successful. '+
  1373. '<b>Delivers</b> - packets delivered to the upper layer protocols, e.g. TCP, UDP, ICMP, and so on.</p>'
  1374. },
  1375. 'ipv6.fragsout': {
  1376. info: '<p><a href="https://en.wikipedia.org/wiki/IP_fragmentation" target="_blank">IPv6 fragmentation</a> '+
  1377. 'statistics for this system.</p>'+
  1378. '<p><b>OK</b> - packets that have been successfully fragmented. '+
  1379. '<b>Failed</b> - packets that have been discarded because they needed to be fragmented '+
  1380. 'but could not be, e.g. due to <i>Don\'t Fragment</i> (DF) flag was set. '+
  1381. '<b>All</b> - fragments that have been generated as a result of fragmentation.</p>'
  1382. },
  1383. 'ipv6.fragsin': {
  1384. info: '<p><a href="https://en.wikipedia.org/wiki/IP_fragmentation" target="_blank">IPv6 reassembly</a> '+
  1385. 'statistics for this system.</p>'+
  1386. '<p><b>OK</b> - packets that have been successfully reassembled. '+
  1387. '<b>Failed</b> - failures detected by the IP reassembly algorithm. '+
  1388. 'This is not necessarily a count of discarded IP fragments since some algorithms '+
  1389. 'can lose track of the number of fragments by combining them as they are received. '+
  1390. '<b>Timeout</b> - reassembly timeouts detected. '+
  1391. '<b>All</b> - received IP fragments which needed to be reassembled.</p>'
  1392. },
  1393. 'ipv6.errors': {
  1394. info: '<p>The number of discarded IPv6 packets.</p>'+
  1395. '<p><b>InDiscards</b>, <b>OutDiscards</b> - packets which were chosen to be discarded even though '+
  1396. 'no errors had been detected to prevent their being deliverable to a higher-layer protocol. '+
  1397. '<b>InHdrErrors</b> - errors in IP headers, including bad checksums, version number mismatch, '+
  1398. 'other format errors, time-to-live exceeded, etc. '+
  1399. '<b>InAddrErrors</b> - invalid IP address or the destination IP address is not a local address and '+
  1400. 'IP forwarding is not enabled. '+
  1401. '<b>InUnknownProtos</b> - unknown or unsupported protocol. '+
  1402. '<b>InTooBigErrors</b> - the size exceeded the link MTU. '+
  1403. '<b>InTruncatedPkts</b> - packet frame did not carry enough data. '+
  1404. '<b>InNoRoutes</b> - no route could be found while forwarding. '+
  1405. '<b>OutNoRoutes</b> - no route could be found for packets generated by this host.</p>'
  1406. },
  1407. 'ipv6.udppackets': {
  1408. info: 'The number of transferred UDP packets.'
  1409. },
  1410. 'ipv6.udperrors': {
  1411. info: '<p>The number of errors encountered during transferring UDP packets.</p>'+
  1412. '<b>RcvbufErrors</b> - receive buffer is full. '+
  1413. '<b>SndbufErrors</b> - send buffer is full, no kernel memory available, or '+
  1414. 'the IP layer reported an error when trying to send the packet and no error queue has been setup. '+
  1415. '<b>InErrors</b> - that is an aggregated counter for all errors, excluding <b>NoPorts</b>. '+
  1416. '<b>NoPorts</b> - no application is listening at the destination port. '+
  1417. '<b>InCsumErrors</b> - a UDP checksum failure is detected. '+
  1418. '<b>IgnoredMulti</b> - ignored multicast packets.'
  1419. },
  1420. 'ipv6.udplitepackets': {
  1421. info: 'The number of transferred UDP-Lite packets.'
  1422. },
  1423. 'ipv6.udpliteerrors': {
  1424. info: '<p>The number of errors encountered during transferring UDP-Lite packets.</p>'+
  1425. '<p><b>RcvbufErrors</b> - receive buffer is full. '+
  1426. '<b>SndbufErrors</b> - send buffer is full, no kernel memory available, or '+
  1427. 'the IP layer reported an error when trying to send the packet and no error queue has been setup. '+
  1428. '<b>InErrors</b> - that is an aggregated counter for all errors, excluding <b>NoPorts</b>. '+
  1429. '<b>NoPorts</b> - no application is listening at the destination port. '+
  1430. '<b>InCsumErrors</b> - a UDP checksum failure is detected.</p>'
  1431. },
  1432. 'ipv6.mcast': {
  1433. info: 'Total IPv6 multicast traffic.'
  1434. },
  1435. 'ipv6.bcast': {
  1436. info: 'Total IPv6 broadcast traffic.'
  1437. },
  1438. 'ipv6.mcastpkts': {
  1439. info: 'Total transferred IPv6 multicast packets.'
  1440. },
  1441. 'ipv6.icmp': {
  1442. info: '<p>The number of transferred ICMPv6 messages.</p>'+
  1443. '<p><b>Received</b>, <b>Sent</b> - ICMP messages which the host received and attempted to send. '+
  1444. 'Both these counters include errors.</p>'
  1445. },
  1446. 'ipv6.icmpredir': {
  1447. info: 'The number of transferred ICMPv6 Redirect messages. '+
  1448. 'These messages inform a host to update its routing information (to send packets on an alternative route).'
  1449. },
  1450. 'ipv6.icmpechos': {
  1451. info: 'The number of ICMPv6 Echo messages.'
  1452. },
  1453. 'ipv6.icmperrors': {
  1454. info: '<p>The number of ICMPv6 errors and '+
  1455. '<a href="https://www.rfc-editor.org/rfc/rfc4443.html#section-3" target="_blank">error messages</a>.</p>'+
  1456. '<p><b>InErrors</b>, <b>OutErrors</b> - bad ICMP messages (bad ICMP checksums, bad length, etc.). '+
  1457. '<b>InCsumErrors</b> - wrong checksum.</p>'
  1458. },
  1459. 'ipv6.groupmemb': {
  1460. info: '<p>The number of transferred ICMPv6 Group Membership messages.</p>'+
  1461. '<p> Multicast routers send Group Membership Query messages to learn which groups have members on each of their '+
  1462. 'attached physical networks. Host computers respond by sending a Group Membership Report for each '+
  1463. 'multicast group joined by the host. A host computer can also send a Group Membership Report when '+
  1464. 'it joins a new multicast group. '+
  1465. 'Group Membership Reduction messages are sent when a host computer leaves a multicast group.</p>'
  1466. },
  1467. 'ipv6.icmprouter': {
  1468. info: '<p>The number of transferred ICMPv6 '+
  1469. '<a href="https://en.wikipedia.org/wiki/Neighbor_Discovery_Protocol" target="_blank">Router Discovery</a> messages.</p>'+
  1470. '<p>Router <b>Solicitations</b> message is sent from a computer host to any routers on the local area network '+
  1471. 'to request that they advertise their presence on the network. '+
  1472. 'Router <b>Advertisement</b> message is sent by a router on the local area network to announce its IP address '+
  1473. 'as available for routing.</p>'
  1474. },
  1475. 'ipv6.icmpneighbor': {
  1476. info: '<p>The number of transferred ICMPv6 '+
  1477. '<a href="https://en.wikipedia.org/wiki/Neighbor_Discovery_Protocol" target="_blank">Neighbour Discovery</a> messages.</p>'+
  1478. '<p>Neighbor <b>Solicitations</b> are used by nodes to determine the link layer address '+
  1479. 'of a neighbor, or to verify that a neighbor is still reachable via a cached link layer address. '+
  1480. 'Neighbor <b>Advertisements</b> are used by nodes to respond to a Neighbor Solicitation message.</p>'
  1481. },
  1482. 'ipv6.icmpmldv2': {
  1483. info: 'The number of transferred ICMPv6 '+
  1484. '<a href="https://en.wikipedia.org/wiki/Multicast_Listener_Discovery" target="_blank">Multicast Listener Discovery</a> (MLD) messages.'
  1485. },
  1486. 'ipv6.icmptypes': {
  1487. info: 'The number of transferred ICMPv6 messages of '+
  1488. '<a href="https://en.wikipedia.org/wiki/Internet_Control_Message_Protocol_for_IPv6#Types" target="_blank">certain types</a>.'
  1489. },
  1490. 'ipv6.ect': {
  1491. info: '<p>Total number of received IPv6 packets with ECN bits set in the system.</p>'+
  1492. '<p><b>CEP</b> - congestion encountered. '+
  1493. '<b>NoECTP</b> - non ECN-capable transport. '+
  1494. '<b>ECTP0</b> and <b>ECTP1</b> - ECN capable transport.</p>'
  1495. },
  1496. 'ipv6.sockstat6_tcp_sockets': {
  1497. info: 'The number of TCP sockets in any '+
  1498. '<a href="https://en.wikipedia.org/wiki/Transmission_Control_Protocol#Protocol_operation" target="">state</a>, '+
  1499. 'excluding TIME-WAIT and CLOSED.'
  1500. },
  1501. 'ipv6.sockstat6_udp_sockets': {
  1502. info: 'The number of used UDP sockets.'
  1503. },
  1504. 'ipv6.sockstat6_udplite_sockets': {
  1505. info: 'The number of used UDP-Lite sockets.'
  1506. },
  1507. 'ipv6.sockstat6_raw_sockets': {
  1508. info: 'The number of used <a href="https://en.wikipedia.org/wiki/Network_socket#Types" target="_blank"> raw sockets</a>.'
  1509. },
  1510. 'ipv6.sockstat6_frag_sockets': {
  1511. info: 'The number of entries in hash tables that are used for packet reassembly.'
  1512. },
  1513. // ------------------------------------------------------------------------
  1514. // SCTP
  1515. 'sctp.established': {
  1516. info: 'The number of associations for which the current state is either '+
  1517. 'ESTABLISHED, SHUTDOWN-RECEIVED or SHUTDOWN-PENDING.'
  1518. },
  1519. 'sctp.transitions': {
  1520. info: '<p>The number of times that associations have made a direct transition between states.</p>'+
  1521. '<p><b>Active</b> - from COOKIE-ECHOED to ESTABLISHED. The upper layer initiated the association attempt. '+
  1522. '<b>Passive</b> - from CLOSED to ESTABLISHED. The remote endpoint initiated the association attempt. '+
  1523. '<b>Aborted</b> - from any state to CLOSED using the primitive ABORT. Ungraceful termination of the association. '+
  1524. '<b>Shutdown</b> - from SHUTDOWN-SENT or SHUTDOWN-ACK-SENT to CLOSED. Graceful termination of the association.</p>'
  1525. },
  1526. 'sctp.packets': {
  1527. info: '<p>The number of transferred SCTP packets.</p>'+
  1528. '<p><b>Received</b> - includes duplicate packets. '+
  1529. '<b>Sent</b> - includes retransmitted DATA chunks.</p>'
  1530. },
  1531. 'sctp.packet_errors': {
  1532. info: '<p>The number of errors encountered during receiving SCTP packets.</p>'+
  1533. '<p><b>Invalid</b> - packets for which the receiver was unable to identify an appropriate association. '+
  1534. '<b>Checksum</b> - packets with an invalid checksum.</p>'
  1535. },
  1536. 'sctp.fragmentation': {
  1537. info: '<p>The number of fragmented and reassembled SCTP messages.</p>'+
  1538. '<p><b>Reassembled</b> - reassembled user messages, after conversion into DATA chunks. '+
  1539. '<b>Fragmented</b> - user messages that have to be fragmented because of the MTU.</p>'
  1540. },
  1541. 'sctp.chunks': {
  1542. info: 'The number of transferred control, ordered, and unordered DATA chunks. '+
  1543. 'Retransmissions and duplicates are not included.'
  1544. },
  1545. // ------------------------------------------------------------------------
  1546. // APPS
  1547. 'apps.cpu': {
  1548. height: 2.0
  1549. },
  1550. 'apps.mem': {
  1551. info: 'Real memory (RAM) used by applications. This does not include shared memory.'
  1552. },
  1553. 'apps.vmem': {
  1554. info: 'Virtual memory allocated by applications. Please check <a href="https://github.com/netdata/netdata/tree/master/daemon#virtual-memory" target="_blank">this article</a> for more information.'
  1555. },
  1556. 'apps.preads': {
  1557. height: 2.0
  1558. },
  1559. 'apps.pwrites': {
  1560. height: 2.0
  1561. },
  1562. 'apps.uptime': {
  1563. info: 'Carried over process group uptime since the Netdata restart. The period of time within which at least one process in the group was running.'
  1564. },
  1565. 'apps.file_open': {
  1566. info: 'Calls to the internal function <code>do_sys_open</code> ( For kernels newer than <code>5.5.19</code> we add a kprobe to <code>do_sys_openat2</code>. ), which is the common function called from' +
  1567. ' <a href="https://www.man7.org/linux/man-pages/man2/open.2.html" target="_blank">open(2)</a> ' +
  1568. ' and <a href="https://www.man7.org/linux/man-pages/man2/openat.2.html" target="_blank">openat(2)</a>. '
  1569. },
  1570. 'apps.file_open_error': {
  1571. info: 'Failed calls to the internal function <code>do_sys_open</code> ( For kernels newer than <code>5.5.19</code> we add a kprobe to <code>do_sys_openat2</code>. ).'
  1572. },
  1573. 'apps.file_closed': {
  1574. info: 'Calls to the internal function <a href="https://elixir.bootlin.com/linux/v5.10/source/fs/file.c#L665" target="_blank">__close_fd</a> or <a href="https://elixir.bootlin.com/linux/v5.11/source/fs/file.c#L617" target="_blank">close_fd</a> according to your kernel version, which is called from' +
  1575. ' <a href="https://www.man7.org/linux/man-pages/man2/close.2.html" target="_blank">close(2)</a>. '
  1576. },
  1577. 'apps.file_close_error': {
  1578. info: 'Failed calls to the internal function <a href="https://elixir.bootlin.com/linux/v5.10/source/fs/file.c#L665" target="_blank">__close_fd</a> or <a href="https://elixir.bootlin.com/linux/v5.11/source/fs/file.c#L617" target="_blank">close_fd</a> according to your kernel version.'
  1579. },
  1580. 'apps.file_deleted': {
  1581. info: 'Calls to the function <a href="https://www.kernel.org/doc/htmldocs/filesystems/API-vfs-unlink.html" target="_blank">vfs_unlink</a>. This chart does not show all events that remove files from the filesystem, because filesystems can create their own functions to remove files.'
  1582. },
  1583. 'apps.vfs_write_call': {
  1584. info: 'Successful calls to the function <a href="https://topic.alibabacloud.com/a/kernel-state-file-operation-__-work-information-kernel_8_8_20287135.html" target="_blank">vfs_write</a>. This chart may not show all filesystem events if it uses other functions to store data on disk.'
  1585. },
  1586. 'apps.vfs_write_error': {
  1587. info: 'Failed calls to the function <a href="https://topic.alibabacloud.com/a/kernel-state-file-operation-__-work-information-kernel_8_8_20287135.html" target="_blank">vfs_write</a>. This chart may not show all filesystem events if it uses other functions to store data on disk.'
  1588. },
  1589. 'apps.vfs_read_call': {
  1590. info: 'Successful calls to the function <a href="https://topic.alibabacloud.com/a/kernel-state-file-operation-__-work-information-kernel_8_8_20287135.html" target="_blank">vfs_read</a>. This chart may not show all filesystem events if it uses other functions to store data on disk.'
  1591. },
  1592. 'apps.vfs_read_error': {
  1593. info: 'Failed calls to the function <a href="https://topic.alibabacloud.com/a/kernel-state-file-operation-__-work-information-kernel_8_8_20287135.html" target="_blank">vfs_read</a>. This chart may not show all filesystem events if it uses other functions to store data on disk.'
  1594. },
  1595. 'apps.vfs_write_bytes': {
  1596. info: 'Total of bytes successfully written using the function <a href="https://topic.alibabacloud.com/a/kernel-state-file-operation-__-work-information-kernel_8_8_20287135.html" target="_blank">vfs_write</a>.'
  1597. },
  1598. 'apps.vfs_read_bytes': {
  1599. info: 'Total of bytes successfully read using the function <a href="https://topic.alibabacloud.com/a/kernel-state-file-operation-__-work-information-kernel_8_8_20287135.html" target="_blank">vfs_read</a>.'
  1600. },
  1601. 'apps.process_create': {
  1602. info: 'Calls to either <a href="https://www.ece.uic.edu/~yshi1/linux/lkse/node4.html#SECTION00421000000000000000" target="_blank">do_fork</a>, or <code>kernel_clone</code> if you are running kernel newer than 5.9.16, to create a new task, which is the common name used to define process and tasks inside the kernel. Netdata identifies the process by counting the number of calls to <a href="https://linux.die.net/man/2/clone" target="_blank">sys_clone</a> that do not have the flag <code>CLONE_THREAD</code> set.'
  1603. },
  1604. 'apps.thread_create': {
  1605. info: 'Calls to either <a href="https://www.ece.uic.edu/~yshi1/linux/lkse/node4.html#SECTION00421000000000000000" target="_blank">do_fork</a>, or <code>kernel_clone</code> if you are running kernel newer than 5.9.16, to create a new task, which is the common name used to define process and tasks inside the kernel. Netdata identifies the threads by counting the number of calls to <a href="https://linux.die.net/man/2/clone" target="_blank">sys_clone</a> that have the flag <code>CLONE_THREAD</code> set.'
  1606. },
  1607. 'apps.task_close': {
  1608. info: 'Calls to the functions responsible for closing (<a href="https://www.informit.com/articles/article.aspx?p=370047&seqNum=4" target="_blank">do_exit</a>) and releasing (<a href="https://www.informit.com/articles/article.aspx?p=370047&seqNum=4" target="_blank">release_task</a>) tasks.'
  1609. },
  1610. 'apps.total_bandwidth_sent': {
  1611. info: 'Bytes sent by functions <code>tcp_sendmsg</code> and <code>udp_sendmsg</code>.'
  1612. },
  1613. 'apps.total_bandwidth_recv': {
  1614. info: 'Bytes received by functions <code>tcp_cleanup_rbuf</code> and <code>udp_recvmsg</code>. We use <code>tcp_cleanup_rbuf</code> instead <code>tcp_recvmsg</code>, because this last misses <code>tcp_read_sock()</code> traffic and we would also need to have more probes to get the socket and package size.'
  1615. },
  1616. 'apps.bandwidth_tcp_send': {
  1617. info: 'The function <code>tcp_sendmsg</code> is used to collect number of bytes sent from TCP connections.'
  1618. },
  1619. 'apps.bandwidth_tcp_recv': {
  1620. info: 'The function <code>tcp_cleanup_rbuf</code> is used to collect number of bytes received from TCP connections.'
  1621. },
  1622. 'apps.bandwidth_tcp_retransmit': {
  1623. info: 'The function <code>tcp_retransmit_skb</code> is called when the host did not receive the expected return from a packet sent.'
  1624. },
  1625. 'apps.bandwidth_udp_send': {
  1626. info: 'The function <code>udp_sendmsg</code> is used to collect number of bytes sent from UDP connections.'
  1627. },
  1628. 'apps.bandwidth_udp_recv': {
  1629. info: 'The function <code>udp_recvmsg</code> is used to collect number of bytes received from UDP connections.'
  1630. },
  1631. 'apps.dc_hit_ratio': {
  1632. info: 'Percentage of file accesses that were present in the directory cache. 100% means that every file that was accessed was present in the directory cache. If files are not present in the directory cache 1) they are not present in the file system, 2) the files were not accessed before. Read more about <a href="https://www.kernel.org/doc/htmldocs/filesystems/the_directory_cache.html" target="_blank">directory cache</a>. Netdata also gives a summary for these charts in <a href="#menu_filesystem_submenu_directory_cache__eBPF_">Filesystem submenu</a>.'
  1633. },
  1634. 'apps.dc_reference': {
  1635. info: 'Counters of file accesses. <code>Reference</code> is when there is a file access, see the <code>filesystem.dc_reference</code> chart for more context. Read more about <a href="https://www.kernel.org/doc/htmldocs/filesystems/the_directory_cache.html" target="_blank">directory cache</a>.'
  1636. },
  1637. 'apps.dc_not_cache': {
  1638. info: 'Counters of file accesses. <code>Slow</code> is when there is a file access and the file is not present in the directory cache, see the <code>filesystem.dc_reference</code> chart for more context. Read more about <a href="https://www.kernel.org/doc/htmldocs/filesystems/the_directory_cache.html" target="_blank">directory cache</a>.'
  1639. },
  1640. 'apps.dc_not_found': {
  1641. info: 'Counters of file accesses. <code>Miss</code> is when there is file access and the file is not found in the filesystem, see the <code>filesystem.dc_reference</code> chart for more context. Read more about <a href="https://www.kernel.org/doc/htmldocs/filesystems/the_directory_cache.html" target="_blank">directory cache</a>.'
  1642. },
  1643. // ------------------------------------------------------------------------
  1644. // USERS
  1645. 'users.cpu': {
  1646. height: 2.0
  1647. },
  1648. 'users.mem': {
  1649. info: 'Real memory (RAM) used per user. This does not include shared memory.'
  1650. },
  1651. 'users.vmem': {
  1652. info: 'Virtual memory allocated per user. Please check <a href="https://github.com/netdata/netdata/tree/master/daemon#virtual-memory" target="_blank">this article</a> for more information.'
  1653. },
  1654. 'users.preads': {
  1655. height: 2.0
  1656. },
  1657. 'users.pwrites': {
  1658. height: 2.0
  1659. },
  1660. 'users.uptime': {
  1661. info: 'Carried over process group uptime since the Netdata restart. The period of time within which at least one process in the group was running.'
  1662. },
  1663. // ------------------------------------------------------------------------
  1664. // GROUPS
  1665. 'groups.cpu': {
  1666. height: 2.0
  1667. },
  1668. 'groups.mem': {
  1669. info: 'Real memory (RAM) used per user group. This does not include shared memory.'
  1670. },
  1671. 'groups.vmem': {
  1672. info: 'Virtual memory allocated per user group since the Netdata restart. Please check <a href="https://github.com/netdata/netdata/tree/master/daemon#virtual-memory" target="_blank">this article</a> for more information.'
  1673. },
  1674. 'groups.preads': {
  1675. height: 2.0
  1676. },
  1677. 'groups.pwrites': {
  1678. height: 2.0
  1679. },
  1680. 'groups.uptime': {
  1681. info: 'Carried over process group uptime. The period of time within which at least one process in the group was running.'
  1682. },
  1683. // ------------------------------------------------------------------------
  1684. // NETWORK QoS
  1685. 'tc.qos': {
  1686. heads: [
  1687. function (os, id) {
  1688. void (os);
  1689. if (id.match(/.*-ifb$/))
  1690. return netdataDashboard.gaugeChart('Inbound', '12%', '', '#5555AA');
  1691. else
  1692. return netdataDashboard.gaugeChart('Outbound', '12%', '', '#AA9900');
  1693. }
  1694. ]
  1695. },
  1696. // ------------------------------------------------------------------------
  1697. // NETWORK INTERFACES
  1698. 'net.net': {
  1699. mainheads: [
  1700. function (os, id) {
  1701. void (os);
  1702. if (id.match(/^cgroup_.*/)) {
  1703. var iface;
  1704. try {
  1705. iface = ' ' + id.substring(id.lastIndexOf('.net_') + 5, id.length);
  1706. } catch (e) {
  1707. iface = '';
  1708. }
  1709. return netdataDashboard.gaugeChart('Received' + iface, '12%', 'received');
  1710. } else
  1711. return '';
  1712. },
  1713. function (os, id) {
  1714. void (os);
  1715. if (id.match(/^cgroup_.*/)) {
  1716. var iface;
  1717. try {
  1718. iface = ' ' + id.substring(id.lastIndexOf('.net_') + 5, id.length);
  1719. } catch (e) {
  1720. iface = '';
  1721. }
  1722. return netdataDashboard.gaugeChart('Sent' + iface, '12%', 'sent');
  1723. } else
  1724. return '';
  1725. }
  1726. ],
  1727. heads: [
  1728. function (os, id) {
  1729. void (os);
  1730. if (!id.match(/^cgroup_.*/))
  1731. return netdataDashboard.gaugeChart('Received', '12%', 'received');
  1732. else
  1733. return '';
  1734. },
  1735. function (os, id) {
  1736. void (os);
  1737. if (!id.match(/^cgroup_.*/))
  1738. return netdataDashboard.gaugeChart('Sent', '12%', 'sent');
  1739. else
  1740. return '';
  1741. }
  1742. ],
  1743. info: 'Amount of traffic that the interface has received and sent.'
  1744. },
  1745. 'net.packets': {
  1746. info: 'Number of packets that the interface has received and sent. '+
  1747. 'Received <a href="https://en.wikipedia.org/wiki/Multicast" target="_blank">multicast</a> counter is '+
  1748. 'commonly calculated at the device level (unlike <b>received</b>) and therefore may include packets which did not reach the host.'
  1749. },
  1750. 'net.errors': {
  1751. info: '<b>Inbound</b> is the number of bad packets received on this interface. '+
  1752. 'It includes dropped packets due to invalid length, CRC, frame alignment, and other errors. '+
  1753. '<b>Outbound</b> is the number of transmit problems. '+
  1754. 'It includes frames transmission errors due to loss of carrier, FIFO underrun/underflow, heartbeat, late collisions, and other problems.'
  1755. },
  1756. 'net.fifo': {
  1757. info: '<b>Inbound</b> is the number of packets dropped because they did not fit into buffers provided by the host, '+
  1758. 'e.g. packets larger than MTU or next buffer in the ring was not available for a scatter transfer. '+
  1759. '<b>Outbound</b> is the number of frame transmission errors due to device FIFO underrun/underflow. '+
  1760. 'This condition occurs when the device begins transmission of a frame '+
  1761. 'but is unable to deliver the entire frame to the transmitter in time for transmission.'
  1762. },
  1763. 'net.drops': {
  1764. info: 'Packets that have been dropped at the network interface level. '+
  1765. '<b>Inbound</b> is the number of packets received but not processed, e.g. due to '+
  1766. '<a href="#menu_system_submenu_softnet_stat">softnet backlog</a> overflow, bad / unintended VLAN tags, '+
  1767. 'unknown or unregistered protocols, IPv6 frames when the server is not configured for IPv6. '+
  1768. '<b>Outbound</b> is the number of packets dropped on their way to transmission, e.g. due to lack of resources.'
  1769. },
  1770. 'net.compressed': {
  1771. info: 'Number of correctly received and transmitted compressed packets. '+
  1772. 'These counters are only meaningful for interfaces which support packet compression (e.g. CSLIP, PPP).'
  1773. },
  1774. 'net.events': {
  1775. info: '<b>Frames</b> is an aggregated counter for dropped packets due to '+
  1776. 'invalid length, FIFO overflow, CRC, and frame alignment errors. '+
  1777. '<b>Collisions</b> is the number of '+
  1778. '<a href="https://en.wikipedia.org/wiki/Collision_(telecommunications)" target="blank">collisions</a> during packet transmissions. '+
  1779. '<b>Carrier</b> is an aggregated counter for frame transmission errors due to '+
  1780. 'excessive collisions, loss of carrier, device FIFO underrun/underflow, Heartbeat/SQE Test errors, and late collisions.'
  1781. },
  1782. 'net.duplex': {
  1783. info: '<p>The interface\'s latest or current '+
  1784. '<a href="https://en.wikipedia.org/wiki/Duplex_(telecommunications)" target="_blank">duplex</a> that the network adapter '+
  1785. '<a href="https://en.wikipedia.org/wiki/Autonegotiation" target="_blank">negotiated</a> with the device it is connected to. '+
  1786. '<b>Unknown</b> - the duplex mode can not be determined. '+
  1787. '<b>Half duplex</b> - the communication is one direction at a time. '+
  1788. '<b>Full duplex</b> - the interface is able to send and receive data simultaneously.</p>'+
  1789. '<p><b>State map</b>: 0 - unknown, 1 - half, 2 - full.</p>'
  1790. },
  1791. 'net.operstate': {
  1792. info: '</p>The current <a href="https://datatracker.ietf.org/doc/html/rfc2863" target="_blank">operational state</a> of the interface. '+
  1793. '<b>Unknown</b> - the state can not be determined. '+
  1794. '<b>NotPresent</b> - the interface has missing (typically, hardware) components. '+
  1795. '<b>Down</b> - the interface is unable to transfer data on L1, e.g. ethernet is not plugged or interface is administratively down. '+
  1796. '<b>LowerLayerDown</b> - the interface is down due to state of lower-layer interface(s). '+
  1797. '<b>Testing</b> - the interface is in testing mode, e.g. cable test. It can’t be used for normal traffic until tests complete. '+
  1798. '<b>Dormant</b> - the interface is L1 up, but waiting for an external event, e.g. for a protocol to establish. '+
  1799. '<b>Up</b> - the interface is ready to pass packets and can be used.</p>'+
  1800. '<p><b>State map</b>: 0 - unknown, 1 - notpresent, 2 - down, 3 - lowerlayerdown, 4 - testing, 5 - dormant, 6 - up.</p>'
  1801. },
  1802. 'net.carrier': {
  1803. info: '<p>The current physical link state of the interface.</p>'+
  1804. '<p><b>State map</b>: 0 - down, 1 - up.</p>'
  1805. },
  1806. 'net.speed': {
  1807. info: 'The interface\'s latest or current speed that the network adapter '+
  1808. '<a href="https://en.wikipedia.org/wiki/Autonegotiation" target="_blank">negotiated</a> with the device it is connected to. '+
  1809. 'This does not give the max supported speed of the NIC.'
  1810. },
  1811. 'net.mtu': {
  1812. info: 'The interface\'s currently configured '+
  1813. '<a href="https://en.wikipedia.org/wiki/Maximum_transmission_unit" target="_blank">Maximum transmission unit</a> (MTU) value. '+
  1814. 'MTU is the size of the largest protocol data unit that can be communicated in a single network layer transaction.'
  1815. },
  1816. // ------------------------------------------------------------------------
  1817. // NETFILTER
  1818. 'netfilter.sockets': {
  1819. colors: '#88AA00',
  1820. heads: [
  1821. netdataDashboard.gaugeChart('Active Connections', '12%', '', '#88AA00')
  1822. ]
  1823. },
  1824. 'netfilter.new': {
  1825. heads: [
  1826. netdataDashboard.gaugeChart('New Connections', '12%', 'new', '#5555AA')
  1827. ]
  1828. },
  1829. // ------------------------------------------------------------------------
  1830. // IPVS
  1831. 'ipvs.sockets': {
  1832. info: 'Total created connections for all services and their servers. '+
  1833. 'To see the IPVS connection table, run <code>ipvsadm -Lnc</code>.'
  1834. },
  1835. 'ipvs.packets': {
  1836. info: 'Total transferred packets for all services and their servers.'
  1837. },
  1838. 'ipvs.net': {
  1839. info: 'Total network traffic for all services and their servers.'
  1840. },
  1841. // ------------------------------------------------------------------------
  1842. // DISKS
  1843. 'disk.util': {
  1844. colors: '#FF5588',
  1845. heads: [
  1846. netdataDashboard.gaugeChart('Utilization', '12%', '', '#FF5588')
  1847. ],
  1848. info: 'Disk Utilization measures the amount of time the disk was busy with something. This is not related to its performance. 100% means that the system always had an outstanding operation on the disk. Keep in mind that depending on the underlying technology of the disk, 100% here may or may not be an indication of congestion.'
  1849. },
  1850. 'disk.busy': {
  1851. colors: '#FF5588',
  1852. info: 'Disk Busy Time measures the amount of time the disk was busy with something.'
  1853. },
  1854. 'disk.backlog': {
  1855. colors: '#0099CC',
  1856. info: 'Backlog is an indication of the duration of pending disk operations. On every I/O event the system is multiplying the time spent doing I/O since the last update of this field with the number of pending operations. While not accurate, this metric can provide an indication of the expected completion time of the operations in progress.'
  1857. },
  1858. 'disk.io': {
  1859. heads: [
  1860. netdataDashboard.gaugeChart('Read', '12%', 'reads'),
  1861. netdataDashboard.gaugeChart('Write', '12%', 'writes')
  1862. ],
  1863. info: 'Amount of data transferred to and from disk.'
  1864. },
  1865. 'disk_ext.io': {
  1866. info: 'Amount of discarded data that are no longer in use by a mounted file system.'
  1867. },
  1868. 'disk.ops': {
  1869. info: 'Completed disk I/O operations. Keep in mind the number of operations requested might be higher, since the system is able to merge adjacent to each other (see merged operations chart).'
  1870. },
  1871. 'disk_ext.ops': {
  1872. info: '<p>Number (after merges) of completed discard/flush requests.</p>'+
  1873. '<p><b>Discard</b> commands inform disks which blocks of data are no longer considered to be in use and therefore can be erased internally. '+
  1874. 'They are useful for solid-state drivers (SSDs) and thinly-provisioned storage. '+
  1875. 'Discarding/trimming enables the SSD to handle garbage collection more efficiently, '+
  1876. 'which would otherwise slow future write operations to the involved blocks down.</p>'+
  1877. '<p><b>Flush</b> operations transfer all modified in-core data (i.e., modified buffer cache pages) to the disk device '+
  1878. 'so that all changed information can be retrieved even if the system crashes or is rebooted. '+
  1879. 'Flush requests are executed by disks. Flush requests are not tracked for partitions. '+
  1880. 'Before being merged, flush operations are counted as writes.</p>'
  1881. },
  1882. 'disk.qops': {
  1883. info: 'I/O operations currently in progress. This metric is a snapshot - it is not an average over the last interval.'
  1884. },
  1885. 'disk.iotime': {
  1886. height: 0.5,
  1887. info: 'The sum of the duration of all completed I/O operations. This number can exceed the interval if the disk is able to execute I/O operations in parallel.'
  1888. },
  1889. 'disk_ext.iotime': {
  1890. height: 0.5,
  1891. info: 'The sum of the duration of all completed discard/flush operations. This number can exceed the interval if the disk is able to execute discard/flush operations in parallel.'
  1892. },
  1893. 'disk.mops': {
  1894. height: 0.5,
  1895. info: 'The number of merged disk operations. The system is able to merge adjacent I/O operations, for example two 4KB reads can become one 8KB read before given to disk.'
  1896. },
  1897. 'disk_ext.mops': {
  1898. height: 0.5,
  1899. info: 'The number of merged discard disk operations. Discard operations which are adjacent to each other may be merged for efficiency.'
  1900. },
  1901. 'disk.svctm': {
  1902. height: 0.5,
  1903. info: 'The average service time for completed I/O operations. This metric is calculated using the total busy time of the disk and the number of completed operations. If the disk is able to execute multiple parallel operations the reporting average service time will be misleading.'
  1904. },
  1905. 'disk.latency_io': {
  1906. height: 0.5,
  1907. info: 'Disk I/O latency is the time it takes for an I/O request to be completed. Latency is the single most important metric to focus on when it comes to storage performance, under most circumstances. For hard drives, an average latency somewhere between 10 to 20 ms can be considered acceptable. For SSD (Solid State Drives), depending on the workload it should never reach higher than 1-3 ms. In most cases, workloads will experience less than 1ms latency numbers. The dimensions refer to time intervals. This chart is based on the <a href="https://github.com/cloudflare/ebpf_exporter/blob/master/examples/bio-tracepoints.yaml" target="_blank">bio_tracepoints</a> tool of the ebpf_exporter.'
  1908. },
  1909. 'disk.avgsz': {
  1910. height: 0.5,
  1911. info: 'The average I/O operation size.'
  1912. },
  1913. 'disk_ext.avgsz': {
  1914. height: 0.5,
  1915. info: 'The average discard operation size.'
  1916. },
  1917. 'disk.await': {
  1918. height: 0.5,
  1919. info: 'The average time for I/O requests issued to the device to be served. This includes the time spent by the requests in queue and the time spent servicing them.'
  1920. },
  1921. 'disk_ext.await': {
  1922. height: 0.5,
  1923. info: 'The average time for discard/flush requests issued to the device to be served. This includes the time spent by the requests in queue and the time spent servicing them.'
  1924. },
  1925. 'disk.space': {
  1926. info: 'Disk space utilization. reserved for root is automatically reserved by the system to prevent the root user from getting out of space.'
  1927. },
  1928. 'disk.inodes': {
  1929. info: 'inodes (or index nodes) are filesystem objects (e.g. files and directories). On many types of file system implementations, the maximum number of inodes is fixed at filesystem creation, limiting the maximum number of files the filesystem can hold. It is possible for a device to run out of inodes. When this happens, new files cannot be created on the device, even though there may be free space available.'
  1930. },
  1931. 'disk.bcache_hit_ratio': {
  1932. info: '<p><b>Bcache (block cache)</b> is a cache in the block layer of Linux kernel, '+
  1933. 'which is used for accessing secondary storage devices. '+
  1934. 'It allows one or more fast storage devices, such as flash-based solid-state drives (SSDs), '+
  1935. 'to act as a cache for one or more slower storage devices, such as hard disk drives (HDDs).</p>'+
  1936. '<p>Percentage of data requests that were fulfilled right from the block cache. '+
  1937. 'Hits and misses are counted per individual IO as bcache sees them. '+
  1938. 'A partial hit is counted as a miss.</p>'
  1939. },
  1940. 'disk.bcache_rates': {
  1941. info: 'Throttling rates. '+
  1942. 'To avoid congestions bcache tracks latency to the cache device, and gradually throttles traffic if the latency exceeds a threshold. ' +
  1943. 'If the writeback percentage is nonzero, bcache tries to keep around this percentage of the cache dirty by '+
  1944. 'throttling background writeback and using a PD controller to smoothly adjust the rate.'
  1945. },
  1946. 'disk.bcache_size': {
  1947. info: 'Amount of dirty data for this backing device in the cache.'
  1948. },
  1949. 'disk.bcache_usage': {
  1950. info: 'Percentage of cache device which does not contain dirty data, and could potentially be used for writeback.'
  1951. },
  1952. 'disk.bcache_cache_read_races': {
  1953. info: '<b>Read races</b> happen when a bucket was reused and invalidated while data was being read from the cache. '+
  1954. 'When this occurs the data is reread from the backing device. '+
  1955. '<b>IO errors</b> are decayed by the half life. '+
  1956. 'If the decaying count reaches the limit, dirty data is written out and the cache is disabled.'
  1957. },
  1958. 'disk.bcache': {
  1959. info: 'Hits and misses are counted per individual IO as bcache sees them; a partial hit is counted as a miss. '+
  1960. 'Collisions happen when data was going to be inserted into the cache from a cache miss, '+
  1961. 'but raced with a write and data was already present. '+
  1962. 'Cache miss reads are rounded up to the readahead size, but without overlapping existing cache entries.'
  1963. },
  1964. 'disk.bcache_bypass': {
  1965. info: 'Hits and misses for IO that is intended to skip the cache.'
  1966. },
  1967. 'disk.bcache_cache_alloc': {
  1968. info: 'Working set size. '+
  1969. '<b>Unused</b> is the percentage of the cache that does not contain any data. '+
  1970. '<b>Dirty</b> is the data that is modified in the cache but not yet written to the permanent storage. '+
  1971. '<b>Clean</b> data matches the data stored on the permanent storage. '+
  1972. '<b>Metadata</b> is bcache\'s metadata overhead. '
  1973. },
  1974. // ------------------------------------------------------------------------
  1975. // ZFS pools
  1976. 'zfspool.state': {
  1977. info: 'ZFS pool state. The overall health of a pool, as reported by <code>zpool status</code>, is determined by the aggregate state of all devices within the pool. ' +
  1978. 'For details, see <a href="https://openzfs.github.io/openzfs-docs/man/8/zpoolconcepts.8.html?#Device_Failure_and_Recovery" target="_blank"> ZFS documentation</a>.'
  1979. },
  1980. // ------------------------------------------------------------------------
  1981. // MYSQL
  1982. 'mysql.net': {
  1983. info: 'The amount of data sent to mysql clients (<strong>out</strong>) and received from mysql clients (<strong>in</strong>).'
  1984. },
  1985. 'mysql.queries': {
  1986. info: 'The number of statements executed by the server.<ul>' +
  1987. '<li><strong>queries</strong> counts the statements executed within stored SQL programs.</li>' +
  1988. '<li><strong>questions</strong> counts the statements sent to the mysql server by mysql clients.</li>' +
  1989. '<li><strong>slow queries</strong> counts the number of statements that took more than <a href="http://dev.mysql.com/doc/refman/5.7/en/server-system-variables.html#sysvar_long_query_time" target="_blank">long_query_time</a> seconds to be executed.' +
  1990. ' For more information about slow queries check the mysql <a href="http://dev.mysql.com/doc/refman/5.7/en/slow-query-log.html" target="_blank">slow query log</a>.</li>' +
  1991. '</ul>'
  1992. },
  1993. 'mysql.handlers': {
  1994. info: 'Usage of the internal handlers of mysql. This chart provides very good insights of what the mysql server is actually doing.' +
  1995. ' (if the chart is not showing all these dimensions it is because they are zero - set <strong>Which dimensions to show?</strong> to <strong>All</strong> from the dashboard settings, to render even the zero values)<ul>' +
  1996. '<li><strong>commit</strong>, the number of internal <a href="http://dev.mysql.com/doc/refman/5.7/en/commit.html" target="_blank">COMMIT</a> statements.</li>' +
  1997. '<li><strong>delete</strong>, the number of times that rows have been deleted from tables.</li>' +
  1998. '<li><strong>prepare</strong>, a counter for the prepare phase of two-phase commit operations.</li>' +
  1999. '<li><strong>read first</strong>, the number of times the first entry in an index was read. A high value suggests that the server is doing a lot of full index scans; e.g. <strong>SELECT col1 FROM foo</strong>, with col1 indexed.</li>' +
  2000. '<li><strong>read key</strong>, the number of requests to read a row based on a key. If this value is high, it is a good indication that your tables are properly indexed for your queries.</li>' +
  2001. '<li><strong>read next</strong>, the number of requests to read the next row in key order. This value is incremented if you are querying an index column with a range constraint or if you are doing an index scan.</li>' +
  2002. '<li><strong>read prev</strong>, the number of requests to read the previous row in key order. This read method is mainly used to optimize <strong>ORDER BY ... DESC</strong>.</li>' +
  2003. '<li><strong>read rnd</strong>, the number of requests to read a row based on a fixed position. A high value indicates you are doing a lot of queries that require sorting of the result. You probably have a lot of queries that require MySQL to scan entire tables or you have joins that do not use keys properly.</li>' +
  2004. '<li><strong>read rnd next</strong>, the number of requests to read the next row in the data file. This value is high if you are doing a lot of table scans. Generally this suggests that your tables are not properly indexed or that your queries are not written to take advantage of the indexes you have.</li>' +
  2005. '<li><strong>rollback</strong>, the number of requests for a storage engine to perform a rollback operation.</li>' +
  2006. '<li><strong>savepoint</strong>, the number of requests for a storage engine to place a savepoint.</li>' +
  2007. '<li><strong>savepoint rollback</strong>, the number of requests for a storage engine to roll back to a savepoint.</li>' +
  2008. '<li><strong>update</strong>, the number of requests to update a row in a table.</li>' +
  2009. '<li><strong>write</strong>, the number of requests to insert a row in a table.</li>' +
  2010. '</ul>'
  2011. },
  2012. 'mysql.table_locks': {
  2013. info: 'MySQL table locks counters: <ul>' +
  2014. '<li><strong>immediate</strong>, the number of times that a request for a table lock could be granted immediately.</li>' +
  2015. '<li><strong>waited</strong>, the number of times that a request for a table lock could not be granted immediately and a wait was needed. If this is high and you have performance problems, you should first optimize your queries, and then either split your table or tables or use replication.</li>' +
  2016. '</ul>'
  2017. },
  2018. 'mysql.innodb_deadlocks': {
  2019. info: 'A deadlock happens when two or more transactions mutually hold and request for locks, creating a cycle of dependencies. For more information about <a href="https://dev.mysql.com/doc/refman/5.7/en/innodb-deadlocks-handling.html" target="_blank">how to minimize and handle deadlocks</a>.'
  2020. },
  2021. 'mysql.galera_cluster_status': {
  2022. info:
  2023. '<code>-1</code>: unknown, ' +
  2024. '<code>0</code>: primary (primary group configuration, quorum present), ' +
  2025. '<code>1</code>: non-primary (non-primary group configuration, quorum lost), ' +
  2026. '<code>2</code>: disconnected(not connected to group, retrying).'
  2027. },
  2028. 'mysql.galera_cluster_state': {
  2029. info:
  2030. '<code>0</code>: Undefined, ' +
  2031. '<code>1</code>: Joining, ' +
  2032. '<code>2</code>: Donor/Desynced, ' +
  2033. '<code>3</code>: Joined, ' +
  2034. '<code>4</code>: Synced, ' +
  2035. '<code>5</code>: Inconsistent.'
  2036. },
  2037. 'mysql.galera_cluster_weight': {
  2038. info: 'The value is counted as a sum of <code>pc.weight</code> of the nodes in the current Primary Component.'
  2039. },
  2040. 'mysql.galera_connected': {
  2041. info: '<code>0</code> means that the node has not yet connected to any of the cluster components. ' +
  2042. 'This may be due to misconfiguration.'
  2043. },
  2044. 'mysql.open_transactions': {
  2045. info: 'The number of locally running transactions which have been registered inside the wsrep provider. ' +
  2046. 'This means transactions which have made operations which have caused write set population to happen. ' +
  2047. 'Transactions which are read only are not counted.'
  2048. },
  2049. // ------------------------------------------------------------------------
  2050. // POSTGRESQL
  2051. 'postgres.db_stat_blks': {
  2052. info: 'Blocks reads from disk or cache.<ul>' +
  2053. '<li><strong>blks_read:</strong> number of disk blocks read in this database.</li>' +
  2054. '<li><strong>blks_hit:</strong> number of times disk blocks were found already in the buffer cache, so that a read was not necessary (this only includes hits in the PostgreSQL buffer cache, not the operating system&#39;s file system cache)</li>' +
  2055. '</ul>'
  2056. },
  2057. 'postgres.db_stat_tuple_write': {
  2058. info: '<ul><li>Number of rows inserted/updated/deleted.</li>' +
  2059. '<li><strong>conflicts:</strong> number of queries canceled due to conflicts with recovery in this database. (Conflicts occur only on standby servers; see <a href="https://www.postgresql.org/docs/10/static/monitoring-stats.html#PG-STAT-DATABASE-CONFLICTS-VIEW" target="_blank">pg_stat_database_conflicts</a> for details.)</li>' +
  2060. '</ul>'
  2061. },
  2062. 'postgres.db_stat_temp_bytes': {
  2063. info: 'Temporary files can be created on disk for sorts, hashes, and temporary query results.'
  2064. },
  2065. 'postgres.db_stat_temp_files': {
  2066. info: '<ul>' +
  2067. '<li><strong>files:</strong> number of temporary files created by queries. All temporary files are counted, regardless of why the temporary file was created (e.g., sorting or hashing).</li>' +
  2068. '</ul>'
  2069. },
  2070. 'postgres.archive_wal': {
  2071. info: 'WAL archiving.<ul>' +
  2072. '<li><strong>total:</strong> total files.</li>' +
  2073. '<li><strong>ready:</strong> WAL waiting to be archived.</li>' +
  2074. '<li><strong>done:</strong> WAL successfully archived. ' +
  2075. 'Ready WAL can indicate archive_command is in error, see <a href="https://www.postgresql.org/docs/current/static/continuous-archiving.html" target="_blank">Continuous Archiving and Point-in-Time Recovery</a>.</li>' +
  2076. '</ul>'
  2077. },
  2078. 'postgres.checkpointer': {
  2079. info: 'Number of checkpoints.<ul>' +
  2080. '<li><strong>scheduled:</strong> when checkpoint_timeout is reached.</li>' +
  2081. '<li><strong>requested:</strong> when max_wal_size is reached.</li>' +
  2082. '</ul>' +
  2083. 'For more information see <a href="https://www.postgresql.org/docs/current/static/wal-configuration.html" target="_blank">WAL Configuration</a>.'
  2084. },
  2085. 'postgres.autovacuum': {
  2086. info: 'PostgreSQL databases require periodic maintenance known as vacuuming. For many installations, it is sufficient to let vacuuming be performed by the autovacuum daemon. ' +
  2087. 'For more information see <a href="https://www.postgresql.org/docs/current/static/routine-vacuuming.html#AUTOVACUUM" target="_blank">The Autovacuum Daemon</a>.'
  2088. },
  2089. 'postgres.standby_delta': {
  2090. info: 'Streaming replication delta.<ul>' +
  2091. '<li><strong>sent_delta:</strong> replication delta sent to standby.</li>' +
  2092. '<li><strong>write_delta:</strong> replication delta written to disk by this standby.</li>' +
  2093. '<li><strong>flush_delta:</strong> replication delta flushed to disk by this standby server.</li>' +
  2094. '<li><strong>replay_delta:</strong> replication delta replayed into the database on this standby server.</li>' +
  2095. '</ul>' +
  2096. 'For more information see <a href="https://www.postgresql.org/docs/current/static/warm-standby.html#SYNCHRONOUS-REPLICATION" target="_blank">Synchronous Replication</a>.'
  2097. },
  2098. 'postgres.replication_slot': {
  2099. info: 'Replication slot files.<ul>' +
  2100. '<li><strong>wal_keeped:</strong> WAL files retained by each replication slots.</li>' +
  2101. '<li><strong>pg_replslot_files:</strong> files present in pg_replslot.</li>' +
  2102. '</ul>' +
  2103. 'For more information see <a href="https://www.postgresql.org/docs/current/static/warm-standby.html#STREAMING-REPLICATION-SLOTS" target="_blank">Replication Slots</a>.'
  2104. },
  2105. 'postgres.backend_usage': {
  2106. info: 'Connections usage against maximum connections allowed, as defined in the <i>max_connections</i> setting.<ul>' +
  2107. '<li><strong>available:</strong> maximum new connections allowed.</li>' +
  2108. '<li><strong>used:</strong> connections currently in use.</li>' +
  2109. '</ul>' +
  2110. 'Assuming non-superuser accounts are being used to connect to Postgres (so <i>superuser_reserved_connections</i> are subtracted from <i>max_connections</i>).<br/>' +
  2111. 'For more information see <a href="https://www.postgresql.org/docs/current/runtime-config-connection.html" target="_blank">Connections and Authentication</a>.'
  2112. },
  2113. 'postgres.forced_autovacuum': {
  2114. info: 'Percent towards forced autovacuum for one or more tables.<ul>' +
  2115. '<li><strong>percent_towards_forced_autovacuum:</strong> a forced autovacuum will run once this value reaches 100.</li>' +
  2116. '</ul>' +
  2117. 'For more information see <a href="https://www.postgresql.org/docs/current/routine-vacuuming.html" target="_blank">Preventing Transaction ID Wraparound Failures</a>.'
  2118. },
  2119. 'postgres.tx_wraparound_oldest_current_xid': {
  2120. info: 'The oldest current transaction id (xid).<ul>' +
  2121. '<li><strong>oldest_current_xid:</strong> oldest current transaction id.</li>' +
  2122. '</ul>' +
  2123. 'If for some reason autovacuum fails to clear old XIDs from a table, the system will begin to emit warning messages when the database\'s oldest XIDs reach eleven million transactions from the wraparound point.<br/>' +
  2124. 'For more information see <a href="https://www.postgresql.org/docs/current/routine-vacuuming.html" target="_blank">Preventing Transaction ID Wraparound Failures</a>.'
  2125. },
  2126. 'postgres.percent_towards_wraparound': {
  2127. info: 'Percent towards transaction wraparound.<ul>' +
  2128. '<li><strong>percent_towards_wraparound:</strong> transaction wraparound may occur when this value reaches 100.</li>' +
  2129. '</ul>' +
  2130. 'For more information see <a href="https://www.postgresql.org/docs/current/routine-vacuuming.html" target="_blank">Preventing Transaction ID Wraparound Failures</a>.'
  2131. },
  2132. // ------------------------------------------------------------------------
  2133. // APACHE
  2134. 'apache.connections': {
  2135. colors: NETDATA.colors[4],
  2136. mainheads: [
  2137. netdataDashboard.gaugeChart('Connections', '12%', '', NETDATA.colors[4])
  2138. ]
  2139. },
  2140. 'apache.requests': {
  2141. colors: NETDATA.colors[0],
  2142. mainheads: [
  2143. netdataDashboard.gaugeChart('Requests', '12%', '', NETDATA.colors[0])
  2144. ]
  2145. },
  2146. 'apache.net': {
  2147. colors: NETDATA.colors[3],
  2148. mainheads: [
  2149. netdataDashboard.gaugeChart('Bandwidth', '12%', '', NETDATA.colors[3])
  2150. ]
  2151. },
  2152. 'apache.workers': {
  2153. mainheads: [
  2154. function (os, id) {
  2155. void (os);
  2156. return '<div data-netdata="' + id + '"'
  2157. + ' data-dimensions="busy"'
  2158. + ' data-append-options="percentage"'
  2159. + ' data-gauge-max-value="100"'
  2160. + ' data-chart-library="gauge"'
  2161. + ' data-title="Workers Utilization"'
  2162. + ' data-units="percentage %"'
  2163. + ' data-gauge-adjust="width"'
  2164. + ' data-width="12%"'
  2165. + ' data-before="0"'
  2166. + ' data-after="-CHART_DURATION"'
  2167. + ' data-points="CHART_DURATION"'
  2168. + ' role="application"></div>';
  2169. }
  2170. ]
  2171. },
  2172. 'apache.bytesperreq': {
  2173. colors: NETDATA.colors[3],
  2174. height: 0.5
  2175. },
  2176. 'apache.reqpersec': {
  2177. colors: NETDATA.colors[4],
  2178. height: 0.5
  2179. },
  2180. 'apache.bytespersec': {
  2181. colors: NETDATA.colors[6],
  2182. height: 0.5
  2183. },
  2184. // ------------------------------------------------------------------------
  2185. // LIGHTTPD
  2186. 'lighttpd.connections': {
  2187. colors: NETDATA.colors[4],
  2188. mainheads: [
  2189. netdataDashboard.gaugeChart('Connections', '12%', '', NETDATA.colors[4])
  2190. ]
  2191. },
  2192. 'lighttpd.requests': {
  2193. colors: NETDATA.colors[0],
  2194. mainheads: [
  2195. netdataDashboard.gaugeChart('Requests', '12%', '', NETDATA.colors[0])
  2196. ]
  2197. },
  2198. 'lighttpd.net': {
  2199. colors: NETDATA.colors[3],
  2200. mainheads: [
  2201. netdataDashboard.gaugeChart('Bandwidth', '12%', '', NETDATA.colors[3])
  2202. ]
  2203. },
  2204. 'lighttpd.workers': {
  2205. mainheads: [
  2206. function (os, id) {
  2207. void (os);
  2208. return '<div data-netdata="' + id + '"'
  2209. + ' data-dimensions="busy"'
  2210. + ' data-append-options="percentage"'
  2211. + ' data-gauge-max-value="100"'
  2212. + ' data-chart-library="gauge"'
  2213. + ' data-title="Servers Utilization"'
  2214. + ' data-units="percentage %"'
  2215. + ' data-gauge-adjust="width"'
  2216. + ' data-width="12%"'
  2217. + ' data-before="0"'
  2218. + ' data-after="-CHART_DURATION"'
  2219. + ' data-points="CHART_DURATION"'
  2220. + ' role="application"></div>';
  2221. }
  2222. ]
  2223. },
  2224. 'lighttpd.bytesperreq': {
  2225. colors: NETDATA.colors[3],
  2226. height: 0.5
  2227. },
  2228. 'lighttpd.reqpersec': {
  2229. colors: NETDATA.colors[4],
  2230. height: 0.5
  2231. },
  2232. 'lighttpd.bytespersec': {
  2233. colors: NETDATA.colors[6],
  2234. height: 0.5
  2235. },
  2236. // ------------------------------------------------------------------------
  2237. // NGINX
  2238. 'nginx.connections': {
  2239. colors: NETDATA.colors[4],
  2240. mainheads: [
  2241. netdataDashboard.gaugeChart('Connections', '12%', '', NETDATA.colors[4])
  2242. ]
  2243. },
  2244. 'nginx.requests': {
  2245. colors: NETDATA.colors[0],
  2246. mainheads: [
  2247. netdataDashboard.gaugeChart('Requests', '12%', '', NETDATA.colors[0])
  2248. ]
  2249. },
  2250. // ------------------------------------------------------------------------
  2251. // HTTP check
  2252. 'httpcheck.responsetime': {
  2253. info: 'The <code>response time</code> describes the time passed between request and response. ' +
  2254. 'Currently, the accuracy of the response time is low and should be used as reference only.'
  2255. },
  2256. 'httpcheck.responselength': {
  2257. info: 'The <code>response length</code> counts the number of characters in the response body. For static pages, this should be mostly constant.'
  2258. },
  2259. 'httpcheck.status': {
  2260. valueRange: "[0, 1]",
  2261. info: 'This chart verifies the response of the webserver. Each status dimension will have a value of <code>1</code> if triggered. ' +
  2262. 'Dimension <code>success</code> is <code>1</code> only if all constraints are satisfied. ' +
  2263. 'This chart is most useful for alarms or third-party apps.'
  2264. },
  2265. // ------------------------------------------------------------------------
  2266. // NETDATA
  2267. 'netdata.response_time': {
  2268. info: 'The netdata API response time measures the time netdata needed to serve requests. This time includes everything, from the reception of the first byte of a request, to the dispatch of the last byte of its reply, therefore it includes all network latencies involved (i.e. a client over a slow network will influence these metrics).'
  2269. },
  2270. // ------------------------------------------------------------------------
  2271. // RETROSHARE
  2272. 'retroshare.bandwidth': {
  2273. info: 'RetroShare inbound and outbound traffic.',
  2274. mainheads: [
  2275. netdataDashboard.gaugeChart('Received', '12%', 'bandwidth_down_kb'),
  2276. netdataDashboard.gaugeChart('Sent', '12%', 'bandwidth_up_kb')
  2277. ]
  2278. },
  2279. 'retroshare.peers': {
  2280. info: 'Number of (connected) RetroShare friends.',
  2281. mainheads: [
  2282. function (os, id) {
  2283. void (os);
  2284. return '<div data-netdata="' + id + '"'
  2285. + ' data-dimensions="peers_connected"'
  2286. + ' data-append-options="friends"'
  2287. + ' data-chart-library="easypiechart"'
  2288. + ' data-title="connected friends"'
  2289. + ' data-units=""'
  2290. + ' data-width="8%"'
  2291. + ' data-before="0"'
  2292. + ' data-after="-CHART_DURATION"'
  2293. + ' data-points="CHART_DURATION"'
  2294. + ' role="application"></div>';
  2295. }
  2296. ]
  2297. },
  2298. 'retroshare.dht': {
  2299. info: 'Statistics about RetroShare\'s DHT. These values are estimated!'
  2300. },
  2301. // ------------------------------------------------------------------------
  2302. // fping
  2303. 'fping.quality': {
  2304. colors: NETDATA.colors[10],
  2305. height: 0.5
  2306. },
  2307. 'fping.packets': {
  2308. height: 0.5
  2309. },
  2310. // ------------------------------------------------------------------------
  2311. // containers
  2312. 'cgroup.cpu_limit': {
  2313. valueRange: "[0, null]",
  2314. mainheads: [
  2315. function (os, id) {
  2316. void (os);
  2317. cgroupCPULimitIsSet = 1;
  2318. return '<div data-netdata="' + id + '"'
  2319. + ' data-dimensions="used"'
  2320. + ' data-gauge-max-value="100"'
  2321. + ' data-chart-library="gauge"'
  2322. + ' data-title="CPU"'
  2323. + ' data-units="%"'
  2324. + ' data-gauge-adjust="width"'
  2325. + ' data-width="12%"'
  2326. + ' data-before="0"'
  2327. + ' data-after="-CHART_DURATION"'
  2328. + ' data-points="CHART_DURATION"'
  2329. + ' data-colors="' + NETDATA.colors[4] + '"'
  2330. + ' role="application"></div>';
  2331. }
  2332. ]
  2333. },
  2334. 'cgroup.cpu': {
  2335. mainheads: [
  2336. function (os, id) {
  2337. void (os);
  2338. if (cgroupCPULimitIsSet === 0) {
  2339. return '<div data-netdata="' + id + '"'
  2340. + ' data-chart-library="gauge"'
  2341. + ' data-title="CPU"'
  2342. + ' data-units="%"'
  2343. + ' data-gauge-adjust="width"'
  2344. + ' data-width="12%"'
  2345. + ' data-before="0"'
  2346. + ' data-after="-CHART_DURATION"'
  2347. + ' data-points="CHART_DURATION"'
  2348. + ' data-colors="' + NETDATA.colors[4] + '"'
  2349. + ' role="application"></div>';
  2350. } else
  2351. return '';
  2352. }
  2353. ]
  2354. },
  2355. 'cgroup.mem_usage_limit': {
  2356. mainheads: [
  2357. function (os, id) {
  2358. void (os);
  2359. cgroupMemLimitIsSet = 1;
  2360. return '<div data-netdata="' + id + '"'
  2361. + ' data-dimensions="used"'
  2362. + ' data-append-options="percentage"'
  2363. + ' data-gauge-max-value="100"'
  2364. + ' data-chart-library="gauge"'
  2365. + ' data-title="Memory"'
  2366. + ' data-units="%"'
  2367. + ' data-gauge-adjust="width"'
  2368. + ' data-width="12%"'
  2369. + ' data-before="0"'
  2370. + ' data-after="-CHART_DURATION"'
  2371. + ' data-points="CHART_DURATION"'
  2372. + ' data-colors="' + NETDATA.colors[1] + '"'
  2373. + ' role="application"></div>';
  2374. }
  2375. ]
  2376. },
  2377. 'cgroup.mem_usage': {
  2378. mainheads: [
  2379. function (os, id) {
  2380. void (os);
  2381. if (cgroupMemLimitIsSet === 0) {
  2382. return '<div data-netdata="' + id + '"'
  2383. + ' data-chart-library="gauge"'
  2384. + ' data-title="Memory"'
  2385. + ' data-units="MB"'
  2386. + ' data-gauge-adjust="width"'
  2387. + ' data-width="12%"'
  2388. + ' data-before="0"'
  2389. + ' data-after="-CHART_DURATION"'
  2390. + ' data-points="CHART_DURATION"'
  2391. + ' data-colors="' + NETDATA.colors[1] + '"'
  2392. + ' role="application"></div>';
  2393. } else
  2394. return '';
  2395. }
  2396. ]
  2397. },
  2398. 'cgroup.throttle_io': {
  2399. mainheads: [
  2400. function (os, id) {
  2401. void (os);
  2402. return '<div data-netdata="' + id + '"'
  2403. + ' data-dimensions="read"'
  2404. + ' data-chart-library="gauge"'
  2405. + ' data-title="Read Disk I/O"'
  2406. + ' data-units="KB/s"'
  2407. + ' data-gauge-adjust="width"'
  2408. + ' data-width="12%"'
  2409. + ' data-before="0"'
  2410. + ' data-after="-CHART_DURATION"'
  2411. + ' data-points="CHART_DURATION"'
  2412. + ' data-colors="' + NETDATA.colors[2] + '"'
  2413. + ' role="application"></div>';
  2414. },
  2415. function (os, id) {
  2416. void (os);
  2417. return '<div data-netdata="' + id + '"'
  2418. + ' data-dimensions="write"'
  2419. + ' data-chart-library="gauge"'
  2420. + ' data-title="Write Disk I/O"'
  2421. + ' data-units="KB/s"'
  2422. + ' data-gauge-adjust="width"'
  2423. + ' data-width="12%"'
  2424. + ' data-before="0"'
  2425. + ' data-after="-CHART_DURATION"'
  2426. + ' data-points="CHART_DURATION"'
  2427. + ' data-colors="' + NETDATA.colors[3] + '"'
  2428. + ' role="application"></div>';
  2429. }
  2430. ]
  2431. },
  2432. // ------------------------------------------------------------------------
  2433. // beanstalkd
  2434. // system charts
  2435. 'beanstalk.cpu_usage': {
  2436. info: 'Amount of CPU Time for user and system used by beanstalkd.'
  2437. },
  2438. // This is also a per-tube stat
  2439. 'beanstalk.jobs_rate': {
  2440. info: 'The rate of jobs processed by the beanstalkd served.'
  2441. },
  2442. 'beanstalk.connections_rate': {
  2443. info: 'The rate of connections opened to beanstalkd.'
  2444. },
  2445. 'beanstalk.commands_rate': {
  2446. info: 'The rate of commands received by beanstalkd.'
  2447. },
  2448. 'beanstalk.current_tubes': {
  2449. info: 'Total number of current tubes on the server including the default tube (which always exists).'
  2450. },
  2451. 'beanstalk.current_jobs': {
  2452. info: 'Current number of jobs in all tubes grouped by status: urgent, ready, reserved, delayed and buried.'
  2453. },
  2454. 'beanstalk.current_connections': {
  2455. info: 'Current number of connections group by connection type: written, producers, workers, waiting.'
  2456. },
  2457. 'beanstalk.binlog': {
  2458. info: 'The rate of records <code>written</code> to binlog and <code>migrated</code> as part of compaction.'
  2459. },
  2460. 'beanstalk.uptime': {
  2461. info: 'Total time beanstalkd server has been up for.'
  2462. },
  2463. // tube charts
  2464. 'beanstalk.jobs': {
  2465. info: 'Number of jobs currently in the tube grouped by status: urgent, ready, reserved, delayed and buried.'
  2466. },
  2467. 'beanstalk.connections': {
  2468. info: 'The current number of connections to this tube grouped by connection type; using, waiting and watching.'
  2469. },
  2470. 'beanstalk.commands': {
  2471. info: 'The rate of <code>delete</code> and <code>pause</code> commands executed by beanstalkd.'
  2472. },
  2473. 'beanstalk.pause': {
  2474. info: 'Shows info on how long the tube has been paused for, and how long is left remaining on the pause.'
  2475. },
  2476. // ------------------------------------------------------------------------
  2477. // ceph
  2478. 'ceph.general_usage': {
  2479. info: 'The usage and available space in all ceph cluster.'
  2480. },
  2481. 'ceph.general_objects': {
  2482. info: 'Total number of objects storage on ceph cluster.'
  2483. },
  2484. 'ceph.general_bytes': {
  2485. info: 'Cluster read and write data per second.'
  2486. },
  2487. 'ceph.general_operations': {
  2488. info: 'Number of read and write operations per second.'
  2489. },
  2490. 'ceph.general_latency': {
  2491. info: 'Total of apply and commit latency in all OSDs. The apply latency is the total time taken to flush an update to disk. The commit latency is the total time taken to commit an operation to the journal.'
  2492. },
  2493. 'ceph.pool_usage': {
  2494. info: 'The usage space in each pool.'
  2495. },
  2496. 'ceph.pool_objects': {
  2497. info: 'Number of objects presents in each pool.'
  2498. },
  2499. 'ceph.pool_read_bytes': {
  2500. info: 'The rate of read data per second in each pool.'
  2501. },
  2502. 'ceph.pool_write_bytes': {
  2503. info: 'The rate of write data per second in each pool.'
  2504. },
  2505. 'ceph.pool_read_objects': {
  2506. info: 'Number of read objects per second in each pool.'
  2507. },
  2508. 'ceph.pool_write_objects': {
  2509. info: 'Number of write objects per second in each pool.'
  2510. },
  2511. 'ceph.osd_usage': {
  2512. info: 'The usage space in each OSD.'
  2513. },
  2514. 'ceph.osd_size': {
  2515. info: "Each OSD's size"
  2516. },
  2517. 'ceph.apply_latency': {
  2518. info: 'Time taken to flush an update in each OSD.'
  2519. },
  2520. 'ceph.commit_latency': {
  2521. info: 'Time taken to commit an operation to the journal in each OSD.'
  2522. },
  2523. // ------------------------------------------------------------------------
  2524. // web_log
  2525. 'web_log.response_statuses': {
  2526. info: 'Web server responses by type. <code>success</code> includes <b>1xx</b>, <b>2xx</b>, <b>304</b> and <b>401</b>, <code>error</code> includes <b>5xx</b>, <code>redirect</code> includes <b>3xx</b> except <b>304</b>, <code>bad</code> includes <b>4xx</b> except <b>401</b>, <code>other</code> are all the other responses.',
  2527. mainheads: [
  2528. function (os, id) {
  2529. void (os);
  2530. return '<div data-netdata="' + id + '"'
  2531. + ' data-dimensions="success"'
  2532. + ' data-chart-library="gauge"'
  2533. + ' data-title="Successful"'
  2534. + ' data-units="requests/s"'
  2535. + ' data-gauge-adjust="width"'
  2536. + ' data-width="12%"'
  2537. + ' data-before="0"'
  2538. + ' data-after="-CHART_DURATION"'
  2539. + ' data-points="CHART_DURATION"'
  2540. + ' data-common-max="' + id + '"'
  2541. + ' data-colors="' + NETDATA.colors[0] + '"'
  2542. + ' data-decimal-digits="0"'
  2543. + ' role="application"></div>';
  2544. },
  2545. function (os, id) {
  2546. void (os);
  2547. return '<div data-netdata="' + id + '"'
  2548. + ' data-dimensions="redirect"'
  2549. + ' data-chart-library="gauge"'
  2550. + ' data-title="Redirects"'
  2551. + ' data-units="requests/s"'
  2552. + ' data-gauge-adjust="width"'
  2553. + ' data-width="12%"'
  2554. + ' data-before="0"'
  2555. + ' data-after="-CHART_DURATION"'
  2556. + ' data-points="CHART_DURATION"'
  2557. + ' data-common-max="' + id + '"'
  2558. + ' data-colors="' + NETDATA.colors[2] + '"'
  2559. + ' data-decimal-digits="0"'
  2560. + ' role="application"></div>';
  2561. },
  2562. function (os, id) {
  2563. void (os);
  2564. return '<div data-netdata="' + id + '"'
  2565. + ' data-dimensions="bad"'
  2566. + ' data-chart-library="gauge"'
  2567. + ' data-title="Bad Requests"'
  2568. + ' data-units="requests/s"'
  2569. + ' data-gauge-adjust="width"'
  2570. + ' data-width="12%"'
  2571. + ' data-before="0"'
  2572. + ' data-after="-CHART_DURATION"'
  2573. + ' data-points="CHART_DURATION"'
  2574. + ' data-common-max="' + id + '"'
  2575. + ' data-colors="' + NETDATA.colors[3] + '"'
  2576. + ' data-decimal-digits="0"'
  2577. + ' role="application"></div>';
  2578. },
  2579. function (os, id) {
  2580. void (os);
  2581. return '<div data-netdata="' + id + '"'
  2582. + ' data-dimensions="error"'
  2583. + ' data-chart-library="gauge"'
  2584. + ' data-title="Server Errors"'
  2585. + ' data-units="requests/s"'
  2586. + ' data-gauge-adjust="width"'
  2587. + ' data-width="12%"'
  2588. + ' data-before="0"'
  2589. + ' data-after="-CHART_DURATION"'
  2590. + ' data-points="CHART_DURATION"'
  2591. + ' data-common-max="' + id + '"'
  2592. + ' data-colors="' + NETDATA.colors[1] + '"'
  2593. + ' data-decimal-digits="0"'
  2594. + ' role="application"></div>';
  2595. }
  2596. ]
  2597. },
  2598. 'web_log.response_codes': {
  2599. info: 'Web server responses by code family. ' +
  2600. 'According to the standards <code>1xx</code> are informational responses, ' +
  2601. '<code>2xx</code> are successful responses, ' +
  2602. '<code>3xx</code> are redirects (although they include <b>304</b> which is used as "<b>not modified</b>"), ' +
  2603. '<code>4xx</code> are bad requests, ' +
  2604. '<code>5xx</code> are internal server errors, ' +
  2605. '<code>other</code> are non-standard responses, ' +
  2606. '<code>unmatched</code> counts the lines in the log file that are not matched by the plugin (<a href="https://github.com/netdata/netdata/issues/new?title=web_log%20reports%20unmatched%20lines&body=web_log%20plugin%20reports%20unmatched%20lines.%0A%0AThis%20is%20my%20log:%0A%0A%60%60%60txt%0A%0Aplease%20paste%20your%20web%20server%20log%20here%0A%0A%60%60%60" target="_blank">let us know</a> if you have any unmatched).'
  2607. },
  2608. 'web_log.response_time': {
  2609. mainheads: [
  2610. function (os, id) {
  2611. void (os);
  2612. return '<div data-netdata="' + id + '"'
  2613. + ' data-dimensions="avg"'
  2614. + ' data-chart-library="gauge"'
  2615. + ' data-title="Average Response Time"'
  2616. + ' data-units="milliseconds"'
  2617. + ' data-gauge-adjust="width"'
  2618. + ' data-width="12%"'
  2619. + ' data-before="0"'
  2620. + ' data-after="-CHART_DURATION"'
  2621. + ' data-points="CHART_DURATION"'
  2622. + ' data-colors="' + NETDATA.colors[4] + '"'
  2623. + ' data-decimal-digits="2"'
  2624. + ' role="application"></div>';
  2625. }
  2626. ]
  2627. },
  2628. 'web_log.detailed_response_codes': {
  2629. info: 'Number of responses for each response code individually.'
  2630. },
  2631. 'web_log.requests_per_ipproto': {
  2632. info: 'Web server requests received per IP protocol version.'
  2633. },
  2634. 'web_log.clients': {
  2635. info: 'Unique client IPs accessing the web server, within each data collection iteration. If data collection is <b>per second</b>, this chart shows <b>unique client IPs per second</b>.'
  2636. },
  2637. 'web_log.clients_all': {
  2638. info: 'Unique client IPs accessing the web server since the last restart of netdata. This plugin keeps in memory all the unique IPs that have accessed the web server. On very busy web servers (several millions of unique IPs) you may want to disable this chart (check <a href="https://github.com/netdata/netdata/blob/master/collectors/python.d.plugin/web_log/web_log.conf" target="_blank"><code>/etc/netdata/python.d/web_log.conf</code></a>).'
  2639. },
  2640. // ------------------------------------------------------------------------
  2641. // web_log for squid
  2642. 'web_log.squid_response_statuses': {
  2643. info: 'Squid responses by type. ' +
  2644. '<code>success</code> includes <b>1xx</b>, <b>2xx</b>, <b>000</b>, <b>304</b>, ' +
  2645. '<code>error</code> includes <b>5xx</b> and <b>6xx</b>, ' +
  2646. '<code>redirect</code> includes <b>3xx</b> except <b>304</b>, ' +
  2647. '<code>bad</code> includes <b>4xx</b>, ' +
  2648. '<code>other</code> are all the other responses.',
  2649. mainheads: [
  2650. function (os, id) {
  2651. void (os);
  2652. return '<div data-netdata="' + id + '"'
  2653. + ' data-dimensions="success"'
  2654. + ' data-chart-library="gauge"'
  2655. + ' data-title="Successful"'
  2656. + ' data-units="requests/s"'
  2657. + ' data-gauge-adjust="width"'
  2658. + ' data-width="12%"'
  2659. + ' data-before="0"'
  2660. + ' data-after="-CHART_DURATION"'
  2661. + ' data-points="CHART_DURATION"'
  2662. + ' data-common-max="' + id + '"'
  2663. + ' data-colors="' + NETDATA.colors[0] + '"'
  2664. + ' data-decimal-digits="0"'
  2665. + ' role="application"></div>';
  2666. },
  2667. function (os, id) {
  2668. void (os);
  2669. return '<div data-netdata="' + id + '"'
  2670. + ' data-dimensions="redirect"'
  2671. + ' data-chart-library="gauge"'
  2672. + ' data-title="Redirects"'
  2673. + ' data-units="requests/s"'
  2674. + ' data-gauge-adjust="width"'
  2675. + ' data-width="12%"'
  2676. + ' data-before="0"'
  2677. + ' data-after="-CHART_DURATION"'
  2678. + ' data-points="CHART_DURATION"'
  2679. + ' data-common-max="' + id + '"'
  2680. + ' data-colors="' + NETDATA.colors[2] + '"'
  2681. + ' data-decimal-digits="0"'
  2682. + ' role="application"></div>';
  2683. },
  2684. function (os, id) {
  2685. void (os);
  2686. return '<div data-netdata="' + id + '"'
  2687. + ' data-dimensions="bad"'
  2688. + ' data-chart-library="gauge"'
  2689. + ' data-title="Bad Requests"'
  2690. + ' data-units="requests/s"'
  2691. + ' data-gauge-adjust="width"'
  2692. + ' data-width="12%"'
  2693. + ' data-before="0"'
  2694. + ' data-after="-CHART_DURATION"'
  2695. + ' data-points="CHART_DURATION"'
  2696. + ' data-common-max="' + id + '"'
  2697. + ' data-colors="' + NETDATA.colors[3] + '"'
  2698. + ' data-decimal-digits="0"'
  2699. + ' role="application"></div>';
  2700. },
  2701. function (os, id) {
  2702. void (os);
  2703. return '<div data-netdata="' + id + '"'
  2704. + ' data-dimensions="error"'
  2705. + ' data-chart-library="gauge"'
  2706. + ' data-title="Server Errors"'
  2707. + ' data-units="requests/s"'
  2708. + ' data-gauge-adjust="width"'
  2709. + ' data-width="12%"'
  2710. + ' data-before="0"'
  2711. + ' data-after="-CHART_DURATION"'
  2712. + ' data-points="CHART_DURATION"'
  2713. + ' data-common-max="' + id + '"'
  2714. + ' data-colors="' + NETDATA.colors[1] + '"'
  2715. + ' data-decimal-digits="0"'
  2716. + ' role="application"></div>';
  2717. }
  2718. ]
  2719. },
  2720. 'web_log.squid_response_codes': {
  2721. info: 'Web server responses by code family. ' +
  2722. 'According to HTTP standards <code>1xx</code> are informational responses, ' +
  2723. '<code>2xx</code> are successful responses, ' +
  2724. '<code>3xx</code> are redirects (although they include <b>304</b> which is used as "<b>not modified</b>"), ' +
  2725. '<code>4xx</code> are bad requests, ' +
  2726. '<code>5xx</code> are internal server errors. ' +
  2727. 'Squid also defines <code>000</code> mostly for UDP requests, and ' +
  2728. '<code>6xx</code> for broken upstream servers sending wrong headers. ' +
  2729. 'Finally, <code>other</code> are non-standard responses, and ' +
  2730. '<code>unmatched</code> counts the lines in the log file that are not matched by the plugin (<a href="https://github.com/netdata/netdata/issues/new?title=web_log%20reports%20unmatched%20lines&body=web_log%20plugin%20reports%20unmatched%20lines.%0A%0AThis%20is%20my%20log:%0A%0A%60%60%60txt%0A%0Aplease%20paste%20your%20web%20server%20log%20here%0A%0A%60%60%60" target="_blank">let us know</a> if you have any unmatched).'
  2731. },
  2732. 'web_log.squid_duration': {
  2733. mainheads: [
  2734. function (os, id) {
  2735. void (os);
  2736. return '<div data-netdata="' + id + '"'
  2737. + ' data-dimensions="avg"'
  2738. + ' data-chart-library="gauge"'
  2739. + ' data-title="Average Response Time"'
  2740. + ' data-units="milliseconds"'
  2741. + ' data-gauge-adjust="width"'
  2742. + ' data-width="12%"'
  2743. + ' data-before="0"'
  2744. + ' data-after="-CHART_DURATION"'
  2745. + ' data-points="CHART_DURATION"'
  2746. + ' data-colors="' + NETDATA.colors[4] + '"'
  2747. + ' data-decimal-digits="2"'
  2748. + ' role="application"></div>';
  2749. }
  2750. ]
  2751. },
  2752. 'web_log.squid_detailed_response_codes': {
  2753. info: 'Number of responses for each response code individually.'
  2754. },
  2755. 'web_log.squid_clients': {
  2756. info: 'Unique client IPs accessing squid, within each data collection iteration. If data collection is <b>per second</b>, this chart shows <b>unique client IPs per second</b>.'
  2757. },
  2758. 'web_log.squid_clients_all': {
  2759. info: 'Unique client IPs accessing squid since the last restart of netdata. This plugin keeps in memory all the unique IPs that have accessed the server. On very busy squid servers (several millions of unique IPs) you may want to disable this chart (check <a href="https://github.com/netdata/netdata/blob/master/collectors/python.d.plugin/web_log/web_log.conf" target="_blank"><code>/etc/netdata/python.d/web_log.conf</code></a>).'
  2760. },
  2761. 'web_log.squid_transport_methods': {
  2762. info: 'Break down per delivery method: <code>TCP</code> are requests on the HTTP port (usually 3128), ' +
  2763. '<code>UDP</code> are requests on the ICP port (usually 3130), or HTCP port (usually 4128). ' +
  2764. 'If ICP logging was disabled using the log_icp_queries option, no ICP replies will be logged. ' +
  2765. '<code>NONE</code> are used to state that squid delivered an unusual response or no response at all. ' +
  2766. 'Seen with cachemgr requests and errors, usually when the transaction fails before being classified into one of the above outcomes. ' +
  2767. 'Also seen with responses to <code>CONNECT</code> requests.'
  2768. },
  2769. 'web_log.squid_code': {
  2770. info: 'These are combined squid result status codes. A break down per component is given in the following charts. ' +
  2771. 'Check the <a href="http://wiki.squid-cache.org/SquidFaq/SquidLogs">squid documentation about them</a>.'
  2772. },
  2773. 'web_log.squid_handling_opts': {
  2774. info: 'These tags are optional and describe why the particular handling was performed or where the request came from. ' +
  2775. '<code>CLIENT</code> means that the client request placed limits affecting the response. Usually seen with client issued a <b>no-cache</b>, or analogous cache control command along with the request. Thus, the cache has to validate the object.' +
  2776. '<code>IMS</code> states that the client sent a revalidation (conditional) request. ' +
  2777. '<code>ASYNC</code>, is used when the request was generated internally by Squid. Usually this is background fetches for cache information exchanges, background revalidation from stale-while-revalidate cache controls, or ESI sub-objects being loaded. ' +
  2778. '<code>SWAPFAIL</code> is assigned when the object was believed to be in the cache, but could not be accessed. A new copy was requested from the server. ' +
  2779. '<code>REFRESH</code> when a revalidation (conditional) request was sent to the server. ' +
  2780. '<code>SHARED</code> when this request was combined with an existing transaction by collapsed forwarding. NOTE: the existing request is not marked as SHARED. ' +
  2781. '<code>REPLY</code> when particular handling was requested in the HTTP reply from server or peer. Usually seen on DENIED due to http_reply_access ACLs preventing delivery of servers response object to the client.'
  2782. },
  2783. 'web_log.squid_object_types': {
  2784. info: 'These tags are optional and describe what type of object was produced. ' +
  2785. '<code>NEGATIVE</code> is only seen on HIT responses, indicating the response was a cached error response. e.g. <b>404 not found</b>. ' +
  2786. '<code>STALE</code> means the object was cached and served stale. This is usually caused by stale-while-revalidate or stale-if-error cache controls. ' +
  2787. '<code>OFFLINE</code> when the requested object was retrieved from the cache during offline_mode. The offline mode never validates any object. ' +
  2788. '<code>INVALID</code> when an invalid request was received. An error response was delivered indicating what the problem was. ' +
  2789. '<code>FAIL</code> is only seen on <code>REFRESH</code> to indicate the revalidation request failed. The response object may be the server provided network error or the stale object which was being revalidated depending on stale-if-error cache control. ' +
  2790. '<code>MODIFIED</code> is only seen on <code>REFRESH</code> responses to indicate revalidation produced a new modified object. ' +
  2791. '<code>UNMODIFIED</code> is only seen on <code>REFRESH</code> responses to indicate revalidation produced a <b>304</b> (Not Modified) status, which was relayed to the client. ' +
  2792. '<code>REDIRECT</code> when squid generated an HTTP redirect response to this request.'
  2793. },
  2794. 'web_log.squid_cache_events': {
  2795. info: 'These tags are optional and describe whether the response was loaded from cache, network, or otherwise. ' +
  2796. '<code>HIT</code> when the response object delivered was the local cache object. ' +
  2797. '<code>MEM</code> when the response object came from memory cache, avoiding disk accesses. Only seen on HIT responses. ' +
  2798. '<code>MISS</code> when the response object delivered was the network response object. ' +
  2799. '<code>DENIED</code> when the request was denied by access controls. ' +
  2800. '<code>NOFETCH</code> an ICP specific type, indicating service is alive, but not to be used for this request (sent during "-Y" startup, or during frequent failures, a cache in hit only mode will return either UDP_HIT or UDP_MISS_NOFETCH. Neighbours will thus only fetch hits). ' +
  2801. '<code>TUNNEL</code> when a binary tunnel was established for this transaction.'
  2802. },
  2803. 'web_log.squid_transport_errors': {
  2804. info: 'These tags are optional and describe some error conditions which occurred during response delivery (if any). ' +
  2805. '<code>ABORTED</code> when the response was not completed due to the connection being aborted (usually by the client). ' +
  2806. '<code>TIMEOUT</code>, when the response was not completed due to a connection timeout.'
  2807. },
  2808. // ------------------------------------------------------------------------
  2809. // go web_log
  2810. 'web_log.type_requests': {
  2811. info: 'Web server responses by type. <code>success</code> includes <b>1xx</b>, <b>2xx</b>, <b>304</b> and <b>401</b>, <code>error</code> includes <b>5xx</b>, <code>redirect</code> includes <b>3xx</b> except <b>304</b>, <code>bad</code> includes <b>4xx</b> except <b>401</b>, <code>other</code> are all the other responses.',
  2812. mainheads: [
  2813. function (os, id) {
  2814. void (os);
  2815. return '<div data-netdata="' + id + '"'
  2816. + ' data-dimensions="success"'
  2817. + ' data-chart-library="gauge"'
  2818. + ' data-title="Successful"'
  2819. + ' data-units="requests/s"'
  2820. + ' data-gauge-adjust="width"'
  2821. + ' data-width="12%"'
  2822. + ' data-before="0"'
  2823. + ' data-after="-CHART_DURATION"'
  2824. + ' data-points="CHART_DURATION"'
  2825. + ' data-common-max="' + id + '"'
  2826. + ' data-colors="' + NETDATA.colors[0] + '"'
  2827. + ' data-decimal-digits="0"'
  2828. + ' role="application"></div>';
  2829. },
  2830. function (os, id) {
  2831. void (os);
  2832. return '<div data-netdata="' + id + '"'
  2833. + ' data-dimensions="redirect"'
  2834. + ' data-chart-library="gauge"'
  2835. + ' data-title="Redirects"'
  2836. + ' data-units="requests/s"'
  2837. + ' data-gauge-adjust="width"'
  2838. + ' data-width="12%"'
  2839. + ' data-before="0"'
  2840. + ' data-after="-CHART_DURATION"'
  2841. + ' data-points="CHART_DURATION"'
  2842. + ' data-common-max="' + id + '"'
  2843. + ' data-colors="' + NETDATA.colors[2] + '"'
  2844. + ' data-decimal-digits="0"'
  2845. + ' role="application"></div>';
  2846. },
  2847. function (os, id) {
  2848. void (os);
  2849. return '<div data-netdata="' + id + '"'
  2850. + ' data-dimensions="bad"'
  2851. + ' data-chart-library="gauge"'
  2852. + ' data-title="Bad Requests"'
  2853. + ' data-units="requests/s"'
  2854. + ' data-gauge-adjust="width"'
  2855. + ' data-width="12%"'
  2856. + ' data-before="0"'
  2857. + ' data-after="-CHART_DURATION"'
  2858. + ' data-points="CHART_DURATION"'
  2859. + ' data-common-max="' + id + '"'
  2860. + ' data-colors="' + NETDATA.colors[3] + '"'
  2861. + ' data-decimal-digits="0"'
  2862. + ' role="application"></div>';
  2863. },
  2864. function (os, id) {
  2865. void (os);
  2866. return '<div data-netdata="' + id + '"'
  2867. + ' data-dimensions="error"'
  2868. + ' data-chart-library="gauge"'
  2869. + ' data-title="Server Errors"'
  2870. + ' data-units="requests/s"'
  2871. + ' data-gauge-adjust="width"'
  2872. + ' data-width="12%"'
  2873. + ' data-before="0"'
  2874. + ' data-after="-CHART_DURATION"'
  2875. + ' data-points="CHART_DURATION"'
  2876. + ' data-common-max="' + id + '"'
  2877. + ' data-colors="' + NETDATA.colors[1] + '"'
  2878. + ' data-decimal-digits="0"'
  2879. + ' role="application"></div>';
  2880. }
  2881. ]
  2882. },
  2883. 'web_log.request_processing_time': {
  2884. mainheads: [
  2885. function (os, id) {
  2886. void (os);
  2887. return '<div data-netdata="' + id + '"'
  2888. + ' data-dimensions="avg"'
  2889. + ' data-chart-library="gauge"'
  2890. + ' data-title="Average Response Time"'
  2891. + ' data-units="milliseconds"'
  2892. + ' data-gauge-adjust="width"'
  2893. + ' data-width="12%"'
  2894. + ' data-before="0"'
  2895. + ' data-after="-CHART_DURATION"'
  2896. + ' data-points="CHART_DURATION"'
  2897. + ' data-colors="' + NETDATA.colors[4] + '"'
  2898. + ' data-decimal-digits="2"'
  2899. + ' role="application"></div>';
  2900. }
  2901. ]
  2902. },
  2903. // ------------------------------------------------------------------------
  2904. // Fronius Solar Power
  2905. 'fronius.power': {
  2906. info: 'Positive <code>Grid</code> values mean that power is coming from the grid. Negative values are excess power that is going back into the grid, possibly selling it. ' +
  2907. '<code>Photovoltaics</code> is the power generated from the solar panels. ' +
  2908. '<code>Accumulator</code> is the stored power in the accumulator, if one is present.'
  2909. },
  2910. 'fronius.autonomy': {
  2911. commonMin: true,
  2912. commonMax: true,
  2913. valueRange: "[0, 100]",
  2914. info: 'The <code>Autonomy</code> is the percentage of how autonomous the installation is. An autonomy of 100 % means that the installation is producing more energy than it is needed. ' +
  2915. 'The <code>Self consumption</code> indicates the ratio between the current power generated and the current load. When it reaches 100 %, the <code>Autonomy</code> declines, since the solar panels can not produce enough energy and need support from the grid.'
  2916. },
  2917. 'fronius.energy.today': {
  2918. commonMin: true,
  2919. commonMax: true,
  2920. valueRange: "[0, null]"
  2921. },
  2922. // ------------------------------------------------------------------------
  2923. // Stiebel Eltron Heat pump installation
  2924. 'stiebeleltron.system.roomtemp': {
  2925. commonMin: true,
  2926. commonMax: true,
  2927. valueRange: "[0, null]"
  2928. },
  2929. // ------------------------------------------------------------------------
  2930. // Port check
  2931. 'portcheck.latency': {
  2932. info: 'The <code>latency</code> describes the time spent connecting to a TCP port. No data is sent or received. ' +
  2933. 'Currently, the accuracy of the latency is low and should be used as reference only.'
  2934. },
  2935. 'portcheck.status': {
  2936. valueRange: "[0, 1]",
  2937. info: 'The <code>status</code> chart verifies the availability of the service. ' +
  2938. 'Each status dimension will have a value of <code>1</code> if triggered. Dimension <code>success</code> is <code>1</code> only if connection could be established. ' +
  2939. 'This chart is most useful for alarms and third-party apps.'
  2940. },
  2941. // ------------------------------------------------------------------------
  2942. 'chrony.system': {
  2943. info: 'In normal operation, chronyd never steps the system clock, because any jump in the timescale can have adverse consequences for certain application programs. Instead, any error in the system clock is corrected by slightly speeding up or slowing down the system clock until the error has been removed, and then returning to the system clock’s normal speed. A consequence of this is that there will be a period when the system clock (as read by other programs using the <code>gettimeofday()</code> system call, or by the <code>date</code> command in the shell) will be different from chronyd\'s estimate of the current true time (which it reports to NTP clients when it is operating in server mode). The value reported on this line is the difference due to this effect.',
  2944. colors: NETDATA.colors[3]
  2945. },
  2946. 'chrony.offsets': {
  2947. info: '<code>last offset</code> is the estimated local offset on the last clock update. <code>RMS offset</code> is a long-term average of the offset value.',
  2948. height: 0.5
  2949. },
  2950. 'chrony.stratum': {
  2951. info: 'The <code>stratum</code> indicates how many hops away from a computer with an attached reference clock we are. Such a computer is a stratum-1 computer.',
  2952. decimalDigits: 0,
  2953. height: 0.5
  2954. },
  2955. 'chrony.root': {
  2956. info: 'Estimated delays against the root time server this system is synchronized with. <code>delay</code> is the total of the network path delays to the stratum-1 computer from which the computer is ultimately synchronised. <code>dispersion</code> is the total dispersion accumulated through all the computers back to the stratum-1 computer from which the computer is ultimately synchronised. Dispersion is due to system clock resolution, statistical measurement variations etc.'
  2957. },
  2958. 'chrony.frequency': {
  2959. info: 'The <code>frequency</code> is the rate by which the system\'s clock would be would be wrong if chronyd was not correcting it. It is expressed in ppm (parts per million). For example, a value of 1ppm would mean that when the system\'s clock thinks it has advanced 1 second, it has actually advanced by 1.000001 seconds relative to true time.',
  2960. colors: NETDATA.colors[0]
  2961. },
  2962. 'chrony.residualfreq': {
  2963. info: 'This shows the <code>residual frequency</code> for the currently selected reference source. ' +
  2964. 'It reflects any difference between what the measurements from the reference source indicate the ' +
  2965. 'frequency should be and the frequency currently being used. The reason this is not always zero is ' +
  2966. 'that a smoothing procedure is applied to the frequency. Each time a measurement from the reference ' +
  2967. 'source is obtained and a new residual frequency computed, the estimated accuracy of this residual ' +
  2968. 'is compared with the estimated accuracy (see <code>skew</code>) of the existing frequency value. ' +
  2969. 'A weighted average is computed for the new frequency, with weights depending on these accuracies. ' +
  2970. 'If the measurements from the reference source follow a consistent trend, the residual will be ' +
  2971. 'driven to zero over time.',
  2972. height: 0.5,
  2973. colors: NETDATA.colors[3]
  2974. },
  2975. 'chrony.skew': {
  2976. info: 'The estimated error bound on the frequency.',
  2977. height: 0.5,
  2978. colors: NETDATA.colors[5]
  2979. },
  2980. 'couchdb.active_tasks': {
  2981. info: 'Active tasks running on this CouchDB <b>cluster</b>. Four types of tasks currently exist: indexer (view building), replication, database compaction and view compaction.'
  2982. },
  2983. 'couchdb.replicator_jobs': {
  2984. info: 'Detailed breakdown of any replication jobs in progress on this node. For more information, see the <a href="http://docs.couchdb.org/en/latest/replication/replicator.html">replicator documentation</a>.'
  2985. },
  2986. 'couchdb.open_files': {
  2987. info: 'Count of all files held open by CouchDB. If this value seems pegged at 1024 or 4096, your server process is probably hitting the open file handle limit and <a href="http://docs.couchdb.org/en/latest/maintenance/performance.html#pam-and-ulimit">needs to be increased.</a>'
  2988. },
  2989. 'btrfs.disk': {
  2990. info: 'Physical disk usage of BTRFS. The disk space reported here is the raw physical disk space assigned to the BTRFS volume (i.e. <b>before any RAID levels</b>). BTRFS uses a two-stage allocator, first allocating large regions of disk space for one type of block (data, metadata, or system), and then using a regular block allocator inside those regions. <code>unallocated</code> is the physical disk space that is not allocated yet and is available to become data, metadata or system on demand. When <code>unallocated</code> is zero, all available disk space has been allocated to a specific function. Healthy volumes should ideally have at least five percent of their total space <code>unallocated</code>. You can keep your volume healthy by running the <code>btrfs balance</code> command on it regularly (check <code>man btrfs-balance</code> for more info). Note that some of the space listed as <code>unallocated</code> may not actually be usable if the volume uses devices of different sizes.',
  2991. colors: [NETDATA.colors[12]]
  2992. },
  2993. 'btrfs.data': {
  2994. info: 'Logical disk usage for BTRFS data. Data chunks are used to store the actual file data (file contents). The disk space reported here is the usable allocation (i.e. after any striping or replication). Healthy volumes should ideally have no more than a few GB of free space reported here persistently. Running <code>btrfs balance</code> can help here.'
  2995. },
  2996. 'btrfs.metadata': {
  2997. info: 'Logical disk usage for BTRFS metadata. Metadata chunks store most of the filesystem internal structures, as well as information like directory structure and file names. The disk space reported here is the usable allocation (i.e. after any striping or replication). Healthy volumes should ideally have no more than a few GB of free space reported here persistently. Running <code>btrfs balance</code> can help here.'
  2998. },
  2999. 'btrfs.system': {
  3000. info: 'Logical disk usage for BTRFS system. System chunks store information about the allocation of other chunks. The disk space reported here is the usable allocation (i.e. after any striping or replication). The values reported here should be relatively small compared to Data and Metadata, and will scale with the volume size and overall space usage.'
  3001. },
  3002. // ------------------------------------------------------------------------
  3003. // RabbitMQ
  3004. // info: the text above the charts
  3005. // heads: the representation of the chart at the top the subsection (second level menu)
  3006. // mainheads: the representation of the chart at the top of the section (first level menu)
  3007. // colors: the dimension colors of the chart (the default colors are appended)
  3008. // height: the ratio of the chart height relative to the default
  3009. 'rabbitmq.queued_messages': {
  3010. info: 'Overall total of ready and unacknowledged queued messages. Messages that are delivered immediately are not counted here.'
  3011. },
  3012. 'rabbitmq.message_rates': {
  3013. info: 'Overall messaging rates including acknowledgements, deliveries, redeliveries, and publishes.'
  3014. },
  3015. 'rabbitmq.global_counts': {
  3016. info: 'Overall totals for channels, consumers, connections, queues and exchanges.'
  3017. },
  3018. 'rabbitmq.file_descriptors': {
  3019. info: 'Total number of used filed descriptors. See <code><a href="https://www.rabbitmq.com/production-checklist.html#resource-limits-file-handle-limit" target="_blank">Open File Limits</a></code> for further details.',
  3020. colors: NETDATA.colors[3]
  3021. },
  3022. 'rabbitmq.sockets': {
  3023. info: 'Total number of used socket descriptors. Each used socket also counts as a used file descriptor. See <code><a href="https://www.rabbitmq.com/production-checklist.html#resource-limits-file-handle-limit" target="_blank">Open File Limits</a></code> for further details.',
  3024. colors: NETDATA.colors[3]
  3025. },
  3026. 'rabbitmq.processes': {
  3027. info: 'Total number of processes running within the Erlang VM. This is not the same as the number of processes running on the host.',
  3028. colors: NETDATA.colors[3]
  3029. },
  3030. 'rabbitmq.erlang_run_queue': {
  3031. info: 'Number of Erlang processes the Erlang schedulers have queued to run.',
  3032. colors: NETDATA.colors[3]
  3033. },
  3034. 'rabbitmq.memory': {
  3035. info: 'Total amount of memory used by the RabbitMQ. This is a complex statistic that can be further analyzed in the management UI. See <code><a href="https://www.rabbitmq.com/production-checklist.html#resource-limits-ram" target="_blank">Memory</a></code> for further details.',
  3036. colors: NETDATA.colors[3]
  3037. },
  3038. 'rabbitmq.disk_space': {
  3039. info: 'Total amount of disk space consumed by the message store(s). See <code><a href="https://www.rabbitmq.com/production-checklist.html#resource-limits-disk-space" target=_"blank">Disk Space Limits</a></code> for further details.',
  3040. colors: NETDATA.colors[3]
  3041. },
  3042. 'rabbitmq.queue_messages': {
  3043. info: 'Total amount of messages and their states in this queue.',
  3044. colors: NETDATA.colors[3]
  3045. },
  3046. 'rabbitmq.queue_messages_stats': {
  3047. info: 'Overall messaging rates including acknowledgements, deliveries, redeliveries, and publishes.',
  3048. colors: NETDATA.colors[3]
  3049. },
  3050. // ------------------------------------------------------------------------
  3051. // ntpd
  3052. 'ntpd.sys_offset': {
  3053. info: 'For hosts without any time critical services an offset of &lt; 100 ms should be acceptable even with high network latencies. For hosts with time critical services an offset of about 0.01 ms or less can be achieved by using peers with low delays and configuring optimal <b>poll exponent</b> values.',
  3054. colors: NETDATA.colors[4]
  3055. },
  3056. 'ntpd.sys_jitter': {
  3057. info: 'The jitter statistics are exponentially-weighted RMS averages. The system jitter is defined in the NTPv4 specification; the clock jitter statistic is computed by the clock discipline module.'
  3058. },
  3059. 'ntpd.sys_frequency': {
  3060. info: 'The frequency offset is shown in ppm (parts per million) relative to the frequency of the system. The frequency correction needed for the clock can vary significantly between boots and also due to external influences like temperature or radiation.',
  3061. colors: NETDATA.colors[2],
  3062. height: 0.6
  3063. },
  3064. 'ntpd.sys_wander': {
  3065. info: 'The wander statistics are exponentially-weighted RMS averages.',
  3066. colors: NETDATA.colors[3],
  3067. height: 0.6
  3068. },
  3069. 'ntpd.sys_rootdelay': {
  3070. info: 'The rootdelay is the round-trip delay to the primary reference clock, similar to the delay shown by the <code>ping</code> command. A lower delay should result in a lower clock offset.',
  3071. colors: NETDATA.colors[1]
  3072. },
  3073. 'ntpd.sys_stratum': {
  3074. info: 'The distance in "hops" to the primary reference clock',
  3075. colors: NETDATA.colors[5],
  3076. height: 0.3
  3077. },
  3078. 'ntpd.sys_tc': {
  3079. info: 'Time constants and poll intervals are expressed as exponents of 2. The default poll exponent of 6 corresponds to a poll interval of 64 s. For typical Internet paths, the optimum poll interval is about 64 s. For fast LANs with modern computers, a poll exponent of 4 (16 s) is appropriate. The <a href="http://doc.ntp.org/current-stable/poll.html">poll process</a> sends NTP packets at intervals determined by the clock discipline algorithm.',
  3080. height: 0.5
  3081. },
  3082. 'ntpd.sys_precision': {
  3083. colors: NETDATA.colors[6],
  3084. height: 0.2
  3085. },
  3086. 'ntpd.peer_offset': {
  3087. info: 'The offset of the peer clock relative to the system clock in milliseconds. Smaller values here weight peers more heavily for selection after the initial synchronization of the local clock. For a system providing time service to other systems, these should be as low as possible.'
  3088. },
  3089. 'ntpd.peer_delay': {
  3090. info: 'The round-trip time (RTT) for communication with the peer, similar to the delay shown by the <code>ping</code> command. Not as critical as either the offset or jitter, but still factored into the selection algorithm (because as a general rule, lower delay means more accurate time). In most cases, it should be below 100ms.'
  3091. },
  3092. 'ntpd.peer_dispersion': {
  3093. info: 'This is a measure of the estimated error between the peer and the local system. Lower values here are better.'
  3094. },
  3095. 'ntpd.peer_jitter': {
  3096. info: 'This is essentially a remote estimate of the peer\'s <code>system_jitter</code> value. Lower values here weight highly in favor of peer selection, and this is a good indicator of overall quality of a given time server (good servers will have values not exceeding single digit milliseconds here, with high quality stratum one servers regularly having sub-millisecond jitter).'
  3097. },
  3098. 'ntpd.peer_xleave': {
  3099. info: 'This variable is used in interleaved mode (used only in NTP symmetric and broadcast modes). See <a href="http://doc.ntp.org/current-stable/xleave.html">NTP Interleaved Modes</a>.'
  3100. },
  3101. 'ntpd.peer_rootdelay': {
  3102. info: 'For a stratum 1 server, this is the access latency for the reference clock. For lower stratum servers, it is the sum of the <code>peer_delay</code> and <code>peer_rootdelay</code> for the system they are syncing off of. Similarly to <code>peer_delay</code>, lower values here are technically better, but have limited influence in peer selection.'
  3103. },
  3104. 'ntpd.peer_rootdisp': {
  3105. info: 'Is the same as <code>peer_rootdelay</code>, but measures accumulated <code>peer_dispersion</code> instead of accumulated <code>peer_delay</code>.'
  3106. },
  3107. 'ntpd.peer_hmode': {
  3108. info: 'The <code>peer_hmode</code> and <code>peer_pmode</code> variables give info about what mode the packets being sent to and received from a given peer are. Mode 1 is symmetric active (both the local system and the remote peer have each other declared as peers in <code>/etc/ntp.conf</code>), Mode 2 is symmetric passive (only one side has the other declared as a peer), Mode 3 is client, Mode 4 is server, and Mode 5 is broadcast (also used for multicast and manycast operation).',
  3109. height: 0.2
  3110. },
  3111. 'ntpd.peer_pmode': {
  3112. height: 0.2
  3113. },
  3114. 'ntpd.peer_hpoll': {
  3115. info: 'The <code>peer_hpoll</code> and <code>peer_ppoll</code> variables are log2 representations of the polling interval in seconds.',
  3116. height: 0.5
  3117. },
  3118. 'ntpd.peer_ppoll': {
  3119. height: 0.5
  3120. },
  3121. 'ntpd.peer_precision': {
  3122. height: 0.2
  3123. },
  3124. 'spigotmc.tps': {
  3125. info: 'The running 1, 5, and 15 minute average number of server ticks per second. An idealized server will show 20.0 for all values, but in practice this almost never happens. Typical servers should show approximately 19.98-20.0 here. Lower values indicate progressively more server-side lag (and thus that you need better hardware for your server or a lower user limit). For every 0.05 ticks below 20, redstone clocks will lag behind by approximately 0.25%. Values below approximately 19.50 may interfere with complex free-running redstone circuits and will noticeably slow down growth.'
  3126. },
  3127. 'spigotmc.users': {
  3128. info: 'The number of currently connect users on the monitored Spigot server.'
  3129. },
  3130. 'boinc.tasks': {
  3131. info: 'The total number of tasks and the number of active tasks. Active tasks are those which are either currently being processed, or are partially processed but suspended.'
  3132. },
  3133. 'boinc.states': {
  3134. info: 'Counts of tasks in each task state. The normal sequence of states is <code>New</code>, <code>Downloading</code>, <code>Ready to Run</code>, <code>Uploading</code>, <code>Uploaded</code>. Tasks which are marked <code>Ready to Run</code> may be actively running, or may be waiting to be scheduled. <code>Compute Errors</code> are tasks which failed for some reason during execution. <code>Aborted</code> tasks were manually cancelled, and will not be processed. <code>Failed Uploads</code> are otherwise finished tasks which failed to upload to the server, and usually indicate networking issues.'
  3135. },
  3136. 'boinc.sched': {
  3137. info: 'Counts of active tasks in each scheduling state. <code>Scheduled</code> tasks are the ones which will run if the system is permitted to process tasks. <code>Preempted</code> tasks are on standby, and will run if a <code>Scheduled</code> task stops running for some reason. <code>Uninitialized</code> tasks should never be present, and indicate tha the scheduler has not tried to schedule them yet.'
  3138. },
  3139. 'boinc.process': {
  3140. info: 'Counts of active tasks in each process state. <code>Executing</code> tasks are running right now. <code>Suspended</code> tasks have an associated process, but are not currently running (either because the system isn\'t processing any tasks right now, or because they have been preempted by higher priority tasks). <code>Quit</code> tasks are exiting gracefully. <code>Aborted</code> tasks exceeded some resource limit, and are being shut down. <code>Copy Pending</code> tasks are waiting on a background file transfer to finish. <code>Uninitialized</code> tasks do not have an associated process yet.'
  3141. },
  3142. 'w1sensor.temp': {
  3143. info: 'Temperature derived from 1-Wire temperature sensors.'
  3144. },
  3145. 'logind.sessions': {
  3146. info: 'Shows the number of active sessions of each type tracked by logind.'
  3147. },
  3148. 'logind.users': {
  3149. info: 'Shows the number of active users of each type tracked by logind.'
  3150. },
  3151. 'logind.seats': {
  3152. info: 'Shows the number of active seats tracked by logind. Each seat corresponds to a combination of a display device and input device providing a physical presence for the system.'
  3153. },
  3154. // ------------------------------------------------------------------------
  3155. // ProxySQL
  3156. 'proxysql.pool_status': {
  3157. info: 'The status of the backend servers. ' +
  3158. '<code>1=ONLINE</code> backend server is fully operational, ' +
  3159. '<code>2=SHUNNED</code> backend sever is temporarily taken out of use because of either too many connection errors in a time that was too short, or replication lag exceeded the allowed threshold, ' +
  3160. '<code>3=OFFLINE_SOFT</code> when a server is put into OFFLINE_SOFT mode, new incoming connections aren\'t accepted anymore, while the existing connections are kept until they became inactive. In other words, connections are kept in use until the current transaction is completed. This allows to gracefully detach a backend, ' +
  3161. '<code>4=OFFLINE_HARD</code> when a server is put into OFFLINE_HARD mode, the existing connections are dropped, while new incoming connections aren\'t accepted either. This is equivalent to deleting the server from a hostgroup, or temporarily taking it out of the hostgroup for maintenance work, ' +
  3162. '<code>-1</code> Unknown status.'
  3163. },
  3164. 'proxysql.pool_net': {
  3165. info: 'The amount of data sent to/received from the backend ' +
  3166. '(This does not include metadata (packets\' headers, OK/ERR packets, fields\' description, etc).'
  3167. },
  3168. 'proxysql.pool_overall_net': {
  3169. info: 'The amount of data sent to/received from the all backends ' +
  3170. '(This does not include metadata (packets\' headers, OK/ERR packets, fields\' description, etc).'
  3171. },
  3172. 'proxysql.questions': {
  3173. info: '<code>questions</code> total number of queries sent from frontends, ' +
  3174. '<code>slow_queries</code> number of queries that ran for longer than the threshold in milliseconds defined in global variable <code>mysql-long_query_time</code>. '
  3175. },
  3176. 'proxysql.connections': {
  3177. info: '<code>aborted</code> number of frontend connections aborted due to invalid credential or max_connections reached, ' +
  3178. '<code>connected</code> number of frontend connections currently connected, ' +
  3179. '<code>created</code> number of frontend connections created, ' +
  3180. '<code>non_idle</code> number of frontend connections that are not currently idle. '
  3181. },
  3182. 'proxysql.pool_latency': {
  3183. info: 'The currently ping time in microseconds, as reported from Monitor.'
  3184. },
  3185. 'proxysql.queries': {
  3186. info: 'The number of queries routed towards this particular backend server.'
  3187. },
  3188. 'proxysql.pool_used_connections': {
  3189. info: 'The number of connections are currently used by ProxySQL for sending queries to the backend server.'
  3190. },
  3191. 'proxysql.pool_free_connections': {
  3192. info: 'The number of connections are currently free. They are kept open in order to minimize the time cost of sending a query to the backend server.'
  3193. },
  3194. 'proxysql.pool_ok_connections': {
  3195. info: 'The number of connections were established successfully.'
  3196. },
  3197. 'proxysql.pool_error_connections': {
  3198. info: 'The number of connections weren\'t established successfully.'
  3199. },
  3200. 'proxysql.commands_count': {
  3201. info: 'The total number of commands of that type executed'
  3202. },
  3203. 'proxysql.commands_duration': {
  3204. info: 'The total time spent executing commands of that type, in ms'
  3205. },
  3206. // ------------------------------------------------------------------------
  3207. // Power Supplies
  3208. 'powersupply.capacity': {
  3209. info: undefined
  3210. },
  3211. 'powersupply.charge': {
  3212. info: undefined
  3213. },
  3214. 'powersupply.energy': {
  3215. info: undefined
  3216. },
  3217. 'powersupply.voltage': {
  3218. info: undefined
  3219. },
  3220. // ------------------------------------------------------------------------
  3221. // VMware vSphere
  3222. // Host specific
  3223. 'vsphere.host_mem_usage_percentage': {
  3224. info: 'Percentage of used machine memory: <code>consumed</code> / <code>machine-memory-size</code>.'
  3225. },
  3226. 'vsphere.host_mem_usage': {
  3227. info:
  3228. '<code>granted</code> is amount of machine memory that is mapped for a host, ' +
  3229. 'it equals sum of all granted metrics for all powered-on virtual machines, plus machine memory for vSphere services on the host. ' +
  3230. '<code>consumed</code> is amount of machine memory used on the host, it includes memory used by the Service Console, the VMkernel, vSphere services, plus the total consumed metrics for all running virtual machines. ' +
  3231. '<code>consumed</code> = <code>total host memory</code> - <code>free host memory</code>.' +
  3232. '<code>active</code> is sum of all active metrics for all powered-on virtual machines plus vSphere services (such as COS, vpxa) on the host.' +
  3233. '<code>shared</code> is sum of all shared metrics for all powered-on virtual machines, plus amount for vSphere services on the host. ' +
  3234. '<code>sharedcommon</code> is amount of machine memory that is shared by all powered-on virtual machines and vSphere services on the host. ' +
  3235. '<code>shared</code> - <code>sharedcommon</code> = machine memory (host memory) savings (KB). ' +
  3236. 'For details see <a href="https://docs.vmware.com/en/VMware-vSphere/6.5/com.vmware.vsphere.resmgmt.doc/GUID-BFDC988B-F53D-4E97-9793-A002445AFAE1.html">Measuring and Differentiating Types of Memory Usage</a> and ' +
  3237. '<a href="https://www.vmware.com/support/developer/converter-sdk/conv51_apireference/memory_counters.html">Memory Counters</a> articles.'
  3238. },
  3239. 'vsphere.host_mem_swap_rate': {
  3240. info:
  3241. 'This statistic refers to VMkernel swapping and not to guest OS swapping. ' +
  3242. '<code>in</code> is sum of <code>swapinRate</code> values for all powered-on virtual machines on the host.' +
  3243. '<code>swapinRate</code> is rate at which VMKernel reads data into machine memory from the swap file. ' +
  3244. '<code>out</code> is sum of <code>swapoutRate</code> values for all powered-on virtual machines on the host.' +
  3245. '<code>swapoutRate</code> is rate at which VMkernel writes to the virtual machine’s swap file from machine memory.'
  3246. },
  3247. // VM specific
  3248. 'vsphere.vm_mem_usage_percentage': {
  3249. info: 'Percentage of used virtual machine “physical” memory: <code>active</code> / <code>virtual machine configured size</code>.'
  3250. },
  3251. 'vsphere.vm_mem_usage': {
  3252. info:
  3253. '<code>granted</code> is amount of guest “physical” memory that is mapped to machine memory, it includes <code>shared</code> memory amount. ' +
  3254. '<code>consumed</code> is amount of guest “physical” memory consumed by the virtual machine for guest memory, ' +
  3255. '<code>consumed</code> = <code>granted</code> - <code>memory saved due to memory sharing</code>. ' +
  3256. '<code>active</code> is amount of memory that is actively used, as estimated by VMkernel based on recently touched memory pages. ' +
  3257. '<code>shared</code> is amount of guest “physical” memory shared with other virtual machines (through the VMkernel’s transparent page-sharing mechanism, a RAM de-duplication technique). ' +
  3258. 'For details see <a href="https://docs.vmware.com/en/VMware-vSphere/6.5/com.vmware.vsphere.resmgmt.doc/GUID-BFDC988B-F53D-4E97-9793-A002445AFAE1.html">Measuring and Differentiating Types of Memory Usage</a> and ' +
  3259. '<a href="https://www.vmware.com/support/developer/converter-sdk/conv51_apireference/memory_counters.html">Memory Counters</a> articles.'
  3260. },
  3261. 'vsphere.vm_mem_swap_rate': {
  3262. info:
  3263. 'This statistic refers to VMkernel swapping and not to guest OS swapping. ' +
  3264. '<code>in</code> is rate at which VMKernel reads data into machine memory from the swap file. ' +
  3265. '<code>out</code> is rate at which VMkernel writes to the virtual machine’s swap file from machine memory.'
  3266. },
  3267. 'vsphere.vm_mem_swap': {
  3268. info:
  3269. 'This statistic refers to VMkernel swapping and not to guest OS swapping. ' +
  3270. '<code>swapped</code> is amount of guest physical memory swapped out to the virtual machine\'s swap file by the VMkernel. ' +
  3271. 'Swapped memory stays on disk until the virtual machine needs it.'
  3272. },
  3273. // Common
  3274. 'vsphere.cpu_usage_total': {
  3275. info: 'Summary CPU usage statistics across all CPUs/cores.'
  3276. },
  3277. 'vsphere.net_bandwidth_total': {
  3278. info: 'Summary receive/transmit statistics across all network interfaces.'
  3279. },
  3280. 'vsphere.net_packets_total': {
  3281. info: 'Summary receive/transmit statistics across all network interfaces.'
  3282. },
  3283. 'vsphere.net_errors_total': {
  3284. info: 'Summary receive/transmit statistics across all network interfaces.'
  3285. },
  3286. 'vsphere.net_drops_total': {
  3287. info: 'Summary receive/transmit statistics across all network interfaces.'
  3288. },
  3289. 'vsphere.disk_usage_total': {
  3290. info: 'Summary read/write statistics across all disks.'
  3291. },
  3292. 'vsphere.disk_max_latency': {
  3293. info: '<code>latency</code> is highest latency value across all disks.'
  3294. },
  3295. 'vsphere.overall_status': {
  3296. info: '<code>0</code> is unknown, <code>1</code> is OK, <code>2</code> is might have a problem, <code>3</code> is definitely has a problem.'
  3297. },
  3298. // ------------------------------------------------------------------------
  3299. // VCSA
  3300. 'vcsa.system_health': {
  3301. info:
  3302. '<code>-1</code>: unknown; ' +
  3303. '<code>0</code>: all components are healthy; ' +
  3304. '<code>1</code>: one or more components might become overloaded soon; ' +
  3305. '<code>2</code>: one or more components in the appliance might be degraded; ' +
  3306. '<code>3</code>: one or more components might be in an unusable status and the appliance might become unresponsive soon; ' +
  3307. '<code>4</code>: no health data is available.'
  3308. },
  3309. 'vcsa.components_health': {
  3310. info:
  3311. '<code>-1</code>: unknown; ' +
  3312. '<code>0</code>: healthy; ' +
  3313. '<code>1</code>: healthy, but may have some problems; ' +
  3314. '<code>2</code>: degraded, and may have serious problems; ' +
  3315. '<code>3</code>: unavailable, or will stop functioning soon; ' +
  3316. '<code>4</code>: no health data is available.'
  3317. },
  3318. 'vcsa.software_updates_health': {
  3319. info:
  3320. '<code>softwarepackages</code> represents information on available software updates available in the remote vSphere Update Manager repository.<br>' +
  3321. '<code>-1</code>: unknown; ' +
  3322. '<code>0</code>: no updates available; ' +
  3323. '<code>2</code>: non-security updates are available; ' +
  3324. '<code>3</code>: security updates are available; ' +
  3325. '<code>4</code>: an error retrieving information on software updates.'
  3326. },
  3327. // ------------------------------------------------------------------------
  3328. // Zookeeper
  3329. 'zookeeper.server_state': {
  3330. info:
  3331. '<code>0</code>: unknown, ' +
  3332. '<code>1</code>: leader, ' +
  3333. '<code>2</code>: follower, ' +
  3334. '<code>3</code>: observer, ' +
  3335. '<code>4</code>: standalone.'
  3336. },
  3337. // ------------------------------------------------------------------------
  3338. // Squidlog
  3339. 'squidlog.requests': {
  3340. info: 'Total number of requests (log lines read). It includes <code>unmatched</code>.'
  3341. },
  3342. 'squidlog.excluded_requests': {
  3343. info: '<code>unmatched</code> counts the lines in the log file that are not matched by the plugin parser (<a href="https://github.com/netdata/netdata/issues/new?title=squidlog%20reports%20unmatched%20lines&body=squidlog%20plugin%20reports%20unmatched%20lines.%0A%0AThis%20is%20my%20log:%0A%0A%60%60%60txt%0A%0Aplease%20paste%20your%20squid%20server%20log%20here%0A%0A%60%60%60" target="_blank">let us know</a> if you have any unmatched).'
  3344. },
  3345. 'squidlog.type_requests': {
  3346. info: 'Requests by response type:<br>' +
  3347. '<ul>' +
  3348. ' <li><code>success</code> includes 1xx, 2xx, 0, 304, 401.</li>' +
  3349. ' <li><code>error</code> includes 5xx and 6xx.</li>' +
  3350. ' <li><code>redirect</code> includes 3xx except 304.</li>' +
  3351. ' <li><code>bad</code> includes 4xx except 401.</li>' +
  3352. ' </ul>'
  3353. },
  3354. 'squidlog.http_status_code_class_responses': {
  3355. info: 'The HTTP response status code classes. According to <a href="https://tools.ietf.org/html/rfc7231" target="_blank">rfc7231</a>:<br>' +
  3356. ' <li><code>1xx</code> is informational responses.</li>' +
  3357. ' <li><code>2xx</code> is successful responses.</li>' +
  3358. ' <li><code>3xx</code> is redirects.</li>' +
  3359. ' <li><code>4xx</code> is bad requests.</li>' +
  3360. ' <li><code>5xx</code> is internal server errors.</li>' +
  3361. ' </ul>' +
  3362. 'Squid also uses <code>0</code> for a result code being unavailable, and <code>6xx</code> to signal an invalid header, a proxy error.'
  3363. },
  3364. 'squidlog.http_status_code_responses': {
  3365. info: 'Number of responses for each http response status code individually.'
  3366. },
  3367. 'squidlog.uniq_clients': {
  3368. info: 'Unique clients (requesting instances), within each data collection iteration. If data collection is <b>per second</b>, this chart shows <b>unique clients per second</b>.'
  3369. },
  3370. 'squidlog.bandwidth': {
  3371. info: 'The size is the amount of data delivered to the clients. Mind that this does not constitute the net object size, as headers are also counted. ' +
  3372. 'Also, failed requests may deliver an error page, the size of which is also logged here.'
  3373. },
  3374. 'squidlog.response_time': {
  3375. info: 'The elapsed time considers how many milliseconds the transaction busied the cache. It differs in interpretation between TCP and UDP:' +
  3376. '<ul>' +
  3377. ' <li><code>TCP</code> this is basically the time from having received the request to when Squid finishes sending the last byte of the response.</li>' +
  3378. ' <li><code>UDP</code> this is the time between scheduling a reply and actually sending it.</li>' +
  3379. ' </ul>' +
  3380. 'Please note that <b>the entries are logged after the reply finished being sent</b>, not during the lifetime of the transaction.'
  3381. },
  3382. 'squidlog.cache_result_code_requests': {
  3383. info: 'The Squid result code is composed of several tags (separated by underscore characters) which describe the response sent to the client. ' +
  3384. 'Check the <a href="https://wiki.squid-cache.org/SquidFaq/SquidLogs#Squid_result_codes">squid documentation</a> about them.'
  3385. },
  3386. 'squidlog.cache_result_code_transport_tag_requests': {
  3387. info: 'These tags are always present and describe delivery method.<br>' +
  3388. '<ul>' +
  3389. ' <li><code>TCP</code> requests on the HTTP port (usually 3128).</li>' +
  3390. ' <li><code>UDP</code> requests on the ICP port (usually 3130) or HTCP port (usually 4128).</li>' +
  3391. ' <li><code>NONE</code> Squid delivered an unusual response or no response at all. Seen with cachemgr requests and errors, usually when the transaction fails before being classified into one of the above outcomes. Also seen with responses to CONNECT requests.</li>' +
  3392. ' </ul>'
  3393. },
  3394. 'squidlog.cache_result_code_handling_tag_requests': {
  3395. info: 'These tags are optional and describe why the particular handling was performed or where the request came from.<br>' +
  3396. '<ul>' +
  3397. ' <li><code>CF</code> at least one request in this transaction was collapsed. See <a href="http://www.squid-cache.org/Doc/config/collapsed_forwarding/" target="_blank">collapsed_forwarding</a> for more details about request collapsing.</li>' +
  3398. ' <li><code>CLIENT</code> usually seen with client issued a "no-cache", or analogous cache control command along with the request. Thus, the cache has to validate the object.</li>' +
  3399. ' <li><code>IMS</code> the client sent a revalidation (conditional) request.</li>' +
  3400. ' <li><code>ASYNC</code> the request was generated internally by Squid. Usually this is background fetches for cache information exchanges, background revalidation from <i>stale-while-revalidate</i> cache controls, or ESI sub-objects being loaded.</li>' +
  3401. ' <li><code>SWAPFAIL</code> the object was believed to be in the cache, but could not be accessed. A new copy was requested from the server.</li>' +
  3402. ' <li><code>REFRESH</code> a revalidation (conditional) request was sent to the server.</li>' +
  3403. ' <li><code>SHARED</code> this request was combined with an existing transaction by collapsed forwarding.</li>' +
  3404. ' <li><code>REPLY</code> the HTTP reply from server or peer. Usually seen on <code>DENIED</code> due to <a href="http://www.squid-cache.org/Doc/config/http_reply_access/" target="_blank">http_reply_access</a> ACLs preventing delivery of servers response object to the client.</li>' +
  3405. ' </ul>'
  3406. },
  3407. 'squidlog.cache_code_object_tag_requests': {
  3408. info: 'These tags are optional and describe what type of object was produced.<br>' +
  3409. '<ul>' +
  3410. ' <li><code>NEGATIVE</code> only seen on HIT responses, indicating the response was a cached error response. e.g. <b>404 not found</b>.</li>' +
  3411. ' <li><code>STALE</code> the object was cached and served stale. This is usually caused by <i>stale-while-revalidate</i> or <i>stale-if-error</i> cache controls.</li>' +
  3412. ' <li><code>OFFLINE</code> the requested object was retrieved from the cache during <a href="http://www.squid-cache.org/Doc/config/offline_mode/" target="_blank">offline_mode</a>. The offline mode never validates any object.</li>' +
  3413. ' <li><code>INVALID</code> an invalid request was received. An error response was delivered indicating what the problem was.</li>' +
  3414. ' <li><code>FAILED</code> only seen on <code>REFRESH</code> to indicate the revalidation request failed. The response object may be the server provided network error or the stale object which was being revalidated depending on stale-if-error cache control.</li>' +
  3415. ' <li><code>MODIFIED</code> only seen on <code>REFRESH</code> responses to indicate revalidation produced a new modified object.</li>' +
  3416. ' <li><code>UNMODIFIED</code> only seen on <code>REFRESH</code> responses to indicate revalidation produced a 304 (Not Modified) status. The client gets either a full 200 (OK), a 304 (Not Modified), or (in theory) another response, depending on the client request and other details.</li>' +
  3417. ' <li><code>REDIRECT</code> Squid generated an HTTP redirect response to this request.</li>' +
  3418. ' </ul>'
  3419. },
  3420. 'squidlog.cache_code_load_source_tag_requests': {
  3421. info: 'These tags are optional and describe whether the response was loaded from cache, network, or otherwise.<br>' +
  3422. '<ul>' +
  3423. ' <li><code>HIT</code> the response object delivered was the local cache object.</li>' +
  3424. ' <li><code>MEM</code> the response object came from memory cache, avoiding disk accesses. Only seen on HIT responses.</li>' +
  3425. ' <li><code>MISS</code> the response object delivered was the network response object.</li>' +
  3426. ' <li><code>DENIED</code> the request was denied by access controls.</li>' +
  3427. ' <li><code>NOFETCH</code> an ICP specific type, indicating service is alive, but not to be used for this request.</li>' +
  3428. ' <li><code>TUNNEL</code> a binary tunnel was established for this transaction.</li>' +
  3429. ' </ul>'
  3430. },
  3431. 'squidlog.cache_code_error_tag_requests': {
  3432. info: 'These tags are optional and describe some error conditions which occurred during response delivery.<br>' +
  3433. '<ul>' +
  3434. ' <li><code>ABORTED</code> the response was not completed due to the connection being aborted (usually by the client).</li>' +
  3435. ' <li><code>TIMEOUT</code> the response was not completed due to a connection timeout.</li>' +
  3436. ' <li><code>IGNORED</code> while refreshing a previously cached response A, Squid got a response B that was older than A (as determined by the Date header field). Squid ignored response B (and attempted to use A instead).</li>' +
  3437. ' </ul>'
  3438. },
  3439. 'squidlog.http_method_requests': {
  3440. info: 'The request method to obtain an object. Please refer to section <a href="https://wiki.squid-cache.org/SquidFaq/SquidLogs#Request_methods">request-methods</a> for available methods and their description.'
  3441. },
  3442. 'squidlog.hier_code_requests': {
  3443. info: 'A code that explains how the request was handled, e.g. by forwarding it to a peer, or going straight to the source. ' +
  3444. 'Any hierarchy tag may be prefixed with <code>TIMEOUT_</code>, if the timeout occurs waiting for all ICP replies to return from the neighbours. The timeout is either dynamic, if the <a href="http://www.squid-cache.org/Doc/config/icp_query_timeout/" target="_blank">icp_query_timeout</a> was not set, or the time configured there has run up. ' +
  3445. 'Refer to <a href="https://wiki.squid-cache.org/SquidFaq/SquidLogs#Hierarchy_Codes" target="_blank">Hierarchy Codes</a> for details on hierarchy codes.'
  3446. },
  3447. 'squidlog.server_address_forwarded_requests': {
  3448. info: 'The IP address or hostname where the request (if a miss) was forwarded. For requests sent to origin servers, this is the origin server\'s IP address. ' +
  3449. 'For requests sent to a neighbor cache, this is the neighbor\'s hostname. NOTE: older versions of Squid would put the origin server hostname here.'
  3450. },
  3451. 'squidlog.mime_type_requests': {
  3452. info: 'The content type of the object as seen in the HTTP reply header. Please note that ICP exchanges usually don\'t have any content type.'
  3453. },
  3454. // ------------------------------------------------------------------------
  3455. // CockroachDB
  3456. 'cockroachdb.process_cpu_time_combined_percentage': {
  3457. info: 'Current combined cpu utilization, calculated as <code>(user+system)/num of logical cpus</code>.'
  3458. },
  3459. 'cockroachdb.host_disk_bandwidth': {
  3460. info: 'Summary disk bandwidth statistics across all system host disks.'
  3461. },
  3462. 'cockroachdb.host_disk_operations': {
  3463. info: 'Summary disk operations statistics across all system host disks.'
  3464. },
  3465. 'cockroachdb.host_disk_iops_in_progress': {
  3466. info: 'Summary disk iops in progress statistics across all system host disks.'
  3467. },
  3468. 'cockroachdb.host_network_bandwidth': {
  3469. info: 'Summary network bandwidth statistics across all system host network interfaces.'
  3470. },
  3471. 'cockroachdb.host_network_packets': {
  3472. info: 'Summary network packets statistics across all system host network interfaces.'
  3473. },
  3474. 'cockroachdb.live_nodes': {
  3475. info: 'Will be <code>0</code> if this node is not itself live.'
  3476. },
  3477. 'cockroachdb.total_storage_capacity': {
  3478. info: 'Entire disk capacity. It includes non-CR data, CR data, and empty space.'
  3479. },
  3480. 'cockroachdb.storage_capacity_usability': {
  3481. info: '<code>usable</code> is sum of empty space and CR data, <code>unusable</code> is space used by non-CR data.'
  3482. },
  3483. 'cockroachdb.storage_usable_capacity': {
  3484. info: 'Breakdown of <code>usable</code> space.'
  3485. },
  3486. 'cockroachdb.storage_used_capacity_percentage': {
  3487. info: '<code>total</code> is % of <b>total</b> space used, <code>usable</code> is % of <b>usable</b> space used.'
  3488. },
  3489. 'cockroachdb.sql_bandwidth': {
  3490. info: 'The total amount of SQL client network traffic.'
  3491. },
  3492. 'cockroachdb.sql_errors': {
  3493. info: '<code>statement</code> is statements resulting in a planning or runtime error, ' +
  3494. '<code>transaction</code> is SQL transactions abort errors.'
  3495. },
  3496. 'cockroachdb.sql_started_ddl_statements': {
  3497. info: 'The amount of <b>started</b> DDL (Data Definition Language) statements. ' +
  3498. 'This type means database schema changes. ' +
  3499. 'It includes <code>CREATE</code>, <code>ALTER</code>, <code>DROP</code>, <code>RENAME</code>, <code>TRUNCATE</code> and <code>COMMENT</code> statements.'
  3500. },
  3501. 'cockroachdb.sql_executed_ddl_statements': {
  3502. info: 'The amount of <b>executed</b> DDL (Data Definition Language) statements. ' +
  3503. 'This type means database schema changes. ' +
  3504. 'It includes <code>CREATE</code>, <code>ALTER</code>, <code>DROP</code>, <code>RENAME</code>, <code>TRUNCATE</code> and <code>COMMENT</code> statements.'
  3505. },
  3506. 'cockroachdb.sql_started_dml_statements': {
  3507. info: 'The amount of <b>started</b> DML (Data Manipulation Language) statements.'
  3508. },
  3509. 'cockroachdb.sql_executed_dml_statements': {
  3510. info: 'The amount of <b>executed</b> DML (Data Manipulation Language) statements.'
  3511. },
  3512. 'cockroachdb.sql_started_tcl_statements': {
  3513. info: 'The amount of <b>started</b> TCL (Transaction Control Language) statements.'
  3514. },
  3515. 'cockroachdb.sql_executed_tcl_statements': {
  3516. info: 'The amount of <b>executed</b> TCL (Transaction Control Language) statements.'
  3517. },
  3518. 'cockroachdb.live_bytes': {
  3519. info: 'The amount of live data used by both applications and the CockroachDB system.'
  3520. },
  3521. 'cockroachdb.kv_transactions': {
  3522. info: 'KV transactions breakdown:<br>' +
  3523. '<ul>' +
  3524. ' <li><code>committed</code> committed KV transactions (including 1PC).</li>' +
  3525. ' <li><code>fast-path_committed</code> KV transaction on-phase commit attempts.</li>' +
  3526. ' <li><code>aborted</code> aborted KV transactions.</li>' +
  3527. ' </ul>'
  3528. },
  3529. 'cockroachdb.kv_transaction_restarts': {
  3530. info: 'KV transactions restarts breakdown:<br>' +
  3531. '<ul>' +
  3532. ' <li><code>write too old</code> restarts due to a concurrent writer committing first.</li>' +
  3533. ' <li><code>write too old (multiple)</code> restarts due to multiple concurrent writers committing first.</li>' +
  3534. ' <li><code>forwarded timestamp (iso=serializable)</code> restarts due to a forwarded commit timestamp and isolation=SERIALIZABLE".</li>' +
  3535. ' <li><code>possible replay</code> restarts due to possible replays of command batches at the storage layer.</li>' +
  3536. ' <li><code>async consensus failure</code> restarts due to async consensus writes that failed to leave intents.</li>' +
  3537. ' <li><code>read within uncertainty interval</code> restarts due to reading a new value within the uncertainty interval.</li>' +
  3538. ' <li><code>aborted</code> restarts due to an abort by a concurrent transaction (usually due to deadlock).</li>' +
  3539. ' <li><code>push failure</code> restarts due to a transaction push failure.</li>' +
  3540. ' <li><code>unknown</code> restarts due to a unknown reasons.</li>' +
  3541. ' </ul>'
  3542. },
  3543. 'cockroachdb.ranges': {
  3544. info: 'CockroachDB stores all user data (tables, indexes, etc.) and almost all system data in a giant sorted map of key-value pairs. ' +
  3545. 'This keyspace is divided into "ranges", contiguous chunks of the keyspace, so that every key can always be found in a single range.'
  3546. },
  3547. 'cockroachdb.ranges_replication_problem': {
  3548. info: 'Ranges with not optimal number of replicas:<br>' +
  3549. '<ul>' +
  3550. ' <li><code>unavailable</code> ranges with fewer live replicas than needed for quorum.</li>' +
  3551. ' <li><code>under replicated</code> ranges with fewer live replicas than the replication target.</li>' +
  3552. ' <li><code>over replicated</code> ranges with more live replicas than the replication target.</li>' +
  3553. ' </ul>'
  3554. },
  3555. 'cockroachdb.replicas': {
  3556. info: 'CockroachDB replicates each range (3 times by default) and stores each replica on a different node.'
  3557. },
  3558. 'cockroachdb.replicas_leaders': {
  3559. info: 'For each range, one of the replicas is the <code>leader</code> for write requests, <code>not leaseholders</code> is the number of Raft leaders whose range lease is held by another store.'
  3560. },
  3561. 'cockroachdb.replicas_leaseholders': {
  3562. info: 'For each range, one of the replicas holds the "range lease". This replica, referred to as the <code>leaseholder</code>, is the one that receives and coordinates all read and write requests for the range.'
  3563. },
  3564. 'cockroachdb.queue_processing_failures': {
  3565. info: 'Failed replicas breakdown by queue:<br>' +
  3566. '<ul>' +
  3567. ' <li><code>gc</code> replicas which failed processing in the GC queue.</li>' +
  3568. ' <li><code>replica gc</code> replicas which failed processing in the replica GC queue.</li>' +
  3569. ' <li><code>replication</code> replicas which failed processing in the replicate queue.</li>' +
  3570. ' <li><code>split</code> replicas which failed processing in the split queue.</li>' +
  3571. ' <li><code>consistency</code> replicas which failed processing in the consistency checker queue.</li>' +
  3572. ' <li><code>raft log</code> replicas which failed processing in the Raft log queue.</li>' +
  3573. ' <li><code>raft snapshot</code> replicas which failed processing in the Raft repair queue.</li>' +
  3574. ' <li><code>time series maintenance</code> replicas which failed processing in the time series maintenance queue.</li>' +
  3575. ' </ul>'
  3576. },
  3577. 'cockroachdb.rebalancing_queries': {
  3578. info: 'Number of kv-level requests received per second by the store, averaged over a large time period as used in rebalancing decisions.'
  3579. },
  3580. 'cockroachdb.rebalancing_writes': {
  3581. info: 'Number of keys written (i.e. applied by raft) per second to the store, averaged over a large time period as used in rebalancing decisions.'
  3582. },
  3583. 'cockroachdb.slow_requests': {
  3584. info: 'Requests that have been stuck for a long time.'
  3585. },
  3586. 'cockroachdb.timeseries_samples': {
  3587. info: 'The amount of metric samples written to disk.'
  3588. },
  3589. 'cockroachdb.timeseries_write_errors': {
  3590. info: 'The amount of errors encountered while attempting to write metrics to disk.'
  3591. },
  3592. 'cockroachdb.timeseries_write_bytes': {
  3593. info: 'Size of metric samples written to disk.'
  3594. },
  3595. // ------------------------------------------------------------------------
  3596. // Perf
  3597. 'perf.instructions_per_cycle': {
  3598. info: 'An IPC < 1.0 likely means memory bound, and an IPC > 1.0 likely means instruction bound. For more details about the metric take a look at this <a href="https://www.brendangregg.com/blog/2017-05-09/cpu-utilization-is-wrong.html" target="_blank">blog post</a>.'
  3599. },
  3600. // ------------------------------------------------------------------------
  3601. // Filesystem
  3602. 'filesystem.vfs_deleted_objects': {
  3603. title : 'VFS remove',
  3604. info: 'This chart does not show all events that remove files from the file system, because file systems can create their own functions to remove files, it shows calls for the function <code>vfs_unlink</code>. '
  3605. },
  3606. 'filesystem.vfs_io': {
  3607. title : 'VFS IO',
  3608. info: 'Successful or failed calls to functions <code>vfs_read</code> and <code>vfs_write</code>. This chart may not show all file system events if it uses other functions to store data on disk.'
  3609. },
  3610. 'filesystem.vfs_io_bytes': {
  3611. title : 'VFS bytes written',
  3612. info: 'Total of bytes read or written with success using the functions <code>vfs_read</code> and <code>vfs_write</code>.'
  3613. },
  3614. 'filesystem.vfs_io_error': {
  3615. title : 'VFS IO error',
  3616. info: 'Failed calls to functions <code>vfs_read</code> and <code>vfs_write</code>.'
  3617. },
  3618. 'filesystem.vfs_fsync': {
  3619. info: 'Successful or failed calls to functions <code>vfs_fsync</code>.'
  3620. },
  3621. 'filesystem.vfs_fsync_error': {
  3622. info: 'Failed calls to functions <code>vfs_fsync</code>.'
  3623. },
  3624. 'filesystem.vfs_open': {
  3625. info: 'Successful or failed calls to functions <code>vfs_open</code>.'
  3626. },
  3627. 'filesystem.vfs_open_error': {
  3628. info: 'Failed calls to functions <code>vfs_open</code>.'
  3629. },
  3630. 'filesystem.vfs_create': {
  3631. info: 'Successful or failed calls to functions <code>vfs_create</code>.'
  3632. },
  3633. 'filesystem.vfs_create_error': {
  3634. info: 'Failed calls to functions <code>vfs_create</code>.'
  3635. },
  3636. 'filesystem.ext4_read_latency': {
  3637. info: 'Netdata is attaching <code>kprobes</code> for the function <code>ext4_file_read_iter</code>.'
  3638. },
  3639. 'filesystem.ext4_write_latency': {
  3640. info: 'Netdata is attaching <code>kprobes</code> for the function <code>ext4_file_write_iter</code>.'
  3641. },
  3642. 'filesystem.ext4_open_latency': {
  3643. info: 'Netdata is attaching <code>kprobes</code> for the function <code>ext4_file_open</code>.'
  3644. },
  3645. 'filesystem.ext4_sync_latency': {
  3646. info: 'Netdata is attaching <code>kprobes</code> for the function <code>ext4_sync_file</code>.'
  3647. },
  3648. 'filesystem.xfs_read_latency': {
  3649. info: 'Netdata is attaching <code>kprobes</code> for the function <code>xfs_file_read_iter</code>.'
  3650. },
  3651. 'filesystem.xfs_write_latency': {
  3652. info: 'Netdata is attaching <code>kprobes</code> for the function <code>xfs_file_write_iter</code>.'
  3653. },
  3654. 'filesystem.xfs_open_latency': {
  3655. info: 'Netdata is attaching <code>kprobes</code> for the function <code>xfs_file_open</code>.'
  3656. },
  3657. 'filesystem.xfs_sync_latency': {
  3658. info: 'Netdata is attaching <code>kprobes</code> for the function <code>xfs_file_sync</code>.'
  3659. },
  3660. 'filesystem.nfs_read_latency': {
  3661. info: 'Netdata is attaching <code>kprobes</code> for the function <code>nfs_file_read</code>.'
  3662. },
  3663. 'filesystem.nfs_write_latency': {
  3664. info: 'Netdata is attaching <code>kprobes</code> for the function <code>nfs_file_write</code>.'
  3665. },
  3666. 'filesystem.nfs_open_latency': {
  3667. info: 'Netdata is attaching <code>kprobes</code> for functions <code>nfs_file_open</code> and <code>nfs4_file_open</code>'
  3668. },
  3669. 'filesystem.nfs_attribute_latency': {
  3670. info: 'Netdata is attaching <code>kprobes</code> for the function <code>nfs_getattr</code>.'
  3671. },
  3672. 'filesystem.zfs_read_latency': {
  3673. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>zpl_iter_read</code>.'
  3674. },
  3675. 'filesystem.zfs_write_latency': {
  3676. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>zpl_iter_write</code>.'
  3677. },
  3678. 'filesystem.zfs_open_latency': {
  3679. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>zpl_open</code>.'
  3680. },
  3681. 'filesystem.zfs_sync_latency': {
  3682. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>zpl_fsync</code>.'
  3683. },
  3684. 'filesystem.btrfs_read_latency': {
  3685. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>btrfs_file_read_iter</code> (kernel newer than 5.9.16) or the function <code>generic_file_read_iter</code> (old kernels).'
  3686. },
  3687. 'filesystem.btrfs_write_latency': {
  3688. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>btrfs_file_write_iter</code>.'
  3689. },
  3690. 'filesystem.btrfs_open_latency': {
  3691. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>btrfs_file_open</code>.'
  3692. },
  3693. 'filesystem.btrfs_sync_latency': {
  3694. info: 'Netdata is attaching <code>kprobes</code> for when the function <code>btrfs_sync_file</code>.'
  3695. },
  3696. 'mount_points.call': {
  3697. info: 'Monitor calls to syscalls <code>mount(2)</code> and <code>umount(2)</code> that are responsible for attaching or removing filesystems.'
  3698. },
  3699. 'mount_points.error': {
  3700. info: 'Monitor errors in calls to syscalls <code>mount(2)</code> and <code>umount(2)</code>.'
  3701. },
  3702. 'filesystem.file_descriptor': {
  3703. info: 'Calls for internal functions on Linux kernel. The open dimension is attached to the kernel internal function <code>do_sys_open</code> ( For kernels newer than <code>5.5.19</code> we add a kprobe to <code>do_sys_openat2</code>. ), which is the common function called from'+
  3704. ' <a href="https://www.man7.org/linux/man-pages/man2/open.2.html" target="_blank">open(2)</a> ' +
  3705. ' and <a href="https://www.man7.org/linux/man-pages/man2/openat.2.html" target="_blank">openat(2)</a>. ' +
  3706. ' The close dimension is attached to the function <code>__close_fd</code> or <code>close_fd</code> according to your kernel version, which is called from system call' +
  3707. ' <a href="https://www.man7.org/linux/man-pages/man2/close.2.html" target="_blank">close(2)</a>. '
  3708. },
  3709. 'filesystem.file_error': {
  3710. info: 'Failed calls to the kernel internal function <code>do_sys_open</code> ( For kernels newer than <code>5.5.19</code> we add a kprobe to <code>do_sys_openat2</code>. ), which is the common function called from'+
  3711. ' <a href="https://www.man7.org/linux/man-pages/man2/open.2.html" target="_blank">open(2)</a> ' +
  3712. ' and <a href="https://www.man7.org/linux/man-pages/man2/openat.2.html" target="_blank">openat(2)</a>. ' +
  3713. ' The close dimension is attached to the function <code>__close_fd</code> or <code>close_fd</code> according to your kernel version, which is called from system call' +
  3714. ' <a href="https://www.man7.org/linux/man-pages/man2/close.2.html" target="_blank">close(2)</a>. '
  3715. },
  3716. // ------------------------------------------------------------------------
  3717. // eBPF
  3718. 'ebpf.process_thread': {
  3719. title : 'Task creation',
  3720. info: 'Number of times that either <a href="https://www.ece.uic.edu/~yshi1/linux/lkse/node4.html#SECTION00421000000000000000" target="_blank">do_fork</a>, or <code>kernel_clone</code> if you are running kernel newer than 5.9.16, is called to create a new task, which is the common name used to define process and tasks inside the kernel. Netdata identifies the threads by counting the number of calls for <a href="https://linux.die.net/man/2/clone" target="_blank">sys_clone</a> that has the flag <code>CLONE_THREAD</code> set.'
  3721. },
  3722. 'ebpf.exit': {
  3723. title : 'Exit monitoring',
  3724. info: 'Calls for the functions responsible for closing (<a href="https://www.informit.com/articles/article.aspx?p=370047&seqNum=4" target="_blank">do_exit</a>) and releasing (<a href="https://www.informit.com/articles/article.aspx?p=370047&seqNum=4" target="_blank">release_task</a>) tasks.'
  3725. },
  3726. 'ebpf.task_error': {
  3727. title : 'Task error',
  3728. info: 'Number of errors to create a new process or thread.'
  3729. },
  3730. 'ebpf.process_status': {
  3731. title : 'Task status',
  3732. info: 'Difference between the number of process created and the number of threads created per period(<code>process</code> dimension), it also shows the number of possible zombie process running on system.'
  3733. },
  3734. 'apps.swap_read_call': {
  3735. info: 'The function <code>swap_readpage</code> is called when the kernel reads a page from swap memory. Netdata also gives a summary for these charts in <a href="#menu_system_submenu_swap">System overview</a>.'
  3736. },
  3737. 'apps.swap_write_call': {
  3738. info: 'The function <code>swap_writepage</code> is called when the kernel writes a page to swap memory.'
  3739. },
  3740. // ------------------------------------------------------------------------
  3741. // ACLK Internal Stats
  3742. 'netdata.aclk_status': {
  3743. valueRange: "[0, 1]",
  3744. info: 'This chart shows if ACLK was online during entirety of the sample duration.'
  3745. },
  3746. 'netdata.aclk_query_per_second': {
  3747. info: 'This chart shows how many queries were added for ACLK_query thread to process and how many it was actually able to process.'
  3748. },
  3749. 'netdata.aclk_latency_mqtt': {
  3750. info: 'Measures latency between MQTT publish of the message and it\'s PUB_ACK being received'
  3751. },
  3752. // ------------------------------------------------------------------------
  3753. // VerneMQ
  3754. 'vernemq.sockets': {
  3755. mainheads: [
  3756. function (os, id) {
  3757. void (os);
  3758. return '<div data-netdata="' + id + '"'
  3759. + ' data-dimensions="open_sockets"'
  3760. + ' data-chart-library="gauge"'
  3761. + ' data-title="Connected Clients"'
  3762. + ' data-units="clients"'
  3763. + ' data-gauge-adjust="width"'
  3764. + ' data-width="16%"'
  3765. + ' data-before="0"'
  3766. + ' data-after="-CHART_DURATION"'
  3767. + ' data-points="CHART_DURATION"'
  3768. + ' data-colors="' + NETDATA.colors[4] + '"'
  3769. + ' data-decimal-digits="2"'
  3770. + ' role="application"></div>';
  3771. }
  3772. ]
  3773. },
  3774. 'vernemq.queue_processes': {
  3775. mainheads: [
  3776. function (os, id) {
  3777. void (os);
  3778. return '<div data-netdata="' + id + '"'
  3779. + ' data-dimensions="queue_processes"'
  3780. + ' data-chart-library="gauge"'
  3781. + ' data-title="Queues Processes"'
  3782. + ' data-units="processes"'
  3783. + ' data-gauge-adjust="width"'
  3784. + ' data-width="16%"'
  3785. + ' data-before="0"'
  3786. + ' data-after="-CHART_DURATION"'
  3787. + ' data-points="CHART_DURATION"'
  3788. + ' data-colors="' + NETDATA.colors[4] + '"'
  3789. + ' data-decimal-digits="2"'
  3790. + ' role="application"></div>';
  3791. }
  3792. ]
  3793. },
  3794. 'vernemq.queue_messages': {
  3795. mainheads: [
  3796. function (os, id) {
  3797. void (os);
  3798. return '<div data-netdata="' + id + '"'
  3799. + ' data-dimensions="queue_message_in"'
  3800. + ' data-chart-library="easypiechart"'
  3801. + ' data-title="MQTT Receive Rate"'
  3802. + ' data-units="messages/s"'
  3803. + ' data-gauge-adjust="width"'
  3804. + ' data-width="14%"'
  3805. + ' data-before="0"'
  3806. + ' data-after="-CHART_DURATION"'
  3807. + ' data-points="CHART_DURATION"'
  3808. + ' data-colors="' + NETDATA.colors[0] + '"'
  3809. + ' data-decimal-digits="2"'
  3810. + ' role="application"></div>';
  3811. },
  3812. function (os, id) {
  3813. void (os);
  3814. return '<div data-netdata="' + id + '"'
  3815. + ' data-dimensions="queue_message_out"'
  3816. + ' data-chart-library="easypiechart"'
  3817. + ' data-title="MQTT Send Rate"'
  3818. + ' data-units="messages/s"'
  3819. + ' data-gauge-adjust="width"'
  3820. + ' data-width="14%"'
  3821. + ' data-before="0"'
  3822. + ' data-after="-CHART_DURATION"'
  3823. + ' data-points="CHART_DURATION"'
  3824. + ' data-colors="' + NETDATA.colors[1] + '"'
  3825. + ' data-decimal-digits="2"'
  3826. + ' role="application"></div>';
  3827. },
  3828. ]
  3829. },
  3830. 'vernemq.average_scheduler_utilization': {
  3831. mainheads: [
  3832. function (os, id) {
  3833. void (os);
  3834. return '<div data-netdata="' + id + '"'
  3835. + ' data-dimensions="system_utilization"'
  3836. + ' data-chart-library="gauge"'
  3837. + ' data-gauge-max-value="100"'
  3838. + ' data-title="Average Scheduler Utilization"'
  3839. + ' data-units="percentage"'
  3840. + ' data-gauge-adjust="width"'
  3841. + ' data-width="16%"'
  3842. + ' data-before="0"'
  3843. + ' data-after="-CHART_DURATION"'
  3844. + ' data-points="CHART_DURATION"'
  3845. + ' data-colors="' + NETDATA.colors[3] + '"'
  3846. + ' data-decimal-digits="2"'
  3847. + ' role="application"></div>';
  3848. }
  3849. ]
  3850. },
  3851. // ------------------------------------------------------------------------
  3852. // Apache Pulsar
  3853. 'pulsar.messages_rate': {
  3854. mainheads: [
  3855. function (os, id) {
  3856. void (os);
  3857. return '<div data-netdata="' + id + '"'
  3858. + ' data-dimensions="pulsar_rate_in"'
  3859. + ' data-chart-library="easypiechart"'
  3860. + ' data-title="Publish"'
  3861. + ' data-units="messages/s"'
  3862. + ' data-gauge-adjust="width"'
  3863. + ' data-width="12%"'
  3864. + ' data-before="0"'
  3865. + ' data-after="-CHART_DURATION"'
  3866. + ' data-points="CHART_DURATION"'
  3867. + ' data-colors="' + NETDATA.colors[0] + '"'
  3868. + ' data-decimal-digits="2"'
  3869. + ' role="application"></div>';
  3870. },
  3871. function (os, id) {
  3872. void (os);
  3873. return '<div data-netdata="' + id + '"'
  3874. + ' data-dimensions="pulsar_rate_out"'
  3875. + ' data-chart-library="easypiechart"'
  3876. + ' data-title="Dispatch"'
  3877. + ' data-units="messages/s"'
  3878. + ' data-gauge-adjust="width"'
  3879. + ' data-width="12%"'
  3880. + ' data-before="0"'
  3881. + ' data-after="-CHART_DURATION"'
  3882. + ' data-points="CHART_DURATION"'
  3883. + ' data-colors="' + NETDATA.colors[1] + '"'
  3884. + ' data-decimal-digits="2"'
  3885. + ' role="application"></div>';
  3886. },
  3887. ]
  3888. },
  3889. 'pulsar.subscription_msg_rate_redeliver': {
  3890. mainheads: [
  3891. function (os, id) {
  3892. void (os);
  3893. return '<div data-netdata="' + id + '"'
  3894. + ' data-dimensions="pulsar_subscription_msg_rate_redeliver"'
  3895. + ' data-chart-library="gauge"'
  3896. + ' data-gauge-max-value="100"'
  3897. + ' data-title="Redelivered"'
  3898. + ' data-units="messages/s"'
  3899. + ' data-gauge-adjust="width"'
  3900. + ' data-width="14%"'
  3901. + ' data-before="0"'
  3902. + ' data-after="-CHART_DURATION"'
  3903. + ' data-points="CHART_DURATION"'
  3904. + ' data-colors="' + NETDATA.colors[3] + '"'
  3905. + ' data-decimal-digits="2"'
  3906. + ' role="application"></div>';
  3907. }
  3908. ]
  3909. },
  3910. 'pulsar.subscription_blocked_on_unacked_messages': {
  3911. mainheads: [
  3912. function (os, id) {
  3913. void (os);
  3914. return '<div data-netdata="' + id + '"'
  3915. + ' data-dimensions="pulsar_subscription_blocked_on_unacked_messages"'
  3916. + ' data-chart-library="gauge"'
  3917. + ' data-gauge-max-value="100"'
  3918. + ' data-title="Blocked On Unacked"'
  3919. + ' data-units="subscriptions"'
  3920. + ' data-gauge-adjust="width"'
  3921. + ' data-width="14%"'
  3922. + ' data-before="0"'
  3923. + ' data-after="-CHART_DURATION"'
  3924. + ' data-points="CHART_DURATION"'
  3925. + ' data-colors="' + NETDATA.colors[3] + '"'
  3926. + ' data-decimal-digits="2"'
  3927. + ' role="application"></div>';
  3928. }
  3929. ]
  3930. },
  3931. 'pulsar.msg_backlog': {
  3932. mainheads: [
  3933. function (os, id) {
  3934. void (os);
  3935. return '<div data-netdata="' + id + '"'
  3936. + ' data-dimensions="pulsar_msg_backlog"'
  3937. + ' data-chart-library="gauge"'
  3938. + ' data-gauge-max-value="100"'
  3939. + ' data-title="Messages Backlog"'
  3940. + ' data-units="messages"'
  3941. + ' data-gauge-adjust="width"'
  3942. + ' data-width="14%"'
  3943. + ' data-before="0"'
  3944. + ' data-after="-CHART_DURATION"'
  3945. + ' data-points="CHART_DURATION"'
  3946. + ' data-colors="' + NETDATA.colors[2] + '"'
  3947. + ' data-decimal-digits="2"'
  3948. + ' role="application"></div>';
  3949. }
  3950. ]
  3951. },
  3952. 'pulsar.namespace_messages_rate': {
  3953. heads: [
  3954. function (os, id) {
  3955. void (os);
  3956. return '<div data-netdata="' + id + '"'
  3957. + ' data-dimensions="publish"'
  3958. + ' data-chart-library="easypiechart"'
  3959. + ' data-title="Publish"'
  3960. + ' data-units="messages/s"'
  3961. + ' data-gauge-adjust="width"'
  3962. + ' data-width="12%"'
  3963. + ' data-before="0"'
  3964. + ' data-after="-CHART_DURATION"'
  3965. + ' data-points="CHART_DURATION"'
  3966. + ' data-colors="' + NETDATA.colors[0] + '"'
  3967. + ' data-decimal-digits="2"'
  3968. + ' role="application"></div>';
  3969. },
  3970. function (os, id) {
  3971. void (os);
  3972. return '<div data-netdata="' + id + '"'
  3973. + ' data-dimensions="dispatch"'
  3974. + ' data-chart-library="easypiechart"'
  3975. + ' data-title="Dispatch"'
  3976. + ' data-units="messages/s"'
  3977. + ' data-gauge-adjust="width"'
  3978. + ' data-width="12%"'
  3979. + ' data-before="0"'
  3980. + ' data-after="-CHART_DURATION"'
  3981. + ' data-points="CHART_DURATION"'
  3982. + ' data-colors="' + NETDATA.colors[1] + '"'
  3983. + ' data-decimal-digits="2"'
  3984. + ' role="application"></div>';
  3985. },
  3986. ]
  3987. },
  3988. 'pulsar.namespace_subscription_msg_rate_redeliver': {
  3989. heads: [
  3990. function (os, id) {
  3991. void (os);
  3992. return '<div data-netdata="' + id + '"'
  3993. + ' data-dimensions="redelivered"'
  3994. + ' data-chart-library="gauge"'
  3995. + ' data-gauge-max-value="100"'
  3996. + ' data-title="Redelivered"'
  3997. + ' data-units="messages/s"'
  3998. + ' data-gauge-adjust="width"'
  3999. + ' data-width="14%"'
  4000. + ' data-before="0"'
  4001. + ' data-after="-CHART_DURATION"'
  4002. + ' data-points="CHART_DURATION"'
  4003. + ' data-colors="' + NETDATA.colors[3] + '"'
  4004. + ' data-decimal-digits="2"'
  4005. + ' role="application"></div>';
  4006. }
  4007. ]
  4008. },
  4009. 'pulsar.namespace_subscription_blocked_on_unacked_messages': {
  4010. heads: [
  4011. function (os, id) {
  4012. void (os);
  4013. return '<div data-netdata="' + id + '"'
  4014. + ' data-dimensions="blocked"'
  4015. + ' data-chart-library="gauge"'
  4016. + ' data-gauge-max-value="100"'
  4017. + ' data-title="Blocked On Unacked"'
  4018. + ' data-units="subscriptions"'
  4019. + ' data-gauge-adjust="width"'
  4020. + ' data-width="14%"'
  4021. + ' data-before="0"'
  4022. + ' data-after="-CHART_DURATION"'
  4023. + ' data-points="CHART_DURATION"'
  4024. + ' data-colors="' + NETDATA.colors[3] + '"'
  4025. + ' data-decimal-digits="2"'
  4026. + ' role="application"></div>';
  4027. }
  4028. ]
  4029. },
  4030. 'pulsar.namespace_msg_backlog': {
  4031. heads: [
  4032. function (os, id) {
  4033. void (os);
  4034. return '<div data-netdata="' + id + '"'
  4035. + ' data-dimensions="backlog"'
  4036. + ' data-chart-library="gauge"'
  4037. + ' data-gauge-max-value="100"'
  4038. + ' data-title="Messages Backlog"'
  4039. + ' data-units="messages"'
  4040. + ' data-gauge-adjust="width"'
  4041. + ' data-width="14%"'
  4042. + ' data-before="0"'
  4043. + ' data-after="-CHART_DURATION"'
  4044. + ' data-points="CHART_DURATION"'
  4045. + ' data-colors="' + NETDATA.colors[2] + '"'
  4046. + ' data-decimal-digits="2"'
  4047. + ' role="application"></div>';
  4048. },
  4049. ],
  4050. },
  4051. // ------------------------------------------------------------------------
  4052. // Nvidia-smi
  4053. 'nvidia_smi.fan_speed': {
  4054. heads: [
  4055. function (os, id) {
  4056. void (os);
  4057. return '<div data-netdata="' + id + '"'
  4058. + ' data-dimensions="speed"'
  4059. + ' data-chart-library="easypiechart"'
  4060. + ' data-title="Fan Speed"'
  4061. + ' data-units="percentage"'
  4062. + ' data-easypiechart-max-value="100"'
  4063. + ' data-gauge-adjust="width"'
  4064. + ' data-width="12%"'
  4065. + ' data-before="0"'
  4066. + ' data-after="-CHART_DURATION"'
  4067. + ' data-points="CHART_DURATION"'
  4068. + ' data-colors="' + NETDATA.colors[4] + '"'
  4069. + ' data-decimal-digits="2"'
  4070. + ' role="application"></div>';
  4071. }
  4072. ]
  4073. },
  4074. 'nvidia_smi.temperature': {
  4075. heads: [
  4076. function (os, id) {
  4077. void (os);
  4078. return '<div data-netdata="' + id + '"'
  4079. + ' data-dimensions="temp"'
  4080. + ' data-chart-library="easypiechart"'
  4081. + ' data-title="Temperature"'
  4082. + ' data-units="celsius"'
  4083. + ' data-gauge-adjust="width"'
  4084. + ' data-width="12%"'
  4085. + ' data-before="0"'
  4086. + ' data-after="-CHART_DURATION"'
  4087. + ' data-points="CHART_DURATION"'
  4088. + ' data-colors="' + NETDATA.colors[3] + '"'
  4089. + ' data-decimal-digits="2"'
  4090. + ' role="application"></div>';
  4091. }
  4092. ]
  4093. },
  4094. 'nvidia_smi.memory_allocated': {
  4095. heads: [
  4096. function (os, id) {
  4097. void (os);
  4098. return '<div data-netdata="' + id + '"'
  4099. + ' data-dimensions="used"'
  4100. + ' data-chart-library="easypiechart"'
  4101. + ' data-title="Used Memory"'
  4102. + ' data-units="MiB"'
  4103. + ' data-gauge-adjust="width"'
  4104. + ' data-width="12%"'
  4105. + ' data-before="0"'
  4106. + ' data-after="-CHART_DURATION"'
  4107. + ' data-points="CHART_DURATION"'
  4108. + ' data-colors="' + NETDATA.colors[4] + '"'
  4109. + ' data-decimal-digits="2"'
  4110. + ' role="application"></div>';
  4111. }
  4112. ]
  4113. },
  4114. 'nvidia_smi.power': {
  4115. heads: [
  4116. function (os, id) {
  4117. void (os);
  4118. return '<div data-netdata="' + id + '"'
  4119. + ' data-dimensions="power"'
  4120. + ' data-chart-library="easypiechart"'
  4121. + ' data-title="Power Utilization"'
  4122. + ' data-units="watts"'
  4123. + ' data-gauge-adjust="width"'
  4124. + ' data-width="12%"'
  4125. + ' data-before="0"'
  4126. + ' data-after="-CHART_DURATION"'
  4127. + ' data-points="CHART_DURATION"'
  4128. + ' data-colors="' + NETDATA.colors[2] + '"'
  4129. + ' data-decimal-digits="2"'
  4130. + ' role="application"></div>';
  4131. }
  4132. ]
  4133. },
  4134. // ------------------------------------------------------------------------
  4135. // Supervisor
  4136. 'supervisord.process_state_code': {
  4137. info: '<a href="http://supervisord.org/subprocess.html#process-states" target="_blank">Process states map</a>: ' +
  4138. '<code>0</code> - stopped, <code>10</code> - starting, <code>20</code> - running, <code>30</code> - backoff,' +
  4139. '<code>40</code> - stopping, <code>100</code> - exited, <code>200</code> - fatal, <code>1000</code> - unknown.'
  4140. },
  4141. // ------------------------------------------------------------------------
  4142. // Systemd units
  4143. 'systemd.service_units_state': {
  4144. info: 'Service units start and control daemons and the processes they consist of. ' +
  4145. 'For details, see <a href="https://www.freedesktop.org/software/systemd/man/systemd.service.html#" target="_blank"> systemd.service(5)</a>'
  4146. },
  4147. 'systemd.socket_unit_state': {
  4148. info: 'Socket units encapsulate local IPC or network sockets in the system, useful for socket-based activation. ' +
  4149. 'For details about socket units, see <a href="https://www.freedesktop.org/software/systemd/man/systemd.socket.html#" target="_blank"> systemd.socket(5)</a>, ' +
  4150. 'for details on socket-based activation and other forms of activation, see <a href="https://www.freedesktop.org/software/systemd/man/daemon.html#" target="_blank"> daemon(7)</a>.'
  4151. },
  4152. 'systemd.target_unit_state': {
  4153. info: 'Target units are useful to group units, or provide well-known synchronization points during boot-up, ' +
  4154. 'see <a href="https://www.freedesktop.org/software/systemd/man/systemd.target.html#" target="_blank"> systemd.target(5)</a>.'
  4155. },
  4156. 'systemd.path_unit_state': {
  4157. info: 'Path units may be used to activate other services when file system objects change or are modified. ' +
  4158. 'See <a href="https://www.freedesktop.org/software/systemd/man/systemd.path.html#" target="_blank"> systemd.path(5)</a>.'
  4159. },
  4160. 'systemd.device_unit_state': {
  4161. info: 'Device units expose kernel devices in systemd and may be used to implement device-based activation. ' +
  4162. 'For details, see <a href="https://www.freedesktop.org/software/systemd/man/systemd.device.html#" target="_blank"> systemd.device(5)</a>.'
  4163. },
  4164. 'systemd.mount_unit_state': {
  4165. info: 'Mount units control mount points in the file system. ' +
  4166. 'For details, see <a href="https://www.freedesktop.org/software/systemd/man/systemd.mount.html#" target="_blank"> systemd.mount(5)</a>.'
  4167. },
  4168. 'systemd.automount_unit_state': {
  4169. info: 'Automount units provide automount capabilities, for on-demand mounting of file systems as well as parallelized boot-up. ' +
  4170. 'See <a href="https://www.freedesktop.org/software/systemd/man/systemd.automount.html#" target="_blank"> systemd.automount(5)</a>.'
  4171. },
  4172. 'systemd.swap_unit_state': {
  4173. info: 'Swap units are very similar to mount units and encapsulate memory swap partitions or files of the operating system. ' +
  4174. 'They are described in <a href="https://www.freedesktop.org/software/systemd/man/systemd.swap.html#" target="_blank"> systemd.swap(5)</a>.'
  4175. },
  4176. 'systemd.timer_unit_state': {
  4177. info: 'Timer units are useful for triggering activation of other units based on timers. ' +
  4178. 'You may find details in <a href="https://www.freedesktop.org/software/systemd/man/systemd.timer.html#" target="_blank"> systemd.timer(5)</a>.'
  4179. },
  4180. 'systemd.scope_unit_state': {
  4181. info: 'Slice units may be used to group units which manage system processes (such as service and scope units) ' +
  4182. 'in a hierarchical tree for resource management purposes. ' +
  4183. 'See <a href="https://www.freedesktop.org/software/systemd/man/systemd.scope.html#" target="_blank"> systemd.scope(5)</a>.'
  4184. },
  4185. 'systemd.slice_unit_state': {
  4186. info: 'Scope units are similar to service units, but manage foreign processes instead of starting them as well. ' +
  4187. 'See <a href="https://www.freedesktop.org/software/systemd/man/systemd.slice.html#" target="_blank"> systemd.slice(5)</a>.'
  4188. },
  4189. };