statsd.c 114 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "daemon/common.h"
  3. #define STATSD_CHART_PREFIX "statsd"
  4. #define PLUGIN_STATSD_NAME "statsd.plugin"
  5. #define STATSD_LISTEN_PORT 8125
  6. #define STATSD_LISTEN_BACKLOG 4096
  7. #define WORKER_JOB_TYPE_TCP_CONNECTED 0
  8. #define WORKER_JOB_TYPE_TCP_DISCONNECTED 1
  9. #define WORKER_JOB_TYPE_RCV_DATA 2
  10. #define WORKER_JOB_TYPE_SND_DATA 3
  11. #if WORKER_UTILIZATION_MAX_JOB_TYPES < 4
  12. #error Please increase WORKER_UTILIZATION_MAX_JOB_TYPES to at least 4
  13. #endif
  14. // --------------------------------------------------------------------------------------
  15. // DO NOT ENABLE MULTITHREADING - IT IS NOT WELL TESTED
  16. // #define STATSD_MULTITHREADED 1
  // Options passed when creating the per-metric dictionaries in this file.
  // DICT_OPTION_DONT_OVERWRITE_VALUE is what lets dictionary_set() act as
  // "find or add" (an existing item is returned instead of being replaced).
  #define STATSD_DICTIONARY_OPTIONS (DICT_OPTION_DONT_OVERWRITE_VALUE | DICT_OPTION_ADD_IN_FRONT)

  // Floating point values get multiplied by this, with the same divisor.
  #define STATSD_DECIMAL_DETAIL 1000
  19. // --------------------------------------------------------------------------------------------------------------------
  20. // data specific to each metric type
  21. typedef struct statsd_metric_gauge {
  22. NETDATA_DOUBLE value;
  23. } STATSD_METRIC_GAUGE;
  24. typedef struct statsd_metric_counter { // counter and meter
  25. collected_number value;
  26. } STATSD_METRIC_COUNTER;
  27. typedef struct statsd_histogram_extensions {
  28. netdata_mutex_t mutex;
  29. // average is stored in metric->last
  30. collected_number last_min;
  31. collected_number last_max;
  32. collected_number last_percentile;
  33. collected_number last_median;
  34. collected_number last_stddev;
  35. collected_number last_sum;
  36. int zeroed;
  37. RRDDIM *rd_min;
  38. RRDDIM *rd_max;
  39. RRDDIM *rd_percentile;
  40. RRDDIM *rd_median;
  41. RRDDIM *rd_stddev;
  42. //RRDDIM *rd_sum;
  43. uint32_t size;
  44. uint32_t used;
  45. NETDATA_DOUBLE *values; // dynamic array of values collected
  46. } STATSD_METRIC_HISTOGRAM_EXTENSIONS;
  47. typedef struct statsd_metric_histogram { // histogram and timer
  48. STATSD_METRIC_HISTOGRAM_EXTENSIONS *ext;
  49. } STATSD_METRIC_HISTOGRAM;
  50. typedef struct statsd_metric_set {
  51. DICTIONARY *dict;
  52. } STATSD_METRIC_SET;
  53. typedef struct statsd_metric_dictionary_item {
  54. uint32_t count;
  55. RRDDIM *rd;
  56. } STATSD_METRIC_DICTIONARY_ITEM;
  57. typedef struct statsd_metric_dictionary {
  58. DICTIONARY *dict;
  59. } STATSD_METRIC_DICTIONARY;
  60. // --------------------------------------------------------------------------------------------------------------------
  61. // this is a metric - for all types of metrics
  // Per-metric option flags (bitfield); one bit per flag.
  typedef enum __attribute__((packed)) statsd_metric_options {
      STATSD_METRIC_OPTION_NONE                         = 0,         // no options set
      STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED = (1 << 0),  // do not update the chart dimension, when this metric is not collected
      STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED        = (1 << 1),  // render a private chart for this metric
      STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED        = (1 << 2),  // the metric has been checked if it should get private chart or not
      STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT        = (1 << 3),  // show the count of events for this private chart
      STATSD_METRIC_OPTION_CHECKED_IN_APPS              = (1 << 4),  // set when this metric has been checked against apps
      STATSD_METRIC_OPTION_USED_IN_APPS                 = (1 << 5),  // set when this metric is used in apps
      STATSD_METRIC_OPTION_CHECKED                      = (1 << 6),  // set when the charting thread checks this metric for use in charts (its usefulness)
      STATSD_METRIC_OPTION_USEFUL                       = (1 << 7),  // set when the charting thread finds the metric useful (i.e. used in a chart)
      STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED       = (1 << 8),  // set when the collection is full for this metric
      STATSD_METRIC_OPTION_UPDATED_CHART_METADATA       = (1 << 9),  // set when the private chart metadata have been updated via tags
      STATSD_METRIC_OPTION_OBSOLETE                     = (1 << 14), // set when the metric is obsoleted
  } STATS_METRIC_OPTIONS;
  // The kinds of metrics handled; each kind has its own STATSD_INDEX.
  typedef enum __attribute__((packed)) statsd_metric_type {
      STATSD_METRIC_TYPE_GAUGE = 0,
      STATSD_METRIC_TYPE_COUNTER,
      STATSD_METRIC_TYPE_METER,
      STATSD_METRIC_TYPE_TIMER,
      STATSD_METRIC_TYPE_HISTOGRAM,
      STATSD_METRIC_TYPE_SET,
      STATSD_METRIC_TYPE_DICTIONARY
  } STATSD_METRIC_TYPE;
  85. typedef struct statsd_metric {
  86. const char *name; // the name of the metric - linked to dictionary name
  87. uint32_t hash; // hash of the name
  88. STATSD_METRIC_TYPE type;
  89. // metadata about data collection
  90. collected_number events; // the number of times this metric has been collected (never resets)
  91. uint32_t count; // the number of times this metric has been collected since the last flush
  92. time_t last_collected; // timestamp of the last incoming value
  93. // the actual collected data
  94. union {
  95. STATSD_METRIC_GAUGE gauge;
  96. STATSD_METRIC_COUNTER counter;
  97. STATSD_METRIC_HISTOGRAM histogram;
  98. STATSD_METRIC_SET set;
  99. STATSD_METRIC_DICTIONARY dictionary;
  100. };
  101. char *units;
  102. char *dimname;
  103. char *family;
  104. // chart related members
  105. STATS_METRIC_OPTIONS options; // STATSD_METRIC_OPTION_* (bitfield)
  106. char reset; // set to 1 by the charting thread to instruct the collector thread(s) to reset this metric
  107. collected_number last; // the last value sent to netdata
  108. RRDSET *st; // the private chart of this metric
  109. RRDDIM *rd_value; // the dimension of this metric value
  110. RRDDIM *rd_count; // the dimension for the number of events received
  111. // linking, used for walking through all metrics
  112. struct statsd_metric *next_useful;
  113. } STATSD_METRIC;
  114. // --------------------------------------------------------------------------------------------------------------------
  115. // each type of metric has its own index
  116. typedef struct statsd_index {
  117. char *name; // the name of the index of metrics
  118. uint32_t events; // the number of events processed for this index
  119. uint32_t metrics; // the number of metrics in this index
  120. uint32_t useful; // the number of useful metrics in this index
  121. STATS_METRIC_OPTIONS default_options; // default options for all metrics in this index
  122. STATSD_METRIC_TYPE type; // the type of index
  123. DICTIONARY *dict;
  124. STATSD_METRIC *first_useful; // the linked list of useful metrics (new metrics are added in front)
  125. } STATSD_INDEX;
  126. // --------------------------------------------------------------------------------------------------------------------
  127. // synthetic charts
  // Selects which value of the source metric a synthetic chart dimension uses.
  typedef enum __attribute__((packed)) statsd_app_chart_dimension_value_type {
      STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS = 0,
      STATSD_APP_CHART_DIM_VALUE_TYPE_LAST,
      STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE,
      STATSD_APP_CHART_DIM_VALUE_TYPE_SUM,
      STATSD_APP_CHART_DIM_VALUE_TYPE_MIN,
      STATSD_APP_CHART_DIM_VALUE_TYPE_MAX,
      STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE,
      STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN,
      STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV
  } STATSD_APP_CHART_DIM_VALUE_TYPE;
  139. typedef struct statsd_app_chart_dimension {
  140. const char *name; // the name of this dimension
  141. const char *metric; // the source metric name of this dimension
  142. uint32_t metric_hash; // hash for fast string comparisons
  143. int32_t multiplier; // the multiplier of the dimension
  144. int32_t divisor; // the divisor of the dimension
  145. RRDDIM_FLAGS flags; // the RRDDIM flags for this dimension
  146. RRDDIM_OPTIONS options; // the RRDDIM options for this dimension
  147. RRD_ALGORITHM algorithm; // the algorithm of this dimension
  148. STATSD_APP_CHART_DIM_VALUE_TYPE value_type; // which value to use of the source metric
  149. SIMPLE_PATTERN *metric_pattern; // set when the 'metric' is a simple pattern
  150. RRDDIM *rd; // a pointer to the RRDDIM that has been created for this dimension
  151. collected_number *value_ptr; // a pointer to the source metric value
  152. struct statsd_app_chart_dimension *next; // the next dimension for this chart
  153. } STATSD_APP_CHART_DIM;
  154. typedef struct statsd_app_chart {
  155. const char *id;
  156. const char *name;
  157. const char *title;
  158. const char *family;
  159. const char *context;
  160. const char *units;
  161. const char *module;
  162. int32_t priority;
  163. RRDSET_TYPE chart_type;
  164. STATSD_APP_CHART_DIM *dimensions;
  165. uint32_t dimensions_count;
  166. uint32_t dimensions_linked_count;
  167. RRDSET *st;
  168. struct statsd_app_chart *next;
  169. } STATSD_APP_CHART;
  170. typedef struct statsd_app {
  171. const char *name;
  172. SIMPLE_PATTERN *metrics;
  173. STATS_METRIC_OPTIONS default_options;
  174. RRD_MEMORY_MODE rrd_memory_mode;
  175. int32_t rrd_history_entries;
  176. DICTIONARY *dict;
  177. const char *source;
  178. STATSD_APP_CHART *charts;
  179. struct statsd_app *next;
  180. } STATSD_APP;
  181. // --------------------------------------------------------------------------------------------------------------------
  182. // global statsd data
  183. struct collection_thread_status {
  184. SPINLOCK spinlock;
  185. bool running;
  186. uint32_t max_sockets;
  187. netdata_thread_t thread;
  188. };
  189. static struct statsd {
  190. STATSD_INDEX gauges;
  191. STATSD_INDEX counters;
  192. STATSD_INDEX timers;
  193. STATSD_INDEX histograms;
  194. STATSD_INDEX meters;
  195. STATSD_INDEX sets;
  196. STATSD_INDEX dictionaries;
  197. size_t unknown_types;
  198. size_t socket_errors;
  199. size_t tcp_socket_connects;
  200. size_t tcp_socket_disconnects;
  201. size_t tcp_socket_connected;
  202. size_t tcp_socket_reads;
  203. size_t tcp_packets_received;
  204. size_t tcp_bytes_read;
  205. size_t udp_socket_reads;
  206. size_t udp_packets_received;
  207. size_t udp_bytes_read;
  208. int32_t update_every;
  209. bool enabled;
  210. bool private_charts_hidden;
  211. SIMPLE_PATTERN *charts_for;
  212. uint32_t tcp_idle_timeout;
  213. collected_number decimal_detail;
  214. uint32_t private_charts;
  215. uint32_t max_private_charts_hard;
  216. uint32_t set_obsolete_after;
  217. STATSD_APP *apps;
  218. uint32_t recvmmsg_size;
  219. uint32_t histogram_increase_step;
  220. uint32_t dictionary_max_unique;
  221. double histogram_percentile;
  222. char *histogram_percentile_str;
  223. int threads;
  224. struct collection_thread_status *collection_threads_status;
  225. LISTEN_SOCKETS sockets;
  226. } statsd = {
  227. .enabled = 1,
  228. .max_private_charts_hard = 1000,
  229. .private_charts_hidden = false,
  230. .recvmmsg_size = 10,
  231. .decimal_detail = STATSD_DECIMAL_DETAIL,
  232. .gauges = {
  233. .name = "gauge",
  234. .events = 0,
  235. .metrics = 0,
  236. .dict = NULL,
  237. .type = STATSD_METRIC_TYPE_GAUGE,
  238. .default_options = STATSD_METRIC_OPTION_NONE
  239. },
  240. .counters = {
  241. .name = "counter",
  242. .events = 0,
  243. .metrics = 0,
  244. .dict = NULL,
  245. .type = STATSD_METRIC_TYPE_COUNTER,
  246. .default_options = STATSD_METRIC_OPTION_NONE
  247. },
  248. .timers = {
  249. .name = "timer",
  250. .events = 0,
  251. .metrics = 0,
  252. .dict = NULL,
  253. .type = STATSD_METRIC_TYPE_TIMER,
  254. .default_options = STATSD_METRIC_OPTION_NONE
  255. },
  256. .histograms = {
  257. .name = "histogram",
  258. .events = 0,
  259. .metrics = 0,
  260. .dict = NULL,
  261. .type = STATSD_METRIC_TYPE_HISTOGRAM,
  262. .default_options = STATSD_METRIC_OPTION_NONE
  263. },
  264. .meters = {
  265. .name = "meter",
  266. .events = 0,
  267. .metrics = 0,
  268. .dict = NULL,
  269. .type = STATSD_METRIC_TYPE_METER,
  270. .default_options = STATSD_METRIC_OPTION_NONE
  271. },
  272. .sets = {
  273. .name = "set",
  274. .events = 0,
  275. .metrics = 0,
  276. .dict = NULL,
  277. .type = STATSD_METRIC_TYPE_SET,
  278. .default_options = STATSD_METRIC_OPTION_NONE
  279. },
  280. .dictionaries = {
  281. .name = "dictionary",
  282. .events = 0,
  283. .metrics = 0,
  284. .dict = NULL,
  285. .type = STATSD_METRIC_TYPE_DICTIONARY,
  286. .default_options = STATSD_METRIC_OPTION_NONE
  287. },
  288. .tcp_idle_timeout = 600,
  289. .apps = NULL,
  290. .histogram_percentile = 95.0,
  291. .histogram_increase_step = 10,
  292. .dictionary_max_unique = 200,
  293. .threads = 0,
  294. .collection_threads_status = NULL,
  295. .sockets = {
  296. .config = &netdata_config,
  297. .config_section = CONFIG_SECTION_STATSD,
  298. .default_bind_to = "udp:localhost tcp:localhost",
  299. .default_port = STATSD_LISTEN_PORT,
  300. .backlog = STATSD_LISTEN_BACKLOG
  301. },
  302. };
  303. // --------------------------------------------------------------------------------------------------------------------
  304. // statsd index management - add/find metrics
  305. static void dictionary_metric_insert_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  306. STATSD_INDEX *index = (STATSD_INDEX *)data;
  307. STATSD_METRIC *m = (STATSD_METRIC *)value;
  308. const char *name = dictionary_acquired_item_name(item);
  309. netdata_log_debug(D_STATSD, "Creating new %s metric '%s'", index->name, name);
  310. m->name = name;
  311. m->hash = simple_hash(name);
  312. m->type = index->type;
  313. m->options = index->default_options;
  314. if (m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  315. m->histogram.ext = callocz(1,sizeof(STATSD_METRIC_HISTOGRAM_EXTENSIONS));
  316. netdata_mutex_init(&m->histogram.ext->mutex);
  317. }
  318. __atomic_fetch_add(&index->metrics, 1, __ATOMIC_RELAXED);
  319. }
  320. static void dictionary_metric_delete_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  321. (void)data; // STATSD_INDEX *index = (STATSD_INDEX *)data;
  322. (void)item;
  323. STATSD_METRIC *m = (STATSD_METRIC *)value;
  324. if(m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  325. freez(m->histogram.ext);
  326. m->histogram.ext = NULL;
  327. }
  328. freez(m->units);
  329. freez(m->family);
  330. freez(m->dimname);
  331. }
  332. static inline STATSD_METRIC *statsd_find_or_add_metric(STATSD_INDEX *index, const char *name) {
  333. netdata_log_debug(D_STATSD, "searching for metric '%s' under '%s'", name, index->name);
  334. #ifdef STATSD_MULTITHREADED
  335. // avoid the write lock of dictionary_set() for existing metrics
  336. STATSD_METRIC *m = dictionary_get(index->dict, name);
  337. if(!m) m = dictionary_set(index->dict, name, NULL, sizeof(STATSD_METRIC));
  338. #else
  339. // no locks here, go faster
  340. // this will call the dictionary_metric_insert_callback() if an item
  341. // is inserted, otherwise it will return the existing one.
  342. // We used the flag DICT_OPTION_DONT_OVERWRITE_VALUE to support this.
  343. STATSD_METRIC *m = dictionary_set(index->dict, name, NULL, sizeof(STATSD_METRIC));
  344. #endif
  345. index->events++;
  346. return m;
  347. }
  348. // --------------------------------------------------------------------------------------------------------------------
  349. // statsd parsing numbers
  350. static inline NETDATA_DOUBLE statsd_parse_float(const char *v, NETDATA_DOUBLE def) {
  351. NETDATA_DOUBLE value;
  352. if(likely(v && *v)) {
  353. char *e = NULL;
  354. value = str2ndd(v, &e);
  355. if(unlikely(e && *e))
  356. collector_error("STATSD: excess data '%s' after value '%s'", e, v);
  357. }
  358. else
  359. value = def;
  360. return value;
  361. }
  362. static inline NETDATA_DOUBLE statsd_parse_sampling_rate(const char *v) {
  363. NETDATA_DOUBLE sampling_rate = statsd_parse_float(v, 1.0);
  364. if(unlikely(isless(sampling_rate, 0.001))) sampling_rate = 0.001;
  365. if(unlikely(isgreater(sampling_rate, 1.0))) sampling_rate = 1.0;
  366. return sampling_rate;
  367. }
  368. static inline long long statsd_parse_int(const char *v, long long def) {
  369. long long value;
  370. if(likely(v && *v)) {
  371. char *e = NULL;
  372. value = str2ll(v, &e);
  373. if(unlikely(e && *e))
  374. collector_error("STATSD: excess data '%s' after value '%s'", e, v);
  375. }
  376. else
  377. value = def;
  378. return value;
  379. }
  380. // --------------------------------------------------------------------------------------------------------------------
  381. // statsd processors per metric type
  382. static inline void statsd_reset_metric(STATSD_METRIC *m) {
  383. m->reset = 0;
  384. m->count = 0;
  385. }
  // Returns 1 when 'value' is exactly the string "zinit", 0 otherwise
  // (including when 'value' is NULL).
  static inline int value_is_zinit(const char *value) {
      static const char magic[] = "zinit";

      if(!value)
          return 0;

      // sizeof(magic) includes the terminator, so the end of the string is
      // compared too; the loop stops at the first mismatch and never reads
      // past the end of 'value'
      for(size_t i = 0; i < sizeof(magic); i++) {
          if(value[i] != magic[i])
              return 0;
      }

      return 1;
  }
  // Non-zero once the metric has been checked for its usefulness
  // (STATSD_METRIC_OPTION_CHECKED is set).
  #define is_metric_checked(m) ((m)->options & STATSD_METRIC_OPTION_CHECKED)

  // A metric is collected while it has not been checked yet, or when it has
  // been checked and was found useful.
  #define is_metric_useful_for_collection(m) (!is_metric_checked(m) || ((m)->options & STATSD_METRIC_OPTION_USEFUL))
  391. static inline void metric_update_counters_and_obsoletion(STATSD_METRIC *m) {
  392. m->events++;
  393. m->count++;
  394. m->last_collected = now_realtime_sec();
  395. if (m->st && unlikely(rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE))) {
  396. rrdset_isnot_obsolete___safe_from_collector_thread(m->st);
  397. m->options &= ~STATSD_METRIC_OPTION_OBSOLETE;
  398. }
  399. }
  400. static inline void statsd_process_gauge(STATSD_METRIC *m, const char *value, const char *sampling) {
  401. if(!is_metric_useful_for_collection(m)) return;
  402. if(unlikely(!value || !*value)) {
  403. collector_error("STATSD: metric '%s' of type gauge, with empty value is ignored.", m->name);
  404. return;
  405. }
  406. if(unlikely(m->reset)) {
  407. // no need to reset anything specific for gauges
  408. statsd_reset_metric(m);
  409. }
  410. if(unlikely(value_is_zinit(value))) {
  411. // magic loading of metric, without affecting anything
  412. }
  413. else {
  414. if (unlikely(*value == '+' || *value == '-'))
  415. m->gauge.value += statsd_parse_float(value, 1.0) / statsd_parse_sampling_rate(sampling);
  416. else
  417. m->gauge.value = statsd_parse_float(value, 1.0);
  418. metric_update_counters_and_obsoletion(m);
  419. }
  420. }
  421. static inline void statsd_process_counter_or_meter(STATSD_METRIC *m, const char *value, const char *sampling) {
  422. if(!is_metric_useful_for_collection(m)) return;
  423. // we accept empty values for counters
  424. if(unlikely(m->reset)) statsd_reset_metric(m);
  425. if(unlikely(value_is_zinit(value))) {
  426. // magic loading of metric, without affecting anything
  427. }
  428. else {
  429. m->counter.value += llrintndd((NETDATA_DOUBLE) statsd_parse_int(value, 1) / statsd_parse_sampling_rate(sampling));
  430. metric_update_counters_and_obsoletion(m);
  431. }
  432. }
  // Counters and meters are processed by the same function.
  #define statsd_process_counter(m, value, sampling) statsd_process_counter_or_meter(m, value, sampling)
  #define statsd_process_meter(m, value, sampling) statsd_process_counter_or_meter(m, value, sampling)
  435. static inline void statsd_process_histogram_or_timer(STATSD_METRIC *m, const char *value, const char *sampling, const char *type) {
  436. if(!is_metric_useful_for_collection(m)) return;
  437. if(unlikely(!value || !*value)) {
  438. collector_error("STATSD: metric of type %s, with empty value is ignored.", type);
  439. return;
  440. }
  441. if(unlikely(m->reset)) {
  442. m->histogram.ext->used = 0;
  443. statsd_reset_metric(m);
  444. }
  445. if(unlikely(value_is_zinit(value))) {
  446. // magic loading of metric, without affecting anything
  447. }
  448. else {
  449. NETDATA_DOUBLE v = statsd_parse_float(value, 1.0);
  450. NETDATA_DOUBLE sampling_rate = statsd_parse_sampling_rate(sampling);
  451. if(unlikely(isless(sampling_rate, 0.01))) sampling_rate = 0.01;
  452. if(unlikely(isgreater(sampling_rate, 1.0))) sampling_rate = 1.0;
  453. long long samples = llrintndd(1.0 / sampling_rate);
  454. while(samples-- > 0) {
  455. if(unlikely(m->histogram.ext->used == m->histogram.ext->size)) {
  456. netdata_mutex_lock(&m->histogram.ext->mutex);
  457. m->histogram.ext->size += statsd.histogram_increase_step;
  458. m->histogram.ext->values = reallocz(m->histogram.ext->values, sizeof(NETDATA_DOUBLE) * m->histogram.ext->size);
  459. netdata_mutex_unlock(&m->histogram.ext->mutex);
  460. }
  461. m->histogram.ext->values[m->histogram.ext->used++] = v;
  462. }
  463. metric_update_counters_and_obsoletion(m);
  464. }
  465. }
  // Timers and histograms are processed by the same function; only the type
  // name used in its log message differs.
  #define statsd_process_timer(m, value, sampling) statsd_process_histogram_or_timer(m, value, sampling, "timer")
  #define statsd_process_histogram(m, value, sampling) statsd_process_histogram_or_timer(m, value, sampling, "histogram")
  468. static inline void statsd_process_set(STATSD_METRIC *m, const char *value) {
  469. if(!is_metric_useful_for_collection(m)) return;
  470. if(unlikely(!value || !*value)) {
  471. netdata_log_error("STATSD: metric of type set, with empty value is ignored.");
  472. return;
  473. }
  474. if(unlikely(m->reset)) {
  475. if(likely(m->set.dict)) {
  476. dictionary_destroy(m->set.dict);
  477. m->set.dict = NULL;
  478. }
  479. statsd_reset_metric(m);
  480. }
  481. if (unlikely(!m->set.dict))
  482. m->set.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  483. if(unlikely(value_is_zinit(value))) {
  484. // magic loading of metric, without affecting anything
  485. }
  486. else {
  487. #ifdef STATSD_MULTITHREADED
  488. // avoid the write lock to check if something is already there
  489. if(!dictionary_get(m->set.dict, value))
  490. dictionary_set(m->set.dict, value, NULL, 0);
  491. #else
  492. dictionary_set(m->set.dict, value, NULL, 0);
  493. #endif
  494. metric_update_counters_and_obsoletion(m);
  495. }
  496. }
  497. static inline void statsd_process_dictionary(STATSD_METRIC *m, const char *value) {
  498. if(!is_metric_useful_for_collection(m)) return;
  499. if(unlikely(!value || !*value)) {
  500. netdata_log_error("STATSD: metric of type set, with empty value is ignored.");
  501. return;
  502. }
  503. if(unlikely(m->reset))
  504. statsd_reset_metric(m);
  505. if (unlikely(!m->dictionary.dict))
  506. m->dictionary.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  507. if(unlikely(value_is_zinit(value))) {
  508. // magic loading of metric, without affecting anything
  509. }
  510. else {
  511. STATSD_METRIC_DICTIONARY_ITEM *t = (STATSD_METRIC_DICTIONARY_ITEM *)dictionary_get(m->dictionary.dict, value);
  512. if (unlikely(!t)) {
  513. if(!t && dictionary_entries(m->dictionary.dict) >= statsd.dictionary_max_unique)
  514. value = "other";
  515. t = (STATSD_METRIC_DICTIONARY_ITEM *)dictionary_set(m->dictionary.dict, value, NULL, sizeof(STATSD_METRIC_DICTIONARY_ITEM));
  516. }
  517. t->count++;
  518. metric_update_counters_and_obsoletion(m);
  519. }
  520. }
  521. // --------------------------------------------------------------------------------------------------------------------
  522. // statsd parsing
  523. static inline const char *statsd_parse_skip_up_to(const char *s, char d1, char d2, char d3) {
  524. char c;
  525. for(c = *s; c && c != d1 && c != d2 && c != d3 && c != '\r' && c != '\n'; c = *++s) ;
  526. return s;
  527. }
  528. const char *statsd_parse_skip_spaces(const char *s) {
  529. char c;
  530. for(c = *s; c && ( c == ' ' || c == '\t' || c == '\r' || c == '\n' ); c = *++s) ;
  531. return s;
  532. }
  533. static inline const char *statsd_parse_field_trim(const char *start, char *end) {
  534. if(unlikely(!start || !*start)) {
  535. start = end;
  536. return start;
  537. }
  538. while(start <= end && (*start == ' ' || *start == '\t'))
  539. start++;
  540. *end = '\0';
  541. end--;
  542. while(end >= start && (*end == ' ' || *end == '\t'))
  543. *end-- = '\0';
  544. return start;
  545. }
  546. static void statsd_process_metric(const char *name, const char *value, const char *type, const char *sampling, const char *tags) {
  547. netdata_log_debug(D_STATSD, "STATSD: raw metric '%s', value '%s', type '%s', sampling '%s', tags '%s'", name?name:"(null)", value?value:"(null)", type?type:"(null)", sampling?sampling:"(null)", tags?tags:"(null)");
  548. if(unlikely(!name || !*name)) return;
  549. if(unlikely(!type || !*type)) type = "m";
  550. STATSD_METRIC *m = NULL;
  551. char t0 = type[0], t1 = type[1];
  552. if(unlikely(t0 == 'g' && t1 == '\0')) {
  553. statsd_process_gauge(
  554. m = statsd_find_or_add_metric(&statsd.gauges, name),
  555. value, sampling);
  556. }
  557. else if(unlikely((t0 == 'c' || t0 == 'C') && t1 == '\0')) {
  558. // etsy/statsd uses 'c'
  559. // brubeck uses 'C'
  560. statsd_process_counter(
  561. m = statsd_find_or_add_metric(&statsd.counters, name),
  562. value, sampling);
  563. }
  564. else if(unlikely(t0 == 'm' && t1 == '\0')) {
  565. statsd_process_meter(
  566. m = statsd_find_or_add_metric(&statsd.meters, name),
  567. value, sampling);
  568. }
  569. else if(unlikely(t0 == 'h' && t1 == '\0')) {
  570. statsd_process_histogram(
  571. m = statsd_find_or_add_metric(&statsd.histograms, name),
  572. value, sampling);
  573. }
  574. else if(unlikely(t0 == 's' && t1 == '\0')) {
  575. statsd_process_set(
  576. m = statsd_find_or_add_metric(&statsd.sets, name),
  577. value);
  578. }
  579. else if(unlikely(t0 == 'd' && t1 == '\0')) {
  580. statsd_process_dictionary(
  581. m = statsd_find_or_add_metric(&statsd.dictionaries, name),
  582. value);
  583. }
  584. else if(unlikely(t0 == 'm' && t1 == 's' && type[2] == '\0')) {
  585. statsd_process_timer(
  586. m = statsd_find_or_add_metric(&statsd.timers, name),
  587. value, sampling);
  588. }
  589. else {
  590. statsd.unknown_types++;
  591. netdata_log_error("STATSD: metric '%s' with value '%s' is sent with unknown metric type '%s'", name, value?value:"", type);
  592. }
  593. if(m && tags && *tags) {
  594. const char *s = tags;
  595. while(*s) {
  596. const char *tagkey = NULL, *tagvalue = NULL;
  597. char *tagkey_end = NULL, *tagvalue_end = NULL;
  598. s = tagkey_end = (char *)statsd_parse_skip_up_to(tagkey = s, ':', '=', ',');
  599. if(tagkey == tagkey_end) {
  600. if (*s) {
  601. s++;
  602. s = statsd_parse_skip_spaces(s);
  603. }
  604. continue;
  605. }
  606. if(likely(*s == ':' || *s == '='))
  607. s = tagvalue_end = (char *) statsd_parse_skip_up_to(tagvalue = ++s, ',', '\0', '\0');
  608. if(*s == ',') s++;
  609. statsd_parse_field_trim(tagkey, tagkey_end);
  610. statsd_parse_field_trim(tagvalue, tagvalue_end);
  611. if(tagkey && *tagkey && tagvalue && *tagvalue) {
  612. if (strcmp(tagkey, "units") == 0 && (!m->units || strcmp(m->units, tagvalue) != 0)) {
  613. m->units = strdupz(tagvalue);
  614. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  615. }
  616. if (strcmp(tagkey, "name") == 0 && (!m->dimname || strcmp(m->dimname, tagvalue) != 0)) {
  617. m->dimname = strdupz(tagvalue);
  618. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  619. }
  620. if (strcmp(tagkey, "family") == 0 && (!m->family || strcmp(m->family, tagvalue) != 0)) {
  621. m->family = strdupz(tagvalue);
  622. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  623. }
  624. }
  625. }
  626. }
  627. }
// Parse a buffer of statsd lines and process every metric found in it.
//
// buffer           - the received bytes; it is modified in place and must have
//                    room for one byte more than `size` (buffer[size] is written)
// size             - number of valid bytes in buffer
// require_newlines - when non-zero, a last line that is not terminated by '\n'
//                    is not processed; it is moved to the beginning of buffer
//                    instead
//
// Each line has the form name[:|=]value|type followed by optional fields
// starting with '|', '@' (sampling rate) or '#' (tags).
//
// Returns the number of bytes of the unprocessed trailing line now at the
// beginning of buffer, or 0 when everything was consumed.
static inline size_t statsd_process(char *buffer, size_t size, int require_newlines) {
    buffer[size] = '\0';
    netdata_log_debug(D_STATSD, "RECEIVED: %zu bytes: '%s'", size, buffer);

    const char *s = buffer;
    while(*s) {
        // start and end (delimiter position) of every field of the current line
        const char *name = NULL, *value = NULL, *type = NULL, *sampling = NULL, *tags = NULL;
        char *name_end = NULL, *value_end = NULL, *type_end = NULL, *sampling_end = NULL, *tags_end = NULL;

        s = name_end = (char *)statsd_parse_skip_up_to(name = s, ':', '=', '|');
        if(name == name_end) {
            // empty name: step over the offending character and retry
            if (*s) {
                s++;
                s = statsd_parse_skip_spaces(s);
            }
            continue;
        }

        if(likely(*s == ':' || *s == '='))
            s = value_end = (char *) statsd_parse_skip_up_to(value = ++s, '|', '@', '#');

        if(likely(*s == '|'))
            s = type_end = (char *) statsd_parse_skip_up_to(type = ++s, '|', '@', '#');

        while(*s == '|' || *s == '@' || *s == '#') {
            // parse all the fields that may be appended

            if ((*s == '|' && s[1] == '@') || *s == '@') {
                s = sampling_end = (char *)statsd_parse_skip_up_to(sampling = ++s, '|', '@', '#');
                if (*sampling == '@') sampling++;
            }
            else if ((*s == '|' && s[1] == '#') || *s == '#') {
                s = tags_end = (char *)statsd_parse_skip_up_to(tags = ++s, '|', '@', '#');
                if (*tags == '#') tags++;
            }
            else {
                // unknown field, skip it
                s = (char *)statsd_parse_skip_up_to(++s, '|', '@', '#');
            }
        }

        // skip everything until the end of the line
        while(*s && *s != '\n') s++;

        if(unlikely(require_newlines && *s != '\n' && s > buffer)) {
            // move the remaining data to the beginning
            // (the incomplete line starts at `name`; nothing of it has been modified yet)
            size -= (name - buffer);
            memmove(buffer, name, size);
            return size;
        }
        else
            s = statsd_parse_skip_spaces(s);

        // the trimming NUL-terminates each field in place, at its delimiter
        statsd_process_metric(
                  statsd_parse_field_trim(name, name_end)
                , statsd_parse_field_trim(value, value_end)
                , statsd_parse_field_trim(type, type_end)
                , statsd_parse_field_trim(sampling, sampling_end)
                , statsd_parse_field_trim(tags, tags_end)
        );
    }

    return 0;
}
  682. // --------------------------------------------------------------------------------------------------------------------
  683. // statsd pollfd interface
// sizes, in bytes, of the receive buffers allocated per TCP client and per UDP message
#define STATSD_TCP_BUFFER_SIZE 65536 // minimize tcp reads
#define STATSD_UDP_BUFFER_SIZE 9000 // this should be up to MTU
// tag stored in the per-socket data, identifying which of the two structures below it is
typedef enum {
    STATSD_SOCKET_DATA_TYPE_TCP, // struct statsd_tcp
    STATSD_SOCKET_DATA_TYPE_UDP  // struct statsd_udp
} STATSD_SOCKET_DATA_TYPE;
// per-connection state of a TCP client, allocated by statsd_add_callback()
struct statsd_tcp {
    STATSD_SOCKET_DATA_TYPE type; // STATSD_SOCKET_DATA_TYPE_TCP
    size_t size;                  // usable bytes of buffer (one less than allocated, leaving room for a NUL)
    size_t len;                   // bytes currently held in buffer, waiting to be processed
    char buffer[];                // received data; allocated together with the structure
};
// per-thread state for receiving UDP datagrams, allocated by statsd_collector_thread()
// NOTE(review): unlike struct statsd_tcp, `type` is not the first member here - confirm that
// no code inspects the tag of UDP data through a struct statsd_tcp pointer.
struct statsd_udp {
    struct collection_thread_status *status; // status of the owning collector thread
    STATSD_SOCKET_DATA_TYPE type;            // expected to be STATSD_SOCKET_DATA_TYPE_UDP
#ifdef HAVE_RECVMMSG
    size_t size;                             // number of entries in iovecs and msgs
    struct iovec *iovecs;                    // one receive buffer per message
    struct mmsghdr *msgs;                    // message headers passed to recvmmsg()
#else
    int *running;
    char buffer[STATSD_UDP_BUFFER_SIZE];     // single receive buffer used with recv()
#endif
};
  708. // new TCP client connected
  709. static void *statsd_add_callback(POLLINFO *pi, short int *events, void *data) {
  710. (void)pi;
  711. (void)data;
  712. worker_is_busy(WORKER_JOB_TYPE_TCP_CONNECTED);
  713. *events = POLLIN;
  714. struct statsd_tcp *t = (struct statsd_tcp *)callocz(sizeof(struct statsd_tcp) + STATSD_TCP_BUFFER_SIZE, 1);
  715. t->type = STATSD_SOCKET_DATA_TYPE_TCP;
  716. t->size = STATSD_TCP_BUFFER_SIZE - 1;
  717. statsd.tcp_socket_connects++;
  718. statsd.tcp_socket_connected++;
  719. worker_is_idle();
  720. return t;
  721. }
  722. // TCP client disconnected
  723. static void statsd_del_callback(POLLINFO *pi) {
  724. worker_is_busy(WORKER_JOB_TYPE_TCP_DISCONNECTED);
  725. struct statsd_tcp *t = pi->data;
  726. if(likely(t)) {
  727. if(t->type == STATSD_SOCKET_DATA_TYPE_TCP) {
  728. if(t->len != 0) {
  729. statsd.socket_errors++;
  730. netdata_log_error("STATSD: client is probably sending unterminated metrics. Closed socket left with '%s'. Trying to process it.", t->buffer);
  731. statsd_process(t->buffer, t->len, 0);
  732. }
  733. statsd.tcp_socket_disconnects++;
  734. statsd.tcp_socket_connected--;
  735. }
  736. else
  737. netdata_log_error("STATSD: internal error: received socket data type is %d, but expected %d", (int)t->type, (int)STATSD_SOCKET_DATA_TYPE_TCP);
  738. freez(t);
  739. }
  740. worker_is_idle();
  741. }
  742. // Receive data
  743. static int statsd_rcv_callback(POLLINFO *pi, short int *events) {
  744. int retval = -1;
  745. worker_is_busy(WORKER_JOB_TYPE_RCV_DATA);
  746. *events = POLLIN;
  747. int fd = pi->fd;
  748. switch(pi->socktype) {
  749. case SOCK_STREAM: {
  750. struct statsd_tcp *d = (struct statsd_tcp *)pi->data;
  751. if(unlikely(!d)) {
  752. netdata_log_error("STATSD: internal error: expected TCP data pointer is NULL");
  753. statsd.socket_errors++;
  754. retval = -1;
  755. goto cleanup;
  756. }
  757. #ifdef NETDATA_INTERNAL_CHECKS
  758. if(unlikely(d->type != STATSD_SOCKET_DATA_TYPE_TCP)) {
  759. netdata_log_error("STATSD: internal error: socket data type should be %d, but it is %d", (int)STATSD_SOCKET_DATA_TYPE_TCP, (int)d->type);
  760. statsd.socket_errors++;
  761. retval = -1;
  762. goto cleanup;
  763. }
  764. #endif
  765. int ret = 0;
  766. ssize_t rc;
  767. do {
  768. rc = recv(fd, &d->buffer[d->len], d->size - d->len, MSG_DONTWAIT);
  769. if (rc < 0) {
  770. // read failed
  771. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  772. netdata_log_error("STATSD: recv() on TCP socket %d failed.", fd);
  773. statsd.socket_errors++;
  774. ret = -1;
  775. }
  776. }
  777. else if (!rc) {
  778. // connection closed
  779. netdata_log_debug(D_STATSD, "STATSD: client disconnected.");
  780. ret = -1;
  781. }
  782. else {
  783. // data received
  784. d->len += rc;
  785. statsd.tcp_socket_reads++;
  786. statsd.tcp_bytes_read += rc;
  787. }
  788. if(likely(d->len > 0)) {
  789. statsd.tcp_packets_received++;
  790. d->len = statsd_process(d->buffer, d->len, 1);
  791. }
  792. if(unlikely(ret == -1)) {
  793. retval = -1;
  794. goto cleanup;
  795. }
  796. } while (rc != -1);
  797. break;
  798. }
  799. case SOCK_DGRAM: {
  800. struct statsd_udp *d = (struct statsd_udp *)pi->data;
  801. if(unlikely(!d)) {
  802. netdata_log_error("STATSD: internal error: expected UDP data pointer is NULL");
  803. statsd.socket_errors++;
  804. retval = -1;
  805. goto cleanup;
  806. }
  807. #ifdef NETDATA_INTERNAL_CHECKS
  808. if(unlikely(d->type != STATSD_SOCKET_DATA_TYPE_UDP)) {
  809. netdata_log_error("STATSD: internal error: socket data should be %d, but it is %d", (int)d->type, (int)STATSD_SOCKET_DATA_TYPE_UDP);
  810. statsd.socket_errors++;
  811. retval = -1;
  812. goto cleanup;
  813. }
  814. #endif
  815. #ifdef HAVE_RECVMMSG
  816. ssize_t rc;
  817. do {
  818. rc = recvmmsg(fd, d->msgs, (unsigned int)d->size, MSG_DONTWAIT, NULL);
  819. if (rc < 0) {
  820. // read failed
  821. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  822. netdata_log_error("STATSD: recvmmsg() on UDP socket %d failed.", fd);
  823. statsd.socket_errors++;
  824. retval = -1;
  825. goto cleanup;
  826. }
  827. } else if (rc) {
  828. // data received
  829. statsd.udp_socket_reads++;
  830. statsd.udp_packets_received += rc;
  831. size_t i;
  832. for (i = 0; i < (size_t)rc; ++i) {
  833. size_t len = (size_t)d->msgs[i].msg_len;
  834. statsd.udp_bytes_read += len;
  835. statsd_process(d->msgs[i].msg_hdr.msg_iov->iov_base, len, 0);
  836. }
  837. }
  838. } while (rc != -1);
  839. #else // !HAVE_RECVMMSG
  840. ssize_t rc;
  841. do {
  842. rc = recv(fd, d->buffer, STATSD_UDP_BUFFER_SIZE - 1, MSG_DONTWAIT);
  843. if (rc < 0) {
  844. // read failed
  845. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  846. netdata_log_error("STATSD: recv() on UDP socket %d failed.", fd);
  847. statsd.socket_errors++;
  848. retval = -1;
  849. goto cleanup;
  850. }
  851. } else if (rc) {
  852. // data received
  853. statsd.udp_socket_reads++;
  854. statsd.udp_packets_received++;
  855. statsd.udp_bytes_read += rc;
  856. statsd_process(d->buffer, (size_t) rc, 0);
  857. }
  858. } while (rc != -1);
  859. #endif
  860. break;
  861. }
  862. default: {
  863. netdata_log_error("STATSD: internal error: unknown socktype %d on socket %d", pi->socktype, fd);
  864. statsd.socket_errors++;
  865. retval = -1;
  866. goto cleanup;
  867. }
  868. }
  869. retval = 0;
  870. cleanup:
  871. worker_is_idle();
  872. return retval;
  873. }
  874. static int statsd_snd_callback(POLLINFO *pi, short int *events) {
  875. (void)pi;
  876. (void)events;
  877. worker_is_busy(WORKER_JOB_TYPE_SND_DATA);
  878. netdata_log_error("STATSD: snd_callback() called, but we never requested to send data to statsd clients.");
  879. worker_is_idle();
  880. return -1;
  881. }
  882. // --------------------------------------------------------------------------------------------------------------------
  883. // statsd child thread to collect metrics from network
  884. void statsd_collector_thread_cleanup(void *data) {
  885. struct statsd_udp *d = data;
  886. spinlock_lock(&d->status->spinlock);
  887. d->status->running = false;
  888. spinlock_unlock(&d->status->spinlock);
  889. collector_info("cleaning up...");
  890. #ifdef HAVE_RECVMMSG
  891. size_t i;
  892. for (i = 0; i < d->size; i++)
  893. freez(d->iovecs[i].iov_base);
  894. freez(d->iovecs);
  895. freez(d->msgs);
  896. #endif
  897. freez(d);
  898. worker_unregister();
  899. }
  900. static bool statsd_should_stop(void) {
  901. return !service_running(SERVICE_COLLECTORS);
  902. }
  903. void *statsd_collector_thread(void *ptr) {
  904. struct collection_thread_status *status = ptr;
  905. spinlock_lock(&status->spinlock);
  906. status->running = true;
  907. spinlock_unlock(&status->spinlock);
  908. worker_register("STATSD");
  909. worker_register_job_name(WORKER_JOB_TYPE_TCP_CONNECTED, "tcp connect");
  910. worker_register_job_name(WORKER_JOB_TYPE_TCP_DISCONNECTED, "tcp disconnect");
  911. worker_register_job_name(WORKER_JOB_TYPE_RCV_DATA, "receive");
  912. worker_register_job_name(WORKER_JOB_TYPE_SND_DATA, "send");
  913. collector_info("STATSD collector thread started with taskid %d", gettid());
  914. struct statsd_udp *d = callocz(sizeof(struct statsd_udp), 1);
  915. d->status = status;
  916. netdata_thread_cleanup_push(statsd_collector_thread_cleanup, d);
  917. #ifdef HAVE_RECVMMSG
  918. d->type = STATSD_SOCKET_DATA_TYPE_UDP;
  919. d->size = statsd.recvmmsg_size;
  920. d->iovecs = callocz(sizeof(struct iovec), d->size);
  921. d->msgs = callocz(sizeof(struct mmsghdr), d->size);
  922. size_t i;
  923. for (i = 0; i < d->size; i++) {
  924. d->iovecs[i].iov_base = mallocz(STATSD_UDP_BUFFER_SIZE);
  925. d->iovecs[i].iov_len = STATSD_UDP_BUFFER_SIZE - 1;
  926. d->msgs[i].msg_hdr.msg_iov = &d->iovecs[i];
  927. d->msgs[i].msg_hdr.msg_iovlen = 1;
  928. }
  929. #endif
  930. poll_events(&statsd.sockets
  931. , statsd_add_callback
  932. , statsd_del_callback
  933. , statsd_rcv_callback
  934. , statsd_snd_callback
  935. , NULL
  936. , statsd_should_stop
  937. , NULL // No access control pattern
  938. , 0 // No dns lookups for access control pattern
  939. , (void *)d
  940. , 0 // tcp request timeout, 0 = disabled
  941. , statsd.tcp_idle_timeout // tcp idle timeout, 0 = disabled
  942. , statsd.update_every * 1000
  943. , ptr // timer_data
  944. , status->max_sockets
  945. );
  946. netdata_thread_cleanup_pop(1);
  947. return NULL;
  948. }
  949. // --------------------------------------------------------------------------------------------------------------------
  950. // statsd applications configuration files parsing
// size passed to fgets() when reading the lines of a statsd application
// configuration file; the line buffer is allocated with one byte more
#define STATSD_CONF_LINE_MAX 8192
  952. static STATSD_APP_CHART_DIM_VALUE_TYPE string2valuetype(const char *type, size_t line, const char *filename) {
  953. if(!type || !*type) type = "last";
  954. if(!strcmp(type, "events")) return STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS;
  955. else if(!strcmp(type, "last")) return STATSD_APP_CHART_DIM_VALUE_TYPE_LAST;
  956. else if(!strcmp(type, "min")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MIN;
  957. else if(!strcmp(type, "max")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MAX;
  958. else if(!strcmp(type, "sum")) return STATSD_APP_CHART_DIM_VALUE_TYPE_SUM;
  959. else if(!strcmp(type, "average")) return STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE;
  960. else if(!strcmp(type, "median")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN;
  961. else if(!strcmp(type, "stddev")) return STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV;
  962. else if(!strcmp(type, "percentile")) return STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE;
  963. netdata_log_error("STATSD: invalid type '%s' at line %zu of file '%s'. Using 'last'.", type, line, filename);
  964. return STATSD_APP_CHART_DIM_VALUE_TYPE_LAST;
  965. }
  966. static const char *valuetype2string(STATSD_APP_CHART_DIM_VALUE_TYPE type) {
  967. switch(type) {
  968. case STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS: return "events";
  969. case STATSD_APP_CHART_DIM_VALUE_TYPE_LAST: return "last";
  970. case STATSD_APP_CHART_DIM_VALUE_TYPE_MIN: return "min";
  971. case STATSD_APP_CHART_DIM_VALUE_TYPE_MAX: return "max";
  972. case STATSD_APP_CHART_DIM_VALUE_TYPE_SUM: return "sum";
  973. case STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE: return "average";
  974. case STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN: return "median";
  975. case STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV: return "stddev";
  976. case STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE: return "percentile";
  977. }
  978. return "unknown";
  979. }
  980. static STATSD_APP_CHART_DIM *add_dimension_to_app_chart(
  981. STATSD_APP *app __maybe_unused
  982. , STATSD_APP_CHART *chart
  983. , const char *metric_name
  984. , const char *dim_name
  985. , collected_number multiplier
  986. , collected_number divisor
  987. , RRDDIM_FLAGS flags
  988. , RRDDIM_OPTIONS options
  989. , STATSD_APP_CHART_DIM_VALUE_TYPE value_type
  990. ) {
  991. STATSD_APP_CHART_DIM *dim = callocz(sizeof(STATSD_APP_CHART_DIM), 1);
  992. dim->metric = strdupz(metric_name);
  993. dim->metric_hash = simple_hash(dim->metric);
  994. dim->name = strdupz((dim_name)?dim_name:"");
  995. dim->multiplier = multiplier;
  996. dim->divisor = divisor;
  997. dim->value_type = value_type;
  998. dim->flags = flags;
  999. dim->options = options;
  1000. if(!dim->multiplier)
  1001. dim->multiplier = 1;
  1002. if(!dim->divisor)
  1003. dim->divisor = 1;
  1004. // append it to the list of dimension
  1005. STATSD_APP_CHART_DIM *tdim;
  1006. for(tdim = chart->dimensions; tdim && tdim->next ; tdim = tdim->next) ;
  1007. if(!tdim) {
  1008. dim->next = chart->dimensions;
  1009. chart->dimensions = dim;
  1010. }
  1011. else {
  1012. dim->next = tdim->next;
  1013. tdim->next = dim;
  1014. }
  1015. chart->dimensions_count++;
  1016. netdata_log_debug(D_STATSD, "Added dimension '%s' to chart '%s' of app '%s', for metric '%s', with type %u, multiplier %d, divisor %d",
  1017. dim->name, chart->id, app->name, dim->metric, dim->value_type, dim->multiplier, dim->divisor);
  1018. return dim;
  1019. }
  1020. static int statsd_readfile(const char *filename, STATSD_APP *app, STATSD_APP_CHART *chart, DICTIONARY *dict) {
  1021. netdata_log_debug(D_STATSD, "STATSD configuration reading file '%s'", filename);
  1022. char *buffer = mallocz(STATSD_CONF_LINE_MAX + 1);
  1023. FILE *fp = fopen(filename, "r");
  1024. if(!fp) {
  1025. netdata_log_error("STATSD: cannot open file '%s'.", filename);
  1026. freez(buffer);
  1027. return -1;
  1028. }
  1029. size_t line = 0;
  1030. char *s;
  1031. while(fgets(buffer, STATSD_CONF_LINE_MAX, fp) != NULL) {
  1032. buffer[STATSD_CONF_LINE_MAX] = '\0';
  1033. line++;
  1034. s = trim(buffer);
  1035. if (!s || *s == '#') {
  1036. netdata_log_debug(D_STATSD, "STATSD: ignoring line %zu of file '%s', it is empty.", line, filename);
  1037. continue;
  1038. }
  1039. netdata_log_debug(D_STATSD, "STATSD: processing line %zu of file '%s': %s", line, filename, buffer);
  1040. if(*s == 'i' && strncmp(s, "include", 7) == 0) {
  1041. s = trim(&s[7]);
  1042. if(s && *s) {
  1043. char *tmp;
  1044. if(*s == '/')
  1045. tmp = strdupz(s);
  1046. else {
  1047. // the file to be included is relative to current file
  1048. // find the directory name from the file we already read
  1049. char *filename2 = strdupz(filename); // copy filename, since dirname() will change it
  1050. char *dir = dirname(filename2); // find the directory part of the filename
  1051. tmp = strdupz_path_subpath(dir, s); // compose the new filename to read;
  1052. freez(filename2); // free the filename we copied
  1053. }
  1054. statsd_readfile(tmp, app, chart, dict);
  1055. freez(tmp);
  1056. }
  1057. else
  1058. netdata_log_error("STATSD: ignoring line %zu of file '%s', include filename is empty", line, filename);
  1059. continue;
  1060. }
  1061. int len = (int) strlen(s);
  1062. if (*s == '[' && s[len - 1] == ']') {
  1063. // new section
  1064. s[len - 1] = '\0';
  1065. s++;
  1066. if (!strcmp(s, "app")) {
  1067. // a new app
  1068. app = callocz(sizeof(STATSD_APP), 1);
  1069. app->name = strdupz("unnamed");
  1070. app->rrd_memory_mode = localhost->rrd_memory_mode;
  1071. app->rrd_history_entries = localhost->rrd_history_entries;
  1072. app->next = statsd.apps;
  1073. statsd.apps = app;
  1074. chart = NULL;
  1075. dict = NULL;
  1076. {
  1077. char lineandfile[FILENAME_MAX + 1];
  1078. snprintfz(lineandfile, FILENAME_MAX, "%zu@%s", line, filename);
  1079. app->source = strdupz(lineandfile);
  1080. }
  1081. }
  1082. else if(app) {
  1083. if(!strcmp(s, "dictionary")) {
  1084. if(!app->dict)
  1085. app->dict = dictionary_create_advanced(DICT_OPTION_SINGLE_THREADED, &dictionary_stats_category_collectors, 0);
  1086. dict = app->dict;
  1087. }
  1088. else {
  1089. dict = NULL;
  1090. // a new chart
  1091. chart = callocz(sizeof(STATSD_APP_CHART), 1);
  1092. netdata_fix_chart_id(s);
  1093. chart->id = strdupz(s);
  1094. chart->name = strdupz(s);
  1095. chart->title = strdupz("Statsd chart");
  1096. chart->context = strdupz(s);
  1097. chart->family = strdupz("overview");
  1098. chart->units = strdupz("value");
  1099. chart->priority = NETDATA_CHART_PRIO_STATSD_PRIVATE;
  1100. chart->chart_type = RRDSET_TYPE_LINE;
  1101. chart->next = app->charts;
  1102. app->charts = chart;
  1103. if (!strncmp(
  1104. filename,
  1105. netdata_configured_stock_config_dir,
  1106. strlen(netdata_configured_stock_config_dir))) {
  1107. char tmpfilename[FILENAME_MAX + 1];
  1108. strncpyz(tmpfilename, filename, FILENAME_MAX);
  1109. chart->module = strdupz(basename(tmpfilename));
  1110. } else {
  1111. chart->module = strdupz("synthetic_chart");
  1112. }
  1113. }
  1114. }
  1115. else
  1116. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s', [app] is not defined.", line, s, filename);
  1117. continue;
  1118. }
  1119. if(!app) {
  1120. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s', it is outside all sections.", line, s, filename);
  1121. continue;
  1122. }
  1123. char *name = s;
  1124. char *value = strchr(s, '=');
  1125. if(!value) {
  1126. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s', there is no = in it.", line, s, filename);
  1127. continue;
  1128. }
  1129. *value = '\0';
  1130. value++;
  1131. name = trim(name);
  1132. value = trim(value);
  1133. if(!name || *name == '#') {
  1134. netdata_log_error("STATSD: ignoring line %zu of file '%s', name is empty.", line, filename);
  1135. continue;
  1136. }
  1137. if(!value) {
  1138. netdata_log_debug(D_CONFIG, "STATSD: ignoring line %zu of file '%s', value is empty.", line, filename);
  1139. continue;
  1140. }
  1141. if(unlikely(dict)) {
  1142. // parse [dictionary] members
  1143. dictionary_set(dict, name, value, strlen(value) + 1);
  1144. }
  1145. else if(!chart) {
  1146. // parse [app] members
  1147. if(!strcmp(name, "name")) {
  1148. freez((void *)app->name);
  1149. netdata_fix_chart_name(value);
  1150. app->name = strdupz(value);
  1151. }
  1152. else if (!strcmp(name, "metrics")) {
  1153. simple_pattern_free(app->metrics);
  1154. app->metrics = simple_pattern_create(value, NULL, SIMPLE_PATTERN_EXACT, true);
  1155. }
  1156. else if (!strcmp(name, "private charts")) {
  1157. if (!strcmp(value, "yes") || !strcmp(value, "on"))
  1158. app->default_options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1159. else
  1160. app->default_options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1161. }
  1162. else if (!strcmp(name, "gaps when not collected")) {
  1163. if (!strcmp(value, "yes") || !strcmp(value, "on"))
  1164. app->default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1165. }
  1166. else if (!strcmp(name, "memory mode")) {
  1167. // this is not supported anymore
  1168. // with the implementation of storage engines, all charts have the same storage engine always
  1169. // app->rrd_memory_mode = rrd_memory_mode_id(value);
  1170. ;
  1171. }
  1172. else if (!strcmp(name, "history")) {
  1173. app->rrd_history_entries = atol(value);
  1174. if (app->rrd_history_entries < 5)
  1175. app->rrd_history_entries = 5;
  1176. }
  1177. else {
  1178. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s'. Unknown keyword for the [app] section.", line, name, filename);
  1179. continue;
  1180. }
  1181. }
  1182. else {
  1183. // parse [chart] members
  1184. if(!strcmp(name, "name")) {
  1185. freez((void *)chart->name);
  1186. netdata_fix_chart_id(value);
  1187. chart->name = strdupz(value);
  1188. }
  1189. else if(!strcmp(name, "title")) {
  1190. freez((void *)chart->title);
  1191. chart->title = strdupz(value);
  1192. }
  1193. else if (!strcmp(name, "family")) {
  1194. freez((void *)chart->family);
  1195. chart->family = strdupz(value);
  1196. }
  1197. else if (!strcmp(name, "context")) {
  1198. freez((void *)chart->context);
  1199. netdata_fix_chart_id(value);
  1200. chart->context = strdupz(value);
  1201. }
  1202. else if (!strcmp(name, "units")) {
  1203. freez((void *)chart->units);
  1204. chart->units = strdupz(value);
  1205. }
  1206. else if (!strcmp(name, "priority")) {
  1207. chart->priority = atol(value);
  1208. }
  1209. else if (!strcmp(name, "type")) {
  1210. chart->chart_type = rrdset_type_id(value);
  1211. }
  1212. else if (!strcmp(name, "dimension")) {
  1213. // metric [name [type [multiplier [divisor]]]]
  1214. char *words[10] = { NULL };
  1215. size_t num_words = quoted_strings_splitter_pluginsd(value, words, 10);
  1216. int pattern = 0;
  1217. size_t i = 0;
  1218. char *metric_name = get_word(words, num_words, i++);
  1219. if(strcmp(metric_name, "pattern") == 0) {
  1220. metric_name = get_word(words, num_words, i++);
  1221. pattern = 1;
  1222. }
  1223. char *dim_name = get_word(words, num_words, i++);
  1224. char *type = get_word(words, num_words, i++);
  1225. char *multiplier = get_word(words, num_words, i++);
  1226. char *divisor = get_word(words, num_words, i++);
  1227. char *opts = get_word(words, num_words, i++);
  1228. RRDDIM_FLAGS flags = RRDDIM_FLAG_NONE;
  1229. RRDDIM_OPTIONS options = RRDDIM_OPTION_NONE;
  1230. if(opts && *opts) {
  1231. if(strstr(opts, "hidden") != NULL) options |= RRDDIM_OPTION_HIDDEN;
  1232. if(strstr(opts, "noreset") != NULL) options |= RRDDIM_OPTION_DONT_DETECT_RESETS_OR_OVERFLOWS;
  1233. if(strstr(opts, "nooverflow") != NULL) options |= RRDDIM_OPTION_DONT_DETECT_RESETS_OR_OVERFLOWS;
  1234. }
  1235. if(!pattern) {
  1236. if(app->dict) {
  1237. if(dim_name && *dim_name) {
  1238. char *n = dictionary_get(app->dict, dim_name);
  1239. if(n) dim_name = n;
  1240. }
  1241. else {
  1242. dim_name = dictionary_get(app->dict, metric_name);
  1243. }
  1244. }
  1245. if(!dim_name || !*dim_name)
  1246. dim_name = metric_name;
  1247. }
  1248. STATSD_APP_CHART_DIM *dim = add_dimension_to_app_chart(
  1249. app
  1250. , chart
  1251. , metric_name
  1252. , dim_name
  1253. , (multiplier && *multiplier)?str2l(multiplier):1
  1254. , (divisor && *divisor)?str2l(divisor):1
  1255. , flags
  1256. ,
  1257. options, string2valuetype(type, line, filename)
  1258. );
  1259. if(pattern)
  1260. dim->metric_pattern = simple_pattern_create(dim->metric, NULL, SIMPLE_PATTERN_EXACT, true);
  1261. }
  1262. else {
  1263. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s'. Unknown keyword for the [%s] section.", line, name, filename, chart->id);
  1264. continue;
  1265. }
  1266. }
  1267. }
  1268. freez(buffer);
  1269. fclose(fp);
  1270. return 0;
  1271. }
  1272. static int statsd_file_callback(const char *filename, void *data) {
  1273. (void)data;
  1274. return statsd_readfile(filename, NULL, NULL, NULL);
  1275. }
  1276. static inline void statsd_readdir(const char *user_path, const char *stock_path, const char *subpath) {
  1277. recursive_config_double_dir_load(user_path, stock_path, subpath, statsd_file_callback, NULL, 0);
  1278. }
  1279. // --------------------------------------------------------------------------------------------------------------------
  1280. // send metrics to netdata - in private charts - called from the main thread
  1281. // extract chart type and chart id from metric name
  1282. static inline void statsd_get_metric_type_and_id(STATSD_METRIC *m, char *type, char *id, char *context, const char *metrictype, size_t len) {
  1283. // The full chart type.id looks like this:
  1284. // ${STATSD_CHART_PREFIX} + "_" + ${METRIC_NAME} + "_" + ${METRIC_TYPE}
  1285. //
  1286. // where:
  1287. // STATSD_CHART_PREFIX = "statsd" as defined above
  1288. // METRIC_NAME = whatever the user gave to statsd
  1289. // METRIC_TYPE = "gauge", "counter", "meter", "timer", "histogram", "set", "dictionary"
  1290. // for chart type, we want:
  1291. // ${STATSD_CHART_PREFIX} + "_" + the first word of ${METRIC_NAME}
  1292. // find the first word of ${METRIC_NAME}
  1293. char firstword[len + 1], *s = "";
  1294. strncpyz(firstword, m->name, len);
  1295. for (s = firstword; *s ; s++) {
  1296. if (unlikely(*s == '.' || *s == '_')) {
  1297. *s = '\0';
  1298. s++;
  1299. break;
  1300. }
  1301. }
  1302. // firstword has the first word of ${METRIC_NAME}
  1303. // s has the remaining, if any
  1304. // create the chart type:
  1305. snprintfz(type, len, STATSD_CHART_PREFIX "_%s", firstword);
  1306. // for chart id, we want:
  1307. // the remaining of the words of ${METRIC_NAME} + "_" + ${METRIC_TYPE}
  1308. // or the ${METRIC_NAME} has no remaining words, the ${METRIC_TYPE} alone
  1309. if(*s)
  1310. snprintfz(id, len, "%s_%s", s, metrictype);
  1311. else
  1312. snprintfz(id, len, "%s", metrictype);
  1313. // for the context, we want the full of both the above, separated with a dot (type.id):
  1314. snprintfz(context, RRD_ID_LENGTH_MAX, "%s.%s", type, id);
  1315. // make sure they don't have illegal characters
  1316. netdata_fix_chart_id(type);
  1317. netdata_fix_chart_id(id);
  1318. netdata_fix_chart_id(context);
  1319. }
  1320. static inline RRDSET *statsd_private_rrdset_create(
  1321. STATSD_METRIC *m __maybe_unused
  1322. , const char *type
  1323. , const char *id
  1324. , const char *name
  1325. , const char *family
  1326. , const char *context
  1327. , const char *title
  1328. , const char *units
  1329. , long priority
  1330. , int update_every
  1331. , RRDSET_TYPE chart_type
  1332. ) {
  1333. if(!m->st)
  1334. statsd.private_charts++;
  1335. RRDSET *st = rrdset_create_custom(
  1336. localhost // host
  1337. , type // type
  1338. , id // id
  1339. , name // name
  1340. , family // family
  1341. , context // context
  1342. , title // title
  1343. , units // units
  1344. , PLUGIN_STATSD_NAME // plugin
  1345. , "private_chart" // module
  1346. , priority // priority
  1347. , update_every // update every
  1348. , chart_type // chart type
  1349. , default_rrd_memory_mode // memory mode
  1350. , default_rrd_history_entries // history
  1351. );
  1352. rrdset_flag_set(st, RRDSET_FLAG_STORE_FIRST);
  1353. if(statsd.private_charts_hidden)
  1354. rrdset_flag_set(st, RRDSET_FLAG_HIDDEN);
  1355. // rrdset_flag_set(st, RRDSET_FLAG_DEBUG);
  1356. return st;
  1357. }
  1358. static inline void statsd_private_chart_gauge(STATSD_METRIC *m) {
  1359. netdata_log_debug(D_STATSD, "updating private chart for gauge metric '%s'", m->name);
  1360. if(m->st && unlikely(rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE)))
  1361. return;
  1362. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1363. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1364. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1365. statsd_get_metric_type_and_id(m, type, id, context, "gauge", RRD_ID_LENGTH_MAX);
  1366. char title[RRD_ID_LENGTH_MAX + 1];
  1367. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for gauge %s", m->name);
  1368. m->st = statsd_private_rrdset_create(
  1369. m
  1370. , type
  1371. , id
  1372. , NULL // name
  1373. , m->family?m->family:"gauges" // family (submenu)
  1374. , context // context
  1375. , title // title
  1376. , m->units?m->units:"value" // units
  1377. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1378. , statsd.update_every
  1379. , RRDSET_TYPE_LINE
  1380. );
  1381. m->rd_value = rrddim_add(m->st, "gauge", m->dimname?m->dimname:NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1382. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1383. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1384. }
  1385. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1386. if(m->rd_count)
  1387. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1388. rrdset_done(m->st);
  1389. }
  1390. static inline void statsd_private_chart_counter_or_meter(STATSD_METRIC *m, const char *dim, const char *family) {
  1391. netdata_log_debug(D_STATSD, "updating private chart for %s metric '%s'", dim, m->name);
  1392. if(m->st && unlikely(rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE)))
  1393. return;
  1394. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1395. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1396. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1397. statsd_get_metric_type_and_id(m, type, id, context, dim, RRD_ID_LENGTH_MAX);
  1398. char title[RRD_ID_LENGTH_MAX + 1];
  1399. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for %s %s", dim, m->name);
  1400. m->st = statsd_private_rrdset_create(
  1401. m
  1402. , type
  1403. , id
  1404. , NULL // name
  1405. , m->family?m->family:family // family (submenu)
  1406. , context // context
  1407. , title // title
  1408. , m->units?m->units:"events/s" // units
  1409. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1410. , statsd.update_every
  1411. , RRDSET_TYPE_AREA
  1412. );
  1413. m->rd_value = rrddim_add(m->st, dim, m->dimname?m->dimname:NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1414. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1415. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1416. }
  1417. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1418. if(m->rd_count)
  1419. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1420. rrdset_done(m->st);
  1421. }
  1422. static inline void statsd_private_chart_set(STATSD_METRIC *m) {
  1423. netdata_log_debug(D_STATSD, "updating private chart for set metric '%s'", m->name);
  1424. if(m->st && unlikely(rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE)))
  1425. return;
  1426. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1427. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1428. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1429. statsd_get_metric_type_and_id(m, type, id, context, "set", RRD_ID_LENGTH_MAX);
  1430. char title[RRD_ID_LENGTH_MAX + 1];
  1431. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for set %s", m->name);
  1432. m->st = statsd_private_rrdset_create(
  1433. m
  1434. , type
  1435. , id
  1436. , NULL // name
  1437. , m->family?m->family:"sets" // family (submenu)
  1438. , context // context
  1439. , title // title
  1440. , m->units?m->units:"entries" // units
  1441. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1442. , statsd.update_every
  1443. , RRDSET_TYPE_LINE
  1444. );
  1445. m->rd_value = rrddim_add(m->st, "set", m->dimname?m->dimname:"unique", 1, 1, RRD_ALGORITHM_ABSOLUTE);
  1446. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1447. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1448. }
  1449. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1450. if(m->rd_count)
  1451. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1452. rrdset_done(m->st);
  1453. }
  1454. static inline void statsd_private_chart_dictionary(STATSD_METRIC *m) {
  1455. netdata_log_debug(D_STATSD, "updating private chart for dictionary metric '%s'", m->name);
  1456. if(m->st && unlikely(rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE)))
  1457. return;
  1458. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1459. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1460. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1461. statsd_get_metric_type_and_id(m, type, id, context, "dictionary", RRD_ID_LENGTH_MAX);
  1462. char title[RRD_ID_LENGTH_MAX + 1];
  1463. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for dictionary %s", m->name);
  1464. m->st = statsd_private_rrdset_create(
  1465. m
  1466. , type
  1467. , id
  1468. , NULL // name
  1469. , m->family?m->family:"dictionaries" // family (submenu)
  1470. , context // context
  1471. , title // title
  1472. , m->units?m->units:"events/s" // units
  1473. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1474. , statsd.update_every
  1475. , RRDSET_TYPE_STACKED
  1476. );
  1477. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1478. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1479. }
  1480. STATSD_METRIC_DICTIONARY_ITEM *t;
  1481. dfe_start_read(m->dictionary.dict, t) {
  1482. if (!t->rd) t->rd = rrddim_add(m->st, t_dfe.name, NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1483. rrddim_set_by_pointer(m->st, t->rd, (collected_number)t->count);
  1484. }
  1485. dfe_done(t);
  1486. if(m->rd_count)
  1487. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1488. rrdset_done(m->st);
  1489. }
  1490. static inline void statsd_private_chart_timer_or_histogram(STATSD_METRIC *m, const char *dim, const char *family, const char *units) {
  1491. netdata_log_debug(D_STATSD, "updating private chart for %s metric '%s'", dim, m->name);
  1492. if(m->st && unlikely(rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE)))
  1493. return;
  1494. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1495. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1496. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1497. statsd_get_metric_type_and_id(m, type, id, context, dim, RRD_ID_LENGTH_MAX);
  1498. char title[RRD_ID_LENGTH_MAX + 1];
  1499. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for %s %s", dim, m->name);
  1500. m->st = statsd_private_rrdset_create(
  1501. m
  1502. , type
  1503. , id
  1504. , NULL // name
  1505. , m->family?m->family:family // family (submenu)
  1506. , context // context
  1507. , title // title
  1508. , m->units?m->units:units // units
  1509. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1510. , statsd.update_every
  1511. , RRDSET_TYPE_AREA
  1512. );
  1513. m->histogram.ext->rd_min = rrddim_add(m->st, "min", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1514. m->histogram.ext->rd_max = rrddim_add(m->st, "max", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1515. m->rd_value = rrddim_add(m->st, "average", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1516. m->histogram.ext->rd_percentile = rrddim_add(m->st, statsd.histogram_percentile_str, NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1517. m->histogram.ext->rd_median = rrddim_add(m->st, "median", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1518. m->histogram.ext->rd_stddev = rrddim_add(m->st, "stddev", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1519. //m->histogram.ext->rd_sum = rrddim_add(m->st, "sum", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1520. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1521. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1522. }
  1523. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_min, m->histogram.ext->last_min);
  1524. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_max, m->histogram.ext->last_max);
  1525. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_percentile, m->histogram.ext->last_percentile);
  1526. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_median, m->histogram.ext->last_median);
  1527. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_stddev, m->histogram.ext->last_stddev);
  1528. //rrddim_set_by_pointer(m->st, m->histogram.ext->rd_sum, m->histogram.ext->last_sum);
  1529. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1530. if(m->rd_count)
  1531. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1532. rrdset_done(m->st);
  1533. }
  1534. // --------------------------------------------------------------------------------------------------------------------
  1535. // statsd flush metrics
  1536. static inline void metric_check_obsoletion(STATSD_METRIC *m) {
  1537. if(statsd.set_obsolete_after &&
  1538. !rrdset_flag_check(m->st, RRDSET_FLAG_OBSOLETE) &&
  1539. m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED &&
  1540. m->last_collected + statsd.set_obsolete_after < now_realtime_sec()) {
  1541. rrdset_is_obsolete___safe_from_collector_thread(m->st);
  1542. m->options |= STATSD_METRIC_OPTION_OBSOLETE;
  1543. }
  1544. }
  1545. static inline void statsd_flush_gauge(STATSD_METRIC *m) {
  1546. netdata_log_debug(D_STATSD, "flushing gauge metric '%s'", m->name);
  1547. int updated = 0;
  1548. if(unlikely(!m->reset && m->count)) {
  1549. m->last = (collected_number) (m->gauge.value * statsd.decimal_detail);
  1550. m->reset = 1;
  1551. updated = 1;
  1552. }
  1553. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1554. statsd_private_chart_gauge(m);
  1555. metric_check_obsoletion(m);
  1556. }
  1557. static inline void statsd_flush_counter_or_meter(STATSD_METRIC *m, const char *dim, const char *family) {
  1558. netdata_log_debug(D_STATSD, "flushing %s metric '%s'", dim, m->name);
  1559. int updated = 0;
  1560. if(unlikely(!m->reset && m->count)) {
  1561. m->last = m->counter.value;
  1562. m->reset = 1;
  1563. updated = 1;
  1564. }
  1565. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1566. statsd_private_chart_counter_or_meter(m, dim, family);
  1567. metric_check_obsoletion(m);
  1568. }
  1569. static inline void statsd_flush_counter(STATSD_METRIC *m) {
  1570. statsd_flush_counter_or_meter(m, "counter", "counters");
  1571. }
  1572. static inline void statsd_flush_meter(STATSD_METRIC *m) {
  1573. statsd_flush_counter_or_meter(m, "meter", "meters");
  1574. }
  1575. static inline void statsd_flush_set(STATSD_METRIC *m) {
  1576. netdata_log_debug(D_STATSD, "flushing set metric '%s'", m->name);
  1577. int updated = 0;
  1578. if(unlikely(!m->reset && m->count)) {
  1579. m->last = (collected_number)dictionary_entries(m->set.dict);
  1580. m->reset = 1;
  1581. updated = 1;
  1582. }
  1583. else {
  1584. m->last = 0;
  1585. }
  1586. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1587. statsd_private_chart_set(m);
  1588. metric_check_obsoletion(m);
  1589. }
  1590. static inline void statsd_flush_dictionary(STATSD_METRIC *m) {
  1591. netdata_log_debug(D_STATSD, "flushing dictionary metric '%s'", m->name);
  1592. int updated = 0;
  1593. if(unlikely(!m->reset && m->count)) {
  1594. m->last = (collected_number)dictionary_entries(m->dictionary.dict);
  1595. m->reset = 1;
  1596. updated = 1;
  1597. }
  1598. else {
  1599. m->last = 0;
  1600. }
  1601. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1602. statsd_private_chart_dictionary(m);
  1603. if(dictionary_entries(m->dictionary.dict) >= statsd.dictionary_max_unique) {
  1604. if(!(m->options & STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED)) {
  1605. m->options |= STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED;
  1606. collector_info(
  1607. "STATSD dictionary '%s' reach max of %zu items - try increasing 'dictionaries max unique dimensions' in netdata.conf",
  1608. m->name,
  1609. dictionary_entries(m->dictionary.dict));
  1610. }
  1611. }
  1612. metric_check_obsoletion(m);
  1613. }
  1614. static inline void statsd_flush_timer_or_histogram(STATSD_METRIC *m, const char *dim, const char *family, const char *units) {
  1615. netdata_log_debug(D_STATSD, "flushing %s metric '%s'", dim, m->name);
  1616. int updated = 0;
  1617. if(unlikely(!m->reset && m->count && m->histogram.ext->used > 0)) {
  1618. netdata_mutex_lock(&m->histogram.ext->mutex);
  1619. size_t len = m->histogram.ext->used;
  1620. NETDATA_DOUBLE *series = m->histogram.ext->values;
  1621. sort_series(series, len);
  1622. m->histogram.ext->last_min = (collected_number)roundndd(series[0] * statsd.decimal_detail);
  1623. m->histogram.ext->last_max = (collected_number)roundndd(series[len - 1] * statsd.decimal_detail);
  1624. m->last = (collected_number)roundndd(average(series, len) * statsd.decimal_detail);
  1625. m->histogram.ext->last_median = (collected_number)roundndd(median_on_sorted_series(series, len) * statsd.decimal_detail);
  1626. m->histogram.ext->last_stddev = (collected_number)roundndd(standard_deviation(series, len) * statsd.decimal_detail);
  1627. m->histogram.ext->last_sum = (collected_number)roundndd(sum(series, len) * statsd.decimal_detail);
  1628. size_t pct_len = (size_t)floor((double)len * statsd.histogram_percentile / 100.0);
  1629. if(pct_len < 1)
  1630. m->histogram.ext->last_percentile = (collected_number)(series[0] * statsd.decimal_detail);
  1631. else
  1632. m->histogram.ext->last_percentile = (collected_number)roundndd(series[pct_len - 1] * statsd.decimal_detail);
  1633. netdata_mutex_unlock(&m->histogram.ext->mutex);
  1634. netdata_log_debug(D_STATSD, "STATSD %s metric %s: min " COLLECTED_NUMBER_FORMAT ", max " COLLECTED_NUMBER_FORMAT ", last " COLLECTED_NUMBER_FORMAT ", pcent " COLLECTED_NUMBER_FORMAT ", median " COLLECTED_NUMBER_FORMAT ", stddev " COLLECTED_NUMBER_FORMAT ", sum " COLLECTED_NUMBER_FORMAT,
  1635. dim, m->name, m->histogram.ext->last_min, m->histogram.ext->last_max, m->last, m->histogram.ext->last_percentile, m->histogram.ext->last_median, m->histogram.ext->last_stddev, m->histogram.ext->last_sum);
  1636. m->histogram.ext->zeroed = 0;
  1637. m->reset = 1;
  1638. updated = 1;
  1639. }
  1640. else if(unlikely(!m->histogram.ext->zeroed)) {
  1641. // reset the metrics
  1642. // if we collected anything, they will be updated below
  1643. // this ensures that we report zeros if nothing is collected
  1644. m->histogram.ext->last_min = 0;
  1645. m->histogram.ext->last_max = 0;
  1646. m->last = 0;
  1647. m->histogram.ext->last_median = 0;
  1648. m->histogram.ext->last_stddev = 0;
  1649. m->histogram.ext->last_sum = 0;
  1650. m->histogram.ext->last_percentile = 0;
  1651. m->histogram.ext->zeroed = 1;
  1652. }
  1653. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1654. statsd_private_chart_timer_or_histogram(m, dim, family, units);
  1655. metric_check_obsoletion(m);
  1656. }
  1657. static inline void statsd_flush_timer(STATSD_METRIC *m) {
  1658. statsd_flush_timer_or_histogram(m, "timer", "timers", "milliseconds");
  1659. }
  1660. static inline void statsd_flush_histogram(STATSD_METRIC *m) {
  1661. statsd_flush_timer_or_histogram(m, "histogram", "histograms", "value");
  1662. }
  1663. static inline RRD_ALGORITHM statsd_algorithm_for_metric(STATSD_METRIC *m) {
  1664. switch(m->type) {
  1665. default:
  1666. case STATSD_METRIC_TYPE_GAUGE:
  1667. case STATSD_METRIC_TYPE_SET:
  1668. case STATSD_METRIC_TYPE_TIMER:
  1669. case STATSD_METRIC_TYPE_HISTOGRAM:
  1670. return RRD_ALGORITHM_ABSOLUTE;
  1671. case STATSD_METRIC_TYPE_METER:
  1672. case STATSD_METRIC_TYPE_COUNTER:
  1673. case STATSD_METRIC_TYPE_DICTIONARY:
  1674. return RRD_ALGORITHM_INCREMENTAL;
  1675. }
  1676. }
  1677. static inline void link_metric_to_app_dimension(STATSD_APP *app, STATSD_METRIC *m, STATSD_APP_CHART *chart, STATSD_APP_CHART_DIM *dim) {
  1678. if(dim->value_type == STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS) {
  1679. dim->value_ptr = &m->events;
  1680. dim->algorithm = RRD_ALGORITHM_INCREMENTAL;
  1681. }
  1682. else if(m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  1683. dim->algorithm = RRD_ALGORITHM_ABSOLUTE;
  1684. dim->divisor *= statsd.decimal_detail;
  1685. switch(dim->value_type) {
  1686. case STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS:
  1687. // will never match - added to avoid warning
  1688. break;
  1689. case STATSD_APP_CHART_DIM_VALUE_TYPE_LAST:
  1690. case STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE:
  1691. dim->value_ptr = &m->last;
  1692. break;
  1693. case STATSD_APP_CHART_DIM_VALUE_TYPE_SUM:
  1694. dim->value_ptr = &m->histogram.ext->last_sum;
  1695. break;
  1696. case STATSD_APP_CHART_DIM_VALUE_TYPE_MIN:
  1697. dim->value_ptr = &m->histogram.ext->last_min;
  1698. break;
  1699. case STATSD_APP_CHART_DIM_VALUE_TYPE_MAX:
  1700. dim->value_ptr = &m->histogram.ext->last_max;
  1701. break;
  1702. case STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN:
  1703. dim->value_ptr = &m->histogram.ext->last_median;
  1704. break;
  1705. case STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE:
  1706. dim->value_ptr = &m->histogram.ext->last_percentile;
  1707. break;
  1708. case STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV:
  1709. dim->value_ptr = &m->histogram.ext->last_stddev;
  1710. break;
  1711. }
  1712. }
  1713. else {
  1714. if (dim->value_type != STATSD_APP_CHART_DIM_VALUE_TYPE_LAST)
  1715. netdata_log_error("STATSD: unsupported value type for dimension '%s' of chart '%s' of app '%s' on metric '%s'", dim->name, chart->id, app->name, m->name);
  1716. dim->value_ptr = &m->last;
  1717. dim->algorithm = statsd_algorithm_for_metric(m);
  1718. if(m->type == STATSD_METRIC_TYPE_GAUGE)
  1719. dim->divisor *= statsd.decimal_detail;
  1720. }
  1721. if(unlikely(chart->st && dim->rd)) {
  1722. rrddim_set_algorithm(chart->st, dim->rd, dim->algorithm);
  1723. rrddim_set_multiplier(chart->st, dim->rd, dim->multiplier);
  1724. rrddim_set_divisor(chart->st, dim->rd, dim->divisor);
  1725. }
  1726. chart->dimensions_linked_count++;
  1727. m->options |= STATSD_METRIC_OPTION_USED_IN_APPS;
  1728. netdata_log_debug(D_STATSD, "metric '%s' of type %u linked with app '%s', chart '%s', dimension '%s', algorithm '%s'", m->name, m->type, app->name, chart->id, dim->name, rrd_algorithm_name(dim->algorithm));
  1729. }
  1730. static inline void check_if_metric_is_for_app(STATSD_INDEX *index, STATSD_METRIC *m) {
  1731. (void)index;
  1732. STATSD_APP *app;
  1733. for(app = statsd.apps; app ;app = app->next) {
  1734. if(unlikely(simple_pattern_matches(app->metrics, m->name))) {
  1735. netdata_log_debug(D_STATSD, "metric '%s' matches app '%s'", m->name, app->name);
  1736. // the metric should get the options from the app
  1737. if(app->default_options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED)
  1738. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1739. else
  1740. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1741. if(app->default_options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED)
  1742. m->options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1743. else
  1744. m->options &= ~STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1745. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED;
  1746. // check if there is a chart in this app, willing to get this metric
  1747. STATSD_APP_CHART *chart;
  1748. for(chart = app->charts; chart; chart = chart->next) {
  1749. STATSD_APP_CHART_DIM *dim;
  1750. for(dim = chart->dimensions; dim ; dim = dim->next) {
  1751. if(unlikely(dim->metric_pattern)) {
  1752. size_t dim_name_len = strlen(dim->name);
  1753. size_t wildcarded_len = dim_name_len + strlen(m->name) + 1;
  1754. char wildcarded[wildcarded_len];
  1755. strcpy(wildcarded, dim->name);
  1756. char *ws = &wildcarded[dim_name_len];
  1757. if(simple_pattern_matches_extract(dim->metric_pattern, m->name, ws, wildcarded_len - dim_name_len) == SP_MATCHED_POSITIVE) {
  1758. char *final_name = NULL;
  1759. if(app->dict) {
  1760. if(likely(*wildcarded)) {
  1761. // use the name of the wildcarded string
  1762. final_name = dictionary_get(app->dict, wildcarded);
  1763. }
  1764. if(unlikely(!final_name)) {
  1765. // use the name of the metric
  1766. final_name = dictionary_get(app->dict, m->name);
  1767. }
  1768. }
  1769. if(unlikely(!final_name))
  1770. final_name = wildcarded;
  1771. add_dimension_to_app_chart(
  1772. app
  1773. , chart
  1774. , m->name
  1775. , final_name
  1776. , dim->multiplier
  1777. , dim->divisor
  1778. , dim->flags
  1779. , dim->options
  1780. , dim->value_type
  1781. );
  1782. // the new dimension is appended to the list
  1783. // so, it will be matched and linked later too
  1784. }
  1785. }
  1786. else if(!dim->value_ptr && dim->metric_hash == m->hash && !strcmp(dim->metric, m->name)) {
  1787. // we have a match - this metric should be linked to this dimension
  1788. link_metric_to_app_dimension(app, m, chart, dim);
  1789. }
  1790. }
  1791. }
  1792. }
  1793. }
  1794. }
  1795. static inline RRDDIM *statsd_add_dim_to_app_chart(STATSD_APP *app, STATSD_APP_CHART *chart, STATSD_APP_CHART_DIM *dim) {
  1796. (void)app;
  1797. // allow the same statsd metric to be added multiple times to the same chart
  1798. STATSD_APP_CHART_DIM *tdim;
  1799. size_t count_same_metric = 0, count_same_metric_value_type = 0;
  1800. size_t pos_same_metric_value_type = 0;
  1801. for (tdim = chart->dimensions; tdim && tdim->next; tdim = tdim->next) {
  1802. if (dim->metric_hash == tdim->metric_hash && !strcmp(dim->metric, tdim->metric)) {
  1803. count_same_metric++;
  1804. if(dim->value_type == tdim->value_type) {
  1805. count_same_metric_value_type++;
  1806. if (tdim == dim)
  1807. pos_same_metric_value_type = count_same_metric_value_type;
  1808. }
  1809. }
  1810. }
  1811. if(count_same_metric > 1) {
  1812. // the same metric is found multiple times
  1813. size_t len = strlen(dim->metric) + 100;
  1814. char metric[ len + 1 ];
  1815. if(count_same_metric_value_type > 1) {
  1816. // the same metric, with the same value type, is added multiple times
  1817. snprintfz(metric, len, "%s_%s%zu", dim->metric, valuetype2string(dim->value_type), pos_same_metric_value_type);
  1818. }
  1819. else {
  1820. // the same metric, with different value type is added
  1821. snprintfz(metric, len, "%s_%s", dim->metric, valuetype2string(dim->value_type));
  1822. }
  1823. dim->rd = rrddim_add(chart->st, metric, dim->name, dim->multiplier, dim->divisor, dim->algorithm);
  1824. if(dim->flags != RRDDIM_FLAG_NONE) dim->rd->flags |= dim->flags;
  1825. if(dim->options != RRDDIM_OPTION_NONE) dim->rd->collector.options |= dim->options;
  1826. return dim->rd;
  1827. }
  1828. dim->rd = rrddim_add(chart->st, dim->metric, dim->name, dim->multiplier, dim->divisor, dim->algorithm);
  1829. if(dim->flags != RRDDIM_FLAG_NONE) dim->rd->flags |= dim->flags;
  1830. if(dim->options != RRDDIM_OPTION_NONE) dim->rd->collector.options |= dim->options;
  1831. return dim->rd;
  1832. }
  1833. static inline void statsd_update_app_chart(STATSD_APP *app, STATSD_APP_CHART *chart) {
  1834. netdata_log_debug(D_STATSD, "updating chart '%s' for app '%s'", chart->id, app->name);
  1835. if(!chart->st) {
  1836. chart->st = rrdset_create_custom(
  1837. localhost // host
  1838. , app->name // type
  1839. , chart->id // id
  1840. , chart->name // name
  1841. , chart->family // family
  1842. , chart->context // context
  1843. , chart->title // title
  1844. , chart->units // units
  1845. , PLUGIN_STATSD_NAME // plugin
  1846. , chart->module // module
  1847. , chart->priority // priority
  1848. , statsd.update_every // update every
  1849. , chart->chart_type // chart type
  1850. , app->rrd_memory_mode // memory mode
  1851. , app->rrd_history_entries // history
  1852. );
  1853. rrdset_flag_set(chart->st, RRDSET_FLAG_STORE_FIRST);
  1854. // rrdset_flag_set(chart->st, RRDSET_FLAG_DEBUG);
  1855. }
  1856. STATSD_APP_CHART_DIM *dim;
  1857. for(dim = chart->dimensions; dim ;dim = dim->next) {
  1858. if(likely(!dim->metric_pattern)) {
  1859. if (unlikely(!dim->rd))
  1860. statsd_add_dim_to_app_chart(app, chart, dim);
  1861. if (unlikely(dim->value_ptr)) {
  1862. netdata_log_debug(D_STATSD, "updating dimension '%s' (%s) of chart '%s' (%s) for app '%s' with value " COLLECTED_NUMBER_FORMAT, dim->name, rrddim_id(dim->rd), chart->id, rrdset_id(chart->st), app->name, *dim->value_ptr);
  1863. rrddim_set_by_pointer(chart->st, dim->rd, *dim->value_ptr);
  1864. }
  1865. }
  1866. }
  1867. rrdset_done(chart->st);
  1868. netdata_log_debug(D_STATSD, "completed update of chart '%s' for app '%s'", chart->id, app->name);
  1869. }
  1870. static inline void statsd_update_all_app_charts(void) {
  1871. // netdata_log_debug(D_STATSD, "updating app charts");
  1872. STATSD_APP *app;
  1873. for(app = statsd.apps; app ;app = app->next) {
  1874. // netdata_log_debug(D_STATSD, "updating charts for app '%s'", app->name);
  1875. STATSD_APP_CHART *chart;
  1876. for(chart = app->charts; chart ;chart = chart->next) {
  1877. if(unlikely(chart->dimensions_linked_count)) {
  1878. statsd_update_app_chart(app, chart);
  1879. }
  1880. }
  1881. }
  1882. // netdata_log_debug(D_STATSD, "completed update of app charts");
  1883. }
  1884. const char *statsd_metric_type_string(STATSD_METRIC_TYPE type) {
  1885. switch(type) {
  1886. case STATSD_METRIC_TYPE_COUNTER: return "counter";
  1887. case STATSD_METRIC_TYPE_GAUGE: return "gauge";
  1888. case STATSD_METRIC_TYPE_HISTOGRAM: return "histogram";
  1889. case STATSD_METRIC_TYPE_METER: return "meter";
  1890. case STATSD_METRIC_TYPE_SET: return "set";
  1891. case STATSD_METRIC_TYPE_DICTIONARY: return "dictionary";
  1892. case STATSD_METRIC_TYPE_TIMER: return "timer";
  1893. default: return "unknown";
  1894. }
  1895. }
  1896. static inline void statsd_flush_index_metrics(STATSD_INDEX *index, void (*flush_metric)(STATSD_METRIC *)) {
  1897. STATSD_METRIC *m;
  1898. // find the useful metrics (incremental = each time we are called, we check the new metrics only)
  1899. dfe_start_read(index->dict, m) {
  1900. // since we add new metrics at the beginning
  1901. // check for useful charts, until the point we last checked
  1902. if(unlikely(is_metric_checked(m))) break;
  1903. if(unlikely(!(m->options & STATSD_METRIC_OPTION_CHECKED_IN_APPS))) {
  1904. nd_log(NDLS_ACCESS, NDLP_DEBUG, "NEW STATSD METRIC '%s': '%s'", statsd_metric_type_string(m->type), m->name);
  1905. check_if_metric_is_for_app(index, m);
  1906. m->options |= STATSD_METRIC_OPTION_CHECKED_IN_APPS;
  1907. }
  1908. if(unlikely(!(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED))) {
  1909. if(unlikely(statsd.private_charts >= statsd.max_private_charts_hard)) {
  1910. netdata_log_debug(D_STATSD, "STATSD: metric '%s' will not be charted, because the hard limit of the maximum number "
  1911. "of charts has been reached.", m->name);
  1912. collector_info("STATSD: metric '%s' will not be charted, because the hard limit of the maximum number "
  1913. "of charts (%u) has been reached. Increase the number of charts by editing netdata.conf, "
  1914. "[statsd] section.", m->name, statsd.max_private_charts_hard);
  1915. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1916. }
  1917. else {
  1918. if (simple_pattern_matches(statsd.charts_for, m->name)) {
  1919. netdata_log_debug(D_STATSD, "STATSD: metric '%s' will be charted.", m->name);
  1920. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1921. } else {
  1922. netdata_log_debug(D_STATSD, "STATSD: metric '%s' will not be charted.", m->name);
  1923. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1924. }
  1925. }
  1926. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED;
  1927. }
  1928. // mark it as checked
  1929. m->options |= STATSD_METRIC_OPTION_CHECKED;
  1930. // check if it is used in charts
  1931. if((m->options & (STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED|STATSD_METRIC_OPTION_USED_IN_APPS)) && !(m->options & STATSD_METRIC_OPTION_USEFUL)) {
  1932. m->options |= STATSD_METRIC_OPTION_USEFUL;
  1933. index->useful++;
  1934. m->next_useful = index->first_useful;
  1935. index->first_useful = m;
  1936. }
  1937. }
  1938. dfe_done(m);
  1939. // flush all the useful metrics
  1940. STATSD_METRIC *m_prev;
  1941. for(m_prev = m = index->first_useful; m ; m = m->next_useful) {
  1942. flush_metric(m);
  1943. if (m->options & STATSD_METRIC_OPTION_OBSOLETE) {
  1944. if (m == index->first_useful)
  1945. index->first_useful = m->next_useful;
  1946. else
  1947. m_prev->next_useful = m->next_useful;
  1948. dictionary_del(index->dict, m->name);
  1949. index->useful--;
  1950. index->metrics--;
  1951. statsd.private_charts--;
  1952. } else
  1953. m_prev = m;
  1954. }
  1955. }
  1956. // --------------------------------------------------------------------------------------
  1957. // statsd main thread
  1958. static int statsd_listen_sockets_setup(void) {
  1959. return listen_sockets_setup(&statsd.sockets);
  1960. }
  1961. static void statsd_main_cleanup(void *data) {
  1962. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)data;
  1963. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  1964. collector_info("cleaning up...");
  1965. if (statsd.collection_threads_status) {
  1966. int i;
  1967. for (i = 0; i < statsd.threads; i++) {
  1968. spinlock_lock(&statsd.collection_threads_status[i].spinlock);
  1969. if(statsd.collection_threads_status[i].running) {
  1970. collector_info("STATSD: stopping data collection thread %d...", i + 1);
  1971. netdata_thread_cancel(statsd.collection_threads_status[i].thread);
  1972. }
  1973. else {
  1974. collector_info("STATSD: data collection thread %d found stopped.", i + 1);
  1975. }
  1976. spinlock_unlock(&statsd.collection_threads_status[i].spinlock);
  1977. }
  1978. }
  1979. collector_info("STATSD: closing sockets...");
  1980. listen_sockets_close(&statsd.sockets);
  1981. // destroy the dictionaries
  1982. dictionary_destroy(statsd.gauges.dict);
  1983. dictionary_destroy(statsd.meters.dict);
  1984. dictionary_destroy(statsd.counters.dict);
  1985. dictionary_destroy(statsd.histograms.dict);
  1986. dictionary_destroy(statsd.dictionaries.dict);
  1987. dictionary_destroy(statsd.sets.dict);
  1988. dictionary_destroy(statsd.timers.dict);
  1989. collector_info("STATSD: cleanup completed.");
  1990. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  1991. worker_unregister();
  1992. }
  1993. #define WORKER_STATSD_FLUSH_GAUGES 0
  1994. #define WORKER_STATSD_FLUSH_COUNTERS 1
  1995. #define WORKER_STATSD_FLUSH_METERS 2
  1996. #define WORKER_STATSD_FLUSH_TIMERS 3
  1997. #define WORKER_STATSD_FLUSH_HISTOGRAMS 4
  1998. #define WORKER_STATSD_FLUSH_SETS 5
  1999. #define WORKER_STATSD_FLUSH_DICTIONARIES 6
  2000. #define WORKER_STATSD_FLUSH_STATS 7
  2001. #if WORKER_UTILIZATION_MAX_JOB_TYPES < 8
  2002. #error WORKER_UTILIZATION_MAX_JOB_TYPES has to be at least 8
  2003. #endif
  2004. void *statsd_main(void *ptr) {
  2005. worker_register("STATSDFLUSH");
  2006. worker_register_job_name(WORKER_STATSD_FLUSH_GAUGES, "gauges");
  2007. worker_register_job_name(WORKER_STATSD_FLUSH_COUNTERS, "counters");
  2008. worker_register_job_name(WORKER_STATSD_FLUSH_METERS, "meters");
  2009. worker_register_job_name(WORKER_STATSD_FLUSH_TIMERS, "timers");
  2010. worker_register_job_name(WORKER_STATSD_FLUSH_HISTOGRAMS, "histograms");
  2011. worker_register_job_name(WORKER_STATSD_FLUSH_SETS, "sets");
  2012. worker_register_job_name(WORKER_STATSD_FLUSH_DICTIONARIES, "dictionaries");
  2013. worker_register_job_name(WORKER_STATSD_FLUSH_STATS, "statistics");
  2014. netdata_thread_cleanup_push(statsd_main_cleanup, ptr);
  2015. statsd.gauges.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2016. statsd.meters.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2017. statsd.counters.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2018. statsd.histograms.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2019. statsd.dictionaries.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2020. statsd.sets.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2021. statsd.timers.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  2022. dictionary_register_insert_callback(statsd.gauges.dict, dictionary_metric_insert_callback, &statsd.gauges);
  2023. dictionary_register_insert_callback(statsd.meters.dict, dictionary_metric_insert_callback, &statsd.meters);
  2024. dictionary_register_insert_callback(statsd.counters.dict, dictionary_metric_insert_callback, &statsd.counters);
  2025. dictionary_register_insert_callback(statsd.histograms.dict, dictionary_metric_insert_callback, &statsd.histograms);
  2026. dictionary_register_insert_callback(statsd.dictionaries.dict, dictionary_metric_insert_callback, &statsd.dictionaries);
  2027. dictionary_register_insert_callback(statsd.sets.dict, dictionary_metric_insert_callback, &statsd.sets);
  2028. dictionary_register_insert_callback(statsd.timers.dict, dictionary_metric_insert_callback, &statsd.timers);
  2029. dictionary_register_delete_callback(statsd.gauges.dict, dictionary_metric_delete_callback, &statsd.gauges);
  2030. dictionary_register_delete_callback(statsd.meters.dict, dictionary_metric_delete_callback, &statsd.meters);
  2031. dictionary_register_delete_callback(statsd.counters.dict, dictionary_metric_delete_callback, &statsd.counters);
  2032. dictionary_register_delete_callback(statsd.histograms.dict, dictionary_metric_delete_callback, &statsd.histograms);
  2033. dictionary_register_delete_callback(statsd.dictionaries.dict, dictionary_metric_delete_callback, &statsd.dictionaries);
  2034. dictionary_register_delete_callback(statsd.sets.dict, dictionary_metric_delete_callback, &statsd.sets);
  2035. dictionary_register_delete_callback(statsd.timers.dict, dictionary_metric_delete_callback, &statsd.timers);
  2036. // ----------------------------------------------------------------------------------------------------------------
  2037. // statsd configuration
  2038. statsd.enabled = config_get_boolean(CONFIG_SECTION_PLUGINS, "statsd", statsd.enabled);
  2039. statsd.update_every = default_rrd_update_every;
  2040. statsd.update_every = (int)config_get_number(CONFIG_SECTION_STATSD, "update every (flushInterval)", statsd.update_every);
  2041. if(statsd.update_every < default_rrd_update_every) {
  2042. collector_error("STATSD: minimum flush interval %d given, but the minimum is the update every of netdata. Using %d", statsd.update_every, default_rrd_update_every);
  2043. statsd.update_every = default_rrd_update_every;
  2044. }
  2045. #ifdef HAVE_RECVMMSG
  2046. statsd.recvmmsg_size = (size_t)config_get_number(CONFIG_SECTION_STATSD, "udp messages to process at once", (long long)statsd.recvmmsg_size);
  2047. #endif
  2048. statsd.charts_for = simple_pattern_create(
  2049. config_get(CONFIG_SECTION_STATSD, "create private charts for metrics matching", "*"), NULL,
  2050. SIMPLE_PATTERN_EXACT, true);
  2051. statsd.max_private_charts_hard = (size_t)config_get_number(CONFIG_SECTION_STATSD, "max private charts hard limit", (long long)statsd.max_private_charts_hard);
  2052. statsd.set_obsolete_after = (size_t)config_get_number(CONFIG_SECTION_STATSD, "set charts as obsolete after secs", (long long)statsd.set_obsolete_after);
  2053. statsd.decimal_detail = (collected_number)config_get_number(CONFIG_SECTION_STATSD, "decimal detail", (long long int)statsd.decimal_detail);
  2054. statsd.tcp_idle_timeout = (size_t) config_get_number(CONFIG_SECTION_STATSD, "disconnect idle tcp clients after seconds", (long long int)statsd.tcp_idle_timeout);
  2055. statsd.private_charts_hidden = (unsigned int)config_get_boolean(CONFIG_SECTION_STATSD, "private charts hidden", statsd.private_charts_hidden);
  2056. statsd.histogram_percentile = (double)config_get_float(CONFIG_SECTION_STATSD, "histograms and timers percentile (percentThreshold)", statsd.histogram_percentile);
  2057. if(isless(statsd.histogram_percentile, 0) || isgreater(statsd.histogram_percentile, 100)) {
  2058. collector_error("STATSD: invalid histograms and timers percentile %0.5f given", statsd.histogram_percentile);
  2059. statsd.histogram_percentile = 95.0;
  2060. }
  2061. {
  2062. char buffer[314 + 1];
  2063. snprintfz(buffer, sizeof(buffer) - 1, "%0.1f%%", statsd.histogram_percentile);
  2064. statsd.histogram_percentile_str = strdupz(buffer);
  2065. }
  2066. statsd.dictionary_max_unique = config_get_number(CONFIG_SECTION_STATSD, "dictionaries max unique dimensions", statsd.dictionary_max_unique);
  2067. if(config_get_boolean(CONFIG_SECTION_STATSD, "add dimension for number of events received", 0)) {
  2068. statsd.gauges.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2069. statsd.counters.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2070. statsd.meters.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2071. statsd.sets.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2072. statsd.histograms.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2073. statsd.timers.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2074. statsd.dictionaries.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2075. }
  2076. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on gauges (deleteGauges)", 0))
  2077. statsd.gauges.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2078. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on counters (deleteCounters)", 0))
  2079. statsd.counters.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2080. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on meters (deleteMeters)", 0))
  2081. statsd.meters.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2082. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on sets (deleteSets)", 0))
  2083. statsd.sets.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2084. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on histograms (deleteHistograms)", 0))
  2085. statsd.histograms.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2086. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on timers (deleteTimers)", 0))
  2087. statsd.timers.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2088. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on dictionaries (deleteDictionaries)", 0))
  2089. statsd.dictionaries.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2090. size_t max_sockets = (size_t)config_get_number(CONFIG_SECTION_STATSD, "statsd server max TCP sockets", (long long int)(rlimit_nofile.rlim_cur / 4));
  2091. #ifdef STATSD_MULTITHREADED
  2092. statsd.threads = (int)config_get_number(CONFIG_SECTION_STATSD, "threads", processors);
  2093. if(statsd.threads < 1) {
  2094. collector_error("STATSD: Invalid number of threads %d, using %d", statsd.threads, processors);
  2095. statsd.threads = processors;
  2096. config_set_number(CONFIG_SECTION_STATSD, "collector threads", statsd.threads);
  2097. }
  2098. #else
  2099. statsd.threads = 1;
  2100. #endif
  2101. // read custom application definitions
  2102. statsd_readdir(netdata_configured_user_config_dir, netdata_configured_stock_config_dir, "statsd.d");
  2103. // ----------------------------------------------------------------------------------------------------------------
  2104. // statsd setup
  2105. if(!statsd.enabled) goto cleanup;
  2106. statsd_listen_sockets_setup();
  2107. if(!statsd.sockets.opened) {
  2108. collector_error("STATSD: No statsd sockets to listen to. statsd will be disabled.");
  2109. goto cleanup;
  2110. }
  2111. statsd.collection_threads_status = callocz((size_t)statsd.threads, sizeof(struct collection_thread_status));
  2112. int i;
  2113. for(i = 0; i < statsd.threads ;i++) {
  2114. statsd.collection_threads_status[i].max_sockets = max_sockets / statsd.threads;
  2115. char tag[NETDATA_THREAD_TAG_MAX + 1];
  2116. snprintfz(tag, NETDATA_THREAD_TAG_MAX, "STATSD_IN[%d]", i + 1);
  2117. spinlock_init(&statsd.collection_threads_status[i].spinlock);
  2118. netdata_thread_create(&statsd.collection_threads_status[i].thread, tag, NETDATA_THREAD_OPTION_DEFAULT, statsd_collector_thread, &statsd.collection_threads_status[i]);
  2119. }
  2120. // ----------------------------------------------------------------------------------------------------------------
  2121. // statsd monitoring charts
  2122. RRDSET *st_metrics = NULL;
  2123. RRDDIM *rd_metrics_gauge = NULL;
  2124. RRDDIM *rd_metrics_counter = NULL;
  2125. RRDDIM *rd_metrics_timer = NULL;
  2126. RRDDIM *rd_metrics_meter = NULL;
  2127. RRDDIM *rd_metrics_histogram = NULL;
  2128. RRDDIM *rd_metrics_set = NULL;
  2129. RRDDIM *rd_metrics_dictionary = NULL;
  2130. RRDSET *st_useful_metrics = NULL;
  2131. RRDDIM *rd_useful_metrics_gauge = NULL;
  2132. RRDDIM *rd_useful_metrics_counter = NULL;
  2133. RRDDIM *rd_useful_metrics_timer = NULL;
  2134. RRDDIM *rd_useful_metrics_meter = NULL;
  2135. RRDDIM *rd_useful_metrics_histogram = NULL;
  2136. RRDDIM *rd_useful_metrics_set = NULL;
  2137. RRDDIM *rd_useful_metrics_dictionary = NULL;
  2138. RRDSET *st_events = NULL;
  2139. RRDDIM *rd_events_gauge = NULL;
  2140. RRDDIM *rd_events_counter = NULL;
  2141. RRDDIM *rd_events_timer = NULL;
  2142. RRDDIM *rd_events_meter = NULL;
  2143. RRDDIM *rd_events_histogram = NULL;
  2144. RRDDIM *rd_events_set = NULL;
  2145. RRDDIM *rd_events_dictionary = NULL;
  2146. RRDDIM *rd_events_unknown = NULL;
  2147. RRDDIM *rd_events_errors = NULL;
  2148. RRDSET *st_reads = NULL;
  2149. RRDDIM *rd_reads_tcp = NULL;
  2150. RRDDIM *rd_reads_udp = NULL;
  2151. RRDSET *st_bytes = NULL;
  2152. RRDDIM *rd_bytes_tcp = NULL;
  2153. RRDDIM *rd_bytes_udp = NULL;
  2154. RRDSET *st_packets = NULL;
  2155. RRDDIM *rd_packets_tcp = NULL;
  2156. RRDDIM *rd_packets_udp = NULL;
  2157. RRDSET *st_tcp_connects = NULL;
  2158. RRDDIM *rd_tcp_connects = NULL;
  2159. RRDDIM *rd_tcp_disconnects = NULL;
  2160. RRDSET *st_tcp_connected = NULL;
  2161. RRDDIM *rd_tcp_connected = NULL;
  2162. RRDSET *st_pcharts = NULL;
  2163. RRDDIM *rd_pcharts = NULL;
  2164. if(global_statistics_enabled) {
  2165. st_metrics = rrdset_create_localhost(
  2166. "netdata",
  2167. "statsd_metrics",
  2168. NULL,
  2169. "statsd",
  2170. NULL,
  2171. "Metrics in the netdata statsd database",
  2172. "metrics",
  2173. PLUGIN_STATSD_NAME,
  2174. "stats",
  2175. 132010,
  2176. statsd.update_every,
  2177. RRDSET_TYPE_STACKED);
  2178. rd_metrics_gauge = rrddim_add(st_metrics, "gauges", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2179. rd_metrics_counter = rrddim_add(st_metrics, "counters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2180. rd_metrics_timer = rrddim_add(st_metrics, "timers", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2181. rd_metrics_meter = rrddim_add(st_metrics, "meters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2182. rd_metrics_histogram = rrddim_add(st_metrics, "histograms", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2183. rd_metrics_set = rrddim_add(st_metrics, "sets", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2184. rd_metrics_dictionary = rrddim_add(st_metrics, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2185. st_useful_metrics = rrdset_create_localhost(
  2186. "netdata",
  2187. "statsd_useful_metrics",
  2188. NULL,
  2189. "statsd",
  2190. NULL,
  2191. "Useful metrics in the netdata statsd database",
  2192. "metrics",
  2193. PLUGIN_STATSD_NAME,
  2194. "stats",
  2195. 132010,
  2196. statsd.update_every,
  2197. RRDSET_TYPE_STACKED);
  2198. rd_useful_metrics_gauge = rrddim_add(st_useful_metrics, "gauges", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2199. rd_useful_metrics_counter = rrddim_add(st_useful_metrics, "counters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2200. rd_useful_metrics_timer = rrddim_add(st_useful_metrics, "timers", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2201. rd_useful_metrics_meter = rrddim_add(st_useful_metrics, "meters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2202. rd_useful_metrics_histogram = rrddim_add(st_useful_metrics, "histograms", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2203. rd_useful_metrics_set = rrddim_add(st_useful_metrics, "sets", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2204. rd_useful_metrics_dictionary = rrddim_add(st_useful_metrics, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2205. st_events = rrdset_create_localhost(
  2206. "netdata",
  2207. "statsd_events",
  2208. NULL,
  2209. "statsd",
  2210. NULL,
  2211. "Events processed by the netdata statsd server",
  2212. "events/s",
  2213. PLUGIN_STATSD_NAME,
  2214. "stats",
  2215. 132011,
  2216. statsd.update_every,
  2217. RRDSET_TYPE_STACKED);
  2218. rd_events_gauge = rrddim_add(st_events, "gauges", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2219. rd_events_counter = rrddim_add(st_events, "counters", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2220. rd_events_timer = rrddim_add(st_events, "timers", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2221. rd_events_meter = rrddim_add(st_events, "meters", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2222. rd_events_histogram = rrddim_add(st_events, "histograms", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2223. rd_events_set = rrddim_add(st_events, "sets", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2224. rd_events_dictionary = rrddim_add(st_events, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2225. rd_events_unknown = rrddim_add(st_events, "unknown", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2226. rd_events_errors = rrddim_add(st_events, "errors", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2227. st_reads = rrdset_create_localhost(
  2228. "netdata",
  2229. "statsd_reads",
  2230. NULL,
  2231. "statsd",
  2232. NULL,
  2233. "Read operations made by the netdata statsd server",
  2234. "reads/s",
  2235. PLUGIN_STATSD_NAME,
  2236. "stats",
  2237. 132012,
  2238. statsd.update_every,
  2239. RRDSET_TYPE_STACKED);
  2240. rd_reads_tcp = rrddim_add(st_reads, "tcp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2241. rd_reads_udp = rrddim_add(st_reads, "udp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2242. st_bytes = rrdset_create_localhost(
  2243. "netdata",
  2244. "statsd_bytes",
  2245. NULL,
  2246. "statsd",
  2247. NULL,
  2248. "Bytes read by the netdata statsd server",
  2249. "kilobits/s",
  2250. PLUGIN_STATSD_NAME,
  2251. "stats",
  2252. 132013,
  2253. statsd.update_every,
  2254. RRDSET_TYPE_STACKED);
  2255. rd_bytes_tcp = rrddim_add(st_bytes, "tcp", NULL, 8, BITS_IN_A_KILOBIT, RRD_ALGORITHM_INCREMENTAL);
  2256. rd_bytes_udp = rrddim_add(st_bytes, "udp", NULL, 8, BITS_IN_A_KILOBIT, RRD_ALGORITHM_INCREMENTAL);
  2257. st_packets = rrdset_create_localhost(
  2258. "netdata",
  2259. "statsd_packets",
  2260. NULL,
  2261. "statsd",
  2262. NULL,
  2263. "Network packets processed by the netdata statsd server",
  2264. "packets/s",
  2265. PLUGIN_STATSD_NAME,
  2266. "stats",
  2267. 132014,
  2268. statsd.update_every,
  2269. RRDSET_TYPE_STACKED);
  2270. rd_packets_tcp = rrddim_add(st_packets, "tcp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2271. rd_packets_udp = rrddim_add(st_packets, "udp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2272. st_tcp_connects = rrdset_create_localhost(
  2273. "netdata",
  2274. "tcp_connects",
  2275. NULL,
  2276. "statsd",
  2277. NULL,
  2278. "statsd server TCP connects and disconnects",
  2279. "events",
  2280. PLUGIN_STATSD_NAME,
  2281. "stats",
  2282. 132015,
  2283. statsd.update_every,
  2284. RRDSET_TYPE_LINE);
  2285. rd_tcp_connects = rrddim_add(st_tcp_connects, "connects", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2286. rd_tcp_disconnects = rrddim_add(st_tcp_connects, "disconnects", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  2287. st_tcp_connected = rrdset_create_localhost(
  2288. "netdata",
  2289. "tcp_connected",
  2290. NULL,
  2291. "statsd",
  2292. NULL,
  2293. "statsd server TCP connected sockets",
  2294. "sockets",
  2295. PLUGIN_STATSD_NAME,
  2296. "stats",
  2297. 132016,
  2298. statsd.update_every,
  2299. RRDSET_TYPE_LINE);
  2300. rd_tcp_connected = rrddim_add(st_tcp_connected, "connected", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2301. st_pcharts = rrdset_create_localhost(
  2302. "netdata",
  2303. "private_charts",
  2304. NULL,
  2305. "statsd",
  2306. NULL,
  2307. "Private metric charts created by the netdata statsd server",
  2308. "charts",
  2309. PLUGIN_STATSD_NAME,
  2310. "stats",
  2311. 132020,
  2312. statsd.update_every,
  2313. RRDSET_TYPE_AREA);
  2314. rd_pcharts = rrddim_add(st_pcharts, "charts", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2315. }
  2316. // ----------------------------------------------------------------------------------------------------------------
  2317. // statsd thread to turn metrics into charts
  2318. usec_t step = statsd.update_every * USEC_PER_SEC;
  2319. heartbeat_t hb;
  2320. heartbeat_init(&hb);
  2321. while(service_running(SERVICE_COLLECTORS)) {
  2322. worker_is_idle();
  2323. heartbeat_next(&hb, step);
  2324. worker_is_busy(WORKER_STATSD_FLUSH_GAUGES);
  2325. statsd_flush_index_metrics(&statsd.gauges, statsd_flush_gauge);
  2326. worker_is_busy(WORKER_STATSD_FLUSH_COUNTERS);
  2327. statsd_flush_index_metrics(&statsd.counters, statsd_flush_counter);
  2328. worker_is_busy(WORKER_STATSD_FLUSH_METERS);
  2329. statsd_flush_index_metrics(&statsd.meters, statsd_flush_meter);
  2330. worker_is_busy(WORKER_STATSD_FLUSH_TIMERS);
  2331. statsd_flush_index_metrics(&statsd.timers, statsd_flush_timer);
  2332. worker_is_busy(WORKER_STATSD_FLUSH_HISTOGRAMS);
  2333. statsd_flush_index_metrics(&statsd.histograms, statsd_flush_histogram);
  2334. worker_is_busy(WORKER_STATSD_FLUSH_SETS);
  2335. statsd_flush_index_metrics(&statsd.sets, statsd_flush_set);
  2336. worker_is_busy(WORKER_STATSD_FLUSH_DICTIONARIES);
  2337. statsd_flush_index_metrics(&statsd.dictionaries,statsd_flush_dictionary);
  2338. worker_is_busy(WORKER_STATSD_FLUSH_STATS);
  2339. statsd_update_all_app_charts();
  2340. if(unlikely(!service_running(SERVICE_COLLECTORS)))
  2341. break;
  2342. if(global_statistics_enabled) {
  2343. rrddim_set_by_pointer(st_metrics, rd_metrics_gauge, (collected_number)statsd.gauges.metrics);
  2344. rrddim_set_by_pointer(st_metrics, rd_metrics_counter, (collected_number)statsd.counters.metrics);
  2345. rrddim_set_by_pointer(st_metrics, rd_metrics_timer, (collected_number)statsd.timers.metrics);
  2346. rrddim_set_by_pointer(st_metrics, rd_metrics_meter, (collected_number)statsd.meters.metrics);
  2347. rrddim_set_by_pointer(st_metrics, rd_metrics_histogram, (collected_number)statsd.histograms.metrics);
  2348. rrddim_set_by_pointer(st_metrics, rd_metrics_set, (collected_number)statsd.sets.metrics);
  2349. rrddim_set_by_pointer(st_metrics, rd_metrics_dictionary, (collected_number)statsd.dictionaries.metrics);
  2350. rrdset_done(st_metrics);
  2351. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_gauge, (collected_number)statsd.gauges.useful);
  2352. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_counter, (collected_number)statsd.counters.useful);
  2353. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_timer, (collected_number)statsd.timers.useful);
  2354. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_meter, (collected_number)statsd.meters.useful);
  2355. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_histogram, (collected_number)statsd.histograms.useful);
  2356. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_set, (collected_number)statsd.sets.useful);
  2357. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_dictionary, (collected_number)statsd.dictionaries.useful);
  2358. rrdset_done(st_useful_metrics);
  2359. rrddim_set_by_pointer(st_events, rd_events_gauge, (collected_number)statsd.gauges.events);
  2360. rrddim_set_by_pointer(st_events, rd_events_counter, (collected_number)statsd.counters.events);
  2361. rrddim_set_by_pointer(st_events, rd_events_timer, (collected_number)statsd.timers.events);
  2362. rrddim_set_by_pointer(st_events, rd_events_meter, (collected_number)statsd.meters.events);
  2363. rrddim_set_by_pointer(st_events, rd_events_histogram, (collected_number)statsd.histograms.events);
  2364. rrddim_set_by_pointer(st_events, rd_events_set, (collected_number)statsd.sets.events);
  2365. rrddim_set_by_pointer(st_events, rd_events_dictionary, (collected_number)statsd.dictionaries.events);
  2366. rrddim_set_by_pointer(st_events, rd_events_unknown, (collected_number)statsd.unknown_types);
  2367. rrddim_set_by_pointer(st_events, rd_events_errors, (collected_number)statsd.socket_errors);
  2368. rrdset_done(st_events);
  2369. rrddim_set_by_pointer(st_reads, rd_reads_tcp, (collected_number)statsd.tcp_socket_reads);
  2370. rrddim_set_by_pointer(st_reads, rd_reads_udp, (collected_number)statsd.udp_socket_reads);
  2371. rrdset_done(st_reads);
  2372. rrddim_set_by_pointer(st_bytes, rd_bytes_tcp, (collected_number)statsd.tcp_bytes_read);
  2373. rrddim_set_by_pointer(st_bytes, rd_bytes_udp, (collected_number)statsd.udp_bytes_read);
  2374. rrdset_done(st_bytes);
  2375. rrddim_set_by_pointer(st_packets, rd_packets_tcp, (collected_number)statsd.tcp_packets_received);
  2376. rrddim_set_by_pointer(st_packets, rd_packets_udp, (collected_number)statsd.udp_packets_received);
  2377. rrdset_done(st_packets);
  2378. rrddim_set_by_pointer(st_tcp_connects, rd_tcp_connects, (collected_number)statsd.tcp_socket_connects);
  2379. rrddim_set_by_pointer(st_tcp_connects, rd_tcp_disconnects, (collected_number)statsd.tcp_socket_disconnects);
  2380. rrdset_done(st_tcp_connects);
  2381. rrddim_set_by_pointer(st_tcp_connected, rd_tcp_connected, (collected_number)statsd.tcp_socket_connected);
  2382. rrdset_done(st_tcp_connected);
  2383. rrddim_set_by_pointer(st_pcharts, rd_pcharts, (collected_number)statsd.private_charts);
  2384. rrdset_done(st_pcharts);
  2385. }
  2386. }
  2387. cleanup: ; // added semi-colon to prevent older gcc error: label at end of compound statement
  2388. netdata_thread_cleanup_pop(1);
  2389. return NULL;
  2390. }