// statsd.c
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "daemon/common.h"
// names used by this plugin
#define STATSD_CHART_PREFIX "statsd"
#define PLUGIN_STATSD_NAME "statsd.plugin"

// listener defaults - they initialize statsd.sockets.default_port and statsd.sockets.backlog
#define STATSD_LISTEN_PORT 8125
#define STATSD_LISTEN_BACKLOG 4096

// worker job type ids used by this plugin (4 of them, 0 to 3)
#define WORKER_JOB_TYPE_TCP_CONNECTED 0
#define WORKER_JOB_TYPE_TCP_DISCONNECTED 1
#define WORKER_JOB_TYPE_RCV_DATA 2
#define WORKER_JOB_TYPE_SND_DATA 3

// compile-time guard: the 4 job types above must fit in the worker utilization limit
#if WORKER_UTILIZATION_MAX_JOB_TYPES < 4
#error Please increase WORKER_UTILIZATION_MAX_JOB_TYPES to at least 4
#endif

// --------------------------------------------------------------------------------------
// DO NOT ENABLE MULTITHREADING - IT IS NOT WELL TESTED
// #define STATSD_MULTITHREADED 1

// options of the dictionaries created for the values of 'set' and 'dictionary' metrics
#define STATSD_DICTIONARY_OPTIONS (DICT_OPTION_DONT_OVERWRITE_VALUE | DICT_OPTION_ADD_IN_FRONT)

// initial value of statsd.decimal_detail
#define STATSD_DECIMAL_DETAIL 1000 // floating point values get multiplied by this, with the same divisor
  19. // --------------------------------------------------------------------------------------------------------------------
  20. // data specific to each metric type
// data of a gauge metric
typedef struct statsd_metric_gauge {
    NETDATA_DOUBLE value; // the current value: replaced by absolute samples, adjusted by samples starting with '+' or '-'
} STATSD_METRIC_GAUGE;
// data of a counter or meter metric (both share the same processing)
typedef struct statsd_metric_counter { // counter and meter
    collected_number value; // running sum of the received increments, each divided by its sampling rate
} STATSD_METRIC_COUNTER;
// Extra data for histogram and timer metrics.
// It is allocated separately (one per metric) when the metric is inserted in its index.
typedef struct statsd_histogram_extensions {
    netdata_mutex_t mutex; // held by the collector while it resizes 'values'

    // average is stored in metric->last
    // NOTE(review): the last_* values and rd_* dimensions are not used in this part of the
    // file - presumably they are maintained by the charting code; confirm there.
    collected_number last_min;
    collected_number last_max;
    collected_number last_percentile;
    collected_number last_median;
    collected_number last_stddev;
    collected_number last_sum;

    int zeroed;

    RRDDIM *rd_min;
    RRDDIM *rd_max;
    RRDDIM *rd_percentile;
    RRDDIM *rd_median;
    RRDDIM *rd_stddev;
    //RRDDIM *rd_sum;

    uint32_t size; // allocated slots in 'values' (grows by statsd.histogram_increase_step)
    uint32_t used; // slots of 'values' in use (set to 0 when the metric is reset)
    NETDATA_DOUBLE *values; // dynamic array of values collected
} STATSD_METRIC_HISTOGRAM_EXTENSIONS;
// data of a histogram or timer metric - everything lives in the separately allocated extension
typedef struct statsd_metric_histogram { // histogram and timer
    STATSD_METRIC_HISTOGRAM_EXTENSIONS *ext; // allocated by dictionary_metric_insert_callback()
} STATSD_METRIC_HISTOGRAM;
// data of a set metric
typedef struct statsd_metric_set {
    DICTIONARY *dict; // the values seen, as keys; created on first use, destroyed when the metric is reset
} STATSD_METRIC_SET;
// the value stored for each key of a dictionary metric
typedef struct statsd_metric_dictionary_item {
    uint32_t count; // how many times this key has been received
    RRDDIM *rd; // NOTE(review): presumably the chart dimension of this key - not used in this part of the file
} STATSD_METRIC_DICTIONARY_ITEM;
// data of a dictionary metric
typedef struct statsd_metric_dictionary {
    DICTIONARY *dict; // key -> STATSD_METRIC_DICTIONARY_ITEM; created on first use
} STATSD_METRIC_DICTIONARY;
  60. // --------------------------------------------------------------------------------------------------------------------
  61. // this is a metric - for all types of metrics
// Bit flags kept in STATSD_METRIC.options (and as defaults in STATSD_INDEX / STATSD_APP).
// Each flag is a distinct bit, so they can be combined with bitwise OR.
typedef enum __attribute__((packed)) statsd_metric_options {
    STATSD_METRIC_OPTION_NONE = 0x00000000, // no options set
    STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED = 0x00000001, // do not update the chart dimension, when this metric is not collected
    STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED = 0x00000002, // render a private chart for this metric
    STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED = 0x00000004, // the metric has been checked if it should get private chart or not
    STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT = 0x00000008, // show the count of events for this private chart
    STATSD_METRIC_OPTION_CHECKED_IN_APPS = 0x00000010, // set when this metric has been checked against apps
    STATSD_METRIC_OPTION_USED_IN_APPS = 0x00000020, // set when this metric is used in apps
    STATSD_METRIC_OPTION_CHECKED = 0x00000040, // set when the charting thread checks this metric for use in charts (its usefulness)
    STATSD_METRIC_OPTION_USEFUL = 0x00000080, // set when the charting thread finds the metric useful (i.e. used in a chart)
    STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED = 0x00000100, // set when the collection is full for this metric
    STATSD_METRIC_OPTION_UPDATED_CHART_METADATA = 0x00000200, // set when the private chart metadata have been updated via tags
} STATS_METRIC_OPTIONS;
// The metric types supported. Each type has its own STATSD_INDEX in the global 'statsd'
// structure, and the type selects which member of the STATSD_METRIC union is in use.
typedef enum __attribute__((packed)) statsd_metric_type {
    STATSD_METRIC_TYPE_GAUGE,
    STATSD_METRIC_TYPE_COUNTER,
    STATSD_METRIC_TYPE_METER,
    STATSD_METRIC_TYPE_TIMER,     // shares the histogram data and processing
    STATSD_METRIC_TYPE_HISTOGRAM,
    STATSD_METRIC_TYPE_SET,
    STATSD_METRIC_TYPE_DICTIONARY
} STATSD_METRIC_TYPE;
// A single statsd metric, of any type. Metrics are the values of the per-type index
// dictionaries; they are initialized by dictionary_metric_insert_callback() and cleaned up
// by dictionary_metric_delete_callback().
typedef struct statsd_metric {
    const char *name; // the name of the metric - linked to dictionary name
    uint32_t hash; // hash of the name
    STATSD_METRIC_TYPE type;

    // metadata about data collection
    collected_number events; // the number of times this metric has been collected (never resets)
    uint32_t count; // the number of times this metric has been collected since the last flush

    // the actual collected data
    // (which member is valid depends on 'type')
    union {
        STATSD_METRIC_GAUGE gauge;
        STATSD_METRIC_COUNTER counter;
        STATSD_METRIC_HISTOGRAM histogram;
        STATSD_METRIC_SET set;
        STATSD_METRIC_DICTIONARY dictionary;
    };

    // heap allocated strings - released with freez() when the metric is deleted
    char *units;
    char *dimname;
    char *family;

    // chart related members
    STATS_METRIC_OPTIONS options; // STATSD_METRIC_OPTION_* (bitfield)
    char reset; // set to 1 by the charting thread to instruct the collector thread(s) to reset this metric
    collected_number last; // the last value sent to netdata
    RRDSET *st; // the private chart of this metric
    RRDDIM *rd_value; // the dimension of this metric value
    RRDDIM *rd_count; // the dimension for the number of events received

    // linking, used for walking through all metrics
    struct statsd_metric *next_useful;
} STATSD_METRIC;
  112. // --------------------------------------------------------------------------------------------------------------------
  113. // each type of metric has its own index
// An index holds all the metrics of one type, keyed by metric name.
typedef struct statsd_index {
    char *name; // the name of the index of metrics
    uint32_t events; // the number of events processed for this index
    uint32_t metrics; // the number of metrics in this index
    uint32_t useful; // the number of useful metrics in this index
    STATS_METRIC_OPTIONS default_options; // default options for all metrics in this index
    STATSD_METRIC_TYPE type; // the type of index
    DICTIONARY *dict; // metric name -> STATSD_METRIC
    STATSD_METRIC *first_useful; // the linked list of useful metrics (new metrics are added in front)
} STATSD_INDEX;
  124. // --------------------------------------------------------------------------------------------------------------------
  125. // synthetic charts
// Which value of the source metric a synthetic chart dimension uses
// (see STATSD_APP_CHART_DIM.value_type).
typedef enum __attribute__((packed)) statsd_app_chart_dimension_value_type {
    STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS,
    STATSD_APP_CHART_DIM_VALUE_TYPE_LAST,
    STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE,
    STATSD_APP_CHART_DIM_VALUE_TYPE_SUM,
    STATSD_APP_CHART_DIM_VALUE_TYPE_MIN,
    STATSD_APP_CHART_DIM_VALUE_TYPE_MAX,
    STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE,
    STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN,
    STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV
} STATSD_APP_CHART_DIM_VALUE_TYPE;
// A dimension of a synthetic chart. The dimensions of a chart form a singly linked list
// through 'next'.
typedef struct statsd_app_chart_dimension {
    const char *name; // the name of this dimension
    const char *metric; // the source metric name of this dimension
    uint32_t metric_hash; // hash for fast string comparisons
    int32_t multiplier; // the multiplier of the dimension
    int32_t divisor; // the divisor of the dimension
    RRDDIM_FLAGS flags; // the RRDDIM flags for this dimension
    RRDDIM_OPTIONS options; // the RRDDIM options for this dimension
    RRD_ALGORITHM algorithm; // the algorithm of this dimension
    STATSD_APP_CHART_DIM_VALUE_TYPE value_type; // which value to use of the source metric
    SIMPLE_PATTERN *metric_pattern; // set when the 'metric' is a simple pattern
    RRDDIM *rd; // a pointer to the RRDDIM that has been created for this dimension
    collected_number *value_ptr; // a pointer to the source metric value
    struct statsd_app_chart_dimension *next; // the next dimension for this chart
} STATSD_APP_CHART_DIM;
// A synthetic chart of a statsd app. The charts of an app form a singly linked list
// through 'next'.
typedef struct statsd_app_chart {
    // chart identification and presentation
    const char *id;
    const char *name;
    const char *title;
    const char *family;
    const char *context;
    const char *units;
    const char *module;
    int32_t priority;
    RRDSET_TYPE chart_type;

    STATSD_APP_CHART_DIM *dimensions; // head of the linked list of dimensions
    uint32_t dimensions_count;
    uint32_t dimensions_linked_count;

    RRDSET *st; // the chart created for this definition
    struct statsd_app_chart *next; // the next chart of the same app
} STATSD_APP_CHART;
// A statsd app: a named group of synthetic charts. Apps form a singly linked list through
// 'next', starting at statsd.apps.
typedef struct statsd_app {
    const char *name;
    SIMPLE_PATTERN *metrics; // NOTE(review): presumably the pattern selecting the metrics of this app - confirm in the config parser
    STATS_METRIC_OPTIONS default_options;
    RRD_MEMORY_MODE rrd_memory_mode;
    int32_t rrd_history_entries;
    DICTIONARY *dict;
    const char *source;
    STATSD_APP_CHART *charts; // head of the linked list of charts
    struct statsd_app *next; // the next app
} STATSD_APP;
  179. // --------------------------------------------------------------------------------------------------------------------
  180. // global statsd data
// Per collection thread state; statsd.collection_threads_status points to these.
struct collection_thread_status {
    SPINLOCK spinlock;
    bool running;
    uint32_t max_sockets;
    netdata_thread_t thread;
};
// The global state of the statsd plugin: one metric index per metric type, statistics
// counters, configuration values and the listening sockets. The initializer below provides
// the defaults; members not listed there start zeroed.
static struct statsd {
    // one index per metric type
    STATSD_INDEX gauges;
    STATSD_INDEX counters;
    STATSD_INDEX timers;
    STATSD_INDEX histograms;
    STATSD_INDEX meters;
    STATSD_INDEX sets;
    STATSD_INDEX dictionaries;

    // statistics
    size_t unknown_types;
    size_t socket_errors;
    size_t tcp_socket_connects;
    size_t tcp_socket_disconnects;
    size_t tcp_socket_connected;
    size_t tcp_socket_reads;
    size_t tcp_packets_received;
    size_t tcp_bytes_read;
    size_t udp_socket_reads;
    size_t udp_packets_received;
    size_t udp_bytes_read;

    // configuration
    int32_t update_every;
    bool enabled;
    bool private_charts_hidden;
    SIMPLE_PATTERN *charts_for;
    uint32_t tcp_idle_timeout;
    collected_number decimal_detail;
    uint32_t private_charts;
    uint32_t max_private_charts_hard;
    STATSD_APP *apps; // head of the linked list of apps
    uint32_t recvmmsg_size;
    uint32_t histogram_increase_step; // slots added to a histogram's values array each time it gets full
    uint32_t dictionary_max_unique; // max keys per dictionary metric; once reached, new keys are counted as "other"
    double histogram_percentile;
    char *histogram_percentile_str;

    // collection threads and sockets
    int threads;
    struct collection_thread_status *collection_threads_status;
    LISTEN_SOCKETS sockets;
} statsd = {
    .enabled = 1,
    .max_private_charts_hard = 1000,
    .private_charts_hidden = false,
    .recvmmsg_size = 10,
    .decimal_detail = STATSD_DECIMAL_DETAIL,

    // the indexes: their dictionaries are not created here (dict is NULL)
    .gauges = {
        .name = "gauge",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_GAUGE,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .counters = {
        .name = "counter",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_COUNTER,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .timers = {
        .name = "timer",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_TIMER,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .histograms = {
        .name = "histogram",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_HISTOGRAM,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .meters = {
        .name = "meter",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_METER,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .sets = {
        .name = "set",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_SET,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .dictionaries = {
        .name = "dictionary",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_DICTIONARY,
        .default_options = STATSD_METRIC_OPTION_NONE
    },

    .tcp_idle_timeout = 600,
    .apps = NULL,
    .histogram_percentile = 95.0,
    .histogram_increase_step = 10,
    .dictionary_max_unique = 200,
    .threads = 0,
    .collection_threads_status = NULL,

    // by default listen on localhost only, for both UDP and TCP
    .sockets = {
        .config = &netdata_config,
        .config_section = CONFIG_SECTION_STATSD,
        .default_bind_to = "udp:localhost tcp:localhost",
        .default_port = STATSD_LISTEN_PORT,
        .backlog = STATSD_LISTEN_BACKLOG
    },
};
  300. // --------------------------------------------------------------------------------------------------------------------
  301. // statsd index management - add/find metrics
  302. static void dictionary_metric_insert_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  303. STATSD_INDEX *index = (STATSD_INDEX *)data;
  304. STATSD_METRIC *m = (STATSD_METRIC *)value;
  305. const char *name = dictionary_acquired_item_name(item);
  306. netdata_log_debug(D_STATSD, "Creating new %s metric '%s'", index->name, name);
  307. m->name = name;
  308. m->hash = simple_hash(name);
  309. m->type = index->type;
  310. m->options = index->default_options;
  311. if (m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  312. m->histogram.ext = callocz(1,sizeof(STATSD_METRIC_HISTOGRAM_EXTENSIONS));
  313. netdata_mutex_init(&m->histogram.ext->mutex);
  314. }
  315. __atomic_fetch_add(&index->metrics, 1, __ATOMIC_RELAXED);
  316. }
  317. static void dictionary_metric_delete_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  318. (void)data; // STATSD_INDEX *index = (STATSD_INDEX *)data;
  319. (void)item;
  320. STATSD_METRIC *m = (STATSD_METRIC *)value;
  321. if(m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  322. freez(m->histogram.ext);
  323. m->histogram.ext = NULL;
  324. }
  325. freez(m->units);
  326. freez(m->family);
  327. freez(m->dimname);
  328. }
  329. static inline STATSD_METRIC *statsd_find_or_add_metric(STATSD_INDEX *index, const char *name) {
  330. netdata_log_debug(D_STATSD, "searching for metric '%s' under '%s'", name, index->name);
  331. #ifdef STATSD_MULTITHREADED
  332. // avoid the write lock of dictionary_set() for existing metrics
  333. STATSD_METRIC *m = dictionary_get(index->dict, name);
  334. if(!m) m = dictionary_set(index->dict, name, NULL, sizeof(STATSD_METRIC));
  335. #else
  336. // no locks here, go faster
  337. // this will call the dictionary_metric_insert_callback() if an item
  338. // is inserted, otherwise it will return the existing one.
  339. // We used the flag DICT_OPTION_DONT_OVERWRITE_VALUE to support this.
  340. STATSD_METRIC *m = dictionary_set(index->dict, name, NULL, sizeof(STATSD_METRIC));
  341. #endif
  342. index->events++;
  343. return m;
  344. }
  345. // --------------------------------------------------------------------------------------------------------------------
  346. // statsd parsing numbers
  347. static inline NETDATA_DOUBLE statsd_parse_float(const char *v, NETDATA_DOUBLE def) {
  348. NETDATA_DOUBLE value;
  349. if(likely(v && *v)) {
  350. char *e = NULL;
  351. value = str2ndd(v, &e);
  352. if(unlikely(e && *e))
  353. collector_error("STATSD: excess data '%s' after value '%s'", e, v);
  354. }
  355. else
  356. value = def;
  357. return value;
  358. }
  359. static inline NETDATA_DOUBLE statsd_parse_sampling_rate(const char *v) {
  360. NETDATA_DOUBLE sampling_rate = statsd_parse_float(v, 1.0);
  361. if(unlikely(isless(sampling_rate, 0.001))) sampling_rate = 0.001;
  362. if(unlikely(isgreater(sampling_rate, 1.0))) sampling_rate = 1.0;
  363. return sampling_rate;
  364. }
  365. static inline long long statsd_parse_int(const char *v, long long def) {
  366. long long value;
  367. if(likely(v && *v)) {
  368. char *e = NULL;
  369. value = str2ll(v, &e);
  370. if(unlikely(e && *e))
  371. collector_error("STATSD: excess data '%s' after value '%s'", e, v);
  372. }
  373. else
  374. value = def;
  375. return value;
  376. }
  377. // --------------------------------------------------------------------------------------------------------------------
  378. // statsd processors per metric type
  379. static inline void statsd_reset_metric(STATSD_METRIC *m) {
  380. m->reset = 0;
  381. m->count = 0;
  382. }
  383. static inline int value_is_zinit(const char *value) {
  384. return (value && *value == 'z' && *++value == 'i' && *++value == 'n' && *++value == 'i' && *++value == 't' && *++value == '\0');
  385. }
// non-zero when the metric has been checked for its usefulness (STATSD_METRIC_OPTION_CHECKED is set)
#define is_metric_checked(m) ((m)->options & STATSD_METRIC_OPTION_CHECKED)

// A metric is collected until it is checked; after that, only when it has been found useful.
// Note: 'm' is evaluated more than once.
#define is_metric_useful_for_collection(m) (!is_metric_checked(m) || ((m)->options & STATSD_METRIC_OPTION_USEFUL))
  388. static inline void statsd_process_gauge(STATSD_METRIC *m, const char *value, const char *sampling) {
  389. if(!is_metric_useful_for_collection(m)) return;
  390. if(unlikely(!value || !*value)) {
  391. collector_error("STATSD: metric '%s' of type gauge, with empty value is ignored.", m->name);
  392. return;
  393. }
  394. if(unlikely(m->reset)) {
  395. // no need to reset anything specific for gauges
  396. statsd_reset_metric(m);
  397. }
  398. if(unlikely(value_is_zinit(value))) {
  399. // magic loading of metric, without affecting anything
  400. }
  401. else {
  402. if (unlikely(*value == '+' || *value == '-'))
  403. m->gauge.value += statsd_parse_float(value, 1.0) / statsd_parse_sampling_rate(sampling);
  404. else
  405. m->gauge.value = statsd_parse_float(value, 1.0);
  406. m->events++;
  407. m->count++;
  408. }
  409. }
  410. static inline void statsd_process_counter_or_meter(STATSD_METRIC *m, const char *value, const char *sampling) {
  411. if(!is_metric_useful_for_collection(m)) return;
  412. // we accept empty values for counters
  413. if(unlikely(m->reset)) statsd_reset_metric(m);
  414. if(unlikely(value_is_zinit(value))) {
  415. // magic loading of metric, without affecting anything
  416. }
  417. else {
  418. m->counter.value += llrintndd((NETDATA_DOUBLE) statsd_parse_int(value, 1) / statsd_parse_sampling_rate(sampling));
  419. m->events++;
  420. m->count++;
  421. }
  422. }
// counters and meters are processed in exactly the same way
#define statsd_process_counter(m, value, sampling) statsd_process_counter_or_meter(m, value, sampling)
#define statsd_process_meter(m, value, sampling) statsd_process_counter_or_meter(m, value, sampling)
  425. static inline void statsd_process_histogram_or_timer(STATSD_METRIC *m, const char *value, const char *sampling, const char *type) {
  426. if(!is_metric_useful_for_collection(m)) return;
  427. if(unlikely(!value || !*value)) {
  428. collector_error("STATSD: metric of type %s, with empty value is ignored.", type);
  429. return;
  430. }
  431. if(unlikely(m->reset)) {
  432. m->histogram.ext->used = 0;
  433. statsd_reset_metric(m);
  434. }
  435. if(unlikely(value_is_zinit(value))) {
  436. // magic loading of metric, without affecting anything
  437. }
  438. else {
  439. NETDATA_DOUBLE v = statsd_parse_float(value, 1.0);
  440. NETDATA_DOUBLE sampling_rate = statsd_parse_sampling_rate(sampling);
  441. if(unlikely(isless(sampling_rate, 0.01))) sampling_rate = 0.01;
  442. if(unlikely(isgreater(sampling_rate, 1.0))) sampling_rate = 1.0;
  443. long long samples = llrintndd(1.0 / sampling_rate);
  444. while(samples-- > 0) {
  445. if(unlikely(m->histogram.ext->used == m->histogram.ext->size)) {
  446. netdata_mutex_lock(&m->histogram.ext->mutex);
  447. m->histogram.ext->size += statsd.histogram_increase_step;
  448. m->histogram.ext->values = reallocz(m->histogram.ext->values, sizeof(NETDATA_DOUBLE) * m->histogram.ext->size);
  449. netdata_mutex_unlock(&m->histogram.ext->mutex);
  450. }
  451. m->histogram.ext->values[m->histogram.ext->used++] = v;
  452. }
  453. m->events++;
  454. m->count++;
  455. }
  456. }
// timers and histograms share the same processing; only the type name used in logs differs
#define statsd_process_timer(m, value, sampling) statsd_process_histogram_or_timer(m, value, sampling, "timer")
#define statsd_process_histogram(m, value, sampling) statsd_process_histogram_or_timer(m, value, sampling, "histogram")
  459. static inline void statsd_process_set(STATSD_METRIC *m, const char *value) {
  460. if(!is_metric_useful_for_collection(m)) return;
  461. if(unlikely(!value || !*value)) {
  462. netdata_log_error("STATSD: metric of type set, with empty value is ignored.");
  463. return;
  464. }
  465. if(unlikely(m->reset)) {
  466. if(likely(m->set.dict)) {
  467. dictionary_destroy(m->set.dict);
  468. m->set.dict = NULL;
  469. }
  470. statsd_reset_metric(m);
  471. }
  472. if (unlikely(!m->set.dict))
  473. m->set.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  474. if(unlikely(value_is_zinit(value))) {
  475. // magic loading of metric, without affecting anything
  476. }
  477. else {
  478. #ifdef STATSD_MULTITHREADED
  479. // avoid the write lock to check if something is already there
  480. if(!dictionary_get(m->set.dict, value))
  481. dictionary_set(m->set.dict, value, NULL, 0);
  482. #else
  483. dictionary_set(m->set.dict, value, NULL, 0);
  484. #endif
  485. m->events++;
  486. m->count++;
  487. }
  488. }
  489. static inline void statsd_process_dictionary(STATSD_METRIC *m, const char *value) {
  490. if(!is_metric_useful_for_collection(m)) return;
  491. if(unlikely(!value || !*value)) {
  492. netdata_log_error("STATSD: metric of type set, with empty value is ignored.");
  493. return;
  494. }
  495. if(unlikely(m->reset))
  496. statsd_reset_metric(m);
  497. if (unlikely(!m->dictionary.dict))
  498. m->dictionary.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  499. if(unlikely(value_is_zinit(value))) {
  500. // magic loading of metric, without affecting anything
  501. }
  502. else {
  503. STATSD_METRIC_DICTIONARY_ITEM *t = (STATSD_METRIC_DICTIONARY_ITEM *)dictionary_get(m->dictionary.dict, value);
  504. if (unlikely(!t)) {
  505. if(!t && dictionary_entries(m->dictionary.dict) >= statsd.dictionary_max_unique)
  506. value = "other";
  507. t = (STATSD_METRIC_DICTIONARY_ITEM *)dictionary_set(m->dictionary.dict, value, NULL, sizeof(STATSD_METRIC_DICTIONARY_ITEM));
  508. }
  509. t->count++;
  510. m->events++;
  511. m->count++;
  512. }
  513. }
  514. // --------------------------------------------------------------------------------------------------------------------
  515. // statsd parsing
  516. static inline const char *statsd_parse_skip_up_to(const char *s, char d1, char d2, char d3) {
  517. char c;
  518. for(c = *s; c && c != d1 && c != d2 && c != d3 && c != '\r' && c != '\n'; c = *++s) ;
  519. return s;
  520. }
  521. const char *statsd_parse_skip_spaces(const char *s) {
  522. char c;
  523. for(c = *s; c && ( c == ' ' || c == '\t' || c == '\r' || c == '\n' ); c = *++s) ;
  524. return s;
  525. }
  526. static inline const char *statsd_parse_field_trim(const char *start, char *end) {
  527. if(unlikely(!start || !*start)) {
  528. start = end;
  529. return start;
  530. }
  531. while(start <= end && (*start == ' ' || *start == '\t'))
  532. start++;
  533. *end = '\0';
  534. end--;
  535. while(end >= start && (*end == ' ' || *end == '\t'))
  536. *end-- = '\0';
  537. return start;
  538. }
  539. static void statsd_process_metric(const char *name, const char *value, const char *type, const char *sampling, const char *tags) {
  540. netdata_log_debug(D_STATSD, "STATSD: raw metric '%s', value '%s', type '%s', sampling '%s', tags '%s'", name?name:"(null)", value?value:"(null)", type?type:"(null)", sampling?sampling:"(null)", tags?tags:"(null)");
  541. if(unlikely(!name || !*name)) return;
  542. if(unlikely(!type || !*type)) type = "m";
  543. STATSD_METRIC *m = NULL;
  544. char t0 = type[0], t1 = type[1];
  545. if(unlikely(t0 == 'g' && t1 == '\0')) {
  546. statsd_process_gauge(
  547. m = statsd_find_or_add_metric(&statsd.gauges, name),
  548. value, sampling);
  549. }
  550. else if(unlikely((t0 == 'c' || t0 == 'C') && t1 == '\0')) {
  551. // etsy/statsd uses 'c'
  552. // brubeck uses 'C'
  553. statsd_process_counter(
  554. m = statsd_find_or_add_metric(&statsd.counters, name),
  555. value, sampling);
  556. }
  557. else if(unlikely(t0 == 'm' && t1 == '\0')) {
  558. statsd_process_meter(
  559. m = statsd_find_or_add_metric(&statsd.meters, name),
  560. value, sampling);
  561. }
  562. else if(unlikely(t0 == 'h' && t1 == '\0')) {
  563. statsd_process_histogram(
  564. m = statsd_find_or_add_metric(&statsd.histograms, name),
  565. value, sampling);
  566. }
  567. else if(unlikely(t0 == 's' && t1 == '\0')) {
  568. statsd_process_set(
  569. m = statsd_find_or_add_metric(&statsd.sets, name),
  570. value);
  571. }
  572. else if(unlikely(t0 == 'd' && t1 == '\0')) {
  573. statsd_process_dictionary(
  574. m = statsd_find_or_add_metric(&statsd.dictionaries, name),
  575. value);
  576. }
  577. else if(unlikely(t0 == 'm' && t1 == 's' && type[2] == '\0')) {
  578. statsd_process_timer(
  579. m = statsd_find_or_add_metric(&statsd.timers, name),
  580. value, sampling);
  581. }
  582. else {
  583. statsd.unknown_types++;
  584. netdata_log_error("STATSD: metric '%s' with value '%s' is sent with unknown metric type '%s'", name, value?value:"", type);
  585. }
  586. if(m && tags && *tags) {
  587. const char *s = tags;
  588. while(*s) {
  589. const char *tagkey = NULL, *tagvalue = NULL;
  590. char *tagkey_end = NULL, *tagvalue_end = NULL;
  591. s = tagkey_end = (char *)statsd_parse_skip_up_to(tagkey = s, ':', '=', ',');
  592. if(tagkey == tagkey_end) {
  593. if (*s) {
  594. s++;
  595. s = statsd_parse_skip_spaces(s);
  596. }
  597. continue;
  598. }
  599. if(likely(*s == ':' || *s == '='))
  600. s = tagvalue_end = (char *) statsd_parse_skip_up_to(tagvalue = ++s, ',', '\0', '\0');
  601. if(*s == ',') s++;
  602. statsd_parse_field_trim(tagkey, tagkey_end);
  603. statsd_parse_field_trim(tagvalue, tagvalue_end);
  604. if(tagkey && *tagkey && tagvalue && *tagvalue) {
  605. if (strcmp(tagkey, "units") == 0 && (!m->units || strcmp(m->units, tagvalue) != 0)) {
  606. m->units = strdupz(tagvalue);
  607. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  608. }
  609. if (strcmp(tagkey, "name") == 0 && (!m->dimname || strcmp(m->dimname, tagvalue) != 0)) {
  610. m->dimname = strdupz(tagvalue);
  611. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  612. }
  613. if (strcmp(tagkey, "family") == 0 && (!m->family || strcmp(m->family, tagvalue) != 0)) {
  614. m->family = strdupz(tagvalue);
  615. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  616. }
  617. }
  618. }
  619. }
  620. }
  621. static inline size_t statsd_process(char *buffer, size_t size, int require_newlines) {
  622. buffer[size] = '\0';
  623. netdata_log_debug(D_STATSD, "RECEIVED: %zu bytes: '%s'", size, buffer);
  624. const char *s = buffer;
  625. while(*s) {
  626. const char *name = NULL, *value = NULL, *type = NULL, *sampling = NULL, *tags = NULL;
  627. char *name_end = NULL, *value_end = NULL, *type_end = NULL, *sampling_end = NULL, *tags_end = NULL;
  628. s = name_end = (char *)statsd_parse_skip_up_to(name = s, ':', '=', '|');
  629. if(name == name_end) {
  630. if (*s) {
  631. s++;
  632. s = statsd_parse_skip_spaces(s);
  633. }
  634. continue;
  635. }
  636. if(likely(*s == ':' || *s == '='))
  637. s = value_end = (char *) statsd_parse_skip_up_to(value = ++s, '|', '@', '#');
  638. if(likely(*s == '|'))
  639. s = type_end = (char *) statsd_parse_skip_up_to(type = ++s, '|', '@', '#');
  640. while(*s == '|' || *s == '@' || *s == '#') {
  641. // parse all the fields that may be appended
  642. if ((*s == '|' && s[1] == '@') || *s == '@') {
  643. s = sampling_end = (char *)statsd_parse_skip_up_to(sampling = ++s, '|', '@', '#');
  644. if (*sampling == '@') sampling++;
  645. }
  646. else if ((*s == '|' && s[1] == '#') || *s == '#') {
  647. s = tags_end = (char *)statsd_parse_skip_up_to(tags = ++s, '|', '@', '#');
  648. if (*tags == '#') tags++;
  649. }
  650. else {
  651. // unknown field, skip it
  652. s = (char *)statsd_parse_skip_up_to(++s, '|', '@', '#');
  653. }
  654. }
  655. // skip everything until the end of the line
  656. while(*s && *s != '\n') s++;
  657. if(unlikely(require_newlines && *s != '\n' && s > buffer)) {
  658. // move the remaining data to the beginning
  659. size -= (name - buffer);
  660. memmove(buffer, name, size);
  661. return size;
  662. }
  663. else
  664. s = statsd_parse_skip_spaces(s);
  665. statsd_process_metric(
  666. statsd_parse_field_trim(name, name_end)
  667. , statsd_parse_field_trim(value, value_end)
  668. , statsd_parse_field_trim(type, type_end)
  669. , statsd_parse_field_trim(sampling, sampling_end)
  670. , statsd_parse_field_trim(tags, tags_end)
  671. );
  672. }
  673. return 0;
  674. }
  675. // --------------------------------------------------------------------------------------------------------------------
  676. // statsd pollfd interface
// Bytes of receive buffer allocated together with each struct statsd_tcp.
#define STATSD_TCP_BUFFER_SIZE 65536 // minimize tcp reads
// Bytes of each buffer used to receive a UDP datagram.
#define STATSD_UDP_BUFFER_SIZE 9000 // this should be up to MTU
// Tag stored in the per-socket state structures, so that the socket callbacks
// can verify which kind of structure they were handed.
typedef enum {
    STATSD_SOCKET_DATA_TYPE_TCP,
    STATSD_SOCKET_DATA_TYPE_UDP
} STATSD_SOCKET_DATA_TYPE;
// State kept for each connected TCP client; allocated in statsd_add_callback()
// and released in statsd_del_callback().
struct statsd_tcp {
    STATSD_SOCKET_DATA_TYPE type;   // set to STATSD_SOCKET_DATA_TYPE_TCP on allocation
    size_t size;                    // maximum bytes of data kept in buffer[] (STATSD_TCP_BUFFER_SIZE - 1)
    size_t len;                     // bytes currently in buffer[], received but not yet consumed
    char buffer[];                  // receive buffer, STATSD_TCP_BUFFER_SIZE bytes are allocated for it
};
// State allocated once per collector thread in statsd_collector_thread() and
// handed to poll_events() as its data pointer; used when receiving datagrams.
struct statsd_udp {
    struct collection_thread_status *status;    // status of the collector thread that owns this structure
    STATSD_SOCKET_DATA_TYPE type;               // compared against STATSD_SOCKET_DATA_TYPE_UDP by the receive callback
#ifdef HAVE_RECVMMSG
    size_t size;                                // number of entries in iovecs[] and msgs[]
    struct iovec *iovecs;                       // one receive buffer descriptor per message slot
    struct mmsghdr *msgs;                       // message headers passed to recvmmsg()
#else
    int *running;                               // NOTE(review): not referenced by the code visible here - confirm it is still needed
    char buffer[STATSD_UDP_BUFFER_SIZE];        // single datagram buffer passed to recv()
#endif
};
  701. // new TCP client connected
  702. static void *statsd_add_callback(POLLINFO *pi, short int *events, void *data) {
  703. (void)pi;
  704. (void)data;
  705. worker_is_busy(WORKER_JOB_TYPE_TCP_CONNECTED);
  706. *events = POLLIN;
  707. struct statsd_tcp *t = (struct statsd_tcp *)callocz(sizeof(struct statsd_tcp) + STATSD_TCP_BUFFER_SIZE, 1);
  708. t->type = STATSD_SOCKET_DATA_TYPE_TCP;
  709. t->size = STATSD_TCP_BUFFER_SIZE - 1;
  710. statsd.tcp_socket_connects++;
  711. statsd.tcp_socket_connected++;
  712. worker_is_idle();
  713. return t;
  714. }
  715. // TCP client disconnected
  716. static void statsd_del_callback(POLLINFO *pi) {
  717. worker_is_busy(WORKER_JOB_TYPE_TCP_DISCONNECTED);
  718. struct statsd_tcp *t = pi->data;
  719. if(likely(t)) {
  720. if(t->type == STATSD_SOCKET_DATA_TYPE_TCP) {
  721. if(t->len != 0) {
  722. statsd.socket_errors++;
  723. netdata_log_error("STATSD: client is probably sending unterminated metrics. Closed socket left with '%s'. Trying to process it.", t->buffer);
  724. statsd_process(t->buffer, t->len, 0);
  725. }
  726. statsd.tcp_socket_disconnects++;
  727. statsd.tcp_socket_connected--;
  728. }
  729. else
  730. netdata_log_error("STATSD: internal error: received socket data type is %d, but expected %d", (int)t->type, (int)STATSD_SOCKET_DATA_TYPE_TCP);
  731. freez(t);
  732. }
  733. worker_is_idle();
  734. }
  735. // Receive data
  736. static int statsd_rcv_callback(POLLINFO *pi, short int *events) {
  737. int retval = -1;
  738. worker_is_busy(WORKER_JOB_TYPE_RCV_DATA);
  739. *events = POLLIN;
  740. int fd = pi->fd;
  741. switch(pi->socktype) {
  742. case SOCK_STREAM: {
  743. struct statsd_tcp *d = (struct statsd_tcp *)pi->data;
  744. if(unlikely(!d)) {
  745. netdata_log_error("STATSD: internal error: expected TCP data pointer is NULL");
  746. statsd.socket_errors++;
  747. retval = -1;
  748. goto cleanup;
  749. }
  750. #ifdef NETDATA_INTERNAL_CHECKS
  751. if(unlikely(d->type != STATSD_SOCKET_DATA_TYPE_TCP)) {
  752. netdata_log_error("STATSD: internal error: socket data type should be %d, but it is %d", (int)STATSD_SOCKET_DATA_TYPE_TCP, (int)d->type);
  753. statsd.socket_errors++;
  754. retval = -1;
  755. goto cleanup;
  756. }
  757. #endif
  758. int ret = 0;
  759. ssize_t rc;
  760. do {
  761. rc = recv(fd, &d->buffer[d->len], d->size - d->len, MSG_DONTWAIT);
  762. if (rc < 0) {
  763. // read failed
  764. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  765. netdata_log_error("STATSD: recv() on TCP socket %d failed.", fd);
  766. statsd.socket_errors++;
  767. ret = -1;
  768. }
  769. }
  770. else if (!rc) {
  771. // connection closed
  772. netdata_log_debug(D_STATSD, "STATSD: client disconnected.");
  773. ret = -1;
  774. }
  775. else {
  776. // data received
  777. d->len += rc;
  778. statsd.tcp_socket_reads++;
  779. statsd.tcp_bytes_read += rc;
  780. }
  781. if(likely(d->len > 0)) {
  782. statsd.tcp_packets_received++;
  783. d->len = statsd_process(d->buffer, d->len, 1);
  784. }
  785. if(unlikely(ret == -1)) {
  786. retval = -1;
  787. goto cleanup;
  788. }
  789. } while (rc != -1);
  790. break;
  791. }
  792. case SOCK_DGRAM: {
  793. struct statsd_udp *d = (struct statsd_udp *)pi->data;
  794. if(unlikely(!d)) {
  795. netdata_log_error("STATSD: internal error: expected UDP data pointer is NULL");
  796. statsd.socket_errors++;
  797. retval = -1;
  798. goto cleanup;
  799. }
  800. #ifdef NETDATA_INTERNAL_CHECKS
  801. if(unlikely(d->type != STATSD_SOCKET_DATA_TYPE_UDP)) {
  802. netdata_log_error("STATSD: internal error: socket data should be %d, but it is %d", (int)d->type, (int)STATSD_SOCKET_DATA_TYPE_UDP);
  803. statsd.socket_errors++;
  804. retval = -1;
  805. goto cleanup;
  806. }
  807. #endif
  808. #ifdef HAVE_RECVMMSG
  809. ssize_t rc;
  810. do {
  811. rc = recvmmsg(fd, d->msgs, (unsigned int)d->size, MSG_DONTWAIT, NULL);
  812. if (rc < 0) {
  813. // read failed
  814. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  815. netdata_log_error("STATSD: recvmmsg() on UDP socket %d failed.", fd);
  816. statsd.socket_errors++;
  817. retval = -1;
  818. goto cleanup;
  819. }
  820. } else if (rc) {
  821. // data received
  822. statsd.udp_socket_reads++;
  823. statsd.udp_packets_received += rc;
  824. size_t i;
  825. for (i = 0; i < (size_t)rc; ++i) {
  826. size_t len = (size_t)d->msgs[i].msg_len;
  827. statsd.udp_bytes_read += len;
  828. statsd_process(d->msgs[i].msg_hdr.msg_iov->iov_base, len, 0);
  829. }
  830. }
  831. } while (rc != -1);
  832. #else // !HAVE_RECVMMSG
  833. ssize_t rc;
  834. do {
  835. rc = recv(fd, d->buffer, STATSD_UDP_BUFFER_SIZE - 1, MSG_DONTWAIT);
  836. if (rc < 0) {
  837. // read failed
  838. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  839. netdata_log_error("STATSD: recv() on UDP socket %d failed.", fd);
  840. statsd.socket_errors++;
  841. retval = -1;
  842. goto cleanup;
  843. }
  844. } else if (rc) {
  845. // data received
  846. statsd.udp_socket_reads++;
  847. statsd.udp_packets_received++;
  848. statsd.udp_bytes_read += rc;
  849. statsd_process(d->buffer, (size_t) rc, 0);
  850. }
  851. } while (rc != -1);
  852. #endif
  853. break;
  854. }
  855. default: {
  856. netdata_log_error("STATSD: internal error: unknown socktype %d on socket %d", pi->socktype, fd);
  857. statsd.socket_errors++;
  858. retval = -1;
  859. goto cleanup;
  860. }
  861. }
  862. retval = 0;
  863. cleanup:
  864. worker_is_idle();
  865. return retval;
  866. }
  867. static int statsd_snd_callback(POLLINFO *pi, short int *events) {
  868. (void)pi;
  869. (void)events;
  870. worker_is_busy(WORKER_JOB_TYPE_SND_DATA);
  871. netdata_log_error("STATSD: snd_callback() called, but we never requested to send data to statsd clients.");
  872. worker_is_idle();
  873. return -1;
  874. }
  875. // --------------------------------------------------------------------------------------------------------------------
  876. // statsd child thread to collect metrics from network
  877. void statsd_collector_thread_cleanup(void *data) {
  878. struct statsd_udp *d = data;
  879. spinlock_lock(&d->status->spinlock);
  880. d->status->running = false;
  881. spinlock_unlock(&d->status->spinlock);
  882. collector_info("cleaning up...");
  883. #ifdef HAVE_RECVMMSG
  884. size_t i;
  885. for (i = 0; i < d->size; i++)
  886. freez(d->iovecs[i].iov_base);
  887. freez(d->iovecs);
  888. freez(d->msgs);
  889. #endif
  890. freez(d);
  891. worker_unregister();
  892. }
  893. static bool statsd_should_stop(void) {
  894. return !service_running(SERVICE_COLLECTORS);
  895. }
  896. void *statsd_collector_thread(void *ptr) {
  897. struct collection_thread_status *status = ptr;
  898. spinlock_lock(&status->spinlock);
  899. status->running = true;
  900. spinlock_unlock(&status->spinlock);
  901. worker_register("STATSD");
  902. worker_register_job_name(WORKER_JOB_TYPE_TCP_CONNECTED, "tcp connect");
  903. worker_register_job_name(WORKER_JOB_TYPE_TCP_DISCONNECTED, "tcp disconnect");
  904. worker_register_job_name(WORKER_JOB_TYPE_RCV_DATA, "receive");
  905. worker_register_job_name(WORKER_JOB_TYPE_SND_DATA, "send");
  906. collector_info("STATSD collector thread started with taskid %d", gettid());
  907. struct statsd_udp *d = callocz(sizeof(struct statsd_udp), 1);
  908. d->status = status;
  909. netdata_thread_cleanup_push(statsd_collector_thread_cleanup, d);
  910. #ifdef HAVE_RECVMMSG
  911. d->type = STATSD_SOCKET_DATA_TYPE_UDP;
  912. d->size = statsd.recvmmsg_size;
  913. d->iovecs = callocz(sizeof(struct iovec), d->size);
  914. d->msgs = callocz(sizeof(struct mmsghdr), d->size);
  915. size_t i;
  916. for (i = 0; i < d->size; i++) {
  917. d->iovecs[i].iov_base = mallocz(STATSD_UDP_BUFFER_SIZE);
  918. d->iovecs[i].iov_len = STATSD_UDP_BUFFER_SIZE - 1;
  919. d->msgs[i].msg_hdr.msg_iov = &d->iovecs[i];
  920. d->msgs[i].msg_hdr.msg_iovlen = 1;
  921. }
  922. #endif
  923. poll_events(&statsd.sockets
  924. , statsd_add_callback
  925. , statsd_del_callback
  926. , statsd_rcv_callback
  927. , statsd_snd_callback
  928. , NULL
  929. , statsd_should_stop
  930. , NULL // No access control pattern
  931. , 0 // No dns lookups for access control pattern
  932. , (void *)d
  933. , 0 // tcp request timeout, 0 = disabled
  934. , statsd.tcp_idle_timeout // tcp idle timeout, 0 = disabled
  935. , statsd.update_every * 1000
  936. , ptr // timer_data
  937. , status->max_sockets
  938. );
  939. netdata_thread_cleanup_pop(1);
  940. return NULL;
  941. }
  942. // --------------------------------------------------------------------------------------------------------------------
  943. // statsd applications configuration files parsing
// Limit passed to fgets() when reading a line of a statsd configuration file;
// the line buffer is allocated with one extra byte.
#define STATSD_CONF_LINE_MAX 8192
  945. static STATSD_APP_CHART_DIM_VALUE_TYPE string2valuetype(const char *type, size_t line, const char *filename) {
  946. if(!type || !*type) type = "last";
  947. if(!strcmp(type, "events")) return STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS;
  948. else if(!strcmp(type, "last")) return STATSD_APP_CHART_DIM_VALUE_TYPE_LAST;
  949. else if(!strcmp(type, "min")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MIN;
  950. else if(!strcmp(type, "max")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MAX;
  951. else if(!strcmp(type, "sum")) return STATSD_APP_CHART_DIM_VALUE_TYPE_SUM;
  952. else if(!strcmp(type, "average")) return STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE;
  953. else if(!strcmp(type, "median")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN;
  954. else if(!strcmp(type, "stddev")) return STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV;
  955. else if(!strcmp(type, "percentile")) return STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE;
  956. netdata_log_error("STATSD: invalid type '%s' at line %zu of file '%s'. Using 'last'.", type, line, filename);
  957. return STATSD_APP_CHART_DIM_VALUE_TYPE_LAST;
  958. }
  959. static const char *valuetype2string(STATSD_APP_CHART_DIM_VALUE_TYPE type) {
  960. switch(type) {
  961. case STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS: return "events";
  962. case STATSD_APP_CHART_DIM_VALUE_TYPE_LAST: return "last";
  963. case STATSD_APP_CHART_DIM_VALUE_TYPE_MIN: return "min";
  964. case STATSD_APP_CHART_DIM_VALUE_TYPE_MAX: return "max";
  965. case STATSD_APP_CHART_DIM_VALUE_TYPE_SUM: return "sum";
  966. case STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE: return "average";
  967. case STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN: return "median";
  968. case STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV: return "stddev";
  969. case STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE: return "percentile";
  970. }
  971. return "unknown";
  972. }
  973. static STATSD_APP_CHART_DIM *add_dimension_to_app_chart(
  974. STATSD_APP *app __maybe_unused
  975. , STATSD_APP_CHART *chart
  976. , const char *metric_name
  977. , const char *dim_name
  978. , collected_number multiplier
  979. , collected_number divisor
  980. , RRDDIM_FLAGS flags
  981. , RRDDIM_OPTIONS options
  982. , STATSD_APP_CHART_DIM_VALUE_TYPE value_type
  983. ) {
  984. STATSD_APP_CHART_DIM *dim = callocz(sizeof(STATSD_APP_CHART_DIM), 1);
  985. dim->metric = strdupz(metric_name);
  986. dim->metric_hash = simple_hash(dim->metric);
  987. dim->name = strdupz((dim_name)?dim_name:"");
  988. dim->multiplier = multiplier;
  989. dim->divisor = divisor;
  990. dim->value_type = value_type;
  991. dim->flags = flags;
  992. dim->options = options;
  993. if(!dim->multiplier)
  994. dim->multiplier = 1;
  995. if(!dim->divisor)
  996. dim->divisor = 1;
  997. // append it to the list of dimension
  998. STATSD_APP_CHART_DIM *tdim;
  999. for(tdim = chart->dimensions; tdim && tdim->next ; tdim = tdim->next) ;
  1000. if(!tdim) {
  1001. dim->next = chart->dimensions;
  1002. chart->dimensions = dim;
  1003. }
  1004. else {
  1005. dim->next = tdim->next;
  1006. tdim->next = dim;
  1007. }
  1008. chart->dimensions_count++;
  1009. netdata_log_debug(D_STATSD, "Added dimension '%s' to chart '%s' of app '%s', for metric '%s', with type %u, multiplier %d, divisor %d",
  1010. dim->name, chart->id, app->name, dim->metric, dim->value_type, dim->multiplier, dim->divisor);
  1011. return dim;
  1012. }
  1013. static int statsd_readfile(const char *filename, STATSD_APP *app, STATSD_APP_CHART *chart, DICTIONARY *dict) {
  1014. netdata_log_debug(D_STATSD, "STATSD configuration reading file '%s'", filename);
  1015. char *buffer = mallocz(STATSD_CONF_LINE_MAX + 1);
  1016. FILE *fp = fopen(filename, "r");
  1017. if(!fp) {
  1018. netdata_log_error("STATSD: cannot open file '%s'.", filename);
  1019. freez(buffer);
  1020. return -1;
  1021. }
  1022. size_t line = 0;
  1023. char *s;
  1024. while(fgets(buffer, STATSD_CONF_LINE_MAX, fp) != NULL) {
  1025. buffer[STATSD_CONF_LINE_MAX] = '\0';
  1026. line++;
  1027. s = trim(buffer);
  1028. if (!s || *s == '#') {
  1029. netdata_log_debug(D_STATSD, "STATSD: ignoring line %zu of file '%s', it is empty.", line, filename);
  1030. continue;
  1031. }
  1032. netdata_log_debug(D_STATSD, "STATSD: processing line %zu of file '%s': %s", line, filename, buffer);
  1033. if(*s == 'i' && strncmp(s, "include", 7) == 0) {
  1034. s = trim(&s[7]);
  1035. if(s && *s) {
  1036. char *tmp;
  1037. if(*s == '/')
  1038. tmp = strdupz(s);
  1039. else {
  1040. // the file to be included is relative to current file
  1041. // find the directory name from the file we already read
  1042. char *filename2 = strdupz(filename); // copy filename, since dirname() will change it
  1043. char *dir = dirname(filename2); // find the directory part of the filename
  1044. tmp = strdupz_path_subpath(dir, s); // compose the new filename to read;
  1045. freez(filename2); // free the filename we copied
  1046. }
  1047. statsd_readfile(tmp, app, chart, dict);
  1048. freez(tmp);
  1049. }
  1050. else
  1051. netdata_log_error("STATSD: ignoring line %zu of file '%s', include filename is empty", line, filename);
  1052. continue;
  1053. }
  1054. int len = (int) strlen(s);
  1055. if (*s == '[' && s[len - 1] == ']') {
  1056. // new section
  1057. s[len - 1] = '\0';
  1058. s++;
  1059. if (!strcmp(s, "app")) {
  1060. // a new app
  1061. app = callocz(sizeof(STATSD_APP), 1);
  1062. app->name = strdupz("unnamed");
  1063. app->rrd_memory_mode = localhost->rrd_memory_mode;
  1064. app->rrd_history_entries = localhost->rrd_history_entries;
  1065. app->next = statsd.apps;
  1066. statsd.apps = app;
  1067. chart = NULL;
  1068. dict = NULL;
  1069. {
  1070. char lineandfile[FILENAME_MAX + 1];
  1071. snprintfz(lineandfile, FILENAME_MAX, "%zu@%s", line, filename);
  1072. app->source = strdupz(lineandfile);
  1073. }
  1074. }
  1075. else if(app) {
  1076. if(!strcmp(s, "dictionary")) {
  1077. if(!app->dict)
  1078. app->dict = dictionary_create_advanced(DICT_OPTION_SINGLE_THREADED, &dictionary_stats_category_collectors, 0);
  1079. dict = app->dict;
  1080. }
  1081. else {
  1082. dict = NULL;
  1083. // a new chart
  1084. chart = callocz(sizeof(STATSD_APP_CHART), 1);
  1085. netdata_fix_chart_id(s);
  1086. chart->id = strdupz(s);
  1087. chart->name = strdupz(s);
  1088. chart->title = strdupz("Statsd chart");
  1089. chart->context = strdupz(s);
  1090. chart->family = strdupz("overview");
  1091. chart->units = strdupz("value");
  1092. chart->priority = NETDATA_CHART_PRIO_STATSD_PRIVATE;
  1093. chart->chart_type = RRDSET_TYPE_LINE;
  1094. chart->next = app->charts;
  1095. app->charts = chart;
  1096. if (!strncmp(
  1097. filename,
  1098. netdata_configured_stock_config_dir,
  1099. strlen(netdata_configured_stock_config_dir))) {
  1100. char tmpfilename[FILENAME_MAX + 1];
  1101. strncpyz(tmpfilename, filename, FILENAME_MAX);
  1102. chart->module = strdupz(basename(tmpfilename));
  1103. } else {
  1104. chart->module = strdupz("synthetic_chart");
  1105. }
  1106. }
  1107. }
  1108. else
  1109. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s', [app] is not defined.", line, s, filename);
  1110. continue;
  1111. }
  1112. if(!app) {
  1113. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s', it is outside all sections.", line, s, filename);
  1114. continue;
  1115. }
  1116. char *name = s;
  1117. char *value = strchr(s, '=');
  1118. if(!value) {
  1119. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s', there is no = in it.", line, s, filename);
  1120. continue;
  1121. }
  1122. *value = '\0';
  1123. value++;
  1124. name = trim(name);
  1125. value = trim(value);
  1126. if(!name || *name == '#') {
  1127. netdata_log_error("STATSD: ignoring line %zu of file '%s', name is empty.", line, filename);
  1128. continue;
  1129. }
  1130. if(!value) {
  1131. netdata_log_debug(D_CONFIG, "STATSD: ignoring line %zu of file '%s', value is empty.", line, filename);
  1132. continue;
  1133. }
  1134. if(unlikely(dict)) {
  1135. // parse [dictionary] members
  1136. dictionary_set(dict, name, value, strlen(value) + 1);
  1137. }
  1138. else if(!chart) {
  1139. // parse [app] members
  1140. if(!strcmp(name, "name")) {
  1141. freez((void *)app->name);
  1142. netdata_fix_chart_name(value);
  1143. app->name = strdupz(value);
  1144. }
  1145. else if (!strcmp(name, "metrics")) {
  1146. simple_pattern_free(app->metrics);
  1147. app->metrics = simple_pattern_create(value, NULL, SIMPLE_PATTERN_EXACT, true);
  1148. }
  1149. else if (!strcmp(name, "private charts")) {
  1150. if (!strcmp(value, "yes") || !strcmp(value, "on"))
  1151. app->default_options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1152. else
  1153. app->default_options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1154. }
  1155. else if (!strcmp(name, "gaps when not collected")) {
  1156. if (!strcmp(value, "yes") || !strcmp(value, "on"))
  1157. app->default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1158. }
  1159. else if (!strcmp(name, "memory mode")) {
  1160. // this is not supported anymore
  1161. // with the implementation of storage engines, all charts have the same storage engine always
  1162. // app->rrd_memory_mode = rrd_memory_mode_id(value);
  1163. ;
  1164. }
  1165. else if (!strcmp(name, "history")) {
  1166. app->rrd_history_entries = atol(value);
  1167. if (app->rrd_history_entries < 5)
  1168. app->rrd_history_entries = 5;
  1169. }
  1170. else {
  1171. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s'. Unknown keyword for the [app] section.", line, name, filename);
  1172. continue;
  1173. }
  1174. }
  1175. else {
  1176. // parse [chart] members
  1177. if(!strcmp(name, "name")) {
  1178. freez((void *)chart->name);
  1179. netdata_fix_chart_id(value);
  1180. chart->name = strdupz(value);
  1181. }
  1182. else if(!strcmp(name, "title")) {
  1183. freez((void *)chart->title);
  1184. chart->title = strdupz(value);
  1185. }
  1186. else if (!strcmp(name, "family")) {
  1187. freez((void *)chart->family);
  1188. chart->family = strdupz(value);
  1189. }
  1190. else if (!strcmp(name, "context")) {
  1191. freez((void *)chart->context);
  1192. netdata_fix_chart_id(value);
  1193. chart->context = strdupz(value);
  1194. }
  1195. else if (!strcmp(name, "units")) {
  1196. freez((void *)chart->units);
  1197. chart->units = strdupz(value);
  1198. }
  1199. else if (!strcmp(name, "priority")) {
  1200. chart->priority = atol(value);
  1201. }
  1202. else if (!strcmp(name, "type")) {
  1203. chart->chart_type = rrdset_type_id(value);
  1204. }
  1205. else if (!strcmp(name, "dimension")) {
  1206. // metric [name [type [multiplier [divisor]]]]
  1207. char *words[10] = { NULL };
  1208. size_t num_words = quoted_strings_splitter_pluginsd(value, words, 10);
  1209. int pattern = 0;
  1210. size_t i = 0;
  1211. char *metric_name = get_word(words, num_words, i++);
  1212. if(strcmp(metric_name, "pattern") == 0) {
  1213. metric_name = get_word(words, num_words, i++);
  1214. pattern = 1;
  1215. }
  1216. char *dim_name = get_word(words, num_words, i++);
  1217. char *type = get_word(words, num_words, i++);
  1218. char *multiplier = get_word(words, num_words, i++);
  1219. char *divisor = get_word(words, num_words, i++);
  1220. char *opts = get_word(words, num_words, i++);
  1221. RRDDIM_FLAGS flags = RRDDIM_FLAG_NONE;
  1222. RRDDIM_OPTIONS options = RRDDIM_OPTION_NONE;
  1223. if(opts && *opts) {
  1224. if(strstr(opts, "hidden") != NULL) options |= RRDDIM_OPTION_HIDDEN;
  1225. if(strstr(opts, "noreset") != NULL) options |= RRDDIM_OPTION_DONT_DETECT_RESETS_OR_OVERFLOWS;
  1226. if(strstr(opts, "nooverflow") != NULL) options |= RRDDIM_OPTION_DONT_DETECT_RESETS_OR_OVERFLOWS;
  1227. }
  1228. if(!pattern) {
  1229. if(app->dict) {
  1230. if(dim_name && *dim_name) {
  1231. char *n = dictionary_get(app->dict, dim_name);
  1232. if(n) dim_name = n;
  1233. }
  1234. else {
  1235. dim_name = dictionary_get(app->dict, metric_name);
  1236. }
  1237. }
  1238. if(!dim_name || !*dim_name)
  1239. dim_name = metric_name;
  1240. }
  1241. STATSD_APP_CHART_DIM *dim = add_dimension_to_app_chart(
  1242. app
  1243. , chart
  1244. , metric_name
  1245. , dim_name
  1246. , (multiplier && *multiplier)?str2l(multiplier):1
  1247. , (divisor && *divisor)?str2l(divisor):1
  1248. , flags
  1249. ,
  1250. options, string2valuetype(type, line, filename)
  1251. );
  1252. if(pattern)
  1253. dim->metric_pattern = simple_pattern_create(dim->metric, NULL, SIMPLE_PATTERN_EXACT, true);
  1254. }
  1255. else {
  1256. netdata_log_error("STATSD: ignoring line %zu ('%s') of file '%s'. Unknown keyword for the [%s] section.", line, name, filename, chart->id);
  1257. continue;
  1258. }
  1259. }
  1260. }
  1261. freez(buffer);
  1262. fclose(fp);
  1263. return 0;
  1264. }
  1265. static int statsd_file_callback(const char *filename, void *data) {
  1266. (void)data;
  1267. return statsd_readfile(filename, NULL, NULL, NULL);
  1268. }
  1269. static inline void statsd_readdir(const char *user_path, const char *stock_path, const char *subpath) {
  1270. recursive_config_double_dir_load(user_path, stock_path, subpath, statsd_file_callback, NULL, 0);
  1271. }
  1272. // --------------------------------------------------------------------------------------------------------------------
  1273. // send metrics to netdata - in private charts - called from the main thread
  1274. // extract chart type and chart id from metric name
  1275. static inline void statsd_get_metric_type_and_id(STATSD_METRIC *m, char *type, char *id, char *context, const char *metrictype, size_t len) {
  1276. // The full chart type.id looks like this:
  1277. // ${STATSD_CHART_PREFIX} + "_" + ${METRIC_NAME} + "_" + ${METRIC_TYPE}
  1278. //
  1279. // where:
  1280. // STATSD_CHART_PREFIX = "statsd" as defined above
  1281. // METRIC_NAME = whatever the user gave to statsd
  1282. // METRIC_TYPE = "gauge", "counter", "meter", "timer", "histogram", "set", "dictionary"
  1283. // for chart type, we want:
  1284. // ${STATSD_CHART_PREFIX} + "_" + the first word of ${METRIC_NAME}
  1285. // find the first word of ${METRIC_NAME}
  1286. char firstword[len + 1], *s = "";
  1287. strncpyz(firstword, m->name, len);
  1288. for (s = firstword; *s ; s++) {
  1289. if (unlikely(*s == '.' || *s == '_')) {
  1290. *s = '\0';
  1291. s++;
  1292. break;
  1293. }
  1294. }
  1295. // firstword has the first word of ${METRIC_NAME}
  1296. // s has the remaining, if any
  1297. // create the chart type:
  1298. snprintfz(type, len, STATSD_CHART_PREFIX "_%s", firstword);
  1299. // for chart id, we want:
  1300. // the remaining of the words of ${METRIC_NAME} + "_" + ${METRIC_TYPE}
  1301. // or the ${METRIC_NAME} has no remaining words, the ${METRIC_TYPE} alone
  1302. if(*s)
  1303. snprintfz(id, len, "%s_%s", s, metrictype);
  1304. else
  1305. snprintfz(id, len, "%s", metrictype);
  1306. // for the context, we want the full of both the above, separated with a dot (type.id):
  1307. snprintfz(context, RRD_ID_LENGTH_MAX, "%s.%s", type, id);
  1308. // make sure they don't have illegal characters
  1309. netdata_fix_chart_id(type);
  1310. netdata_fix_chart_id(id);
  1311. netdata_fix_chart_id(context);
  1312. }
  1313. static inline RRDSET *statsd_private_rrdset_create(
  1314. STATSD_METRIC *m __maybe_unused
  1315. , const char *type
  1316. , const char *id
  1317. , const char *name
  1318. , const char *family
  1319. , const char *context
  1320. , const char *title
  1321. , const char *units
  1322. , long priority
  1323. , int update_every
  1324. , RRDSET_TYPE chart_type
  1325. ) {
  1326. if(!m->st)
  1327. statsd.private_charts++;
  1328. RRDSET *st = rrdset_create_custom(
  1329. localhost // host
  1330. , type // type
  1331. , id // id
  1332. , name // name
  1333. , family // family
  1334. , context // context
  1335. , title // title
  1336. , units // units
  1337. , PLUGIN_STATSD_NAME // plugin
  1338. , "private_chart" // module
  1339. , priority // priority
  1340. , update_every // update every
  1341. , chart_type // chart type
  1342. , default_rrd_memory_mode // memory mode
  1343. , default_rrd_history_entries // history
  1344. );
  1345. rrdset_flag_set(st, RRDSET_FLAG_STORE_FIRST);
  1346. if(statsd.private_charts_hidden)
  1347. rrdset_flag_set(st, RRDSET_FLAG_HIDDEN);
  1348. // rrdset_flag_set(st, RRDSET_FLAG_DEBUG);
  1349. return st;
  1350. }
  1351. static inline void statsd_private_chart_gauge(STATSD_METRIC *m) {
  1352. netdata_log_debug(D_STATSD, "updating private chart for gauge metric '%s'", m->name);
  1353. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1354. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1355. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1356. statsd_get_metric_type_and_id(m, type, id, context, "gauge", RRD_ID_LENGTH_MAX);
  1357. char title[RRD_ID_LENGTH_MAX + 1];
  1358. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for gauge %s", m->name);
  1359. m->st = statsd_private_rrdset_create(
  1360. m
  1361. , type
  1362. , id
  1363. , NULL // name
  1364. , m->family?m->family:"gauges" // family (submenu)
  1365. , context // context
  1366. , title // title
  1367. , m->units?m->units:"value" // units
  1368. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1369. , statsd.update_every
  1370. , RRDSET_TYPE_LINE
  1371. );
  1372. m->rd_value = rrddim_add(m->st, "gauge", m->dimname?m->dimname:NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1373. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1374. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1375. }
  1376. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1377. if(m->rd_count)
  1378. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1379. rrdset_done(m->st);
  1380. }
  1381. static inline void statsd_private_chart_counter_or_meter(STATSD_METRIC *m, const char *dim, const char *family) {
  1382. netdata_log_debug(D_STATSD, "updating private chart for %s metric '%s'", dim, m->name);
  1383. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1384. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1385. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1386. statsd_get_metric_type_and_id(m, type, id, context, dim, RRD_ID_LENGTH_MAX);
  1387. char title[RRD_ID_LENGTH_MAX + 1];
  1388. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for %s %s", dim, m->name);
  1389. m->st = statsd_private_rrdset_create(
  1390. m
  1391. , type
  1392. , id
  1393. , NULL // name
  1394. , m->family?m->family:family // family (submenu)
  1395. , context // context
  1396. , title // title
  1397. , m->units?m->units:"events/s" // units
  1398. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1399. , statsd.update_every
  1400. , RRDSET_TYPE_AREA
  1401. );
  1402. m->rd_value = rrddim_add(m->st, dim, m->dimname?m->dimname:NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1403. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1404. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1405. }
  1406. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1407. if(m->rd_count)
  1408. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1409. rrdset_done(m->st);
  1410. }
  1411. static inline void statsd_private_chart_set(STATSD_METRIC *m) {
  1412. netdata_log_debug(D_STATSD, "updating private chart for set metric '%s'", m->name);
  1413. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1414. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1415. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1416. statsd_get_metric_type_and_id(m, type, id, context, "set", RRD_ID_LENGTH_MAX);
  1417. char title[RRD_ID_LENGTH_MAX + 1];
  1418. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for set %s", m->name);
  1419. m->st = statsd_private_rrdset_create(
  1420. m
  1421. , type
  1422. , id
  1423. , NULL // name
  1424. , m->family?m->family:"sets" // family (submenu)
  1425. , context // context
  1426. , title // title
  1427. , m->units?m->units:"entries" // units
  1428. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1429. , statsd.update_every
  1430. , RRDSET_TYPE_LINE
  1431. );
  1432. m->rd_value = rrddim_add(m->st, "set", m->dimname?m->dimname:"unique", 1, 1, RRD_ALGORITHM_ABSOLUTE);
  1433. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1434. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1435. }
  1436. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1437. if(m->rd_count)
  1438. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1439. rrdset_done(m->st);
  1440. }
  1441. static inline void statsd_private_chart_dictionary(STATSD_METRIC *m) {
  1442. netdata_log_debug(D_STATSD, "updating private chart for dictionary metric '%s'", m->name);
  1443. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1444. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1445. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1446. statsd_get_metric_type_and_id(m, type, id, context, "dictionary", RRD_ID_LENGTH_MAX);
  1447. char title[RRD_ID_LENGTH_MAX + 1];
  1448. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for dictionary %s", m->name);
  1449. m->st = statsd_private_rrdset_create(
  1450. m
  1451. , type
  1452. , id
  1453. , NULL // name
  1454. , m->family?m->family:"dictionaries" // family (submenu)
  1455. , context // context
  1456. , title // title
  1457. , m->units?m->units:"events/s" // units
  1458. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1459. , statsd.update_every
  1460. , RRDSET_TYPE_STACKED
  1461. );
  1462. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1463. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1464. }
  1465. STATSD_METRIC_DICTIONARY_ITEM *t;
  1466. dfe_start_read(m->dictionary.dict, t) {
  1467. if (!t->rd) t->rd = rrddim_add(m->st, t_dfe.name, NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1468. rrddim_set_by_pointer(m->st, t->rd, (collected_number)t->count);
  1469. }
  1470. dfe_done(t);
  1471. if(m->rd_count)
  1472. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1473. rrdset_done(m->st);
  1474. }
  1475. static inline void statsd_private_chart_timer_or_histogram(STATSD_METRIC *m, const char *dim, const char *family, const char *units) {
  1476. netdata_log_debug(D_STATSD, "updating private chart for %s metric '%s'", dim, m->name);
  1477. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1478. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1479. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1480. statsd_get_metric_type_and_id(m, type, id, context, dim, RRD_ID_LENGTH_MAX);
  1481. char title[RRD_ID_LENGTH_MAX + 1];
  1482. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for %s %s", dim, m->name);
  1483. m->st = statsd_private_rrdset_create(
  1484. m
  1485. , type
  1486. , id
  1487. , NULL // name
  1488. , m->family?m->family:family // family (submenu)
  1489. , context // context
  1490. , title // title
  1491. , m->units?m->units:units // units
  1492. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1493. , statsd.update_every
  1494. , RRDSET_TYPE_AREA
  1495. );
  1496. m->histogram.ext->rd_min = rrddim_add(m->st, "min", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1497. m->histogram.ext->rd_max = rrddim_add(m->st, "max", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1498. m->rd_value = rrddim_add(m->st, "average", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1499. m->histogram.ext->rd_percentile = rrddim_add(m->st, statsd.histogram_percentile_str, NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1500. m->histogram.ext->rd_median = rrddim_add(m->st, "median", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1501. m->histogram.ext->rd_stddev = rrddim_add(m->st, "stddev", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1502. //m->histogram.ext->rd_sum = rrddim_add(m->st, "sum", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1503. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1504. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1505. }
  1506. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_min, m->histogram.ext->last_min);
  1507. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_max, m->histogram.ext->last_max);
  1508. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_percentile, m->histogram.ext->last_percentile);
  1509. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_median, m->histogram.ext->last_median);
  1510. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_stddev, m->histogram.ext->last_stddev);
  1511. //rrddim_set_by_pointer(m->st, m->histogram.ext->rd_sum, m->histogram.ext->last_sum);
  1512. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1513. if(m->rd_count)
  1514. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1515. rrdset_done(m->st);
  1516. }
  1517. // --------------------------------------------------------------------------------------------------------------------
  1518. // statsd flush metrics
  1519. static inline void statsd_flush_gauge(STATSD_METRIC *m) {
  1520. netdata_log_debug(D_STATSD, "flushing gauge metric '%s'", m->name);
  1521. int updated = 0;
  1522. if(unlikely(!m->reset && m->count)) {
  1523. m->last = (collected_number) (m->gauge.value * statsd.decimal_detail);
  1524. m->reset = 1;
  1525. updated = 1;
  1526. }
  1527. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1528. statsd_private_chart_gauge(m);
  1529. }
  1530. static inline void statsd_flush_counter_or_meter(STATSD_METRIC *m, const char *dim, const char *family) {
  1531. netdata_log_debug(D_STATSD, "flushing %s metric '%s'", dim, m->name);
  1532. int updated = 0;
  1533. if(unlikely(!m->reset && m->count)) {
  1534. m->last = m->counter.value;
  1535. m->reset = 1;
  1536. updated = 1;
  1537. }
  1538. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1539. statsd_private_chart_counter_or_meter(m, dim, family);
  1540. }
  1541. static inline void statsd_flush_counter(STATSD_METRIC *m) {
  1542. statsd_flush_counter_or_meter(m, "counter", "counters");
  1543. }
  1544. static inline void statsd_flush_meter(STATSD_METRIC *m) {
  1545. statsd_flush_counter_or_meter(m, "meter", "meters");
  1546. }
  1547. static inline void statsd_flush_set(STATSD_METRIC *m) {
  1548. netdata_log_debug(D_STATSD, "flushing set metric '%s'", m->name);
  1549. int updated = 0;
  1550. if(unlikely(!m->reset && m->count)) {
  1551. m->last = (collected_number)dictionary_entries(m->set.dict);
  1552. m->reset = 1;
  1553. updated = 1;
  1554. }
  1555. else {
  1556. m->last = 0;
  1557. }
  1558. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1559. statsd_private_chart_set(m);
  1560. }
  1561. static inline void statsd_flush_dictionary(STATSD_METRIC *m) {
  1562. netdata_log_debug(D_STATSD, "flushing dictionary metric '%s'", m->name);
  1563. int updated = 0;
  1564. if(unlikely(!m->reset && m->count)) {
  1565. m->last = (collected_number)dictionary_entries(m->dictionary.dict);
  1566. m->reset = 1;
  1567. updated = 1;
  1568. }
  1569. else {
  1570. m->last = 0;
  1571. }
  1572. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1573. statsd_private_chart_dictionary(m);
  1574. if(dictionary_entries(m->dictionary.dict) >= statsd.dictionary_max_unique) {
  1575. if(!(m->options & STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED)) {
  1576. m->options |= STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED;
  1577. collector_info(
  1578. "STATSD dictionary '%s' reach max of %zu items - try increasing 'dictionaries max unique dimensions' in netdata.conf",
  1579. m->name,
  1580. dictionary_entries(m->dictionary.dict));
  1581. }
  1582. }
  1583. }
  1584. static inline void statsd_flush_timer_or_histogram(STATSD_METRIC *m, const char *dim, const char *family, const char *units) {
  1585. netdata_log_debug(D_STATSD, "flushing %s metric '%s'", dim, m->name);
  1586. int updated = 0;
  1587. if(unlikely(!m->reset && m->count && m->histogram.ext->used > 0)) {
  1588. netdata_mutex_lock(&m->histogram.ext->mutex);
  1589. size_t len = m->histogram.ext->used;
  1590. NETDATA_DOUBLE *series = m->histogram.ext->values;
  1591. sort_series(series, len);
  1592. m->histogram.ext->last_min = (collected_number)roundndd(series[0] * statsd.decimal_detail);
  1593. m->histogram.ext->last_max = (collected_number)roundndd(series[len - 1] * statsd.decimal_detail);
  1594. m->last = (collected_number)roundndd(average(series, len) * statsd.decimal_detail);
  1595. m->histogram.ext->last_median = (collected_number)roundndd(median_on_sorted_series(series, len) * statsd.decimal_detail);
  1596. m->histogram.ext->last_stddev = (collected_number)roundndd(standard_deviation(series, len) * statsd.decimal_detail);
  1597. m->histogram.ext->last_sum = (collected_number)roundndd(sum(series, len) * statsd.decimal_detail);
  1598. size_t pct_len = (size_t)floor((double)len * statsd.histogram_percentile / 100.0);
  1599. if(pct_len < 1)
  1600. m->histogram.ext->last_percentile = (collected_number)(series[0] * statsd.decimal_detail);
  1601. else
  1602. m->histogram.ext->last_percentile = (collected_number)roundndd(series[pct_len - 1] * statsd.decimal_detail);
  1603. netdata_mutex_unlock(&m->histogram.ext->mutex);
  1604. netdata_log_debug(D_STATSD, "STATSD %s metric %s: min " COLLECTED_NUMBER_FORMAT ", max " COLLECTED_NUMBER_FORMAT ", last " COLLECTED_NUMBER_FORMAT ", pcent " COLLECTED_NUMBER_FORMAT ", median " COLLECTED_NUMBER_FORMAT ", stddev " COLLECTED_NUMBER_FORMAT ", sum " COLLECTED_NUMBER_FORMAT,
  1605. dim, m->name, m->histogram.ext->last_min, m->histogram.ext->last_max, m->last, m->histogram.ext->last_percentile, m->histogram.ext->last_median, m->histogram.ext->last_stddev, m->histogram.ext->last_sum);
  1606. m->histogram.ext->zeroed = 0;
  1607. m->reset = 1;
  1608. updated = 1;
  1609. }
  1610. else if(unlikely(!m->histogram.ext->zeroed)) {
  1611. // reset the metrics
  1612. // if we collected anything, they will be updated below
  1613. // this ensures that we report zeros if nothing is collected
  1614. m->histogram.ext->last_min = 0;
  1615. m->histogram.ext->last_max = 0;
  1616. m->last = 0;
  1617. m->histogram.ext->last_median = 0;
  1618. m->histogram.ext->last_stddev = 0;
  1619. m->histogram.ext->last_sum = 0;
  1620. m->histogram.ext->last_percentile = 0;
  1621. m->histogram.ext->zeroed = 1;
  1622. }
  1623. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1624. statsd_private_chart_timer_or_histogram(m, dim, family, units);
  1625. }
  1626. static inline void statsd_flush_timer(STATSD_METRIC *m) {
  1627. statsd_flush_timer_or_histogram(m, "timer", "timers", "milliseconds");
  1628. }
  1629. static inline void statsd_flush_histogram(STATSD_METRIC *m) {
  1630. statsd_flush_timer_or_histogram(m, "histogram", "histograms", "value");
  1631. }
  1632. static inline RRD_ALGORITHM statsd_algorithm_for_metric(STATSD_METRIC *m) {
  1633. switch(m->type) {
  1634. default:
  1635. case STATSD_METRIC_TYPE_GAUGE:
  1636. case STATSD_METRIC_TYPE_SET:
  1637. case STATSD_METRIC_TYPE_TIMER:
  1638. case STATSD_METRIC_TYPE_HISTOGRAM:
  1639. return RRD_ALGORITHM_ABSOLUTE;
  1640. case STATSD_METRIC_TYPE_METER:
  1641. case STATSD_METRIC_TYPE_COUNTER:
  1642. case STATSD_METRIC_TYPE_DICTIONARY:
  1643. return RRD_ALGORITHM_INCREMENTAL;
  1644. }
  1645. }
  1646. static inline void link_metric_to_app_dimension(STATSD_APP *app, STATSD_METRIC *m, STATSD_APP_CHART *chart, STATSD_APP_CHART_DIM *dim) {
  1647. if(dim->value_type == STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS) {
  1648. dim->value_ptr = &m->events;
  1649. dim->algorithm = RRD_ALGORITHM_INCREMENTAL;
  1650. }
  1651. else if(m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  1652. dim->algorithm = RRD_ALGORITHM_ABSOLUTE;
  1653. dim->divisor *= statsd.decimal_detail;
  1654. switch(dim->value_type) {
  1655. case STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS:
  1656. // will never match - added to avoid warning
  1657. break;
  1658. case STATSD_APP_CHART_DIM_VALUE_TYPE_LAST:
  1659. case STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE:
  1660. dim->value_ptr = &m->last;
  1661. break;
  1662. case STATSD_APP_CHART_DIM_VALUE_TYPE_SUM:
  1663. dim->value_ptr = &m->histogram.ext->last_sum;
  1664. break;
  1665. case STATSD_APP_CHART_DIM_VALUE_TYPE_MIN:
  1666. dim->value_ptr = &m->histogram.ext->last_min;
  1667. break;
  1668. case STATSD_APP_CHART_DIM_VALUE_TYPE_MAX:
  1669. dim->value_ptr = &m->histogram.ext->last_max;
  1670. break;
  1671. case STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN:
  1672. dim->value_ptr = &m->histogram.ext->last_median;
  1673. break;
  1674. case STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE:
  1675. dim->value_ptr = &m->histogram.ext->last_percentile;
  1676. break;
  1677. case STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV:
  1678. dim->value_ptr = &m->histogram.ext->last_stddev;
  1679. break;
  1680. }
  1681. }
  1682. else {
  1683. if (dim->value_type != STATSD_APP_CHART_DIM_VALUE_TYPE_LAST)
  1684. netdata_log_error("STATSD: unsupported value type for dimension '%s' of chart '%s' of app '%s' on metric '%s'", dim->name, chart->id, app->name, m->name);
  1685. dim->value_ptr = &m->last;
  1686. dim->algorithm = statsd_algorithm_for_metric(m);
  1687. if(m->type == STATSD_METRIC_TYPE_GAUGE)
  1688. dim->divisor *= statsd.decimal_detail;
  1689. }
  1690. if(unlikely(chart->st && dim->rd)) {
  1691. rrddim_set_algorithm(chart->st, dim->rd, dim->algorithm);
  1692. rrddim_set_multiplier(chart->st, dim->rd, dim->multiplier);
  1693. rrddim_set_divisor(chart->st, dim->rd, dim->divisor);
  1694. }
  1695. chart->dimensions_linked_count++;
  1696. m->options |= STATSD_METRIC_OPTION_USED_IN_APPS;
  1697. netdata_log_debug(D_STATSD, "metric '%s' of type %u linked with app '%s', chart '%s', dimension '%s', algorithm '%s'", m->name, m->type, app->name, chart->id, dim->name, rrd_algorithm_name(dim->algorithm));
  1698. }
  1699. static inline void check_if_metric_is_for_app(STATSD_INDEX *index, STATSD_METRIC *m) {
  1700. (void)index;
  1701. STATSD_APP *app;
  1702. for(app = statsd.apps; app ;app = app->next) {
  1703. if(unlikely(simple_pattern_matches(app->metrics, m->name))) {
  1704. netdata_log_debug(D_STATSD, "metric '%s' matches app '%s'", m->name, app->name);
  1705. // the metric should get the options from the app
  1706. if(app->default_options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED)
  1707. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1708. else
  1709. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1710. if(app->default_options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED)
  1711. m->options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1712. else
  1713. m->options &= ~STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1714. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED;
  1715. // check if there is a chart in this app, willing to get this metric
  1716. STATSD_APP_CHART *chart;
  1717. for(chart = app->charts; chart; chart = chart->next) {
  1718. STATSD_APP_CHART_DIM *dim;
  1719. for(dim = chart->dimensions; dim ; dim = dim->next) {
  1720. if(unlikely(dim->metric_pattern)) {
  1721. size_t dim_name_len = strlen(dim->name);
  1722. size_t wildcarded_len = dim_name_len + strlen(m->name) + 1;
  1723. char wildcarded[wildcarded_len];
  1724. strcpy(wildcarded, dim->name);
  1725. char *ws = &wildcarded[dim_name_len];
  1726. if(simple_pattern_matches_extract(dim->metric_pattern, m->name, ws, wildcarded_len - dim_name_len) == SP_MATCHED_POSITIVE) {
  1727. char *final_name = NULL;
  1728. if(app->dict) {
  1729. if(likely(*wildcarded)) {
  1730. // use the name of the wildcarded string
  1731. final_name = dictionary_get(app->dict, wildcarded);
  1732. }
  1733. if(unlikely(!final_name)) {
  1734. // use the name of the metric
  1735. final_name = dictionary_get(app->dict, m->name);
  1736. }
  1737. }
  1738. if(unlikely(!final_name))
  1739. final_name = wildcarded;
  1740. add_dimension_to_app_chart(
  1741. app
  1742. , chart
  1743. , m->name
  1744. , final_name
  1745. , dim->multiplier
  1746. , dim->divisor
  1747. , dim->flags
  1748. , dim->options
  1749. , dim->value_type
  1750. );
  1751. // the new dimension is appended to the list
  1752. // so, it will be matched and linked later too
  1753. }
  1754. }
  1755. else if(!dim->value_ptr && dim->metric_hash == m->hash && !strcmp(dim->metric, m->name)) {
  1756. // we have a match - this metric should be linked to this dimension
  1757. link_metric_to_app_dimension(app, m, chart, dim);
  1758. }
  1759. }
  1760. }
  1761. }
  1762. }
  1763. }
  1764. static inline RRDDIM *statsd_add_dim_to_app_chart(STATSD_APP *app, STATSD_APP_CHART *chart, STATSD_APP_CHART_DIM *dim) {
  1765. (void)app;
  1766. // allow the same statsd metric to be added multiple times to the same chart
  1767. STATSD_APP_CHART_DIM *tdim;
  1768. size_t count_same_metric = 0, count_same_metric_value_type = 0;
  1769. size_t pos_same_metric_value_type = 0;
  1770. for (tdim = chart->dimensions; tdim && tdim->next; tdim = tdim->next) {
  1771. if (dim->metric_hash == tdim->metric_hash && !strcmp(dim->metric, tdim->metric)) {
  1772. count_same_metric++;
  1773. if(dim->value_type == tdim->value_type) {
  1774. count_same_metric_value_type++;
  1775. if (tdim == dim)
  1776. pos_same_metric_value_type = count_same_metric_value_type;
  1777. }
  1778. }
  1779. }
  1780. if(count_same_metric > 1) {
  1781. // the same metric is found multiple times
  1782. size_t len = strlen(dim->metric) + 100;
  1783. char metric[ len + 1 ];
  1784. if(count_same_metric_value_type > 1) {
  1785. // the same metric, with the same value type, is added multiple times
  1786. snprintfz(metric, len, "%s_%s%zu", dim->metric, valuetype2string(dim->value_type), pos_same_metric_value_type);
  1787. }
  1788. else {
  1789. // the same metric, with different value type is added
  1790. snprintfz(metric, len, "%s_%s", dim->metric, valuetype2string(dim->value_type));
  1791. }
  1792. dim->rd = rrddim_add(chart->st, metric, dim->name, dim->multiplier, dim->divisor, dim->algorithm);
  1793. if(dim->flags != RRDDIM_FLAG_NONE) dim->rd->flags |= dim->flags;
  1794. if(dim->options != RRDDIM_OPTION_NONE) dim->rd->collector.options |= dim->options;
  1795. return dim->rd;
  1796. }
  1797. dim->rd = rrddim_add(chart->st, dim->metric, dim->name, dim->multiplier, dim->divisor, dim->algorithm);
  1798. if(dim->flags != RRDDIM_FLAG_NONE) dim->rd->flags |= dim->flags;
  1799. if(dim->options != RRDDIM_OPTION_NONE) dim->rd->collector.options |= dim->options;
  1800. return dim->rd;
  1801. }
  1802. static inline void statsd_update_app_chart(STATSD_APP *app, STATSD_APP_CHART *chart) {
  1803. netdata_log_debug(D_STATSD, "updating chart '%s' for app '%s'", chart->id, app->name);
  1804. if(!chart->st) {
  1805. chart->st = rrdset_create_custom(
  1806. localhost // host
  1807. , app->name // type
  1808. , chart->id // id
  1809. , chart->name // name
  1810. , chart->family // family
  1811. , chart->context // context
  1812. , chart->title // title
  1813. , chart->units // units
  1814. , PLUGIN_STATSD_NAME // plugin
  1815. , chart->module // module
  1816. , chart->priority // priority
  1817. , statsd.update_every // update every
  1818. , chart->chart_type // chart type
  1819. , app->rrd_memory_mode // memory mode
  1820. , app->rrd_history_entries // history
  1821. );
  1822. rrdset_flag_set(chart->st, RRDSET_FLAG_STORE_FIRST);
  1823. // rrdset_flag_set(chart->st, RRDSET_FLAG_DEBUG);
  1824. }
  1825. STATSD_APP_CHART_DIM *dim;
  1826. for(dim = chart->dimensions; dim ;dim = dim->next) {
  1827. if(likely(!dim->metric_pattern)) {
  1828. if (unlikely(!dim->rd))
  1829. statsd_add_dim_to_app_chart(app, chart, dim);
  1830. if (unlikely(dim->value_ptr)) {
  1831. netdata_log_debug(D_STATSD, "updating dimension '%s' (%s) of chart '%s' (%s) for app '%s' with value " COLLECTED_NUMBER_FORMAT, dim->name, rrddim_id(dim->rd), chart->id, rrdset_id(chart->st), app->name, *dim->value_ptr);
  1832. rrddim_set_by_pointer(chart->st, dim->rd, *dim->value_ptr);
  1833. }
  1834. }
  1835. }
  1836. rrdset_done(chart->st);
  1837. netdata_log_debug(D_STATSD, "completed update of chart '%s' for app '%s'", chart->id, app->name);
  1838. }
  1839. static inline void statsd_update_all_app_charts(void) {
  1840. // netdata_log_debug(D_STATSD, "updating app charts");
  1841. STATSD_APP *app;
  1842. for(app = statsd.apps; app ;app = app->next) {
  1843. // netdata_log_debug(D_STATSD, "updating charts for app '%s'", app->name);
  1844. STATSD_APP_CHART *chart;
  1845. for(chart = app->charts; chart ;chart = chart->next) {
  1846. if(unlikely(chart->dimensions_linked_count)) {
  1847. statsd_update_app_chart(app, chart);
  1848. }
  1849. }
  1850. }
  1851. // netdata_log_debug(D_STATSD, "completed update of app charts");
  1852. }
  1853. const char *statsd_metric_type_string(STATSD_METRIC_TYPE type) {
  1854. switch(type) {
  1855. case STATSD_METRIC_TYPE_COUNTER: return "counter";
  1856. case STATSD_METRIC_TYPE_GAUGE: return "gauge";
  1857. case STATSD_METRIC_TYPE_HISTOGRAM: return "histogram";
  1858. case STATSD_METRIC_TYPE_METER: return "meter";
  1859. case STATSD_METRIC_TYPE_SET: return "set";
  1860. case STATSD_METRIC_TYPE_DICTIONARY: return "dictionary";
  1861. case STATSD_METRIC_TYPE_TIMER: return "timer";
  1862. default: return "unknown";
  1863. }
  1864. }
  1865. static inline void statsd_flush_index_metrics(STATSD_INDEX *index, void (*flush_metric)(STATSD_METRIC *)) {
  1866. STATSD_METRIC *m;
  1867. // find the useful metrics (incremental = each time we are called, we check the new metrics only)
  1868. dfe_start_read(index->dict, m) {
  1869. // since we add new metrics at the beginning
  1870. // check for useful charts, until the point we last checked
  1871. if(unlikely(is_metric_checked(m))) break;
  1872. if(unlikely(!(m->options & STATSD_METRIC_OPTION_CHECKED_IN_APPS))) {
  1873. netdata_log_access("NEW STATSD METRIC '%s': '%s'", statsd_metric_type_string(m->type), m->name);
  1874. check_if_metric_is_for_app(index, m);
  1875. m->options |= STATSD_METRIC_OPTION_CHECKED_IN_APPS;
  1876. }
  1877. if(unlikely(!(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED))) {
  1878. if(unlikely(statsd.private_charts >= statsd.max_private_charts_hard)) {
  1879. netdata_log_debug(D_STATSD, "STATSD: metric '%s' will not be charted, because the hard limit of the maximum number "
  1880. "of charts has been reached.", m->name);
  1881. collector_info("STATSD: metric '%s' will not be charted, because the hard limit of the maximum number "
  1882. "of charts (%u) has been reached. Increase the number of charts by editing netdata.conf, "
  1883. "[statsd] section.", m->name, statsd.max_private_charts_hard);
  1884. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1885. }
  1886. else {
  1887. if (simple_pattern_matches(statsd.charts_for, m->name)) {
  1888. netdata_log_debug(D_STATSD, "STATSD: metric '%s' will be charted.", m->name);
  1889. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1890. } else {
  1891. netdata_log_debug(D_STATSD, "STATSD: metric '%s' will not be charted.", m->name);
  1892. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1893. }
  1894. }
  1895. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED;
  1896. }
  1897. // mark it as checked
  1898. m->options |= STATSD_METRIC_OPTION_CHECKED;
  1899. // check if it is used in charts
  1900. if((m->options & (STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED|STATSD_METRIC_OPTION_USED_IN_APPS)) && !(m->options & STATSD_METRIC_OPTION_USEFUL)) {
  1901. m->options |= STATSD_METRIC_OPTION_USEFUL;
  1902. index->useful++;
  1903. m->next_useful = index->first_useful;
  1904. index->first_useful = m;
  1905. }
  1906. }
  1907. dfe_done(m);
  1908. // flush all the useful metrics
  1909. for(m = index->first_useful; m ; m = m->next_useful) {
  1910. flush_metric(m);
  1911. }
  1912. }
  1913. // --------------------------------------------------------------------------------------
  1914. // statsd main thread
  1915. static int statsd_listen_sockets_setup(void) {
  1916. return listen_sockets_setup(&statsd.sockets);
  1917. }
  1918. static void statsd_main_cleanup(void *data) {
  1919. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)data;
  1920. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  1921. collector_info("cleaning up...");
  1922. if (statsd.collection_threads_status) {
  1923. int i;
  1924. for (i = 0; i < statsd.threads; i++) {
  1925. spinlock_lock(&statsd.collection_threads_status[i].spinlock);
  1926. if(statsd.collection_threads_status[i].running) {
  1927. collector_info("STATSD: stopping data collection thread %d...", i + 1);
  1928. netdata_thread_cancel(statsd.collection_threads_status[i].thread);
  1929. }
  1930. else {
  1931. collector_info("STATSD: data collection thread %d found stopped.", i + 1);
  1932. }
  1933. spinlock_unlock(&statsd.collection_threads_status[i].spinlock);
  1934. }
  1935. }
  1936. collector_info("STATSD: closing sockets...");
  1937. listen_sockets_close(&statsd.sockets);
  1938. // destroy the dictionaries
  1939. dictionary_destroy(statsd.gauges.dict);
  1940. dictionary_destroy(statsd.meters.dict);
  1941. dictionary_destroy(statsd.counters.dict);
  1942. dictionary_destroy(statsd.histograms.dict);
  1943. dictionary_destroy(statsd.dictionaries.dict);
  1944. dictionary_destroy(statsd.sets.dict);
  1945. dictionary_destroy(statsd.timers.dict);
  1946. collector_info("STATSD: cleanup completed.");
  1947. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  1948. worker_unregister();
  1949. }
  1950. #define WORKER_STATSD_FLUSH_GAUGES 0
  1951. #define WORKER_STATSD_FLUSH_COUNTERS 1
  1952. #define WORKER_STATSD_FLUSH_METERS 2
  1953. #define WORKER_STATSD_FLUSH_TIMERS 3
  1954. #define WORKER_STATSD_FLUSH_HISTOGRAMS 4
  1955. #define WORKER_STATSD_FLUSH_SETS 5
  1956. #define WORKER_STATSD_FLUSH_DICTIONARIES 6
  1957. #define WORKER_STATSD_FLUSH_STATS 7
  1958. #if WORKER_UTILIZATION_MAX_JOB_TYPES < 8
  1959. #error WORKER_UTILIZATION_MAX_JOB_TYPES has to be at least 8
  1960. #endif
  1961. void *statsd_main(void *ptr) {
  1962. worker_register("STATSDFLUSH");
  1963. worker_register_job_name(WORKER_STATSD_FLUSH_GAUGES, "gauges");
  1964. worker_register_job_name(WORKER_STATSD_FLUSH_COUNTERS, "counters");
  1965. worker_register_job_name(WORKER_STATSD_FLUSH_METERS, "meters");
  1966. worker_register_job_name(WORKER_STATSD_FLUSH_TIMERS, "timers");
  1967. worker_register_job_name(WORKER_STATSD_FLUSH_HISTOGRAMS, "histograms");
  1968. worker_register_job_name(WORKER_STATSD_FLUSH_SETS, "sets");
  1969. worker_register_job_name(WORKER_STATSD_FLUSH_DICTIONARIES, "dictionaries");
  1970. worker_register_job_name(WORKER_STATSD_FLUSH_STATS, "statistics");
  1971. netdata_thread_cleanup_push(statsd_main_cleanup, ptr);
  1972. statsd.gauges.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1973. statsd.meters.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1974. statsd.counters.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1975. statsd.histograms.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1976. statsd.dictionaries.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1977. statsd.sets.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1978. statsd.timers.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1979. dictionary_register_insert_callback(statsd.gauges.dict, dictionary_metric_insert_callback, &statsd.gauges);
  1980. dictionary_register_insert_callback(statsd.meters.dict, dictionary_metric_insert_callback, &statsd.meters);
  1981. dictionary_register_insert_callback(statsd.counters.dict, dictionary_metric_insert_callback, &statsd.counters);
  1982. dictionary_register_insert_callback(statsd.histograms.dict, dictionary_metric_insert_callback, &statsd.histograms);
  1983. dictionary_register_insert_callback(statsd.dictionaries.dict, dictionary_metric_insert_callback, &statsd.dictionaries);
  1984. dictionary_register_insert_callback(statsd.sets.dict, dictionary_metric_insert_callback, &statsd.sets);
  1985. dictionary_register_insert_callback(statsd.timers.dict, dictionary_metric_insert_callback, &statsd.timers);
  1986. dictionary_register_delete_callback(statsd.gauges.dict, dictionary_metric_delete_callback, &statsd.gauges);
  1987. dictionary_register_delete_callback(statsd.meters.dict, dictionary_metric_delete_callback, &statsd.meters);
  1988. dictionary_register_delete_callback(statsd.counters.dict, dictionary_metric_delete_callback, &statsd.counters);
  1989. dictionary_register_delete_callback(statsd.histograms.dict, dictionary_metric_delete_callback, &statsd.histograms);
  1990. dictionary_register_delete_callback(statsd.dictionaries.dict, dictionary_metric_delete_callback, &statsd.dictionaries);
  1991. dictionary_register_delete_callback(statsd.sets.dict, dictionary_metric_delete_callback, &statsd.sets);
  1992. dictionary_register_delete_callback(statsd.timers.dict, dictionary_metric_delete_callback, &statsd.timers);
  1993. // ----------------------------------------------------------------------------------------------------------------
  1994. // statsd configuration
  1995. statsd.enabled = config_get_boolean(CONFIG_SECTION_PLUGINS, "statsd", statsd.enabled);
  1996. statsd.update_every = default_rrd_update_every;
  1997. statsd.update_every = (int)config_get_number(CONFIG_SECTION_STATSD, "update every (flushInterval)", statsd.update_every);
  1998. if(statsd.update_every < default_rrd_update_every) {
  1999. collector_error("STATSD: minimum flush interval %d given, but the minimum is the update every of netdata. Using %d", statsd.update_every, default_rrd_update_every);
  2000. statsd.update_every = default_rrd_update_every;
  2001. }
  2002. #ifdef HAVE_RECVMMSG
  2003. statsd.recvmmsg_size = (size_t)config_get_number(CONFIG_SECTION_STATSD, "udp messages to process at once", (long long)statsd.recvmmsg_size);
  2004. #endif
  2005. statsd.charts_for = simple_pattern_create(
  2006. config_get(CONFIG_SECTION_STATSD, "create private charts for metrics matching", "*"), NULL,
  2007. SIMPLE_PATTERN_EXACT, true);
  2008. statsd.max_private_charts_hard = (size_t)config_get_number(CONFIG_SECTION_STATSD, "max private charts hard limit", (long long)statsd.max_private_charts_hard);
  2009. statsd.decimal_detail = (collected_number)config_get_number(CONFIG_SECTION_STATSD, "decimal detail", (long long int)statsd.decimal_detail);
  2010. statsd.tcp_idle_timeout = (size_t) config_get_number(CONFIG_SECTION_STATSD, "disconnect idle tcp clients after seconds", (long long int)statsd.tcp_idle_timeout);
  2011. statsd.private_charts_hidden = (unsigned int)config_get_boolean(CONFIG_SECTION_STATSD, "private charts hidden", statsd.private_charts_hidden);
  2012. statsd.histogram_percentile = (double)config_get_float(CONFIG_SECTION_STATSD, "histograms and timers percentile (percentThreshold)", statsd.histogram_percentile);
  2013. if(isless(statsd.histogram_percentile, 0) || isgreater(statsd.histogram_percentile, 100)) {
  2014. collector_error("STATSD: invalid histograms and timers percentile %0.5f given", statsd.histogram_percentile);
  2015. statsd.histogram_percentile = 95.0;
  2016. }
  2017. {
  2018. char buffer[314 + 1];
  2019. snprintfz(buffer, 314, "%0.1f%%", statsd.histogram_percentile);
  2020. statsd.histogram_percentile_str = strdupz(buffer);
  2021. }
  2022. statsd.dictionary_max_unique = config_get_number(CONFIG_SECTION_STATSD, "dictionaries max unique dimensions", statsd.dictionary_max_unique);
  2023. if(config_get_boolean(CONFIG_SECTION_STATSD, "add dimension for number of events received", 0)) {
  2024. statsd.gauges.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2025. statsd.counters.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2026. statsd.meters.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2027. statsd.sets.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2028. statsd.histograms.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2029. statsd.timers.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2030. statsd.dictionaries.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2031. }
  2032. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on gauges (deleteGauges)", 0))
  2033. statsd.gauges.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2034. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on counters (deleteCounters)", 0))
  2035. statsd.counters.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2036. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on meters (deleteMeters)", 0))
  2037. statsd.meters.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2038. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on sets (deleteSets)", 0))
  2039. statsd.sets.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2040. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on histograms (deleteHistograms)", 0))
  2041. statsd.histograms.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2042. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on timers (deleteTimers)", 0))
  2043. statsd.timers.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2044. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on dictionaries (deleteDictionaries)", 0))
  2045. statsd.dictionaries.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2046. size_t max_sockets = (size_t)config_get_number(CONFIG_SECTION_STATSD, "statsd server max TCP sockets", (long long int)(rlimit_nofile.rlim_cur / 4));
  2047. #ifdef STATSD_MULTITHREADED
  2048. statsd.threads = (int)config_get_number(CONFIG_SECTION_STATSD, "threads", processors);
  2049. if(statsd.threads < 1) {
  2050. collector_error("STATSD: Invalid number of threads %d, using %d", statsd.threads, processors);
  2051. statsd.threads = processors;
  2052. config_set_number(CONFIG_SECTION_STATSD, "collector threads", statsd.threads);
  2053. }
  2054. #else
  2055. statsd.threads = 1;
  2056. #endif
  2057. // read custom application definitions
  2058. statsd_readdir(netdata_configured_user_config_dir, netdata_configured_stock_config_dir, "statsd.d");
  2059. // ----------------------------------------------------------------------------------------------------------------
  2060. // statsd setup
  2061. if(!statsd.enabled) goto cleanup;
  2062. statsd_listen_sockets_setup();
  2063. if(!statsd.sockets.opened) {
  2064. collector_error("STATSD: No statsd sockets to listen to. statsd will be disabled.");
  2065. goto cleanup;
  2066. }
  2067. statsd.collection_threads_status = callocz((size_t)statsd.threads, sizeof(struct collection_thread_status));
  2068. int i;
  2069. for(i = 0; i < statsd.threads ;i++) {
  2070. statsd.collection_threads_status[i].max_sockets = max_sockets / statsd.threads;
  2071. char tag[NETDATA_THREAD_TAG_MAX + 1];
  2072. snprintfz(tag, NETDATA_THREAD_TAG_MAX, "STATSD_IN[%d]", i + 1);
  2073. spinlock_init(&statsd.collection_threads_status[i].spinlock);
  2074. netdata_thread_create(&statsd.collection_threads_status[i].thread, tag, NETDATA_THREAD_OPTION_DEFAULT, statsd_collector_thread, &statsd.collection_threads_status[i]);
  2075. }
  2076. // ----------------------------------------------------------------------------------------------------------------
  2077. // statsd monitoring charts
  2078. RRDSET *st_metrics = NULL;
  2079. RRDDIM *rd_metrics_gauge = NULL;
  2080. RRDDIM *rd_metrics_counter = NULL;
  2081. RRDDIM *rd_metrics_timer = NULL;
  2082. RRDDIM *rd_metrics_meter = NULL;
  2083. RRDDIM *rd_metrics_histogram = NULL;
  2084. RRDDIM *rd_metrics_set = NULL;
  2085. RRDDIM *rd_metrics_dictionary = NULL;
  2086. RRDSET *st_useful_metrics = NULL;
  2087. RRDDIM *rd_useful_metrics_gauge = NULL;
  2088. RRDDIM *rd_useful_metrics_counter = NULL;
  2089. RRDDIM *rd_useful_metrics_timer = NULL;
  2090. RRDDIM *rd_useful_metrics_meter = NULL;
  2091. RRDDIM *rd_useful_metrics_histogram = NULL;
  2092. RRDDIM *rd_useful_metrics_set = NULL;
  2093. RRDDIM *rd_useful_metrics_dictionary = NULL;
  2094. RRDSET *st_events = NULL;
  2095. RRDDIM *rd_events_gauge = NULL;
  2096. RRDDIM *rd_events_counter = NULL;
  2097. RRDDIM *rd_events_timer = NULL;
  2098. RRDDIM *rd_events_meter = NULL;
  2099. RRDDIM *rd_events_histogram = NULL;
  2100. RRDDIM *rd_events_set = NULL;
  2101. RRDDIM *rd_events_dictionary = NULL;
  2102. RRDDIM *rd_events_unknown = NULL;
  2103. RRDDIM *rd_events_errors = NULL;
  2104. RRDSET *st_reads = NULL;
  2105. RRDDIM *rd_reads_tcp = NULL;
  2106. RRDDIM *rd_reads_udp = NULL;
  2107. RRDSET *st_bytes = NULL;
  2108. RRDDIM *rd_bytes_tcp = NULL;
  2109. RRDDIM *rd_bytes_udp = NULL;
  2110. RRDSET *st_packets = NULL;
  2111. RRDDIM *rd_packets_tcp = NULL;
  2112. RRDDIM *rd_packets_udp = NULL;
  2113. RRDSET *st_tcp_connects = NULL;
  2114. RRDDIM *rd_tcp_connects = NULL;
  2115. RRDDIM *rd_tcp_disconnects = NULL;
  2116. RRDSET *st_tcp_connected = NULL;
  2117. RRDDIM *rd_tcp_connected = NULL;
  2118. RRDSET *st_pcharts = NULL;
  2119. RRDDIM *rd_pcharts = NULL;
  2120. if(global_statistics_enabled) {
  2121. st_metrics = rrdset_create_localhost(
  2122. "netdata",
  2123. "statsd_metrics",
  2124. NULL,
  2125. "statsd",
  2126. NULL,
  2127. "Metrics in the netdata statsd database",
  2128. "metrics",
  2129. PLUGIN_STATSD_NAME,
  2130. "stats",
  2131. 132010,
  2132. statsd.update_every,
  2133. RRDSET_TYPE_STACKED);
  2134. rd_metrics_gauge = rrddim_add(st_metrics, "gauges", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2135. rd_metrics_counter = rrddim_add(st_metrics, "counters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2136. rd_metrics_timer = rrddim_add(st_metrics, "timers", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2137. rd_metrics_meter = rrddim_add(st_metrics, "meters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2138. rd_metrics_histogram = rrddim_add(st_metrics, "histograms", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2139. rd_metrics_set = rrddim_add(st_metrics, "sets", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2140. rd_metrics_dictionary = rrddim_add(st_metrics, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2141. st_useful_metrics = rrdset_create_localhost(
  2142. "netdata",
  2143. "statsd_useful_metrics",
  2144. NULL,
  2145. "statsd",
  2146. NULL,
  2147. "Useful metrics in the netdata statsd database",
  2148. "metrics",
  2149. PLUGIN_STATSD_NAME,
  2150. "stats",
  2151. 132010,
  2152. statsd.update_every,
  2153. RRDSET_TYPE_STACKED);
  2154. rd_useful_metrics_gauge = rrddim_add(st_useful_metrics, "gauges", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2155. rd_useful_metrics_counter = rrddim_add(st_useful_metrics, "counters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2156. rd_useful_metrics_timer = rrddim_add(st_useful_metrics, "timers", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2157. rd_useful_metrics_meter = rrddim_add(st_useful_metrics, "meters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2158. rd_useful_metrics_histogram = rrddim_add(st_useful_metrics, "histograms", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2159. rd_useful_metrics_set = rrddim_add(st_useful_metrics, "sets", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2160. rd_useful_metrics_dictionary = rrddim_add(st_useful_metrics, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2161. st_events = rrdset_create_localhost(
  2162. "netdata",
  2163. "statsd_events",
  2164. NULL,
  2165. "statsd",
  2166. NULL,
  2167. "Events processed by the netdata statsd server",
  2168. "events/s",
  2169. PLUGIN_STATSD_NAME,
  2170. "stats",
  2171. 132011,
  2172. statsd.update_every,
  2173. RRDSET_TYPE_STACKED);
  2174. rd_events_gauge = rrddim_add(st_events, "gauges", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2175. rd_events_counter = rrddim_add(st_events, "counters", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2176. rd_events_timer = rrddim_add(st_events, "timers", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2177. rd_events_meter = rrddim_add(st_events, "meters", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2178. rd_events_histogram = rrddim_add(st_events, "histograms", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2179. rd_events_set = rrddim_add(st_events, "sets", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2180. rd_events_dictionary = rrddim_add(st_events, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2181. rd_events_unknown = rrddim_add(st_events, "unknown", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2182. rd_events_errors = rrddim_add(st_events, "errors", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2183. st_reads = rrdset_create_localhost(
  2184. "netdata",
  2185. "statsd_reads",
  2186. NULL,
  2187. "statsd",
  2188. NULL,
  2189. "Read operations made by the netdata statsd server",
  2190. "reads/s",
  2191. PLUGIN_STATSD_NAME,
  2192. "stats",
  2193. 132012,
  2194. statsd.update_every,
  2195. RRDSET_TYPE_STACKED);
  2196. rd_reads_tcp = rrddim_add(st_reads, "tcp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2197. rd_reads_udp = rrddim_add(st_reads, "udp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2198. st_bytes = rrdset_create_localhost(
  2199. "netdata",
  2200. "statsd_bytes",
  2201. NULL,
  2202. "statsd",
  2203. NULL,
  2204. "Bytes read by the netdata statsd server",
  2205. "kilobits/s",
  2206. PLUGIN_STATSD_NAME,
  2207. "stats",
  2208. 132013,
  2209. statsd.update_every,
  2210. RRDSET_TYPE_STACKED);
  2211. rd_bytes_tcp = rrddim_add(st_bytes, "tcp", NULL, 8, BITS_IN_A_KILOBIT, RRD_ALGORITHM_INCREMENTAL);
  2212. rd_bytes_udp = rrddim_add(st_bytes, "udp", NULL, 8, BITS_IN_A_KILOBIT, RRD_ALGORITHM_INCREMENTAL);
  2213. st_packets = rrdset_create_localhost(
  2214. "netdata",
  2215. "statsd_packets",
  2216. NULL,
  2217. "statsd",
  2218. NULL,
  2219. "Network packets processed by the netdata statsd server",
  2220. "packets/s",
  2221. PLUGIN_STATSD_NAME,
  2222. "stats",
  2223. 132014,
  2224. statsd.update_every,
  2225. RRDSET_TYPE_STACKED);
  2226. rd_packets_tcp = rrddim_add(st_packets, "tcp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2227. rd_packets_udp = rrddim_add(st_packets, "udp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2228. st_tcp_connects = rrdset_create_localhost(
  2229. "netdata",
  2230. "tcp_connects",
  2231. NULL,
  2232. "statsd",
  2233. NULL,
  2234. "statsd server TCP connects and disconnects",
  2235. "events",
  2236. PLUGIN_STATSD_NAME,
  2237. "stats",
  2238. 132015,
  2239. statsd.update_every,
  2240. RRDSET_TYPE_LINE);
  2241. rd_tcp_connects = rrddim_add(st_tcp_connects, "connects", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2242. rd_tcp_disconnects = rrddim_add(st_tcp_connects, "disconnects", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  2243. st_tcp_connected = rrdset_create_localhost(
  2244. "netdata",
  2245. "tcp_connected",
  2246. NULL,
  2247. "statsd",
  2248. NULL,
  2249. "statsd server TCP connected sockets",
  2250. "sockets",
  2251. PLUGIN_STATSD_NAME,
  2252. "stats",
  2253. 132016,
  2254. statsd.update_every,
  2255. RRDSET_TYPE_LINE);
  2256. rd_tcp_connected = rrddim_add(st_tcp_connected, "connected", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2257. st_pcharts = rrdset_create_localhost(
  2258. "netdata",
  2259. "private_charts",
  2260. NULL,
  2261. "statsd",
  2262. NULL,
  2263. "Private metric charts created by the netdata statsd server",
  2264. "charts",
  2265. PLUGIN_STATSD_NAME,
  2266. "stats",
  2267. 132020,
  2268. statsd.update_every,
  2269. RRDSET_TYPE_AREA);
  2270. rd_pcharts = rrddim_add(st_pcharts, "charts", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2271. }
  2272. // ----------------------------------------------------------------------------------------------------------------
  2273. // statsd thread to turn metrics into charts
  2274. usec_t step = statsd.update_every * USEC_PER_SEC;
  2275. heartbeat_t hb;
  2276. heartbeat_init(&hb);
  2277. while(service_running(SERVICE_COLLECTORS)) {
  2278. worker_is_idle();
  2279. heartbeat_next(&hb, step);
  2280. worker_is_busy(WORKER_STATSD_FLUSH_GAUGES);
  2281. statsd_flush_index_metrics(&statsd.gauges, statsd_flush_gauge);
  2282. worker_is_busy(WORKER_STATSD_FLUSH_COUNTERS);
  2283. statsd_flush_index_metrics(&statsd.counters, statsd_flush_counter);
  2284. worker_is_busy(WORKER_STATSD_FLUSH_METERS);
  2285. statsd_flush_index_metrics(&statsd.meters, statsd_flush_meter);
  2286. worker_is_busy(WORKER_STATSD_FLUSH_TIMERS);
  2287. statsd_flush_index_metrics(&statsd.timers, statsd_flush_timer);
  2288. worker_is_busy(WORKER_STATSD_FLUSH_HISTOGRAMS);
  2289. statsd_flush_index_metrics(&statsd.histograms, statsd_flush_histogram);
  2290. worker_is_busy(WORKER_STATSD_FLUSH_SETS);
  2291. statsd_flush_index_metrics(&statsd.sets, statsd_flush_set);
  2292. worker_is_busy(WORKER_STATSD_FLUSH_DICTIONARIES);
  2293. statsd_flush_index_metrics(&statsd.dictionaries,statsd_flush_dictionary);
  2294. worker_is_busy(WORKER_STATSD_FLUSH_STATS);
  2295. statsd_update_all_app_charts();
  2296. if(unlikely(!service_running(SERVICE_COLLECTORS)))
  2297. break;
  2298. if(global_statistics_enabled) {
  2299. rrddim_set_by_pointer(st_metrics, rd_metrics_gauge, (collected_number)statsd.gauges.metrics);
  2300. rrddim_set_by_pointer(st_metrics, rd_metrics_counter, (collected_number)statsd.counters.metrics);
  2301. rrddim_set_by_pointer(st_metrics, rd_metrics_timer, (collected_number)statsd.timers.metrics);
  2302. rrddim_set_by_pointer(st_metrics, rd_metrics_meter, (collected_number)statsd.meters.metrics);
  2303. rrddim_set_by_pointer(st_metrics, rd_metrics_histogram, (collected_number)statsd.histograms.metrics);
  2304. rrddim_set_by_pointer(st_metrics, rd_metrics_set, (collected_number)statsd.sets.metrics);
  2305. rrddim_set_by_pointer(st_metrics, rd_metrics_dictionary, (collected_number)statsd.dictionaries.metrics);
  2306. rrdset_done(st_metrics);
  2307. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_gauge, (collected_number)statsd.gauges.useful);
  2308. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_counter, (collected_number)statsd.counters.useful);
  2309. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_timer, (collected_number)statsd.timers.useful);
  2310. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_meter, (collected_number)statsd.meters.useful);
  2311. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_histogram, (collected_number)statsd.histograms.useful);
  2312. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_set, (collected_number)statsd.sets.useful);
  2313. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_dictionary, (collected_number)statsd.dictionaries.useful);
  2314. rrdset_done(st_useful_metrics);
  2315. rrddim_set_by_pointer(st_events, rd_events_gauge, (collected_number)statsd.gauges.events);
  2316. rrddim_set_by_pointer(st_events, rd_events_counter, (collected_number)statsd.counters.events);
  2317. rrddim_set_by_pointer(st_events, rd_events_timer, (collected_number)statsd.timers.events);
  2318. rrddim_set_by_pointer(st_events, rd_events_meter, (collected_number)statsd.meters.events);
  2319. rrddim_set_by_pointer(st_events, rd_events_histogram, (collected_number)statsd.histograms.events);
  2320. rrddim_set_by_pointer(st_events, rd_events_set, (collected_number)statsd.sets.events);
  2321. rrddim_set_by_pointer(st_events, rd_events_dictionary, (collected_number)statsd.dictionaries.events);
  2322. rrddim_set_by_pointer(st_events, rd_events_unknown, (collected_number)statsd.unknown_types);
  2323. rrddim_set_by_pointer(st_events, rd_events_errors, (collected_number)statsd.socket_errors);
  2324. rrdset_done(st_events);
  2325. rrddim_set_by_pointer(st_reads, rd_reads_tcp, (collected_number)statsd.tcp_socket_reads);
  2326. rrddim_set_by_pointer(st_reads, rd_reads_udp, (collected_number)statsd.udp_socket_reads);
  2327. rrdset_done(st_reads);
  2328. rrddim_set_by_pointer(st_bytes, rd_bytes_tcp, (collected_number)statsd.tcp_bytes_read);
  2329. rrddim_set_by_pointer(st_bytes, rd_bytes_udp, (collected_number)statsd.udp_bytes_read);
  2330. rrdset_done(st_bytes);
  2331. rrddim_set_by_pointer(st_packets, rd_packets_tcp, (collected_number)statsd.tcp_packets_received);
  2332. rrddim_set_by_pointer(st_packets, rd_packets_udp, (collected_number)statsd.udp_packets_received);
  2333. rrdset_done(st_packets);
  2334. rrddim_set_by_pointer(st_tcp_connects, rd_tcp_connects, (collected_number)statsd.tcp_socket_connects);
  2335. rrddim_set_by_pointer(st_tcp_connects, rd_tcp_disconnects, (collected_number)statsd.tcp_socket_disconnects);
  2336. rrdset_done(st_tcp_connects);
  2337. rrddim_set_by_pointer(st_tcp_connected, rd_tcp_connected, (collected_number)statsd.tcp_socket_connected);
  2338. rrdset_done(st_tcp_connected);
  2339. rrddim_set_by_pointer(st_pcharts, rd_pcharts, (collected_number)statsd.private_charts);
  2340. rrdset_done(st_pcharts);
  2341. }
  2342. }
  2343. cleanup: ; // added semi-colon to prevent older gcc error: label at end of compound statement
  2344. netdata_thread_cleanup_pop(1);
  2345. return NULL;
  2346. }