statsd.c 112 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
7277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "daemon/common.h"
// Naming constants of the plugin.
// NOTE(review): their users are outside this view - presumably chart ids and the plugin name reported to netdata.
#define STATSD_CHART_PREFIX "statsd"
#define PLUGIN_STATSD_NAME "statsd.plugin"
// defaults for the listening sockets (used to initialize statsd.sockets below)
#define STATSD_LISTEN_PORT 8125
#define STATSD_LISTEN_BACKLOG 4096
// worker job type ids - four distinct ids (0..3) are used
#define WORKER_JOB_TYPE_TCP_CONNECTED 0
#define WORKER_JOB_TYPE_TCP_DISCONNECTED 1
#define WORKER_JOB_TYPE_RCV_DATA 2
#define WORKER_JOB_TYPE_SND_DATA 3
// compile-time check: the worker utilization framework must have room for all four job types
#if WORKER_UTILIZATION_MAX_JOB_TYPES < 4
#error Please increase WORKER_UTILIZATION_MAX_JOB_TYPES to at least 4
#endif
// --------------------------------------------------------------------------------------
// DO NOT ENABLE MULTITHREADING - IT IS NOT WELL TESTED
// #define STATSD_MULTITHREADED 1
// options for the dictionaries created in this file;
// DICT_OPTION_DONT_OVERWRITE_VALUE makes dictionary_set() return the existing item instead of replacing it
#define STATSD_DICTIONARY_OPTIONS (DICT_OPTION_DONT_OVERWRITE_VALUE | DICT_OPTION_ADD_IN_FRONT)
#define STATSD_DECIMAL_DETAIL 1000 // floating point values get multiplied by this, with the same divisor
  19. // --------------------------------------------------------------------------------------------------------------------
  20. // data specific to each metric type
// data of a gauge metric
typedef struct statsd_metric_gauge {
    NETDATA_DOUBLE value; // current value; replaced or adjusted (+/- prefixed input) by statsd_process_gauge()
} STATSD_METRIC_GAUGE;
// data of a counter or meter metric (both share the same processing function)
typedef struct statsd_metric_counter { // counter and meter
    long long value; // running sum; statsd_process_counter_or_meter() adds each (sampling-rate scaled) increment
} STATSD_METRIC_COUNTER;
// Extra state of histogram and timer metrics.
// It is allocated separately (see dictionary_metric_insert_callback()) and
// referenced through STATSD_METRIC_HISTOGRAM.ext.
typedef struct statsd_histogram_extensions {
    netdata_mutex_t mutex; // held by the collector while it grows the 'values' array

    // average is stored in metric->last
    // NOTE(review): the last_* members are written outside this view - presumably
    // the statistics computed at the last flush; confirm against the flush code.
    collected_number last_min;
    collected_number last_max;
    collected_number last_percentile;
    collected_number last_median;
    collected_number last_stddev;
    collected_number last_sum;

    int zeroed;

    // dimensions for the statistics above
    RRDDIM *rd_min;
    RRDDIM *rd_max;
    RRDDIM *rd_percentile;
    RRDDIM *rd_median;
    RRDDIM *rd_stddev;
    //RRDDIM *rd_sum;

    size_t size; // allocated capacity of 'values' (in entries)
    size_t used; // entries of 'values' filled so far; set to zero when the metric is reset
    NETDATA_DOUBLE *values; // dynamic array of values collected
} STATSD_METRIC_HISTOGRAM_EXTENSIONS;
// data of a histogram or timer metric - only a pointer, to keep the union in STATSD_METRIC small
typedef struct statsd_metric_histogram { // histogram and timer
    STATSD_METRIC_HISTOGRAM_EXTENSIONS *ext; // allocated when the metric is inserted in its index
} STATSD_METRIC_HISTOGRAM;
// data of a set metric
typedef struct statsd_metric_set {
    DICTIONARY *dict; // the values seen; created lazily by statsd_process_set() and destroyed there on reset
    size_t unique;    // number of items inserted in 'dict' (maintained by its insert callback)
} STATSD_METRIC_SET;
// one distinct value of a dictionary metric
typedef struct statsd_metric_dictionary_item {
    size_t count; // incremented by statsd_process_dictionary() every time this value is received
    RRDDIM *rd;   // NOTE(review): presumably the chart dimension of this value - it is set outside this view
} STATSD_METRIC_DICTIONARY_ITEM;
// data of a dictionary metric
typedef struct statsd_metric_dictionary {
    DICTIONARY *dict; // value -> STATSD_METRIC_DICTIONARY_ITEM; created lazily by statsd_process_dictionary()
    size_t unique;    // number of items inserted in 'dict'; compared against statsd.dictionary_max_unique
} STATSD_METRIC_DICTIONARY;
  62. // --------------------------------------------------------------------------------------------------------------------
  63. // this is a metric - for all types of metrics
// Bit flags stored in STATSD_METRIC.options (and as defaults in STATSD_INDEX / STATSD_APP).
// Note the typedef is spelled STATS_METRIC_OPTIONS (without the 'D').
typedef enum statsd_metric_options {
    STATSD_METRIC_OPTION_NONE = 0x00000000, // no options set
    STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED = 0x00000001, // do not update the chart dimension, when this metric is not collected
    STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED = 0x00000002, // render a private chart for this metric
    STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED = 0x00000004, // the metric has been checked if it should get private chart or not
    STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT = 0x00000008, // show the count of events for this private chart
    STATSD_METRIC_OPTION_CHECKED_IN_APPS = 0x00000010, // set when this metric has been checked against apps
    STATSD_METRIC_OPTION_USED_IN_APPS = 0x00000020, // set when this metric is used in apps
    STATSD_METRIC_OPTION_CHECKED = 0x00000040, // set when the charting thread checks this metric for use in charts (its usefulness)
    STATSD_METRIC_OPTION_USEFUL = 0x00000080, // set when the charting thread finds the metric useful (i.e. used in a chart)
    STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED = 0x00000100, // set when the collection is full for this metric
    STATSD_METRIC_OPTION_UPDATED_CHART_METADATA = 0x00000200, // set when the private chart metadata have been updated via tags
} STATS_METRIC_OPTIONS;
// The type of a metric; it selects which member of the union in STATSD_METRIC is in use.
typedef enum statsd_metric_type {
    STATSD_METRIC_TYPE_GAUGE,
    STATSD_METRIC_TYPE_COUNTER,
    STATSD_METRIC_TYPE_METER,     // processed exactly like a counter
    STATSD_METRIC_TYPE_TIMER,     // shares the histogram data structures
    STATSD_METRIC_TYPE_HISTOGRAM,
    STATSD_METRIC_TYPE_SET,
    STATSD_METRIC_TYPE_DICTIONARY
} STATSD_METRIC_TYPE;
// A single metric of any type.
// It is the value stored in the per-type index dictionary and it is
// initialized by dictionary_metric_insert_callback().
typedef struct statsd_metric {
    const char *name; // the name of the metric - linked to dictionary name
    uint32_t hash; // hash of the name
    STATSD_METRIC_TYPE type;

    // metadata about data collection
    collected_number events; // the number of times this metric has been collected (never resets)
    size_t count; // the number of times this metric has been collected since the last flush

    // the actual collected data
    // (anonymous union - 'type' tells which member is valid)
    union {
        STATSD_METRIC_GAUGE gauge;
        STATSD_METRIC_COUNTER counter;
        STATSD_METRIC_HISTOGRAM histogram;
        STATSD_METRIC_SET set;
        STATSD_METRIC_DICTIONARY dictionary;
    };

    // heap allocated strings, released by dictionary_metric_delete_callback()
    char *units;
    char *dimname;
    char *family;

    // chart related members
    STATS_METRIC_OPTIONS options; // STATSD_METRIC_OPTION_* (bitfield)
    char reset; // set to 1 by the charting thread to instruct the collector thread(s) to reset this metric
    collected_number last; // the last value sent to netdata
    RRDSET *st; // the private chart of this metric
    RRDDIM *rd_value; // the dimension of this metric value
    RRDDIM *rd_count; // the dimension for the number of events received

    // linking, used for walking through all metrics
    struct statsd_metric *next_useful;
} STATSD_METRIC;
  114. // --------------------------------------------------------------------------------------------------------------------
  115. // each type of metric has its own index
// The index of all the metrics of one type (one instance per type lives in the global 'statsd').
typedef struct statsd_index {
    char *name; // the name of the index of metrics
    size_t events; // the number of events processed for this index
    size_t metrics; // the number of metrics in this index
    size_t useful; // the number of useful metrics in this index
    STATSD_METRIC_TYPE type; // the type of index
    DICTIONARY *dict; // metric name -> STATSD_METRIC
    STATSD_METRIC *first_useful; // the linked list of useful metrics (new metrics are added in front)
    STATS_METRIC_OPTIONS default_options; // default options for all metrics in this index
} STATSD_INDEX;
  126. // --------------------------------------------------------------------------------------------------------------------
  127. // synthetic charts
// Which value of the source metric a synthetic chart dimension shows
// (stored in STATSD_APP_CHART_DIM.value_type).
// NOTE(review): the mapping of each constant to a metric member is done outside this view.
typedef enum statsd_app_chart_dimension_value_type {
    STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS,
    STATSD_APP_CHART_DIM_VALUE_TYPE_LAST,
    STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE,
    STATSD_APP_CHART_DIM_VALUE_TYPE_SUM,
    STATSD_APP_CHART_DIM_VALUE_TYPE_MIN,
    STATSD_APP_CHART_DIM_VALUE_TYPE_MAX,
    STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE,
    STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN,
    STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV
} STATSD_APP_CHART_DIM_VALUE_TYPE;
// A dimension of a synthetic chart; dimensions of the same chart form a singly linked list via 'next'.
typedef struct statsd_app_chart_dimension {
    const char *name; // the name of this dimension
    const char *metric; // the source metric name of this dimension
    uint32_t metric_hash; // hash for fast string comparisons
    SIMPLE_PATTERN *metric_pattern; // set when the 'metric' is a simple pattern
    collected_number multiplier; // the multiplier of the dimension
    collected_number divisor; // the divisor of the dimension
    RRDDIM_FLAGS flags; // the RRDDIM flags for this dimension
    RRDDIM_OPTIONS options; // the RRDDIM options for this dimension
    STATSD_APP_CHART_DIM_VALUE_TYPE value_type; // which value to use of the source metric
    RRDDIM *rd; // a pointer to the RRDDIM that has been created for this dimension
    collected_number *value_ptr; // a pointer to the source metric value
    RRD_ALGORITHM algorithm; // the algorithm of this dimension
    struct statsd_app_chart_dimension *next; // the next dimension for this chart
} STATSD_APP_CHART_DIM;
// A synthetic chart of a statsd app; charts of the same app form a singly linked list via 'next'.
typedef struct statsd_app_chart {
    // chart metadata
    const char *id;
    const char *name;
    const char *title;
    const char *family;
    const char *context;
    const char *units;
    const char *module;
    long priority;
    RRDSET_TYPE chart_type;

    STATSD_APP_CHART_DIM *dimensions; // head of the list of dimensions of this chart
    size_t dimensions_count;
    size_t dimensions_linked_count; // NOTE(review): presumably the dimensions already linked to a source metric - confirm

    RRDSET *st; // NOTE(review): presumably the RRDSET created for this chart - it is set outside this view
    struct statsd_app_chart *next; // the next chart of the app
} STATSD_APP_CHART;
// A statsd app: a named group of metrics with its synthetic charts.
// Apps form a singly linked list via 'next', starting at statsd.apps.
typedef struct statsd_app {
    const char *name;
    SIMPLE_PATTERN *metrics; // NOTE(review): presumably the pattern selecting the metrics of this app - confirm
    STATS_METRIC_OPTIONS default_options;
    RRD_MEMORY_MODE rrd_memory_mode;
    DICTIONARY *dict;
    long rrd_history_entries;
    const char *source;
    STATSD_APP_CHART *charts; // head of the list of charts of this app
    struct statsd_app *next; // the next app
} STATSD_APP;
  181. // --------------------------------------------------------------------------------------------------------------------
  182. // global statsd data
// State kept per collection thread; statsd.collection_threads_status points to these.
// NOTE(review): the members are used outside this view - the notes below are assumptions to confirm.
struct collection_thread_status {
    SPINLOCK spinlock;       // presumably protects 'running'
    bool running;
    size_t max_sockets;
    netdata_thread_t thread; // the thread handle
};
// The single, file-scope instance holding all statsd state:
// the per-type metric indexes, the traffic counters, the configuration and the listening sockets.
// Members not mentioned in the initializer below start zeroed (static storage).
static struct statsd {
    // one index per metric type
    STATSD_INDEX gauges;
    STATSD_INDEX counters;
    STATSD_INDEX timers;
    STATSD_INDEX histograms;
    STATSD_INDEX meters;
    STATSD_INDEX sets;
    STATSD_INDEX dictionaries;

    // counters about the received traffic (maintained outside this view)
    size_t unknown_types;
    size_t socket_errors;
    size_t tcp_socket_connects;
    size_t tcp_socket_disconnects;
    size_t tcp_socket_connected;
    size_t tcp_socket_reads;
    size_t tcp_packets_received;
    size_t tcp_bytes_read;
    size_t udp_socket_reads;
    size_t udp_packets_received;
    size_t udp_bytes_read;

    // configuration
    int enabled;
    int update_every;
    SIMPLE_PATTERN *charts_for;
    size_t tcp_idle_timeout;
    collected_number decimal_detail;
    size_t private_charts;
    size_t max_private_charts_hard;
    long private_charts_rrd_history_entries;
    unsigned int private_charts_hidden:1;

    STATSD_APP *apps; // head of the linked list of apps

    size_t recvmmsg_size;
    size_t histogram_increase_step; // entries added to a histogram's 'values' array each time it is full
    double histogram_percentile;
    char *histogram_percentile_str;
    size_t dictionary_max_unique; // above this many unique values, dictionary metrics count new values as "other"

    int threads;
    struct collection_thread_status *collection_threads_status;

    LISTEN_SOCKETS sockets;
} statsd = {
    .enabled = 1,
    .max_private_charts_hard = 1000,
    .private_charts_hidden = 0,
    .recvmmsg_size = 10,
    .decimal_detail = STATSD_DECIMAL_DETAIL,

    // every index starts empty; its dictionary is not created here (.dict = NULL)
    .gauges = {
        .name = "gauge",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_GAUGE,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .counters = {
        .name = "counter",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_COUNTER,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .timers = {
        .name = "timer",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_TIMER,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .histograms = {
        .name = "histogram",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_HISTOGRAM,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .meters = {
        .name = "meter",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_METER,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .sets = {
        .name = "set",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_SET,
        .default_options = STATSD_METRIC_OPTION_NONE
    },
    .dictionaries = {
        .name = "dictionary",
        .events = 0,
        .metrics = 0,
        .dict = NULL,
        .type = STATSD_METRIC_TYPE_DICTIONARY,
        .default_options = STATSD_METRIC_OPTION_NONE
    },

    .tcp_idle_timeout = 600,
    .apps = NULL,
    .histogram_percentile = 95.0,
    .histogram_increase_step = 10,
    .dictionary_max_unique = 200,
    .threads = 0,
    .collection_threads_status = NULL,

    // listen on localhost only by default, on both UDP and TCP
    .sockets = {
        .config = &netdata_config,
        .config_section = CONFIG_SECTION_STATSD,
        .default_bind_to = "udp:localhost tcp:localhost",
        .default_port = STATSD_LISTEN_PORT,
        .backlog = STATSD_LISTEN_BACKLOG
    },
};
  303. // --------------------------------------------------------------------------------------------------------------------
  304. // statsd index management - add/find metrics
  305. static void dictionary_metric_insert_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  306. STATSD_INDEX *index = (STATSD_INDEX *)data;
  307. STATSD_METRIC *m = (STATSD_METRIC *)value;
  308. const char *name = dictionary_acquired_item_name(item);
  309. debug(D_STATSD, "Creating new %s metric '%s'", index->name, name);
  310. m->name = name;
  311. m->hash = simple_hash(name);
  312. m->type = index->type;
  313. m->options = index->default_options;
  314. if (m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  315. m->histogram.ext = callocz(1,sizeof(STATSD_METRIC_HISTOGRAM_EXTENSIONS));
  316. netdata_mutex_init(&m->histogram.ext->mutex);
  317. }
  318. __atomic_fetch_add(&index->metrics, 1, __ATOMIC_RELAXED);
  319. }
  320. static void dictionary_metric_delete_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  321. (void)data; // STATSD_INDEX *index = (STATSD_INDEX *)data;
  322. (void)item;
  323. STATSD_METRIC *m = (STATSD_METRIC *)value;
  324. if(m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  325. freez(m->histogram.ext);
  326. m->histogram.ext = NULL;
  327. }
  328. freez(m->units);
  329. freez(m->family);
  330. freez(m->dimname);
  331. }
  332. static inline STATSD_METRIC *statsd_find_or_add_metric(STATSD_INDEX *index, const char *name) {
  333. debug(D_STATSD, "searching for metric '%s' under '%s'", name, index->name);
  334. #ifdef STATSD_MULTITHREADED
  335. // avoid the write lock of dictionary_set() for existing metrics
  336. STATSD_METRIC *m = dictionary_get(index->dict, name);
  337. if(!m) m = dictionary_set(index->dict, name, NULL, sizeof(STATSD_METRIC));
  338. #else
  339. // no locks here, go faster
  340. // this will call the dictionary_metric_insert_callback() if an item
  341. // is inserted, otherwise it will return the existing one.
  342. // We used the flag DICT_OPTION_DONT_OVERWRITE_VALUE to support this.
  343. STATSD_METRIC *m = dictionary_set(index->dict, name, NULL, sizeof(STATSD_METRIC));
  344. #endif
  345. index->events++;
  346. return m;
  347. }
  348. // --------------------------------------------------------------------------------------------------------------------
  349. // statsd parsing numbers
  350. static inline NETDATA_DOUBLE statsd_parse_float(const char *v, NETDATA_DOUBLE def) {
  351. NETDATA_DOUBLE value;
  352. if(likely(v && *v)) {
  353. char *e = NULL;
  354. value = str2ndd(v, &e);
  355. if(unlikely(e && *e))
  356. collector_error("STATSD: excess data '%s' after value '%s'", e, v);
  357. }
  358. else
  359. value = def;
  360. return value;
  361. }
  362. static inline NETDATA_DOUBLE statsd_parse_sampling_rate(const char *v) {
  363. NETDATA_DOUBLE sampling_rate = statsd_parse_float(v, 1.0);
  364. if(unlikely(isless(sampling_rate, 0.001))) sampling_rate = 0.001;
  365. if(unlikely(isgreater(sampling_rate, 1.0))) sampling_rate = 1.0;
  366. return sampling_rate;
  367. }
  368. static inline long long statsd_parse_int(const char *v, long long def) {
  369. long long value;
  370. if(likely(v && *v)) {
  371. char *e = NULL;
  372. value = str2ll(v, &e);
  373. if(unlikely(e && *e))
  374. collector_error("STATSD: excess data '%s' after value '%s'", e, v);
  375. }
  376. else
  377. value = def;
  378. return value;
  379. }
  380. // --------------------------------------------------------------------------------------------------------------------
  381. // statsd processors per metric type
  382. static inline void statsd_reset_metric(STATSD_METRIC *m) {
  383. m->reset = 0;
  384. m->count = 0;
  385. }
  386. static inline int value_is_zinit(const char *value) {
  387. return (value && *value == 'z' && *++value == 'i' && *++value == 'n' && *++value == 'i' && *++value == 't' && *++value == '\0');
  388. }
// non-zero when the charting thread has already checked the metric (STATSD_METRIC_OPTION_CHECKED is set)
#define is_metric_checked(m) ((m)->options & STATSD_METRIC_OPTION_CHECKED)
// a metric is collected while it has not been checked yet; once checked, only if it was found useful.
// note: 'm' is evaluated twice.
#define is_metric_useful_for_collection(m) (!is_metric_checked(m) || ((m)->options & STATSD_METRIC_OPTION_USEFUL))
  391. static inline void statsd_process_gauge(STATSD_METRIC *m, const char *value, const char *sampling) {
  392. if(!is_metric_useful_for_collection(m)) return;
  393. if(unlikely(!value || !*value)) {
  394. collector_error("STATSD: metric '%s' of type gauge, with empty value is ignored.", m->name);
  395. return;
  396. }
  397. if(unlikely(m->reset)) {
  398. // no need to reset anything specific for gauges
  399. statsd_reset_metric(m);
  400. }
  401. if(unlikely(value_is_zinit(value))) {
  402. // magic loading of metric, without affecting anything
  403. }
  404. else {
  405. if (unlikely(*value == '+' || *value == '-'))
  406. m->gauge.value += statsd_parse_float(value, 1.0) / statsd_parse_sampling_rate(sampling);
  407. else
  408. m->gauge.value = statsd_parse_float(value, 1.0);
  409. m->events++;
  410. m->count++;
  411. }
  412. }
  413. static inline void statsd_process_counter_or_meter(STATSD_METRIC *m, const char *value, const char *sampling) {
  414. if(!is_metric_useful_for_collection(m)) return;
  415. // we accept empty values for counters
  416. if(unlikely(m->reset)) statsd_reset_metric(m);
  417. if(unlikely(value_is_zinit(value))) {
  418. // magic loading of metric, without affecting anything
  419. }
  420. else {
  421. m->counter.value += llrintndd((NETDATA_DOUBLE) statsd_parse_int(value, 1) / statsd_parse_sampling_rate(sampling));
  422. m->events++;
  423. m->count++;
  424. }
  425. }
// counters and meters are processed by the same function
#define statsd_process_counter(m, value, sampling) statsd_process_counter_or_meter(m, value, sampling)
#define statsd_process_meter(m, value, sampling) statsd_process_counter_or_meter(m, value, sampling)
  428. static inline void statsd_process_histogram_or_timer(STATSD_METRIC *m, const char *value, const char *sampling, const char *type) {
  429. if(!is_metric_useful_for_collection(m)) return;
  430. if(unlikely(!value || !*value)) {
  431. collector_error("STATSD: metric of type %s, with empty value is ignored.", type);
  432. return;
  433. }
  434. if(unlikely(m->reset)) {
  435. m->histogram.ext->used = 0;
  436. statsd_reset_metric(m);
  437. }
  438. if(unlikely(value_is_zinit(value))) {
  439. // magic loading of metric, without affecting anything
  440. }
  441. else {
  442. NETDATA_DOUBLE v = statsd_parse_float(value, 1.0);
  443. NETDATA_DOUBLE sampling_rate = statsd_parse_sampling_rate(sampling);
  444. if(unlikely(isless(sampling_rate, 0.01))) sampling_rate = 0.01;
  445. if(unlikely(isgreater(sampling_rate, 1.0))) sampling_rate = 1.0;
  446. long long samples = llrintndd(1.0 / sampling_rate);
  447. while(samples-- > 0) {
  448. if(unlikely(m->histogram.ext->used == m->histogram.ext->size)) {
  449. netdata_mutex_lock(&m->histogram.ext->mutex);
  450. m->histogram.ext->size += statsd.histogram_increase_step;
  451. m->histogram.ext->values = reallocz(m->histogram.ext->values, sizeof(NETDATA_DOUBLE) * m->histogram.ext->size);
  452. netdata_mutex_unlock(&m->histogram.ext->mutex);
  453. }
  454. m->histogram.ext->values[m->histogram.ext->used++] = v;
  455. }
  456. m->events++;
  457. m->count++;
  458. }
  459. }
// timers and histograms are processed by the same function; the last argument only names the type in log messages
#define statsd_process_timer(m, value, sampling) statsd_process_histogram_or_timer(m, value, sampling, "timer")
#define statsd_process_histogram(m, value, sampling) statsd_process_histogram_or_timer(m, value, sampling, "histogram")
  462. static void dictionary_metric_set_value_insert_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  463. (void)item;
  464. (void)value;
  465. STATSD_METRIC *m = (STATSD_METRIC *)data;
  466. m->set.unique++;
  467. }
  468. static inline void statsd_process_set(STATSD_METRIC *m, const char *value) {
  469. if(!is_metric_useful_for_collection(m)) return;
  470. if(unlikely(!value || !*value)) {
  471. error("STATSD: metric of type set, with empty value is ignored.");
  472. return;
  473. }
  474. if(unlikely(m->reset)) {
  475. if(likely(m->set.dict)) {
  476. dictionary_destroy(m->set.dict);
  477. m->set.dict = NULL;
  478. }
  479. statsd_reset_metric(m);
  480. }
  481. if (unlikely(!m->set.dict)) {
  482. m->set.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  483. dictionary_register_insert_callback(m->set.dict, dictionary_metric_set_value_insert_callback, m);
  484. m->set.unique = 0;
  485. }
  486. if(unlikely(value_is_zinit(value))) {
  487. // magic loading of metric, without affecting anything
  488. }
  489. else {
  490. #ifdef STATSD_MULTITHREADED
  491. // avoid the write lock to check if something is already there
  492. if(!dictionary_get(m->set.dict, value))
  493. dictionary_set(m->set.dict, value, NULL, 0);
  494. #else
  495. dictionary_set(m->set.dict, value, NULL, 0);
  496. #endif
  497. m->events++;
  498. m->count++;
  499. }
  500. }
  501. static void dictionary_metric_dict_value_insert_callback(const DICTIONARY_ITEM *item, void *value, void *data) {
  502. (void)item;
  503. (void)value;
  504. STATSD_METRIC *m = (STATSD_METRIC *)data;
  505. m->dictionary.unique++;
  506. }
  507. static inline void statsd_process_dictionary(STATSD_METRIC *m, const char *value) {
  508. if(!is_metric_useful_for_collection(m)) return;
  509. if(unlikely(!value || !*value)) {
  510. error("STATSD: metric of type set, with empty value is ignored.");
  511. return;
  512. }
  513. if(unlikely(m->reset))
  514. statsd_reset_metric(m);
  515. if (unlikely(!m->dictionary.dict)) {
  516. m->dictionary.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  517. dictionary_register_insert_callback(m->dictionary.dict, dictionary_metric_dict_value_insert_callback, m);
  518. m->dictionary.unique = 0;
  519. }
  520. if(unlikely(value_is_zinit(value))) {
  521. // magic loading of metric, without affecting anything
  522. }
  523. else {
  524. STATSD_METRIC_DICTIONARY_ITEM *t = (STATSD_METRIC_DICTIONARY_ITEM *)dictionary_get(m->dictionary.dict, value);
  525. if (unlikely(!t)) {
  526. if(!t && m->dictionary.unique >= statsd.dictionary_max_unique)
  527. value = "other";
  528. t = (STATSD_METRIC_DICTIONARY_ITEM *)dictionary_set(m->dictionary.dict, value, NULL, sizeof(STATSD_METRIC_DICTIONARY_ITEM));
  529. }
  530. t->count++;
  531. m->events++;
  532. m->count++;
  533. }
  534. }
  535. // --------------------------------------------------------------------------------------------------------------------
  536. // statsd parsing
  537. static inline const char *statsd_parse_skip_up_to(const char *s, char d1, char d2, char d3) {
  538. char c;
  539. for(c = *s; c && c != d1 && c != d2 && c != d3 && c != '\r' && c != '\n'; c = *++s) ;
  540. return s;
  541. }
  542. const char *statsd_parse_skip_spaces(const char *s) {
  543. char c;
  544. for(c = *s; c && ( c == ' ' || c == '\t' || c == '\r' || c == '\n' ); c = *++s) ;
  545. return s;
  546. }
  547. static inline const char *statsd_parse_field_trim(const char *start, char *end) {
  548. if(unlikely(!start || !*start)) {
  549. start = end;
  550. return start;
  551. }
  552. while(start <= end && (*start == ' ' || *start == '\t'))
  553. start++;
  554. *end = '\0';
  555. end--;
  556. while(end >= start && (*end == ' ' || *end == '\t'))
  557. *end-- = '\0';
  558. return start;
  559. }
  560. static void statsd_process_metric(const char *name, const char *value, const char *type, const char *sampling, const char *tags) {
  561. debug(D_STATSD, "STATSD: raw metric '%s', value '%s', type '%s', sampling '%s', tags '%s'", name?name:"(null)", value?value:"(null)", type?type:"(null)", sampling?sampling:"(null)", tags?tags:"(null)");
  562. if(unlikely(!name || !*name)) return;
  563. if(unlikely(!type || !*type)) type = "m";
  564. STATSD_METRIC *m = NULL;
  565. char t0 = type[0], t1 = type[1];
  566. if(unlikely(t0 == 'g' && t1 == '\0')) {
  567. statsd_process_gauge(
  568. m = statsd_find_or_add_metric(&statsd.gauges, name),
  569. value, sampling);
  570. }
  571. else if(unlikely((t0 == 'c' || t0 == 'C') && t1 == '\0')) {
  572. // etsy/statsd uses 'c'
  573. // brubeck uses 'C'
  574. statsd_process_counter(
  575. m = statsd_find_or_add_metric(&statsd.counters, name),
  576. value, sampling);
  577. }
  578. else if(unlikely(t0 == 'm' && t1 == '\0')) {
  579. statsd_process_meter(
  580. m = statsd_find_or_add_metric(&statsd.meters, name),
  581. value, sampling);
  582. }
  583. else if(unlikely(t0 == 'h' && t1 == '\0')) {
  584. statsd_process_histogram(
  585. m = statsd_find_or_add_metric(&statsd.histograms, name),
  586. value, sampling);
  587. }
  588. else if(unlikely(t0 == 's' && t1 == '\0')) {
  589. statsd_process_set(
  590. m = statsd_find_or_add_metric(&statsd.sets, name),
  591. value);
  592. }
  593. else if(unlikely(t0 == 'd' && t1 == '\0')) {
  594. statsd_process_dictionary(
  595. m = statsd_find_or_add_metric(&statsd.dictionaries, name),
  596. value);
  597. }
  598. else if(unlikely(t0 == 'm' && t1 == 's' && type[2] == '\0')) {
  599. statsd_process_timer(
  600. m = statsd_find_or_add_metric(&statsd.timers, name),
  601. value, sampling);
  602. }
  603. else {
  604. statsd.unknown_types++;
  605. error("STATSD: metric '%s' with value '%s' is sent with unknown metric type '%s'", name, value?value:"", type);
  606. }
  607. if(m && tags && *tags) {
  608. const char *s = tags;
  609. while(*s) {
  610. const char *tagkey = NULL, *tagvalue = NULL;
  611. char *tagkey_end = NULL, *tagvalue_end = NULL;
  612. s = tagkey_end = (char *)statsd_parse_skip_up_to(tagkey = s, ':', '=', ',');
  613. if(tagkey == tagkey_end) {
  614. if (*s) {
  615. s++;
  616. s = statsd_parse_skip_spaces(s);
  617. }
  618. continue;
  619. }
  620. if(likely(*s == ':' || *s == '='))
  621. s = tagvalue_end = (char *) statsd_parse_skip_up_to(tagvalue = ++s, ',', '\0', '\0');
  622. if(*s == ',') s++;
  623. statsd_parse_field_trim(tagkey, tagkey_end);
  624. statsd_parse_field_trim(tagvalue, tagvalue_end);
  625. if(tagkey && *tagkey && tagvalue && *tagvalue) {
  626. if (strcmp(tagkey, "units") == 0 && (!m->units || strcmp(m->units, tagvalue) != 0)) {
  627. m->units = strdupz(tagvalue);
  628. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  629. }
  630. if (strcmp(tagkey, "name") == 0 && (!m->dimname || strcmp(m->dimname, tagvalue) != 0)) {
  631. m->dimname = strdupz(tagvalue);
  632. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  633. }
  634. if (strcmp(tagkey, "family") == 0 && (!m->family || strcmp(m->family, tagvalue) != 0)) {
  635. m->family = strdupz(tagvalue);
  636. m->options |= STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  637. }
  638. }
  639. }
  640. }
  641. }
  642. static inline size_t statsd_process(char *buffer, size_t size, int require_newlines) {
  643. buffer[size] = '\0';
  644. debug(D_STATSD, "RECEIVED: %zu bytes: '%s'", size, buffer);
  645. const char *s = buffer;
  646. while(*s) {
  647. const char *name = NULL, *value = NULL, *type = NULL, *sampling = NULL, *tags = NULL;
  648. char *name_end = NULL, *value_end = NULL, *type_end = NULL, *sampling_end = NULL, *tags_end = NULL;
  649. s = name_end = (char *)statsd_parse_skip_up_to(name = s, ':', '=', '|');
  650. if(name == name_end) {
  651. if (*s) {
  652. s++;
  653. s = statsd_parse_skip_spaces(s);
  654. }
  655. continue;
  656. }
  657. if(likely(*s == ':' || *s == '='))
  658. s = value_end = (char *) statsd_parse_skip_up_to(value = ++s, '|', '@', '#');
  659. if(likely(*s == '|'))
  660. s = type_end = (char *) statsd_parse_skip_up_to(type = ++s, '|', '@', '#');
  661. while(*s == '|' || *s == '@' || *s == '#') {
  662. // parse all the fields that may be appended
  663. if ((*s == '|' && s[1] == '@') || *s == '@') {
  664. s = sampling_end = (char *)statsd_parse_skip_up_to(sampling = ++s, '|', '@', '#');
  665. if (*sampling == '@') sampling++;
  666. }
  667. else if ((*s == '|' && s[1] == '#') || *s == '#') {
  668. s = tags_end = (char *)statsd_parse_skip_up_to(tags = ++s, '|', '@', '#');
  669. if (*tags == '#') tags++;
  670. }
  671. else {
  672. // unknown field, skip it
  673. s = (char *)statsd_parse_skip_up_to(++s, '|', '@', '#');
  674. }
  675. }
  676. // skip everything until the end of the line
  677. while(*s && *s != '\n') s++;
  678. if(unlikely(require_newlines && *s != '\n' && s > buffer)) {
  679. // move the remaining data to the beginning
  680. size -= (name - buffer);
  681. memmove(buffer, name, size);
  682. return size;
  683. }
  684. else
  685. s = statsd_parse_skip_spaces(s);
  686. statsd_process_metric(
  687. statsd_parse_field_trim(name, name_end)
  688. , statsd_parse_field_trim(value, value_end)
  689. , statsd_parse_field_trim(type, type_end)
  690. , statsd_parse_field_trim(sampling, sampling_end)
  691. , statsd_parse_field_trim(tags, tags_end)
  692. );
  693. }
  694. return 0;
  695. }
  696. // --------------------------------------------------------------------------------------------------------------------
  697. // statsd pollfd interface
  698. #define STATSD_TCP_BUFFER_SIZE 65536 // minimize tcp reads
  699. #define STATSD_UDP_BUFFER_SIZE 9000 // this should be up to MTU
  700. typedef enum {
  701. STATSD_SOCKET_DATA_TYPE_TCP,
  702. STATSD_SOCKET_DATA_TYPE_UDP
  703. } STATSD_SOCKET_DATA_TYPE;
  704. struct statsd_tcp {
  705. STATSD_SOCKET_DATA_TYPE type;
  706. size_t size;
  707. size_t len;
  708. char buffer[];
  709. };
  710. struct statsd_udp {
  711. struct collection_thread_status *status;
  712. STATSD_SOCKET_DATA_TYPE type;
  713. #ifdef HAVE_RECVMMSG
  714. size_t size;
  715. struct iovec *iovecs;
  716. struct mmsghdr *msgs;
  717. #else
  718. int *running;
  719. char buffer[STATSD_UDP_BUFFER_SIZE];
  720. #endif
  721. };
  722. // new TCP client connected
  723. static void *statsd_add_callback(POLLINFO *pi, short int *events, void *data) {
  724. (void)pi;
  725. (void)data;
  726. worker_is_busy(WORKER_JOB_TYPE_TCP_CONNECTED);
  727. *events = POLLIN;
  728. struct statsd_tcp *t = (struct statsd_tcp *)callocz(sizeof(struct statsd_tcp) + STATSD_TCP_BUFFER_SIZE, 1);
  729. t->type = STATSD_SOCKET_DATA_TYPE_TCP;
  730. t->size = STATSD_TCP_BUFFER_SIZE - 1;
  731. statsd.tcp_socket_connects++;
  732. statsd.tcp_socket_connected++;
  733. worker_is_idle();
  734. return t;
  735. }
  736. // TCP client disconnected
  737. static void statsd_del_callback(POLLINFO *pi) {
  738. worker_is_busy(WORKER_JOB_TYPE_TCP_DISCONNECTED);
  739. struct statsd_tcp *t = pi->data;
  740. if(likely(t)) {
  741. if(t->type == STATSD_SOCKET_DATA_TYPE_TCP) {
  742. if(t->len != 0) {
  743. statsd.socket_errors++;
  744. error("STATSD: client is probably sending unterminated metrics. Closed socket left with '%s'. Trying to process it.", t->buffer);
  745. statsd_process(t->buffer, t->len, 0);
  746. }
  747. statsd.tcp_socket_disconnects++;
  748. statsd.tcp_socket_connected--;
  749. }
  750. else
  751. error("STATSD: internal error: received socket data type is %d, but expected %d", (int)t->type, (int)STATSD_SOCKET_DATA_TYPE_TCP);
  752. freez(t);
  753. }
  754. worker_is_idle();
  755. }
  756. // Receive data
  757. static int statsd_rcv_callback(POLLINFO *pi, short int *events) {
  758. int retval = -1;
  759. worker_is_busy(WORKER_JOB_TYPE_RCV_DATA);
  760. *events = POLLIN;
  761. int fd = pi->fd;
  762. switch(pi->socktype) {
  763. case SOCK_STREAM: {
  764. struct statsd_tcp *d = (struct statsd_tcp *)pi->data;
  765. if(unlikely(!d)) {
  766. error("STATSD: internal error: expected TCP data pointer is NULL");
  767. statsd.socket_errors++;
  768. retval = -1;
  769. goto cleanup;
  770. }
  771. #ifdef NETDATA_INTERNAL_CHECKS
  772. if(unlikely(d->type != STATSD_SOCKET_DATA_TYPE_TCP)) {
  773. error("STATSD: internal error: socket data type should be %d, but it is %d", (int)STATSD_SOCKET_DATA_TYPE_TCP, (int)d->type);
  774. statsd.socket_errors++;
  775. retval = -1;
  776. goto cleanup;
  777. }
  778. #endif
  779. int ret = 0;
  780. ssize_t rc;
  781. do {
  782. rc = recv(fd, &d->buffer[d->len], d->size - d->len, MSG_DONTWAIT);
  783. if (rc < 0) {
  784. // read failed
  785. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  786. error("STATSD: recv() on TCP socket %d failed.", fd);
  787. statsd.socket_errors++;
  788. ret = -1;
  789. }
  790. }
  791. else if (!rc) {
  792. // connection closed
  793. debug(D_STATSD, "STATSD: client disconnected.");
  794. ret = -1;
  795. }
  796. else {
  797. // data received
  798. d->len += rc;
  799. statsd.tcp_socket_reads++;
  800. statsd.tcp_bytes_read += rc;
  801. }
  802. if(likely(d->len > 0)) {
  803. statsd.tcp_packets_received++;
  804. d->len = statsd_process(d->buffer, d->len, 1);
  805. }
  806. if(unlikely(ret == -1)) {
  807. retval = -1;
  808. goto cleanup;
  809. }
  810. } while (rc != -1);
  811. break;
  812. }
  813. case SOCK_DGRAM: {
  814. struct statsd_udp *d = (struct statsd_udp *)pi->data;
  815. if(unlikely(!d)) {
  816. error("STATSD: internal error: expected UDP data pointer is NULL");
  817. statsd.socket_errors++;
  818. retval = -1;
  819. goto cleanup;
  820. }
  821. #ifdef NETDATA_INTERNAL_CHECKS
  822. if(unlikely(d->type != STATSD_SOCKET_DATA_TYPE_UDP)) {
  823. error("STATSD: internal error: socket data should be %d, but it is %d", (int)d->type, (int)STATSD_SOCKET_DATA_TYPE_UDP);
  824. statsd.socket_errors++;
  825. retval = -1;
  826. goto cleanup;
  827. }
  828. #endif
  829. #ifdef HAVE_RECVMMSG
  830. ssize_t rc;
  831. do {
  832. rc = recvmmsg(fd, d->msgs, (unsigned int)d->size, MSG_DONTWAIT, NULL);
  833. if (rc < 0) {
  834. // read failed
  835. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  836. error("STATSD: recvmmsg() on UDP socket %d failed.", fd);
  837. statsd.socket_errors++;
  838. retval = -1;
  839. goto cleanup;
  840. }
  841. } else if (rc) {
  842. // data received
  843. statsd.udp_socket_reads++;
  844. statsd.udp_packets_received += rc;
  845. size_t i;
  846. for (i = 0; i < (size_t)rc; ++i) {
  847. size_t len = (size_t)d->msgs[i].msg_len;
  848. statsd.udp_bytes_read += len;
  849. statsd_process(d->msgs[i].msg_hdr.msg_iov->iov_base, len, 0);
  850. }
  851. }
  852. } while (rc != -1);
  853. #else // !HAVE_RECVMMSG
  854. ssize_t rc;
  855. do {
  856. rc = recv(fd, d->buffer, STATSD_UDP_BUFFER_SIZE - 1, MSG_DONTWAIT);
  857. if (rc < 0) {
  858. // read failed
  859. if (errno != EWOULDBLOCK && errno != EAGAIN && errno != EINTR) {
  860. error("STATSD: recv() on UDP socket %d failed.", fd);
  861. statsd.socket_errors++;
  862. retval = -1;
  863. goto cleanup;
  864. }
  865. } else if (rc) {
  866. // data received
  867. statsd.udp_socket_reads++;
  868. statsd.udp_packets_received++;
  869. statsd.udp_bytes_read += rc;
  870. statsd_process(d->buffer, (size_t) rc, 0);
  871. }
  872. } while (rc != -1);
  873. #endif
  874. break;
  875. }
  876. default: {
  877. error("STATSD: internal error: unknown socktype %d on socket %d", pi->socktype, fd);
  878. statsd.socket_errors++;
  879. retval = -1;
  880. goto cleanup;
  881. }
  882. }
  883. retval = 0;
  884. cleanup:
  885. worker_is_idle();
  886. return retval;
  887. }
  888. static int statsd_snd_callback(POLLINFO *pi, short int *events) {
  889. (void)pi;
  890. (void)events;
  891. worker_is_busy(WORKER_JOB_TYPE_SND_DATA);
  892. error("STATSD: snd_callback() called, but we never requested to send data to statsd clients.");
  893. worker_is_idle();
  894. return -1;
  895. }
  896. // --------------------------------------------------------------------------------------------------------------------
  897. // statsd child thread to collect metrics from network
  898. void statsd_collector_thread_cleanup(void *data) {
  899. struct statsd_udp *d = data;
  900. netdata_spinlock_lock(&d->status->spinlock);
  901. d->status->running = false;
  902. netdata_spinlock_unlock(&d->status->spinlock);
  903. collector_info("cleaning up...");
  904. #ifdef HAVE_RECVMMSG
  905. size_t i;
  906. for (i = 0; i < d->size; i++)
  907. freez(d->iovecs[i].iov_base);
  908. freez(d->iovecs);
  909. freez(d->msgs);
  910. #endif
  911. freez(d);
  912. worker_unregister();
  913. }
  914. static bool statsd_should_stop(void) {
  915. return !service_running(SERVICE_COLLECTORS);
  916. }
  917. void *statsd_collector_thread(void *ptr) {
  918. struct collection_thread_status *status = ptr;
  919. netdata_spinlock_lock(&status->spinlock);
  920. status->running = true;
  921. netdata_spinlock_unlock(&status->spinlock);
  922. worker_register("STATSD");
  923. worker_register_job_name(WORKER_JOB_TYPE_TCP_CONNECTED, "tcp connect");
  924. worker_register_job_name(WORKER_JOB_TYPE_TCP_DISCONNECTED, "tcp disconnect");
  925. worker_register_job_name(WORKER_JOB_TYPE_RCV_DATA, "receive");
  926. worker_register_job_name(WORKER_JOB_TYPE_SND_DATA, "send");
  927. collector_info("STATSD collector thread started with taskid %d", gettid());
  928. struct statsd_udp *d = callocz(sizeof(struct statsd_udp), 1);
  929. d->status = status;
  930. netdata_thread_cleanup_push(statsd_collector_thread_cleanup, d);
  931. #ifdef HAVE_RECVMMSG
  932. d->type = STATSD_SOCKET_DATA_TYPE_UDP;
  933. d->size = statsd.recvmmsg_size;
  934. d->iovecs = callocz(sizeof(struct iovec), d->size);
  935. d->msgs = callocz(sizeof(struct mmsghdr), d->size);
  936. size_t i;
  937. for (i = 0; i < d->size; i++) {
  938. d->iovecs[i].iov_base = mallocz(STATSD_UDP_BUFFER_SIZE);
  939. d->iovecs[i].iov_len = STATSD_UDP_BUFFER_SIZE - 1;
  940. d->msgs[i].msg_hdr.msg_iov = &d->iovecs[i];
  941. d->msgs[i].msg_hdr.msg_iovlen = 1;
  942. }
  943. #endif
  944. poll_events(&statsd.sockets
  945. , statsd_add_callback
  946. , statsd_del_callback
  947. , statsd_rcv_callback
  948. , statsd_snd_callback
  949. , NULL
  950. , statsd_should_stop
  951. , NULL // No access control pattern
  952. , 0 // No dns lookups for access control pattern
  953. , (void *)d
  954. , 0 // tcp request timeout, 0 = disabled
  955. , statsd.tcp_idle_timeout // tcp idle timeout, 0 = disabled
  956. , statsd.update_every * 1000
  957. , ptr // timer_data
  958. , status->max_sockets
  959. );
  960. netdata_thread_cleanup_pop(1);
  961. return NULL;
  962. }
  963. // --------------------------------------------------------------------------------------------------------------------
  964. // statsd applications configuration files parsing
  965. #define STATSD_CONF_LINE_MAX 8192
  966. static STATSD_APP_CHART_DIM_VALUE_TYPE string2valuetype(const char *type, size_t line, const char *filename) {
  967. if(!type || !*type) type = "last";
  968. if(!strcmp(type, "events")) return STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS;
  969. else if(!strcmp(type, "last")) return STATSD_APP_CHART_DIM_VALUE_TYPE_LAST;
  970. else if(!strcmp(type, "min")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MIN;
  971. else if(!strcmp(type, "max")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MAX;
  972. else if(!strcmp(type, "sum")) return STATSD_APP_CHART_DIM_VALUE_TYPE_SUM;
  973. else if(!strcmp(type, "average")) return STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE;
  974. else if(!strcmp(type, "median")) return STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN;
  975. else if(!strcmp(type, "stddev")) return STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV;
  976. else if(!strcmp(type, "percentile")) return STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE;
  977. error("STATSD: invalid type '%s' at line %zu of file '%s'. Using 'last'.", type, line, filename);
  978. return STATSD_APP_CHART_DIM_VALUE_TYPE_LAST;
  979. }
  980. static const char *valuetype2string(STATSD_APP_CHART_DIM_VALUE_TYPE type) {
  981. switch(type) {
  982. case STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS: return "events";
  983. case STATSD_APP_CHART_DIM_VALUE_TYPE_LAST: return "last";
  984. case STATSD_APP_CHART_DIM_VALUE_TYPE_MIN: return "min";
  985. case STATSD_APP_CHART_DIM_VALUE_TYPE_MAX: return "max";
  986. case STATSD_APP_CHART_DIM_VALUE_TYPE_SUM: return "sum";
  987. case STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE: return "average";
  988. case STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN: return "median";
  989. case STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV: return "stddev";
  990. case STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE: return "percentile";
  991. }
  992. return "unknown";
  993. }
  994. static STATSD_APP_CHART_DIM *add_dimension_to_app_chart(
  995. STATSD_APP *app __maybe_unused
  996. , STATSD_APP_CHART *chart
  997. , const char *metric_name
  998. , const char *dim_name
  999. , collected_number multiplier
  1000. , collected_number divisor
  1001. , RRDDIM_FLAGS flags
  1002. , RRDDIM_OPTIONS options
  1003. , STATSD_APP_CHART_DIM_VALUE_TYPE value_type
  1004. ) {
  1005. STATSD_APP_CHART_DIM *dim = callocz(sizeof(STATSD_APP_CHART_DIM), 1);
  1006. dim->metric = strdupz(metric_name);
  1007. dim->metric_hash = simple_hash(dim->metric);
  1008. dim->name = strdupz((dim_name)?dim_name:"");
  1009. dim->multiplier = multiplier;
  1010. dim->divisor = divisor;
  1011. dim->value_type = value_type;
  1012. dim->flags = flags;
  1013. dim->options = options;
  1014. if(!dim->multiplier)
  1015. dim->multiplier = 1;
  1016. if(!dim->divisor)
  1017. dim->divisor = 1;
  1018. // append it to the list of dimension
  1019. STATSD_APP_CHART_DIM *tdim;
  1020. for(tdim = chart->dimensions; tdim && tdim->next ; tdim = tdim->next) ;
  1021. if(!tdim) {
  1022. dim->next = chart->dimensions;
  1023. chart->dimensions = dim;
  1024. }
  1025. else {
  1026. dim->next = tdim->next;
  1027. tdim->next = dim;
  1028. }
  1029. chart->dimensions_count++;
  1030. debug(D_STATSD, "Added dimension '%s' to chart '%s' of app '%s', for metric '%s', with type %u, multiplier " COLLECTED_NUMBER_FORMAT ", divisor " COLLECTED_NUMBER_FORMAT,
  1031. dim->name, chart->id, app->name, dim->metric, dim->value_type, dim->multiplier, dim->divisor);
  1032. return dim;
  1033. }
  1034. static int statsd_readfile(const char *filename, STATSD_APP *app, STATSD_APP_CHART *chart, DICTIONARY *dict) {
  1035. debug(D_STATSD, "STATSD configuration reading file '%s'", filename);
  1036. char *buffer = mallocz(STATSD_CONF_LINE_MAX + 1);
  1037. FILE *fp = fopen(filename, "r");
  1038. if(!fp) {
  1039. error("STATSD: cannot open file '%s'.", filename);
  1040. freez(buffer);
  1041. return -1;
  1042. }
  1043. size_t line = 0;
  1044. char *s;
  1045. while(fgets(buffer, STATSD_CONF_LINE_MAX, fp) != NULL) {
  1046. buffer[STATSD_CONF_LINE_MAX] = '\0';
  1047. line++;
  1048. s = trim(buffer);
  1049. if (!s || *s == '#') {
  1050. debug(D_STATSD, "STATSD: ignoring line %zu of file '%s', it is empty.", line, filename);
  1051. continue;
  1052. }
  1053. debug(D_STATSD, "STATSD: processing line %zu of file '%s': %s", line, filename, buffer);
  1054. if(*s == 'i' && strncmp(s, "include", 7) == 0) {
  1055. s = trim(&s[7]);
  1056. if(s && *s) {
  1057. char *tmp;
  1058. if(*s == '/')
  1059. tmp = strdupz(s);
  1060. else {
  1061. // the file to be included is relative to current file
  1062. // find the directory name from the file we already read
  1063. char *filename2 = strdupz(filename); // copy filename, since dirname() will change it
  1064. char *dir = dirname(filename2); // find the directory part of the filename
  1065. tmp = strdupz_path_subpath(dir, s); // compose the new filename to read;
  1066. freez(filename2); // free the filename we copied
  1067. }
  1068. statsd_readfile(tmp, app, chart, dict);
  1069. freez(tmp);
  1070. }
  1071. else
  1072. error("STATSD: ignoring line %zu of file '%s', include filename is empty", line, filename);
  1073. continue;
  1074. }
  1075. int len = (int) strlen(s);
  1076. if (*s == '[' && s[len - 1] == ']') {
  1077. // new section
  1078. s[len - 1] = '\0';
  1079. s++;
  1080. if (!strcmp(s, "app")) {
  1081. // a new app
  1082. app = callocz(sizeof(STATSD_APP), 1);
  1083. app->name = strdupz("unnamed");
  1084. app->rrd_memory_mode = localhost->rrd_memory_mode;
  1085. app->rrd_history_entries = localhost->rrd_history_entries;
  1086. app->next = statsd.apps;
  1087. statsd.apps = app;
  1088. chart = NULL;
  1089. dict = NULL;
  1090. {
  1091. char lineandfile[FILENAME_MAX + 1];
  1092. snprintfz(lineandfile, FILENAME_MAX, "%zu@%s", line, filename);
  1093. app->source = strdupz(lineandfile);
  1094. }
  1095. }
  1096. else if(app) {
  1097. if(!strcmp(s, "dictionary")) {
  1098. if(!app->dict)
  1099. app->dict = dictionary_create_advanced(DICT_OPTION_SINGLE_THREADED, &dictionary_stats_category_collectors, 0);
  1100. dict = app->dict;
  1101. }
  1102. else {
  1103. dict = NULL;
  1104. // a new chart
  1105. chart = callocz(sizeof(STATSD_APP_CHART), 1);
  1106. netdata_fix_chart_id(s);
  1107. chart->id = strdupz(s);
  1108. chart->name = strdupz(s);
  1109. chart->title = strdupz("Statsd chart");
  1110. chart->context = strdupz(s);
  1111. chart->family = strdupz("overview");
  1112. chart->units = strdupz("value");
  1113. chart->priority = NETDATA_CHART_PRIO_STATSD_PRIVATE;
  1114. chart->chart_type = RRDSET_TYPE_LINE;
  1115. chart->next = app->charts;
  1116. app->charts = chart;
  1117. if (!strncmp(
  1118. filename,
  1119. netdata_configured_stock_config_dir,
  1120. strlen(netdata_configured_stock_config_dir))) {
  1121. char tmpfilename[FILENAME_MAX + 1];
  1122. strncpyz(tmpfilename, filename, FILENAME_MAX);
  1123. chart->module = strdupz(basename(tmpfilename));
  1124. } else {
  1125. chart->module = strdupz("synthetic_chart");
  1126. }
  1127. }
  1128. }
  1129. else
  1130. error("STATSD: ignoring line %zu ('%s') of file '%s', [app] is not defined.", line, s, filename);
  1131. continue;
  1132. }
  1133. if(!app) {
  1134. error("STATSD: ignoring line %zu ('%s') of file '%s', it is outside all sections.", line, s, filename);
  1135. continue;
  1136. }
  1137. char *name = s;
  1138. char *value = strchr(s, '=');
  1139. if(!value) {
  1140. error("STATSD: ignoring line %zu ('%s') of file '%s', there is no = in it.", line, s, filename);
  1141. continue;
  1142. }
  1143. *value = '\0';
  1144. value++;
  1145. name = trim(name);
  1146. value = trim(value);
  1147. if(!name || *name == '#') {
  1148. error("STATSD: ignoring line %zu of file '%s', name is empty.", line, filename);
  1149. continue;
  1150. }
  1151. if(!value) {
  1152. debug(D_CONFIG, "STATSD: ignoring line %zu of file '%s', value is empty.", line, filename);
  1153. continue;
  1154. }
  1155. if(unlikely(dict)) {
  1156. // parse [dictionary] members
  1157. dictionary_set(dict, name, value, strlen(value) + 1);
  1158. }
  1159. else if(!chart) {
  1160. // parse [app] members
  1161. if(!strcmp(name, "name")) {
  1162. freez((void *)app->name);
  1163. netdata_fix_chart_name(value);
  1164. app->name = strdupz(value);
  1165. }
  1166. else if (!strcmp(name, "metrics")) {
  1167. simple_pattern_free(app->metrics);
  1168. app->metrics = simple_pattern_create(value, NULL, SIMPLE_PATTERN_EXACT);
  1169. }
  1170. else if (!strcmp(name, "private charts")) {
  1171. if (!strcmp(value, "yes") || !strcmp(value, "on"))
  1172. app->default_options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1173. else
  1174. app->default_options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1175. }
  1176. else if (!strcmp(name, "gaps when not collected")) {
  1177. if (!strcmp(value, "yes") || !strcmp(value, "on"))
  1178. app->default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1179. }
  1180. else if (!strcmp(name, "memory mode")) {
  1181. // this is not supported anymore
  1182. // with the implementation of storage engines, all charts have the same storage engine always
  1183. // app->rrd_memory_mode = rrd_memory_mode_id(value);
  1184. ;
  1185. }
  1186. else if (!strcmp(name, "history")) {
  1187. app->rrd_history_entries = atol(value);
  1188. if (app->rrd_history_entries < 5)
  1189. app->rrd_history_entries = 5;
  1190. }
  1191. else {
  1192. error("STATSD: ignoring line %zu ('%s') of file '%s'. Unknown keyword for the [app] section.", line, name, filename);
  1193. continue;
  1194. }
  1195. }
  1196. else {
  1197. // parse [chart] members
  1198. if(!strcmp(name, "name")) {
  1199. freez((void *)chart->name);
  1200. netdata_fix_chart_id(value);
  1201. chart->name = strdupz(value);
  1202. }
  1203. else if(!strcmp(name, "title")) {
  1204. freez((void *)chart->title);
  1205. chart->title = strdupz(value);
  1206. }
  1207. else if (!strcmp(name, "family")) {
  1208. freez((void *)chart->family);
  1209. chart->family = strdupz(value);
  1210. }
  1211. else if (!strcmp(name, "context")) {
  1212. freez((void *)chart->context);
  1213. netdata_fix_chart_id(value);
  1214. chart->context = strdupz(value);
  1215. }
  1216. else if (!strcmp(name, "units")) {
  1217. freez((void *)chart->units);
  1218. chart->units = strdupz(value);
  1219. }
  1220. else if (!strcmp(name, "priority")) {
  1221. chart->priority = atol(value);
  1222. }
  1223. else if (!strcmp(name, "type")) {
  1224. chart->chart_type = rrdset_type_id(value);
  1225. }
  1226. else if (!strcmp(name, "dimension")) {
  1227. // metric [name [type [multiplier [divisor]]]]
  1228. char *words[10] = { NULL };
  1229. size_t num_words = pluginsd_split_words(value, words, 10, NULL, NULL, 0);
  1230. int pattern = 0;
  1231. size_t i = 0;
  1232. char *metric_name = get_word(words, num_words, i++);
  1233. if(strcmp(metric_name, "pattern") == 0) {
  1234. metric_name = get_word(words, num_words, i++);
  1235. pattern = 1;
  1236. }
  1237. char *dim_name = get_word(words, num_words, i++);
  1238. char *type = get_word(words, num_words, i++);
  1239. char *multiplier = get_word(words, num_words, i++);
  1240. char *divisor = get_word(words, num_words, i++);
  1241. char *opts = get_word(words, num_words, i++);
  1242. RRDDIM_FLAGS flags = RRDDIM_FLAG_NONE;
  1243. RRDDIM_OPTIONS options = RRDDIM_OPTION_NONE;
  1244. if(opts && *opts) {
  1245. if(strstr(opts, "hidden") != NULL) options |= RRDDIM_OPTION_HIDDEN;
  1246. if(strstr(opts, "noreset") != NULL) options |= RRDDIM_OPTION_DONT_DETECT_RESETS_OR_OVERFLOWS;
  1247. if(strstr(opts, "nooverflow") != NULL) options |= RRDDIM_OPTION_DONT_DETECT_RESETS_OR_OVERFLOWS;
  1248. }
  1249. if(!pattern) {
  1250. if(app->dict) {
  1251. if(dim_name && *dim_name) {
  1252. char *n = dictionary_get(app->dict, dim_name);
  1253. if(n) dim_name = n;
  1254. }
  1255. else {
  1256. dim_name = dictionary_get(app->dict, metric_name);
  1257. }
  1258. }
  1259. if(!dim_name || !*dim_name)
  1260. dim_name = metric_name;
  1261. }
  1262. STATSD_APP_CHART_DIM *dim = add_dimension_to_app_chart(
  1263. app
  1264. , chart
  1265. , metric_name
  1266. , dim_name
  1267. , (multiplier && *multiplier)?str2l(multiplier):1
  1268. , (divisor && *divisor)?str2l(divisor):1
  1269. , flags
  1270. ,
  1271. options, string2valuetype(type, line, filename)
  1272. );
  1273. if(pattern)
  1274. dim->metric_pattern = simple_pattern_create(dim->metric, NULL, SIMPLE_PATTERN_EXACT);
  1275. }
  1276. else {
  1277. error("STATSD: ignoring line %zu ('%s') of file '%s'. Unknown keyword for the [%s] section.", line, name, filename, chart->id);
  1278. continue;
  1279. }
  1280. }
  1281. }
  1282. freez(buffer);
  1283. fclose(fp);
  1284. return 0;
  1285. }
  1286. static int statsd_file_callback(const char *filename, void *data) {
  1287. (void)data;
  1288. return statsd_readfile(filename, NULL, NULL, NULL);
  1289. }
  1290. static inline void statsd_readdir(const char *user_path, const char *stock_path, const char *subpath) {
  1291. recursive_config_double_dir_load(user_path, stock_path, subpath, statsd_file_callback, NULL, 0);
  1292. }
  1293. // --------------------------------------------------------------------------------------------------------------------
  1294. // send metrics to netdata - in private charts - called from the main thread
  1295. // extract chart type and chart id from metric name
  1296. static inline void statsd_get_metric_type_and_id(STATSD_METRIC *m, char *type, char *id, char *context, const char *metrictype, size_t len) {
  1297. // The full chart type.id looks like this:
  1298. // ${STATSD_CHART_PREFIX} + "_" + ${METRIC_NAME} + "_" + ${METRIC_TYPE}
  1299. //
  1300. // where:
  1301. // STATSD_CHART_PREFIX = "statsd" as defined above
  1302. // METRIC_NAME = whatever the user gave to statsd
  1303. // METRIC_TYPE = "gauge", "counter", "meter", "timer", "histogram", "set", "dictionary"
  1304. // for chart type, we want:
  1305. // ${STATSD_CHART_PREFIX} + "_" + the first word of ${METRIC_NAME}
  1306. // find the first word of ${METRIC_NAME}
  1307. char firstword[len + 1], *s = "";
  1308. strncpyz(firstword, m->name, len);
  1309. for (s = firstword; *s ; s++) {
  1310. if (unlikely(*s == '.' || *s == '_')) {
  1311. *s = '\0';
  1312. s++;
  1313. break;
  1314. }
  1315. }
  1316. // firstword has the first word of ${METRIC_NAME}
  1317. // s has the remaining, if any
  1318. // create the chart type:
  1319. snprintfz(type, len, STATSD_CHART_PREFIX "_%s", firstword);
  1320. // for chart id, we want:
  1321. // the remaining of the words of ${METRIC_NAME} + "_" + ${METRIC_TYPE}
  1322. // or the ${METRIC_NAME} has no remaining words, the ${METRIC_TYPE} alone
  1323. if(*s)
  1324. snprintfz(id, len, "%s_%s", s, metrictype);
  1325. else
  1326. snprintfz(id, len, "%s", metrictype);
  1327. // for the context, we want the full of both the above, separated with a dot (type.id):
  1328. snprintfz(context, RRD_ID_LENGTH_MAX, "%s.%s", type, id);
  1329. // make sure they don't have illegal characters
  1330. netdata_fix_chart_id(type);
  1331. netdata_fix_chart_id(id);
  1332. netdata_fix_chart_id(context);
  1333. }
  1334. static inline RRDSET *statsd_private_rrdset_create(
  1335. STATSD_METRIC *m __maybe_unused
  1336. , const char *type
  1337. , const char *id
  1338. , const char *name
  1339. , const char *family
  1340. , const char *context
  1341. , const char *title
  1342. , const char *units
  1343. , long priority
  1344. , int update_every
  1345. , RRDSET_TYPE chart_type
  1346. ) {
  1347. if(!m->st)
  1348. statsd.private_charts++;
  1349. RRDSET *st = rrdset_create_custom(
  1350. localhost // host
  1351. , type // type
  1352. , id // id
  1353. , name // name
  1354. , family // family
  1355. , context // context
  1356. , title // title
  1357. , units // units
  1358. , PLUGIN_STATSD_NAME // plugin
  1359. , "private_chart" // module
  1360. , priority // priority
  1361. , update_every // update every
  1362. , chart_type // chart type
  1363. , default_rrd_memory_mode // memory mode
  1364. , default_rrd_history_entries // history
  1365. );
  1366. rrdset_flag_set(st, RRDSET_FLAG_STORE_FIRST);
  1367. if(statsd.private_charts_hidden)
  1368. rrdset_flag_set(st, RRDSET_FLAG_HIDDEN);
  1369. // rrdset_flag_set(st, RRDSET_FLAG_DEBUG);
  1370. return st;
  1371. }
  1372. static inline void statsd_private_chart_gauge(STATSD_METRIC *m) {
  1373. debug(D_STATSD, "updating private chart for gauge metric '%s'", m->name);
  1374. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1375. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1376. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1377. statsd_get_metric_type_and_id(m, type, id, context, "gauge", RRD_ID_LENGTH_MAX);
  1378. char title[RRD_ID_LENGTH_MAX + 1];
  1379. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for gauge %s", m->name);
  1380. m->st = statsd_private_rrdset_create(
  1381. m
  1382. , type
  1383. , id
  1384. , NULL // name
  1385. , m->family?m->family:"gauges" // family (submenu)
  1386. , context // context
  1387. , title // title
  1388. , m->units?m->units:"value" // units
  1389. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1390. , statsd.update_every
  1391. , RRDSET_TYPE_LINE
  1392. );
  1393. m->rd_value = rrddim_add(m->st, "gauge", m->dimname?m->dimname:NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1394. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1395. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1396. }
  1397. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1398. if(m->rd_count)
  1399. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1400. rrdset_done(m->st);
  1401. }
  1402. static inline void statsd_private_chart_counter_or_meter(STATSD_METRIC *m, const char *dim, const char *family) {
  1403. debug(D_STATSD, "updating private chart for %s metric '%s'", dim, m->name);
  1404. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1405. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1406. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1407. statsd_get_metric_type_and_id(m, type, id, context, dim, RRD_ID_LENGTH_MAX);
  1408. char title[RRD_ID_LENGTH_MAX + 1];
  1409. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for %s %s", dim, m->name);
  1410. m->st = statsd_private_rrdset_create(
  1411. m
  1412. , type
  1413. , id
  1414. , NULL // name
  1415. , m->family?m->family:family // family (submenu)
  1416. , context // context
  1417. , title // title
  1418. , m->units?m->units:"events/s" // units
  1419. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1420. , statsd.update_every
  1421. , RRDSET_TYPE_AREA
  1422. );
  1423. m->rd_value = rrddim_add(m->st, dim, m->dimname?m->dimname:NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1424. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1425. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1426. }
  1427. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1428. if(m->rd_count)
  1429. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1430. rrdset_done(m->st);
  1431. }
  1432. static inline void statsd_private_chart_set(STATSD_METRIC *m) {
  1433. debug(D_STATSD, "updating private chart for set metric '%s'", m->name);
  1434. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1435. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1436. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1437. statsd_get_metric_type_and_id(m, type, id, context, "set", RRD_ID_LENGTH_MAX);
  1438. char title[RRD_ID_LENGTH_MAX + 1];
  1439. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for set %s", m->name);
  1440. m->st = statsd_private_rrdset_create(
  1441. m
  1442. , type
  1443. , id
  1444. , NULL // name
  1445. , m->family?m->family:"sets" // family (submenu)
  1446. , context // context
  1447. , title // title
  1448. , m->units?m->units:"entries" // units
  1449. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1450. , statsd.update_every
  1451. , RRDSET_TYPE_LINE
  1452. );
  1453. m->rd_value = rrddim_add(m->st, "set", m->dimname?m->dimname:"unique", 1, 1, RRD_ALGORITHM_ABSOLUTE);
  1454. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1455. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1456. }
  1457. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1458. if(m->rd_count)
  1459. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1460. rrdset_done(m->st);
  1461. }
  1462. static inline void statsd_private_chart_dictionary(STATSD_METRIC *m) {
  1463. debug(D_STATSD, "updating private chart for dictionary metric '%s'", m->name);
  1464. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1465. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1466. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1467. statsd_get_metric_type_and_id(m, type, id, context, "dictionary", RRD_ID_LENGTH_MAX);
  1468. char title[RRD_ID_LENGTH_MAX + 1];
  1469. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for dictionary %s", m->name);
  1470. m->st = statsd_private_rrdset_create(
  1471. m
  1472. , type
  1473. , id
  1474. , NULL // name
  1475. , m->family?m->family:"dictionaries" // family (submenu)
  1476. , context // context
  1477. , title // title
  1478. , m->units?m->units:"events/s" // units
  1479. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1480. , statsd.update_every
  1481. , RRDSET_TYPE_STACKED
  1482. );
  1483. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1484. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1485. }
  1486. STATSD_METRIC_DICTIONARY_ITEM *t;
  1487. dfe_start_read(m->dictionary.dict, t) {
  1488. if (!t->rd) t->rd = rrddim_add(m->st, t_dfe.name, NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1489. rrddim_set_by_pointer(m->st, t->rd, (collected_number)t->count);
  1490. }
  1491. dfe_done(t);
  1492. if(m->rd_count)
  1493. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1494. rrdset_done(m->st);
  1495. }
  1496. static inline void statsd_private_chart_timer_or_histogram(STATSD_METRIC *m, const char *dim, const char *family, const char *units) {
  1497. debug(D_STATSD, "updating private chart for %s metric '%s'", dim, m->name);
  1498. if(unlikely(!m->st || m->options & STATSD_METRIC_OPTION_UPDATED_CHART_METADATA)) {
  1499. m->options &= ~STATSD_METRIC_OPTION_UPDATED_CHART_METADATA;
  1500. char type[RRD_ID_LENGTH_MAX + 1], id[RRD_ID_LENGTH_MAX + 1], context[RRD_ID_LENGTH_MAX + 1];
  1501. statsd_get_metric_type_and_id(m, type, id, context, dim, RRD_ID_LENGTH_MAX);
  1502. char title[RRD_ID_LENGTH_MAX + 1];
  1503. snprintfz(title, RRD_ID_LENGTH_MAX, "statsd private chart for %s %s", dim, m->name);
  1504. m->st = statsd_private_rrdset_create(
  1505. m
  1506. , type
  1507. , id
  1508. , NULL // name
  1509. , m->family?m->family:family // family (submenu)
  1510. , context // context
  1511. , title // title
  1512. , m->units?m->units:units // units
  1513. , NETDATA_CHART_PRIO_STATSD_PRIVATE
  1514. , statsd.update_every
  1515. , RRDSET_TYPE_AREA
  1516. );
  1517. m->histogram.ext->rd_min = rrddim_add(m->st, "min", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1518. m->histogram.ext->rd_max = rrddim_add(m->st, "max", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1519. m->rd_value = rrddim_add(m->st, "average", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1520. m->histogram.ext->rd_percentile = rrddim_add(m->st, statsd.histogram_percentile_str, NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1521. m->histogram.ext->rd_median = rrddim_add(m->st, "median", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1522. m->histogram.ext->rd_stddev = rrddim_add(m->st, "stddev", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1523. //m->histogram.ext->rd_sum = rrddim_add(m->st, "sum", NULL, 1, statsd.decimal_detail, RRD_ALGORITHM_ABSOLUTE);
  1524. if(m->options & STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT)
  1525. m->rd_count = rrddim_add(m->st, "events", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  1526. }
  1527. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_min, m->histogram.ext->last_min);
  1528. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_max, m->histogram.ext->last_max);
  1529. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_percentile, m->histogram.ext->last_percentile);
  1530. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_median, m->histogram.ext->last_median);
  1531. rrddim_set_by_pointer(m->st, m->histogram.ext->rd_stddev, m->histogram.ext->last_stddev);
  1532. //rrddim_set_by_pointer(m->st, m->histogram.ext->rd_sum, m->histogram.ext->last_sum);
  1533. rrddim_set_by_pointer(m->st, m->rd_value, m->last);
  1534. if(m->rd_count)
  1535. rrddim_set_by_pointer(m->st, m->rd_count, m->events);
  1536. rrdset_done(m->st);
  1537. }
  1538. // --------------------------------------------------------------------------------------------------------------------
  1539. // statsd flush metrics
  1540. static inline void statsd_flush_gauge(STATSD_METRIC *m) {
  1541. debug(D_STATSD, "flushing gauge metric '%s'", m->name);
  1542. int updated = 0;
  1543. if(unlikely(!m->reset && m->count)) {
  1544. m->last = (collected_number) (m->gauge.value * statsd.decimal_detail);
  1545. m->reset = 1;
  1546. updated = 1;
  1547. }
  1548. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1549. statsd_private_chart_gauge(m);
  1550. }
  1551. static inline void statsd_flush_counter_or_meter(STATSD_METRIC *m, const char *dim, const char *family) {
  1552. debug(D_STATSD, "flushing %s metric '%s'", dim, m->name);
  1553. int updated = 0;
  1554. if(unlikely(!m->reset && m->count)) {
  1555. m->last = m->counter.value;
  1556. m->reset = 1;
  1557. updated = 1;
  1558. }
  1559. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1560. statsd_private_chart_counter_or_meter(m, dim, family);
  1561. }
  1562. static inline void statsd_flush_counter(STATSD_METRIC *m) {
  1563. statsd_flush_counter_or_meter(m, "counter", "counters");
  1564. }
  1565. static inline void statsd_flush_meter(STATSD_METRIC *m) {
  1566. statsd_flush_counter_or_meter(m, "meter", "meters");
  1567. }
  1568. static inline void statsd_flush_set(STATSD_METRIC *m) {
  1569. debug(D_STATSD, "flushing set metric '%s'", m->name);
  1570. int updated = 0;
  1571. if(unlikely(!m->reset && m->count)) {
  1572. m->last = (collected_number)m->set.unique;
  1573. m->reset = 1;
  1574. updated = 1;
  1575. }
  1576. else {
  1577. m->last = 0;
  1578. }
  1579. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1580. statsd_private_chart_set(m);
  1581. }
  1582. static inline void statsd_flush_dictionary(STATSD_METRIC *m) {
  1583. debug(D_STATSD, "flushing dictionary metric '%s'", m->name);
  1584. int updated = 0;
  1585. if(unlikely(!m->reset && m->count)) {
  1586. m->last = (collected_number)m->dictionary.unique;
  1587. m->reset = 1;
  1588. updated = 1;
  1589. }
  1590. else {
  1591. m->last = 0;
  1592. }
  1593. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1594. statsd_private_chart_dictionary(m);
  1595. if(m->dictionary.unique >= statsd.dictionary_max_unique) {
  1596. if(!(m->options & STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED)) {
  1597. m->options |= STATSD_METRIC_OPTION_COLLECTION_FULL_LOGGED;
  1598. collector_info(
  1599. "STATSD dictionary '%s' reach max of %zu items - try increasing 'dictionaries max unique dimensions' in netdata.conf",
  1600. m->name,
  1601. m->dictionary.unique);
  1602. }
  1603. }
  1604. }
  1605. static inline void statsd_flush_timer_or_histogram(STATSD_METRIC *m, const char *dim, const char *family, const char *units) {
  1606. debug(D_STATSD, "flushing %s metric '%s'", dim, m->name);
  1607. int updated = 0;
  1608. if(unlikely(!m->reset && m->count && m->histogram.ext->used > 0)) {
  1609. netdata_mutex_lock(&m->histogram.ext->mutex);
  1610. size_t len = m->histogram.ext->used;
  1611. NETDATA_DOUBLE *series = m->histogram.ext->values;
  1612. sort_series(series, len);
  1613. m->histogram.ext->last_min = (collected_number)roundndd(series[0] * statsd.decimal_detail);
  1614. m->histogram.ext->last_max = (collected_number)roundndd(series[len - 1] * statsd.decimal_detail);
  1615. m->last = (collected_number)roundndd(average(series, len) * statsd.decimal_detail);
  1616. m->histogram.ext->last_median = (collected_number)roundndd(median_on_sorted_series(series, len) * statsd.decimal_detail);
  1617. m->histogram.ext->last_stddev = (collected_number)roundndd(standard_deviation(series, len) * statsd.decimal_detail);
  1618. m->histogram.ext->last_sum = (collected_number)roundndd(sum(series, len) * statsd.decimal_detail);
  1619. size_t pct_len = (size_t)floor((double)len * statsd.histogram_percentile / 100.0);
  1620. if(pct_len < 1)
  1621. m->histogram.ext->last_percentile = (collected_number)(series[0] * statsd.decimal_detail);
  1622. else
  1623. m->histogram.ext->last_percentile = (collected_number)roundndd(series[pct_len - 1] * statsd.decimal_detail);
  1624. netdata_mutex_unlock(&m->histogram.ext->mutex);
  1625. debug(D_STATSD, "STATSD %s metric %s: min " COLLECTED_NUMBER_FORMAT ", max " COLLECTED_NUMBER_FORMAT ", last " COLLECTED_NUMBER_FORMAT ", pcent " COLLECTED_NUMBER_FORMAT ", median " COLLECTED_NUMBER_FORMAT ", stddev " COLLECTED_NUMBER_FORMAT ", sum " COLLECTED_NUMBER_FORMAT,
  1626. dim, m->name, m->histogram.ext->last_min, m->histogram.ext->last_max, m->last, m->histogram.ext->last_percentile, m->histogram.ext->last_median, m->histogram.ext->last_stddev, m->histogram.ext->last_sum);
  1627. m->histogram.ext->zeroed = 0;
  1628. m->reset = 1;
  1629. updated = 1;
  1630. }
  1631. else if(unlikely(!m->histogram.ext->zeroed)) {
  1632. // reset the metrics
  1633. // if we collected anything, they will be updated below
  1634. // this ensures that we report zeros if nothing is collected
  1635. m->histogram.ext->last_min = 0;
  1636. m->histogram.ext->last_max = 0;
  1637. m->last = 0;
  1638. m->histogram.ext->last_median = 0;
  1639. m->histogram.ext->last_stddev = 0;
  1640. m->histogram.ext->last_sum = 0;
  1641. m->histogram.ext->last_percentile = 0;
  1642. m->histogram.ext->zeroed = 1;
  1643. }
  1644. if(unlikely(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED && (updated || !(m->options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED))))
  1645. statsd_private_chart_timer_or_histogram(m, dim, family, units);
  1646. }
  1647. static inline void statsd_flush_timer(STATSD_METRIC *m) {
  1648. statsd_flush_timer_or_histogram(m, "timer", "timers", "milliseconds");
  1649. }
  1650. static inline void statsd_flush_histogram(STATSD_METRIC *m) {
  1651. statsd_flush_timer_or_histogram(m, "histogram", "histograms", "value");
  1652. }
  1653. static inline RRD_ALGORITHM statsd_algorithm_for_metric(STATSD_METRIC *m) {
  1654. switch(m->type) {
  1655. default:
  1656. case STATSD_METRIC_TYPE_GAUGE:
  1657. case STATSD_METRIC_TYPE_SET:
  1658. case STATSD_METRIC_TYPE_TIMER:
  1659. case STATSD_METRIC_TYPE_HISTOGRAM:
  1660. return RRD_ALGORITHM_ABSOLUTE;
  1661. case STATSD_METRIC_TYPE_METER:
  1662. case STATSD_METRIC_TYPE_COUNTER:
  1663. case STATSD_METRIC_TYPE_DICTIONARY:
  1664. return RRD_ALGORITHM_INCREMENTAL;
  1665. }
  1666. }
  1667. static inline void link_metric_to_app_dimension(STATSD_APP *app, STATSD_METRIC *m, STATSD_APP_CHART *chart, STATSD_APP_CHART_DIM *dim) {
  1668. if(dim->value_type == STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS) {
  1669. dim->value_ptr = &m->events;
  1670. dim->algorithm = RRD_ALGORITHM_INCREMENTAL;
  1671. }
  1672. else if(m->type == STATSD_METRIC_TYPE_HISTOGRAM || m->type == STATSD_METRIC_TYPE_TIMER) {
  1673. dim->algorithm = RRD_ALGORITHM_ABSOLUTE;
  1674. dim->divisor *= statsd.decimal_detail;
  1675. switch(dim->value_type) {
  1676. case STATSD_APP_CHART_DIM_VALUE_TYPE_EVENTS:
  1677. // will never match - added to avoid warning
  1678. break;
  1679. case STATSD_APP_CHART_DIM_VALUE_TYPE_LAST:
  1680. case STATSD_APP_CHART_DIM_VALUE_TYPE_AVERAGE:
  1681. dim->value_ptr = &m->last;
  1682. break;
  1683. case STATSD_APP_CHART_DIM_VALUE_TYPE_SUM:
  1684. dim->value_ptr = &m->histogram.ext->last_sum;
  1685. break;
  1686. case STATSD_APP_CHART_DIM_VALUE_TYPE_MIN:
  1687. dim->value_ptr = &m->histogram.ext->last_min;
  1688. break;
  1689. case STATSD_APP_CHART_DIM_VALUE_TYPE_MAX:
  1690. dim->value_ptr = &m->histogram.ext->last_max;
  1691. break;
  1692. case STATSD_APP_CHART_DIM_VALUE_TYPE_MEDIAN:
  1693. dim->value_ptr = &m->histogram.ext->last_median;
  1694. break;
  1695. case STATSD_APP_CHART_DIM_VALUE_TYPE_PERCENTILE:
  1696. dim->value_ptr = &m->histogram.ext->last_percentile;
  1697. break;
  1698. case STATSD_APP_CHART_DIM_VALUE_TYPE_STDDEV:
  1699. dim->value_ptr = &m->histogram.ext->last_stddev;
  1700. break;
  1701. }
  1702. }
  1703. else {
  1704. if (dim->value_type != STATSD_APP_CHART_DIM_VALUE_TYPE_LAST)
  1705. error("STATSD: unsupported value type for dimension '%s' of chart '%s' of app '%s' on metric '%s'", dim->name, chart->id, app->name, m->name);
  1706. dim->value_ptr = &m->last;
  1707. dim->algorithm = statsd_algorithm_for_metric(m);
  1708. if(m->type == STATSD_METRIC_TYPE_GAUGE)
  1709. dim->divisor *= statsd.decimal_detail;
  1710. }
  1711. if(unlikely(chart->st && dim->rd)) {
  1712. rrddim_set_algorithm(chart->st, dim->rd, dim->algorithm);
  1713. rrddim_set_multiplier(chart->st, dim->rd, dim->multiplier);
  1714. rrddim_set_divisor(chart->st, dim->rd, dim->divisor);
  1715. }
  1716. chart->dimensions_linked_count++;
  1717. m->options |= STATSD_METRIC_OPTION_USED_IN_APPS;
  1718. debug(D_STATSD, "metric '%s' of type %u linked with app '%s', chart '%s', dimension '%s', algorithm '%s'", m->name, m->type, app->name, chart->id, dim->name, rrd_algorithm_name(dim->algorithm));
  1719. }
  1720. static inline void check_if_metric_is_for_app(STATSD_INDEX *index, STATSD_METRIC *m) {
  1721. (void)index;
  1722. STATSD_APP *app;
  1723. for(app = statsd.apps; app ;app = app->next) {
  1724. if(unlikely(simple_pattern_matches(app->metrics, m->name))) {
  1725. debug(D_STATSD, "metric '%s' matches app '%s'", m->name, app->name);
  1726. // the metric should get the options from the app
  1727. if(app->default_options & STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED)
  1728. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1729. else
  1730. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1731. if(app->default_options & STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED)
  1732. m->options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1733. else
  1734. m->options &= ~STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  1735. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED;
  1736. // check if there is a chart in this app, willing to get this metric
  1737. STATSD_APP_CHART *chart;
  1738. for(chart = app->charts; chart; chart = chart->next) {
  1739. STATSD_APP_CHART_DIM *dim;
  1740. for(dim = chart->dimensions; dim ; dim = dim->next) {
  1741. if(unlikely(dim->metric_pattern)) {
  1742. size_t dim_name_len = strlen(dim->name);
  1743. size_t wildcarded_len = dim_name_len + strlen(m->name) + 1;
  1744. char wildcarded[wildcarded_len];
  1745. strcpy(wildcarded, dim->name);
  1746. char *ws = &wildcarded[dim_name_len];
  1747. if(simple_pattern_matches_extract(dim->metric_pattern, m->name, ws, wildcarded_len - dim_name_len)) {
  1748. char *final_name = NULL;
  1749. if(app->dict) {
  1750. if(likely(*wildcarded)) {
  1751. // use the name of the wildcarded string
  1752. final_name = dictionary_get(app->dict, wildcarded);
  1753. }
  1754. if(unlikely(!final_name)) {
  1755. // use the name of the metric
  1756. final_name = dictionary_get(app->dict, m->name);
  1757. }
  1758. }
  1759. if(unlikely(!final_name))
  1760. final_name = wildcarded;
  1761. add_dimension_to_app_chart(
  1762. app
  1763. , chart
  1764. , m->name
  1765. , final_name
  1766. , dim->multiplier
  1767. , dim->divisor
  1768. , dim->flags
  1769. , dim->options
  1770. , dim->value_type
  1771. );
  1772. // the new dimension is appended to the list
  1773. // so, it will be matched and linked later too
  1774. }
  1775. }
  1776. else if(!dim->value_ptr && dim->metric_hash == m->hash && !strcmp(dim->metric, m->name)) {
  1777. // we have a match - this metric should be linked to this dimension
  1778. link_metric_to_app_dimension(app, m, chart, dim);
  1779. }
  1780. }
  1781. }
  1782. }
  1783. }
  1784. }
  1785. static inline RRDDIM *statsd_add_dim_to_app_chart(STATSD_APP *app, STATSD_APP_CHART *chart, STATSD_APP_CHART_DIM *dim) {
  1786. (void)app;
  1787. // allow the same statsd metric to be added multiple times to the same chart
  1788. STATSD_APP_CHART_DIM *tdim;
  1789. size_t count_same_metric = 0, count_same_metric_value_type = 0;
  1790. size_t pos_same_metric_value_type = 0;
  1791. for (tdim = chart->dimensions; tdim && tdim->next; tdim = tdim->next) {
  1792. if (dim->metric_hash == tdim->metric_hash && !strcmp(dim->metric, tdim->metric)) {
  1793. count_same_metric++;
  1794. if(dim->value_type == tdim->value_type) {
  1795. count_same_metric_value_type++;
  1796. if (tdim == dim)
  1797. pos_same_metric_value_type = count_same_metric_value_type;
  1798. }
  1799. }
  1800. }
  1801. if(count_same_metric > 1) {
  1802. // the same metric is found multiple times
  1803. size_t len = strlen(dim->metric) + 100;
  1804. char metric[ len + 1 ];
  1805. if(count_same_metric_value_type > 1) {
  1806. // the same metric, with the same value type, is added multiple times
  1807. snprintfz(metric, len, "%s_%s%zu", dim->metric, valuetype2string(dim->value_type), pos_same_metric_value_type);
  1808. }
  1809. else {
  1810. // the same metric, with different value type is added
  1811. snprintfz(metric, len, "%s_%s", dim->metric, valuetype2string(dim->value_type));
  1812. }
  1813. dim->rd = rrddim_add(chart->st, metric, dim->name, dim->multiplier, dim->divisor, dim->algorithm);
  1814. if(dim->flags != RRDDIM_FLAG_NONE) dim->rd->flags |= dim->flags;
  1815. if(dim->options != RRDDIM_OPTION_NONE) dim->rd->options |= dim->options;
  1816. return dim->rd;
  1817. }
  1818. dim->rd = rrddim_add(chart->st, dim->metric, dim->name, dim->multiplier, dim->divisor, dim->algorithm);
  1819. if(dim->flags != RRDDIM_FLAG_NONE) dim->rd->flags |= dim->flags;
  1820. if(dim->options != RRDDIM_OPTION_NONE) dim->rd->options |= dim->options;
  1821. return dim->rd;
  1822. }
  1823. static inline void statsd_update_app_chart(STATSD_APP *app, STATSD_APP_CHART *chart) {
  1824. debug(D_STATSD, "updating chart '%s' for app '%s'", chart->id, app->name);
  1825. if(!chart->st) {
  1826. chart->st = rrdset_create_custom(
  1827. localhost // host
  1828. , app->name // type
  1829. , chart->id // id
  1830. , chart->name // name
  1831. , chart->family // family
  1832. , chart->context // context
  1833. , chart->title // title
  1834. , chart->units // units
  1835. , PLUGIN_STATSD_NAME // plugin
  1836. , chart->module // module
  1837. , chart->priority // priority
  1838. , statsd.update_every // update every
  1839. , chart->chart_type // chart type
  1840. , app->rrd_memory_mode // memory mode
  1841. , app->rrd_history_entries // history
  1842. );
  1843. rrdset_flag_set(chart->st, RRDSET_FLAG_STORE_FIRST);
  1844. // rrdset_flag_set(chart->st, RRDSET_FLAG_DEBUG);
  1845. }
  1846. STATSD_APP_CHART_DIM *dim;
  1847. for(dim = chart->dimensions; dim ;dim = dim->next) {
  1848. if(likely(!dim->metric_pattern)) {
  1849. if (unlikely(!dim->rd))
  1850. statsd_add_dim_to_app_chart(app, chart, dim);
  1851. if (unlikely(dim->value_ptr)) {
  1852. debug(D_STATSD, "updating dimension '%s' (%s) of chart '%s' (%s) for app '%s' with value " COLLECTED_NUMBER_FORMAT, dim->name, rrddim_id(dim->rd), chart->id, rrdset_id(chart->st), app->name, *dim->value_ptr);
  1853. rrddim_set_by_pointer(chart->st, dim->rd, *dim->value_ptr);
  1854. }
  1855. }
  1856. }
  1857. rrdset_done(chart->st);
  1858. debug(D_STATSD, "completed update of chart '%s' for app '%s'", chart->id, app->name);
  1859. }
  1860. static inline void statsd_update_all_app_charts(void) {
  1861. // debug(D_STATSD, "updating app charts");
  1862. STATSD_APP *app;
  1863. for(app = statsd.apps; app ;app = app->next) {
  1864. // debug(D_STATSD, "updating charts for app '%s'", app->name);
  1865. STATSD_APP_CHART *chart;
  1866. for(chart = app->charts; chart ;chart = chart->next) {
  1867. if(unlikely(chart->dimensions_linked_count)) {
  1868. statsd_update_app_chart(app, chart);
  1869. }
  1870. }
  1871. }
  1872. // debug(D_STATSD, "completed update of app charts");
  1873. }
  1874. const char *statsd_metric_type_string(STATSD_METRIC_TYPE type) {
  1875. switch(type) {
  1876. case STATSD_METRIC_TYPE_COUNTER: return "counter";
  1877. case STATSD_METRIC_TYPE_GAUGE: return "gauge";
  1878. case STATSD_METRIC_TYPE_HISTOGRAM: return "histogram";
  1879. case STATSD_METRIC_TYPE_METER: return "meter";
  1880. case STATSD_METRIC_TYPE_SET: return "set";
  1881. case STATSD_METRIC_TYPE_DICTIONARY: return "dictionary";
  1882. case STATSD_METRIC_TYPE_TIMER: return "timer";
  1883. default: return "unknown";
  1884. }
  1885. }
  1886. static inline void statsd_flush_index_metrics(STATSD_INDEX *index, void (*flush_metric)(STATSD_METRIC *)) {
  1887. STATSD_METRIC *m;
  1888. // find the useful metrics (incremental = each time we are called, we check the new metrics only)
  1889. dfe_start_read(index->dict, m) {
  1890. // since we add new metrics at the beginning
  1891. // check for useful charts, until the point we last checked
  1892. if(unlikely(is_metric_checked(m))) break;
  1893. if(unlikely(!(m->options & STATSD_METRIC_OPTION_CHECKED_IN_APPS))) {
  1894. log_access("NEW STATSD METRIC '%s': '%s'", statsd_metric_type_string(m->type), m->name);
  1895. check_if_metric_is_for_app(index, m);
  1896. m->options |= STATSD_METRIC_OPTION_CHECKED_IN_APPS;
  1897. }
  1898. if(unlikely(!(m->options & STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED))) {
  1899. if(unlikely(statsd.private_charts >= statsd.max_private_charts_hard)) {
  1900. debug(D_STATSD, "STATSD: metric '%s' will not be charted, because the hard limit of the maximum number of charts has been reached.", m->name);
  1901. collector_info("STATSD: metric '%s' will not be charted, because the hard limit of the maximum number of charts (%zu) has been reached. Increase the number of charts by editing netdata.conf, [statsd] section.", m->name, statsd.max_private_charts_hard);
  1902. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1903. }
  1904. else {
  1905. if (simple_pattern_matches(statsd.charts_for, m->name)) {
  1906. debug(D_STATSD, "STATSD: metric '%s' will be charted.", m->name);
  1907. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1908. } else {
  1909. debug(D_STATSD, "STATSD: metric '%s' will not be charted.", m->name);
  1910. m->options &= ~STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED;
  1911. }
  1912. }
  1913. m->options |= STATSD_METRIC_OPTION_PRIVATE_CHART_CHECKED;
  1914. }
  1915. // mark it as checked
  1916. m->options |= STATSD_METRIC_OPTION_CHECKED;
  1917. // check if it is used in charts
  1918. if((m->options & (STATSD_METRIC_OPTION_PRIVATE_CHART_ENABLED|STATSD_METRIC_OPTION_USED_IN_APPS)) && !(m->options & STATSD_METRIC_OPTION_USEFUL)) {
  1919. m->options |= STATSD_METRIC_OPTION_USEFUL;
  1920. index->useful++;
  1921. m->next_useful = index->first_useful;
  1922. index->first_useful = m;
  1923. }
  1924. }
  1925. dfe_done(m);
  1926. // flush all the useful metrics
  1927. for(m = index->first_useful; m ; m = m->next_useful) {
  1928. flush_metric(m);
  1929. }
  1930. }
  1931. // --------------------------------------------------------------------------------------
  1932. // statsd main thread
  1933. static int statsd_listen_sockets_setup(void) {
  1934. return listen_sockets_setup(&statsd.sockets);
  1935. }
  1936. static void statsd_main_cleanup(void *data) {
  1937. struct netdata_static_thread *static_thread = (struct netdata_static_thread *)data;
  1938. static_thread->enabled = NETDATA_MAIN_THREAD_EXITING;
  1939. collector_info("cleaning up...");
  1940. if (statsd.collection_threads_status) {
  1941. int i;
  1942. for (i = 0; i < statsd.threads; i++) {
  1943. netdata_spinlock_lock(&statsd.collection_threads_status[i].spinlock);
  1944. if(statsd.collection_threads_status[i].running) {
  1945. collector_info("STATSD: stopping data collection thread %d...", i + 1);
  1946. netdata_thread_cancel(statsd.collection_threads_status[i].thread);
  1947. }
  1948. else {
  1949. collector_info("STATSD: data collection thread %d found stopped.", i + 1);
  1950. }
  1951. netdata_spinlock_unlock(&statsd.collection_threads_status[i].spinlock);
  1952. }
  1953. }
  1954. collector_info("STATSD: closing sockets...");
  1955. listen_sockets_close(&statsd.sockets);
  1956. // destroy the dictionaries
  1957. dictionary_destroy(statsd.gauges.dict);
  1958. dictionary_destroy(statsd.meters.dict);
  1959. dictionary_destroy(statsd.counters.dict);
  1960. dictionary_destroy(statsd.histograms.dict);
  1961. dictionary_destroy(statsd.dictionaries.dict);
  1962. dictionary_destroy(statsd.sets.dict);
  1963. dictionary_destroy(statsd.timers.dict);
  1964. collector_info("STATSD: cleanup completed.");
  1965. static_thread->enabled = NETDATA_MAIN_THREAD_EXITED;
  1966. worker_unregister();
  1967. }
  1968. #define WORKER_STATSD_FLUSH_GAUGES 0
  1969. #define WORKER_STATSD_FLUSH_COUNTERS 1
  1970. #define WORKER_STATSD_FLUSH_METERS 2
  1971. #define WORKER_STATSD_FLUSH_TIMERS 3
  1972. #define WORKER_STATSD_FLUSH_HISTOGRAMS 4
  1973. #define WORKER_STATSD_FLUSH_SETS 5
  1974. #define WORKER_STATSD_FLUSH_DICTIONARIES 6
  1975. #define WORKER_STATSD_FLUSH_STATS 7
  1976. #if WORKER_UTILIZATION_MAX_JOB_TYPES < 8
  1977. #error WORKER_UTILIZATION_MAX_JOB_TYPES has to be at least 8
  1978. #endif
  1979. void *statsd_main(void *ptr) {
  1980. worker_register("STATSDFLUSH");
  1981. worker_register_job_name(WORKER_STATSD_FLUSH_GAUGES, "gauges");
  1982. worker_register_job_name(WORKER_STATSD_FLUSH_COUNTERS, "counters");
  1983. worker_register_job_name(WORKER_STATSD_FLUSH_METERS, "meters");
  1984. worker_register_job_name(WORKER_STATSD_FLUSH_TIMERS, "timers");
  1985. worker_register_job_name(WORKER_STATSD_FLUSH_HISTOGRAMS, "histograms");
  1986. worker_register_job_name(WORKER_STATSD_FLUSH_SETS, "sets");
  1987. worker_register_job_name(WORKER_STATSD_FLUSH_DICTIONARIES, "dictionaries");
  1988. worker_register_job_name(WORKER_STATSD_FLUSH_STATS, "statistics");
  1989. netdata_thread_cleanup_push(statsd_main_cleanup, ptr);
  1990. statsd.gauges.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1991. statsd.meters.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1992. statsd.counters.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1993. statsd.histograms.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1994. statsd.dictionaries.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1995. statsd.sets.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1996. statsd.timers.dict = dictionary_create_advanced(STATSD_DICTIONARY_OPTIONS, &dictionary_stats_category_collectors, 0);
  1997. dictionary_register_insert_callback(statsd.gauges.dict, dictionary_metric_insert_callback, &statsd.gauges);
  1998. dictionary_register_insert_callback(statsd.meters.dict, dictionary_metric_insert_callback, &statsd.meters);
  1999. dictionary_register_insert_callback(statsd.counters.dict, dictionary_metric_insert_callback, &statsd.counters);
  2000. dictionary_register_insert_callback(statsd.histograms.dict, dictionary_metric_insert_callback, &statsd.histograms);
  2001. dictionary_register_insert_callback(statsd.dictionaries.dict, dictionary_metric_insert_callback, &statsd.dictionaries);
  2002. dictionary_register_insert_callback(statsd.sets.dict, dictionary_metric_insert_callback, &statsd.sets);
  2003. dictionary_register_insert_callback(statsd.timers.dict, dictionary_metric_insert_callback, &statsd.timers);
  2004. dictionary_register_delete_callback(statsd.gauges.dict, dictionary_metric_delete_callback, &statsd.gauges);
  2005. dictionary_register_delete_callback(statsd.meters.dict, dictionary_metric_delete_callback, &statsd.meters);
  2006. dictionary_register_delete_callback(statsd.counters.dict, dictionary_metric_delete_callback, &statsd.counters);
  2007. dictionary_register_delete_callback(statsd.histograms.dict, dictionary_metric_delete_callback, &statsd.histograms);
  2008. dictionary_register_delete_callback(statsd.dictionaries.dict, dictionary_metric_delete_callback, &statsd.dictionaries);
  2009. dictionary_register_delete_callback(statsd.sets.dict, dictionary_metric_delete_callback, &statsd.sets);
  2010. dictionary_register_delete_callback(statsd.timers.dict, dictionary_metric_delete_callback, &statsd.timers);
  2011. // ----------------------------------------------------------------------------------------------------------------
  2012. // statsd configuration
  2013. statsd.enabled = config_get_boolean(CONFIG_SECTION_PLUGINS, "statsd", statsd.enabled);
  2014. statsd.update_every = default_rrd_update_every;
  2015. statsd.update_every = (int)config_get_number(CONFIG_SECTION_STATSD, "update every (flushInterval)", statsd.update_every);
  2016. if(statsd.update_every < default_rrd_update_every) {
  2017. collector_error("STATSD: minimum flush interval %d given, but the minimum is the update every of netdata. Using %d", statsd.update_every, default_rrd_update_every);
  2018. statsd.update_every = default_rrd_update_every;
  2019. }
  2020. #ifdef HAVE_RECVMMSG
  2021. statsd.recvmmsg_size = (size_t)config_get_number(CONFIG_SECTION_STATSD, "udp messages to process at once", (long long)statsd.recvmmsg_size);
  2022. #endif
  2023. statsd.charts_for = simple_pattern_create(config_get(CONFIG_SECTION_STATSD, "create private charts for metrics matching", "*"), NULL, SIMPLE_PATTERN_EXACT);
  2024. statsd.max_private_charts_hard = (size_t)config_get_number(CONFIG_SECTION_STATSD, "max private charts hard limit", (long long)statsd.max_private_charts_hard);
  2025. statsd.private_charts_rrd_history_entries = (int)config_get_number(CONFIG_SECTION_STATSD, "private charts history", default_rrd_history_entries);
  2026. statsd.decimal_detail = (collected_number)config_get_number(CONFIG_SECTION_STATSD, "decimal detail", (long long int)statsd.decimal_detail);
  2027. statsd.tcp_idle_timeout = (size_t) config_get_number(CONFIG_SECTION_STATSD, "disconnect idle tcp clients after seconds", (long long int)statsd.tcp_idle_timeout);
  2028. statsd.private_charts_hidden = (unsigned int)config_get_boolean(CONFIG_SECTION_STATSD, "private charts hidden", statsd.private_charts_hidden);
  2029. statsd.histogram_percentile = (double)config_get_float(CONFIG_SECTION_STATSD, "histograms and timers percentile (percentThreshold)", statsd.histogram_percentile);
  2030. if(isless(statsd.histogram_percentile, 0) || isgreater(statsd.histogram_percentile, 100)) {
  2031. collector_error("STATSD: invalid histograms and timers percentile %0.5f given", statsd.histogram_percentile);
  2032. statsd.histogram_percentile = 95.0;
  2033. }
  2034. {
  2035. char buffer[314 + 1];
  2036. snprintfz(buffer, 314, "%0.1f%%", statsd.histogram_percentile);
  2037. statsd.histogram_percentile_str = strdupz(buffer);
  2038. }
  2039. statsd.dictionary_max_unique = config_get_number(CONFIG_SECTION_STATSD, "dictionaries max unique dimensions", statsd.dictionary_max_unique);
  2040. if(config_get_boolean(CONFIG_SECTION_STATSD, "add dimension for number of events received", 0)) {
  2041. statsd.gauges.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2042. statsd.counters.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2043. statsd.meters.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2044. statsd.sets.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2045. statsd.histograms.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2046. statsd.timers.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2047. statsd.dictionaries.default_options |= STATSD_METRIC_OPTION_CHART_DIMENSION_COUNT;
  2048. }
  2049. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on gauges (deleteGauges)", 0))
  2050. statsd.gauges.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2051. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on counters (deleteCounters)", 0))
  2052. statsd.counters.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2053. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on meters (deleteMeters)", 0))
  2054. statsd.meters.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2055. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on sets (deleteSets)", 0))
  2056. statsd.sets.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2057. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on histograms (deleteHistograms)", 0))
  2058. statsd.histograms.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2059. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on timers (deleteTimers)", 0))
  2060. statsd.timers.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2061. if(config_get_boolean(CONFIG_SECTION_STATSD, "gaps on dictionaries (deleteDictionaries)", 0))
  2062. statsd.dictionaries.default_options |= STATSD_METRIC_OPTION_SHOW_GAPS_WHEN_NOT_COLLECTED;
  2063. size_t max_sockets = (size_t)config_get_number(CONFIG_SECTION_STATSD, "statsd server max TCP sockets", (long long int)(rlimit_nofile.rlim_cur / 4));
  2064. #ifdef STATSD_MULTITHREADED
  2065. statsd.threads = (int)config_get_number(CONFIG_SECTION_STATSD, "threads", processors);
  2066. if(statsd.threads < 1) {
  2067. collector_error("STATSD: Invalid number of threads %d, using %d", statsd.threads, processors);
  2068. statsd.threads = processors;
  2069. config_set_number(CONFIG_SECTION_STATSD, "collector threads", statsd.threads);
  2070. }
  2071. #else
  2072. statsd.threads = 1;
  2073. #endif
  2074. // read custom application definitions
  2075. statsd_readdir(netdata_configured_user_config_dir, netdata_configured_stock_config_dir, "statsd.d");
  2076. // ----------------------------------------------------------------------------------------------------------------
  2077. // statsd setup
  2078. if(!statsd.enabled) goto cleanup;
  2079. statsd_listen_sockets_setup();
  2080. if(!statsd.sockets.opened) {
  2081. collector_error("STATSD: No statsd sockets to listen to. statsd will be disabled.");
  2082. goto cleanup;
  2083. }
  2084. statsd.collection_threads_status = callocz((size_t)statsd.threads, sizeof(struct collection_thread_status));
  2085. int i;
  2086. for(i = 0; i < statsd.threads ;i++) {
  2087. statsd.collection_threads_status[i].max_sockets = max_sockets / statsd.threads;
  2088. char tag[NETDATA_THREAD_TAG_MAX + 1];
  2089. snprintfz(tag, NETDATA_THREAD_TAG_MAX, "STATSD_IN[%d]", i + 1);
  2090. netdata_spinlock_init(&statsd.collection_threads_status[i].spinlock);
  2091. netdata_thread_create(&statsd.collection_threads_status[i].thread, tag, NETDATA_THREAD_OPTION_DEFAULT, statsd_collector_thread, &statsd.collection_threads_status[i]);
  2092. }
  2093. // ----------------------------------------------------------------------------------------------------------------
  2094. // statsd monitoring charts
  2095. RRDSET *st_metrics = NULL;
  2096. RRDDIM *rd_metrics_gauge = NULL;
  2097. RRDDIM *rd_metrics_counter = NULL;
  2098. RRDDIM *rd_metrics_timer = NULL;
  2099. RRDDIM *rd_metrics_meter = NULL;
  2100. RRDDIM *rd_metrics_histogram = NULL;
  2101. RRDDIM *rd_metrics_set = NULL;
  2102. RRDDIM *rd_metrics_dictionary = NULL;
  2103. RRDSET *st_useful_metrics = NULL;
  2104. RRDDIM *rd_useful_metrics_gauge = NULL;
  2105. RRDDIM *rd_useful_metrics_counter = NULL;
  2106. RRDDIM *rd_useful_metrics_timer = NULL;
  2107. RRDDIM *rd_useful_metrics_meter = NULL;
  2108. RRDDIM *rd_useful_metrics_histogram = NULL;
  2109. RRDDIM *rd_useful_metrics_set = NULL;
  2110. RRDDIM *rd_useful_metrics_dictionary = NULL;
  2111. RRDSET *st_events = NULL;
  2112. RRDDIM *rd_events_gauge = NULL;
  2113. RRDDIM *rd_events_counter = NULL;
  2114. RRDDIM *rd_events_timer = NULL;
  2115. RRDDIM *rd_events_meter = NULL;
  2116. RRDDIM *rd_events_histogram = NULL;
  2117. RRDDIM *rd_events_set = NULL;
  2118. RRDDIM *rd_events_dictionary = NULL;
  2119. RRDDIM *rd_events_unknown = NULL;
  2120. RRDDIM *rd_events_errors = NULL;
  2121. RRDSET *st_reads = NULL;
  2122. RRDDIM *rd_reads_tcp = NULL;
  2123. RRDDIM *rd_reads_udp = NULL;
  2124. RRDSET *st_bytes = NULL;
  2125. RRDDIM *rd_bytes_tcp = NULL;
  2126. RRDDIM *rd_bytes_udp = NULL;
  2127. RRDSET *st_packets = NULL;
  2128. RRDDIM *rd_packets_tcp = NULL;
  2129. RRDDIM *rd_packets_udp = NULL;
  2130. RRDSET *st_tcp_connects = NULL;
  2131. RRDDIM *rd_tcp_connects = NULL;
  2132. RRDDIM *rd_tcp_disconnects = NULL;
  2133. RRDSET *st_tcp_connected = NULL;
  2134. RRDDIM *rd_tcp_connected = NULL;
  2135. RRDSET *st_pcharts = NULL;
  2136. RRDDIM *rd_pcharts = NULL;
  2137. if(global_statistics_enabled) {
  2138. st_metrics = rrdset_create_localhost(
  2139. "netdata",
  2140. "statsd_metrics",
  2141. NULL,
  2142. "statsd",
  2143. NULL,
  2144. "Metrics in the netdata statsd database",
  2145. "metrics",
  2146. PLUGIN_STATSD_NAME,
  2147. "stats",
  2148. 132010,
  2149. statsd.update_every,
  2150. RRDSET_TYPE_STACKED);
  2151. rd_metrics_gauge = rrddim_add(st_metrics, "gauges", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2152. rd_metrics_counter = rrddim_add(st_metrics, "counters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2153. rd_metrics_timer = rrddim_add(st_metrics, "timers", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2154. rd_metrics_meter = rrddim_add(st_metrics, "meters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2155. rd_metrics_histogram = rrddim_add(st_metrics, "histograms", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2156. rd_metrics_set = rrddim_add(st_metrics, "sets", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2157. rd_metrics_dictionary = rrddim_add(st_metrics, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2158. st_useful_metrics = rrdset_create_localhost(
  2159. "netdata",
  2160. "statsd_useful_metrics",
  2161. NULL,
  2162. "statsd",
  2163. NULL,
  2164. "Useful metrics in the netdata statsd database",
  2165. "metrics",
  2166. PLUGIN_STATSD_NAME,
  2167. "stats",
  2168. 132010,
  2169. statsd.update_every,
  2170. RRDSET_TYPE_STACKED);
  2171. rd_useful_metrics_gauge = rrddim_add(st_useful_metrics, "gauges", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2172. rd_useful_metrics_counter = rrddim_add(st_useful_metrics, "counters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2173. rd_useful_metrics_timer = rrddim_add(st_useful_metrics, "timers", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2174. rd_useful_metrics_meter = rrddim_add(st_useful_metrics, "meters", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2175. rd_useful_metrics_histogram = rrddim_add(st_useful_metrics, "histograms", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2176. rd_useful_metrics_set = rrddim_add(st_useful_metrics, "sets", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2177. rd_useful_metrics_dictionary = rrddim_add(st_useful_metrics, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2178. st_events = rrdset_create_localhost(
  2179. "netdata",
  2180. "statsd_events",
  2181. NULL,
  2182. "statsd",
  2183. NULL,
  2184. "Events processed by the netdata statsd server",
  2185. "events/s",
  2186. PLUGIN_STATSD_NAME,
  2187. "stats",
  2188. 132011,
  2189. statsd.update_every,
  2190. RRDSET_TYPE_STACKED);
  2191. rd_events_gauge = rrddim_add(st_events, "gauges", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2192. rd_events_counter = rrddim_add(st_events, "counters", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2193. rd_events_timer = rrddim_add(st_events, "timers", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2194. rd_events_meter = rrddim_add(st_events, "meters", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2195. rd_events_histogram = rrddim_add(st_events, "histograms", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2196. rd_events_set = rrddim_add(st_events, "sets", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2197. rd_events_dictionary = rrddim_add(st_events, "dictionaries", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2198. rd_events_unknown = rrddim_add(st_events, "unknown", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2199. rd_events_errors = rrddim_add(st_events, "errors", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2200. st_reads = rrdset_create_localhost(
  2201. "netdata",
  2202. "statsd_reads",
  2203. NULL,
  2204. "statsd",
  2205. NULL,
  2206. "Read operations made by the netdata statsd server",
  2207. "reads/s",
  2208. PLUGIN_STATSD_NAME,
  2209. "stats",
  2210. 132012,
  2211. statsd.update_every,
  2212. RRDSET_TYPE_STACKED);
  2213. rd_reads_tcp = rrddim_add(st_reads, "tcp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2214. rd_reads_udp = rrddim_add(st_reads, "udp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2215. st_bytes = rrdset_create_localhost(
  2216. "netdata",
  2217. "statsd_bytes",
  2218. NULL,
  2219. "statsd",
  2220. NULL,
  2221. "Bytes read by the netdata statsd server",
  2222. "kilobits/s",
  2223. PLUGIN_STATSD_NAME,
  2224. "stats",
  2225. 132013,
  2226. statsd.update_every,
  2227. RRDSET_TYPE_STACKED);
  2228. rd_bytes_tcp = rrddim_add(st_bytes, "tcp", NULL, 8, BITS_IN_A_KILOBIT, RRD_ALGORITHM_INCREMENTAL);
  2229. rd_bytes_udp = rrddim_add(st_bytes, "udp", NULL, 8, BITS_IN_A_KILOBIT, RRD_ALGORITHM_INCREMENTAL);
  2230. st_packets = rrdset_create_localhost(
  2231. "netdata",
  2232. "statsd_packets",
  2233. NULL,
  2234. "statsd",
  2235. NULL,
  2236. "Network packets processed by the netdata statsd server",
  2237. "packets/s",
  2238. PLUGIN_STATSD_NAME,
  2239. "stats",
  2240. 132014,
  2241. statsd.update_every,
  2242. RRDSET_TYPE_STACKED);
  2243. rd_packets_tcp = rrddim_add(st_packets, "tcp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2244. rd_packets_udp = rrddim_add(st_packets, "udp", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2245. st_tcp_connects = rrdset_create_localhost(
  2246. "netdata",
  2247. "tcp_connects",
  2248. NULL,
  2249. "statsd",
  2250. NULL,
  2251. "statsd server TCP connects and disconnects",
  2252. "events",
  2253. PLUGIN_STATSD_NAME,
  2254. "stats",
  2255. 132015,
  2256. statsd.update_every,
  2257. RRDSET_TYPE_LINE);
  2258. rd_tcp_connects = rrddim_add(st_tcp_connects, "connects", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
  2259. rd_tcp_disconnects = rrddim_add(st_tcp_connects, "disconnects", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
  2260. st_tcp_connected = rrdset_create_localhost(
  2261. "netdata",
  2262. "tcp_connected",
  2263. NULL,
  2264. "statsd",
  2265. NULL,
  2266. "statsd server TCP connected sockets",
  2267. "sockets",
  2268. PLUGIN_STATSD_NAME,
  2269. "stats",
  2270. 132016,
  2271. statsd.update_every,
  2272. RRDSET_TYPE_LINE);
  2273. rd_tcp_connected = rrddim_add(st_tcp_connected, "connected", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2274. st_pcharts = rrdset_create_localhost(
  2275. "netdata",
  2276. "private_charts",
  2277. NULL,
  2278. "statsd",
  2279. NULL,
  2280. "Private metric charts created by the netdata statsd server",
  2281. "charts",
  2282. PLUGIN_STATSD_NAME,
  2283. "stats",
  2284. 132020,
  2285. statsd.update_every,
  2286. RRDSET_TYPE_AREA);
  2287. rd_pcharts = rrddim_add(st_pcharts, "charts", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
  2288. }
  2289. // ----------------------------------------------------------------------------------------------------------------
  2290. // statsd thread to turn metrics into charts
  2291. usec_t step = statsd.update_every * USEC_PER_SEC;
  2292. heartbeat_t hb;
  2293. heartbeat_init(&hb);
  2294. while(service_running(SERVICE_COLLECTORS)) {
  2295. worker_is_idle();
  2296. heartbeat_next(&hb, step);
  2297. worker_is_busy(WORKER_STATSD_FLUSH_GAUGES);
  2298. statsd_flush_index_metrics(&statsd.gauges, statsd_flush_gauge);
  2299. worker_is_busy(WORKER_STATSD_FLUSH_COUNTERS);
  2300. statsd_flush_index_metrics(&statsd.counters, statsd_flush_counter);
  2301. worker_is_busy(WORKER_STATSD_FLUSH_METERS);
  2302. statsd_flush_index_metrics(&statsd.meters, statsd_flush_meter);
  2303. worker_is_busy(WORKER_STATSD_FLUSH_TIMERS);
  2304. statsd_flush_index_metrics(&statsd.timers, statsd_flush_timer);
  2305. worker_is_busy(WORKER_STATSD_FLUSH_HISTOGRAMS);
  2306. statsd_flush_index_metrics(&statsd.histograms, statsd_flush_histogram);
  2307. worker_is_busy(WORKER_STATSD_FLUSH_SETS);
  2308. statsd_flush_index_metrics(&statsd.sets, statsd_flush_set);
  2309. worker_is_busy(WORKER_STATSD_FLUSH_DICTIONARIES);
  2310. statsd_flush_index_metrics(&statsd.dictionaries,statsd_flush_dictionary);
  2311. worker_is_busy(WORKER_STATSD_FLUSH_STATS);
  2312. statsd_update_all_app_charts();
  2313. if(unlikely(!service_running(SERVICE_COLLECTORS)))
  2314. break;
  2315. if(global_statistics_enabled) {
  2316. rrddim_set_by_pointer(st_metrics, rd_metrics_gauge, (collected_number)statsd.gauges.metrics);
  2317. rrddim_set_by_pointer(st_metrics, rd_metrics_counter, (collected_number)statsd.counters.metrics);
  2318. rrddim_set_by_pointer(st_metrics, rd_metrics_timer, (collected_number)statsd.timers.metrics);
  2319. rrddim_set_by_pointer(st_metrics, rd_metrics_meter, (collected_number)statsd.meters.metrics);
  2320. rrddim_set_by_pointer(st_metrics, rd_metrics_histogram, (collected_number)statsd.histograms.metrics);
  2321. rrddim_set_by_pointer(st_metrics, rd_metrics_set, (collected_number)statsd.sets.metrics);
  2322. rrddim_set_by_pointer(st_metrics, rd_metrics_dictionary, (collected_number)statsd.dictionaries.metrics);
  2323. rrdset_done(st_metrics);
  2324. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_gauge, (collected_number)statsd.gauges.useful);
  2325. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_counter, (collected_number)statsd.counters.useful);
  2326. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_timer, (collected_number)statsd.timers.useful);
  2327. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_meter, (collected_number)statsd.meters.useful);
  2328. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_histogram, (collected_number)statsd.histograms.useful);
  2329. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_set, (collected_number)statsd.sets.useful);
  2330. rrddim_set_by_pointer(st_useful_metrics, rd_useful_metrics_dictionary, (collected_number)statsd.dictionaries.useful);
  2331. rrdset_done(st_useful_metrics);
  2332. rrddim_set_by_pointer(st_events, rd_events_gauge, (collected_number)statsd.gauges.events);
  2333. rrddim_set_by_pointer(st_events, rd_events_counter, (collected_number)statsd.counters.events);
  2334. rrddim_set_by_pointer(st_events, rd_events_timer, (collected_number)statsd.timers.events);
  2335. rrddim_set_by_pointer(st_events, rd_events_meter, (collected_number)statsd.meters.events);
  2336. rrddim_set_by_pointer(st_events, rd_events_histogram, (collected_number)statsd.histograms.events);
  2337. rrddim_set_by_pointer(st_events, rd_events_set, (collected_number)statsd.sets.events);
  2338. rrddim_set_by_pointer(st_events, rd_events_dictionary, (collected_number)statsd.dictionaries.events);
  2339. rrddim_set_by_pointer(st_events, rd_events_unknown, (collected_number)statsd.unknown_types);
  2340. rrddim_set_by_pointer(st_events, rd_events_errors, (collected_number)statsd.socket_errors);
  2341. rrdset_done(st_events);
  2342. rrddim_set_by_pointer(st_reads, rd_reads_tcp, (collected_number)statsd.tcp_socket_reads);
  2343. rrddim_set_by_pointer(st_reads, rd_reads_udp, (collected_number)statsd.udp_socket_reads);
  2344. rrdset_done(st_reads);
  2345. rrddim_set_by_pointer(st_bytes, rd_bytes_tcp, (collected_number)statsd.tcp_bytes_read);
  2346. rrddim_set_by_pointer(st_bytes, rd_bytes_udp, (collected_number)statsd.udp_bytes_read);
  2347. rrdset_done(st_bytes);
  2348. rrddim_set_by_pointer(st_packets, rd_packets_tcp, (collected_number)statsd.tcp_packets_received);
  2349. rrddim_set_by_pointer(st_packets, rd_packets_udp, (collected_number)statsd.udp_packets_received);
  2350. rrdset_done(st_packets);
  2351. rrddim_set_by_pointer(st_tcp_connects, rd_tcp_connects, (collected_number)statsd.tcp_socket_connects);
  2352. rrddim_set_by_pointer(st_tcp_connects, rd_tcp_disconnects, (collected_number)statsd.tcp_socket_disconnects);
  2353. rrdset_done(st_tcp_connects);
  2354. rrddim_set_by_pointer(st_tcp_connected, rd_tcp_connected, (collected_number)statsd.tcp_socket_connected);
  2355. rrdset_done(st_tcp_connected);
  2356. rrddim_set_by_pointer(st_pcharts, rd_pcharts, (collected_number)statsd.private_charts);
  2357. rrdset_done(st_pcharts);
  2358. }
  2359. }
  2360. cleanup: ; // added semi-colon to prevent older gcc error: label at end of compound statement
  2361. netdata_thread_cleanup_pop(1);
  2362. return NULL;
  2363. }