12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168 |
- // SPDX-License-Identifier: GPL-3.0-or-later
- #include "common.h"
- #include "buildinfo.h"
- #include "static_threads.h"
- #if defined(ENV32BIT)
- #warning COMPILING 32BIT NETDATA
- #endif
- bool unittest_running = false;
- int netdata_zero_metrics_enabled;
- int netdata_anonymous_statistics_enabled;
- int libuv_worker_threads = MIN_LIBUV_WORKER_THREADS;
- bool ieee754_doubles = false;
- time_t netdata_start_time = 0;
- struct netdata_static_thread *static_threads;
- struct config netdata_config = {
- .first_section = NULL,
- .last_section = NULL,
- .mutex = NETDATA_MUTEX_INITIALIZER,
- .index = {
- .avl_tree = {
- .root = NULL,
- .compar = appconfig_section_compare
- },
- .rwlock = AVL_LOCK_INITIALIZER
- }
- };
- typedef struct service_thread {
- pid_t tid;
- SERVICE_THREAD_TYPE type;
- SERVICE_TYPE services;
- char name[NETDATA_THREAD_NAME_MAX + 1];
- bool stop_immediately;
- bool cancelled;
- union {
- netdata_thread_t netdata_thread;
- uv_thread_t uv_thread;
- };
- force_quit_t force_quit_callback;
- request_quit_t request_quit_callback;
- void *data;
- } SERVICE_THREAD;
- struct service_globals {
- SPINLOCK lock;
- Pvoid_t pid_judy;
- } service_globals = {
- .pid_judy = NULL,
- };
- SERVICE_THREAD *service_register(SERVICE_THREAD_TYPE thread_type, request_quit_t request_quit_callback, force_quit_t force_quit_callback, void *data, bool update __maybe_unused) {
- SERVICE_THREAD *sth = NULL;
- pid_t tid = gettid();
- spinlock_lock(&service_globals.lock);
- Pvoid_t *PValue = JudyLIns(&service_globals.pid_judy, tid, PJE0);
- if(!*PValue) {
- sth = callocz(1, sizeof(SERVICE_THREAD));
- sth->tid = tid;
- sth->type = thread_type;
- sth->request_quit_callback = request_quit_callback;
- sth->force_quit_callback = force_quit_callback;
- sth->data = data;
- os_thread_get_current_name_np(sth->name);
- *PValue = sth;
- switch(thread_type) {
- default:
- case SERVICE_THREAD_TYPE_NETDATA:
- sth->netdata_thread = netdata_thread_self();
- break;
- case SERVICE_THREAD_TYPE_EVENT_LOOP:
- case SERVICE_THREAD_TYPE_LIBUV:
- sth->uv_thread = uv_thread_self();
- break;
- }
- }
- else {
- sth = *PValue;
- }
- spinlock_unlock(&service_globals.lock);
- return sth;
- }
- void service_exits(void) {
- pid_t tid = gettid();
- spinlock_lock(&service_globals.lock);
- Pvoid_t *PValue = JudyLGet(service_globals.pid_judy, tid, PJE0);
- if(PValue) {
- freez(*PValue);
- JudyLDel(&service_globals.pid_judy, tid, PJE0);
- }
- spinlock_unlock(&service_globals.lock);
- }
- bool service_running(SERVICE_TYPE service) {
- static __thread SERVICE_THREAD *sth = NULL;
- if(unlikely(!sth))
- sth = service_register(SERVICE_THREAD_TYPE_NETDATA, NULL, NULL, NULL, false);
- sth->services |= service;
- return !(sth->stop_immediately || netdata_exit);
- }
- void service_signal_exit(SERVICE_TYPE service) {
- spinlock_lock(&service_globals.lock);
- Pvoid_t *PValue;
- Word_t tid = 0;
- bool first = true;
- while((PValue = JudyLFirstThenNext(service_globals.pid_judy, &tid, &first))) {
- SERVICE_THREAD *sth = *PValue;
- if((sth->services & service)) {
- sth->stop_immediately = true;
- if(sth->request_quit_callback) {
- spinlock_unlock(&service_globals.lock);
- sth->request_quit_callback(sth->data);
- spinlock_lock(&service_globals.lock);
- }
- }
- }
- spinlock_unlock(&service_globals.lock);
- }
- static void service_to_buffer(BUFFER *wb, SERVICE_TYPE service) {
- if(service & SERVICE_MAINTENANCE)
- buffer_strcat(wb, "MAINTENANCE ");
- if(service & SERVICE_COLLECTORS)
- buffer_strcat(wb, "COLLECTORS ");
- if(service & SERVICE_REPLICATION)
- buffer_strcat(wb, "REPLICATION ");
- if(service & ABILITY_DATA_QUERIES)
- buffer_strcat(wb, "DATA_QUERIES ");
- if(service & ABILITY_WEB_REQUESTS)
- buffer_strcat(wb, "WEB_REQUESTS ");
- if(service & SERVICE_WEB_SERVER)
- buffer_strcat(wb, "WEB_SERVER ");
- if(service & SERVICE_ACLK)
- buffer_strcat(wb, "ACLK ");
- if(service & SERVICE_HEALTH)
- buffer_strcat(wb, "HEALTH ");
- if(service & SERVICE_STREAMING)
- buffer_strcat(wb, "STREAMING ");
- if(service & ABILITY_STREAMING_CONNECTIONS)
- buffer_strcat(wb, "STREAMING_CONNECTIONS ");
- if(service & SERVICE_CONTEXT)
- buffer_strcat(wb, "CONTEXT ");
- if(service & SERVICE_ANALYTICS)
- buffer_strcat(wb, "ANALYTICS ");
- if(service & SERVICE_EXPORTERS)
- buffer_strcat(wb, "EXPORTERS ");
- if(service & SERVICE_HTTPD)
- buffer_strcat(wb, "HTTPD ");
- }
- static bool service_wait_exit(SERVICE_TYPE service, usec_t timeout_ut) {
- BUFFER *service_list = buffer_create(1024, NULL);
- BUFFER *thread_list = buffer_create(1024, NULL);
- usec_t started_ut = now_monotonic_usec(), ended_ut;
- size_t running;
- SERVICE_TYPE running_services = 0;
- // cancel the threads
- running = 0;
- running_services = 0;
- {
- buffer_flush(thread_list);
- spinlock_lock(&service_globals.lock);
- Pvoid_t *PValue;
- Word_t tid = 0;
- bool first = true;
- while((PValue = JudyLFirstThenNext(service_globals.pid_judy, &tid, &first))) {
- SERVICE_THREAD *sth = *PValue;
- if(sth->services & service && sth->tid != gettid() && !sth->cancelled) {
- sth->cancelled = true;
- switch(sth->type) {
- default:
- case SERVICE_THREAD_TYPE_NETDATA:
- netdata_thread_cancel(sth->netdata_thread);
- break;
- case SERVICE_THREAD_TYPE_EVENT_LOOP:
- case SERVICE_THREAD_TYPE_LIBUV:
- break;
- }
- if(running)
- buffer_strcat(thread_list, ", ");
- buffer_sprintf(thread_list, "'%s' (%d)", sth->name, sth->tid);
- running++;
- running_services |= sth->services & service;
- if(sth->force_quit_callback) {
- spinlock_unlock(&service_globals.lock);
- sth->force_quit_callback(sth->data);
- spinlock_lock(&service_globals.lock);
- continue;
- }
- }
- }
- spinlock_unlock(&service_globals.lock);
- }
- service_signal_exit(service);
- // signal them to stop
- size_t last_running = 0;
- size_t stale_time_ut = 0;
- usec_t sleep_ut = 50 * USEC_PER_MS;
- size_t log_countdown_ut = sleep_ut;
- do {
- if(running != last_running)
- stale_time_ut = 0;
- last_running = running;
- running = 0;
- running_services = 0;
- buffer_flush(thread_list);
- spinlock_lock(&service_globals.lock);
- Pvoid_t *PValue;
- Word_t tid = 0;
- bool first = true;
- while((PValue = JudyLFirstThenNext(service_globals.pid_judy, &tid, &first))) {
- SERVICE_THREAD *sth = *PValue;
- if(sth->services & service && sth->tid != gettid()) {
- if(running)
- buffer_strcat(thread_list, ", ");
- buffer_sprintf(thread_list, "'%s' (%d)", sth->name, sth->tid);
- running_services |= sth->services & service;
- running++;
- }
- }
- spinlock_unlock(&service_globals.lock);
- if(running) {
- log_countdown_ut -= (log_countdown_ut >= sleep_ut) ? sleep_ut : log_countdown_ut;
- if(log_countdown_ut == 0 || running != last_running) {
- log_countdown_ut = 20 * sleep_ut;
- buffer_flush(service_list);
- service_to_buffer(service_list, running_services);
- netdata_log_info("SERVICE CONTROL: waiting for the following %zu services [ %s] to exit: %s",
- running, buffer_tostring(service_list),
- running <= 10 ? buffer_tostring(thread_list) : "");
- }
- sleep_usec(sleep_ut);
- stale_time_ut += sleep_ut;
- }
- ended_ut = now_monotonic_usec();
- } while(running && (ended_ut - started_ut < timeout_ut || stale_time_ut < timeout_ut));
- if(running) {
- buffer_flush(service_list);
- service_to_buffer(service_list, running_services);
- netdata_log_info("SERVICE CONTROL: "
- "the following %zu service(s) [ %s] take too long to exit: %s; "
- "giving up on them...",
- running, buffer_tostring(service_list),
- buffer_tostring(thread_list));
- }
- buffer_free(thread_list);
- buffer_free(service_list);
- return (running == 0);
- }
- #define delta_shutdown_time(msg) \
- { \
- usec_t now_ut = now_monotonic_usec(); \
- if(prev_msg) \
- netdata_log_info("NETDATA SHUTDOWN: in %7llu ms, %s%s - next: %s", (now_ut - last_ut) / USEC_PER_MS, (timeout)?"(TIMEOUT) ":"", prev_msg, msg); \
- else \
- netdata_log_info("NETDATA SHUTDOWN: next: %s", msg); \
- last_ut = now_ut; \
- prev_msg = msg; \
- timeout = false; \
- }
- void web_client_cache_destroy(void);
- void netdata_cleanup_and_exit(int ret) {
- usec_t started_ut = now_monotonic_usec();
- usec_t last_ut = started_ut;
- const char *prev_msg = NULL;
- bool timeout = false;
- error_log_limit_unlimited();
- netdata_log_info("NETDATA SHUTDOWN: initializing shutdown with code %d...", ret);
- send_statistics("EXIT", ret?"ERROR":"OK","-");
- delta_shutdown_time("create shutdown file");
- char agent_crash_file[FILENAME_MAX + 1];
- char agent_incomplete_shutdown_file[FILENAME_MAX + 1];
- snprintfz(agent_crash_file, FILENAME_MAX, "%s/.agent_crash", netdata_configured_varlib_dir);
- snprintfz(agent_incomplete_shutdown_file, FILENAME_MAX, "%s/.agent_incomplete_shutdown", netdata_configured_varlib_dir);
- (void) rename(agent_crash_file, agent_incomplete_shutdown_file);
- #ifdef ENABLE_DBENGINE
- if(dbengine_enabled) {
- delta_shutdown_time("dbengine exit mode");
- for (size_t tier = 0; tier < storage_tiers; tier++)
- rrdeng_exit_mode(multidb_ctx[tier]);
- }
- #endif
- delta_shutdown_time("close webrtc connections");
- webrtc_close_all_connections();
- delta_shutdown_time("disable maintenance, new queries, new web requests, new streaming connections and aclk");
- service_signal_exit(
- SERVICE_MAINTENANCE
- | ABILITY_DATA_QUERIES
- | ABILITY_WEB_REQUESTS
- | ABILITY_STREAMING_CONNECTIONS
- | SERVICE_ACLK
- | SERVICE_ACLKSYNC
- );
- delta_shutdown_time("stop replication, exporters, health and web servers threads");
- timeout = !service_wait_exit(
- SERVICE_EXPORTERS
- | SERVICE_HEALTH
- | SERVICE_WEB_SERVER
- | SERVICE_HTTPD
- , 3 * USEC_PER_SEC);
- delta_shutdown_time("stop collectors and streaming threads");
- timeout = !service_wait_exit(
- SERVICE_COLLECTORS
- | SERVICE_STREAMING
- , 3 * USEC_PER_SEC);
- delta_shutdown_time("stop replication threads");
- timeout = !service_wait_exit(
- SERVICE_REPLICATION // replication has to be stopped after STREAMING, because it cleans up ARAL
- , 3 * USEC_PER_SEC);
- delta_shutdown_time("disable ML detection and training threads");
- ml_stop_threads();
- ml_fini();
- delta_shutdown_time("stop context thread");
- timeout = !service_wait_exit(
- SERVICE_CONTEXT
- , 3 * USEC_PER_SEC);
- delta_shutdown_time("stop maintenance thread");
- timeout = !service_wait_exit(
- SERVICE_MAINTENANCE
- , 3 * USEC_PER_SEC);
- delta_shutdown_time("clear web client cache");
- web_client_cache_destroy();
- delta_shutdown_time("clean rrdhost database");
- rrdhost_cleanup_all();
- delta_shutdown_time("prepare metasync shutdown");
- metadata_sync_shutdown_prepare();
- delta_shutdown_time("stop aclk threads");
- timeout = !service_wait_exit(
- SERVICE_ACLK
- , 3 * USEC_PER_SEC);
- delta_shutdown_time("stop all remaining worker threads");
- timeout = !service_wait_exit(~0, 10 * USEC_PER_SEC);
- delta_shutdown_time("cancel main threads");
- cancel_main_threads();
- if(!ret) {
- // exit cleanly
- #ifdef ENABLE_DBENGINE
- if(dbengine_enabled) {
- delta_shutdown_time("flush dbengine tiers");
- for (size_t tier = 0; tier < storage_tiers; tier++)
- rrdeng_prepare_exit(multidb_ctx[tier]);
- }
- #endif
- // free the database
- delta_shutdown_time("stop collection for all hosts");
- // rrdhost_free_all();
- rrd_finalize_collection_for_all_hosts();
- delta_shutdown_time("stop metasync threads");
- metadata_sync_shutdown();
- #ifdef ENABLE_DBENGINE
- if(dbengine_enabled) {
- delta_shutdown_time("wait for dbengine collectors to finish");
- size_t running = 1;
- while(running) {
- running = 0;
- for (size_t tier = 0; tier < storage_tiers; tier++)
- running += rrdeng_collectors_running(multidb_ctx[tier]);
- if(running) {
- error_limit_static_thread_var(erl, 1, 100 * USEC_PER_MS);
- error_limit(&erl, "waiting for %zu collectors to finish", running);
- // sleep_usec(100 * USEC_PER_MS);
- }
- }
- delta_shutdown_time("wait for dbengine main cache to finish flushing");
- while (pgc_hot_and_dirty_entries(main_cache)) {
- pgc_flush_all_hot_and_dirty_pages(main_cache, PGC_SECTION_ALL);
- sleep_usec(100 * USEC_PER_MS);
- }
- delta_shutdown_time("stop dbengine tiers");
- for (size_t tier = 0; tier < storage_tiers; tier++)
- rrdeng_exit(multidb_ctx[tier]);
- }
- #endif
- }
- delta_shutdown_time("close SQL context db");
- sql_close_context_database();
- delta_shutdown_time("closed SQL main db");
- sql_close_database();
- // unlink the pid
- if(pidfile[0]) {
- delta_shutdown_time("remove pid file");
- if(unlink(pidfile) != 0)
- netdata_log_error("EXIT: cannot unlink pidfile '%s'.", pidfile);
- }
- #ifdef ENABLE_HTTPS
- delta_shutdown_time("free openssl structures");
- netdata_ssl_cleanup();
- #endif
- delta_shutdown_time("remove incomplete shutdown file");
- (void) unlink(agent_incomplete_shutdown_file);
- delta_shutdown_time("exit");
- usec_t ended_ut = now_monotonic_usec();
- netdata_log_info("NETDATA SHUTDOWN: completed in %llu ms - netdata is now exiting - bye bye...", (ended_ut - started_ut) / USEC_PER_MS);
- exit(ret);
- }
- void web_server_threading_selection(void) {
- web_server_mode = web_server_mode_id(config_get(CONFIG_SECTION_WEB, "mode", web_server_mode_name(web_server_mode)));
- int static_threaded = (web_server_mode == WEB_SERVER_MODE_STATIC_THREADED);
- int i;
- for (i = 0; static_threads[i].name; i++) {
- if (static_threads[i].start_routine == socket_listen_main_static_threaded)
- static_threads[i].enabled = static_threaded;
- }
- }
- int make_dns_decision(const char *section_name, const char *config_name, const char *default_value, SIMPLE_PATTERN *p)
- {
- char *value = config_get(section_name,config_name,default_value);
- if(!strcmp("yes",value))
- return 1;
- if(!strcmp("no",value))
- return 0;
- if(strcmp("heuristic",value))
- netdata_log_error("Invalid configuration option '%s' for '%s'/'%s'. Valid options are 'yes', 'no' and 'heuristic'. Proceeding with 'heuristic'",
- value, section_name, config_name);
- return simple_pattern_is_potential_name(p);
- }
- void web_server_config_options(void)
- {
- web_client_timeout =
- (int)config_get_number(CONFIG_SECTION_WEB, "disconnect idle clients after seconds", web_client_timeout);
- web_client_first_request_timeout =
- (int)config_get_number(CONFIG_SECTION_WEB, "timeout for first request", web_client_first_request_timeout);
- web_client_streaming_rate_t =
- config_get_number(CONFIG_SECTION_WEB, "accept a streaming request every seconds", web_client_streaming_rate_t);
- respect_web_browser_do_not_track_policy =
- config_get_boolean(CONFIG_SECTION_WEB, "respect do not track policy", respect_web_browser_do_not_track_policy);
- web_x_frame_options = config_get(CONFIG_SECTION_WEB, "x-frame-options response header", "");
- if(!*web_x_frame_options)
- web_x_frame_options = NULL;
- web_allow_connections_from =
- simple_pattern_create(config_get(CONFIG_SECTION_WEB, "allow connections from", "localhost *"),
- NULL, SIMPLE_PATTERN_EXACT, true);
- web_allow_connections_dns =
- make_dns_decision(CONFIG_SECTION_WEB, "allow connections by dns", "heuristic", web_allow_connections_from);
- web_allow_dashboard_from =
- simple_pattern_create(config_get(CONFIG_SECTION_WEB, "allow dashboard from", "localhost *"),
- NULL, SIMPLE_PATTERN_EXACT, true);
- web_allow_dashboard_dns =
- make_dns_decision(CONFIG_SECTION_WEB, "allow dashboard by dns", "heuristic", web_allow_dashboard_from);
- web_allow_badges_from =
- simple_pattern_create(config_get(CONFIG_SECTION_WEB, "allow badges from", "*"), NULL, SIMPLE_PATTERN_EXACT,
- true);
- web_allow_badges_dns =
- make_dns_decision(CONFIG_SECTION_WEB, "allow badges by dns", "heuristic", web_allow_badges_from);
- web_allow_registry_from =
- simple_pattern_create(config_get(CONFIG_SECTION_REGISTRY, "allow from", "*"), NULL, SIMPLE_PATTERN_EXACT,
- true);
- web_allow_registry_dns = make_dns_decision(CONFIG_SECTION_REGISTRY, "allow by dns", "heuristic",
- web_allow_registry_from);
- web_allow_streaming_from = simple_pattern_create(config_get(CONFIG_SECTION_WEB, "allow streaming from", "*"),
- NULL, SIMPLE_PATTERN_EXACT, true);
- web_allow_streaming_dns = make_dns_decision(CONFIG_SECTION_WEB, "allow streaming by dns", "heuristic",
- web_allow_streaming_from);
- // Note the default is not heuristic, the wildcards could match DNS but the intent is ip-addresses.
- web_allow_netdataconf_from = simple_pattern_create(config_get(CONFIG_SECTION_WEB, "allow netdata.conf from",
- "localhost fd* 10.* 192.168.* 172.16.* 172.17.* 172.18.*"
- " 172.19.* 172.20.* 172.21.* 172.22.* 172.23.* 172.24.*"
- " 172.25.* 172.26.* 172.27.* 172.28.* 172.29.* 172.30.*"
- " 172.31.* UNKNOWN"), NULL, SIMPLE_PATTERN_EXACT,
- true);
- web_allow_netdataconf_dns =
- make_dns_decision(CONFIG_SECTION_WEB, "allow netdata.conf by dns", "no", web_allow_netdataconf_from);
- web_allow_mgmt_from =
- simple_pattern_create(config_get(CONFIG_SECTION_WEB, "allow management from", "localhost"),
- NULL, SIMPLE_PATTERN_EXACT, true);
- web_allow_mgmt_dns =
- make_dns_decision(CONFIG_SECTION_WEB, "allow management by dns","heuristic",web_allow_mgmt_from);
- web_enable_gzip = config_get_boolean(CONFIG_SECTION_WEB, "enable gzip compression", web_enable_gzip);
- char *s = config_get(CONFIG_SECTION_WEB, "gzip compression strategy", "default");
- if(!strcmp(s, "default"))
- web_gzip_strategy = Z_DEFAULT_STRATEGY;
- else if(!strcmp(s, "filtered"))
- web_gzip_strategy = Z_FILTERED;
- else if(!strcmp(s, "huffman only"))
- web_gzip_strategy = Z_HUFFMAN_ONLY;
- else if(!strcmp(s, "rle"))
- web_gzip_strategy = Z_RLE;
- else if(!strcmp(s, "fixed"))
- web_gzip_strategy = Z_FIXED;
- else {
- netdata_log_error("Invalid compression strategy '%s'. Valid strategies are 'default', 'filtered', 'huffman only', 'rle' and 'fixed'. Proceeding with 'default'.", s);
- web_gzip_strategy = Z_DEFAULT_STRATEGY;
- }
- web_gzip_level = (int)config_get_number(CONFIG_SECTION_WEB, "gzip compression level", 3);
- if(web_gzip_level < 1) {
- netdata_log_error("Invalid compression level %d. Valid levels are 1 (fastest) to 9 (best ratio). Proceeding with level 1 (fastest compression).", web_gzip_level);
- web_gzip_level = 1;
- }
- else if(web_gzip_level > 9) {
- netdata_log_error("Invalid compression level %d. Valid levels are 1 (fastest) to 9 (best ratio). Proceeding with level 9 (best compression).", web_gzip_level);
- web_gzip_level = 9;
- }
- }
- // killpid kills pid with SIGTERM.
- int killpid(pid_t pid) {
- int ret;
- netdata_log_debug(D_EXIT, "Request to kill pid %d", pid);
- errno = 0;
- ret = kill(pid, SIGTERM);
- if (ret == -1) {
- switch(errno) {
- case ESRCH:
- // We wanted the process to exit so just let the caller handle.
- return ret;
- case EPERM:
- netdata_log_error("Cannot kill pid %d, but I do not have enough permissions.", pid);
- break;
- default:
- netdata_log_error("Cannot kill pid %d, but I received an error.", pid);
- break;
- }
- }
- return ret;
- }
- static void set_nofile_limit(struct rlimit *rl) {
- // get the num files allowed
- if(getrlimit(RLIMIT_NOFILE, rl) != 0) {
- netdata_log_error("getrlimit(RLIMIT_NOFILE) failed");
- return;
- }
- netdata_log_info("resources control: allowed file descriptors: soft = %zu, max = %zu",
- (size_t) rl->rlim_cur, (size_t) rl->rlim_max);
- // make the soft/hard limits equal
- rl->rlim_cur = rl->rlim_max;
- if (setrlimit(RLIMIT_NOFILE, rl) != 0) {
- netdata_log_error("setrlimit(RLIMIT_NOFILE, { %zu, %zu }) failed", (size_t)rl->rlim_cur, (size_t)rl->rlim_max);
- }
- // sanity check to make sure we have enough file descriptors available to open
- if (getrlimit(RLIMIT_NOFILE, rl) != 0) {
- netdata_log_error("getrlimit(RLIMIT_NOFILE) failed");
- return;
- }
- if (rl->rlim_cur < 1024)
- netdata_log_error("Number of open file descriptors allowed for this process is too low (RLIMIT_NOFILE=%zu)", (size_t)rl->rlim_cur);
- }
- void cancel_main_threads() {
- error_log_limit_unlimited();
- int i, found = 0;
- usec_t max = 5 * USEC_PER_SEC, step = 100000;
- for (i = 0; static_threads[i].name != NULL ; i++) {
- if (static_threads[i].enabled == NETDATA_MAIN_THREAD_RUNNING) {
- if (static_threads[i].thread) {
- netdata_log_info("EXIT: Stopping main thread: %s", static_threads[i].name);
- netdata_thread_cancel(*static_threads[i].thread);
- } else {
- netdata_log_info("EXIT: No thread running (marking as EXITED): %s", static_threads[i].name);
- static_threads[i].enabled = NETDATA_MAIN_THREAD_EXITED;
- }
- found++;
- }
- }
- netdata_exit = 1;
- while(found && max > 0) {
- max -= step;
- netdata_log_info("Waiting %d threads to finish...", found);
- sleep_usec(step);
- found = 0;
- for (i = 0; static_threads[i].name != NULL ; i++) {
- if (static_threads[i].enabled != NETDATA_MAIN_THREAD_EXITED)
- found++;
- }
- }
- if(found) {
- for (i = 0; static_threads[i].name != NULL ; i++) {
- if (static_threads[i].enabled != NETDATA_MAIN_THREAD_EXITED)
- netdata_log_error("Main thread %s takes too long to exit. Giving up...", static_threads[i].name);
- }
- }
- else
- netdata_log_info("All threads finished.");
- for (i = 0; static_threads[i].name != NULL ; i++)
- freez(static_threads[i].thread);
- freez(static_threads);
- }
- struct option_def option_definitions[] = {
- // opt description arg name default value
- { 'c', "Configuration file to load.", "filename", CONFIG_DIR "/" CONFIG_FILENAME},
- { 'D', "Do not fork. Run in the foreground.", NULL, "run in the background"},
- { 'd', "Fork. Run in the background.", NULL, "run in the background"},
- { 'h', "Display this help message.", NULL, NULL},
- { 'P', "File to save a pid while running.", "filename", "do not save pid to a file"},
- { 'i', "The IP address to listen to.", "IP", "all IP addresses IPv4 and IPv6"},
- { 'p', "API/Web port to use.", "port", "19999"},
- { 's', "Prefix for /proc and /sys (for containers).", "path", "no prefix"},
- { 't', "The internal clock of netdata.", "seconds", "1"},
- { 'u', "Run as user.", "username", "netdata"},
- { 'v', "Print netdata version and exit.", NULL, NULL},
- { 'V', "Print netdata version and exit.", NULL, NULL},
- { 'W', "See Advanced options below.", "options", NULL},
- };
- int help(int exitcode) {
- FILE *stream;
- if(exitcode == 0)
- stream = stdout;
- else
- stream = stderr;
- int num_opts = sizeof(option_definitions) / sizeof(struct option_def);
- int i;
- int max_len_arg = 0;
- // Compute maximum argument length
- for( i = 0; i < num_opts; i++ ) {
- if(option_definitions[i].arg_name) {
- int len_arg = (int)strlen(option_definitions[i].arg_name);
- if(len_arg > max_len_arg) max_len_arg = len_arg;
- }
- }
- if(max_len_arg > 30) max_len_arg = 30;
- if(max_len_arg < 20) max_len_arg = 20;
- fprintf(stream, "%s", "\n"
- " ^\n"
- " |.-. .-. .-. .-. . netdata \n"
- " | '-' '-' '-' '-' real-time performance monitoring, done right! \n"
- " +----+-----+-----+-----+-----+-----+-----+-----+-----+-----+-----+-----+--->\n"
- "\n"
- " Copyright (C) 2016-2022, Netdata, Inc. <info@netdata.cloud>\n"
- " Released under GNU General Public License v3 or later.\n"
- " All rights reserved.\n"
- "\n"
- " Home Page : https://netdata.cloud\n"
- " Source Code: https://github.com/netdata/netdata\n"
- " Docs : https://learn.netdata.cloud\n"
- " Support : https://github.com/netdata/netdata/issues\n"
- " License : https://github.com/netdata/netdata/blob/master/LICENSE.md\n"
- "\n"
- " Twitter : https://twitter.com/linuxnetdata\n"
- " LinkedIn : https://linkedin.com/company/netdata-cloud/\n"
- " Facebook : https://facebook.com/linuxnetdata/\n"
- "\n"
- "\n"
- );
- fprintf(stream, " SYNOPSIS: netdata [options]\n");
- fprintf(stream, "\n");
- fprintf(stream, " Options:\n\n");
- // Output options description.
- for( i = 0; i < num_opts; i++ ) {
- fprintf(stream, " -%c %-*s %s", option_definitions[i].val, max_len_arg, option_definitions[i].arg_name ? option_definitions[i].arg_name : "", option_definitions[i].description);
- if(option_definitions[i].default_value) {
- fprintf(stream, "\n %c %-*s Default: %s\n", ' ', max_len_arg, "", option_definitions[i].default_value);
- } else {
- fprintf(stream, "\n");
- }
- fprintf(stream, "\n");
- }
- fprintf(stream, "\n Advanced options:\n\n"
- " -W stacksize=N Set the stacksize (in bytes).\n\n"
- " -W debug_flags=N Set runtime tracing to debug.log.\n\n"
- " -W unittest Run internal unittests and exit.\n\n"
- " -W sqlite-check Check metadata database integrity and exit.\n\n"
- " -W sqlite-fix Check metadata database integrity, fix if needed and exit.\n\n"
- " -W sqlite-compact Reclaim metadata database unused space and exit.\n\n"
- #ifdef ENABLE_DBENGINE
- " -W createdataset=N Create a DB engine dataset of N seconds and exit.\n\n"
- " -W stresstest=A,B,C,D,E,F,G\n"
- " Run a DB engine stress test for A seconds,\n"
- " with B writers and C readers, with a ramp up\n"
- " time of D seconds for writers, a page cache\n"
- " size of E MiB, an optional disk space limit\n"
- " of F MiB, G libuv workers (default 16) and exit.\n\n"
- #endif
- " -W set section option value\n"
- " set netdata.conf option from the command line.\n\n"
- " -W buildinfo Print the version, the configure options,\n"
- " a list of optional features, and whether they\n"
- " are enabled or not.\n\n"
- " -W buildinfojson Print the version, the configure options,\n"
- " a list of optional features, and whether they\n"
- " are enabled or not, in JSON format.\n\n"
- " -W simple-pattern pattern string\n"
- " Check if string matches pattern and exit.\n\n"
- " -W \"claim -token=TOKEN -rooms=ROOM1,ROOM2\"\n"
- " Claim the agent to the workspace rooms pointed to by TOKEN and ROOM*.\n\n"
- );
- fprintf(stream, "\n Signals netdata handles:\n\n"
- " - HUP Close and reopen log files.\n"
- " - USR1 Save internal DB to disk.\n"
- " - USR2 Reload health configuration.\n"
- "\n"
- );
- fflush(stream);
- return exitcode;
- }
- #ifdef ENABLE_HTTPS
- static void security_init(){
- char filename[FILENAME_MAX + 1];
- snprintfz(filename, FILENAME_MAX, "%s/ssl/key.pem",netdata_configured_user_config_dir);
- netdata_ssl_security_key = config_get(CONFIG_SECTION_WEB, "ssl key", filename);
- snprintfz(filename, FILENAME_MAX, "%s/ssl/cert.pem",netdata_configured_user_config_dir);
- netdata_ssl_security_cert = config_get(CONFIG_SECTION_WEB, "ssl certificate", filename);
- tls_version = config_get(CONFIG_SECTION_WEB, "tls version", "1.3");
- tls_ciphers = config_get(CONFIG_SECTION_WEB, "tls ciphers", "none");
- netdata_ssl_initialize_openssl();
- }
- #endif
- static void log_init(void) {
- char filename[FILENAME_MAX + 1];
- snprintfz(filename, FILENAME_MAX, "%s/debug.log", netdata_configured_log_dir);
- stdout_filename = config_get(CONFIG_SECTION_LOGS, "debug", filename);
- snprintfz(filename, FILENAME_MAX, "%s/error.log", netdata_configured_log_dir);
- stderr_filename = config_get(CONFIG_SECTION_LOGS, "error", filename);
- snprintfz(filename, FILENAME_MAX, "%s/collector.log", netdata_configured_log_dir);
- stdcollector_filename = config_get(CONFIG_SECTION_LOGS, "collector", filename);
- snprintfz(filename, FILENAME_MAX, "%s/access.log", netdata_configured_log_dir);
- stdaccess_filename = config_get(CONFIG_SECTION_LOGS, "access", filename);
- snprintfz(filename, FILENAME_MAX, "%s/health.log", netdata_configured_log_dir);
- stdhealth_filename = config_get(CONFIG_SECTION_LOGS, "health", filename);
- #ifdef ENABLE_ACLK
- aclklog_enabled = config_get_boolean(CONFIG_SECTION_CLOUD, "conversation log", CONFIG_BOOLEAN_NO);
- if (aclklog_enabled) {
- snprintfz(filename, FILENAME_MAX, "%s/aclk.log", netdata_configured_log_dir);
- aclklog_filename = config_get(CONFIG_SECTION_CLOUD, "conversation log file", filename);
- }
- #endif
- char deffacility[8];
- snprintfz(deffacility,7,"%s","daemon");
- facility_log = config_get(CONFIG_SECTION_LOGS, "facility", deffacility);
- error_log_throttle_period = config_get_number(CONFIG_SECTION_LOGS, "errors flood protection period", error_log_throttle_period);
- error_log_errors_per_period = (unsigned long)config_get_number(CONFIG_SECTION_LOGS, "errors to trigger flood protection", (long long int)error_log_errors_per_period);
- error_log_errors_per_period_backup = error_log_errors_per_period;
- setenv("NETDATA_ERRORS_THROTTLE_PERIOD", config_get(CONFIG_SECTION_LOGS, "errors flood protection period" , ""), 1);
- setenv("NETDATA_ERRORS_PER_PERIOD", config_get(CONFIG_SECTION_LOGS, "errors to trigger flood protection", ""), 1);
- }
- char *initialize_lock_directory_path(char *prefix)
- {
- char filename[FILENAME_MAX + 1];
- snprintfz(filename, FILENAME_MAX, "%s/lock", prefix);
- return config_get(CONFIG_SECTION_DIRECTORIES, "lock", filename);
- }
- static void backwards_compatible_config() {
- // move [global] options to the [web] section
- config_move(CONFIG_SECTION_GLOBAL, "http port listen backlog",
- CONFIG_SECTION_WEB, "listen backlog");
- config_move(CONFIG_SECTION_GLOBAL, "bind socket to IP",
- CONFIG_SECTION_WEB, "bind to");
- config_move(CONFIG_SECTION_GLOBAL, "bind to",
- CONFIG_SECTION_WEB, "bind to");
- config_move(CONFIG_SECTION_GLOBAL, "port",
- CONFIG_SECTION_WEB, "default port");
- config_move(CONFIG_SECTION_GLOBAL, "default port",
- CONFIG_SECTION_WEB, "default port");
- config_move(CONFIG_SECTION_GLOBAL, "disconnect idle web clients after seconds",
- CONFIG_SECTION_WEB, "disconnect idle clients after seconds");
- config_move(CONFIG_SECTION_GLOBAL, "respect web browser do not track policy",
- CONFIG_SECTION_WEB, "respect do not track policy");
- config_move(CONFIG_SECTION_GLOBAL, "web x-frame-options header",
- CONFIG_SECTION_WEB, "x-frame-options response header");
- config_move(CONFIG_SECTION_GLOBAL, "enable web responses gzip compression",
- CONFIG_SECTION_WEB, "enable gzip compression");
- config_move(CONFIG_SECTION_GLOBAL, "web compression strategy",
- CONFIG_SECTION_WEB, "gzip compression strategy");
- config_move(CONFIG_SECTION_GLOBAL, "web compression level",
- CONFIG_SECTION_WEB, "gzip compression level");
- config_move(CONFIG_SECTION_GLOBAL, "config directory",
- CONFIG_SECTION_DIRECTORIES, "config");
- config_move(CONFIG_SECTION_GLOBAL, "stock config directory",
- CONFIG_SECTION_DIRECTORIES, "stock config");
- config_move(CONFIG_SECTION_GLOBAL, "log directory",
- CONFIG_SECTION_DIRECTORIES, "log");
- config_move(CONFIG_SECTION_GLOBAL, "web files directory",
- CONFIG_SECTION_DIRECTORIES, "web");
- config_move(CONFIG_SECTION_GLOBAL, "cache directory",
- CONFIG_SECTION_DIRECTORIES, "cache");
- config_move(CONFIG_SECTION_GLOBAL, "lib directory",
- CONFIG_SECTION_DIRECTORIES, "lib");
- config_move(CONFIG_SECTION_GLOBAL, "home directory",
- CONFIG_SECTION_DIRECTORIES, "home");
- config_move(CONFIG_SECTION_GLOBAL, "lock directory",
- CONFIG_SECTION_DIRECTORIES, "lock");
- config_move(CONFIG_SECTION_GLOBAL, "plugins directory",
- CONFIG_SECTION_DIRECTORIES, "plugins");
- config_move(CONFIG_SECTION_HEALTH, "health configuration directory",
- CONFIG_SECTION_DIRECTORIES, "health config");
- config_move(CONFIG_SECTION_HEALTH, "stock health configuration directory",
- CONFIG_SECTION_DIRECTORIES, "stock health config");
- config_move(CONFIG_SECTION_REGISTRY, "registry db directory",
- CONFIG_SECTION_DIRECTORIES, "registry");
- config_move(CONFIG_SECTION_GLOBAL, "debug log",
- CONFIG_SECTION_LOGS, "debug");
- config_move(CONFIG_SECTION_GLOBAL, "error log",
- CONFIG_SECTION_LOGS, "error");
- config_move(CONFIG_SECTION_GLOBAL, "access log",
- CONFIG_SECTION_LOGS, "access");
- config_move(CONFIG_SECTION_GLOBAL, "facility log",
- CONFIG_SECTION_LOGS, "facility");
- config_move(CONFIG_SECTION_GLOBAL, "errors flood protection period",
- CONFIG_SECTION_LOGS, "errors flood protection period");
- config_move(CONFIG_SECTION_GLOBAL, "errors to trigger flood protection",
- CONFIG_SECTION_LOGS, "errors to trigger flood protection");
- config_move(CONFIG_SECTION_GLOBAL, "debug flags",
- CONFIG_SECTION_LOGS, "debug flags");
- config_move(CONFIG_SECTION_GLOBAL, "TZ environment variable",
- CONFIG_SECTION_ENV_VARS, "TZ");
- config_move(CONFIG_SECTION_PLUGINS, "PATH environment variable",
- CONFIG_SECTION_ENV_VARS, "PATH");
- config_move(CONFIG_SECTION_PLUGINS, "PYTHONPATH environment variable",
- CONFIG_SECTION_ENV_VARS, "PYTHONPATH");
- config_move(CONFIG_SECTION_STATSD, "enabled",
- CONFIG_SECTION_PLUGINS, "statsd");
- config_move(CONFIG_SECTION_GLOBAL, "memory mode",
- CONFIG_SECTION_DB, "mode");
- config_move(CONFIG_SECTION_GLOBAL, "history",
- CONFIG_SECTION_DB, "retention");
- config_move(CONFIG_SECTION_GLOBAL, "update every",
- CONFIG_SECTION_DB, "update every");
- config_move(CONFIG_SECTION_GLOBAL, "page cache size",
- CONFIG_SECTION_DB, "dbengine page cache size MB");
- config_move(CONFIG_SECTION_DB, "page cache size",
- CONFIG_SECTION_DB, "dbengine page cache size MB");
- config_move(CONFIG_SECTION_GLOBAL, "page cache uses malloc",
- CONFIG_SECTION_DB, "dbengine page cache with malloc");
- config_move(CONFIG_SECTION_DB, "page cache with malloc",
- CONFIG_SECTION_DB, "dbengine page cache with malloc");
- config_move(CONFIG_SECTION_GLOBAL, "dbengine disk space",
- CONFIG_SECTION_DB, "dbengine disk space MB");
- config_move(CONFIG_SECTION_GLOBAL, "dbengine multihost disk space",
- CONFIG_SECTION_DB, "dbengine multihost disk space MB");
- config_move(CONFIG_SECTION_GLOBAL, "memory deduplication (ksm)",
- CONFIG_SECTION_DB, "memory deduplication (ksm)");
- config_move(CONFIG_SECTION_GLOBAL, "dbengine page fetch timeout",
- CONFIG_SECTION_DB, "dbengine page fetch timeout secs");
- config_move(CONFIG_SECTION_GLOBAL, "dbengine page fetch retries",
- CONFIG_SECTION_DB, "dbengine page fetch retries");
- config_move(CONFIG_SECTION_GLOBAL, "dbengine extent pages",
- CONFIG_SECTION_DB, "dbengine pages per extent");
- config_move(CONFIG_SECTION_GLOBAL, "cleanup obsolete charts after seconds",
- CONFIG_SECTION_DB, "cleanup obsolete charts after secs");
- config_move(CONFIG_SECTION_GLOBAL, "gap when lost iterations above",
- CONFIG_SECTION_DB, "gap when lost iterations above");
- config_move(CONFIG_SECTION_GLOBAL, "cleanup orphan hosts after seconds",
- CONFIG_SECTION_DB, "cleanup orphan hosts after secs");
- config_move(CONFIG_SECTION_GLOBAL, "delete obsolete charts files",
- CONFIG_SECTION_DB, "delete obsolete charts files");
- config_move(CONFIG_SECTION_GLOBAL, "delete orphan hosts files",
- CONFIG_SECTION_DB, "delete orphan hosts files");
- config_move(CONFIG_SECTION_GLOBAL, "enable zero metrics",
- CONFIG_SECTION_DB, "enable zero metrics");
- }
- static void get_netdata_configured_variables() {
- backwards_compatible_config();
- // ------------------------------------------------------------------------
- // get the hostname
- char buf[HOSTNAME_MAX + 1];
- if(gethostname(buf, HOSTNAME_MAX) == -1){
- netdata_log_error("Cannot get machine hostname.");
- }
- netdata_configured_hostname = config_get(CONFIG_SECTION_GLOBAL, "hostname", buf);
- netdata_log_debug(D_OPTIONS, "hostname set to '%s'", netdata_configured_hostname);
- // ------------------------------------------------------------------------
- // get default database update frequency
- default_rrd_update_every = (int) config_get_number(CONFIG_SECTION_DB, "update every", UPDATE_EVERY);
- if(default_rrd_update_every < 1 || default_rrd_update_every > 600) {
- netdata_log_error("Invalid data collection frequency (update every) %d given. Defaulting to %d.", default_rrd_update_every, UPDATE_EVERY);
- default_rrd_update_every = UPDATE_EVERY;
- config_set_number(CONFIG_SECTION_DB, "update every", default_rrd_update_every);
- }
- // ------------------------------------------------------------------------
- // get default memory mode for the database
- {
- const char *mode = config_get(CONFIG_SECTION_DB, "mode", rrd_memory_mode_name(default_rrd_memory_mode));
- default_rrd_memory_mode = rrd_memory_mode_id(mode);
- if(strcmp(mode, rrd_memory_mode_name(default_rrd_memory_mode)) != 0) {
- netdata_log_error("Invalid memory mode '%s' given. Using '%s'", mode, rrd_memory_mode_name(default_rrd_memory_mode));
- config_set(CONFIG_SECTION_DB, "mode", rrd_memory_mode_name(default_rrd_memory_mode));
- }
- }
- // ------------------------------------------------------------------------
- // get default database size
- if(default_rrd_memory_mode != RRD_MEMORY_MODE_DBENGINE && default_rrd_memory_mode != RRD_MEMORY_MODE_NONE) {
- default_rrd_history_entries = (int)config_get_number(
- CONFIG_SECTION_DB, "retention",
- align_entries_to_pagesize(default_rrd_memory_mode, RRD_DEFAULT_HISTORY_ENTRIES));
- long h = align_entries_to_pagesize(default_rrd_memory_mode, default_rrd_history_entries);
- if (h != default_rrd_history_entries) {
- config_set_number(CONFIG_SECTION_DB, "retention", h);
- default_rrd_history_entries = (int)h;
- }
- }
- // ------------------------------------------------------------------------
- // get system paths
- netdata_configured_user_config_dir = config_get(CONFIG_SECTION_DIRECTORIES, "config", netdata_configured_user_config_dir);
- netdata_configured_stock_config_dir = config_get(CONFIG_SECTION_DIRECTORIES, "stock config", netdata_configured_stock_config_dir);
- netdata_configured_log_dir = config_get(CONFIG_SECTION_DIRECTORIES, "log", netdata_configured_log_dir);
- netdata_configured_web_dir = config_get(CONFIG_SECTION_DIRECTORIES, "web", netdata_configured_web_dir);
- netdata_configured_cache_dir = config_get(CONFIG_SECTION_DIRECTORIES, "cache", netdata_configured_cache_dir);
- netdata_configured_varlib_dir = config_get(CONFIG_SECTION_DIRECTORIES, "lib", netdata_configured_varlib_dir);
- char *env_home=getenv("HOME");
- netdata_configured_home_dir = config_get(CONFIG_SECTION_DIRECTORIES, "home", env_home?env_home:netdata_configured_home_dir);
- netdata_configured_lock_dir = initialize_lock_directory_path(netdata_configured_varlib_dir);
- {
- pluginsd_initialize_plugin_directories();
- netdata_configured_primary_plugins_dir = plugin_directories[PLUGINSD_STOCK_PLUGINS_DIRECTORY_PATH];
- }
- #ifdef ENABLE_DBENGINE
- // ------------------------------------------------------------------------
- // get default Database Engine page cache size in MiB
- default_rrdeng_page_cache_mb = (int) config_get_number(CONFIG_SECTION_DB, "dbengine page cache size MB", default_rrdeng_page_cache_mb);
- default_rrdeng_extent_cache_mb = (int) config_get_number(CONFIG_SECTION_DB, "dbengine extent cache size MB", default_rrdeng_extent_cache_mb);
- db_engine_journal_check = config_get_boolean(CONFIG_SECTION_DB, "dbengine enable journal integrity check", CONFIG_BOOLEAN_NO);
- if(default_rrdeng_extent_cache_mb < 0)
- default_rrdeng_extent_cache_mb = 0;
- if(default_rrdeng_page_cache_mb < RRDENG_MIN_PAGE_CACHE_SIZE_MB) {
- netdata_log_error("Invalid page cache size %d given. Defaulting to %d.", default_rrdeng_page_cache_mb, RRDENG_MIN_PAGE_CACHE_SIZE_MB);
- default_rrdeng_page_cache_mb = RRDENG_MIN_PAGE_CACHE_SIZE_MB;
- config_set_number(CONFIG_SECTION_DB, "dbengine page cache size MB", default_rrdeng_page_cache_mb);
- }
- // ------------------------------------------------------------------------
- // get default Database Engine disk space quota in MiB
- default_rrdeng_disk_quota_mb = (int) config_get_number(CONFIG_SECTION_DB, "dbengine disk space MB", default_rrdeng_disk_quota_mb);
- if(default_rrdeng_disk_quota_mb < RRDENG_MIN_DISK_SPACE_MB) {
- netdata_log_error("Invalid dbengine disk space %d given. Defaulting to %d.", default_rrdeng_disk_quota_mb, RRDENG_MIN_DISK_SPACE_MB);
- default_rrdeng_disk_quota_mb = RRDENG_MIN_DISK_SPACE_MB;
- config_set_number(CONFIG_SECTION_DB, "dbengine disk space MB", default_rrdeng_disk_quota_mb);
- }
- default_multidb_disk_quota_mb = (int) config_get_number(CONFIG_SECTION_DB, "dbengine multihost disk space MB", compute_multidb_diskspace());
- if(default_multidb_disk_quota_mb < RRDENG_MIN_DISK_SPACE_MB) {
- netdata_log_error("Invalid multidb disk space %d given. Defaulting to %d.", default_multidb_disk_quota_mb, default_rrdeng_disk_quota_mb);
- default_multidb_disk_quota_mb = default_rrdeng_disk_quota_mb;
- config_set_number(CONFIG_SECTION_DB, "dbengine multihost disk space MB", default_multidb_disk_quota_mb);
- }
- #else
- if (default_rrd_memory_mode == RRD_MEMORY_MODE_DBENGINE) {
- error_report("RRD_MEMORY_MODE_DBENGINE is not supported in this platform. The agent will use db mode 'save' instead.");
- default_rrd_memory_mode = RRD_MEMORY_MODE_SAVE;
- }
- #endif
- // ------------------------------------------------------------------------
- netdata_configured_host_prefix = config_get(CONFIG_SECTION_GLOBAL, "host access prefix", "");
- verify_netdata_host_prefix();
- // --------------------------------------------------------------------
- // get KSM settings
- #ifdef MADV_MERGEABLE
- enable_ksm = config_get_boolean(CONFIG_SECTION_DB, "memory deduplication (ksm)", enable_ksm);
- #endif
- // --------------------------------------------------------------------
- // metric correlations
- enable_metric_correlations = config_get_boolean(CONFIG_SECTION_GLOBAL, "enable metric correlations", enable_metric_correlations);
- default_metric_correlations_method = weights_string_to_method(config_get(
- CONFIG_SECTION_GLOBAL, "metric correlations method",
- weights_method_to_string(default_metric_correlations_method)));
- // --------------------------------------------------------------------
- rrdset_free_obsolete_time_s = config_get_number(CONFIG_SECTION_DB, "cleanup obsolete charts after secs", rrdset_free_obsolete_time_s);
- // Current chart locking and invalidation scheme doesn't prevent Netdata from segmentation faults if a short
- // cleanup delay is set. Extensive stress tests showed that 10 seconds is quite a safe delay. Look at
- // https://github.com/netdata/netdata/pull/11222#issuecomment-868367920 for more information.
- if (rrdset_free_obsolete_time_s < 10) {
- rrdset_free_obsolete_time_s = 10;
- netdata_log_info("The \"cleanup obsolete charts after seconds\" option was set to 10 seconds.");
- config_set_number(CONFIG_SECTION_DB, "cleanup obsolete charts after secs", rrdset_free_obsolete_time_s);
- }
- gap_when_lost_iterations_above = (int)config_get_number(CONFIG_SECTION_DB, "gap when lost iterations above", gap_when_lost_iterations_above);
- if (gap_when_lost_iterations_above < 1) {
- gap_when_lost_iterations_above = 1;
- config_set_number(CONFIG_SECTION_DB, "gap when lost iterations above", gap_when_lost_iterations_above);
- }
- gap_when_lost_iterations_above += 2;
- // --------------------------------------------------------------------
- // get various system parameters
- get_system_HZ();
- get_system_cpus_uncached();
- get_system_pid_max();
- }
- static void post_conf_load(char **user)
- {
- // --------------------------------------------------------------------
- // get the user we should run
- // IMPORTANT: this is required before web_files_uid()
- if(getuid() == 0) {
- *user = config_get(CONFIG_SECTION_GLOBAL, "run as user", NETDATA_USER);
- }
- else {
- struct passwd *passwd = getpwuid(getuid());
- *user = config_get(CONFIG_SECTION_GLOBAL, "run as user", (passwd && passwd->pw_name)?passwd->pw_name:"");
- }
- }
- static bool load_netdata_conf(char *filename, char overwrite_used, char **user) {
- errno = 0;
- int ret = 0;
- if(filename && *filename) {
- ret = config_load(filename, overwrite_used, NULL);
- if(!ret)
- netdata_log_error("CONFIG: cannot load config file '%s'.", filename);
- }
- else {
- filename = strdupz_path_subpath(netdata_configured_user_config_dir, "netdata.conf");
- ret = config_load(filename, overwrite_used, NULL);
- if(!ret) {
- netdata_log_info("CONFIG: cannot load user config '%s'. Will try the stock version.", filename);
- freez(filename);
- filename = strdupz_path_subpath(netdata_configured_stock_config_dir, "netdata.conf");
- ret = config_load(filename, overwrite_used, NULL);
- if(!ret)
- netdata_log_info("CONFIG: cannot load stock config '%s'. Running with internal defaults.", filename);
- }
- freez(filename);
- }
- post_conf_load(user);
- return ret;
- }
- // coverity[ +tainted_string_sanitize_content : arg-0 ]
- static inline void coverity_remove_taint(char *s)
- {
- (void)s;
- }
- int get_system_info(struct rrdhost_system_info *system_info, bool log) {
- char *script;
- script = mallocz(sizeof(char) * (strlen(netdata_configured_primary_plugins_dir) + strlen("system-info.sh") + 2));
- sprintf(script, "%s/%s", netdata_configured_primary_plugins_dir, "system-info.sh");
- if (unlikely(access(script, R_OK) != 0)) {
- netdata_log_error("System info script %s not found.",script);
- freez(script);
- return 1;
- }
- pid_t command_pid;
- FILE *fp_child_input;
- FILE *fp_child_output = netdata_popen(script, &command_pid, &fp_child_input);
- if(fp_child_output) {
- char line[200 + 1];
- // Removed the double strlens, if the Coverity tainted string warning reappears I'll revert.
- // One time init code, but I'm curious about the warning...
- while (fgets(line, 200, fp_child_output) != NULL) {
- char *value=line;
- while (*value && *value != '=') value++;
- if (*value=='=') {
- *value='\0';
- value++;
- char *end = value;
- while (*end && *end != '\n') end++;
- *end = '\0'; // Overwrite newline if present
- coverity_remove_taint(line); // I/O is controlled result of system_info.sh - not tainted
- coverity_remove_taint(value);
- if(unlikely(rrdhost_set_system_info_variable(system_info, line, value))) {
- netdata_log_error("Unexpected environment variable %s=%s", line, value);
- }
- else {
- if(log)
- netdata_log_info("%s=%s", line, value);
- setenv(line, value, 1);
- }
- }
- }
- netdata_pclose(fp_child_input, fp_child_output, command_pid);
- }
- freez(script);
- return 0;
- }
- void set_silencers_filename() {
- char filename[FILENAME_MAX + 1];
- snprintfz(filename, FILENAME_MAX, "%s/health.silencers.json", netdata_configured_varlib_dir);
- silencers_filename = config_get(CONFIG_SECTION_HEALTH, "silencers file", filename);
- }
- /* Any config setting that can be accessed without a default value i.e. configget(...,...,NULL) *MUST*
- be set in this procedure to be called in all the relevant code paths.
- */
- #define delta_startup_time(msg) \
- { \
- usec_t now_ut = now_monotonic_usec(); \
- if(prev_msg) \
- netdata_log_info("NETDATA STARTUP: in %7llu ms, %s - next: %s", (now_ut - last_ut) / USEC_PER_MS, prev_msg, msg); \
- else \
- netdata_log_info("NETDATA STARTUP: next: %s", msg); \
- last_ut = now_ut; \
- prev_msg = msg; \
- }
- int buffer_unittest(void);
- int pgc_unittest(void);
- int mrg_unittest(void);
- int julytest(void);
- int pluginsd_parser_unittest(void);
- void replication_initialize(void);
- int main(int argc, char **argv) {
- // initialize the system clocks
- clocks_init();
- netdata_start_time = now_realtime_sec();
- usec_t started_ut = now_monotonic_usec();
- usec_t last_ut = started_ut;
- const char *prev_msg = NULL;
- // Initialize stderror avoiding coredump when netdata_log_info() or netdata_log_error() is called
- stderror = stderr;
- int i;
- int config_loaded = 0;
- int dont_fork = 0;
- bool close_open_fds = true;
- size_t default_stacksize;
- char *user = NULL;
- static_threads = static_threads_get();
- netdata_ready = false;
- // set the name for logging
- program_name = "netdata";
- if (argc > 1 && strcmp(argv[1], SPAWN_SERVER_COMMAND_LINE_ARGUMENT) == 0) {
- // don't run netdata, this is the spawn server
- spawn_server();
- exit(0);
- }
- // parse options
- {
- int num_opts = sizeof(option_definitions) / sizeof(struct option_def);
- char optstring[(num_opts * 2) + 1];
- int string_i = 0;
- for( i = 0; i < num_opts; i++ ) {
- optstring[string_i] = option_definitions[i].val;
- string_i++;
- if(option_definitions[i].arg_name) {
- optstring[string_i] = ':';
- string_i++;
- }
- }
- // terminate optstring
- optstring[string_i] ='\0';
- optstring[(num_opts *2)] ='\0';
- int opt;
- while( (opt = getopt(argc, argv, optstring)) != -1 ) {
- switch(opt) {
- case 'c':
- if(!load_netdata_conf(optarg, 1, &user)) {
- netdata_log_error("Cannot load configuration file %s.", optarg);
- return 1;
- }
- else {
- netdata_log_debug(D_OPTIONS, "Configuration loaded from %s.", optarg);
- load_cloud_conf(1);
- config_loaded = 1;
- }
- break;
- case 'D':
- dont_fork = 1;
- break;
- case 'd':
- dont_fork = 0;
- break;
- case 'h':
- return help(0);
- case 'i':
- config_set(CONFIG_SECTION_WEB, "bind to", optarg);
- break;
- case 'P':
- strncpy(pidfile, optarg, FILENAME_MAX);
- pidfile[FILENAME_MAX] = '\0';
- break;
- case 'p':
- config_set(CONFIG_SECTION_GLOBAL, "default port", optarg);
- break;
- case 's':
- config_set(CONFIG_SECTION_GLOBAL, "host access prefix", optarg);
- break;
- case 't':
- config_set(CONFIG_SECTION_GLOBAL, "update every", optarg);
- break;
- case 'u':
- config_set(CONFIG_SECTION_GLOBAL, "run as user", optarg);
- break;
- case 'v':
- case 'V':
- printf("%s %s\n", program_name, program_version);
- return 0;
- case 'W':
- {
- char* stacksize_string = "stacksize=";
- char* debug_flags_string = "debug_flags=";
- char* claim_string = "claim";
- #ifdef ENABLE_DBENGINE
- char* createdataset_string = "createdataset=";
- char* stresstest_string = "stresstest=";
- #endif
- if(strcmp(optarg, "sqlite-check") == 0) {
- sql_init_database(DB_CHECK_INTEGRITY, 0);
- return 0;
- }
- if(strcmp(optarg, "sqlite-fix") == 0) {
- sql_init_database(DB_CHECK_FIX_DB, 0);
- return 0;
- }
- if(strcmp(optarg, "sqlite-compact") == 0) {
- sql_init_database(DB_CHECK_RECLAIM_SPACE, 0);
- return 0;
- }
- if(strcmp(optarg, "unittest") == 0) {
- unittest_running = true;
- if (pluginsd_parser_unittest())
- return 1;
- if (unit_test_static_threads())
- return 1;
- if (unit_test_buffer())
- return 1;
- if (unit_test_str2ld())
- return 1;
- if (buffer_unittest())
- return 1;
- if (unit_test_bitmaps())
- return 1;
- // No call to load the config file on this code-path
- post_conf_load(&user);
- get_netdata_configured_variables();
- default_rrd_update_every = 1;
- default_rrd_memory_mode = RRD_MEMORY_MODE_RAM;
- default_health_enabled = 0;
- storage_tiers = 1;
- registry_init();
- if(rrd_init("unittest", NULL, true)) {
- fprintf(stderr, "rrd_init failed for unittest\n");
- return 1;
- }
- default_rrdpush_enabled = 0;
- if(run_all_mockup_tests()) return 1;
- if(unit_test_storage()) return 1;
- #ifdef ENABLE_DBENGINE
- if(test_dbengine()) return 1;
- #endif
- if(test_sqlite()) return 1;
- if(string_unittest(10000)) return 1;
- if (dictionary_unittest(10000))
- return 1;
- if(aral_unittest(10000))
- return 1;
- if (rrdlabels_unittest())
- return 1;
- if (ctx_unittest())
- return 1;
- fprintf(stderr, "\n\nALL TESTS PASSED\n\n");
- return 0;
- }
- else if(strcmp(optarg, "escapetest") == 0) {
- return command_argument_sanitization_tests();
- }
- else if(strcmp(optarg, "dicttest") == 0) {
- unittest_running = true;
- return dictionary_unittest(10000);
- }
- else if(strcmp(optarg, "araltest") == 0) {
- unittest_running = true;
- return aral_unittest(10000);
- }
- else if(strcmp(optarg, "stringtest") == 0) {
- unittest_running = true;
- return string_unittest(10000);
- }
- else if(strcmp(optarg, "rrdlabelstest") == 0) {
- unittest_running = true;
- return rrdlabels_unittest();
- }
- else if(strcmp(optarg, "buffertest") == 0) {
- unittest_running = true;
- return buffer_unittest();
- }
- #ifdef ENABLE_DBENGINE
- else if(strcmp(optarg, "mctest") == 0) {
- unittest_running = true;
- return mc_unittest();
- }
- else if(strcmp(optarg, "ctxtest") == 0) {
- unittest_running = true;
- return ctx_unittest();
- }
- else if(strcmp(optarg, "metatest") == 0) {
- unittest_running = true;
- return metadata_unittest();
- }
- else if(strcmp(optarg, "pgctest") == 0) {
- unittest_running = true;
- return pgc_unittest();
- }
- else if(strcmp(optarg, "mrgtest") == 0) {
- unittest_running = true;
- return mrg_unittest();
- }
- else if(strcmp(optarg, "julytest") == 0) {
- unittest_running = true;
- return julytest();
- }
- else if(strcmp(optarg, "parsertest") == 0) {
- unittest_running = true;
- return pluginsd_parser_unittest();
- }
- else if(strncmp(optarg, createdataset_string, strlen(createdataset_string)) == 0) {
- optarg += strlen(createdataset_string);
- unsigned history_seconds = strtoul(optarg, NULL, 0);
- post_conf_load(&user);
- get_netdata_configured_variables();
- default_rrd_update_every = 1;
- registry_init();
- if(rrd_init("dbengine-dataset", NULL, true)) {
- fprintf(stderr, "rrd_init failed for unittest\n");
- return 1;
- }
- generate_dbengine_dataset(history_seconds);
- return 0;
- }
- else if(strncmp(optarg, stresstest_string, strlen(stresstest_string)) == 0) {
- char *endptr;
- unsigned test_duration_sec = 0, dset_charts = 0, query_threads = 0, ramp_up_seconds = 0,
- page_cache_mb = 0, disk_space_mb = 0, workers = 16;
- optarg += strlen(stresstest_string);
- test_duration_sec = (unsigned)strtoul(optarg, &endptr, 0);
- if (',' == *endptr)
- dset_charts = (unsigned)strtoul(endptr + 1, &endptr, 0);
- if (',' == *endptr)
- query_threads = (unsigned)strtoul(endptr + 1, &endptr, 0);
- if (',' == *endptr)
- ramp_up_seconds = (unsigned)strtoul(endptr + 1, &endptr, 0);
- if (',' == *endptr)
- page_cache_mb = (unsigned)strtoul(endptr + 1, &endptr, 0);
- if (',' == *endptr)
- disk_space_mb = (unsigned)strtoul(endptr + 1, &endptr, 0);
- if (',' == *endptr)
- workers = (unsigned)strtoul(endptr + 1, &endptr, 0);
- if (workers > 1024)
- workers = 1024;
- char workers_str[16];
- snprintf(workers_str, 15, "%u", workers);
- setenv("UV_THREADPOOL_SIZE", workers_str, 1);
- dbengine_stress_test(test_duration_sec, dset_charts, query_threads, ramp_up_seconds,
- page_cache_mb, disk_space_mb);
- return 0;
- }
- #endif
- else if(strcmp(optarg, "simple-pattern") == 0) {
- if(optind + 2 > argc) {
- fprintf(stderr, "%s", "\nUSAGE: -W simple-pattern 'pattern' 'string'\n\n"
- " Checks if 'pattern' matches the given 'string'.\n"
- " - 'pattern' can be one or more space separated words.\n"
- " - each 'word' can contain one or more asterisks.\n"
- " - words starting with '!' give negative matches.\n"
- " - words are processed left to right\n"
- "\n"
- "Examples:\n"
- "\n"
- " > match all veth interfaces, except veth0:\n"
- "\n"
- " -W simple-pattern '!veth0 veth*' 'veth12'\n"
- "\n"
- "\n"
- " > match all *.ext files directly in /path/:\n"
- " (this will not match *.ext files in a subdir of /path/)\n"
- "\n"
- " -W simple-pattern '!/path/*/*.ext /path/*.ext' '/path/test.ext'\n"
- "\n"
- );
- return 1;
- }
- const char *haystack = argv[optind];
- const char *needle = argv[optind + 1];
- size_t len = strlen(needle) + 1;
- char wildcarded[len];
- SIMPLE_PATTERN *p = simple_pattern_create(haystack, NULL, SIMPLE_PATTERN_EXACT, true);
- SIMPLE_PATTERN_RESULT ret = simple_pattern_matches_extract(p, needle, wildcarded, len);
- simple_pattern_free(p);
- if(ret == SP_MATCHED_POSITIVE) {
- fprintf(stdout, "RESULT: POSITIVE MATCHED - pattern '%s' matches '%s', wildcarded '%s'\n", haystack, needle, wildcarded);
- return 0;
- }
- else if(ret == SP_MATCHED_NEGATIVE) {
- fprintf(stdout, "RESULT: NEGATIVE MATCHED - pattern '%s' matches '%s', wildcarded '%s'\n", haystack, needle, wildcarded);
- return 0;
- }
- else {
- fprintf(stdout, "RESULT: NOT MATCHED - pattern '%s' does not match '%s', wildcarded '%s'\n", haystack, needle, wildcarded);
- return 1;
- }
- }
- else if(strncmp(optarg, stacksize_string, strlen(stacksize_string)) == 0) {
- optarg += strlen(stacksize_string);
- config_set(CONFIG_SECTION_GLOBAL, "pthread stack size", optarg);
- }
- else if(strncmp(optarg, debug_flags_string, strlen(debug_flags_string)) == 0) {
- optarg += strlen(debug_flags_string);
- config_set(CONFIG_SECTION_LOGS, "debug flags", optarg);
- debug_flags = strtoull(optarg, NULL, 0);
- }
- else if(strcmp(optarg, "set") == 0) {
- if(optind + 3 > argc) {
- fprintf(stderr, "%s", "\nUSAGE: -W set 'section' 'key' 'value'\n\n"
- " Overwrites settings of netdata.conf.\n"
- "\n"
- " These options interact with: -c netdata.conf\n"
- " If -c netdata.conf is given on the command line,\n"
- " before -W set... the user may overwrite command\n"
- " line parameters at netdata.conf\n"
- " If -c netdata.conf is given after (or missing)\n"
- " -W set... the user cannot overwrite the command line\n"
- " parameters."
- "\n"
- );
- return 1;
- }
- const char *section = argv[optind];
- const char *key = argv[optind + 1];
- const char *value = argv[optind + 2];
- optind += 3;
- // set this one as the default
- // only if it is not already set in the config file
- // so the caller can use -c netdata.conf before or
- // after this parameter to prevent or allow overwriting
- // variables at netdata.conf
- config_set_default(section, key, value);
- // fprintf(stderr, "SET section '%s', key '%s', value '%s'\n", section, key, value);
- }
- else if(strcmp(optarg, "set2") == 0) {
- if(optind + 4 > argc) {
- fprintf(stderr, "%s", "\nUSAGE: -W set 'conf_file' 'section' 'key' 'value'\n\n"
- " Overwrites settings of netdata.conf or cloud.conf\n"
- "\n"
- " These options interact with: -c netdata.conf\n"
- " If -c netdata.conf is given on the command line,\n"
- " before -W set... the user may overwrite command\n"
- " line parameters at netdata.conf\n"
- " If -c netdata.conf is given after (or missing)\n"
- " -W set... the user cannot overwrite the command line\n"
- " parameters."
- " conf_file can be \"cloud\" or \"netdata\".\n"
- "\n"
- );
- return 1;
- }
- const char *conf_file = argv[optind]; /* "cloud" is cloud.conf, otherwise netdata.conf */
- struct config *tmp_config = strcmp(conf_file, "cloud") ? &netdata_config : &cloud_config;
- const char *section = argv[optind + 1];
- const char *key = argv[optind + 2];
- const char *value = argv[optind + 3];
- optind += 4;
- // set this one as the default
- // only if it is not already set in the config file
- // so the caller can use -c netdata.conf before or
- // after this parameter to prevent or allow overwriting
- // variables at netdata.conf
- appconfig_set_default(tmp_config, section, key, value);
- // fprintf(stderr, "SET section '%s', key '%s', value '%s'\n", section, key, value);
- }
- else if(strcmp(optarg, "get") == 0) {
- if(optind + 3 > argc) {
- fprintf(stderr, "%s", "\nUSAGE: -W get 'section' 'key' 'value'\n\n"
- " Prints settings of netdata.conf.\n"
- "\n"
- " These options interact with: -c netdata.conf\n"
- " -c netdata.conf has to be given before -W get.\n"
- "\n"
- );
- return 1;
- }
- if(!config_loaded) {
- fprintf(stderr, "warning: no configuration file has been loaded. Use -c CONFIG_FILE, before -W get. Using default config.\n");
- load_netdata_conf(NULL, 0, &user);
- }
- get_netdata_configured_variables();
- const char *section = argv[optind];
- const char *key = argv[optind + 1];
- const char *def = argv[optind + 2];
- const char *value = config_get(section, key, def);
- printf("%s\n", value);
- return 0;
- }
- else if(strcmp(optarg, "get2") == 0) {
- if(optind + 4 > argc) {
- fprintf(stderr, "%s", "\nUSAGE: -W get2 'conf_file' 'section' 'key' 'value'\n\n"
- " Prints settings of netdata.conf or cloud.conf\n"
- "\n"
- " These options interact with: -c netdata.conf\n"
- " -c netdata.conf has to be given before -W get2.\n"
- " conf_file can be \"cloud\" or \"netdata\".\n"
- "\n"
- );
- return 1;
- }
- if(!config_loaded) {
- fprintf(stderr, "warning: no configuration file has been loaded. Use -c CONFIG_FILE, before -W get. Using default config.\n");
- load_netdata_conf(NULL, 0, &user);
- load_cloud_conf(1);
- }
- get_netdata_configured_variables();
- const char *conf_file = argv[optind]; /* "cloud" is cloud.conf, otherwise netdata.conf */
- struct config *tmp_config = strcmp(conf_file, "cloud") ? &netdata_config : &cloud_config;
- const char *section = argv[optind + 1];
- const char *key = argv[optind + 2];
- const char *def = argv[optind + 3];
- const char *value = appconfig_get(tmp_config, section, key, def);
- printf("%s\n", value);
- return 0;
- }
- else if(strncmp(optarg, claim_string, strlen(claim_string)) == 0) {
- /* will trigger a claiming attempt when the agent is initialized */
- claiming_pending_arguments = optarg + strlen(claim_string);
- }
- else if(strcmp(optarg, "buildinfo") == 0) {
- print_build_info();
- return 0;
- }
- else if(strcmp(optarg, "buildinfojson") == 0) {
- print_build_info_json();
- return 0;
- }
- else if(strcmp(optarg, "keepopenfds") == 0) {
- // Internal dev option to skip closing inherited
- // open FDs. Useful, when we want to run the agent
- // under profiling tools that open/maintain their
- // own FDs.
- close_open_fds = false;
- } else {
- fprintf(stderr, "Unknown -W parameter '%s'\n", optarg);
- return help(1);
- }
- }
- break;
- default: /* ? */
- fprintf(stderr, "Unknown parameter '%c'\n", opt);
- return help(1);
- }
- }
- }
- if (close_open_fds == true) {
- // close all open file descriptors, except the standard ones
- // the caller may have left open files (lxc-attach has this issue)
- for_each_open_fd(OPEN_FD_ACTION_CLOSE, OPEN_FD_EXCLUDE_STDIN | OPEN_FD_EXCLUDE_STDOUT | OPEN_FD_EXCLUDE_STDERR);
- }
- if(!config_loaded) {
- load_netdata_conf(NULL, 0, &user);
- load_cloud_conf(0);
- }
- // ------------------------------------------------------------------------
- // initialize netdata
- {
- char *pmax = config_get(CONFIG_SECTION_GLOBAL, "glibc malloc arena max for plugins", "1");
- if(pmax && *pmax)
- setenv("MALLOC_ARENA_MAX", pmax, 1);
- #if defined(HAVE_C_MALLOPT)
- i = (int)config_get_number(CONFIG_SECTION_GLOBAL, "glibc malloc arena max for netdata", 1);
- if(i > 0)
- mallopt(M_ARENA_MAX, 1);
- #ifdef NETDATA_INTERNAL_CHECKS
- mallopt(M_PERTURB, 0x5A);
- // mallopt(M_MXFAST, 0);
- #endif
- #endif
- // set libuv worker threads
- libuv_worker_threads = (int)get_netdata_cpus() * 6;
- if(libuv_worker_threads < MIN_LIBUV_WORKER_THREADS)
- libuv_worker_threads = MIN_LIBUV_WORKER_THREADS;
- if(libuv_worker_threads > MAX_LIBUV_WORKER_THREADS)
- libuv_worker_threads = MAX_LIBUV_WORKER_THREADS;
- libuv_worker_threads = config_get_number(CONFIG_SECTION_GLOBAL, "libuv worker threads", libuv_worker_threads);
- if(libuv_worker_threads < MIN_LIBUV_WORKER_THREADS) {
- libuv_worker_threads = MIN_LIBUV_WORKER_THREADS;
- config_set_number(CONFIG_SECTION_GLOBAL, "libuv worker threads", libuv_worker_threads);
- }
- {
- char buf[20 + 1];
- snprintfz(buf, 20, "%d", libuv_worker_threads);
- setenv("UV_THREADPOOL_SIZE", buf, 1);
- }
- // prepare configuration environment variables for the plugins
- get_netdata_configured_variables();
- set_global_environment();
- // work while we are cd into config_dir
- // to allow the plugins refer to their config
- // files using relative filenames
- if(chdir(netdata_configured_user_config_dir) == -1)
- fatal("Cannot cd to '%s'", netdata_configured_user_config_dir);
- // Get execution path before switching user to avoid permission issues
- get_netdata_execution_path();
- }
- {
- // --------------------------------------------------------------------
- // get the debugging flags from the configuration file
- char *flags = config_get(CONFIG_SECTION_LOGS, "debug flags", "0x0000000000000000");
- setenv("NETDATA_DEBUG_FLAGS", flags, 1);
- debug_flags = strtoull(flags, NULL, 0);
- netdata_log_debug(D_OPTIONS, "Debug flags set to '0x%" PRIX64 "'.", debug_flags);
- if(debug_flags != 0) {
- struct rlimit rl = { RLIM_INFINITY, RLIM_INFINITY };
- if(setrlimit(RLIMIT_CORE, &rl) != 0)
- netdata_log_error("Cannot request unlimited core dumps for debugging... Proceeding anyway...");
- #ifdef HAVE_SYS_PRCTL_H
- prctl(PR_SET_DUMPABLE, 1, 0, 0, 0);
- #endif
- }
- // --------------------------------------------------------------------
- // get log filenames and settings
- log_init();
- error_log_limit_unlimited();
- // initialize the log files
- open_all_log_files();
- ieee754_doubles = is_system_ieee754_double();
- aral_judy_init();
- get_system_timezone();
- bearer_tokens_init();
- replication_initialize();
- // --------------------------------------------------------------------
- // get the certificate and start security
- #ifdef ENABLE_HTTPS
- security_init();
- #endif
- // --------------------------------------------------------------------
- // This is the safest place to start the SILENCERS structure
- set_silencers_filename();
- health_initialize_global_silencers();
- // --------------------------------------------------------------------
- // Initialize ML configuration
- delta_startup_time("initialize ML");
- ml_init();
- // --------------------------------------------------------------------
- // setup process signals
- // block signals while initializing threads.
- // this causes the threads to block signals.
- delta_startup_time("initialize signals");
- signals_block();
- signals_init(); // setup the signals we want to use
- // --------------------------------------------------------------------
- // check which threads are enabled and initialize them
- delta_startup_time("initialize static threads");
- // setup threads configs
- default_stacksize = netdata_threads_init();
- for (i = 0; static_threads[i].name != NULL ; i++) {
- struct netdata_static_thread *st = &static_threads[i];
- if(st->config_name)
- st->enabled = config_get_boolean(st->config_section, st->config_name, st->enabled);
- if(st->enabled && st->init_routine)
- st->init_routine();
- if(st->env_name)
- setenv(st->env_name, st->enabled?"YES":"NO", 1);
- if(st->global_variable)
- *st->global_variable = (st->enabled) ? true : false;
- }
- // --------------------------------------------------------------------
- // create the listening sockets
- delta_startup_time("initialize web server");
- web_client_api_v1_init();
- web_server_threading_selection();
- if(web_server_mode != WEB_SERVER_MODE_NONE)
- api_listen_sockets_setup();
- #ifdef ENABLE_H2O
- delta_startup_time("initialize h2o server");
- for (int i = 0; static_threads[i].name; i++) {
- if (static_threads[i].start_routine == h2o_main)
- static_threads[i].enabled = httpd_is_enabled();
- }
- #endif
- }
- delta_startup_time("set resource limits");
- #ifdef NETDATA_INTERNAL_CHECKS
- if(debug_flags != 0) {
- struct rlimit rl = { RLIM_INFINITY, RLIM_INFINITY };
- if(setrlimit(RLIMIT_CORE, &rl) != 0)
- netdata_log_error("Cannot request unlimited core dumps for debugging... Proceeding anyway...");
- #ifdef HAVE_SYS_PRCTL_H
- prctl(PR_SET_DUMPABLE, 1, 0, 0, 0);
- #endif
- }
- #endif /* NETDATA_INTERNAL_CHECKS */
- set_nofile_limit(&rlimit_nofile);
- delta_startup_time("become daemon");
- // fork, switch user, create pid file, set process priority
- if(become_daemon(dont_fork, user) == -1)
- fatal("Cannot daemonize myself.");
- netdata_log_info("netdata started on pid %d.", getpid());
- delta_startup_time("initialize threads after fork");
- netdata_threads_init_after_fork((size_t)config_get_number(CONFIG_SECTION_GLOBAL, "pthread stack size", (long)default_stacksize));
- // initialize internal registry
- delta_startup_time("initialize registry");
- registry_init();
- // fork the spawn server
- delta_startup_time("fork the spawn server");
- spawn_init();
- /*
- * Libuv uv_spawn() uses SIGCHLD internally:
- * https://github.com/libuv/libuv/blob/cc51217a317e96510fbb284721d5e6bc2af31e33/src/unix/process.c#L485
- * and inadvertently replaces the netdata signal handler which was setup during initialization.
- * Thusly, we must explicitly restore the signal handler for SIGCHLD.
- * Warning: extreme care is needed when mixing and matching POSIX and libuv.
- */
- signals_restore_SIGCHLD();
- // ------------------------------------------------------------------------
- // initialize rrd, registry, health, rrdpush, etc.
- delta_startup_time("collecting system info");
- netdata_anonymous_statistics_enabled=-1;
- struct rrdhost_system_info *system_info = callocz(1, sizeof(struct rrdhost_system_info));
- __atomic_sub_fetch(&netdata_buffers_statistics.rrdhost_allocations_size, sizeof(struct rrdhost_system_info), __ATOMIC_RELAXED);
- get_system_info(system_info, true);
- (void) registry_get_this_machine_guid();
- system_info->hops = 0;
- get_install_type(&system_info->install_type, &system_info->prebuilt_arch, &system_info->prebuilt_dist);
- delta_startup_time("initialize RRD structures");
- if(rrd_init(netdata_configured_hostname, system_info, false)) {
- set_late_global_environment(system_info);
- fatal("Cannot initialize localhost instance with name '%s'.", netdata_configured_hostname);
- }
- delta_startup_time("check for incomplete shutdown");
- char agent_crash_file[FILENAME_MAX + 1];
- char agent_incomplete_shutdown_file[FILENAME_MAX + 1];
- snprintfz(agent_incomplete_shutdown_file, FILENAME_MAX, "%s/.agent_incomplete_shutdown", netdata_configured_varlib_dir);
- int incomplete_shutdown_detected = (unlink(agent_incomplete_shutdown_file) == 0);
- snprintfz(agent_crash_file, FILENAME_MAX, "%s/.agent_crash", netdata_configured_varlib_dir);
- int crash_detected = (unlink(agent_crash_file) == 0);
- int fd = open(agent_crash_file, O_WRONLY | O_CREAT | O_TRUNC, 444);
- if (fd >= 0)
- close(fd);
- // ------------------------------------------------------------------------
- // Claim netdata agent to a cloud endpoint
- delta_startup_time("collect claiming info");
- if (claiming_pending_arguments)
- claim_agent(claiming_pending_arguments, false, NULL);
- load_claiming_state();
- // ------------------------------------------------------------------------
- // enable log flood protection
- error_log_limit_reset();
- // Load host labels
- delta_startup_time("collect host labels");
- reload_host_labels();
- // ------------------------------------------------------------------------
- // spawn the threads
- delta_startup_time("start the static threads");
- web_server_config_options();
- netdata_zero_metrics_enabled = config_get_boolean_ondemand(CONFIG_SECTION_DB, "enable zero metrics", CONFIG_BOOLEAN_NO);
- set_late_global_environment(system_info);
- for (i = 0; static_threads[i].name != NULL ; i++) {
- struct netdata_static_thread *st = &static_threads[i];
- if(st->enabled) {
- st->thread = mallocz(sizeof(netdata_thread_t));
- netdata_log_debug(D_SYSTEM, "Starting thread %s.", st->name);
- netdata_thread_create(st->thread, st->name, NETDATA_THREAD_OPTION_DEFAULT, st->start_routine, st);
- }
- else
- netdata_log_debug(D_SYSTEM, "Not starting thread %s.", st->name);
- }
- ml_start_threads();
- // ------------------------------------------------------------------------
- // Initialize netdata agent command serving from cli and signals
- delta_startup_time("initialize commands API");
- commands_init();
- delta_startup_time("ready");
- usec_t ready_ut = now_monotonic_usec();
- netdata_log_info("NETDATA STARTUP: completed in %llu ms. Enjoy real-time performance monitoring!", (ready_ut - started_ut) / USEC_PER_MS);
- netdata_ready = true;
- send_statistics("START", "-", "-");
- if (crash_detected)
- send_statistics("CRASH", "-", "-");
- if (incomplete_shutdown_detected)
- send_statistics("INCOMPLETE_SHUTDOWN", "-", "-");
- //check if ANALYTICS needs to start
- if (netdata_anonymous_statistics_enabled == 1) {
- for (i = 0; static_threads[i].name != NULL; i++) {
- if (!strncmp(static_threads[i].name, "ANALYTICS", 9)) {
- struct netdata_static_thread *st = &static_threads[i];
- st->thread = mallocz(sizeof(netdata_thread_t));
- st->enabled = 1;
- netdata_log_debug(D_SYSTEM, "Starting thread %s.", st->name);
- netdata_thread_create(st->thread, st->name, NETDATA_THREAD_OPTION_DEFAULT, st->start_routine, st);
- }
- }
- }
- // ------------------------------------------------------------------------
- // Report ACLK build failure
- #ifndef ENABLE_ACLK
- netdata_log_error("This agent doesn't have ACLK.");
- char filename[FILENAME_MAX + 1];
- snprintfz(filename, FILENAME_MAX, "%s/.aclk_report_sent", netdata_configured_varlib_dir);
- if (netdata_anonymous_statistics_enabled > 0 && access(filename, F_OK)) { // -1 -> not initialized
- send_statistics("ACLK_DISABLED", "-", "-");
- int fd = open(filename, O_WRONLY | O_CREAT | O_TRUNC, 444);
- if (fd == -1)
- netdata_log_error("Cannot create file '%s'. Please fix this.", filename);
- else
- close(fd);
- }
- #endif
- // ------------------------------------------------------------------------
- // initialize WebRTC
- webrtc_initialize();
- // ------------------------------------------------------------------------
- // unblock signals
- signals_unblock();
- // ------------------------------------------------------------------------
- // Handle signals
- signals_handle();
- // should never reach this point
- // but we need it for rpmlint #2752
- return 1;
- }
|