sqlite_aclk_chart.c 35 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "sqlite_functions.h"
  3. #include "sqlite_aclk_chart.h"
  4. #ifdef ENABLE_NEW_CLOUD_PROTOCOL
  5. #include "../../aclk/aclk_charts_api.h"
  6. #include "../../aclk/aclk.h"
  7. static inline int sql_queue_chart_payload(struct aclk_database_worker_config *wc,
  8. void *data, enum aclk_database_opcode opcode)
  9. {
  10. int rc;
  11. if (unlikely(!wc))
  12. return 1;
  13. struct aclk_database_cmd cmd;
  14. memset(&cmd, 0, sizeof(cmd));
  15. cmd.opcode = opcode;
  16. cmd.data = data;
  17. rc = aclk_database_enq_cmd_noblock(wc, &cmd);
  18. return rc;
  19. }
  20. static int payload_sent(char *uuid_str, uuid_t *uuid, void *payload, size_t payload_size)
  21. {
  22. static __thread sqlite3_stmt *res = NULL;
  23. int rc;
  24. int send_status = 0;
  25. if (unlikely(!res)) {
  26. BUFFER *sql = buffer_create(1024);
  27. buffer_sprintf(sql,"SELECT 1 FROM aclk_chart_latest_%s acl, aclk_chart_payload_%s acp "
  28. "WHERE acl.unique_id = acp.unique_id AND acl.uuid = @uuid AND acp.payload = @payload;",
  29. uuid_str, uuid_str);
  30. rc = prepare_statement(db_meta, (char *) buffer_tostring(sql), &res);
  31. buffer_free(sql);
  32. if (rc != SQLITE_OK) {
  33. error_report("Failed to prepare statement to check payload data");
  34. return 0;
  35. }
  36. }
  37. rc = sqlite3_bind_blob(res, 1, uuid , sizeof(*uuid), SQLITE_STATIC);
  38. if (unlikely(rc != SQLITE_OK))
  39. goto bind_fail;
  40. rc = sqlite3_bind_blob(res, 2, payload , payload_size, SQLITE_STATIC);
  41. if (unlikely(rc != SQLITE_OK))
  42. goto bind_fail;
  43. while (sqlite3_step(res) == SQLITE_ROW) {
  44. send_status = sqlite3_column_int(res, 0);
  45. }
  46. bind_fail:
  47. if (unlikely(sqlite3_reset(res) != SQLITE_OK))
  48. error_report("Failed to reset statement in check payload, rc = %d", rc);
  49. return send_status;
  50. }
  51. static int aclk_add_chart_payload(struct aclk_database_worker_config *wc, uuid_t *uuid, char *claim_id,
  52. ACLK_PAYLOAD_TYPE payload_type, void *payload, size_t payload_size)
  53. {
  54. static __thread sqlite3_stmt *res_chart = NULL;
  55. int rc;
  56. rc = payload_sent(wc->uuid_str, uuid, payload, payload_size);
  57. if (rc == 1)
  58. return 0;
  59. if (unlikely(!res_chart)) {
  60. BUFFER *sql = buffer_create(1024);
  61. buffer_sprintf(sql,"INSERT INTO aclk_chart_payload_%s (unique_id, uuid, claim_id, date_created, type, payload) " \
  62. "VALUES (@unique_id, @uuid, @claim_id, strftime('%%s','now'), @type, @payload);", wc->uuid_str);
  63. rc = prepare_statement(db_meta, (char *) buffer_tostring(sql), &res_chart);
  64. buffer_free(sql);
  65. if (rc != SQLITE_OK) {
  66. error_report("Failed to prepare statement to store chart payload data");
  67. return 1;
  68. }
  69. }
  70. uuid_t unique_uuid;
  71. uuid_generate(unique_uuid);
  72. uuid_t claim_uuid;
  73. if (uuid_parse(claim_id, claim_uuid))
  74. return 1;
  75. rc = sqlite3_bind_blob(res_chart, 1, &unique_uuid , sizeof(unique_uuid), SQLITE_STATIC);
  76. if (unlikely(rc != SQLITE_OK))
  77. goto bind_fail;
  78. rc = sqlite3_bind_blob(res_chart, 2, uuid , sizeof(*uuid), SQLITE_STATIC);
  79. if (unlikely(rc != SQLITE_OK))
  80. goto bind_fail;
  81. rc = sqlite3_bind_blob(res_chart, 3, &claim_uuid , sizeof(claim_uuid), SQLITE_STATIC);
  82. if (unlikely(rc != SQLITE_OK))
  83. goto bind_fail;
  84. rc = sqlite3_bind_int(res_chart, 4, payload_type);
  85. if (unlikely(rc != SQLITE_OK))
  86. goto bind_fail;
  87. rc = sqlite3_bind_blob(res_chart, 5, payload, payload_size, SQLITE_STATIC);
  88. if (unlikely(rc != SQLITE_OK))
  89. goto bind_fail;
  90. rc = execute_insert(res_chart);
  91. if (unlikely(rc != SQLITE_DONE))
  92. error_report("Failed store chart payload event, rc = %d", rc);
  93. else {
  94. wc->chart_payload_count++;
  95. time_t now = now_realtime_sec();
  96. if (wc->rotation_after > now && wc->rotation_after < now + ACLK_DATABASE_ROTATION_DELAY)
  97. wc->rotation_after = now + ACLK_DATABASE_ROTATION_DELAY;
  98. }
  99. bind_fail:
  100. if (unlikely(sqlite3_reset(res_chart) != SQLITE_OK))
  101. error_report("Failed to reset statement in store chart payload, rc = %d", rc);
  102. return (rc != SQLITE_DONE);
  103. }
  104. int aclk_add_chart_event(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  105. {
  106. int rc = 0;
  107. CHECK_SQLITE_CONNECTION(db_meta);
  108. char *claim_id = is_agent_claimed();
  109. RRDSET *st = cmd.data;
  110. if (likely(claim_id)) {
  111. struct chart_instance_updated chart_payload;
  112. memset(&chart_payload, 0, sizeof(chart_payload));
  113. chart_payload.config_hash = get_str_from_uuid(&st->state->hash_id);
  114. chart_payload.update_every = st->update_every;
  115. chart_payload.memory_mode = st->rrd_memory_mode;
  116. chart_payload.name = (char *)st->name;
  117. chart_payload.node_id = wc->node_id;
  118. chart_payload.claim_id = claim_id;
  119. chart_payload.id = strdupz(st->id);
  120. struct label_index *labels = &st->state->labels;
  121. netdata_rwlock_wrlock(&labels->labels_rwlock);
  122. struct label *label_list = labels->head;
  123. struct label *chart_label = NULL;
  124. while (label_list) {
  125. chart_label = add_label_to_list(chart_label, label_list->key, label_list->value, label_list->label_source);
  126. label_list = label_list->next;
  127. }
  128. netdata_rwlock_unlock(&labels->labels_rwlock);
  129. chart_payload.label_head = chart_label;
  130. size_t size;
  131. char *payload = generate_chart_instance_updated(&size, &chart_payload);
  132. if (likely(payload))
  133. rc = aclk_add_chart_payload(wc, st->chart_uuid, claim_id, ACLK_PAYLOAD_CHART, (void *) payload, size);
  134. freez(payload);
  135. chart_instance_updated_destroy(&chart_payload);
  136. }
  137. return rc;
  138. }
  139. static inline int aclk_upd_dimension_event(struct aclk_database_worker_config *wc, char *claim_id, uuid_t *dim_uuid,
  140. const char *dim_id, const char *dim_name, const char *chart_type_id, time_t first_time, time_t last_time)
  141. {
  142. int rc = 0;
  143. size_t size;
  144. if (unlikely(!dim_uuid || !dim_id || !dim_name || !chart_type_id))
  145. return 0;
  146. struct chart_dimension_updated dim_payload;
  147. memset(&dim_payload, 0, sizeof(dim_payload));
  148. #ifdef NETDATA_INTERNAL_CHECKS
  149. if (!first_time)
  150. info("Host %s (node %s) deleting dimension id=[%s] name=[%s] chart=[%s]",
  151. wc->host_guid, wc->node_id, dim_id, dim_name, chart_type_id);
  152. #endif
  153. dim_payload.node_id = wc->node_id;
  154. dim_payload.claim_id = claim_id;
  155. dim_payload.name = dim_name;
  156. dim_payload.id = dim_id;
  157. dim_payload.chart_id = chart_type_id;
  158. dim_payload.created_at.tv_sec = first_time;
  159. dim_payload.last_timestamp.tv_sec = last_time;
  160. char *payload = generate_chart_dimension_updated(&size, &dim_payload);
  161. if (likely(payload))
  162. rc = aclk_add_chart_payload(wc, dim_uuid, claim_id, ACLK_PAYLOAD_DIMENSION, (void *)payload, size);
  163. freez(payload);
  164. return rc;
  165. }
  166. void aclk_process_dimension_deletion(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  167. {
  168. int rc = 0;
  169. sqlite3_stmt *res = NULL;
  170. if (!aclk_use_new_cloud_arch || !aclk_connected)
  171. return;
  172. if (unlikely(!db_meta))
  173. return;
  174. uuid_t host_id;
  175. if (uuid_parse(wc->host_guid, host_id))
  176. return;
  177. char *claim_id = is_agent_claimed();
  178. if (!claim_id)
  179. return;
  180. rc = sqlite3_prepare_v2(db_meta, "DELETE FROM dimension_delete where host_id = @host_id " \
  181. "RETURNING dimension_id, dimension_name, chart_type_id, dim_id LIMIT 10;", -1, &res, 0);
  182. if (rc != SQLITE_OK) {
  183. error_report("Failed to prepare statement when trying to delete dimension deletes");
  184. freez(claim_id);
  185. return;
  186. }
  187. rc = sqlite3_bind_blob(res, 1, &host_id , sizeof(host_id), SQLITE_STATIC);
  188. if (unlikely(rc != SQLITE_OK))
  189. goto bind_fail;
  190. unsigned count = 0;
  191. while (sqlite3_step(res) == SQLITE_ROW) {
  192. (void) aclk_upd_dimension_event(
  193. wc,
  194. claim_id,
  195. (uuid_t *)sqlite3_column_text(res, 3),
  196. (const char *)sqlite3_column_text(res, 0),
  197. (const char *)sqlite3_column_text(res, 1),
  198. (const char *)sqlite3_column_text(res, 2),
  199. 0,
  200. 0);
  201. count++;
  202. }
  203. if (count) {
  204. memset(&cmd, 0, sizeof(cmd));
  205. cmd.opcode = ACLK_DATABASE_DIM_DELETION;
  206. if (aclk_database_enq_cmd_noblock(wc, &cmd))
  207. info("Failed to queue a dimension deletion message");
  208. }
  209. bind_fail:
  210. rc = sqlite3_finalize(res);
  211. if (unlikely(rc != SQLITE_OK))
  212. error_report("Failed to finalize statement when adding dimension deletion events, rc = %d", rc);
  213. freez(claim_id);
  214. return;
  215. }
  216. int aclk_add_dimension_event(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  217. {
  218. int rc = 0;
  219. CHECK_SQLITE_CONNECTION(db_meta);
  220. char *claim_id = is_agent_claimed();
  221. RRDDIM *rd = cmd.data;
  222. if (likely(claim_id)) {
  223. time_t now = now_realtime_sec();
  224. time_t first_t = rd->state->query_ops.oldest_time(rd);
  225. time_t last_t = rd->state->query_ops.latest_time(rd);
  226. int live = ((now - last_t) < (RRDSET_MINIMUM_LIVE_COUNT * rd->update_every));
  227. rc = aclk_upd_dimension_event(
  228. wc,
  229. claim_id,
  230. &rd->state->metric_uuid,
  231. rd->id,
  232. rd->name,
  233. rd->rrdset->id,
  234. first_t,
  235. live ? 0 : last_t);
  236. freez(claim_id);
  237. }
  238. rrddim_flag_clear(rd, RRDDIM_FLAG_ACLK);
  239. return rc;
  240. }
  241. void aclk_send_chart_event(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  242. {
  243. int rc;
  244. wc->chart_pending = 0;
  245. if (unlikely(!wc->chart_updates)) {
  246. log_access("AC [%s (%s)]: Ignoring chart push event, updates have been turned off for this node.", wc->node_id, wc->host ? wc->host->hostname : "N/A");
  247. return;
  248. }
  249. char *claim_id = is_agent_claimed();
  250. if (unlikely(!claim_id))
  251. return;
  252. uuid_t claim_uuid;
  253. if (uuid_parse(claim_id, claim_uuid))
  254. return;
  255. int limit = cmd.count > 0 ? cmd.count : 1;
  256. uint64_t first_sequence;
  257. uint64_t last_sequence;
  258. time_t last_timestamp;
  259. BUFFER *sql = buffer_create(1024);
  260. sqlite3_stmt *res = NULL;
  261. buffer_sprintf(sql, "SELECT ac.sequence_id, acp.payload, ac.date_created, ac.type, ac.uuid " \
  262. "FROM aclk_chart_%s ac, aclk_chart_payload_%s acp " \
  263. "WHERE ac.date_submitted IS NULL AND ac.unique_id = acp.unique_id AND ac.update_count > 0 " \
  264. "AND acp.claim_id = @claim_id ORDER BY ac.sequence_id ASC LIMIT %d;", wc->uuid_str, wc->uuid_str, limit);
  265. rc = sqlite3_prepare_v2(db_meta, buffer_tostring(sql), -1, &res, 0);
  266. if (rc != SQLITE_OK) {
  267. error_report("Failed to prepare statement when trying to send a chart update via ACLK");
  268. buffer_free(sql);
  269. freez(claim_id);
  270. return;
  271. }
  272. rc = sqlite3_bind_blob(res, 1, claim_uuid , sizeof(claim_uuid), SQLITE_STATIC);
  273. if (unlikely(rc != SQLITE_OK))
  274. goto bind_fail;
  275. char **payload_list = callocz(limit+1, sizeof(char *));
  276. size_t *payload_list_size = callocz(limit+1, sizeof(size_t));
  277. size_t *payload_list_max_size = callocz(limit+1, sizeof(size_t));
  278. struct aclk_message_position *position_list = callocz(limit+1, sizeof(*position_list));
  279. int *is_dim = callocz(limit+1, sizeof(*is_dim));
  280. int loop = cmd.param1;
  281. uint64_t start_sequence_id = wc->chart_sequence_id;
  282. while (loop > 0) {
  283. uint64_t previous_sequence_id = wc->chart_sequence_id;
  284. int count = 0;
  285. first_sequence = 0;
  286. last_sequence = 0;
  287. while (count < limit && sqlite3_step(res) == SQLITE_ROW) {
  288. size_t payload_size = sqlite3_column_bytes(res, 1);
  289. if (payload_list_max_size[count] < payload_size) {
  290. freez(payload_list[count]);
  291. payload_list_max_size[count] = payload_size;
  292. payload_list[count] = mallocz(payload_size);
  293. }
  294. payload_list_size[count] = payload_size;
  295. memcpy(payload_list[count], sqlite3_column_blob(res, 1), payload_size);
  296. position_list[count].sequence_id = (uint64_t)sqlite3_column_int64(res, 0);
  297. position_list[count].previous_sequence_id = previous_sequence_id;
  298. position_list[count].seq_id_creation_time.tv_sec = sqlite3_column_int64(res, 2);
  299. position_list[count].seq_id_creation_time.tv_usec = 0;
  300. if (!first_sequence)
  301. first_sequence = position_list[count].sequence_id;
  302. last_sequence = position_list[count].sequence_id;
  303. last_timestamp = position_list[count].seq_id_creation_time.tv_sec;
  304. previous_sequence_id = last_sequence;
  305. is_dim[count] = sqlite3_column_int(res, 3) > 0;
  306. count++;
  307. if (wc->chart_payload_count)
  308. wc->chart_payload_count--;
  309. }
  310. freez(payload_list[count]);
  311. payload_list_max_size[count] = 0;
  312. payload_list[count] = NULL;
  313. rc = sqlite3_reset(res);
  314. if (unlikely(rc != SQLITE_OK))
  315. error_report("Failed to reset statement when pushing chart events, rc = %d", rc);
  316. if (likely(first_sequence)) {
  317. buffer_flush(sql);
  318. db_lock();
  319. buffer_sprintf(sql, "UPDATE aclk_chart_%s SET status = NULL, date_submitted=strftime('%%s','now') "
  320. "WHERE date_submitted IS NULL AND sequence_id BETWEEN %" PRIu64 " AND %" PRIu64 ";",
  321. wc->uuid_str, first_sequence, last_sequence);
  322. db_execute(buffer_tostring(sql));
  323. buffer_flush(sql);
  324. buffer_sprintf(sql, "INSERT OR REPLACE INTO aclk_chart_latest_%s (uuid, unique_id, date_submitted) "
  325. " SELECT uuid, unique_id, date_submitted FROM aclk_chart_%s s "
  326. " WHERE date_submitted IS NOT NULL AND sequence_id BETWEEN %" PRIu64 " AND %" PRIu64
  327. " ;",
  328. wc->uuid_str, wc->uuid_str, first_sequence, last_sequence);
  329. db_execute(buffer_tostring(sql));
  330. db_unlock();
  331. aclk_chart_inst_and_dim_update(payload_list, payload_list_size, is_dim, position_list, wc->batch_id);
  332. log_access("OG [%s (%s)]: Sending charts and dimensions update, batch_id %"PRIu64", first sequence %"PRIu64", last sequence %"PRIu64, wc->node_id, wc->host ? wc->host->hostname : "N/A", wc->batch_id, first_sequence, last_sequence);
  333. wc->chart_sequence_id = last_sequence;
  334. wc->chart_timestamp = last_timestamp;
  335. }
  336. else
  337. break;
  338. --loop;
  339. }
  340. if (start_sequence_id != wc->chart_sequence_id) {
  341. time_t now = now_realtime_sec();
  342. if (wc->rotation_after > now && wc->rotation_after < now + ACLK_DATABASE_ROTATION_DELAY)
  343. wc->rotation_after = now + ACLK_DATABASE_ROTATION_DELAY;
  344. }
  345. else {
  346. wc->chart_payload_count = sql_get_pending_count(wc);
  347. if (!wc->chart_payload_count)
  348. log_access("AC [%s (%s)]: Sync of charts and dimensions done in %ld seconds.", wc->node_id, wc->host ? wc->host->hostname : "N/A", now_realtime_sec() - wc->startup_time);
  349. }
  350. for (int i = 0; i <= limit; ++i)
  351. freez(payload_list[i]);
  352. freez(payload_list);
  353. freez(payload_list_size);
  354. freez(payload_list_max_size);
  355. freez(position_list);
  356. freez(is_dim);
  357. bind_fail:
  358. rc = sqlite3_finalize(res);
  359. if (unlikely(rc != SQLITE_OK))
  360. error_report("Failed to finalize statement when pushing chart events, rc = %d", rc);
  361. buffer_free(sql);
  362. freez(claim_id);
  363. return;
  364. }
  365. // Push one chart config to the cloud
  366. int aclk_send_chart_config(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  367. {
  368. UNUSED(wc);
  369. CHECK_SQLITE_CONNECTION(db_meta);
  370. sqlite3_stmt *res = NULL;
  371. int rc = 0;
  372. char *hash_id = (char *) cmd.data_param;
  373. uuid_t hash_uuid;
  374. rc = uuid_parse(hash_id, hash_uuid);
  375. if (unlikely(rc)) {
  376. freez((char *) cmd.data_param);
  377. return 1;
  378. }
  379. BUFFER *sql = buffer_create(1024);
  380. buffer_sprintf(sql, "SELECT type, family, context, title, priority, plugin, module, unit, chart_type " \
  381. "FROM chart_hash WHERE hash_id = @hash_id;");
  382. rc = sqlite3_prepare_v2(db_meta, buffer_tostring(sql), -1, &res, 0);
  383. if (rc != SQLITE_OK) {
  384. error_report("Failed to prepare statement when trying to fetch a chart hash configuration");
  385. goto fail;
  386. }
  387. rc = sqlite3_bind_blob(res, 1, &hash_uuid , sizeof(hash_uuid), SQLITE_STATIC);
  388. if (unlikely(rc != SQLITE_OK))
  389. goto bind_fail;
  390. struct chart_config_updated chart_config;
  391. chart_config.config_hash = NULL;
  392. while (sqlite3_step(res) == SQLITE_ROW) {
  393. chart_config.type = strdupz((char *)sqlite3_column_text(res, 0));
  394. chart_config.family = strdupz((char *)sqlite3_column_text(res, 1));
  395. chart_config.context = strdupz((char *)sqlite3_column_text(res, 2));
  396. chart_config.title = strdupz((char *)sqlite3_column_text(res, 3));
  397. chart_config.priority = sqlite3_column_int64(res, 4);
  398. chart_config.plugin = strdupz((char *)sqlite3_column_text(res, 5));
  399. chart_config.module = sqlite3_column_bytes(res, 6) > 0 ? strdupz((char *)sqlite3_column_text(res, 6)) : NULL;
  400. chart_config.chart_type = (RRDSET_TYPE) sqlite3_column_int(res,8);
  401. chart_config.units = strdupz((char *)sqlite3_column_text(res, 7));
  402. chart_config.config_hash = strdupz(hash_id);
  403. }
  404. if (likely(chart_config.config_hash)) {
  405. log_access("OG [%s (%s)]: Sending chart config for %s.", wc->node_id, wc->host ? wc->host->hostname : "N/A", hash_id);
  406. aclk_chart_config_updated(&chart_config, 1);
  407. destroy_chart_config_updated(&chart_config);
  408. }
  409. else
  410. log_access("AC [%s (%s)]: Chart config for %s not found.", wc->node_id, wc->host ? wc->host->hostname : "N/A", hash_id);
  411. bind_fail:
  412. rc = sqlite3_finalize(res);
  413. if (unlikely(rc != SQLITE_OK))
  414. error_report("Failed to reset statement when pushing chart config hash, rc = %d", rc);
  415. fail:
  416. freez((char *) cmd.data_param);
  417. buffer_free(sql);
  418. return rc;
  419. }
  420. void aclk_receive_chart_ack(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  421. {
  422. int rc;
  423. sqlite3_stmt *res = NULL;
  424. log_access("IN [%s (%s)]: Received ack chart sequence id %"PRIu64, wc->node_id, wc->host ? wc->host->hostname : "N/A", cmd.param1);
  425. BUFFER *sql = buffer_create(1024);
  426. buffer_sprintf(sql, "UPDATE aclk_chart_%s SET date_updated=strftime('%%s','now') WHERE sequence_id <= @sequence_id "
  427. "AND date_submitted IS NOT NULL AND date_updated IS NULL;", wc->uuid_str);
  428. rc = sqlite3_prepare_v2(db_meta, buffer_tostring(sql), -1, &res, 0);
  429. if (rc != SQLITE_OK) {
  430. error_report("Failed to prepare statement count sequence ids in the database");
  431. goto prepare_fail;
  432. }
  433. rc = sqlite3_bind_int64(res, 1, (uint64_t) cmd.param1);
  434. if (unlikely(rc != SQLITE_OK))
  435. goto bind_fail;
  436. rc = execute_insert(res);
  437. if (rc != SQLITE_DONE)
  438. error_report("Failed to ACK sequence id, rc = %d", rc);
  439. bind_fail:
  440. if (unlikely(sqlite3_finalize(res) != SQLITE_OK))
  441. error_report("Failed to finalize statement to ACK older sequence ids, rc = %d", rc);
  442. prepare_fail:
  443. buffer_free(sql);
  444. return;
  445. }
  446. void aclk_receive_chart_reset(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  447. {
  448. BUFFER *sql = buffer_create(1024);
  449. buffer_sprintf(sql, "UPDATE aclk_chart_%s SET status = NULL, date_submitted = NULL WHERE sequence_id >= %"PRIu64";",
  450. wc->uuid_str, cmd.param1);
  451. db_execute(buffer_tostring(sql));
  452. if (cmd.param1 == 1) {
  453. db_lock();
  454. buffer_flush(sql);
  455. log_access("IN [%s (%s)]: Received chart full resync.", wc->node_id, wc->host ? wc->host->hostname : "N/A");
  456. buffer_sprintf(sql, "DELETE FROM aclk_chart_payload_%s; DELETE FROM aclk_chart_%s; " \
  457. "DELETE FROM aclk_chart_latest_%s;", wc->uuid_str, wc->uuid_str, wc->uuid_str);
  458. db_execute("BEGIN TRANSACTION;");
  459. db_execute(buffer_tostring(sql));
  460. db_execute("COMMIT TRANSACTION;");
  461. db_unlock();
  462. wc->chart_sequence_id = 0;
  463. wc->chart_timestamp = 0;
  464. wc->chart_payload_count = 0;
  465. RRDHOST *host = wc->host;
  466. if (likely(host)) {
  467. rrdhost_rdlock(host);
  468. RRDSET *st;
  469. rrdset_foreach_read(st, host)
  470. {
  471. rrdset_rdlock(st);
  472. rrdset_flag_clear(st, RRDSET_FLAG_ACLK);
  473. RRDDIM *rd;
  474. rrddim_foreach_read(rd, st)
  475. {
  476. rd->state->aclk_live_status = (rd->state->aclk_live_status == 0);
  477. }
  478. rrdset_unlock(st);
  479. }
  480. rrdhost_unlock(host);
  481. }
  482. else
  483. error_report("ACLK synchronization thread for %s is not linked to HOST", wc->host_guid);
  484. }
  485. else {
  486. log_access("AC [%s (%s)]: Restarting chart sync from sequence %"PRIu64, wc->node_id, wc->host ? wc->host->hostname : "N/A", cmd.param1);
  487. wc->chart_payload_count = sql_get_pending_count(wc);
  488. sql_get_last_chart_sequence(wc);
  489. }
  490. buffer_free(sql);
  491. wc->chart_updates = 1;
  492. return;
  493. }
  494. //
  495. // Functions called directly from ACLK threads and will queue commands
  496. //
  497. void aclk_get_chart_config(char **hash_id)
  498. {
  499. struct aclk_database_worker_config *wc = (struct aclk_database_worker_config *)localhost->dbsync_worker;
  500. if (unlikely(!wc || !hash_id))
  501. return;
  502. struct aclk_database_cmd cmd;
  503. memset(&cmd, 0, sizeof(cmd));
  504. cmd.opcode = ACLK_DATABASE_PUSH_CHART_CONFIG;
  505. for (int i = 0; hash_id[i]; ++i) {
  506. // TODO: Verify that we have a valid hash_id
  507. log_access("IN [%s (%s)]: Request %d for chart config with hash %s received.", wc->node_id, wc->host ? wc->host->hostname : "N/A", i, hash_id[i]);
  508. cmd.data_param = (void *)strdupz(hash_id[i]);
  509. aclk_database_enq_cmd(wc, &cmd);
  510. }
  511. return;
  512. }
  513. // Send a command to a node_id
  514. // Need to discover the thread that will handle the request
  515. // if thread not in active hosts, then try to find in the queue
  516. static void aclk_submit_param_command(char *node_id, enum aclk_database_opcode aclk_command, uint64_t param)
  517. {
  518. if (unlikely(!node_id))
  519. return;
  520. struct aclk_database_worker_config *wc = NULL;
  521. struct aclk_database_cmd cmd;
  522. memset(&cmd, 0, sizeof(cmd));
  523. cmd.opcode = aclk_command;
  524. cmd.param1 = param;
  525. rrd_wrlock();
  526. RRDHOST *host = find_host_by_node_id(node_id);
  527. if (likely(host))
  528. wc = (struct aclk_database_worker_config *)host->dbsync_worker;
  529. rrd_unlock();
  530. if (wc)
  531. aclk_database_enq_cmd(wc, &cmd);
  532. else {
  533. if (aclk_worker_enq_cmd(node_id, &cmd))
  534. log_access("AC [%s (%s)]: ACLK synchronization thread is not active.", node_id, host ? host->hostname : "N/A");
  535. }
  536. return;
  537. }
  538. void aclk_ack_chart_sequence_id(char *node_id, uint64_t last_sequence_id)
  539. {
  540. if (unlikely(!node_id))
  541. return;
  542. log_access("AC [%s (N/A)]: Node reports last sequence id received %"PRIu64, node_id, last_sequence_id);
  543. aclk_submit_param_command(node_id, ACLK_DATABASE_CHART_ACK, last_sequence_id);
  544. return;
  545. }
  546. // Start streaming charts / dimensions for node_id
  547. void aclk_start_streaming(char *node_id, uint64_t sequence_id, time_t created_at, uint64_t batch_id)
  548. {
  549. UNUSED(created_at);
  550. if (unlikely(!node_id))
  551. return;
  552. log_access("IN [%s (N/A)]: Start streaming charts from sequence %"PRIu64" t=%ld, batch=%"PRIu64, node_id,
  553. sequence_id, created_at, batch_id);
  554. uuid_t node_uuid;
  555. if (uuid_parse(node_id, node_uuid))
  556. return;
  557. struct aclk_database_worker_config *wc = NULL;
  558. rrd_wrlock();
  559. RRDHOST *host = localhost;
  560. while(host) {
  561. if (host->node_id && !(uuid_compare(*host->node_id, node_uuid))) {
  562. rrd_unlock();
  563. wc = (struct aclk_database_worker_config *)host->dbsync_worker;
  564. if (likely(wc)) {
  565. wc->chart_reset_count++;
  566. __sync_synchronize();
  567. wc->chart_updates = 0;
  568. wc->batch_id = batch_id;
  569. __sync_synchronize();
  570. wc->batch_created = now_realtime_sec();
  571. if (sequence_id > wc->chart_sequence_id || wc->chart_reset_count > 10) {
  572. log_access("AC [%s (%s)]: Requesting full resync from the cloud "
  573. "(reset=%d, remote_seq=%"PRIu64", local_seq=%"PRIu64")"
  574. , wc->node_id, wc->host ? wc->host->hostname : "N/A", wc->chart_reset_count, sequence_id, wc->chart_sequence_id);
  575. chart_reset_t chart_reset;
  576. chart_reset.claim_id = is_agent_claimed();
  577. if (chart_reset.claim_id) {
  578. chart_reset.node_id = node_id;
  579. chart_reset.reason = SEQ_ID_NOT_EXISTS;
  580. aclk_chart_reset(chart_reset);
  581. freez(chart_reset.claim_id);
  582. wc->chart_reset_count = -1;
  583. }
  584. return;
  585. } else {
  586. struct aclk_database_cmd cmd;
  587. memset(&cmd, 0, sizeof(cmd));
  588. // TODO: handle timestamp
  589. if (sequence_id < wc->chart_sequence_id || !sequence_id) { // || created_at != wc->chart_timestamp) {
  590. log_access("AC [%s (%s)]: Reset streaming charts from sequence %"PRIu64 \
  591. " t=%ld (reset count=%d)", wc->node_id, wc->host ? wc->host->hostname : "N/A", wc->chart_sequence_id,
  592. wc->chart_timestamp, wc->chart_reset_count);
  593. cmd.opcode = ACLK_DATABASE_RESET_CHART;
  594. cmd.param1 = sequence_id + 1;
  595. cmd.completion = NULL;
  596. aclk_database_enq_cmd(wc, &cmd);
  597. }
  598. else {
  599. log_access("AC [%s (%s)]: Start streaming charts enabled -- last streamed sequence %"PRIu64 \
  600. " t=%ld (reset count=%d)", wc->node_id, wc->host ? wc->host->hostname : "N/A", wc->chart_sequence_id,
  601. wc->chart_timestamp, wc->chart_reset_count);
  602. wc->chart_reset_count = 0;
  603. wc->chart_updates = 1;
  604. }
  605. }
  606. }
  607. else
  608. log_access("AC [%s (%s)]: ACLK synchronization thread is not active.", wc->node_id, wc->host ? wc->host->hostname : "N/A");
  609. return;
  610. }
  611. host = host->next;
  612. }
  613. rrd_unlock();
  614. return;
  615. }
  616. #define SQL_SELECT_HOST_MEMORY_MODE "SELECT memory_mode FROM chart WHERE host_id = @host_id LIMIT 1;"
  617. static RRD_MEMORY_MODE sql_get_host_memory_mode(uuid_t *host_id)
  618. {
  619. int rc;
  620. RRD_MEMORY_MODE memory_mode = RRD_MEMORY_MODE_RAM;
  621. sqlite3_stmt *res = NULL;
  622. rc = sqlite3_prepare_v2(db_meta, SQL_SELECT_HOST_MEMORY_MODE, -1, &res, 0);
  623. if (unlikely(rc != SQLITE_OK)) {
  624. error_report("Failed to prepare statement to read host memory mode");
  625. return memory_mode;
  626. }
  627. rc = sqlite3_bind_blob(res, 1, host_id, sizeof(*host_id), SQLITE_STATIC);
  628. if (unlikely(rc != SQLITE_OK)) {
  629. error_report("Failed to bind host parameter to fetch host memory mode");
  630. goto failed;
  631. }
  632. while (sqlite3_step(res) == SQLITE_ROW) {
  633. memory_mode = (RRD_MEMORY_MODE) sqlite3_column_int(res, 0);
  634. }
  635. failed:
  636. rc = sqlite3_finalize(res);
  637. if (unlikely(rc != SQLITE_OK))
  638. error_report("Failed to finalize the prepared statement when reading host memory mode");
  639. return memory_mode;
  640. }
  641. #define SELECT_HOST_DIMENSION_LIST "SELECT d.dim_id, c.update_every, c.type||'.'||c.id, d.id, d.name FROM chart c, dimension d " \
  642. "WHERE d.chart_id = c.chart_id AND c.host_id = @host_id ORDER BY c.update_every ASC;"
  643. #define SELECT_HOST_CHART_LIST "SELECT distinct h.host_id, c.update_every, c.type||'.'||c.id FROM chart c, host h " \
  644. "WHERE c.host_id = h.host_id AND c.host_id = @host_id ORDER BY c.update_every ASC;"
  645. void aclk_update_retention(struct aclk_database_worker_config *wc, struct aclk_database_cmd cmd)
  646. {
  647. UNUSED(cmd);
  648. int rc;
  649. if (!aclk_use_new_cloud_arch || !aclk_connected)
  650. return;
  651. char *claim_id = is_agent_claimed();
  652. if (unlikely(!claim_id))
  653. return;
  654. sqlite3_stmt *res = NULL;
  655. RRD_MEMORY_MODE memory_mode;
  656. uuid_t host_uuid;
  657. rc = uuid_parse(wc->host_guid, host_uuid);
  658. if (unlikely(rc)) {
  659. freez(claim_id);
  660. return;
  661. }
  662. if (wc->host)
  663. memory_mode = wc->host->rrd_memory_mode;
  664. else
  665. memory_mode = sql_get_host_memory_mode(&host_uuid);
  666. if (memory_mode == RRD_MEMORY_MODE_DBENGINE)
  667. rc = sqlite3_prepare_v2(db_meta, SELECT_HOST_DIMENSION_LIST, -1, &res, 0);
  668. else
  669. rc = sqlite3_prepare_v2(db_meta, SELECT_HOST_CHART_LIST, -1, &res, 0);
  670. if (unlikely(rc != SQLITE_OK)) {
  671. error_report("Failed to prepare statement to fetch host dimensions");
  672. freez(claim_id);
  673. return;
  674. }
  675. rc = sqlite3_bind_blob(res, 1, &host_uuid, sizeof(host_uuid), SQLITE_STATIC);
  676. if (unlikely(rc != SQLITE_OK)) {
  677. error_report("Failed to bind host parameter to fetch host dimensions");
  678. goto failed;
  679. }
  680. time_t start_time = LONG_MAX;
  681. time_t first_entry_t;
  682. time_t last_entry_t;
  683. uint32_t update_every = 0;
  684. struct retention_updated rotate_data;
  685. memset(&rotate_data, 0, sizeof(rotate_data));
  686. int max_intervals = 32;
  687. rotate_data.interval_duration_count = 0;
  688. rotate_data.interval_durations = callocz(max_intervals, sizeof(*rotate_data.interval_durations));
  689. now_realtime_timeval(&rotate_data.rotation_timestamp);
  690. rotate_data.memory_mode = memory_mode;
  691. rotate_data.claim_id = claim_id;
  692. rotate_data.node_id = strdupz(wc->node_id);
  693. // time_t now = now_realtime_sec();
  694. while (sqlite3_step(res) == SQLITE_ROW) {
  695. if (!update_every || update_every != (uint32_t) sqlite3_column_int(res, 1)) {
  696. if (update_every) {
  697. debug(D_ACLK_SYNC,"Update %s for %u oldest time = %ld", wc->host_guid, update_every, start_time);
  698. if (start_time == LONG_MAX)
  699. rotate_data.interval_durations[rotate_data.interval_duration_count].retention = 0;
  700. else
  701. rotate_data.interval_durations[rotate_data.interval_duration_count].retention =
  702. rotate_data.rotation_timestamp.tv_sec - start_time;
  703. rotate_data.interval_duration_count++;
  704. }
  705. update_every = (uint32_t) sqlite3_column_int(res, 1);
  706. rotate_data.interval_durations[rotate_data.interval_duration_count].update_every = update_every;
  707. start_time = LONG_MAX;
  708. }
  709. #ifdef ENABLE_DBENGINE
  710. if (memory_mode == RRD_MEMORY_MODE_DBENGINE)
  711. rc = rrdeng_metric_latest_time_by_uuid((uuid_t *)sqlite3_column_blob(res, 0), &first_entry_t, &last_entry_t);
  712. else
  713. #endif
  714. {
  715. if (wc->host) {
  716. RRDSET *st = NULL;
  717. rc = (st = rrdset_find(wc->host, (const char *)sqlite3_column_text(res, 2))) ? 0 : 1;
  718. if (!rc) {
  719. first_entry_t = rrdset_first_entry_t(st);
  720. last_entry_t = rrdset_last_entry_t(st);
  721. }
  722. }
  723. else {
  724. rc = 0;
  725. first_entry_t = rotate_data.rotation_timestamp.tv_sec;
  726. }
  727. }
  728. if (likely(!rc && first_entry_t))
  729. start_time = MIN(start_time, first_entry_t);
  730. }
  731. if (update_every) {
  732. debug(D_ACLK_SYNC, "Update %s for %u oldest time = %ld", wc->host_guid, update_every, start_time);
  733. if (start_time == LONG_MAX)
  734. rotate_data.interval_durations[rotate_data.interval_duration_count].retention = 0;
  735. else
  736. rotate_data.interval_durations[rotate_data.interval_duration_count].retention =
  737. rotate_data.rotation_timestamp.tv_sec - start_time;
  738. rotate_data.interval_duration_count++;
  739. }
  740. #ifdef NETDATA_INTERNAL_CHECKS
  741. for (int i = 0; i < rotate_data.interval_duration_count; ++i)
  742. info("Update for host %s (node %s) for %u Retention = %u", wc->host_guid, wc->node_id,
  743. rotate_data.interval_durations[i].update_every, rotate_data.interval_durations[i].retention);
  744. #endif
  745. aclk_retention_updated(&rotate_data);
  746. freez(rotate_data.node_id);
  747. freez(rotate_data.interval_durations);
  748. failed:
  749. freez(claim_id);
  750. rc = sqlite3_finalize(res);
  751. if (unlikely(rc != SQLITE_OK))
  752. error_report("Failed to finalize the prepared statement when reading host dimensions");
  753. return;
  754. }
  755. uint32_t sql_get_pending_count(struct aclk_database_worker_config *wc)
  756. {
  757. BUFFER *sql = buffer_create(1024);
  758. sqlite3_stmt *res = NULL;
  759. buffer_sprintf(sql,"SELECT count(1) FROM aclk_chart_%s ac WHERE ac.date_submitted IS NULL;", wc->uuid_str);
  760. int rc;
  761. uint32_t chart_payload_count = 0;
  762. rc = sqlite3_prepare_v2(db_meta, buffer_tostring(sql), -1, &res, 0);
  763. if (rc != SQLITE_OK) {
  764. error_report("Failed to prepare statement to count pending messages");
  765. goto fail;
  766. }
  767. while (sqlite3_step(res) == SQLITE_ROW)
  768. chart_payload_count = (uint32_t) sqlite3_column_int(res, 0);
  769. rc = sqlite3_finalize(res);
  770. if (unlikely(rc != SQLITE_OK))
  771. error_report("Failed to reset statement when fetching pending messages, rc = %d", rc);
  772. fail:
  773. buffer_free(sql);
  774. return chart_payload_count;
  775. }
  776. void sql_get_last_chart_sequence(struct aclk_database_worker_config *wc)
  777. {
  778. BUFFER *sql = buffer_create(1024);
  779. buffer_sprintf(sql,"SELECT ac.sequence_id, ac.date_created FROM aclk_chart_%s ac " \
  780. "WHERE ac.date_submitted IS NOT NULL ORDER BY ac.sequence_id DESC LIMIT 1;", wc->uuid_str);
  781. int rc;
  782. sqlite3_stmt *res = NULL;
  783. rc = sqlite3_prepare_v2(db_meta, buffer_tostring(sql), -1, &res, 0);
  784. if (rc != SQLITE_OK) {
  785. error_report("Failed to prepare statement to find last chart sequence id");
  786. goto fail;
  787. }
  788. wc->chart_sequence_id = 0;
  789. wc->chart_timestamp = 0;
  790. while (sqlite3_step(res) == SQLITE_ROW) {
  791. wc->chart_sequence_id = (uint64_t) sqlite3_column_int64(res, 0);
  792. wc->chart_timestamp = (time_t) sqlite3_column_int64(res, 1);
  793. }
  794. debug(D_ACLK_SYNC,"Node %s reports last sequence_id=%"PRIu64, wc->node_id, wc->chart_sequence_id);
  795. rc = sqlite3_finalize(res);
  796. if (unlikely(rc != SQLITE_OK))
  797. error_report("Failed to reset statement when fetching chart sequence info, rc = %d", rc);
  798. fail:
  799. buffer_free(sql);
  800. return;
  801. }
  802. int queue_dimension_to_aclk(RRDDIM *rd)
  803. {
  804. int rc = sql_queue_chart_payload((struct aclk_database_worker_config *) rd->rrdset->rrdhost->dbsync_worker,
  805. rd, ACLK_DATABASE_ADD_DIMENSION);
  806. return rc;
  807. }
  808. #endif //ENABLE_NEW_CLOUD_PROTOCOL
  809. // ST is read locked
  810. int queue_chart_to_aclk(RRDSET *st)
  811. {
  812. #ifndef ENABLE_NEW_CLOUD_PROTOCOL
  813. #ifdef ENABLE_ACLK
  814. aclk_update_chart(st->rrdhost, st->id, 1);
  815. #endif
  816. return 0;
  817. #else
  818. if (!aclk_use_new_cloud_arch && aclk_connected) {
  819. aclk_update_chart(st->rrdhost, st->id, 1);
  820. return 0;
  821. }
  822. return sql_queue_chart_payload((struct aclk_database_worker_config *) st->rrdhost->dbsync_worker,
  823. st, ACLK_DATABASE_ADD_CHART);
  824. #endif
  825. }