buffer.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515
  1. // SPDX-License-Identifier: GPL-3.0-or-later
  2. #include "../libnetdata.h"
  3. static inline void buffer_overflow_init(BUFFER *b)
  4. {
  5. b->buffer[b->size] = '\0';
  6. strcpy(&b->buffer[b->size + 1], BUFFER_OVERFLOW_EOF);
  7. }
  8. void buffer_reset(BUFFER *wb) {
  9. buffer_flush(wb);
  10. wb->content_type = CT_TEXT_PLAIN;
  11. wb->options = 0;
  12. wb->date = 0;
  13. wb->expires = 0;
  14. buffer_overflow_check(wb);
  15. }
  16. const char *buffer_tostring(BUFFER *wb)
  17. {
  18. buffer_need_bytes(wb, 1);
  19. wb->buffer[wb->len] = '\0';
  20. buffer_overflow_check(wb);
  21. return(wb->buffer);
  22. }
  23. void buffer_char_replace(BUFFER *wb, char from, char to) {
  24. char *s = wb->buffer, *end = &wb->buffer[wb->len];
  25. while(s != end) {
  26. if(*s == from) *s = to;
  27. s++;
  28. }
  29. buffer_overflow_check(wb);
  30. }
  31. void buffer_print_sn_flags(BUFFER *wb, SN_FLAGS flags, bool send_anomaly_bit) {
  32. if(unlikely(flags == SN_EMPTY_SLOT)) {
  33. buffer_fast_strcat(wb, "E", 1);
  34. return;
  35. }
  36. size_t printed = 0;
  37. if(likely(send_anomaly_bit && (flags & SN_FLAG_NOT_ANOMALOUS))) {
  38. buffer_fast_strcat(wb, "A", 1);
  39. printed++;
  40. }
  41. if(unlikely(flags & SN_FLAG_RESET)) {
  42. buffer_fast_strcat(wb, "R", 1);
  43. printed++;
  44. }
  45. if(!printed)
  46. buffer_fast_strcat(wb, "''", 2);
  47. }
  48. void buffer_strcat_htmlescape(BUFFER *wb, const char *txt)
  49. {
  50. while(*txt) {
  51. switch(*txt) {
  52. case '&': buffer_strcat(wb, "&"); break;
  53. case '<': buffer_strcat(wb, "&lt;"); break;
  54. case '>': buffer_strcat(wb, "&gt;"); break;
  55. case '"': buffer_strcat(wb, "&quot;"); break;
  56. case '/': buffer_strcat(wb, "&#x2F;"); break;
  57. case '\'': buffer_strcat(wb, "&#x27;"); break;
  58. default: {
  59. buffer_need_bytes(wb, 1);
  60. wb->buffer[wb->len++] = *txt;
  61. }
  62. }
  63. txt++;
  64. }
  65. buffer_overflow_check(wb);
  66. }
  67. void buffer_snprintf(BUFFER *wb, size_t len, const char *fmt, ...)
  68. {
  69. if(unlikely(!fmt || !*fmt)) return;
  70. buffer_need_bytes(wb, len + 1);
  71. va_list args;
  72. va_start(args, fmt);
  73. wb->len += vsnprintfz(&wb->buffer[wb->len], len, fmt, args);
  74. va_end(args);
  75. buffer_overflow_check(wb);
  76. // the buffer is \0 terminated by vsnprintfz
  77. }
  78. void buffer_vsprintf(BUFFER *wb, const char *fmt, va_list args)
  79. {
  80. if(unlikely(!fmt || !*fmt)) return;
  81. size_t wrote = 0, need = 2, space_remaining = 0;
  82. do {
  83. need += space_remaining * 2;
  84. netdata_log_debug(D_WEB_BUFFER, "web_buffer_sprintf(): increasing web_buffer at position %zu, size = %zu, by %zu bytes (wrote = %zu)\n", wb->len, wb->size, need, wrote);
  85. buffer_need_bytes(wb, need);
  86. space_remaining = wb->size - wb->len - 1;
  87. wrote = (size_t) vsnprintfz(&wb->buffer[wb->len], space_remaining, fmt, args);
  88. } while(wrote >= space_remaining);
  89. wb->len += wrote;
  90. // the buffer is \0 terminated by vsnprintf
  91. }
  92. void buffer_sprintf(BUFFER *wb, const char *fmt, ...)
  93. {
  94. if(unlikely(!fmt || !*fmt)) return;
  95. va_list args;
  96. size_t wrote = 0, need = 2, space_remaining = 0;
  97. do {
  98. need += space_remaining * 2;
  99. netdata_log_debug(D_WEB_BUFFER, "web_buffer_sprintf(): increasing web_buffer at position %zu, size = %zu, by %zu bytes (wrote = %zu)\n", wb->len, wb->size, need, wrote);
  100. buffer_need_bytes(wb, need);
  101. space_remaining = wb->size - wb->len - 1;
  102. va_start(args, fmt);
  103. wrote = (size_t) vsnprintfz(&wb->buffer[wb->len], space_remaining, fmt, args);
  104. va_end(args);
  105. } while(wrote >= space_remaining);
  106. wb->len += wrote;
  107. // the buffer is \0 terminated by vsnprintf
  108. }
  109. // generate a javascript date, the fastest possible way...
  110. void buffer_jsdate(BUFFER *wb, int year, int month, int day, int hours, int minutes, int seconds)
  111. {
  112. // 10 20 30 = 35
  113. // 01234567890123456789012345678901234
  114. // Date(2014,04,01,03,28,20)
  115. buffer_need_bytes(wb, 30);
  116. char *b = &wb->buffer[wb->len], *p;
  117. unsigned int *q = (unsigned int *)b;
  118. #if __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__
  119. *q++ = 0x65746144; // "Date" backwards.
  120. #else
  121. *q++ = 0x44617465; // "Date"
  122. #endif
  123. p = (char *)q;
  124. *p++ = '(';
  125. *p++ = '0' + year / 1000; year %= 1000;
  126. *p++ = '0' + year / 100; year %= 100;
  127. *p++ = '0' + year / 10;
  128. *p++ = '0' + year % 10;
  129. *p++ = ',';
  130. *p = '0' + month / 10; if (*p != '0') p++;
  131. *p++ = '0' + month % 10;
  132. *p++ = ',';
  133. *p = '0' + day / 10; if (*p != '0') p++;
  134. *p++ = '0' + day % 10;
  135. *p++ = ',';
  136. *p = '0' + hours / 10; if (*p != '0') p++;
  137. *p++ = '0' + hours % 10;
  138. *p++ = ',';
  139. *p = '0' + minutes / 10; if (*p != '0') p++;
  140. *p++ = '0' + minutes % 10;
  141. *p++ = ',';
  142. *p = '0' + seconds / 10; if (*p != '0') p++;
  143. *p++ = '0' + seconds % 10;
  144. unsigned short *r = (unsigned short *)p;
  145. #if __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__
  146. *r++ = 0x0029; // ")\0" backwards.
  147. #else
  148. *r++ = 0x2900; // ")\0"
  149. #endif
  150. wb->len += (size_t)((char *)r - b - 1);
  151. // terminate it
  152. wb->buffer[wb->len] = '\0';
  153. buffer_overflow_check(wb);
  154. }
  155. // generate a date, the fastest possible way...
  156. void buffer_date(BUFFER *wb, int year, int month, int day, int hours, int minutes, int seconds)
  157. {
  158. // 10 20 30 = 35
  159. // 01234567890123456789012345678901234
  160. // 2014-04-01 03:28:20
  161. buffer_need_bytes(wb, 36);
  162. char *b = &wb->buffer[wb->len];
  163. char *p = b;
  164. *p++ = '0' + year / 1000; year %= 1000;
  165. *p++ = '0' + year / 100; year %= 100;
  166. *p++ = '0' + year / 10;
  167. *p++ = '0' + year % 10;
  168. *p++ = '-';
  169. *p++ = '0' + month / 10;
  170. *p++ = '0' + month % 10;
  171. *p++ = '-';
  172. *p++ = '0' + day / 10;
  173. *p++ = '0' + day % 10;
  174. *p++ = ' ';
  175. *p++ = '0' + hours / 10;
  176. *p++ = '0' + hours % 10;
  177. *p++ = ':';
  178. *p++ = '0' + minutes / 10;
  179. *p++ = '0' + minutes % 10;
  180. *p++ = ':';
  181. *p++ = '0' + seconds / 10;
  182. *p++ = '0' + seconds % 10;
  183. *p = '\0';
  184. wb->len += (size_t)(p - b);
  185. // terminate it
  186. wb->buffer[wb->len] = '\0';
  187. buffer_overflow_check(wb);
  188. }
  189. BUFFER *buffer_create(size_t size, size_t *statistics)
  190. {
  191. BUFFER *b;
  192. netdata_log_debug(D_WEB_BUFFER, "Creating new web buffer of size %zu.", size);
  193. b = callocz(1, sizeof(BUFFER));
  194. b->buffer = mallocz(size + sizeof(BUFFER_OVERFLOW_EOF) + 2);
  195. b->buffer[0] = '\0';
  196. b->size = size;
  197. b->content_type = CT_TEXT_PLAIN;
  198. b->statistics = statistics;
  199. buffer_overflow_init(b);
  200. buffer_overflow_check(b);
  201. if(b->statistics)
  202. __atomic_add_fetch(b->statistics, b->size + sizeof(BUFFER) + sizeof(BUFFER_OVERFLOW_EOF) + 2, __ATOMIC_RELAXED);
  203. return(b);
  204. }
  205. void buffer_free(BUFFER *b) {
  206. if(unlikely(!b)) return;
  207. buffer_overflow_check(b);
  208. netdata_log_debug(D_WEB_BUFFER, "Freeing web buffer of size %zu.", b->size);
  209. if(b->statistics)
  210. __atomic_sub_fetch(b->statistics, b->size + sizeof(BUFFER) + sizeof(BUFFER_OVERFLOW_EOF) + 2, __ATOMIC_RELAXED);
  211. freez(b->buffer);
  212. freez(b);
  213. }
  214. void buffer_increase(BUFFER *b, size_t free_size_required) {
  215. buffer_overflow_check(b);
  216. size_t left = b->size - b->len;
  217. if(left >= free_size_required) return;
  218. size_t wanted = free_size_required - left;
  219. size_t minimum = WEB_DATA_LENGTH_INCREASE_STEP;
  220. if(minimum > wanted) wanted = minimum;
  221. size_t optimal = (b->size > 5*1024*1024) ? b->size / 2 : b->size;
  222. if(optimal > wanted) wanted = optimal;
  223. netdata_log_debug(D_WEB_BUFFER, "Increasing data buffer from size %zu to %zu.", b->size, b->size + wanted);
  224. b->buffer = reallocz(b->buffer, b->size + wanted + sizeof(BUFFER_OVERFLOW_EOF) + 2);
  225. b->size += wanted;
  226. if(b->statistics)
  227. __atomic_add_fetch(b->statistics, wanted, __ATOMIC_RELAXED);
  228. buffer_overflow_init(b);
  229. buffer_overflow_check(b);
  230. }
  231. // ----------------------------------------------------------------------------
  232. void buffer_json_initialize(BUFFER *wb, const char *key_quote, const char *value_quote, int depth,
  233. bool add_anonymous_object, bool minify) {
  234. strncpyz(wb->json.key_quote, key_quote, BUFFER_QUOTE_MAX_SIZE);
  235. strncpyz(wb->json.value_quote, value_quote, BUFFER_QUOTE_MAX_SIZE);
  236. wb->json.minify = minify;
  237. wb->json.depth = (int8_t)(depth - 1);
  238. _buffer_json_depth_push(wb, BUFFER_JSON_OBJECT);
  239. if(add_anonymous_object)
  240. buffer_fast_strcat(wb, "{", 1);
  241. wb->content_type = CT_APPLICATION_JSON;
  242. }
  243. void buffer_json_finalize(BUFFER *wb) {
  244. while(wb->json.depth >= 0) {
  245. switch(wb->json.stack[wb->json.depth].type) {
  246. case BUFFER_JSON_OBJECT:
  247. buffer_json_object_close(wb);
  248. break;
  249. case BUFFER_JSON_ARRAY:
  250. buffer_json_array_close(wb);
  251. break;
  252. default:
  253. internal_fatal(true, "BUFFER: unknown json member type in stack");
  254. break;
  255. }
  256. }
  257. if(!wb->json.minify)
  258. buffer_fast_strcat(wb, "\n", 1);
  259. }
  260. // ----------------------------------------------------------------------------
  // Digit alphabets (deliberately sized without room for a terminating '\0')
  // and their reverse lookup tables, indexed by character code.
  const char hex_digits[16] = "0123456789ABCDEF";
  const char base64_digits[64] = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
  unsigned char hex_value_from_ascii[256];
  unsigned char base64_value_from_ascii[256];

  // Runs automatically at load time (constructor attribute).
  // Every entry of both reverse tables is first set to 255 (meaning "not a digit"),
  // then each digit of the two alphabets is mapped to its position.
  __attribute__((constructor)) void initialize_ascii_maps(void) {
      size_t code = 256;
      while(code-- > 0) {
          hex_value_from_ascii[code] = 255;
          base64_value_from_ascii[code] = 255;
      }

      for(size_t pos = 0; pos < sizeof(base64_digits); pos++) {
          if(pos < sizeof(hex_digits))
              hex_value_from_ascii[(int)hex_digits[pos]] = pos;

          base64_value_from_ascii[(int)base64_digits[pos]] = pos;
      }
  }
  275. // ----------------------------------------------------------------------------
  276. // unit test
  277. static int buffer_expect(BUFFER *wb, const char *expected) {
  278. const char *generated = buffer_tostring(wb);
  279. if(strcmp(generated, expected) != 0) {
  280. netdata_log_error("BUFFER: mismatch.\nGenerated:\n%s\nExpected:\n%s\n",
  281. generated, expected);
  282. return 1;
  283. }
  284. return 0;
  285. }
  286. static int buffer_uint64_roundtrip(BUFFER *wb, NUMBER_ENCODING encoding, uint64_t value, const char *expected) {
  287. int errors = 0;
  288. buffer_flush(wb);
  289. buffer_print_uint64_encoded(wb, encoding, value);
  290. if(expected)
  291. errors += buffer_expect(wb, expected);
  292. uint64_t v = str2ull_encoded(buffer_tostring(wb));
  293. if(v != value) {
  294. netdata_log_error("BUFFER: string '%s' does resolves to %llu, expected %llu",
  295. buffer_tostring(wb), (unsigned long long)v, (unsigned long long)value);
  296. errors++;
  297. }
  298. buffer_flush(wb);
  299. return errors;
  300. }
  301. static int buffer_int64_roundtrip(BUFFER *wb, NUMBER_ENCODING encoding, int64_t value, const char *expected) {
  302. int errors = 0;
  303. buffer_flush(wb);
  304. buffer_print_int64_encoded(wb, encoding, value);
  305. if(expected)
  306. errors += buffer_expect(wb, expected);
  307. int64_t v = str2ll_encoded(buffer_tostring(wb));
  308. if(v != value) {
  309. netdata_log_error("BUFFER: string '%s' does resolves to %lld, expected %lld",
  310. buffer_tostring(wb), (long long)v, (long long)value);
  311. errors++;
  312. }
  313. buffer_flush(wb);
  314. return errors;
  315. }
  316. static int buffer_double_roundtrip(BUFFER *wb, NUMBER_ENCODING encoding, NETDATA_DOUBLE value, const char *expected) {
  317. int errors = 0;
  318. buffer_flush(wb);
  319. buffer_print_netdata_double_encoded(wb, encoding, value);
  320. if(expected)
  321. errors += buffer_expect(wb, expected);
  322. NETDATA_DOUBLE v = str2ndd_encoded(buffer_tostring(wb), NULL);
  323. if(v != value) {
  324. netdata_log_error("BUFFER: string '%s' does resolves to %.12f, expected %.12f",
  325. buffer_tostring(wb), v, value);
  326. errors++;
  327. }
  328. buffer_flush(wb);
  329. return errors;
  330. }
  331. int buffer_unittest(void) {
  332. int errors = 0;
  333. BUFFER *wb = buffer_create(0, NULL);
  334. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 0, "0");
  335. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_HEX, 0, "0x0");
  336. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_BASE64, 0, "#A");
  337. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 1676071986, "1676071986");
  338. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_HEX, 1676071986, "0x63E6D432");
  339. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_BASE64, 1676071986, "#Bj5tQy");
  340. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 18446744073709551615ULL, "18446744073709551615");
  341. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_HEX, 18446744073709551615ULL, "0xFFFFFFFFFFFFFFFF");
  342. buffer_uint64_roundtrip(wb, NUMBER_ENCODING_BASE64, 18446744073709551615ULL, "#P//////////");
  343. buffer_int64_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 0, "0");
  344. buffer_int64_roundtrip(wb, NUMBER_ENCODING_HEX, 0, "0x0");
  345. buffer_int64_roundtrip(wb, NUMBER_ENCODING_BASE64, 0, "#A");
  346. buffer_int64_roundtrip(wb, NUMBER_ENCODING_DECIMAL, -1676071986, "-1676071986");
  347. buffer_int64_roundtrip(wb, NUMBER_ENCODING_HEX, -1676071986, "-0x63E6D432");
  348. buffer_int64_roundtrip(wb, NUMBER_ENCODING_BASE64, -1676071986, "-#Bj5tQy");
  349. buffer_int64_roundtrip(wb, NUMBER_ENCODING_DECIMAL, (int64_t)-9223372036854775807ULL, "-9223372036854775807");
  350. buffer_int64_roundtrip(wb, NUMBER_ENCODING_HEX, (int64_t)-9223372036854775807ULL, "-0x7FFFFFFFFFFFFFFF");
  351. buffer_int64_roundtrip(wb, NUMBER_ENCODING_BASE64, (int64_t)-9223372036854775807ULL, "-#H//////////");
  352. buffer_double_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 0, "0");
  353. buffer_double_roundtrip(wb, NUMBER_ENCODING_HEX, 0, "%0");
  354. buffer_double_roundtrip(wb, NUMBER_ENCODING_BASE64, 0, "@A");
  355. buffer_double_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 1.5, "1.5");
  356. buffer_double_roundtrip(wb, NUMBER_ENCODING_HEX, 1.5, "%3FF8000000000000");
  357. buffer_double_roundtrip(wb, NUMBER_ENCODING_BASE64, 1.5, "@D/4AAAAAAAA");
  358. buffer_double_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 1.23e+14, "123000000000000");
  359. buffer_double_roundtrip(wb, NUMBER_ENCODING_HEX, 1.23e+14, "%42DBF78AD3AC0000");
  360. buffer_double_roundtrip(wb, NUMBER_ENCODING_BASE64, 1.23e+14, "@ELb94rTrAAA");
  361. buffer_double_roundtrip(wb, NUMBER_ENCODING_DECIMAL, 9.12345678901234567890123456789e+45, "9.123456789012346128e+45");
  362. buffer_double_roundtrip(wb, NUMBER_ENCODING_HEX, 9.12345678901234567890123456789e+45, "%497991C25C9E4309");
  363. buffer_double_roundtrip(wb, NUMBER_ENCODING_BASE64, 9.12345678901234567890123456789e+45, "@El5kcJcnkMJ");
  364. buffer_flush(wb);
  365. {
  366. char buf[1024 + 1];
  367. for(size_t i = 0; i < 1024 ;i++)
  368. buf[i] = (char)(i % 26) + 'A';
  369. buf[1024] = '\0';
  370. buffer_strcat(wb, buf);
  371. errors += buffer_expect(wb, buf);
  372. }
  373. buffer_flush(wb);
  374. buffer_json_initialize(wb, "\"", "\"", 0, true, false);
  375. buffer_json_finalize(wb);
  376. errors += buffer_expect(wb, "{\n}\n");
  377. buffer_flush(wb);
  378. buffer_json_initialize(wb, "\"", "\"", 0, true, false);
  379. buffer_json_member_add_string(wb, "hello", "world");
  380. buffer_json_member_add_string(wb, "alpha", "this: \" is a double quote");
  381. buffer_json_member_add_object(wb, "object1");
  382. buffer_json_member_add_string(wb, "hello", "world");
  383. buffer_json_finalize(wb);
  384. errors += buffer_expect(wb, "{\n \"hello\":\"world\",\n \"alpha\":\"this: \\\" is a double quote\",\n \"object1\":{\n \"hello\":\"world\"\n }\n}\n");
  385. buffer_free(wb);
  386. return errors;
  387. }
  388. #ifdef ENABLE_H2O
  389. h2o_iovec_t buffer_to_h2o_iovec(BUFFER *wb) {
  390. h2o_iovec_t ret;
  391. ret.base = wb->buffer;
  392. ret.len = wb->len;
  393. return ret;
  394. }
  395. #endif