compression.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322
  1. #include "rrdpush.h"
  2. #ifdef ENABLE_COMPRESSION
  3. #include "lz4.h"
  4. #define STREAM_COMPRESSION_MSG "STREAM_COMPRESSION"
  5. // signature MUST end with a newline
  6. #define SIGNATURE ((uint32_t)('z' | 0x80) | (0x80 << 8) | (0x80 << 16) | ('\n' << 24))
  7. #define SIGNATURE_MASK ((uint32_t)0xff | (0x80 << 8) | (0x80 << 16) | (0xff << 24))
  8. #define SIGNATURE_SIZE 4
  9. /*
  10. * LZ4 streaming API compressor specific data
  11. */
  12. struct compressor_data {
  13. LZ4_stream_t *stream;
  14. char *input_ring_buffer;
  15. size_t input_ring_buffer_size;
  16. size_t input_ring_buffer_pos;
  17. };
  18. /*
  19. * Reset compressor state for a new stream
  20. */
  21. static void lz4_compressor_reset(struct compressor_state *state)
  22. {
  23. if (state->data) {
  24. if (state->data->stream) {
  25. LZ4_resetStream_fast(state->data->stream);
  26. internal_error(true, "%s: compressor reset", STREAM_COMPRESSION_MSG);
  27. }
  28. state->data->input_ring_buffer_pos = 0;
  29. }
  30. }
  31. /*
  32. * Destroy compressor state and all related data
  33. */
  34. static void lz4_compressor_destroy(struct compressor_state **state)
  35. {
  36. if (state && *state) {
  37. struct compressor_state *s = *state;
  38. if (s->data) {
  39. if (s->data->stream)
  40. LZ4_freeStream(s->data->stream);
  41. freez(s->data->input_ring_buffer);
  42. freez(s->data);
  43. }
  44. freez(s->compression_result_buffer);
  45. freez(s);
  46. *state = NULL;
  47. debug(D_STREAM, "%s: Compressor Destroyed.", STREAM_COMPRESSION_MSG);
  48. }
  49. }
  50. /*
  51. * Compress the given block of data
  52. * Compressed data will remain in the internal buffer until the next invocation
  53. * Return the size of compressed data block as result and the pointer to internal buffer using the last argument
  54. * or 0 in case of error
  55. */
  56. static size_t lz4_compressor_compress(struct compressor_state *state, const char *data, size_t size, char **out)
  57. {
  58. if(unlikely(!state || !size || !out))
  59. return 0;
  60. if(unlikely(size > COMPRESSION_MAX_MSG_SIZE)) {
  61. error("%s: Compression Failed - Message size %lu above compression buffer limit: %d", STREAM_COMPRESSION_MSG, (long unsigned int)size, COMPRESSION_MAX_MSG_SIZE);
  62. return 0;
  63. }
  64. size_t max_dst_size = LZ4_COMPRESSBOUND(size);
  65. size_t data_size = max_dst_size + SIGNATURE_SIZE;
  66. if (!state->compression_result_buffer) {
  67. state->compression_result_buffer = mallocz(data_size);
  68. state->compression_result_buffer_size = data_size;
  69. }
  70. else if(unlikely(state->compression_result_buffer_size < data_size)) {
  71. state->compression_result_buffer = reallocz(state->compression_result_buffer, data_size);
  72. state->compression_result_buffer_size = data_size;
  73. }
  74. // the ring buffer always has space for LZ4_MAX_MSG_SIZE
  75. memcpy(state->data->input_ring_buffer + state->data->input_ring_buffer_pos, data, size);
  76. // this call needs the last 64K of our previous data
  77. // they are available in the ring buffer
  78. long int compressed_data_size = LZ4_compress_fast_continue(
  79. state->data->stream,
  80. state->data->input_ring_buffer + state->data->input_ring_buffer_pos,
  81. state->compression_result_buffer + SIGNATURE_SIZE,
  82. size,
  83. max_dst_size,
  84. 1);
  85. if (compressed_data_size < 0) {
  86. error("Data compression error: %ld", compressed_data_size);
  87. return 0;
  88. }
  89. // update the next writing position of the ring buffer
  90. state->data->input_ring_buffer_pos += size;
  91. if(unlikely(state->data->input_ring_buffer_pos >= state->data->input_ring_buffer_size - COMPRESSION_MAX_MSG_SIZE))
  92. state->data->input_ring_buffer_pos = 0;
  93. // update the signature header
  94. uint32_t len = ((compressed_data_size & 0x7f) | 0x80 | (((compressed_data_size & (0x7f << 7)) << 1) | 0x8000)) << 8;
  95. *(uint32_t *)state->compression_result_buffer = len | SIGNATURE;
  96. *out = state->compression_result_buffer;
  97. debug(D_STREAM, "%s: Compressed data header: %ld", STREAM_COMPRESSION_MSG, compressed_data_size);
  98. return compressed_data_size + SIGNATURE_SIZE;
  99. }
  100. /*
  101. * Create and initialize compressor state
  102. * Return the pointer to compressor_state structure created
  103. */
  104. struct compressor_state *create_compressor()
  105. {
  106. struct compressor_state *state = callocz(1, sizeof(struct compressor_state));
  107. state->reset = lz4_compressor_reset;
  108. state->compress = lz4_compressor_compress;
  109. state->destroy = lz4_compressor_destroy;
  110. state->data = callocz(1, sizeof(struct compressor_data));
  111. state->data->stream = LZ4_createStream();
  112. state->data->input_ring_buffer_size = LZ4_DECODER_RING_BUFFER_SIZE(COMPRESSION_MAX_MSG_SIZE * 2);
  113. state->data->input_ring_buffer = callocz(1, state->data->input_ring_buffer_size);
  114. state->compression_result_buffer_size = 0;
  115. state->reset(state);
  116. debug(D_STREAM, "%s: Initialize streaming compression!", STREAM_COMPRESSION_MSG);
  117. return state;
  118. }
  119. /*
  120. * LZ4 streaming API decompressor specific data
  121. */
  122. struct decompressor_stream {
  123. LZ4_streamDecode_t *lz4_stream;
  124. char *buffer;
  125. size_t size;
  126. size_t write_at;
  127. size_t read_at;
  128. };
  129. /*
  130. * Reset decompressor state for a new stream
  131. */
  132. static void lz4_decompressor_reset(struct decompressor_state *state)
  133. {
  134. if (state->stream) {
  135. if (state->stream->lz4_stream)
  136. LZ4_setStreamDecode(state->stream->lz4_stream, NULL, 0);
  137. state->stream->write_at = 0;
  138. state->stream->read_at = 0;
  139. }
  140. }
  141. /*
  142. * Destroy decompressor state and all related data
  143. */
  144. static void lz4_decompressor_destroy(struct decompressor_state **state)
  145. {
  146. if (state && *state) {
  147. struct decompressor_state *s = *state;
  148. if (s->stream) {
  149. debug(D_STREAM, "%s: Destroying decompressor.", STREAM_COMPRESSION_MSG);
  150. if (s->stream->lz4_stream)
  151. LZ4_freeStreamDecode(s->stream->lz4_stream);
  152. freez(s->stream->buffer);
  153. freez(s->stream);
  154. }
  155. freez(s);
  156. *state = NULL;
  157. }
  158. }
  159. static size_t decode_compress_header(const char *data, size_t data_size) {
  160. if (unlikely(!data || !data_size))
  161. return 0;
  162. if (unlikely(data_size != SIGNATURE_SIZE))
  163. return 0;
  164. uint32_t sign = *(uint32_t *)data;
  165. if (unlikely((sign & SIGNATURE_MASK) != SIGNATURE))
  166. return 0;
  167. size_t length = ((sign >> 8) & 0x7f) | ((sign >> 9) & (0x7f << 7));
  168. return length;
  169. }
  170. /*
  171. * Start the collection of compressed data in an internal buffer
  172. * Return the size of compressed data or 0 for uncompressed data
  173. */
  174. static size_t lz4_decompressor_start(struct decompressor_state *state __maybe_unused, const char *header, size_t header_size) {
  175. if(unlikely(state->stream->read_at != state->stream->write_at))
  176. fatal("%s: asked to decompress new data, while there are unread data in the decompression buffer!"
  177. , STREAM_COMPRESSION_MSG);
  178. return decode_compress_header(header, header_size);
  179. }
  180. /*
  181. * Decompress the compressed data in the internal buffer
  182. * Return the size of uncompressed data or 0 for error
  183. */
  184. static size_t lz4_decompressor_decompress(struct decompressor_state *state, const char *compressed_data, size_t compressed_size) {
  185. if (unlikely(!state || !compressed_data || !compressed_size))
  186. return 0;
  187. if(unlikely(state->stream->read_at != state->stream->write_at))
  188. fatal("%s: asked to decompress new data, while there are unread data in the decompression buffer!"
  189. , STREAM_COMPRESSION_MSG);
  190. if (unlikely(state->stream->write_at >= state->stream->size / 2)) {
  191. state->stream->write_at = 0;
  192. state->stream->read_at = 0;
  193. }
  194. long int decompressed_size = LZ4_decompress_safe_continue(
  195. state->stream->lz4_stream
  196. , compressed_data
  197. , state->stream->buffer + state->stream->write_at
  198. , (int)compressed_size
  199. , (int)(state->stream->size - state->stream->write_at)
  200. );
  201. if (unlikely(decompressed_size < 0)) {
  202. error("%s: decompressor returned negative decompressed bytes: %ld", STREAM_COMPRESSION_MSG, decompressed_size);
  203. return 0;
  204. }
  205. if(unlikely(decompressed_size + state->stream->write_at > state->stream->size))
  206. fatal("%s: decompressor overflown the stream_buffer. size: %zu, pos: %zu, added: %ld, exceeding the buffer by %zu"
  207. , STREAM_COMPRESSION_MSG
  208. , state->stream->size
  209. , state->stream->write_at
  210. , decompressed_size
  211. , (size_t)(state->stream->write_at + decompressed_size - state->stream->size)
  212. );
  213. state->stream->write_at += decompressed_size;
  214. // statistics
  215. state->total_compressed += compressed_size + SIGNATURE_SIZE;
  216. state->total_uncompressed += decompressed_size;
  217. state->packet_count++;
  218. return decompressed_size;
  219. }
  220. /*
  221. * Return the size of uncompressed data left in the internal buffer or 0 for error
  222. */
  223. static size_t lz4_decompressor_decompressed_bytes_in_buffer(struct decompressor_state *state) {
  224. if(unlikely(state->stream->read_at > state->stream->write_at))
  225. fatal("%s: invalid read/write stream positions"
  226. , STREAM_COMPRESSION_MSG);
  227. return state->stream->write_at - state->stream->read_at;
  228. }
  229. /*
  230. * Fill the buffer provided with uncompressed data from the internal buffer
  231. * Return the size of uncompressed data copied or 0 for error
  232. */
  233. static size_t lz4_decompressor_get(struct decompressor_state *state, char *dst, size_t size) {
  234. if (unlikely(!state || !size || !dst))
  235. return 0;
  236. size_t remaining = lz4_decompressor_decompressed_bytes_in_buffer(state);
  237. if(unlikely(!remaining))
  238. return 0;
  239. size_t bytes_to_return = size;
  240. if(bytes_to_return > remaining)
  241. bytes_to_return = remaining;
  242. memcpy(dst, state->stream->buffer + state->stream->read_at, bytes_to_return);
  243. state->stream->read_at += bytes_to_return;
  244. if(unlikely(state->stream->read_at > state->stream->write_at))
  245. fatal("%s: invalid read/write stream positions"
  246. , STREAM_COMPRESSION_MSG);
  247. return bytes_to_return;
  248. }
  249. /*
  250. * Create and initialize decompressor state
  251. * Return the pointer to decompressor_state structure created
  252. */
  253. struct decompressor_state *create_decompressor()
  254. {
  255. struct decompressor_state *state = callocz(1, sizeof(struct decompressor_state));
  256. state->signature_size = SIGNATURE_SIZE;
  257. state->reset = lz4_decompressor_reset;
  258. state->start = lz4_decompressor_start;
  259. state->decompress = lz4_decompressor_decompress;
  260. state->get = lz4_decompressor_get;
  261. state->decompressed_bytes_in_buffer = lz4_decompressor_decompressed_bytes_in_buffer;
  262. state->destroy = lz4_decompressor_destroy;
  263. state->stream = callocz(1, sizeof(struct decompressor_stream));
  264. fatal_assert(state->stream);
  265. state->stream->lz4_stream = LZ4_createStreamDecode();
  266. state->stream->size = LZ4_decoderRingBufferSize(COMPRESSION_MAX_MSG_SIZE) * 2;
  267. state->stream->buffer = mallocz(state->stream->size);
  268. fatal_assert(state->stream->buffer);
  269. state->reset(state);
  270. debug(D_STREAM, "%s: Initialize streaming decompression!", STREAM_COMPRESSION_MSG);
  271. return state;
  272. }
  273. #endif