netdata/streaming/compression.h
Costa Tsaousis cd584e0357
ZSTD and GZIP/DEFLATE streaming support (#16268)
* move compression header to compression.h

* prototype with zstd compression

* updated capabilities

* no need for resetting compression

* left-over reset function

* use ZSTD_compressStream() instead of ZSTD_compressStream2() for backwards compatibility

* remove call to LZ4_decoderRingBufferSize()

* debug signature failures

* fix the buffers of lz4

* fix decoding of zstd

* detect compression based on initialization; prefer ZSTD over LZ4

* allow both lz4 and zstd

* initialize zstd streams

* define missing ZSTD_CLEVEL_DEFAULT

* log zero compressed size

* debug log

* flush compression buffer

* add sender compression statistics

* removed debugging messages

* do not fail if zstd is not available

* cleanup and buildinfo

* fix max message size, use zstd level 1, add compressio ratio reporting

* use compression level 1

* fix ratio title

* better compression error logs

* for backwards compatibility use buffers of COMPRESSION_MAX_CHUNK

* switch to default compression level

* additional streaming error conditions detection

* do not expose compression stats when compression is not enabled

* test for the right lz4 functions

* moved lz4 and zstd to their own files

* add gzip streaming compression

* gzip error handling

* added unittest for streaming compression

* eliminate a copy of the uncompressed data during zstd compression

* eliminate not needed zstd allocations

* cleanup

* decode gzip with Z_SYNC_FLUSH

* set the decoding gzip algorithm

* user configuration for compression levels and compression algorithms order

* fix exclusion of not preferred compressions

* remove now obsolete compression define, since gzip is always available

* rename compression algorithms order in stream.conf

* move common checks in compression.c

* cleanup

* backwards compatible error checking
2023-10-27 17:37:34 +03:00

172 lines
5.5 KiB
C

// SPDX-License-Identifier: GPL-3.0-or-later
#include "rrdpush.h"
#ifndef NETDATA_RRDPUSH_COMPRESSION_H
#define NETDATA_RRDPUSH_COMPRESSION_H 1
// signature MUST end with a newline
#if COMPRESSION_MAX_MSG_SIZE >= (COMPRESSION_MAX_CHUNK - COMPRESSION_MAX_OVERHEAD)
#error "COMPRESSION_MAX_MSG_SIZE >= (COMPRESSION_MAX_CHUNK - COMPRESSION_MAX_OVERHEAD)"
#endif
typedef uint32_t rrdpush_signature_t;
#define RRDPUSH_COMPRESSION_SIGNATURE ((rrdpush_signature_t)('z' | 0x80) | (0x80 << 8) | (0x80 << 16) | ('\n' << 24))
#define RRDPUSH_COMPRESSION_SIGNATURE_MASK ((rrdpush_signature_t)0xff | (0x80 << 8) | (0x80 << 16) | (0xff << 24))
#define RRDPUSH_COMPRESSION_SIGNATURE_SIZE sizeof(rrdpush_signature_t)
static inline rrdpush_signature_t rrdpush_compress_encode_signature(size_t compressed_data_size) {
rrdpush_signature_t len = ((compressed_data_size & 0x7f) | 0x80 | (((compressed_data_size & (0x7f << 7)) << 1) | 0x8000)) << 8;
return len | RRDPUSH_COMPRESSION_SIGNATURE;
}
typedef enum {
COMPRESSION_ALGORITHM_NONE = 0,
COMPRESSION_ALGORITHM_ZSTD,
COMPRESSION_ALGORITHM_LZ4,
COMPRESSION_ALGORITHM_GZIP,
// terminator
COMPRESSION_ALGORITHM_MAX,
} compression_algorithm_t;
extern int rrdpush_compression_levels[COMPRESSION_ALGORITHM_MAX];
// ----------------------------------------------------------------------------
typedef struct simple_ring_buffer {
const char *data;
size_t size;
size_t read_pos;
size_t write_pos;
} SIMPLE_RING_BUFFER;
static inline void simple_ring_buffer_reset(SIMPLE_RING_BUFFER *b) {
b->read_pos = b->write_pos = 0;
}
static inline void simple_ring_buffer_make_room(SIMPLE_RING_BUFFER *b, size_t size) {
if(b->write_pos + size > b->size) {
if(!b->size)
b->size = COMPRESSION_MAX_CHUNK;
else
b->size *= 2;
if(b->write_pos + size > b->size)
b->size += size;
b->data = (const char *)reallocz((void *)b->data, b->size);
}
}
static inline void simple_ring_buffer_append_data(SIMPLE_RING_BUFFER *b, const void *data, size_t size) {
simple_ring_buffer_make_room(b, size);
memcpy((void *)(b->data + b->write_pos), data, size);
b->write_pos += size;
}
static inline void simple_ring_buffer_destroy(SIMPLE_RING_BUFFER *b) {
freez((void *)b->data);
b->data = NULL;
b->read_pos = b->write_pos = b->size = 0;
}
// ----------------------------------------------------------------------------
struct compressor_state {
bool initialized;
compression_algorithm_t algorithm;
SIMPLE_RING_BUFFER input;
SIMPLE_RING_BUFFER output;
int level;
void *stream;
struct {
size_t total_compressed;
size_t total_uncompressed;
size_t total_compressions;
} sender_locked;
};
void rrdpush_compressor_init(struct compressor_state *state);
void rrdpush_compressor_destroy(struct compressor_state *state);
size_t rrdpush_compress(struct compressor_state *state, const char *data, size_t size, const char **out);
// ----------------------------------------------------------------------------
struct decompressor_state {
bool initialized;
compression_algorithm_t algorithm;
size_t signature_size;
size_t total_compressed;
size_t total_uncompressed;
size_t total_compressions;
SIMPLE_RING_BUFFER output;
void *stream;
};
void rrdpush_decompressor_destroy(struct decompressor_state *state);
void rrdpush_decompressor_init(struct decompressor_state *state);
size_t rrdpush_decompress(struct decompressor_state *state, const char *compressed_data, size_t compressed_size);
static inline size_t rrdpush_decompress_decode_signature(const char *data, size_t data_size) {
if (unlikely(!data || !data_size))
return 0;
if (unlikely(data_size != RRDPUSH_COMPRESSION_SIGNATURE_SIZE))
return 0;
rrdpush_signature_t sign = *(rrdpush_signature_t *)data;
if (unlikely((sign & RRDPUSH_COMPRESSION_SIGNATURE_MASK) != RRDPUSH_COMPRESSION_SIGNATURE))
return 0;
size_t length = ((sign >> 8) & 0x7f) | ((sign >> 9) & (0x7f << 7));
return length;
}
static inline size_t rrdpush_decompressor_start(struct decompressor_state *state, const char *header, size_t header_size) {
if(unlikely(state->output.read_pos != state->output.write_pos))
fatal("RRDPUSH DECOMPRESS: asked to decompress new data, while there are unread data in the decompression buffer!");
return rrdpush_decompress_decode_signature(header, header_size);
}
static inline size_t rrdpush_decompressed_bytes_in_buffer(struct decompressor_state *state) {
if(unlikely(state->output.read_pos > state->output.write_pos))
fatal("RRDPUSH DECOMPRESS: invalid read/write stream positions");
return state->output.write_pos - state->output.read_pos;
}
static inline size_t rrdpush_decompressor_get(struct decompressor_state *state, char *dst, size_t size) {
if (unlikely(!state || !size || !dst))
return 0;
size_t remaining = rrdpush_decompressed_bytes_in_buffer(state);
if(unlikely(!remaining))
return 0;
size_t bytes_to_return = size;
if(bytes_to_return > remaining)
bytes_to_return = remaining;
memcpy(dst, state->output.data + state->output.read_pos, bytes_to_return);
state->output.read_pos += bytes_to_return;
if(unlikely(state->output.read_pos > state->output.write_pos))
fatal("RRDPUSH DECOMPRESS: invalid read/write stream positions");
return bytes_to_return;
}
// ----------------------------------------------------------------------------
#endif // NETDATA_RRDPUSH_COMPRESSION_H 1