1062 lines
35 KiB
C
1062 lines
35 KiB
C
/* SPDX-License-Identifier: LGPL-2.1-or-later */
|
|
|
|
#include <inttypes.h>
|
|
#include <stdlib.h>
|
|
#include <sys/mman.h>
|
|
#include <sys/types.h>
|
|
#include <sys/stat.h>
|
|
#include <unistd.h>
|
|
|
|
#if HAVE_XZ
|
|
#include <lzma.h>
|
|
#endif
|
|
|
|
#if HAVE_LZ4
|
|
#include <lz4.h>
|
|
#include <lz4frame.h>
|
|
#endif
|
|
|
|
#if HAVE_ZSTD
|
|
#include <zstd.h>
|
|
#include <zstd_errors.h>
|
|
#endif
|
|
|
|
#include "alloc-util.h"
|
|
#include "compress.h"
|
|
#include "fd-util.h"
|
|
#include "io-util.h"
|
|
#include "journal-def.h"
|
|
#include "macro.h"
|
|
#include "sparse-endian.h"
|
|
#include "string-table.h"
|
|
#include "string-util.h"
|
|
#include "unaligned.h"
|
|
#include "util.h"
|
|
|
|
#if HAVE_LZ4
/* Generate LZ4F_freeCompressionContextp() and LZ4F_freeDecompressionContextp(), the helpers named by the
 * _cleanup_() attributes in the LZ4 stream functions of this file. */
DEFINE_TRIVIAL_CLEANUP_FUNC(LZ4F_compressionContext_t, LZ4F_freeCompressionContext);
DEFINE_TRIVIAL_CLEANUP_FUNC(LZ4F_decompressionContext_t, LZ4F_freeDecompressionContext);
#endif

#if HAVE_ZSTD
/* Same for the zstd contexts: ZSTD_freeCCtxp() and ZSTD_freeDCtxp(). */
DEFINE_TRIVIAL_CLEANUP_FUNC(ZSTD_CCtx *, ZSTD_freeCCtx);
DEFINE_TRIVIAL_CLEANUP_FUNC(ZSTD_DCtx *, ZSTD_freeDCtx);

/* Maps a zstd return value to a negative errno:
 *   destination buffer too small -> -ENOBUFS
 *   allocation failure           -> -ENOMEM
 *   anything else                -> -EBADMSG */
static int zstd_ret_to_errno(size_t ret) {
        const ZSTD_ErrorCode code = ZSTD_getErrorCode(ret);

        if (code == ZSTD_error_dstSize_tooSmall)
                return -ENOBUFS;

        if (code == ZSTD_error_memory_allocation)
                return -ENOMEM;

        return -EBADMSG;
}
#endif
|
|
|
|
#define ALIGN_8(l) ALIGN_TO(l, sizeof(size_t))
|
|
|
|
static const char* const object_compressed_table[_OBJECT_COMPRESSED_MAX] = {
|
|
[OBJECT_COMPRESSED_XZ] = "XZ",
|
|
[OBJECT_COMPRESSED_LZ4] = "LZ4",
|
|
[OBJECT_COMPRESSED_ZSTD] = "ZSTD",
|
|
/* If we add too many more entries here, it's going to grow quite large (and be mostly sparse), since
|
|
* the array key is actually a bitmask, not a plain enum */
|
|
};
|
|
|
|
DEFINE_STRING_TABLE_LOOKUP(object_compressed, int);
|
|
|
|
/* Compresses one blob into an XZ stream stored in a caller-provided buffer.
 *
 * src, src_size:        input bytes; must be non-NULL and non-empty.
 * dst, dst_alloc_size:  output buffer and its capacity; must be non-NULL and non-zero.
 * dst_size:             receives the number of bytes written on success.
 *
 * Returns 0 on success. Returns -ENOBUFS if the input is shorter than 80 bytes or if
 * lzma_stream_buffer_encode() reports anything but LZMA_OK (e.g. the result does not fit into dst).
 * Returns -EPROTONOSUPPORT when built without XZ support. */
int compress_blob_xz(const void *src, uint64_t src_size,
                     void *dst, size_t dst_alloc_size, size_t *dst_size) {
#if HAVE_XZ
        static const lzma_options_lzma lzma2_options = {
                .dict_size        = 1u << 20u,
                .preset_dict      = NULL,
                .preset_dict_size = 0,
                .lc               = LZMA_LC_DEFAULT,
                .lp               = LZMA_LP_DEFAULT,
                .pb               = LZMA_PB_DEFAULT,
                .mode             = LZMA_MODE_FAST,
                .nice_len         = 128,
                .mf               = LZMA_MF_HC3,
                .depth            = 4,
        };
        static const lzma_filter chain[] = {
                { .id = LZMA_FILTER_LZMA2, .options = (lzma_options_lzma*) &lzma2_options },
                { .id = LZMA_VLI_UNKNOWN,  .options = NULL },
        };
        size_t written = 0;
        lzma_ret rc;

        assert(src);
        assert(src_size > 0);
        assert(dst);
        assert(dst_alloc_size > 0);
        assert(dst_size);

        /* Inputs below 80 bytes are never compressed. */
        if (src_size < 80)
                return -ENOBUFS;

        rc = lzma_stream_buffer_encode((lzma_filter*) chain, LZMA_CHECK_NONE, NULL,
                                       src, src_size, dst, &written, dst_alloc_size);
        if (rc != LZMA_OK)
                return -ENOBUFS;

        *dst_size = written;
        return 0;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Compresses one blob with LZ4 into a caller-provided buffer.
 *
 * The output consists of the uncompressed length as a little-endian 64-bit integer, followed by the raw
 * LZ4 block.
 *
 * src, src_size:        input bytes; must be non-NULL and non-empty.
 * dst, dst_alloc_size:  output buffer and its capacity; must be non-NULL and non-zero.
 * dst_size:             receives the number of bytes written (header included) on success.
 *
 * Returns 0 on success. Returns -ENOBUFS if the input is shorter than 9 bytes, larger than what the LZ4
 * block API supports, or if the compressed result does not fit into dst. Returns -EPROTONOSUPPORT when
 * built without LZ4 support. */
int compress_blob_lz4(const void *src, uint64_t src_size,
                      void *dst, size_t dst_alloc_size, size_t *dst_size) {
#if HAVE_LZ4
        size_t room, bound;
        int r;

        assert(src);
        assert(src_size > 0);
        assert(dst);
        assert(dst_alloc_size > 0);
        assert(dst_size);

        /* Returns < 0 if we couldn't compress the data or the
         * compressed result is longer than the original */

        if (src_size < 9)
                return -ENOBUFS;

        /* LZ4 takes the input length as an int. Refuse anything it cannot represent instead of letting the
         * implicit conversion truncate the length (which would store a header that disagrees with the
         * payload). */
        if (src_size > LZ4_MAX_INPUT_SIZE)
                return -ENOBUFS;

        /* The first 8 bytes are reserved for the length header; there must be room for payload after it. */
        if (dst_alloc_size <= 8)
                return -ENOBUFS;

        /* Never pass more capacity than LZ4 can make use of. This keeps the value within int range without
         * changing the outcome: any capacity >= LZ4_compressBound() is already "always sufficient". */
        room = dst_alloc_size - 8;
        bound = (size_t) LZ4_compressBound((int) src_size);
        if (room > bound)
                room = bound;

        r = LZ4_compress_default(src, (char*) dst + 8, (int) src_size, (int) room);
        if (r <= 0)
                return -ENOBUFS;

        unaligned_write_le64(dst, src_size);
        *dst_size = r + 8;

        return 0;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Compresses one blob into a single zstd frame stored in a caller-provided buffer.
 *
 * src, src_size:        input bytes; must be non-NULL and non-empty.
 * dst, dst_alloc_size:  output buffer and its capacity; must be non-NULL and non-zero.
 * dst_size:             receives the number of bytes written on success.
 *
 * Returns 0 on success, the errno produced by zstd_ret_to_errno() if ZSTD_compress() fails, and
 * -EPROTONOSUPPORT when built without ZSTD support. */
int compress_blob_zstd(
                const void *src, uint64_t src_size,
                void *dst, size_t dst_alloc_size, size_t *dst_size) {
#if HAVE_ZSTD
        size_t compressed;

        assert(src);
        assert(src_size > 0);
        assert(dst);
        assert(dst_alloc_size > 0);
        assert(dst_size);

        /* Compression level 0 is passed through to zstd unchanged. */
        compressed = ZSTD_compress(dst, dst_alloc_size, src, src_size, 0);
        if (!ZSTD_isError(compressed)) {
                *dst_size = compressed;
                return 0;
        }

        return zstd_ret_to_errno(compressed);
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Decompresses an XZ blob into a heap buffer that is grown on demand.
 *
 * src, src_size:         compressed input; must be non-NULL and non-empty.
 * dst, dst_alloc_size:   in/out buffer and its allocated size, resized through greedy_realloc().
 * dst_size:              receives the number of decompressed bytes on success.
 * dst_max:               upper bound for the output; 0 means "no limit". Once that many bytes have been
 *                        produced decoding stops and success is returned.
 *
 * Returns 0 on success. Returns -ENOMEM if the decoder cannot be set up, if memory cannot be allocated,
 * or if lzma_code() reports anything other than LZMA_OK/LZMA_STREAM_END. Returns -ENOBUFS if the buffer
 * already has dst_max bytes of space and the decoder still needs another round. Returns
 * -EPROTONOSUPPORT when built without XZ support. */
int decompress_blob_xz(const void *src, uint64_t src_size,
                       void **dst, size_t *dst_alloc_size, size_t* dst_size, size_t dst_max) {

#if HAVE_XZ
        _cleanup_(lzma_end) lzma_stream strm = LZMA_STREAM_INIT;
        const size_t limit = dst_max != 0 ? dst_max : (size_t) -1;
        size_t space;
        lzma_ret rc;

        assert(src);
        assert(src_size > 0);
        assert(dst);
        assert(dst_alloc_size);
        assert(dst_size);
        assert(*dst_alloc_size == 0 || *dst);

        rc = lzma_stream_decoder(&strm, UINT64_MAX, 0);
        if (rc != LZMA_OK)
                return -ENOMEM;

        /* Start with twice the compressed size, capped by the limit. */
        space = MIN(src_size * 2, limit);
        if (!greedy_realloc(dst, dst_alloc_size, space, 1))
                return -ENOMEM;

        strm.next_in = src;
        strm.avail_in = src_size;

        strm.next_out = *dst;
        strm.avail_out = space;

        for (;;) {
                size_t filled;

                rc = lzma_code(&strm, LZMA_FINISH);
                if (rc == LZMA_STREAM_END)
                        break;
                if (rc != LZMA_OK)
                        return -ENOMEM;

                filled = space - strm.avail_out;

                if (dst_max > 0) {
                        /* Enough output for the caller: stop here. */
                        if (filled >= dst_max)
                                break;

                        /* Cannot grow any further. */
                        if (space == dst_max)
                                return -ENOBUFS;
                }

                /* Double the space (up to the limit) and continue right after the data decoded so far. */
                space = MIN(2 * space, limit);
                if (!greedy_realloc(dst, dst_alloc_size, space, 1))
                        return -ENOMEM;

                strm.avail_out = space - filled;
                strm.next_out = *(uint8_t**) dst + filled;
        }

        *dst_size = space - strm.avail_out;
        return 0;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Decompresses an LZ4 blob: a little-endian 64-bit uncompressed length followed by a raw LZ4 block.
 *
 * src, src_size:         compressed input; must be non-NULL and non-empty.
 * dst, dst_alloc_size:   in/out buffer and its allocated size; enlarged with realloc() when too small.
 * dst_size:              receives the number of decompressed bytes on success.
 * dst_max:               not consulted by this implementation.
 *
 * Returns 0 on success, -EBADMSG if the input is no longer than the 8-byte header or if the block does
 * not decode to exactly the recorded length, -EFBIG if the recorded length does not fit into an int,
 * -ENOMEM on allocation failure, and -EPROTONOSUPPORT when built without LZ4 support. */
int decompress_blob_lz4(const void *src, uint64_t src_size,
                        void **dst, size_t *dst_alloc_size, size_t* dst_size, size_t dst_max) {

#if HAVE_LZ4
        uint64_t recorded;
        char *target;
        int size, n; /* LZ4 uses int for size */

        assert(src);
        assert(src_size > 0);
        assert(dst);
        assert(dst_alloc_size);
        assert(dst_size);
        assert(*dst_alloc_size == 0 || *dst);

        if (src_size <= 8)
                return -EBADMSG;

        /* The length must survive the round trip through int unchanged. */
        recorded = unaligned_read_le64(src);
        size = recorded;
        if (size < 0 || (unsigned) size != recorded)
                return -EFBIG;

        target = *dst;
        if ((size_t) size > *dst_alloc_size) {
                target = realloc(*dst, size);
                if (!target)
                        return -ENOMEM;

                *dst = target;
                *dst_alloc_size = size;
        }

        /* size is known to be non-negative here, so a negative (error) result never equals it. */
        n = LZ4_decompress_safe((char*) src + 8, target, src_size - 8, size);
        if (n != size)
                return -EBADMSG;

        *dst_size = size;
        return 0;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Decompresses a zstd frame into a heap buffer.
 *
 * src, src_size:         compressed input; must be non-NULL and non-empty.
 * dst, dst_alloc_size:   in/out buffer and its allocated size, resized through greedy_realloc().
 * dst_size:              receives the number of decompressed bytes on success.
 * dst_max:               upper bound for the output; 0 means "no limit". If the frame is larger, only
 *                        the first dst_max bytes are reported.
 *
 * Returns 0 on success. Returns -EBADMSG if the frame does not declare a content size, or if the
 * decoder yields fewer bytes than the frame header announced (truncated/corrupted input). Returns
 * -E2BIG if the size does not fit into size_t, -ENOMEM on allocation failure, the errno from
 * zstd_ret_to_errno() on decoder errors, and -EPROTONOSUPPORT when built without ZSTD support. */
int decompress_blob_zstd(
                const void *src, uint64_t src_size,
                void **dst, size_t *dst_alloc_size, size_t *dst_size, size_t dst_max) {

#if HAVE_ZSTD
        uint64_t size;

        assert(src);
        assert(src_size > 0);
        assert(dst);
        assert(dst_alloc_size);
        assert(dst_size);
        assert(*dst_alloc_size == 0 || *dst);

        size = ZSTD_getFrameContentSize(src, src_size);
        if (IN_SET(size, ZSTD_CONTENTSIZE_ERROR, ZSTD_CONTENTSIZE_UNKNOWN))
                return -EBADMSG;

        if (dst_max > 0 && size > dst_max)
                size = dst_max;
        if (size > SIZE_MAX)
                return -E2BIG;

        if (!(greedy_realloc(dst, dst_alloc_size, MAX(ZSTD_DStreamOutSize(), size), 1)))
                return -ENOMEM;

        _cleanup_(ZSTD_freeDCtxp) ZSTD_DCtx *dctx = ZSTD_createDCtx();
        if (!dctx)
                return -ENOMEM;

        ZSTD_inBuffer input = {
                .src = src,
                .size = src_size,
        };
        ZSTD_outBuffer output = {
                .dst = *dst,
                .size = *dst_alloc_size,
        };

        size_t k = ZSTD_decompressStream(dctx, &output, &input);
        if (ZSTD_isError(k)) {
                log_debug("ZSTD decoder failed: %s", ZSTD_getErrorName(k));
                return zstd_ret_to_errno(k);
        }

        /* The announced size comes from the (untrusted) frame header. A truncated stream makes the decoder
         * return without error but with less output, which must be reported to the caller rather than
         * tripping an assertion. */
        if (output.pos < size)
                return log_debug_errno(SYNTHETIC_ERRNO(EBADMSG),
                                       "ZSTD decoded less data than indicated, probably corrupted stream.");

        *dst_size = size;
        return 0;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
int decompress_blob(
|
|
int compression,
|
|
const void *src, uint64_t src_size,
|
|
void **dst, size_t *dst_alloc_size, size_t* dst_size, size_t dst_max) {
|
|
|
|
if (compression == OBJECT_COMPRESSED_XZ)
|
|
return decompress_blob_xz(
|
|
src, src_size,
|
|
dst, dst_alloc_size, dst_size, dst_max);
|
|
else if (compression == OBJECT_COMPRESSED_LZ4)
|
|
return decompress_blob_lz4(
|
|
src, src_size,
|
|
dst, dst_alloc_size, dst_size, dst_max);
|
|
else if (compression == OBJECT_COMPRESSED_ZSTD)
|
|
return decompress_blob_zstd(
|
|
src, src_size,
|
|
dst, dst_alloc_size, dst_size, dst_max);
|
|
else
|
|
return -EPROTONOSUPPORT;
|
|
}
|
|
|
|
/* Tests whether the decompressed form of an XZ blob begins with prefix immediately followed by the
 * byte extra, decoding only as much as is needed.
 *
 * src, src_size:          compressed input; must be non-NULL and non-empty.
 * buffer, buffer_size:    in/out scratch buffer and its allocated size, grown through greedy_realloc().
 * prefix, prefix_len:     bytes the decompressed data has to start with.
 * extra:                  byte that has to follow the prefix.
 *
 * Returns 1 on a match, 0 on a mismatch or if the stream ends before prefix_len + 1 bytes were produced,
 * -EBADMSG if the decoder cannot be set up or fails, -ENOMEM on allocation failure, and
 * -EPROTONOSUPPORT when built without XZ support. */
int decompress_startswith_xz(const void *src, uint64_t src_size,
                             void **buffer, size_t *buffer_size,
                             const void *prefix, size_t prefix_len,
                             uint8_t extra) {

#if HAVE_XZ
        _cleanup_(lzma_end) lzma_stream strm = LZMA_STREAM_INIT;
        const size_t needed = prefix_len + 1;

        assert(src);
        assert(src_size > 0);
        assert(buffer);
        assert(buffer_size);
        assert(prefix);
        assert(*buffer_size == 0 || *buffer);

        if (lzma_stream_decoder(&strm, UINT64_MAX, 0) != LZMA_OK)
                return -EBADMSG;

        if (!greedy_realloc(buffer, buffer_size, ALIGN_8(needed), 1))
                return -ENOMEM;

        strm.next_in = src;
        strm.avail_in = src_size;

        strm.next_out = *buffer;
        strm.avail_out = *buffer_size;

        for (;;) {
                lzma_ret rc = lzma_code(&strm, LZMA_FINISH);

                if (rc != LZMA_OK && rc != LZMA_STREAM_END)
                        return -EBADMSG;

                /* Enough bytes decoded to decide? */
                if (*buffer_size - strm.avail_out >= needed) {
                        const uint8_t *decoded = *buffer;

                        return memcmp(decoded, prefix, prefix_len) == 0 &&
                                decoded[prefix_len] == extra;
                }

                /* The stream is over, but it was too short to contain prefix + extra. */
                if (rc == LZMA_STREAM_END)
                        return 0;

                /* Enlarge the buffer and re-point the decoder's output into the new allocation. */
                strm.avail_out += *buffer_size;

                if (!greedy_realloc(buffer, buffer_size, *buffer_size * 2, 1))
                        return -ENOMEM;

                strm.next_out = *(uint8_t**) buffer + *buffer_size - strm.avail_out;
        }

#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Tests whether the decompressed form of an LZ4 blob begins with prefix immediately followed by the
 * byte extra.
 *
 * src, src_size:          compressed input (8-byte length header + LZ4 block); non-NULL and non-empty.
 * buffer, buffer_size:    in/out scratch buffer and its allocated size.
 * prefix, prefix_len:     bytes the decompressed data has to start with.
 * extra:                  byte that has to follow the prefix.
 *
 * Returns 1 on a match, 0 on a mismatch or if fewer than prefix_len + 1 bytes are available,
 * -EBADMSG if the input is no longer than the header, -ENOMEM on allocation failure, any error of
 * decompress_blob_lz4() on the fallback path, and -EPROTONOSUPPORT when built without LZ4 support. */
int decompress_startswith_lz4(const void *src, uint64_t src_size,
                              void **buffer, size_t *buffer_size,
                              const void *prefix, size_t prefix_len,
                              uint8_t extra) {
#if HAVE_LZ4
        const size_t needed = prefix_len + 1;
        const uint8_t *decoded;
        int r;

        assert(src);
        assert(src_size > 0);
        assert(buffer);
        assert(buffer_size);
        assert(prefix);
        assert(*buffer_size == 0 || *buffer);

        if (src_size <= 8)
                return -EBADMSG;

        if (!greedy_realloc(buffer, buffer_size, ALIGN_8(needed), 1))
                return -ENOMEM;

        r = LZ4_decompress_safe_partial((char*) src + 8, *buffer, src_size - 8,
                                        needed, *buffer_size);

        /* On lz4 < 1.8.3, we might get "failure" (r < 0), or "success" where just a part of the buffer is
         * decompressed. But if we get a smaller amount of bytes than requested, we don't know whether
         * there isn't enough data to fill the requested size or whether we just got a partial answer. */
        if (!(r >= 0 && (size_t) r >= needed)) {
                size_t full_size;

                /* We trust that the newer lz4 decompresses the number of bytes we requested if available
                 * in the compressed string. */
                if (LZ4_versionNumber() >= 10803)
                        return 0;

                /* Compare what we have first, in case of mismatch we can shortcut the full
                 * decompression. */
                if (r > 0 && memcmp(*buffer, prefix, r) != 0)
                        return 0;

                /* Before version 1.8.3, lz4 always tries to decode a full "sequence", so in pathological
                 * cases we might need to decompress the full field. */
                r = decompress_blob_lz4(src, src_size, buffer, buffer_size, &full_size, 0);
                if (r < 0)
                        return r;

                if (full_size < needed)
                        return 0;
        }

        decoded = *buffer;
        return memcmp(decoded, prefix, prefix_len) == 0 &&
                decoded[prefix_len] == extra;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Tests whether the decompressed form of a zstd frame begins with prefix immediately followed by the
 * byte extra.
 *
 * src, src_size:          compressed input; must be non-NULL and non-empty.
 * buffer, buffer_size:    in/out scratch buffer and its allocated size, grown through greedy_realloc().
 * prefix, prefix_len:     bytes the decompressed data has to start with.
 * extra:                  byte that has to follow the prefix.
 *
 * Returns 1 on a match and 0 on a mismatch or if the frame declares fewer than prefix_len + 1 bytes.
 * Returns -EBADMSG if the frame does not declare a content size, or if the decoder yields fewer bytes
 * than needed although the header promised them (truncated/corrupted input). Returns -ENOMEM on
 * allocation failure, the errno from zstd_ret_to_errno() on decoder errors, and -EPROTONOSUPPORT when
 * built without ZSTD support. */
int decompress_startswith_zstd(
                const void *src, uint64_t src_size,
                void **buffer, size_t *buffer_size,
                const void *prefix, size_t prefix_len,
                uint8_t extra) {
#if HAVE_ZSTD
        assert(src);
        assert(src_size > 0);
        assert(buffer);
        assert(buffer_size);
        assert(prefix);
        assert(*buffer_size == 0 || *buffer);

        uint64_t size = ZSTD_getFrameContentSize(src, src_size);
        if (IN_SET(size, ZSTD_CONTENTSIZE_ERROR, ZSTD_CONTENTSIZE_UNKNOWN))
                return -EBADMSG;

        if (size < prefix_len + 1)
                return 0; /* Decompressed text too short to match the prefix and extra */

        _cleanup_(ZSTD_freeDCtxp) ZSTD_DCtx *dctx = ZSTD_createDCtx();
        if (!dctx)
                return -ENOMEM;

        if (!(greedy_realloc(buffer, buffer_size, MAX(ZSTD_DStreamOutSize(), prefix_len + 1), 1)))
                return -ENOMEM;

        ZSTD_inBuffer input = {
                .src = src,
                .size = src_size,
        };
        ZSTD_outBuffer output = {
                .dst = *buffer,
                .size = *buffer_size,
        };
        size_t k;

        k = ZSTD_decompressStream(dctx, &output, &input);
        if (ZSTD_isError(k)) {
                log_debug("ZSTD decoder failed: %s", ZSTD_getErrorName(k));
                return zstd_ret_to_errno(k);
        }

        /* The frame header is untrusted input: a truncated stream can announce enough data and still
         * deliver less without the decoder flagging an error. Report that instead of asserting, so that
         * the comparison below never reads bytes that were not decoded. */
        if (output.pos < prefix_len + 1)
                return log_debug_errno(SYNTHETIC_ERRNO(EBADMSG),
                                       "ZSTD decoded less data than indicated, probably corrupted stream.");

        return memcmp(*buffer, prefix, prefix_len) == 0 &&
                ((const uint8_t*) *buffer)[prefix_len] == extra;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
int decompress_startswith(
|
|
int compression,
|
|
const void *src, uint64_t src_size,
|
|
void **buffer, size_t *buffer_size,
|
|
const void *prefix, size_t prefix_len,
|
|
uint8_t extra) {
|
|
|
|
if (compression == OBJECT_COMPRESSED_XZ)
|
|
return decompress_startswith_xz(
|
|
src, src_size,
|
|
buffer, buffer_size,
|
|
prefix, prefix_len,
|
|
extra);
|
|
|
|
else if (compression == OBJECT_COMPRESSED_LZ4)
|
|
return decompress_startswith_lz4(
|
|
src, src_size,
|
|
buffer, buffer_size,
|
|
prefix, prefix_len,
|
|
extra);
|
|
else if (compression == OBJECT_COMPRESSED_ZSTD)
|
|
return decompress_startswith_zstd(
|
|
src, src_size,
|
|
buffer, buffer_size,
|
|
prefix, prefix_len,
|
|
extra);
|
|
else
|
|
return -EBADMSG;
|
|
}
|
|
|
|
/* Reads from fdf, compresses the data as an XZ stream and writes the result to fdt.
 *
 * max_bytes limits how many input bytes are read; (uint64_t) -1 means "no limit". When the limit is
 * used up the next read() is issued with a length of zero and the stream is finished.
 *
 * Returns 0 on success, -EINVAL if the encoder cannot be set up, -errno if read() fails, -EBADMSG if
 * lzma_code() fails, the error returned by loop_write() if writing fails, and -EPROTONOSUPPORT when
 * built without XZ support. */
int compress_stream_xz(int fdf, int fdt, uint64_t max_bytes) {
#if HAVE_XZ
        _cleanup_(lzma_end) lzma_stream strm = LZMA_STREAM_INIT;
        uint8_t inbuf[BUFSIZ], outbuf[BUFSIZ];
        lzma_action action = LZMA_RUN;
        lzma_ret rc;

        assert(fdf >= 0);
        assert(fdt >= 0);

        rc = lzma_easy_encoder(&strm, LZMA_PRESET_DEFAULT, LZMA_CHECK_CRC64);
        if (rc != LZMA_OK)
                return log_error_errno(SYNTHETIC_ERRNO(EINVAL),
                                       "Failed to initialize XZ encoder: code %u",
                                       rc);

        for (;;) {
                ssize_t pending, w;

                /* Refill the input buffer once the encoder has consumed everything, unless EOF was
                 * already seen. */
                if (strm.avail_in == 0 && action == LZMA_RUN) {
                        size_t want = sizeof(inbuf);
                        ssize_t got;

                        if (max_bytes != UINT64_MAX && max_bytes < (uint64_t) want)
                                want = (size_t) max_bytes;

                        got = read(fdf, inbuf, want);
                        if (got < 0)
                                return -errno;

                        if (got > 0) {
                                strm.next_in = inbuf;
                                strm.avail_in = got;

                                if (max_bytes != UINT64_MAX) {
                                        assert(max_bytes >= (uint64_t) got);
                                        max_bytes -= got;
                                }
                        } else
                                action = LZMA_FINISH;
                }

                /* Hand the (flushed) output buffer back to the encoder. */
                if (strm.avail_out == 0) {
                        strm.next_out = outbuf;
                        strm.avail_out = sizeof(outbuf);
                }

                rc = lzma_code(&strm, action);
                if (rc != LZMA_OK && rc != LZMA_STREAM_END)
                        return log_error_errno(SYNTHETIC_ERRNO(EBADMSG),
                                               "Compression failed: code %u",
                                               rc);

                /* Only flush when the output buffer is full or the stream is complete. */
                if (strm.avail_out != 0 && rc != LZMA_STREAM_END)
                        continue;

                pending = sizeof(outbuf) - strm.avail_out;

                w = loop_write(fdt, outbuf, pending, false);
                if (w < 0)
                        return w;

                if (rc == LZMA_STREAM_END) {
                        log_debug("XZ compression finished (%"PRIu64" -> %"PRIu64" bytes, %.1f%%)",
                                  strm.total_in, strm.total_out,
                                  (double) strm.total_out / strm.total_in * 100);

                        return 0;
                }
        }
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Amount of data handed to the LZ4 frame API per call: the size of each input slice when compressing
 * and of the output buffer when decompressing. */
#define LZ4_BUFSIZE (512*1024u)

/* Compresses the file behind fdf as an LZ4 frame and writes the result to fdt.
 *
 * The input is mapped into memory as a whole (its size is taken from fstat()) and fed to the encoder
 * in slices of at most LZ4_BUFSIZE bytes. max_bytes limits the size of the *compressed* output;
 * (uint64_t) -1 means "no limit".
 *
 * Returns 0 on success, -ENOMEM if the context or the output buffer cannot be allocated, -errno if
 * fstat() or mmap() fail, -EINVAL if the frame header cannot be produced, -ENOTRECOVERABLE if the
 * encoder fails, -EFBIG if the output would exceed max_bytes, the error of loop_write() if writing
 * fails, and -EPROTONOSUPPORT when built without LZ4 support. */
int compress_stream_lz4(int fdf, int fdt, uint64_t max_bytes) {

#if HAVE_LZ4
        LZ4F_errorCode_t c;
        _cleanup_(LZ4F_freeCompressionContextp) LZ4F_compressionContext_t ctx = NULL;
        _cleanup_free_ char *buf = NULL;
        char *src = NULL;
        size_t size, n, total_in = 0, total_out, offset = 0, frame_size;
        struct stat st;
        int r;
        static const LZ4F_compressOptions_t options = {
                .stableSrc = 1,
        };
        static const LZ4F_preferences_t preferences = {
                .frameInfo.blockSizeID = 5,
        };

        c = LZ4F_createCompressionContext(&ctx, LZ4F_VERSION);
        if (LZ4F_isError(c))
                return -ENOMEM;

        if (fstat(fdf, &st) < 0)
                return log_debug_errno(errno, "fstat() failed: %m");

        frame_size = LZ4F_compressBound(LZ4_BUFSIZE, &preferences);
        size = frame_size + 64*1024; /* add some space for header and trailer */
        buf = malloc(size);
        if (!buf)
                return -ENOMEM;

        n = offset = total_out = LZ4F_compressBegin(ctx, buf, size, &preferences);
        if (LZ4F_isError(n))
                return -EINVAL;

        /* From here on every exit has to go through the cleanup label so the mapping is released. */
        src = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fdf, 0);
        if (src == MAP_FAILED)
                return -errno;

        log_debug("Buffer size is %zu bytes, header size %zu bytes.", size, n);

        while (total_in < (size_t) st.st_size) {
                ssize_t k;

                k = MIN(LZ4_BUFSIZE, st.st_size - total_in);
                n = LZ4F_compressUpdate(ctx, buf + offset, size - offset,
                                        src + total_in, k, &options);
                if (LZ4F_isError(n)) {
                        r = -ENOTRECOVERABLE;
                        goto cleanup;
                }

                total_in += k;
                offset += n;
                total_out += n;

                /* Compare in 64 bit so that the limit is not truncated where size_t is narrower, and
                 * leave through the cleanup label: returning directly would leak the mapping. */
                if (max_bytes != UINT64_MAX && (uint64_t) total_out > max_bytes) {
                        r = log_debug_errno(SYNTHETIC_ERRNO(EFBIG),
                                            "Compressed stream longer than %" PRIu64 " bytes",
                                            max_bytes);
                        goto cleanup;
                }

                /* Flush the buffer once there might not be room for another full slice. */
                if (size - offset < frame_size + 4) {
                        k = loop_write(fdt, buf, offset, false);
                        if (k < 0) {
                                r = k;
                                goto cleanup;
                        }
                        offset = 0;
                }
        }

        n = LZ4F_compressEnd(ctx, buf + offset, size - offset, &options);
        if (LZ4F_isError(n)) {
                r = -ENOTRECOVERABLE;
                goto cleanup;
        }

        offset += n;
        total_out += n;
        r = loop_write(fdt, buf, offset, false);
        if (r < 0)
                goto cleanup;

        log_debug("LZ4 compression finished (%zu -> %zu bytes, %.1f%%)",
                  total_in, total_out,
                  (double) total_out / total_in * 100);
cleanup:
        munmap(src, st.st_size);
        return r;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Reads an XZ stream from fdf, decompresses it and writes the result to fdt.
 *
 * max_bytes limits the number of decompressed bytes written; (uint64_t) -1 means "no limit".
 *
 * Returns 0 on success, -ENOMEM if the decoder cannot be set up, -errno if read() fails, -EBADMSG if
 * lzma_code() fails, -EFBIG if the output would exceed max_bytes, the error of loop_write() if
 * writing fails, and -EPROTONOSUPPORT when built without XZ support. */
int decompress_stream_xz(int fdf, int fdt, uint64_t max_bytes) {

#if HAVE_XZ
        _cleanup_(lzma_end) lzma_stream strm = LZMA_STREAM_INIT;
        uint8_t inbuf[BUFSIZ], outbuf[BUFSIZ];
        lzma_action action = LZMA_RUN;
        lzma_ret rc;

        assert(fdf >= 0);
        assert(fdt >= 0);

        rc = lzma_stream_decoder(&strm, UINT64_MAX, 0);
        if (rc != LZMA_OK)
                return log_debug_errno(SYNTHETIC_ERRNO(ENOMEM),
                                       "Failed to initialize XZ decoder: code %u",
                                       rc);

        for (;;) {
                ssize_t pending, w;

                /* Refill the input buffer once the decoder has consumed everything, unless EOF was
                 * already seen. */
                if (strm.avail_in == 0 && action == LZMA_RUN) {
                        ssize_t got = read(fdf, inbuf, sizeof(inbuf));

                        if (got < 0)
                                return -errno;

                        if (got > 0) {
                                strm.next_in = inbuf;
                                strm.avail_in = got;
                        } else
                                action = LZMA_FINISH;
                }

                /* Hand the (flushed) output buffer back to the decoder. */
                if (strm.avail_out == 0) {
                        strm.next_out = outbuf;
                        strm.avail_out = sizeof(outbuf);
                }

                rc = lzma_code(&strm, action);
                if (rc != LZMA_OK && rc != LZMA_STREAM_END)
                        return log_debug_errno(SYNTHETIC_ERRNO(EBADMSG),
                                               "Decompression failed: code %u",
                                               rc);

                /* Only flush when the output buffer is full or the stream is complete. */
                if (strm.avail_out != 0 && rc != LZMA_STREAM_END)
                        continue;

                pending = sizeof(outbuf) - strm.avail_out;

                /* Account for the output before writing it, so that the limit is never exceeded. */
                if (max_bytes != UINT64_MAX) {
                        if (max_bytes < (uint64_t) pending)
                                return -EFBIG;

                        max_bytes -= pending;
                }

                w = loop_write(fdt, outbuf, pending, false);
                if (w < 0)
                        return w;

                if (rc == LZMA_STREAM_END) {
                        log_debug("XZ decompression finished (%"PRIu64" -> %"PRIu64" bytes, %.1f%%)",
                                  strm.total_in, strm.total_out,
                                  (double) strm.total_out / strm.total_in * 100);

                        return 0;
                }
        }
#else
        return log_debug_errno(SYNTHETIC_ERRNO(EPROTONOSUPPORT),
                               "Cannot decompress file. Compiled without XZ support.");
#endif
}
|
|
|
|
/* Decompresses the LZ4 frame stored in the file behind in and writes the result to out.
 *
 * The input is mapped into memory as a whole (its size is taken from fstat()) and decoded into a
 * buffer of LZ4_BUFSIZE bytes at a time. max_bytes limits the number of decompressed bytes;
 * (uint64_t) -1 means "no limit".
 *
 * Returns the result of the last loop_write() (or 0 if nothing was written) on success, -ENOMEM if
 * the context or buffer cannot be allocated, -errno if fstat() or mmap() fail, -EBADMSG if the
 * decoder fails, -EFBIG if the output would exceed max_bytes, the error of loop_write() if writing
 * fails, and -EPROTONOSUPPORT when built without LZ4 support. */
int decompress_stream_lz4(int in, int out, uint64_t max_bytes) {
#if HAVE_LZ4
        _cleanup_(LZ4F_freeDecompressionContextp) LZ4F_decompressionContext_t ctx = NULL;
        _cleanup_free_ char *buf = NULL;
        size_t consumed_total = 0, produced_total = 0;
        struct stat st;
        char *map;
        int r = 0;

        if (LZ4F_isError(LZ4F_createDecompressionContext(&ctx, LZ4F_VERSION)))
                return -ENOMEM;

        if (fstat(in, &st) < 0)
                return log_debug_errno(errno, "fstat() failed: %m");

        buf = malloc(LZ4_BUFSIZE);
        if (!buf)
                return -ENOMEM;

        map = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, in, 0);
        if (map == MAP_FAILED)
                return -errno;

        /* Every exit below leaves the loop with break, so that the mapping is always released. */
        while (consumed_total < (size_t) st.st_size) {
                size_t produced = LZ4_BUFSIZE;                     /* in: capacity, out: bytes decoded */
                size_t used = st.st_size - consumed_total;         /* in: available, out: bytes consumed */
                size_t hint;

                hint = LZ4F_decompress(ctx, buf, &produced, map + consumed_total, &used, NULL);
                if (LZ4F_isError(hint)) {
                        r = -EBADMSG;
                        break;
                }

                consumed_total += used;
                produced_total += produced;

                if (max_bytes != (uint64_t) -1 && produced_total > (size_t) max_bytes) {
                        log_debug("Decompressed stream longer than %"PRIu64" bytes", max_bytes);
                        r = -EFBIG;
                        break;
                }

                r = loop_write(out, buf, produced, false);
                if (r < 0)
                        break;
        }

        /* r is negative exactly when one of the error paths above was taken. */
        if (r >= 0)
                log_debug("LZ4 decompression finished (%zu -> %zu bytes, %.1f%%)",
                          consumed_total, produced_total,
                          consumed_total > 0 ? (double) produced_total / consumed_total * 100 : 0.0);

        munmap(map, st.st_size);
        return r;
#else
        return log_debug_errno(SYNTHETIC_ERRNO(EPROTONOSUPPORT),
                               "Cannot decompress file. Compiled without LZ4 support.");
#endif
}
|
|
|
|
/* Reads from fdf, compresses the data as one zstd frame and writes the result to fdt.
 *
 * max_bytes limits the size of the compressed output.
 *
 * Returns 0 on success, -ENOMEM if the context or the buffers cannot be allocated, the error of
 * loop_read()/loop_write() if I/O fails, the errno from zstd_ret_to_errno() if the encoder fails,
 * -EFBIG if the output would exceed max_bytes, and -EPROTONOSUPPORT when built without ZSTD
 * support. */
int compress_stream_zstd(int fdf, int fdt, uint64_t max_bytes) {
#if HAVE_ZSTD
        _cleanup_(ZSTD_freeCCtxp) ZSTD_CCtx *cctx = NULL;
        _cleanup_free_ void *in_buff = NULL, *out_buff = NULL;
        const size_t in_allocsize = ZSTD_CStreamInSize();
        const size_t out_allocsize = ZSTD_CStreamOutSize();
        uint64_t budget = max_bytes, in_bytes = 0;
        bool last_chunk;
        size_t z;

        assert(fdf >= 0);
        assert(fdt >= 0);

        /* Create the context and buffers */
        in_buff = malloc(in_allocsize);
        out_buff = malloc(out_allocsize);
        cctx = ZSTD_createCCtx();
        if (!cctx || !out_buff || !in_buff)
                return -ENOMEM;

        z = ZSTD_CCtx_setParameter(cctx, ZSTD_c_checksumFlag, 1);
        if (ZSTD_isError(z))
                log_debug("Failed to enable ZSTD checksum, ignoring: %s", ZSTD_getErrorName(z));

        /* Each round reads one chunk of input, compresses all of it, and writes out everything the
         * encoder produced. A read of zero bytes marks the last chunk and finishes the frame. */
        do {
                ZSTD_EndDirective directive;
                ssize_t nread;
                bool done;

                nread = loop_read(fdf, in_buff, in_allocsize, true);
                if (nread < 0)
                        return nread;

                last_chunk = nread == 0;
                directive = last_chunk ? ZSTD_e_end : ZSTD_e_continue;
                in_bytes += (size_t) nread;

                ZSTD_inBuffer input = {
                        .src = in_buff,
                        .size = (size_t) nread,
                        .pos = 0
                };

                do {
                        ZSTD_outBuffer output = {
                                .dst = out_buff,
                                .size = out_allocsize,
                                .pos = 0
                        };
                        size_t pending;
                        ssize_t wrote;

                        /* Compress into the output buffer and write all of it to the file, so the
                         * buffer can be reused in the next round. */
                        pending = ZSTD_compressStream2(cctx, &output, &input, directive);
                        if (ZSTD_isError(pending)) {
                                log_debug("ZSTD encoder failed: %s", ZSTD_getErrorName(pending));
                                return zstd_ret_to_errno(pending);
                        }

                        if (output.pos > budget)
                                return -EFBIG;

                        wrote = loop_write(fdt, output.dst, output.pos, 1);
                        if (wrote < 0)
                                return wrote;

                        budget -= output.pos;

                        /* On the last chunk we are done when zstd returns 0, i.e. it has consumed all
                         * input AND finished the frame. Otherwise we are done as soon as all input was
                         * consumed. */
                        if (last_chunk)
                                done = pending == 0;
                        else
                                done = input.pos == input.size;
                } while (!done);

                /* zstd only returns 0 when the input is completely consumed */
                assert(input.pos == input.size);
        } while (!last_chunk);

        if (in_bytes > 0)
                log_debug("ZSTD compression finished (%" PRIu64 " -> %" PRIu64 " bytes, %.1f%%)",
                          in_bytes, max_bytes - budget, (double) (max_bytes - budget) / in_bytes * 100);
        else
                log_debug("ZSTD compression finished (%" PRIu64 " -> %" PRIu64 " bytes)",
                          in_bytes, max_bytes - budget);

        return 0;
#else
        return -EPROTONOSUPPORT;
#endif
}
|
|
|
|
/* Reads zstd data from fdf, decompresses it and writes the result to fdt.
 *
 * max_bytes limits the number of decompressed bytes written.
 *
 * Returns 0 on success, -ENOMEM if the context or the buffers cannot be allocated, the error of
 * loop_read()/loop_write() if I/O fails, -EFBIG if the output would exceed max_bytes, -EBADMSG if no
 * input was read at all, the errno from zstd_ret_to_errno() if the decoder fails or the input ends in
 * the middle of a frame, and -EPROTONOSUPPORT when built without ZSTD support. */
int decompress_stream_zstd(int fdf, int fdt, uint64_t max_bytes) {
#if HAVE_ZSTD
        _cleanup_(ZSTD_freeDCtxp) ZSTD_DCtx *dctx = NULL;
        _cleanup_free_ void *in_buff = NULL, *out_buff = NULL;
        const size_t in_allocsize = ZSTD_DStreamInSize();
        const size_t out_allocsize = ZSTD_DStreamOutSize();
        uint64_t budget = max_bytes, in_bytes = 0;
        size_t last_result = 0;

        assert(fdf >= 0);
        assert(fdt >= 0);

        /* Create the context and buffers */
        in_buff = malloc(in_allocsize);
        out_buff = malloc(out_allocsize);
        dctx = ZSTD_createDCtx();
        if (!dctx || !out_buff || !in_buff)
                return -ENOMEM;

        /* This loop assumes that the input file is one or more concatenated zstd streams. It won't work
         * if there is trailing non-zstd data at the end. ZSTD_decompressStream() returns 0 exactly when
         * a frame is completed, and doesn't consume input after the frame.
         *
         * A decoder error ends the loop; it is turned into a return value further down. */
        while (!ZSTD_isError(last_result)) {
                ssize_t nread;

                nread = loop_read(fdf, in_buff, in_allocsize, true);
                if (nread < 0)
                        return nread;
                if (nread == 0)
                        break;

                in_bytes += (size_t) nread;

                ZSTD_inBuffer input = {
                        .src = in_buff,
                        .size = (size_t) nread,
                        .pos = 0
                };

                /* Given a valid frame, zstd won't consume the last byte of the frame until it has
                 * flushed all of the decompressed data of the frame. So input.pos < input.size means
                 * the frame is not done or there is still output available. */
                while (input.pos < input.size) {
                        ZSTD_outBuffer output = {
                                .dst = out_buff,
                                .size = out_allocsize,
                                .pos = 0
                        };
                        ssize_t wrote;

                        /* The return code is zero if the frame is complete, but there may be multiple
                         * frames concatenated together. Zstd will automatically reset the context when
                         * a frame is complete. */
                        last_result = ZSTD_decompressStream(dctx, &output, &input);
                        if (ZSTD_isError(last_result))
                                break;

                        if (output.pos > budget)
                                return -EFBIG;

                        wrote = loop_write(fdt, output.dst, output.pos, 1);
                        if (wrote < 0)
                                return wrote;

                        budget -= output.pos;
                }
        }

        if (in_bytes == 0)
                return log_debug_errno(SYNTHETIC_ERRNO(EBADMSG), "ZSTD decoder failed: no data read");

        if (last_result != 0) {
                /* Either the decoder reported an error, or the last call did not end on a frame
                 * boundary although we reached the end of the file. The latter is treated as an error
                 * too: the input was truncated. */
                log_debug("ZSTD decoder failed: %s", ZSTD_getErrorName(last_result));
                return zstd_ret_to_errno(last_result);
        }

        log_debug(
                "ZSTD decompression finished (%" PRIu64 " -> %" PRIu64 " bytes, %.1f%%)",
                in_bytes,
                max_bytes - budget,
                (double) (max_bytes - budget) / in_bytes * 100);
        return 0;
#else
        return log_debug_errno(SYNTHETIC_ERRNO(EPROTONOSUPPORT),
                               "Cannot decompress file. Compiled without ZSTD support.");
#endif
}
|
|
|
|
int decompress_stream(const char *filename, int fdf, int fdt, uint64_t max_bytes) {
|
|
|
|
if (endswith(filename, ".lz4"))
|
|
return decompress_stream_lz4(fdf, fdt, max_bytes);
|
|
else if (endswith(filename, ".xz"))
|
|
return decompress_stream_xz(fdf, fdt, max_bytes);
|
|
else if (endswith(filename, ".zst"))
|
|
return decompress_stream_zstd(fdf, fdt, max_bytes);
|
|
else
|
|
return -EPROTONOSUPPORT;
|
|
}
|