1
0
mirror of https://github.com/samba-team/samba.git synced 2025-01-10 01:18:15 +03:00
samba-mirror/lib/compression/lzxpress_huffman.h
Douglas Bagnall d4e3f0c88e lib/compression: LZ77 + Huffman compression
This compresses files as described in MS-XCA 2.2, and as decompressed
by the decompressor in the previous commit.

As with the decompressor, there are two public functions -- one that
uses a talloc context, and one that uses pre-allocated memory. The
compressor requires a tightly bounded amount of auxiliary memory
(>220kB) in a few different buffers, which is all gathered together in
the public struct lzxhuff_compressor_mem. An instantiated but not
initialised copy of this struct is required by the non-talloc
function; it can be used over and over again.

Our compression speed is about the same as the decompression speed
(between 20 and 500 MB/s on this laptop, depending on the data), and
our compression ratio is very similar to that of Windows.

Signed-off-by: Douglas Bagnall <douglas.bagnall@catalyst.net.nz>
Reviewed-by: Joseph Sutton <josephsutton@catalyst.net.nz>
2022-12-01 22:56:39 +00:00

88 lines
2.5 KiB
C

/*
* Samba compression library - LGPLv3
*
* Copyright © Catalyst IT 2022
*
* ** NOTE! The following LGPL license applies to this file.
* ** It does NOT imply that all of Samba is released under the LGPL
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 3 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, see <http://www.gnu.org/licenses/>.
*/
#ifndef HAVE_LZXPRESS_HUFFMAN_H
#define HAVE_LZXPRESS_HUFFMAN_H
/*
* One node of a binary tree: `left` and `right` link to other nodes of the
* same type. struct lzxhuff_compressor_mem keeps two arrays of these,
* named leaf_nodes and internal_nodes.
*
* NOTE(review): the per-field notes below are inferred from the field
* names only -- confirm against the implementation in lzxpress_huffman.c.
*/
struct huffman_node {
/* Child links. Presumably both NULL for a leaf -- TODO confirm. */
struct huffman_node *left;
struct huffman_node *right;
/* Presumably how often the symbol (or subtree) occurs -- TODO confirm. */
uint32_t count;
/* Presumably the symbol value a leaf stands for -- TODO confirm. */
uint16_t symbol;
/* Signed 8-bit; presumably the node's depth in the tree -- TODO confirm. */
int8_t depth;
};
/*
* LZX_HUFF_COMP_HASH_BITS is how big to make the hash tables
* (12 means 4096, etc).
*
* A larger number (up to 16) will be faster on long messages (fewer
* collisions), but probably slower on short ones (more prep).
*
* Each of hash_table1 and hash_table2 in struct lzxhuff_compressor_mem
* is declared with (1 << LZX_HUFF_COMP_HASH_BITS) uint16_t entries, so
* changing this value changes the size of that struct. At 14 that is
* 16384 entries (32 KiB) per table.
*/
#define LZX_HUFF_COMP_HASH_BITS 14
/*
* This struct just coalesces all the memory you need for LZ77 + Huffman
* compression together in one bundle.
*
* There are a few different things you want, you usually want them all, so
* this makes it easy to allocate them all at once.
*/
struct lzxhuff_compressor_mem {
/*
* Scratch storage passed to lzxpress_huffman_compress() as `cmp`.
* The arrays below add up to roughly 220 kB on a build with 8-byte
* pointers (about 131 kB of that is `intermediate`, 64 KiB the two
* hash tables), so think twice before putting one on the stack.
*
* NOTE(review): the purpose notes on individual members are inferred
* from their names and sizes -- confirm against lzxpress_huffman.c.
*/

/*
* Two pools of 512 tree nodes each. Presumably one leaf per symbol
* of a 512-symbol alphabet, plus the internal nodes of the Huffman
* tree built over them -- TODO confirm.
*/
struct huffman_node leaf_nodes[512];
struct huffman_node internal_nodes[512];
/* 512 16-bit values; presumably one entry per symbol -- TODO confirm. */
uint16_t symbol_values[512];
/*
* 65536 + 6 16-bit slots. Presumably the LZ77 output for one block
* before Huffman encoding, with a few slots of slack -- TODO confirm.
*/
uint16_t intermediate[65536 + 6];
/*
* Two hash tables of (1 << LZX_HUFF_COMP_HASH_BITS) 16-bit entries
* each.
*/
uint16_t hash_table1[1 << LZX_HUFF_COMP_HASH_BITS];
uint16_t hash_table2[1 << LZX_HUFF_COMP_HASH_BITS];
};
/*
* LZ77 + Huffman compression into a caller-supplied output buffer, using
* caller-supplied scratch memory.
*
* cmp:            scratch memory for the compressor.
*                 NOTE(review): per the commit that introduced this
*                 function, the struct does not need to be initialised by
*                 the caller and can be reused across calls -- confirm
*                 against lzxpress_huffman.c.
* input_bytes:    the data to compress (not modified; it is const).
* input_size:     number of bytes at input_bytes.
* output:         buffer that receives the compressed data.
* available_size: size of the output buffer in bytes.
*
* Returns an ssize_t. NOTE(review): presumably the number of bytes written
* to output, or a negative value on failure (e.g. output too small) --
* confirm against lzxpress_huffman.c.
*/
ssize_t lzxpress_huffman_compress(struct lzxhuff_compressor_mem *cmp,
const uint8_t *input_bytes,
size_t input_size,
uint8_t *output,
size_t available_size);
/*
* LZ77 + Huffman compression, talloc flavour: takes a talloc context
* instead of a scratch struct and a pre-sized output buffer.
*
* mem_ctx:     talloc context.
*              NOTE(review): presumably the parent of the returned buffer
*              (and of any temporary working memory) -- confirm.
* input_bytes: the data to compress (not modified; it is const).
* input_size:  number of bytes at input_bytes.
* output:      out-parameter.
*              NOTE(review): presumably set to the newly allocated buffer
*              holding the compressed data -- confirm.
*
* Returns an ssize_t. NOTE(review): presumably the compressed length, or a
* negative value on failure -- confirm against lzxpress_huffman.c.
*/
ssize_t lzxpress_huffman_compress_talloc(TALLOC_CTX *mem_ctx,
const uint8_t *input_bytes,
size_t input_size,
uint8_t **output);
/*
* LZ77 + Huffman decompression into a caller-supplied output buffer.
*
* input:           the compressed data (not modified; it is const).
* input_size:      number of bytes at input.
* output:          buffer that receives the decompressed data.
* max_output_size: size of the output buffer in bytes.
*
* Returns an ssize_t. NOTE(review): presumably the number of bytes written
* to output, or a negative value on failure -- confirm against
* lzxpress_huffman.c.
*/
ssize_t lzxpress_huffman_decompress(const uint8_t *input,
size_t input_size,
uint8_t *output,
size_t max_output_size);
/*
* LZ77 + Huffman decompression, talloc flavour: returns a buffer rather
* than filling one supplied by the caller.
*
* mem_ctx:     talloc context.
*              NOTE(review): presumably the parent of the returned buffer
*              -- confirm.
* input_bytes: the compressed data (not modified; it is const).
* input_size:  number of bytes at input_bytes.
* output_size: passed by value, so the caller has to supply the output
*              size; the function has no way to report one back.
*              NOTE(review): presumably this must be the exact
*              decompressed length -- confirm.
*
* Returns a uint8_t pointer. NOTE(review): presumably the decompressed
* data, or NULL on failure -- confirm against lzxpress_huffman.c.
*/
uint8_t *lzxpress_huffman_decompress_talloc(TALLOC_CTX *mem_ctx,
const uint8_t *input_bytes,
size_t input_size,
size_t output_size);
#endif /* HAVE_LZXPRESS_HUFFMAN_H */