2008-07-10 09:31:43 +00:00
/*
* Copyright ( C ) Matthieu Suiche 2008
*
* All rights reserved .
*
* Redistribution and use in source and binary forms , with or without
* modification , are permitted provided that the following conditions
* are met :
*
* 1. Redistributions of source code must retain the above copyright
* notice , this list of conditions and the following disclaimer .
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice , this list of conditions and the following disclaimer in the
* documentation and / or other materials provided with the distribution .
*
* 3. Neither the name of the author nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission .
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ` ` AS IS ' ' AND
* ANY EXPRESS OR IMPLIED WARRANTIES , INCLUDING , BUT NOT LIMITED TO , THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED . IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT , INDIRECT , INCIDENTAL , SPECIAL , EXEMPLARY , OR CONSEQUENTIAL
* DAMAGES ( INCLUDING , BUT NOT LIMITED TO , PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES ; LOSS OF USE , DATA , OR PROFITS ; OR BUSINESS INTERRUPTION )
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY , WHETHER IN CONTRACT , STRICT
* LIABILITY , OR TORT ( INCLUDING NEGLIGENCE OR OTHERWISE ) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE , EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE .
*
*/
# include "replace.h"
# include "lzxpress.h"
2010-11-26 23:45:13 +03:00
# include "../lib/util/byteorder.h"
2008-07-10 09:31:43 +00:00
# define __BUF_POS_CONST(buf,ofs)(((const uint8_t *)buf)+(ofs))
# define __PULL_BYTE(buf,ofs) \
( ( uint8_t ) ( ( * __BUF_POS_CONST ( buf , ofs ) ) & 0xFF ) )
# ifndef PULL_LE_UINT16
# define PULL_LE_UINT16(buf,ofs) ((uint16_t)( \
( ( uint16_t ) ( ( ( uint16_t ) ( __PULL_BYTE ( buf , ( ofs ) + 0 ) ) ) < < 0 ) ) | \
( ( uint16_t ) ( ( ( uint16_t ) ( __PULL_BYTE ( buf , ( ofs ) + 1 ) ) ) < < 8 ) ) \
) )
# endif
# ifndef PULL_LE_UINT32
# define PULL_LE_UINT32(buf,ofs) ((uint32_t)( \
( ( uint32_t ) ( ( ( uint32_t ) ( __PULL_BYTE ( buf , ( ofs ) + 0 ) ) ) < < 0 ) ) | \
( ( uint32_t ) ( ( ( uint32_t ) ( __PULL_BYTE ( buf , ( ofs ) + 1 ) ) ) < < 8 ) ) | \
( ( uint32_t ) ( ( ( uint32_t ) ( __PULL_BYTE ( buf , ( ofs ) + 2 ) ) ) < < 16 ) ) | \
( ( uint32_t ) ( ( ( uint32_t ) ( __PULL_BYTE ( buf , ( ofs ) + 3 ) ) ) < < 24 ) ) \
) )
# endif
2008-07-10 09:31:43 +00:00
ssize_t lzxpress_compress ( const uint8_t * uncompressed ,
uint32_t uncompressed_size ,
uint8_t * compressed ,
uint32_t max_compressed_size )
{
uint32_t uncompressed_pos , compressed_pos , byte_left ;
uint32_t max_offset , best_offset ;
int32_t offset ;
uint32_t max_len , len , best_len ;
const uint8_t * str1 , * str2 ;
uint32_t indic ;
uint8_t * indic_pos ;
uint32_t indic_bit , nibble_index ;
uint32_t metadata_size ;
uint16_t metadata ;
uint16_t * dest ;
if ( ! uncompressed_size ) {
return 0 ;
}
uncompressed_pos = 0 ;
indic = 0 ;
2010-11-05 09:00:57 +11:00
* ( uint32_t * ) compressed = 0 ;
2008-07-10 09:31:43 +00:00
compressed_pos = sizeof ( uint32_t ) ;
indic_pos = & compressed [ 0 ] ;
byte_left = uncompressed_size ;
indic_bit = 0 ;
nibble_index = 0 ;
if ( uncompressed_pos > XPRESS_BLOCK_SIZE )
return 0 ;
do {
bool found = false ;
max_offset = uncompressed_pos ;
str1 = & uncompressed [ uncompressed_pos ] ;
best_len = 2 ;
best_offset = 0 ;
max_offset = MIN ( 0x1FFF , max_offset ) ;
/* search for the longest match in the window for the lookahead buffer */
for ( offset = 1 ; ( uint32_t ) offset < = max_offset ; offset + + ) {
str2 = & str1 [ - offset ] ;
/* maximum len we can encode into metadata */
max_len = MIN ( ( 255 + 15 + 7 + 3 ) , byte_left ) ;
for ( len = 0 ; ( len < max_len ) & & ( str1 [ len ] = = str2 [ len ] ) ; len + + ) ;
/*
* We check if len is better than the value found before , including the
* sequence of identical bytes
*/
if ( len > best_len ) {
found = true ;
best_len = len ;
best_offset = offset ;
}
}
if ( found ) {
metadata_size = 0 ;
dest = ( uint16_t * ) & compressed [ compressed_pos ] ;
if ( best_len < 10 ) {
/* Classical meta-data */
metadata = ( uint16_t ) ( ( ( best_offset - 1 ) < < 3 ) | ( best_len - 3 ) ) ;
2010-11-26 23:45:13 +03:00
SSVAL ( dest , metadata_size / sizeof ( uint16_t ) , metadata ) ;
2008-07-10 09:31:43 +00:00
metadata_size + = sizeof ( uint16_t ) ;
} else {
metadata = ( uint16_t ) ( ( ( best_offset - 1 ) < < 3 ) | 7 ) ;
2010-11-26 23:45:13 +03:00
SSVAL ( dest , metadata_size / sizeof ( uint16_t ) , metadata ) ;
2008-07-10 09:31:43 +00:00
metadata_size = sizeof ( uint16_t ) ;
if ( best_len < ( 15 + 7 + 3 ) ) {
/* Shared byte */
if ( ! nibble_index ) {
compressed [ compressed_pos + metadata_size ] = ( best_len - ( 3 + 7 ) ) & 0xF ;
metadata_size + = sizeof ( uint8_t ) ;
} else {
compressed [ nibble_index ] & = 0xF ;
compressed [ nibble_index ] | = ( best_len - ( 3 + 7 ) ) * 16 ;
}
} else if ( best_len < ( 3 + 7 + 15 + 255 ) ) {
/* Shared byte */
if ( ! nibble_index ) {
compressed [ compressed_pos + metadata_size ] = 15 ;
metadata_size + = sizeof ( uint8_t ) ;
} else {
compressed [ nibble_index ] & = 0xF ;
compressed [ nibble_index ] | = ( 15 * 16 ) ;
}
2010-02-21 16:33:24 +11:00
/* Additional best_len */
2008-07-10 09:31:43 +00:00
compressed [ compressed_pos + metadata_size ] = ( best_len - ( 3 + 7 + 15 ) ) & 0xFF ;
metadata_size + = sizeof ( uint8_t ) ;
} else {
/* Shared byte */
if ( ! nibble_index ) {
compressed [ compressed_pos + metadata_size ] | = 15 ;
metadata_size + = sizeof ( uint8_t ) ;
} else {
compressed [ nibble_index ] | = 15 < < 4 ;
}
2010-02-21 16:33:24 +11:00
/* Additional best_len */
2008-07-10 09:31:43 +00:00
compressed [ compressed_pos + metadata_size ] = 255 ;
metadata_size + = sizeof ( uint8_t ) ;
compressed [ compressed_pos + metadata_size ] = ( best_len - 3 ) & 0xFF ;
compressed [ compressed_pos + metadata_size + 1 ] = ( ( best_len - 3 ) > > 8 ) & 0xFF ;
metadata_size + = sizeof ( uint16_t ) ;
}
}
2020-08-06 17:17:01 +12:00
indic | = 1U < < ( 32 - ( ( indic_bit % 32 ) + 1 ) ) ;
2008-07-10 09:31:43 +00:00
if ( best_len > 9 ) {
if ( nibble_index = = 0 ) {
nibble_index = compressed_pos + sizeof ( uint16_t ) ;
} else {
nibble_index = 0 ;
}
}
compressed_pos + = metadata_size ;
uncompressed_pos + = best_len ;
byte_left - = best_len ;
} else {
compressed [ compressed_pos + + ] = uncompressed [ uncompressed_pos + + ] ;
byte_left - - ;
}
indic_bit + + ;
if ( ( indic_bit - 1 ) % 32 > ( indic_bit % 32 ) ) {
2010-11-26 23:45:13 +03:00
SIVAL ( indic_pos , 0 , indic ) ;
2008-07-10 09:31:43 +00:00
indic = 0 ;
indic_pos = & compressed [ compressed_pos ] ;
compressed_pos + = sizeof ( uint32_t ) ;
}
} while ( byte_left > 3 ) ;
do {
compressed [ compressed_pos ] = uncompressed [ uncompressed_pos ] ;
indic_bit + + ;
uncompressed_pos + + ;
compressed_pos + + ;
if ( ( ( indic_bit - 1 ) % 32 ) > ( indic_bit % 32 ) ) {
2010-11-26 23:45:13 +03:00
SIVAL ( indic_pos , 0 , indic ) ;
2008-07-10 09:31:43 +00:00
indic = 0 ;
indic_pos = & compressed [ compressed_pos ] ;
compressed_pos + = sizeof ( uint32_t ) ;
}
} while ( uncompressed_pos < uncompressed_size ) ;
if ( ( indic_bit % 32 ) > 0 ) {
for ( ; ( indic_bit % 32 ) ! = 0 ; indic_bit + + )
indic | = 0 < < ( 32 - ( ( indic_bit % 32 ) + 1 ) ) ;
2018-11-22 15:11:09 +01:00
SIVAL ( compressed , compressed_pos , 0 ) ;
2010-11-26 23:45:13 +03:00
SIVAL ( indic_pos , 0 , indic ) ;
2008-07-10 09:31:43 +00:00
compressed_pos + = sizeof ( uint32_t ) ;
}
return compressed_pos ;
}
2008-07-10 09:31:43 +00:00
ssize_t lzxpress_decompress ( const uint8_t * input ,
uint32_t input_size ,
uint8_t * output ,
uint32_t max_output_size )
2008-07-10 09:31:43 +00:00
{
uint32_t output_index , input_index ;
uint32_t indicator , indicator_bit ;
uint32_t length ;
uint32_t offset ;
uint32_t nibble_index ;
output_index = 0 ;
input_index = 0 ;
indicator = 0 ;
indicator_bit = 0 ;
length = 0 ;
offset = 0 ;
nibble_index = 0 ;
2019-11-07 10:03:36 +01:00
# define __CHECK_BYTES(__size, __index, __needed) do { \
if ( unlikely ( __index > = __size ) ) { \
return - 1 ; \
} else { \
uint32_t __avail = __size - __index ; \
if ( unlikely ( __needed > __avail ) ) { \
return - 1 ; \
} \
} \
} while ( 0 )
# define CHECK_INPUT_BYTES(__needed) \
__CHECK_BYTES ( input_size , input_index , __needed )
# define CHECK_OUTPUT_BYTES(__needed) \
__CHECK_BYTES ( max_output_size , output_index , __needed )
2008-07-10 09:31:43 +00:00
do {
if ( indicator_bit = = 0 ) {
2019-11-07 10:03:36 +01:00
CHECK_INPUT_BYTES ( 4 ) ;
2008-07-10 09:31:43 +00:00
indicator = PULL_LE_UINT32 ( input , input_index ) ;
input_index + = sizeof ( uint32_t ) ;
indicator_bit = 32 ;
}
indicator_bit - - ;
/*
* check whether the bit specified by indicator_bit is set or not
* set in indicator . For example , if indicator_bit has value 4
* check whether the 4 th bit of the value in indicator is set
*/
if ( ( ( indicator > > indicator_bit ) & 1 ) = = 0 ) {
2019-11-07 10:03:36 +01:00
CHECK_INPUT_BYTES ( 1 ) ;
CHECK_OUTPUT_BYTES ( 1 ) ;
2008-07-10 09:31:43 +00:00
output [ output_index ] = input [ input_index ] ;
input_index + = sizeof ( uint8_t ) ;
output_index + = sizeof ( uint8_t ) ;
} else {
2019-11-07 10:03:36 +01:00
CHECK_INPUT_BYTES ( 2 ) ;
2008-07-10 09:31:43 +00:00
length = PULL_LE_UINT16 ( input , input_index ) ;
input_index + = sizeof ( uint16_t ) ;
offset = length / 8 ;
length = length % 8 ;
if ( length = = 7 ) {
if ( nibble_index = = 0 ) {
2019-11-07 10:03:36 +01:00
CHECK_INPUT_BYTES ( 1 ) ;
2008-07-10 09:31:43 +00:00
nibble_index = input_index ;
length = input [ input_index ] % 16 ;
input_index + = sizeof ( uint8_t ) ;
} else {
length = input [ nibble_index ] / 16 ;
nibble_index = 0 ;
}
if ( length = = 15 ) {
2019-11-07 10:03:36 +01:00
CHECK_INPUT_BYTES ( 1 ) ;
2008-07-10 09:31:43 +00:00
length = input [ input_index ] ;
input_index + = sizeof ( uint8_t ) ;
2008-07-10 09:31:43 +00:00
if ( length = = 255 ) {
2019-11-07 10:03:36 +01:00
CHECK_INPUT_BYTES ( 2 ) ;
2008-07-10 09:31:43 +00:00
length = PULL_LE_UINT16 ( input , input_index ) ;
input_index + = sizeof ( uint16_t ) ;
length - = ( 15 + 7 ) ;
}
2008-07-10 09:31:43 +00:00
length + = 15 ;
}
length + = 7 ;
}
length + = 3 ;
2019-11-07 10:03:36 +01:00
if ( length = = 0 ) {
return - 1 ;
}
2008-07-10 09:31:43 +00:00
2019-11-07 10:03:36 +01:00
if ( offset > = output_index ) {
return - 1 ;
}
CHECK_OUTPUT_BYTES ( length ) ;
2008-07-10 09:31:43 +00:00
2019-11-07 10:03:36 +01:00
do {
2008-07-10 09:31:43 +00:00
output [ output_index ] = output [ output_index - offset - 1 ] ;
2008-07-10 09:31:43 +00:00
2008-07-10 09:31:43 +00:00
output_index + = sizeof ( uint8_t ) ;
length - = sizeof ( uint8_t ) ;
} while ( length ! = 0 ) ;
}
2008-07-10 09:31:43 +00:00
} while ( ( output_index < max_output_size ) & & ( input_index < ( input_size ) ) ) ;
2008-07-10 09:31:43 +00:00
return output_index ;
}