2013-07-08 16:01:49 -07:00
/*
* LZ4 HC - High Compression Mode of LZ4
* Copyright ( C ) 2011 - 2012 , Yann Collet .
* BSD 2 - Clause License ( http : //www.opensource.org/licenses/bsd-license.php)
*
* Redistribution and use in source and binary forms , with or without
* modification , are permitted provided that the following conditions are
* met :
*
* * Redistributions of source code must retain the above copyright
* notice , this list of conditions and the following disclaimer .
* * Redistributions in binary form must reproduce the above
* copyright notice , this list of conditions and the following disclaimer
* in the documentation and / or other materials provided with the
* distribution .
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* " AS IS " AND ANY EXPRESS OR IMPLIED WARRANTIES , INCLUDING , BUT NOT
* LIMITED TO , THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED . IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT , INDIRECT , INCIDENTAL ,
* SPECIAL , EXEMPLARY , OR CONSEQUENTIAL DAMAGES ( INCLUDING , BUT NOT
* LIMITED TO , PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES ; LOSS OF USE ,
* DATA , OR PROFITS ; OR BUSINESS INTERRUPTION ) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY , WHETHER IN CONTRACT , STRICT LIABILITY , OR TORT
* ( INCLUDING NEGLIGENCE OR OTHERWISE ) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE , EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE .
*
* You can contact the author at :
* - LZ4 homepage : http : //fastcompression.blogspot.com/p/lz4.html
* - LZ4 source repository : http : //code.google.com/p/lz4/
*
* Changed for kernel use by :
* Chanho Min < chanho . min @ lge . com >
*/
# include <linux/module.h>
# include <linux/kernel.h>
# include <linux/lz4.h>
# include <asm/unaligned.h>
# include "lz4defs.h"
struct lz4hc_data {
const u8 * base ;
HTYPE hashtable [ HASHTABLESIZE ] ;
u16 chaintable [ MAXD ] ;
const u8 * nexttoupdate ;
} __attribute__ ( ( __packed__ ) ) ;
static inline int lz4hc_init ( struct lz4hc_data * hc4 , const u8 * base )
{
memset ( ( void * ) hc4 - > hashtable , 0 , sizeof ( hc4 - > hashtable ) ) ;
memset ( hc4 - > chaintable , 0xFF , sizeof ( hc4 - > chaintable ) ) ;
# if LZ4_ARCH64
hc4 - > nexttoupdate = base + 1 ;
# else
hc4 - > nexttoupdate = base ;
# endif
hc4 - > base = base ;
return 1 ;
}
/* Update chains up to ip (excluded) */
static inline void lz4hc_insert ( struct lz4hc_data * hc4 , const u8 * ip )
{
u16 * chaintable = hc4 - > chaintable ;
HTYPE * hashtable = hc4 - > hashtable ;
# if LZ4_ARCH64
const BYTE * const base = hc4 - > base ;
# else
const int base = 0 ;
# endif
while ( hc4 - > nexttoupdate < ip ) {
const u8 * p = hc4 - > nexttoupdate ;
size_t delta = p - ( hashtable [ HASH_VALUE ( p ) ] + base ) ;
if ( delta > MAX_DISTANCE )
delta = MAX_DISTANCE ;
chaintable [ ( size_t ) ( p ) & MAXD_MASK ] = ( u16 ) delta ;
hashtable [ HASH_VALUE ( p ) ] = ( p ) - base ;
hc4 - > nexttoupdate + + ;
}
}
static inline size_t lz4hc_commonlength ( const u8 * p1 , const u8 * p2 ,
const u8 * const matchlimit )
{
const u8 * p1t = p1 ;
while ( p1t < matchlimit - ( STEPSIZE - 1 ) ) {
# if LZ4_ARCH64
u64 diff = A64 ( p2 ) ^ A64 ( p1t ) ;
# else
u32 diff = A32 ( p2 ) ^ A32 ( p1t ) ;
# endif
if ( ! diff ) {
p1t + = STEPSIZE ;
p2 + = STEPSIZE ;
continue ;
}
p1t + = LZ4_NBCOMMONBYTES ( diff ) ;
return p1t - p1 ;
}
# if LZ4_ARCH64
if ( ( p1t < ( matchlimit - 3 ) ) & & ( A32 ( p2 ) = = A32 ( p1t ) ) ) {
p1t + = 4 ;
p2 + = 4 ;
}
# endif
if ( ( p1t < ( matchlimit - 1 ) ) & & ( A16 ( p2 ) = = A16 ( p1t ) ) ) {
p1t + = 2 ;
p2 + = 2 ;
}
if ( ( p1t < matchlimit ) & & ( * p2 = = * p1t ) )
p1t + + ;
return p1t - p1 ;
}
static inline int lz4hc_insertandfindbestmatch ( struct lz4hc_data * hc4 ,
const u8 * ip , const u8 * const matchlimit , const u8 * * matchpos )
{
u16 * const chaintable = hc4 - > chaintable ;
HTYPE * const hashtable = hc4 - > hashtable ;
const u8 * ref ;
# if LZ4_ARCH64
const BYTE * const base = hc4 - > base ;
# else
const int base = 0 ;
# endif
int nbattempts = MAX_NB_ATTEMPTS ;
size_t repl = 0 , ml = 0 ;
u16 delta ;
/* HC4 match finder */
lz4hc_insert ( hc4 , ip ) ;
ref = hashtable [ HASH_VALUE ( ip ) ] + base ;
/* potential repetition */
if ( ref > = ip - 4 ) {
/* confirmed */
if ( A32 ( ref ) = = A32 ( ip ) ) {
delta = ( u16 ) ( ip - ref ) ;
repl = ml = lz4hc_commonlength ( ip + MINMATCH ,
ref + MINMATCH , matchlimit ) + MINMATCH ;
* matchpos = ref ;
}
ref - = ( size_t ) chaintable [ ( size_t ) ( ref ) & MAXD_MASK ] ;
}
while ( ( ref > = ip - MAX_DISTANCE ) & & nbattempts ) {
nbattempts - - ;
if ( * ( ref + ml ) = = * ( ip + ml ) ) {
if ( A32 ( ref ) = = A32 ( ip ) ) {
size_t mlt =
lz4hc_commonlength ( ip + MINMATCH ,
ref + MINMATCH , matchlimit ) + MINMATCH ;
if ( mlt > ml ) {
ml = mlt ;
* matchpos = ref ;
}
}
}
ref - = ( size_t ) chaintable [ ( size_t ) ( ref ) & MAXD_MASK ] ;
}
/* Complete table */
if ( repl ) {
const BYTE * ptr = ip ;
const BYTE * end ;
end = ip + repl - ( MINMATCH - 1 ) ;
/* Pre-Load */
while ( ptr < end - delta ) {
chaintable [ ( size_t ) ( ptr ) & MAXD_MASK ] = delta ;
ptr + + ;
}
do {
chaintable [ ( size_t ) ( ptr ) & MAXD_MASK ] = delta ;
/* Head of chain */
hashtable [ HASH_VALUE ( ptr ) ] = ( ptr ) - base ;
ptr + + ;
} while ( ptr < end ) ;
hc4 - > nexttoupdate = end ;
}
return ( int ) ml ;
}
static inline int lz4hc_insertandgetwidermatch ( struct lz4hc_data * hc4 ,
const u8 * ip , const u8 * startlimit , const u8 * matchlimit , int longest ,
const u8 * * matchpos , const u8 * * startpos )
{
u16 * const chaintable = hc4 - > chaintable ;
HTYPE * const hashtable = hc4 - > hashtable ;
# if LZ4_ARCH64
const BYTE * const base = hc4 - > base ;
# else
const int base = 0 ;
# endif
const u8 * ref ;
int nbattempts = MAX_NB_ATTEMPTS ;
int delta = ( int ) ( ip - startlimit ) ;
/* First Match */
lz4hc_insert ( hc4 , ip ) ;
ref = hashtable [ HASH_VALUE ( ip ) ] + base ;
while ( ( ref > = ip - MAX_DISTANCE ) & & ( ref > = hc4 - > base )
& & ( nbattempts ) ) {
nbattempts - - ;
if ( * ( startlimit + longest ) = = * ( ref - delta + longest ) ) {
if ( A32 ( ref ) = = A32 ( ip ) ) {
const u8 * reft = ref + MINMATCH ;
const u8 * ipt = ip + MINMATCH ;
const u8 * startt = ip ;
while ( ipt < matchlimit - ( STEPSIZE - 1 ) ) {
# if LZ4_ARCH64
u64 diff = A64 ( reft ) ^ A64 ( ipt ) ;
# else
u32 diff = A32 ( reft ) ^ A32 ( ipt ) ;
# endif
if ( ! diff ) {
ipt + = STEPSIZE ;
reft + = STEPSIZE ;
continue ;
}
ipt + = LZ4_NBCOMMONBYTES ( diff ) ;
goto _endcount ;
}
# if LZ4_ARCH64
if ( ( ipt < ( matchlimit - 3 ) )
& & ( A32 ( reft ) = = A32 ( ipt ) ) ) {
ipt + = 4 ;
reft + = 4 ;
}
ipt + = 2 ;
# endif
if ( ( ipt < ( matchlimit - 1 ) )
& & ( A16 ( reft ) = = A16 ( ipt ) ) ) {
reft + = 2 ;
}
if ( ( ipt < matchlimit ) & & ( * reft = = * ipt ) )
ipt + + ;
_endcount :
reft = ref ;
while ( ( startt > startlimit )
& & ( reft > hc4 - > base )
& & ( startt [ - 1 ] = = reft [ - 1 ] ) ) {
startt - - ;
reft - - ;
}
if ( ( ipt - startt ) > longest ) {
longest = ( int ) ( ipt - startt ) ;
* matchpos = reft ;
* startpos = startt ;
}
}
}
ref - = ( size_t ) chaintable [ ( size_t ) ( ref ) & MAXD_MASK ] ;
}
return longest ;
}
static inline int lz4_encodesequence ( const u8 * * ip , u8 * * op , const u8 * * anchor ,
int ml , const u8 * ref )
{
int length , len ;
u8 * token ;
/* Encode Literal length */
length = ( int ) ( * ip - * anchor ) ;
token = ( * op ) + + ;
if ( length > = ( int ) RUN_MASK ) {
* token = ( RUN_MASK < < ML_BITS ) ;
len = length - RUN_MASK ;
for ( ; len > 254 ; len - = 255 )
* ( * op ) + + = 255 ;
* ( * op ) + + = ( u8 ) len ;
} else
* token = ( length < < ML_BITS ) ;
/* Copy Literals */
LZ4_BLINDCOPY ( * anchor , * op , length ) ;
/* Encode Offset */
LZ4_WRITE_LITTLEENDIAN_16 ( * op , ( u16 ) ( * ip - ref ) ) ;
/* Encode MatchLength */
len = ( int ) ( ml - MINMATCH ) ;
if ( len > = ( int ) ML_MASK ) {
* token + = ML_MASK ;
len - = ML_MASK ;
for ( ; len > 509 ; len - = 510 ) {
* ( * op ) + + = 255 ;
* ( * op ) + + = 255 ;
}
if ( len > 254 ) {
len - = 255 ;
* ( * op ) + + = 255 ;
}
* ( * op ) + + = ( u8 ) len ;
} else
* token + = len ;
/* Prepare next loop */
* ip + = ml ;
* anchor = * ip ;
return 0 ;
}
static int lz4_compresshcctx ( struct lz4hc_data * ctx ,
const char * source ,
char * dest ,
int isize )
{
const u8 * ip = ( const u8 * ) source ;
const u8 * anchor = ip ;
const u8 * const iend = ip + isize ;
const u8 * const mflimit = iend - MFLIMIT ;
const u8 * const matchlimit = ( iend - LASTLITERALS ) ;
u8 * op = ( u8 * ) dest ;
int ml , ml2 , ml3 , ml0 ;
const u8 * ref = NULL ;
const u8 * start2 = NULL ;
const u8 * ref2 = NULL ;
const u8 * start3 = NULL ;
const u8 * ref3 = NULL ;
const u8 * start0 ;
const u8 * ref0 ;
int lastrun ;
ip + + ;
/* Main Loop */
while ( ip < mflimit ) {
ml = lz4hc_insertandfindbestmatch ( ctx , ip , matchlimit , ( & ref ) ) ;
if ( ! ml ) {
ip + + ;
continue ;
}
/* saved, in case we would skip too much */
start0 = ip ;
ref0 = ref ;
ml0 = ml ;
_search2 :
if ( ip + ml < mflimit )
ml2 = lz4hc_insertandgetwidermatch ( ctx , ip + ml - 2 ,
ip + 1 , matchlimit , ml , & ref2 , & start2 ) ;
else
ml2 = ml ;
/* No better match */
if ( ml2 = = ml ) {
lz4_encodesequence ( & ip , & op , & anchor , ml , ref ) ;
continue ;
}
if ( start0 < ip ) {
/* empirical */
if ( start2 < ip + ml0 ) {
ip = start0 ;
ref = ref0 ;
ml = ml0 ;
}
}
/*
* Here , start0 = = ip
* First Match too small : removed
*/
if ( ( start2 - ip ) < 3 ) {
ml = ml2 ;
ip = start2 ;
ref = ref2 ;
goto _search2 ;
}
_search3 :
/*
* Currently we have :
* ml2 > ml1 , and
* ip1 + 3 < = ip2 ( usually < ip1 + ml1 )
*/
if ( ( start2 - ip ) < OPTIMAL_ML ) {
int correction ;
int new_ml = ml ;
if ( new_ml > OPTIMAL_ML )
new_ml = OPTIMAL_ML ;
if ( ip + new_ml > start2 + ml2 - MINMATCH )
new_ml = ( int ) ( start2 - ip ) + ml2 - MINMATCH ;
correction = new_ml - ( int ) ( start2 - ip ) ;
if ( correction > 0 ) {
start2 + = correction ;
ref2 + = correction ;
ml2 - = correction ;
}
}
/*
* Now , we have start2 = ip + new_ml ,
* with new_ml = min ( ml , OPTIMAL_ML = 18 )
*/
if ( start2 + ml2 < mflimit )
ml3 = lz4hc_insertandgetwidermatch ( ctx ,
start2 + ml2 - 3 , start2 , matchlimit ,
ml2 , & ref3 , & start3 ) ;
else
ml3 = ml2 ;
/* No better match : 2 sequences to encode */
if ( ml3 = = ml2 ) {
/* ip & ref are known; Now for ml */
if ( start2 < ip + ml )
ml = ( int ) ( start2 - ip ) ;
/* Now, encode 2 sequences */
lz4_encodesequence ( & ip , & op , & anchor , ml , ref ) ;
ip = start2 ;
lz4_encodesequence ( & ip , & op , & anchor , ml2 , ref2 ) ;
continue ;
}
/* Not enough space for match 2 : remove it */
if ( start3 < ip + ml + 3 ) {
/*
* can write Seq1 immediately = = > Seq2 is removed ,
* so Seq3 becomes Seq1
*/
if ( start3 > = ( ip + ml ) ) {
if ( start2 < ip + ml ) {
int correction =
( int ) ( ip + ml - start2 ) ;
start2 + = correction ;
ref2 + = correction ;
ml2 - = correction ;
if ( ml2 < MINMATCH ) {
start2 = start3 ;
ref2 = ref3 ;
ml2 = ml3 ;
}
}
lz4_encodesequence ( & ip , & op , & anchor , ml , ref ) ;
ip = start3 ;
ref = ref3 ;
ml = ml3 ;
start0 = start2 ;
ref0 = ref2 ;
ml0 = ml2 ;
goto _search2 ;
}
start2 = start3 ;
ref2 = ref3 ;
ml2 = ml3 ;
goto _search3 ;
}
/*
* OK , now we have 3 ascending matches ; let ' s write at least
* the first one ip & ref are known ; Now for ml
*/
if ( start2 < ip + ml ) {
if ( ( start2 - ip ) < ( int ) ML_MASK ) {
int correction ;
if ( ml > OPTIMAL_ML )
ml = OPTIMAL_ML ;
if ( ip + ml > start2 + ml2 - MINMATCH )
ml = ( int ) ( start2 - ip ) + ml2
- MINMATCH ;
correction = ml - ( int ) ( start2 - ip ) ;
if ( correction > 0 ) {
start2 + = correction ;
ref2 + = correction ;
ml2 - = correction ;
}
} else
ml = ( int ) ( start2 - ip ) ;
}
lz4_encodesequence ( & ip , & op , & anchor , ml , ref ) ;
ip = start2 ;
ref = ref2 ;
ml = ml2 ;
start2 = start3 ;
ref2 = ref3 ;
ml2 = ml3 ;
goto _search3 ;
}
/* Encode Last Literals */
lastrun = ( int ) ( iend - anchor ) ;
if ( lastrun > = ( int ) RUN_MASK ) {
* op + + = ( RUN_MASK < < ML_BITS ) ;
lastrun - = RUN_MASK ;
for ( ; lastrun > 254 ; lastrun - = 255 )
* op + + = 255 ;
* op + + = ( u8 ) lastrun ;
} else
* op + + = ( lastrun < < ML_BITS ) ;
memcpy ( op , anchor , iend - anchor ) ;
op + = iend - anchor ;
/* End */
return ( int ) ( ( ( char * ) op ) - dest ) ;
}
int lz4hc_compress ( const unsigned char * src , size_t src_len ,
unsigned char * dst , size_t * dst_len , void * wrkmem )
{
int ret = - 1 ;
int out_len = 0 ;
struct lz4hc_data * hc4 = ( struct lz4hc_data * ) wrkmem ;
lz4hc_init ( hc4 , ( const u8 * ) src ) ;
out_len = lz4_compresshcctx ( ( struct lz4hc_data * ) hc4 , ( const u8 * ) src ,
( char * ) dst , ( int ) src_len ) ;
if ( out_len < 0 )
goto exit ;
* dst_len = out_len ;
return 0 ;
exit :
return ret ;
}
2013-08-22 16:35:47 -07:00
EXPORT_SYMBOL ( lz4hc_compress ) ;
2013-07-08 16:01:49 -07:00
2013-08-22 16:35:47 -07:00
MODULE_LICENSE ( " Dual BSD/GPL " ) ;
2013-07-08 16:01:49 -07:00
MODULE_DESCRIPTION ( " LZ4HC compressor " ) ;