/* LZ4 - Fast LZ compression algorithm Copyright (C) 2011-2013, Yann Collet. BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. You can contact the author at : - LZ4 homepage : http://fastcompression.blogspot.com/p/lz4.html - LZ4 source repository : http://code.google.com/p/lz4/ */ /* Note : this source file requires "hammer2_lz4_encoder.h" */ //************************************** // Tuning parameters //************************************** // MEMORY_USAGE : // Memory usage formula : N->2^N Bytes (examples : 10 -> 1KB; 12 -> 4KB; // 16 -> 64KB; 20 -> 1MB; etc.) // Increasing memory usage improves compression ratio // Reduced memory usage can improve speed, due to cache effect // Default value is 14, for 16KB, which nicely fits into Intel x86 L1 cache #define MEMORY_USAGE 14 // HEAPMODE : // Select how default compression function will allocate memory for its // hash table, // in memory stack (0:default, fastest), or in memory heap (1:requires // memory allocation (malloc)). // Default allocation strategy is to use stack (HEAPMODE 0) // Note : explicit functions *_stack* and *_heap* are unaffected by this setting #define HEAPMODE 1 // BIG_ENDIAN_NATIVE_BUT_INCOMPATIBLE : // This will provide a small boost to performance for big endian cpu, // but the resulting compressed stream will be incompatible with little-endian CPU. // You can set this option to 1 in situations where data will remain within // closed environment // This option is useless on Little_Endian CPU (such as x86) //#define BIG_ENDIAN_NATIVE_BUT_INCOMPATIBLE 1 //************************************** // CPU Feature Detection //************************************** // 32 or 64 bits ? #if (defined(__x86_64__) || defined(_M_X64)) // Detects 64 bits mode # define LZ4_ARCH64 1 #else # define LZ4_ARCH64 0 #endif //This reduced library code is only Little Endian compatible, //if the need arises, please look for the appropriate defines in the //original complete LZ4 library. //Same is true for unaligned memory access which is enabled by default, //hardware bit count, also enabled by default, and Microsoft/Visual //Studio compilers. //************************************** // Compiler Options //************************************** #if defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L // C99 /* "restrict" is a known keyword */ #else # define restrict // Disable restrict #endif #define GCC_VERSION (__GNUC__ * 100 + __GNUC_MINOR__) #if (GCC_VERSION >= 302) || (__INTEL_COMPILER >= 800) || defined(__clang__) # define expect(expr,value) (__builtin_expect ((expr),(value)) ) #else # define expect(expr,value) (expr) #endif #define likely(expr) expect((expr) != 0, 1) #define unlikely(expr) expect((expr) != 0, 0) //************************************** // Includes //************************************** #include //for malloc macros #include "hammer2.h" #include "hammer2_lz4.h" //Declaration for kmalloc functions MALLOC_DECLARE(C_HASHTABLE); MALLOC_DEFINE(C_HASHTABLE, "comphashtable", "A hash table used by LZ4 compression function."); //************************************** // Basic Types //************************************** #if defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L // C99 # include typedef uint8_t BYTE; typedef uint16_t U16; typedef uint32_t U32; typedef int32_t S32; typedef uint64_t U64; #else typedef unsigned char BYTE; typedef unsigned short U16; typedef unsigned int U32; typedef signed int S32; typedef unsigned long long U64; #endif #if defined(__GNUC__) && !defined(LZ4_FORCE_UNALIGNED_ACCESS) # define _PACKED __attribute__ ((packed)) #else # define _PACKED #endif #if !defined(LZ4_FORCE_UNALIGNED_ACCESS) && !defined(__GNUC__) # pragma pack(push, 1) #endif typedef struct _U16_S { U16 v; } _PACKED U16_S; typedef struct _U32_S { U32 v; } _PACKED U32_S; typedef struct _U64_S { U64 v; } _PACKED U64_S; #if !defined(LZ4_FORCE_UNALIGNED_ACCESS) && !defined(__GNUC__) # pragma pack(pop) #endif #define A64(x) (((U64_S *)(x))->v) #define A32(x) (((U32_S *)(x))->v) #define A16(x) (((U16_S *)(x))->v) //************************************** // Constants //************************************** #define HASHTABLESIZE (1 << MEMORY_USAGE) #define MINMATCH 4 #define COPYLENGTH 8 #define LASTLITERALS 5 #define MFLIMIT (COPYLENGTH+MINMATCH) #define MINLENGTH (MFLIMIT+1) #define LZ4_64KLIMIT ((1<<16) + (MFLIMIT-1)) #define SKIPSTRENGTH 6 // Increasing this value will make the compression run slower on // incompressible data #define MAXD_LOG 16 #define MAX_DISTANCE ((1 << MAXD_LOG) - 1) #define ML_BITS 4 #define ML_MASK ((1U<>3); #elif defined(__GNUC__) && (GCC_VERSION >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT) return (__builtin_clzll(val) >> 3); #else int r; if (!(val>>32)) { r=4; } else { r=0; val>>=32; } if (!(val>>16)) { r+=2; val>>=8; } else { val>>=24; } r += (!val); return r; #endif #else #if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT) unsigned long r = 0; _BitScanForward64( &r, val ); return (int)(r>>3); #elif defined(__GNUC__) && (GCC_VERSION >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT) return (__builtin_ctzll(val) >> 3); #else static int DeBruijnBytePos[64] = { 0, 0, 0, 0, 0, 1, 1, 2, 0, 3, 1, 3, 1, 4, 2, 7, 0, 2, 3, 6, 1, 5, 3, 5, 1, 3, 4, 4, 2, 5, 6, 7, 7, 0, 1, 2, 3, 3, 4, 6, 2, 6, 5, 5, 3, 4, 5, 6, 7, 1, 2, 4, 6, 4, 4, 5, 7, 2, 6, 5, 7, 6, 7, 7 }; return DeBruijnBytePos[((U64)((val & -val) * 0x0218A392CDABBD3F)) >> 58]; #endif #endif } #else static inline int LZ4_NbCommonBytes (register U32 val) { #if defined(LZ4_BIG_ENDIAN) # if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT) unsigned long r = 0; _BitScanReverse( &r, val ); return (int)(r>>3); # elif defined(__GNUC__) && (GCC_VERSION >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT) return (__builtin_clz(val) >> 3); # else int r; if (!(val>>16)) { r=2; val>>=8; } else { r=0; val>>=24; } r += (!val); return r; # endif #else # if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT) unsigned long r; _BitScanForward( &r, val ); return (int)(r>>3); # elif defined(__GNUC__) && (GCC_VERSION >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT) return (__builtin_ctz(val) >> 3); # else static int DeBruijnBytePos[32] = { 0, 0, 3, 0, 3, 1, 3, 0, 3, 2, 2, 1, 3, 2, 0, 1, 3, 3, 1, 2, 2, 2, 2, 0, 3, 1, 2, 0, 1, 0, 1, 1 }; return DeBruijnBytePos[((U32)((val & -(S32)val) * 0x077CB531U)) >> 27]; # endif #endif } #endif //****************************** // Compression functions //****************************** #include "hammer2_lz4_encoder.h" /* void* LZ4_createHeapMemory(); int LZ4_freeHeapMemory(void* ctx); Used to allocate and free hashTable memory to be used by the LZ4_compress_heap* family of functions. LZ4_createHeapMemory() returns NULL is memory allocation fails. */ void* LZ4_create(void) { return kmalloc(HASHTABLESIZE, C_HASHTABLE, M_INTWAIT); } int LZ4_free(void* ctx) { kfree(ctx, C_HASHTABLE); return 0; } int LZ4_compress_limitedOutput(char* source, char* dest, int inputSize, int maxOutputSize) { void* ctx = LZ4_create(); int result; if (ctx == NULL) return 0; // Failed allocation => compression not done if (inputSize < LZ4_64KLIMIT) result = LZ4_compress64k_heap_limitedOutput(ctx, source, dest, inputSize, maxOutputSize); else result = LZ4_compress_heap_limitedOutput(ctx, source, dest, inputSize, maxOutputSize); LZ4_free(ctx); return result; } //**************************** // Decompression functions //**************************** typedef enum { noPrefix = 0, withPrefix = 1 } prefix64k_directive; typedef enum { endOnOutputSize = 0, endOnInputSize = 1 } end_directive; typedef enum { full = 0, partial = 1 } exit_directive; // This generic decompression function cover all use cases. // It shall be instanciated several times, using different sets of directives // Note that it is essential this generic function is really inlined, // in order to remove useless branches during compilation optimisation. static inline int LZ4_decompress_generic( char* source, char* dest, int inputSize, // int outputSize, // OutputSize must be != 0; if endOnInput==endOnInputSize, // this value is the max size of Output Buffer. int endOnInput, // endOnOutputSize, endOnInputSize int prefix64k, // noPrefix, withPrefix int partialDecoding, // full, partial int targetOutputSize // only used if partialDecoding==partial ) { // Local Variables BYTE* restrict ip = (BYTE*) source; BYTE* ref; BYTE* iend = ip + inputSize; BYTE* op = (BYTE*) dest; BYTE* oend = op + outputSize; BYTE* cpy; BYTE* oexit = op + targetOutputSize; size_t dec32table[] = {0, 3, 2, 3, 0, 0, 0, 0}; #if LZ4_ARCH64 size_t dec64table[] = {0, 0, 0, (size_t)-1, 0, 1, 2, 3}; #endif // Special case if ((partialDecoding) && (oexit> oend-MFLIMIT)) oexit = oend-MFLIMIT; // targetOutputSize too large, better decode everything if unlikely(outputSize==0) goto _output_error; // Empty output buffer // Main Loop while (1) { unsigned token; size_t length; // get runlength token = *ip++; if ((length=(token>>ML_BITS)) == RUN_MASK) { unsigned s=255; while (((endOnInput)?ip(partialDecoding?oexit:oend-MFLIMIT)) || (ip+length>iend-(2+1+LASTLITERALS))) ) || ((!endOnInput) && (cpy>oend-COPYLENGTH))) { if (partialDecoding) { if (cpy > oend) goto _output_error; // Error : write attempt beyond end of output buffer if ((endOnInput) && (ip+length > iend)) goto _output_error; // Error : read attempt beyond end of input buffer } else { if ((!endOnInput) && (cpy != oend)) goto _output_error; // Error : block decoding must stop exactly there, // due to parsing restrictions if ((endOnInput) && ((ip+length != iend) || (cpy > oend))) goto _output_error; // Error : not enough place for another match (min 4) + 5 literals } memcpy(op, ip, length); ip += length; op += length; break; // Necessarily EOF, due to parsing restrictions } LZ4_WILDCOPY(ip, op, cpy); ip -= (op-cpy); op = cpy; // get offset LZ4_READ_LITTLEENDIAN_16(ref,cpy,ip); ip+=2; if ((prefix64k==noPrefix) && unlikely(ref < (BYTE*)dest)) goto _output_error; // Error : offset outside destination buffer // get matchlength if ((length=(token&ML_MASK)) == ML_MASK) { while (endOnInput ? ipoend-(COPYLENGTH)-(STEPSIZE-4)) { if (cpy > oend-LASTLITERALS) goto _output_error; // Error : last 5 bytes must be literals LZ4_SECURECOPY(ref, op, (oend-COPYLENGTH)); while(op