|  | /* | 
|  | * LZ4 HC - High Compression Mode of LZ4 | 
|  | * Copyright (C) 2011-2012, Yann Collet. | 
|  | * BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) | 
|  | * | 
|  | * Redistribution and use in source and binary forms, with or without | 
|  | * modification, are permitted provided that the following conditions are | 
|  | * met: | 
|  | * | 
|  | *     * Redistributions of source code must retain the above copyright | 
|  | * notice, this list of conditions and the following disclaimer. | 
|  | *     * Redistributions in binary form must reproduce the above | 
|  | * copyright notice, this list of conditions and the following disclaimer | 
|  | * in the documentation and/or other materials provided with the | 
|  | * distribution. | 
|  | * | 
|  | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | 
|  | * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | 
|  | * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | 
|  | * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | 
|  | * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | 
|  | * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | 
|  | * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | 
|  | * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | 
|  | * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 
|  | * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
|  | * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
|  | * | 
|  | * You can contact the author at : | 
|  | * - LZ4 homepage : http://fastcompression.blogspot.com/p/lz4.html | 
|  | * - LZ4 source repository : http://code.google.com/p/lz4/ | 
|  | * | 
|  | *  Changed for kernel use by: | 
|  | *  Chanho Min <chanho.min@lge.com> | 
|  | */ | 
|  |  | 
|  | #include <linux/module.h> | 
|  | #include <linux/kernel.h> | 
|  | #include <linux/lz4.h> | 
|  | #include <asm/unaligned.h> | 
|  | #include "lz4defs.h" | 
|  |  | 
|  | struct lz4hc_data { | 
|  | const u8 *base; | 
|  | HTYPE hashtable[HASHTABLESIZE]; | 
|  | u16 chaintable[MAXD]; | 
|  | const u8 *nexttoupdate; | 
|  | } __attribute__((__packed__)); | 
|  |  | 
|  | static inline int lz4hc_init(struct lz4hc_data *hc4, const u8 *base) | 
|  | { | 
|  | memset((void *)hc4->hashtable, 0, sizeof(hc4->hashtable)); | 
|  | memset(hc4->chaintable, 0xFF, sizeof(hc4->chaintable)); | 
|  |  | 
|  | #if LZ4_ARCH64 | 
|  | hc4->nexttoupdate = base + 1; | 
|  | #else | 
|  | hc4->nexttoupdate = base; | 
|  | #endif | 
|  | hc4->base = base; | 
|  | return 1; | 
|  | } | 
|  |  | 
|  | /* Update chains up to ip (excluded) */ | 
|  | static inline void lz4hc_insert(struct lz4hc_data *hc4, const u8 *ip) | 
|  | { | 
|  | u16 *chaintable = hc4->chaintable; | 
|  | HTYPE *hashtable  = hc4->hashtable; | 
|  | #if LZ4_ARCH64 | 
|  | const BYTE * const base = hc4->base; | 
|  | #else | 
|  | const int base = 0; | 
|  | #endif | 
|  |  | 
|  | while (hc4->nexttoupdate < ip) { | 
|  | const u8 *p = hc4->nexttoupdate; | 
|  | size_t delta = p - (hashtable[HASH_VALUE(p)] + base); | 
|  | if (delta > MAX_DISTANCE) | 
|  | delta = MAX_DISTANCE; | 
|  | chaintable[(size_t)(p) & MAXD_MASK] = (u16)delta; | 
|  | hashtable[HASH_VALUE(p)] = (p) - base; | 
|  | hc4->nexttoupdate++; | 
|  | } | 
|  | } | 
|  |  | 
|  | static inline size_t lz4hc_commonlength(const u8 *p1, const u8 *p2, | 
|  | const u8 *const matchlimit) | 
|  | { | 
|  | const u8 *p1t = p1; | 
|  |  | 
|  | while (p1t < matchlimit - (STEPSIZE - 1)) { | 
|  | #if LZ4_ARCH64 | 
|  | u64 diff = A64(p2) ^ A64(p1t); | 
|  | #else | 
|  | u32 diff = A32(p2) ^ A32(p1t); | 
|  | #endif | 
|  | if (!diff) { | 
|  | p1t += STEPSIZE; | 
|  | p2 += STEPSIZE; | 
|  | continue; | 
|  | } | 
|  | p1t += LZ4_NBCOMMONBYTES(diff); | 
|  | return p1t - p1; | 
|  | } | 
|  | #if LZ4_ARCH64 | 
|  | if ((p1t < (matchlimit-3)) && (A32(p2) == A32(p1t))) { | 
|  | p1t += 4; | 
|  | p2 += 4; | 
|  | } | 
|  | #endif | 
|  |  | 
|  | if ((p1t < (matchlimit - 1)) && (A16(p2) == A16(p1t))) { | 
|  | p1t += 2; | 
|  | p2 += 2; | 
|  | } | 
|  | if ((p1t < matchlimit) && (*p2 == *p1t)) | 
|  | p1t++; | 
|  | return p1t - p1; | 
|  | } | 
|  |  | 
|  | static inline int lz4hc_insertandfindbestmatch(struct lz4hc_data *hc4, | 
|  | const u8 *ip, const u8 *const matchlimit, const u8 **matchpos) | 
|  | { | 
|  | u16 *const chaintable = hc4->chaintable; | 
|  | HTYPE *const hashtable = hc4->hashtable; | 
|  | const u8 *ref; | 
|  | #if LZ4_ARCH64 | 
|  | const BYTE * const base = hc4->base; | 
|  | #else | 
|  | const int base = 0; | 
|  | #endif | 
|  | int nbattempts = MAX_NB_ATTEMPTS; | 
|  | size_t repl = 0, ml = 0; | 
|  | u16 delta; | 
|  |  | 
|  | /* HC4 match finder */ | 
|  | lz4hc_insert(hc4, ip); | 
|  | ref = hashtable[HASH_VALUE(ip)] + base; | 
|  |  | 
|  | /* potential repetition */ | 
|  | if (ref >= ip-4) { | 
|  | /* confirmed */ | 
|  | if (A32(ref) == A32(ip)) { | 
|  | delta = (u16)(ip-ref); | 
|  | repl = ml  = lz4hc_commonlength(ip + MINMATCH, | 
|  | ref + MINMATCH, matchlimit) + MINMATCH; | 
|  | *matchpos = ref; | 
|  | } | 
|  | ref -= (size_t)chaintable[(size_t)(ref) & MAXD_MASK]; | 
|  | } | 
|  |  | 
|  | while ((ref >= ip - MAX_DISTANCE) && nbattempts) { | 
|  | nbattempts--; | 
|  | if (*(ref + ml) == *(ip + ml)) { | 
|  | if (A32(ref) == A32(ip)) { | 
|  | size_t mlt = | 
|  | lz4hc_commonlength(ip + MINMATCH, | 
|  | ref + MINMATCH, matchlimit) + MINMATCH; | 
|  | if (mlt > ml) { | 
|  | ml = mlt; | 
|  | *matchpos = ref; | 
|  | } | 
|  | } | 
|  | } | 
|  | ref -= (size_t)chaintable[(size_t)(ref) & MAXD_MASK]; | 
|  | } | 
|  |  | 
|  | /* Complete table */ | 
|  | if (repl) { | 
|  | const BYTE *ptr = ip; | 
|  | const BYTE *end; | 
|  | end = ip + repl - (MINMATCH-1); | 
|  | /* Pre-Load */ | 
|  | while (ptr < end - delta) { | 
|  | chaintable[(size_t)(ptr) & MAXD_MASK] = delta; | 
|  | ptr++; | 
|  | } | 
|  | do { | 
|  | chaintable[(size_t)(ptr) & MAXD_MASK] = delta; | 
|  | /* Head of chain */ | 
|  | hashtable[HASH_VALUE(ptr)] = (ptr) - base; | 
|  | ptr++; | 
|  | } while (ptr < end); | 
|  | hc4->nexttoupdate = end; | 
|  | } | 
|  |  | 
|  | return (int)ml; | 
|  | } | 
|  |  | 
|  | static inline int lz4hc_insertandgetwidermatch(struct lz4hc_data *hc4, | 
|  | const u8 *ip, const u8 *startlimit, const u8 *matchlimit, int longest, | 
|  | const u8 **matchpos, const u8 **startpos) | 
|  | { | 
|  | u16 *const chaintable = hc4->chaintable; | 
|  | HTYPE *const hashtable = hc4->hashtable; | 
|  | #if LZ4_ARCH64 | 
|  | const BYTE * const base = hc4->base; | 
|  | #else | 
|  | const int base = 0; | 
|  | #endif | 
|  | const u8 *ref; | 
|  | int nbattempts = MAX_NB_ATTEMPTS; | 
|  | int delta = (int)(ip - startlimit); | 
|  |  | 
|  | /* First Match */ | 
|  | lz4hc_insert(hc4, ip); | 
|  | ref = hashtable[HASH_VALUE(ip)] + base; | 
|  |  | 
|  | while ((ref >= ip - MAX_DISTANCE) && (ref >= hc4->base) | 
|  | && (nbattempts)) { | 
|  | nbattempts--; | 
|  | if (*(startlimit + longest) == *(ref - delta + longest)) { | 
|  | if (A32(ref) == A32(ip)) { | 
|  | const u8 *reft = ref + MINMATCH; | 
|  | const u8 *ipt = ip + MINMATCH; | 
|  | const u8 *startt = ip; | 
|  |  | 
|  | while (ipt < matchlimit-(STEPSIZE - 1)) { | 
|  | #if LZ4_ARCH64 | 
|  | u64 diff = A64(reft) ^ A64(ipt); | 
|  | #else | 
|  | u32 diff = A32(reft) ^ A32(ipt); | 
|  | #endif | 
|  |  | 
|  | if (!diff) { | 
|  | ipt += STEPSIZE; | 
|  | reft += STEPSIZE; | 
|  | continue; | 
|  | } | 
|  | ipt += LZ4_NBCOMMONBYTES(diff); | 
|  | goto _endcount; | 
|  | } | 
|  | #if LZ4_ARCH64 | 
|  | if ((ipt < (matchlimit - 3)) | 
|  | && (A32(reft) == A32(ipt))) { | 
|  | ipt += 4; | 
|  | reft += 4; | 
|  | } | 
|  | ipt += 2; | 
|  | #endif | 
|  | if ((ipt < (matchlimit - 1)) | 
|  | && (A16(reft) == A16(ipt))) { | 
|  | reft += 2; | 
|  | } | 
|  | if ((ipt < matchlimit) && (*reft == *ipt)) | 
|  | ipt++; | 
|  | _endcount: | 
|  | reft = ref; | 
|  |  | 
|  | while ((startt > startlimit) | 
|  | && (reft > hc4->base) | 
|  | && (startt[-1] == reft[-1])) { | 
|  | startt--; | 
|  | reft--; | 
|  | } | 
|  |  | 
|  | if ((ipt - startt) > longest) { | 
|  | longest = (int)(ipt - startt); | 
|  | *matchpos = reft; | 
|  | *startpos = startt; | 
|  | } | 
|  | } | 
|  | } | 
|  | ref -= (size_t)chaintable[(size_t)(ref) & MAXD_MASK]; | 
|  | } | 
|  | return longest; | 
|  | } | 
|  |  | 
|  | static inline int lz4_encodesequence(const u8 **ip, u8 **op, const u8 **anchor, | 
|  | int ml, const u8 *ref) | 
|  | { | 
|  | int length, len; | 
|  | u8 *token; | 
|  |  | 
|  | /* Encode Literal length */ | 
|  | length = (int)(*ip - *anchor); | 
|  | token = (*op)++; | 
|  | if (length >= (int)RUN_MASK) { | 
|  | *token = (RUN_MASK << ML_BITS); | 
|  | len = length - RUN_MASK; | 
|  | for (; len > 254 ; len -= 255) | 
|  | *(*op)++ = 255; | 
|  | *(*op)++ = (u8)len; | 
|  | } else | 
|  | *token = (length << ML_BITS); | 
|  |  | 
|  | /* Copy Literals */ | 
|  | LZ4_BLINDCOPY(*anchor, *op, length); | 
|  |  | 
|  | /* Encode Offset */ | 
|  | LZ4_WRITE_LITTLEENDIAN_16(*op, (u16)(*ip - ref)); | 
|  |  | 
|  | /* Encode MatchLength */ | 
|  | len = (int)(ml - MINMATCH); | 
|  | if (len >= (int)ML_MASK) { | 
|  | *token += ML_MASK; | 
|  | len -= ML_MASK; | 
|  | for (; len > 509 ; len -= 510) { | 
|  | *(*op)++ = 255; | 
|  | *(*op)++ = 255; | 
|  | } | 
|  | if (len > 254) { | 
|  | len -= 255; | 
|  | *(*op)++ = 255; | 
|  | } | 
|  | *(*op)++ = (u8)len; | 
|  | } else | 
|  | *token += len; | 
|  |  | 
|  | /* Prepare next loop */ | 
|  | *ip += ml; | 
|  | *anchor = *ip; | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
/*
 * lz4_compresshcctx() - compress one buffer with the high-compression
 * match finder.
 * @ctx:    match-finder state; the visible caller resets it with
 *          lz4hc_init() right before this call
 * @source: input data
 * @dest:   output buffer; this function performs no capacity check on it
 * @isize:  number of input bytes
 *
 * The main loop keeps up to three overlapping match candidates
 * (ip/ref/ml, start2/ref2/ml2, start3/ref3/ml3) and decides, through the
 * _search2 and _search3 labels, which of them to emit, shorten or drop.
 * Whatever input remains after the loop is written as a final literal run.
 *
 * Return: number of bytes written to @dest.
 */
static int lz4_compresshcctx(struct lz4hc_data *ctx,
			const char *source,
			char *dest,
			int isize)
{
	const u8 *ip = (const u8 *)source;
	/* First input byte that has not been emitted yet */
	const u8 *anchor = ip;
	const u8 *const iend = ip + isize;
	/* No match search is started at or beyond this position */
	const u8 *const mflimit = iend - MFLIMIT;
	/* Bound passed to the match finders for forward comparison */
	const u8 *const matchlimit = (iend - LASTLITERALS);

	u8 *op = (u8 *)dest;

	int ml, ml2, ml3, ml0;
	const u8 *ref = NULL;
	const u8 *start2 = NULL;
	const u8 *ref2 = NULL;
	const u8 *start3 = NULL;
	const u8 *ref3 = NULL;
	const u8 *start0;
	const u8 *ref0;
	int lastrun;

	/* The search starts at the second input byte */
	ip++;

	/* Main Loop */
	while (ip < mflimit) {
		ml = lz4hc_insertandfindbestmatch(ctx, ip, matchlimit, (&ref));
		if (!ml) {
			ip++;
			continue;
		}

		/* saved, in case we would skip too much */
		start0 = ip;
		ref0 = ref;
		ml0 = ml;
_search2:
		/* Look for a longer match that starts inside the current one */
		if (ip+ml < mflimit)
			ml2 = lz4hc_insertandgetwidermatch(ctx, ip + ml - 2,
				ip + 1, matchlimit, ml, &ref2, &start2);
		else
			ml2 = ml;
		/* No better match */
		if (ml2 == ml) {
			lz4_encodesequence(&ip, &op, &anchor, ml, ref);
			continue;
		}

		if (start0 < ip) {
			/* empirical */
			if (start2 < ip + ml0) {
				ip = start0;
				ref = ref0;
				ml = ml0;
			}
		}
		/*
		 * Here, start0==ip
		 * First Match too small : removed
		 */
		if ((start2 - ip) < 3) {
			ml = ml2;
			ip = start2;
			ref = ref2;
			goto _search2;
		}

_search3:
		/*
		 * Currently we have :
		 * ml2 > ml1, and
		 * ip1+3 <= ip2 (usually < ip1+ml1)
		 */
		if ((start2 - ip) < OPTIMAL_ML) {
			int correction;
			int new_ml = ml;
			if (new_ml > OPTIMAL_ML)
				new_ml = OPTIMAL_ML;
			if (ip + new_ml > start2 + ml2 - MINMATCH)
				new_ml = (int)(start2 - ip) + ml2 - MINMATCH;
			correction = new_ml - (int)(start2 - ip);
			/* Push the start of match 2 forward by the overlap */
			if (correction > 0) {
				start2 += correction;
				ref2 += correction;
				ml2 -= correction;
			}
		}
		/*
		 * Now, we have start2 = ip+new_ml,
		 * with new_ml=min(ml, OPTIMAL_ML=18)
		 */
		if (start2 + ml2 < mflimit)
			ml3 = lz4hc_insertandgetwidermatch(ctx,
				start2 + ml2 - 3, start2, matchlimit,
				ml2, &ref3, &start3);
		else
			ml3 = ml2;

		/* No better match : 2 sequences to encode */
		if (ml3 == ml2) {
			/* ip & ref are known; Now for ml */
			if (start2 < ip+ml)
				ml = (int)(start2 - ip);

			/* Now, encode 2 sequences */
			lz4_encodesequence(&ip, &op, &anchor, ml, ref);
			ip = start2;
			lz4_encodesequence(&ip, &op, &anchor, ml2, ref2);
			continue;
		}

		/* Not enough space for match 2 : remove it */
		if (start3 < ip + ml + 3) {
			/*
			 * can write Seq1 immediately ==> Seq2 is removed,
			 * so Seq3 becomes Seq1
			 */
			if (start3 >= (ip + ml)) {
				if (start2 < ip + ml) {
					int correction =
						(int)(ip + ml - start2);
					start2 += correction;
					ref2 += correction;
					ml2 -= correction;
					if (ml2 < MINMATCH) {
						start2 = start3;
						ref2 = ref3;
						ml2 = ml3;
					}
				}

				lz4_encodesequence(&ip, &op, &anchor, ml, ref);
				ip  = start3;
				ref = ref3;
				ml  = ml3;

				/* Keep match 2 as the fallback for the next round */
				start0 = start2;
				ref0 = ref2;
				ml0 = ml2;
				goto _search2;
			}

			/* Match 3 takes the place of match 2 */
			start2 = start3;
			ref2 = ref3;
			ml2 = ml3;
			goto _search3;
		}

		/*
		 * OK, now we have 3 ascending matches; let's write at least
		 * the first one ip & ref are known; Now for ml
		 */
		if (start2 < ip + ml) {
			if ((start2 - ip) < (int)ML_MASK) {
				int correction;
				if (ml > OPTIMAL_ML)
					ml = OPTIMAL_ML;
				if (ip + ml > start2 + ml2 - MINMATCH)
					ml = (int)(start2 - ip) + ml2
						- MINMATCH;
				correction = ml - (int)(start2 - ip);
				if (correction > 0) {
					start2 += correction;
					ref2 += correction;
					ml2 -= correction;
				}
			} else
				ml = (int)(start2 - ip);
		}
		lz4_encodesequence(&ip, &op, &anchor, ml, ref);

		/* Shift the candidates down: 2 becomes 1, 3 becomes 2 */
		ip = start2;
		ref = ref2;
		ml = ml2;

		start2 = start3;
		ref2 = ref3;
		ml2 = ml3;

		goto _search3;
	}

	/* Encode Last Literals */
	lastrun = (int)(iend - anchor);
	if (lastrun >= (int)RUN_MASK) {
		*op++ = (RUN_MASK << ML_BITS);
		lastrun -= RUN_MASK;
		for (; lastrun > 254 ; lastrun -= 255)
			*op++ = 255;
		*op++ = (u8) lastrun;
	} else
		*op++ = (lastrun << ML_BITS);
	memcpy(op, anchor, iend - anchor);
	op += iend - anchor;
	/* End */
	return (int) (((char *)op) - dest);
}
|  |  | 
|  | int lz4hc_compress(const unsigned char *src, size_t src_len, | 
|  | unsigned char *dst, size_t *dst_len, void *wrkmem) | 
|  | { | 
|  | int ret = -1; | 
|  | int out_len = 0; | 
|  |  | 
|  | struct lz4hc_data *hc4 = (struct lz4hc_data *)wrkmem; | 
|  | lz4hc_init(hc4, (const u8 *)src); | 
|  | out_len = lz4_compresshcctx((struct lz4hc_data *)hc4, (const u8 *)src, | 
|  | (char *)dst, (int)src_len); | 
|  |  | 
|  | if (out_len < 0) | 
|  | goto exit; | 
|  |  | 
|  | *dst_len = out_len; | 
|  | return 0; | 
|  |  | 
|  | exit: | 
|  | return ret; | 
|  | } | 
|  | EXPORT_SYMBOL(lz4hc_compress); | 
|  |  | 
|  | MODULE_LICENSE("Dual BSD/GPL"); | 
|  | MODULE_DESCRIPTION("LZ4HC compressor"); |