1 /*
2 LZ4 - Fast LZ compression algorithm
3 Copyright (C) 2011-present, Yann Collet.
5 BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
7 Redistribution and use in source and binary forms, with or without
8 modification, are permitted provided that the following conditions are
9 met:
11 * Redistributions of source code must retain the above copyright
12 notice, this list of conditions and the following disclaimer.
13 * Redistributions in binary form must reproduce the above
14 copyright notice, this list of conditions and the following disclaimer
15 in the documentation and/or other materials provided with the
16 distribution.
18 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30 You can contact the author at :
31 - LZ4 homepage : http://www.lz4.org
32 - LZ4 source repository : https://github.com/lz4/lz4
33 */
35 /*-************************************
36 * Tuning parameters
37 **************************************/
38 /*!
39 * LZ4_HEAPMODE :
40 * Select how the default compression functions allocate memory for their hash table:
41 * on the stack (0: default, fastest) or on the heap (1: requires malloc()).
42 */
43 #ifndef LZ4_HEAPMODE
44 # define LZ4_HEAPMODE 0
45 #endif
47 /*!
48 * LZ4_ACCELERATION_DEFAULT :
49 * Select "acceleration" for LZ4_compress_fast() when parameter value <= 0
50 */
51 #define LZ4_ACCELERATION_DEFAULT 1
52 /*!
53 * LZ4_ACCELERATION_MAX :
54 * Any "acceleration" value higher than this threshold
55 * gets treated as LZ4_ACCELERATION_MAX instead (fix #876)
56 */
57 #define LZ4_ACCELERATION_MAX 65537
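/* Illustrative sketch (not part of the library): how the "acceleration" knob above is
 * typically used from the public API. Values <= 0 fall back to LZ4_ACCELERATION_DEFAULT
 * and values above LZ4_ACCELERATION_MAX are clamped (see LZ4_compress_fast_extState()
 * further below); larger values trade compression ratio for speed. The helper name is
 * hypothetical.
 *
 *     #include "lz4.h"
 *
 *     // acceleration == 1 gives the default ratio/speed trade-off;
 *     // try e.g. 8 or 64 for noticeably faster, lighter compression.
 *     static int compress_with_acceleration(const char *src, int srcSize,
 *                                           char *dst, int dstCapacity,
 *                                           int acceleration)
 *     {
 *         return LZ4_compress_fast(src, dst, srcSize, dstCapacity, acceleration);
 *     }
 */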
60 /*-************************************
61 * CPU Feature Detection
62 **************************************/
63 /* LZ4_FORCE_MEMORY_ACCESS
64 * By default, access to unaligned memory is controlled by `memcpy()`, which is safe and portable.
65 * Unfortunately, on some target/compiler combinations, the generated assembly is sub-optimal.
66 * The switch below allows selecting a different access method for improved performance.
67 * Method 0 (default) : use `memcpy()`. Safe and portable.
68 * Method 1 : `__packed` statement. It relies on a compiler extension (i.e., not portable).
69 * This method is safe if your compiler supports it, and is *generally* as fast or faster than `memcpy`.
70 * Method 2 : direct access. This method is portable but violates the C standard.
71 * It can generate buggy code on targets whose assembly generation depends on alignment.
72 * But in some circumstances, it's the only known way to get the most performance (e.g. GCC + ARMv6)
73 * See https://fastcompression.blogspot.fr/2015/08/accessing-unaligned-memory.html for details.
74 * Prefer these methods in priority order (0 > 1 > 2)
75 */
76 #ifndef LZ4_FORCE_MEMORY_ACCESS /* can be defined externally */
77 # if defined(__GNUC__) && \
78 ( defined(__ARM_ARCH_6__) || defined(__ARM_ARCH_6J__) || defined(__ARM_ARCH_6K__) \
79 || defined(__ARM_ARCH_6Z__) || defined(__ARM_ARCH_6ZK__) || defined(__ARM_ARCH_6T2__) )
80 # define LZ4_FORCE_MEMORY_ACCESS 2
81 # elif (defined(__INTEL_COMPILER) && !defined(_WIN32)) || defined(__GNUC__)
82 # define LZ4_FORCE_MEMORY_ACCESS 1
83 # endif
84 #endif
86 /*
87 * LZ4_FORCE_SW_BITCOUNT
88 * Define this parameter if your target system or compiler does not support hardware bit count
89 */
90 #if defined(_MSC_VER) && defined(_WIN32_WCE) /* Visual Studio for WinCE doesn't support Hardware bit count */
91 # undef LZ4_FORCE_SW_BITCOUNT /* avoid double def */
92 # define LZ4_FORCE_SW_BITCOUNT
93 #endif
97 /*-************************************
98 * Dependency
99 **************************************/
100 /*
101 * LZ4_SRC_INCLUDED:
102 * Amalgamation flag, whether lz4.c is included
103 */
104 #ifndef LZ4_SRC_INCLUDED
105 # define LZ4_SRC_INCLUDED 1
106 #endif
108 #ifndef LZ4_STATIC_LINKING_ONLY
109 #define LZ4_STATIC_LINKING_ONLY
110 #endif
112 #ifndef LZ4_DISABLE_DEPRECATE_WARNINGS
113 #define LZ4_DISABLE_DEPRECATE_WARNINGS /* due to LZ4_decompress_safe_withPrefix64k */
114 #endif
116 #define LZ4_STATIC_LINKING_ONLY /* LZ4_DISTANCE_MAX */
117 #include "lz4.h"
118 /* see also "memory routines" below */
121 /*-************************************
122 * Compiler Options
123 **************************************/
124 #ifdef _MSC_VER /* Visual Studio */
125 # include <intrin.h>
126 # pragma warning(disable : 4127) /* disable: C4127: conditional expression is constant */
127 # pragma warning(disable : 4293) /* disable: C4293: too large shift (32-bits) */
128 #endif /* _MSC_VER */
130 #ifndef LZ4_FORCE_INLINE
131 # ifdef _MSC_VER /* Visual Studio */
132 # define LZ4_FORCE_INLINE static __forceinline
133 # else
134 # if defined (__cplusplus) || defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L /* C99 */
135 # ifdef __GNUC__
136 # define LZ4_FORCE_INLINE static inline __attribute__((always_inline))
137 # else
138 # define LZ4_FORCE_INLINE static inline
139 # endif
140 # else
141 # define LZ4_FORCE_INLINE static
142 # endif /* __STDC_VERSION__ */
143 # endif /* _MSC_VER */
144 #endif /* LZ4_FORCE_INLINE */
146 /* LZ4_FORCE_O2_GCC_PPC64LE and LZ4_FORCE_O2_INLINE_GCC_PPC64LE
147 * gcc on ppc64le generates an unrolled SIMDized loop for LZ4_wildCopy8,
148 * together with a simple 8-byte copy loop as a fall-back path.
149 * However, this optimization hurts the decompression speed by >30%,
150 * because the execution does not go to the optimized loop
151 * for typical compressible data, and all of the preamble checks
152 * before going to the fall-back path become useless overhead.
153 * This optimization happens only with the -O3 flag, and -O2 generates
154 * a simple 8-byte copy loop.
155 * With gcc on ppc64le, all of the LZ4_decompress_* and LZ4_wildCopy8
156 * functions are annotated with __attribute__((optimize("O2"))),
157 * and also LZ4_wildCopy8 is forcibly inlined, so that the O2 attribute
158 * of LZ4_wildCopy8 does not affect the compression speed.
159 */
160 #if defined(__PPC64__) && defined(__LITTLE_ENDIAN__) && defined(__GNUC__) && !defined(__clang__)
161 # define LZ4_FORCE_O2_GCC_PPC64LE __attribute__((optimize("O2")))
162 # define LZ4_FORCE_O2_INLINE_GCC_PPC64LE __attribute__((optimize("O2"))) LZ4_FORCE_INLINE
163 #else
164 # define LZ4_FORCE_O2_GCC_PPC64LE
165 # define LZ4_FORCE_O2_INLINE_GCC_PPC64LE static
166 #endif
168 #if (defined(__GNUC__) && (__GNUC__ >= 3)) || (defined(__INTEL_COMPILER) && (__INTEL_COMPILER >= 800)) || defined(__clang__)
169 # define expect(expr,value) (__builtin_expect ((expr),(value)) )
170 #else
171 # define expect(expr,value) (expr)
172 #endif
174 #ifndef likely
175 #define likely(expr) expect((expr) != 0, 1)
176 #endif
177 #ifndef unlikely
178 #define unlikely(expr) expect((expr) != 0, 0)
179 #endif
182 /*-************************************
183 * Memory routines
184 **************************************/
185 #include <stdlib.h> /* malloc, calloc, free */
186 #define ALLOC(s) malloc(s)
187 #define ALLOC_AND_ZERO(s) calloc(1,s)
188 #define FREEMEM(p) free(p)
189 #include <string.h> /* memset, memcpy */
190 #define MEM_INIT(p,v,s) memset((p),(v),(s))
193 /*-************************************
194 * Common Constants
195 **************************************/
196 #define MINMATCH 4
198 #define WILDCOPYLENGTH 8
199 #define LASTLITERALS 5 /* see ../doc/lz4_Block_format.md#parsing-restrictions */
200 #define MFLIMIT 12 /* see ../doc/lz4_Block_format.md#parsing-restrictions */
201 #define MATCH_SAFEGUARD_DISTANCE ((2*WILDCOPYLENGTH) - MINMATCH) /* ensure it's possible to write 2 x wildcopyLength without overflowing output buffer */
202 #define FASTLOOP_SAFE_DISTANCE 64
203 static const int LZ4_minLength = (MFLIMIT + 1);
205 #define KB *(1 <<10)
206 #define MB *(1 <<20)
207 #define GB *(1U<<30)
209 #define LZ4_DISTANCE_ABSOLUTE_MAX 65535
210 #if (LZ4_DISTANCE_MAX > LZ4_DISTANCE_ABSOLUTE_MAX) /* max supported by LZ4 format */
211 # error "LZ4_DISTANCE_MAX is too big : must be <= 65535"
212 #endif
214 #define ML_BITS 4
215 #define ML_MASK ((1U<<ML_BITS)-1)
216 #define RUN_BITS (8-ML_BITS)
217 #define RUN_MASK ((1U<<RUN_BITS)-1)
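/* Worked example (illustrative, based on the block format document referenced above):
 * each sequence starts with a one-byte token. Its high RUN_BITS bits hold the literal-run
 * length and its low ML_BITS bits hold the match length minus MINMATCH; a field equal to
 * its mask (RUN_MASK / ML_MASK) means additional length bytes follow, each adding 0..255,
 * until a byte < 255. The helper below is a hypothetical sketch mirroring how the
 * compressor writes tokens later in this file
 * (*token = (BYTE)(litLength << ML_BITS); *token += (BYTE)(matchCode);).
 *
 *     static void split_token(unsigned char token,
 *                             unsigned *litLen, unsigned *matchLen)
 *     {
 *         *litLen   = token >> ML_BITS;             // 0..15; RUN_MASK => extra length bytes follow
 *         *matchLen = (token & ML_MASK) + MINMATCH; // 4..19; field == ML_MASK => extra length bytes follow
 *     }
 */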
220 /*-************************************
221 * Error detection
222 **************************************/
223 #if defined(LZ4_DEBUG) && (LZ4_DEBUG>=1)
224 # include <assert.h>
225 #else
226 # ifndef assert
227 # define assert(condition) ((void)0)
228 # endif
229 #endif
231 #define LZ4_STATIC_ASSERT(c) { enum { LZ4_static_assert = 1/(int)(!!(c)) }; } /* use after variable declarations */
233 #if defined(LZ4_DEBUG) && (LZ4_DEBUG>=2)
234 # include <stdio.h>
235 static int g_debuglog_enable = 1;
236 # define DEBUGLOG(l, ...) { \
237 if ((g_debuglog_enable) && (l<=LZ4_DEBUG)) { \
238 fprintf(stderr, __FILE__ ": "); \
239 fprintf(stderr, __VA_ARGS__); \
240 fprintf(stderr, " \n"); \
241 } }
242 #else
243 # define DEBUGLOG(l, ...) {} /* disabled */
244 #endif
247 /*-************************************
248 * Types
249 **************************************/
250 #include <limits.h>
251 #if defined(__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
252 # include <stdint.h>
253 typedef uint8_t BYTE;
254 typedef uint16_t U16;
255 typedef uint32_t U32;
256 typedef int32_t S32;
257 typedef uint64_t U64;
258 typedef uintptr_t uptrval;
259 #else
260 # if UINT_MAX != 4294967295UL
261 # error "LZ4 code (when not C++ or C99) assumes that sizeof(int) == 4"
262 # endif
263 typedef unsigned char BYTE;
264 typedef unsigned short U16;
265 typedef unsigned int U32;
266 typedef signed int S32;
267 typedef unsigned long long U64;
268 typedef size_t uptrval; /* generally true, except OpenVMS-64 */
269 #endif
271 #if defined(__x86_64__)
272 typedef U64 reg_t; /* 64-bits in x32 mode */
273 #else
274 typedef size_t reg_t; /* 32-bits in x32 mode */
275 #endif
277 typedef enum {
278 notLimited = 0,
279 limitedOutput = 1,
280 fillOutput = 2
281 } limitedOutput_directive;
284 /*-************************************
285 * Reading and writing into memory
286 **************************************/
288 /*! LZ4_memcpy() :
289 * LZ4 relies on memcpy with a constant size being inlined. In freestanding
290 * environments, the compiler can't assume the implementation of memcpy() is
291 * standard compliant, so it can't apply its specialized memcpy() inlining
292 * logic. When possible, use __builtin_memcpy() to tell the compiler to analyze
293 * memcpy() as if it were standard compliant, so it can inline it in freestanding
294 * environments. This is needed when decompressing the Linux Kernel, for example.
295 */
296 #if defined(__GNUC__) && (__GNUC__ >= 4)
297 #define LZ4_memcpy(dst, src, size) __builtin_memcpy(dst, src, size)
298 #else
299 #define LZ4_memcpy(dst, src, size) memcpy(dst, src, size)
300 #endif
302 static unsigned LZ4_isLittleEndian(void) {
303 const union { U32 u; BYTE c[4]; } one = { 1 }; /* don't use static : performance detrimental */
304 return one.c[0];
308 #if defined(LZ4_FORCE_MEMORY_ACCESS) && (LZ4_FORCE_MEMORY_ACCESS==2)
309 /* lie to the compiler about data alignment; use with caution */
311 static U16 LZ4_read16(const void *memPtr) { return *(const U16 *) memPtr; }
312 static U32 LZ4_read32(const void *memPtr) { return *(const U32 *) memPtr; }
313 static reg_t LZ4_read_ARCH(const void *memPtr) { return *(const reg_t *) memPtr; }
315 static void LZ4_write16(void *memPtr, U16 value) { *(U16 *)memPtr = value; }
316 static void LZ4_write32(void *memPtr, U32 value) { *(U32 *)memPtr = value; }
318 #elif defined(LZ4_FORCE_MEMORY_ACCESS) && (LZ4_FORCE_MEMORY_ACCESS==1)
320 /* __pack instructions are safer, but compiler specific, hence potentially problematic for some compilers */
321 /* currently only defined for gcc and icc */
322 typedef union { U16 u16; U32 u32; reg_t uArch; } __attribute__((packed)) unalign;
324 static U16 LZ4_read16(const void *ptr) { return ((const unalign *)ptr)->u16; }
325 // Tolerate reads on buffer boundary
326 ATTRIBUTE_NO_SANITIZE_ADDRESS
327 static U32 LZ4_read32(const void *ptr) { return ((const unalign *)ptr)->u32; }
328 static reg_t LZ4_read_ARCH(const void *ptr) { return ((const unalign *)ptr)->uArch; }
330 static void LZ4_write16(void *memPtr, U16 value) { ((unalign *)memPtr)->u16 = value; }
331 static void LZ4_write32(void *memPtr, U32 value) { ((unalign *)memPtr)->u32 = value; }
333 #else /* safe and portable access using memcpy() */
335 static U16 LZ4_read16(const void *memPtr) {
336 U16 val;
337 LZ4_memcpy(&val, memPtr, sizeof(val));
338 return val;
341 static U32 LZ4_read32(const void *memPtr) {
342 U32 val;
343 LZ4_memcpy(&val, memPtr, sizeof(val));
344 return val;
347 static reg_t LZ4_read_ARCH(const void *memPtr) {
348 reg_t val;
349 LZ4_memcpy(&val, memPtr, sizeof(val));
350 return val;
353 static void LZ4_write16(void *memPtr, U16 value) {
354 LZ4_memcpy(memPtr, &value, sizeof(value));
357 static void LZ4_write32(void *memPtr, U32 value) {
358 LZ4_memcpy(memPtr, &value, sizeof(value));
361 #endif /* LZ4_FORCE_MEMORY_ACCESS */
364 static U16 LZ4_readLE16(const void *memPtr) {
365 if (LZ4_isLittleEndian()) {
366 return LZ4_read16(memPtr);
367 } else {
368 const BYTE *p = (const BYTE *)memPtr;
369 return (U16)((U16)p[0] + (p[1] << 8));
373 static void LZ4_writeLE16(void *memPtr, U16 value) {
374 if (LZ4_isLittleEndian()) {
375 LZ4_write16(memPtr, value);
376 } else {
377 BYTE *p = (BYTE *)memPtr;
378 p[0] = (BYTE) value;
379 p[1] = (BYTE)(value >> 8);
383 /* customized variant of memcpy, which can overwrite up to 8 bytes beyond dstEnd */
384 LZ4_FORCE_O2_INLINE_GCC_PPC64LE
385 void LZ4_wildCopy8(void *dstPtr, const void *srcPtr, void *dstEnd) {
386 BYTE *d = (BYTE *)dstPtr;
387 const BYTE *s = (const BYTE *)srcPtr;
388 BYTE *const e = (BYTE *)dstEnd;
390 do { LZ4_memcpy(d, s, 8); d += 8; s += 8; }
391 while (d < e);
394 static const unsigned inc32table[8] = {0, 1, 2, 1, 0, 4, 4, 4};
395 static const int dec64table[8] = {0, 0, 0, -1, -4, 1, 2, 3};
398 #ifndef LZ4_FAST_DEC_LOOP
399 # if defined __i386__ || defined _M_IX86 || defined __x86_64__ || defined _M_X64
400 # define LZ4_FAST_DEC_LOOP 1
401 # elif defined(__aarch64__) && !defined(__clang__)
402 /* On aarch64, we disable this optimization for clang because on certain
403 * mobile chipsets, performance is reduced with clang. For information
404 * refer to https://github.com/lz4/lz4/pull/707 */
405 # define LZ4_FAST_DEC_LOOP 1
406 # else
407 # define LZ4_FAST_DEC_LOOP 0
408 # endif
409 #endif
411 #if LZ4_FAST_DEC_LOOP
413 LZ4_FORCE_O2_INLINE_GCC_PPC64LE void
414 LZ4_memcpy_using_offset_base(BYTE *dstPtr, const BYTE *srcPtr, BYTE *dstEnd, const size_t offset) {
415 if (offset < 8) {
416 dstPtr[0] = srcPtr[0];
417 dstPtr[1] = srcPtr[1];
418 dstPtr[2] = srcPtr[2];
419 dstPtr[3] = srcPtr[3];
420 srcPtr += inc32table[offset];
421 LZ4_memcpy(dstPtr + 4, srcPtr, 4);
422 srcPtr -= dec64table[offset];
423 dstPtr += 8;
424 } else {
425 LZ4_memcpy(dstPtr, srcPtr, 8);
426 dstPtr += 8;
427 srcPtr += 8;
430 LZ4_wildCopy8(dstPtr, srcPtr, dstEnd);
433 /* customized variant of memcpy, which can overwrite up to 32 bytes beyond dstEnd
434 * this version copies two times 16 bytes (instead of one time 32 bytes)
435 * because it must be compatible with offsets >= 16. */
436 LZ4_FORCE_O2_INLINE_GCC_PPC64LE void
437 LZ4_wildCopy32(void *dstPtr, const void *srcPtr, void *dstEnd) {
438 BYTE *d = (BYTE *)dstPtr;
439 const BYTE *s = (const BYTE *)srcPtr;
440 BYTE *const e = (BYTE *)dstEnd;
442 do { LZ4_memcpy(d, s, 16); LZ4_memcpy(d + 16, s + 16, 16); d += 32; s += 32; }
443 while (d < e);
446 /* LZ4_memcpy_using_offset() presumes :
447 * - dstEnd >= dstPtr + MINMATCH
448 * - there are at least 8 bytes available to write after dstEnd */
449 LZ4_FORCE_O2_INLINE_GCC_PPC64LE void
450 LZ4_memcpy_using_offset(BYTE *dstPtr, const BYTE *srcPtr, BYTE *dstEnd, const size_t offset) {
451 BYTE v[8];
453 assert(dstEnd >= dstPtr + MINMATCH);
454 LZ4_write32(dstPtr, 0); /* silence an msan warning when offset==0 */
456 switch (offset) {
457 case 1:
458 memset(v, *srcPtr, 8);
459 break;
460 case 2:
461 LZ4_memcpy(v, srcPtr, 2);
462 LZ4_memcpy(&v[2], srcPtr, 2);
463 LZ4_memcpy(&v[4], &v[0], 4);
464 break;
465 case 4:
466 LZ4_memcpy(v, srcPtr, 4);
467 LZ4_memcpy(&v[4], srcPtr, 4);
468 break;
469 default:
470 LZ4_memcpy_using_offset_base(dstPtr, srcPtr, dstEnd, offset);
471 return;
474 LZ4_memcpy(dstPtr, v, 8);
475 dstPtr += 8;
476 while (dstPtr < dstEnd) {
477 LZ4_memcpy(dstPtr, v, 8);
478 dstPtr += 8;
481 #endif
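/* Worked example (illustrative): LZ4 matches may overlap their own output, so a small
 * offset behaves like run-length expansion; with offset == 2 and "AB" already written,
 * copying the match forward produces "ABABAB...". LZ4_memcpy_using_offset() above builds
 * an 8-byte pattern v for offsets 1, 2 and 4 precisely so this expansion can proceed in
 * whole 8-byte stores. A hypothetical byte-by-byte reference version:
 *
 *     static void overlap_copy_naive(unsigned char *dst, size_t offset, size_t length)
 *     {
 *         const unsigned char *src = dst - offset;   // match starts `offset` bytes back
 *         while (length--) *dst++ = *src++;          // correct even when regions overlap forward
 *     }
 */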
484 /*-************************************
485 * Common functions
486 **************************************/
487 static unsigned LZ4_NbCommonBytes(reg_t val) {
488 assert(val != 0);
489 if (LZ4_isLittleEndian()) {
490 if (sizeof(val) == 8) {
491 # if defined(_MSC_VER) && (_MSC_VER >= 1800) && defined(_M_AMD64) && !defined(LZ4_FORCE_SW_BITCOUNT)
492 /* x64 CPUs without BMI support interpret `TZCNT` as `REP BSF` */
493 return (unsigned)_tzcnt_u64(val) >> 3;
494 # elif defined(_MSC_VER) && defined(_WIN64) && !defined(LZ4_FORCE_SW_BITCOUNT)
495 unsigned long r = 0;
496 _BitScanForward64(&r, (U64)val);
497 return (unsigned)r >> 3;
498 # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \
499 ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \
500 !defined(LZ4_FORCE_SW_BITCOUNT)
501 return (unsigned)__builtin_ctzll((U64)val) >> 3;
502 # else
503 const U64 m = 0x0101010101010101ULL;
504 val ^= val - 1;
505 return (unsigned)(((U64)((val & (m - 1)) * m)) >> 56);
506 # endif
507 } else /* 32 bits */ {
508 # if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT)
509 unsigned long r;
510 _BitScanForward(&r, (U32)val);
511 return (unsigned)r >> 3;
512 # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \
513 ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \
514 !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT)
515 return (unsigned)__builtin_ctz((U32)val) >> 3;
516 # else
517 const U32 m = 0x01010101;
518 return (unsigned)((((val - 1) ^ val) & (m - 1)) * m) >> 24;
519 # endif
521 } else { /* Big Endian CPU */
522 if (sizeof(val) == 8) {
523 # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \
524 ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \
525 !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT)
526 return (unsigned)__builtin_clzll((U64)val) >> 3;
527 # else
528 #if 1
529 /* this method is probably faster,
530 * but adds a 128-byte lookup table */
531 static const unsigned char ctz7_tab[128] = {
532 7, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
533 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
534 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
535 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
536 6, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
537 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
538 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
539 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
540 };
541 U64 const mask = 0x0101010101010101ULL;
542 U64 const t = (((val >> 8) - mask) | val) & mask;
543 return ctz7_tab[(t * 0x0080402010080402ULL) >> 57];
544 #else
545 /* this method doesn't consume memory space like the previous one,
546 * but it contains several branches
547 * that may end up slowing execution */
548 static const U32 by32 = sizeof(val) * 4; /* 32 on 64 bits (goal), 16 on 32 bits.
549 Just to avoid some static analyzer complaining about shift by 32 on 32-bits target.
550 Note that this code path is never triggered in 32-bits mode. */
551 unsigned r;
552 if (!(val >> by32)) { r = 4; }
553 else { r = 0; val >>= by32; }
554 if (!(val >> 16)) { r += 2; val >>= 8; }
555 else { val >>= 24; }
556 r += (!val);
557 return r;
558 #endif
559 # endif
560 } else /* 32 bits */ {
561 # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \
562 ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \
563 !defined(LZ4_FORCE_SW_BITCOUNT)
564 return (unsigned)__builtin_clz((U32)val) >> 3;
565 # else
566 val >>= 8;
567 val = ((((val + 0x00FFFF00) | 0x00FFFFFF) + val) |
568 (val + 0x00FF0000)) >> 24;
569 return (unsigned)val ^ 3;
570 # endif
576 #define STEPSIZE sizeof(reg_t)
577 LZ4_FORCE_INLINE
578 unsigned LZ4_count(const BYTE *pIn, const BYTE *pMatch, const BYTE *pInLimit) {
579 const BYTE *const pStart = pIn;
581 if (likely(pIn < pInLimit - (STEPSIZE - 1))) {
582 reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn);
583 if (!diff) {
584 pIn += STEPSIZE;
585 pMatch += STEPSIZE;
586 } else {
587 return LZ4_NbCommonBytes(diff);
591 while (likely(pIn < pInLimit - (STEPSIZE - 1))) {
592 reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn);
593 if (!diff) { pIn += STEPSIZE; pMatch += STEPSIZE; continue; }
594 pIn += LZ4_NbCommonBytes(diff);
595 return (unsigned)(pIn - pStart);
598 if ((STEPSIZE == 8) && (pIn < (pInLimit - 3)) && (LZ4_read32(pMatch) == LZ4_read32(pIn))) { pIn += 4; pMatch += 4; }
599 if ((pIn < (pInLimit - 1)) && (LZ4_read16(pMatch) == LZ4_read16(pIn))) { pIn += 2; pMatch += 2; }
600 if ((pIn < pInLimit) && (*pMatch == *pIn)) pIn++;
601 return (unsigned)(pIn - pStart);
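/* Illustrative note: LZ4_count() above compares word-sized chunks; the first mismatching
 * word is found by XOR-ing the two reads, and LZ4_NbCommonBytes() converts the position
 * of the lowest set bit (on little-endian) into a count of equal leading bytes.
 * A minimal sketch of the same idea, assuming a 64-bit little-endian target and a
 * GCC/clang compiler:
 *
 *     static unsigned common_bytes_le64(unsigned long long a, unsigned long long b)
 *     {
 *         unsigned long long diff = a ^ b;                 // 0 only if all 8 bytes are equal
 *         if (diff == 0) return 8;
 *         return (unsigned)__builtin_ctzll(diff) >> 3;     // trailing zero bits / 8
 *     }
 */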
605 #ifndef LZ4_COMMONDEFS_ONLY
606 /*-************************************
607 * Local Constants
608 **************************************/
609 static const int LZ4_64Klimit = ((64 KB) + (MFLIMIT - 1));
610 static const U32 LZ4_skipTrigger = 6; /* Increase this value ==> compression runs slower on incompressible data */
613 /*-************************************
614 * Local Structures and types
615 **************************************/
616 typedef enum { clearedTable = 0, byPtr, byU32, byU16 } tableType_t;
618 /**
619 * This enum distinguishes several different modes of accessing previous
620 * content in the stream.
622 * - noDict : There is no preceding content.
623 * - withPrefix64k : Table entries up to ctx->dictSize bytes before the blob
624 * currently being compressed are valid and refer to the preceding
625 * content (of length ctx->dictSize), which is available
626 * contiguously in memory, immediately before the content
627 * currently being compressed.
628 * - usingExtDict : Like withPrefix64k, but the preceding content is somewhere
629 * else in memory, starting at ctx->dictionary with length
630 * ctx->dictSize.
631 * - usingDictCtx : Like usingExtDict, but everything concerning the preceding
632 * content is in a separate context, pointed to by
633 * ctx->dictCtx. ctx->dictionary, ctx->dictSize, and table
634 * entries in the current context that refer to positions
635 * preceding the beginning of the current compression are
636 * ignored. Instead, ctx->dictCtx->dictionary and ctx->dictCtx
637 * ->dictSize describe the location and size of the preceding
638 * content, and matches are found by looking in the ctx
639 * ->dictCtx->hashTable.
640 */
641 typedef enum { noDict = 0, withPrefix64k, usingExtDict, usingDictCtx } dict_directive;
642 typedef enum { noDictIssue = 0, dictSmall } dictIssue_directive;
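/* Illustrative mapping of these internal modes to the public streaming API (a sketch,
 * assuming LZ4_STATIC_LINKING_ONLY for LZ4_attach_dictionary(); buffer names are
 * placeholders): withPrefix64k is what LZ4_compress_fast_continue() uses when blocks are
 * contiguous in memory, usingExtDict is selected after LZ4_loadDict() has placed the
 * history elsewhere, and usingDictCtx corresponds to LZ4_attach_dictionary(), which
 * borrows another stream's hash table.
 *
 *     LZ4_stream_t dictStream, workStream;
 *     LZ4_initStream(&dictStream, sizeof(dictStream));
 *     LZ4_loadDict(&dictStream, dictBuf, dictLen);      // dictStream now describes the history
 *
 *     LZ4_initStream(&workStream, sizeof(workStream));
 *     LZ4_attach_dictionary(&workStream, &dictStream);  // compresses in usingDictCtx mode
 *     int csize = LZ4_compress_fast_continue(&workStream, src, dst,
 *                                            srcSize, dstCapacity, 1);
 */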
645 /*-************************************
646 * Local Utils
647 **************************************/
648 int LZ4_versionNumber(void) { return LZ4_VERSION_NUMBER; }
649 const char *LZ4_versionString(void) { return LZ4_VERSION_STRING; }
650 int LZ4_compressBound(int isize) { return LZ4_COMPRESSBOUND(isize); }
651 int LZ4_sizeofState(void) { return LZ4_STREAMSIZE; }
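/* Illustrative sketch of the worst-case sizing helper above: LZ4_compressBound() reports
 * the maximum possible compressed size (roughly srcSize + srcSize/255 + 16, per
 * LZ4_COMPRESSBOUND in lz4.h), so a destination buffer of that size can never be too
 * small. Variable names are placeholders.
 *
 *     int bound = LZ4_compressBound(srcSize);   // 0 if srcSize > LZ4_MAX_INPUT_SIZE
 *     char *dst = (char *)malloc((size_t)bound);
 *     if (dst != NULL) {
 *         int csize = LZ4_compress_default(src, dst, srcSize, bound);
 *         // with a bound-sized buffer, csize == 0 can only signal a parameter error
 *     }
 */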
654 /*-************************************
655 * Internal Definitions used in Tests
656 **************************************/
657 #if defined (__cplusplus)
658 extern "C" {
659 #endif
661 int LZ4_compress_forceExtDict(LZ4_stream_t *LZ4_dict, const char *src, char *dst, int srcSize);
663 int LZ4_decompress_safe_forceExtDict(const char *src, char *dst,
664 int compressedSize, int dstCapacity,
665 const void *dictStart, size_t dictSize);
667 #if defined (__cplusplus)
668 }
669 #endif
671 /*-******************************
672 * Compression functions
673 ********************************/
674 LZ4_FORCE_INLINE U32 LZ4_hash4(U32 sequence, tableType_t const tableType) {
675 if (tableType == byU16)
676 return ((sequence * 2654435761U) >> ((MINMATCH * 8) - (LZ4_HASHLOG + 1)));
677 else
678 return ((sequence * 2654435761U) >> ((MINMATCH * 8) - LZ4_HASHLOG));
681 LZ4_FORCE_INLINE U32 LZ4_hash5(U64 sequence, tableType_t const tableType) {
682 const U32 hashLog = (tableType == byU16) ? LZ4_HASHLOG + 1 : LZ4_HASHLOG;
683 if (LZ4_isLittleEndian()) {
684 const U64 prime5bytes = 889523592379ULL;
685 return (U32)(((sequence << 24) * prime5bytes) >> (64 - hashLog));
686 } else {
687 const U64 prime8bytes = 11400714785074694791ULL;
688 return (U32)(((sequence >> 24) * prime8bytes) >> (64 - hashLog));
692 LZ4_FORCE_INLINE U32 LZ4_hashPosition(const void *const p, tableType_t const tableType) {
693 if ((sizeof(reg_t) == 8) && (tableType != byU16)) return LZ4_hash5(LZ4_read_ARCH(p), tableType);
694 return LZ4_hash4(LZ4_read32(p), tableType);
697 LZ4_FORCE_INLINE void LZ4_clearHash(U32 h, void *tableBase, tableType_t const tableType) {
698 switch (tableType) {
699 default: /* fallthrough */
700 case clearedTable: { /* illegal! */ assert(0); return; }
701 case byPtr:
702 { const BYTE **hashTable = (const BYTE **)tableBase; hashTable[h] = NULL; return; }
703 case byU32:
704 { U32 *hashTable = (U32 *) tableBase; hashTable[h] = 0; return; }
705 case byU16:
706 { U16 *hashTable = (U16 *) tableBase; hashTable[h] = 0; return; }
710 LZ4_FORCE_INLINE void LZ4_putIndexOnHash(U32 idx, U32 h, void *tableBase, tableType_t const tableType) {
711 switch (tableType) {
712 default: /* fallthrough */
713 case clearedTable: /* fallthrough */
714 case byPtr: { /* illegal! */ assert(0); return; }
715 case byU32:
716 { U32 *hashTable = (U32 *) tableBase; hashTable[h] = idx; return; }
717 case byU16:
718 { U16 *hashTable = (U16 *) tableBase; assert(idx < 65536); hashTable[h] = (U16)idx; return; }
722 LZ4_FORCE_INLINE void LZ4_putPositionOnHash(const BYTE *p, U32 h,
723 void *tableBase, tableType_t const tableType,
724 const BYTE *srcBase) {
725 switch (tableType) {
726 case clearedTable: { /* illegal! */ assert(0); return; }
727 case byPtr:
728 { const BYTE **hashTable = (const BYTE **)tableBase; hashTable[h] = p; return; }
729 case byU32:
730 { U32 *hashTable = (U32 *) tableBase; hashTable[h] = (U32)(p - srcBase); return; }
731 case byU16:
732 { U16 *hashTable = (U16 *) tableBase; hashTable[h] = (U16)(p - srcBase); return; }
736 LZ4_FORCE_INLINE void LZ4_putPosition(const BYTE *p, void *tableBase, tableType_t tableType, const BYTE *srcBase) {
737 U32 const h = LZ4_hashPosition(p, tableType);
738 LZ4_putPositionOnHash(p, h, tableBase, tableType, srcBase);
741 /* LZ4_getIndexOnHash() :
742 * Index of match position registered in hash table.
743 * hash position must be calculated by using base+index, or dictBase+index.
744 * Assumption 1 : only valid if tableType == byU32 or byU16.
745 * Assumption 2 : h is presumed valid (within limits of hash table)
746 */
747 LZ4_FORCE_INLINE U32 LZ4_getIndexOnHash(U32 h, const void *tableBase, tableType_t tableType) {
748 LZ4_STATIC_ASSERT(LZ4_MEMORY_USAGE > 2);
749 if (tableType == byU32) {
750 const U32 *const hashTable = (const U32 *) tableBase;
751 assert(h < (1U << (LZ4_MEMORY_USAGE - 2)));
752 return hashTable[h];
754 if (tableType == byU16) {
755 const U16 *const hashTable = (const U16 *) tableBase;
756 assert(h < (1U << (LZ4_MEMORY_USAGE - 1)));
757 return hashTable[h];
759 assert(0);
760 return 0; /* forbidden case */
763 static const BYTE *LZ4_getPositionOnHash(U32 h, const void *tableBase, tableType_t tableType, const BYTE *srcBase) {
764 if (tableType == byPtr) { const BYTE *const *hashTable = (const BYTE * const *) tableBase; return hashTable[h]; }
765 if (tableType == byU32) { const U32 *const hashTable = (const U32 *) tableBase; return hashTable[h] + srcBase; }
766 { const U16 *const hashTable = (const U16 *) tableBase; return hashTable[h] + srcBase; } /* default, to ensure a return */
769 LZ4_FORCE_INLINE const BYTE *
770 LZ4_getPosition(const BYTE *p,
771 const void *tableBase, tableType_t tableType,
772 const BYTE *srcBase) {
773 U32 const h = LZ4_hashPosition(p, tableType);
774 return LZ4_getPositionOnHash(h, tableBase, tableType, srcBase);
777 LZ4_FORCE_INLINE void
778 LZ4_prepareTable(LZ4_stream_t_internal *const cctx,
779 const int srcSize,
780 const tableType_t tableType) {
781 /* If the table hasn't been used, it's guaranteed to be zeroed out, and is
782 * therefore safe to use no matter what mode we're in. Otherwise, we figure
783 * out if it's safe to leave as is or whether it needs to be reset.
784 */
785 if ((tableType_t)cctx->tableType != clearedTable) {
786 assert(srcSize >= 0);
787 if ((tableType_t)cctx->tableType != tableType
788 || ((tableType == byU16) && cctx->currentOffset + (unsigned)srcSize >= 0xFFFFU)
789 || ((tableType == byU32) && cctx->currentOffset > 1 GB)
790 || tableType == byPtr
791 || srcSize >= 4 KB) {
792 DEBUGLOG(4, "LZ4_prepareTable: Resetting table in %p", cctx);
793 MEM_INIT(cctx->hashTable, 0, LZ4_HASHTABLESIZE);
794 cctx->currentOffset = 0;
795 cctx->tableType = (U32)clearedTable;
796 } else {
797 DEBUGLOG(4, "LZ4_prepareTable: Re-use hash table (no reset)");
801 /* Adding a gap, so all previous entries are > LZ4_DISTANCE_MAX back, is faster
802 * than compressing without a gap. However, compressing with
803 * currentOffset == 0 is faster still, so we preserve that case.
804 */
805 if (cctx->currentOffset != 0 && tableType == byU32) {
806 DEBUGLOG(5, "LZ4_prepareTable: adding 64KB to currentOffset");
807 cctx->currentOffset += 64 KB;
810 /* Finally, clear history */
811 cctx->dictCtx = NULL;
812 cctx->dictionary = NULL;
813 cctx->dictSize = 0;
816 /** LZ4_compress_generic() :
817 * inlined, to ensure branches are decided at compilation time.
818 * Presumed already validated at this stage:
819 * - source != NULL
820 * - inputSize > 0
821 */
822 LZ4_FORCE_INLINE int LZ4_compress_generic_validated(
823 LZ4_stream_t_internal *const cctx,
824 const char *const src,
825 char *const dst,
826 const int srcSize,
827 int *inputConsumed, /* only written when outputDirective == fillOutput */
828 const int dstCapacity,
829 const limitedOutput_directive outputDirective,
830 const tableType_t tableType,
831 const dict_directive dictDirective,
832 const dictIssue_directive dictIssue,
833 const int acceleration) {
834 int result;
835 const BYTE *ip = (const BYTE *) src;
837 U32 const startIndex = cctx->currentOffset;
838 const BYTE *base = (const BYTE *) src - startIndex;
839 const BYTE *lowLimit;
841 const LZ4_stream_t_internal *dictCtx = (const LZ4_stream_t_internal *) cctx->dictCtx;
842 const BYTE *const dictionary =
843 dictDirective == usingDictCtx ? dictCtx->dictionary : cctx->dictionary;
844 const U32 dictSize =
845 dictDirective == usingDictCtx ? dictCtx->dictSize : cctx->dictSize;
846 const U32 dictDelta = (dictDirective == usingDictCtx) ? startIndex - dictCtx->currentOffset : 0; /* make indexes in dictCtx comparable with index in current context */
848 int const maybe_extMem = (dictDirective == usingExtDict) || (dictDirective == usingDictCtx);
849 U32 const prefixIdxLimit = startIndex - dictSize; /* used when dictDirective == dictSmall */
850 const BYTE *const dictEnd = dictionary ? dictionary + dictSize : dictionary;
851 const BYTE *anchor = (const BYTE *) src;
852 const BYTE *const iend = ip + srcSize;
853 const BYTE *const mflimitPlusOne = iend - MFLIMIT + 1;
854 const BYTE *const matchlimit = iend - LASTLITERALS;
856 /* the dictCtx currentOffset is indexed on the start of the dictionary,
857 * while a dictionary in the current context precedes the currentOffset */
858 const BYTE *dictBase = !dictionary ? NULL : (dictDirective == usingDictCtx) ?
859 dictionary + dictSize - dictCtx->currentOffset :
860 dictionary + dictSize - startIndex;
862 BYTE *op = (BYTE *) dst;
863 BYTE *const olimit = op + dstCapacity;
865 U32 offset = 0;
866 U32 forwardH;
868 DEBUGLOG(5, "LZ4_compress_generic_validated: srcSize=%i, tableType=%u", srcSize, tableType);
869 assert(ip != NULL);
870 /* If init conditions are not met, we don't have to mark stream
871 * as having dirty context, since no action was taken yet */
872 if (outputDirective == fillOutput && dstCapacity < 1) { return 0; } /* Impossible to store anything */
873 if ((tableType == byU16) && (srcSize >= LZ4_64Klimit)) { return 0; } /* Size too large (not within 64K limit) */
874 if (tableType == byPtr) assert(dictDirective == noDict); /* only supported use case with byPtr */
875 assert(acceleration >= 1);
877 lowLimit = (const BYTE *)src - (dictDirective == withPrefix64k ? dictSize : 0);
879 /* Update context state */
880 if (dictDirective == usingDictCtx) {
881 /* Subsequent linked blocks can't use the dictionary. */
882 /* Instead, they use the block we just compressed. */
883 cctx->dictCtx = NULL;
884 cctx->dictSize = (U32)srcSize;
885 } else {
886 cctx->dictSize += (U32)srcSize;
888 cctx->currentOffset += (U32)srcSize;
889 cctx->tableType = (U32)tableType;
891 if (srcSize < LZ4_minLength) goto _last_literals; /* Input too small, no compression (all literals) */
893 /* First Byte */
894 LZ4_putPosition(ip, cctx->hashTable, tableType, base);
895 ip++;
896 forwardH = LZ4_hashPosition(ip, tableType);
898 /* Main Loop */
899 for (; ;) {
900 const BYTE *match;
901 BYTE *token;
902 const BYTE *filledIp;
904 /* Find a match */
905 if (tableType == byPtr) {
906 const BYTE *forwardIp = ip;
907 int step = 1;
908 int searchMatchNb = acceleration << LZ4_skipTrigger;
909 do {
910 U32 const h = forwardH;
911 ip = forwardIp;
912 forwardIp += step;
913 step = (searchMatchNb++ >> LZ4_skipTrigger);
915 if (unlikely(forwardIp > mflimitPlusOne)) goto _last_literals;
916 assert(ip < mflimitPlusOne);
918 match = LZ4_getPositionOnHash(h, cctx->hashTable, tableType, base);
919 forwardH = LZ4_hashPosition(forwardIp, tableType);
920 LZ4_putPositionOnHash(ip, h, cctx->hashTable, tableType, base);
922 } while ((match + LZ4_DISTANCE_MAX < ip)
923 || (LZ4_read32(match) != LZ4_read32(ip)));
925 } else { /* byU32, byU16 */
927 const BYTE *forwardIp = ip;
928 int step = 1;
929 int searchMatchNb = acceleration << LZ4_skipTrigger;
930 do {
931 U32 const h = forwardH;
932 U32 const current = (U32)(forwardIp - base);
933 U32 matchIndex = LZ4_getIndexOnHash(h, cctx->hashTable, tableType);
934 assert(matchIndex <= current);
935 assert(forwardIp - base < (ptrdiff_t)(2 GB - 1));
936 ip = forwardIp;
937 forwardIp += step;
938 step = (searchMatchNb++ >> LZ4_skipTrigger);
940 if (unlikely(forwardIp > mflimitPlusOne)) goto _last_literals;
941 assert(ip < mflimitPlusOne);
943 if (dictDirective == usingDictCtx) {
944 if (matchIndex < startIndex) {
945 /* there was no match, try the dictionary */
946 assert(tableType == byU32);
947 matchIndex = LZ4_getIndexOnHash(h, dictCtx->hashTable, byU32);
948 match = dictBase + matchIndex;
949 matchIndex += dictDelta; /* make dictCtx index comparable with current context */
950 lowLimit = dictionary;
951 } else {
952 match = base + matchIndex;
953 lowLimit = (const BYTE *)src;
955 } else if (dictDirective == usingExtDict) {
956 if (matchIndex < startIndex) {
957 DEBUGLOG(7, "extDict candidate: matchIndex=%5u < startIndex=%5u", matchIndex, startIndex);
958 assert(startIndex - matchIndex >= MINMATCH);
959 match = dictBase + matchIndex;
960 lowLimit = dictionary;
961 } else {
962 match = base + matchIndex;
963 lowLimit = (const BYTE *)src;
965 } else { /* single continuous memory segment */
966 match = base + matchIndex;
968 forwardH = LZ4_hashPosition(forwardIp, tableType);
969 LZ4_putIndexOnHash(current, h, cctx->hashTable, tableType);
971 DEBUGLOG(7, "candidate at pos=%u (offset=%u \n", matchIndex, current - matchIndex);
972 if ((dictIssue == dictSmall) && (matchIndex < prefixIdxLimit)) { continue; } /* match outside of valid area */
973 assert(matchIndex < current);
974 if (((tableType != byU16) || (LZ4_DISTANCE_MAX < LZ4_DISTANCE_ABSOLUTE_MAX))
975 && (matchIndex + LZ4_DISTANCE_MAX < current)) {
976 continue;
977 } /* too far */
978 assert((current - matchIndex) <= LZ4_DISTANCE_MAX); /* match now expected within distance */
980 if (LZ4_read32(match) == LZ4_read32(ip)) {
981 if (maybe_extMem) offset = current - matchIndex;
982 break; /* match found */
985 } while (1);
988 /* Catch up */
989 filledIp = ip;
990 while (((ip > anchor) & (match > lowLimit)) && (unlikely(ip[-1] == match[-1]))) { ip--; match--; }
992 /* Encode Literals */
994 unsigned const litLength = (unsigned)(ip - anchor);
995 token = op++;
996 if ((outputDirective == limitedOutput) && /* Check output buffer overflow */
997 (unlikely(op + litLength + (2 + 1 + LASTLITERALS) + (litLength / 255) > olimit))) {
998 return 0; /* cannot compress within `dst` budget. Stored indexes in hash table are nonetheless fine */
1000 if ((outputDirective == fillOutput) &&
1001 (unlikely(op + (litLength + 240) / 255 /* litlen */ + litLength /* literals */ + 2 /* offset */ + 1 /* token */ + MFLIMIT - MINMATCH /* min last literals so last match is <= end - MFLIMIT */ > olimit))) {
1002 op--;
1003 goto _last_literals;
1005 if (litLength >= RUN_MASK) {
1006 int len = (int)(litLength - RUN_MASK);
1007 *token = (RUN_MASK << ML_BITS);
1008 for (; len >= 255 ; len -= 255) * op++ = 255;
1009 *op++ = (BYTE)len;
1010 } else *token = (BYTE)(litLength << ML_BITS);
1012 /* Copy Literals */
1013 LZ4_wildCopy8(op, anchor, op + litLength);
1014 op += litLength;
1015 DEBUGLOG(6, "seq.start:%i, literals=%u, match.start:%i",
1016 (int)(anchor - (const BYTE *)src), litLength, (int)(ip - (const BYTE *)src));
1019 _next_match:
1020 /* at this stage, the following variables must be correctly set :
1021 * - ip : at start of LZ operation
1022 * - match : at start of previous pattern occurrence; can be within current prefix, or within extDict
1023 * - offset : if maybe_ext_memSegment==1 (constant)
1024 * - lowLimit : must be == dictionary to mean "match is within extDict"; must be == source otherwise
1025 * - token and *token : position to write the 4 bits for match length; the higher 4 bits for literal length are assumed already written
1026 */
1028 if ((outputDirective == fillOutput) &&
1029 (op + 2 /* offset */ + 1 /* token */ + MFLIMIT - MINMATCH /* min last literals so last match is <= end - MFLIMIT */ > olimit)) {
1030 /* the match was too close to the end, rewind and go to last literals */
1031 op = token;
1032 goto _last_literals;
1035 /* Encode Offset */
1036 if (maybe_extMem) { /* static test */
1037 DEBUGLOG(6, " with offset=%u (ext if > %i)", offset, (int)(ip - (const BYTE *)src));
1038 assert(offset <= LZ4_DISTANCE_MAX && offset > 0);
1039 LZ4_writeLE16(op, (U16)offset);
1040 op += 2;
1041 } else {
1042 DEBUGLOG(6, " with offset=%u (same segment)", (U32)(ip - match));
1043 assert(ip - match <= LZ4_DISTANCE_MAX);
1044 LZ4_writeLE16(op, (U16)(ip - match));
1045 op += 2;
1048 /* Encode MatchLength */
1050 unsigned matchCode;
1052 if ((dictDirective == usingExtDict || dictDirective == usingDictCtx)
1053 && (lowLimit == dictionary) /* match within extDict */) {
1054 const BYTE *limit = ip + (dictEnd - match);
1055 assert(dictEnd > match);
1056 if (limit > matchlimit) limit = matchlimit;
1057 matchCode = LZ4_count(ip + MINMATCH, match + MINMATCH, limit);
1058 ip += (size_t)matchCode + MINMATCH;
1059 if (ip == limit) {
1060 unsigned const more = LZ4_count(limit, (const BYTE *)src, matchlimit);
1061 matchCode += more;
1062 ip += more;
1064 DEBUGLOG(6, " with matchLength=%u starting in extDict", matchCode + MINMATCH);
1065 } else {
1066 matchCode = LZ4_count(ip + MINMATCH, match + MINMATCH, matchlimit);
1067 ip += (size_t)matchCode + MINMATCH;
1068 DEBUGLOG(6, " with matchLength=%u", matchCode + MINMATCH);
1071 if ((outputDirective) && /* Check output buffer overflow */
1072 (unlikely(op + (1 + LASTLITERALS) + (matchCode + 240) / 255 > olimit))) {
1073 if (outputDirective == fillOutput) {
1074 /* Match description too long : reduce it */
1075 U32 newMatchCode = 15 /* in token */ - 1 /* to avoid needing a zero byte */ + ((U32)(olimit - op) - 1 - LASTLITERALS) * 255;
1076 ip -= matchCode - newMatchCode;
1077 assert(newMatchCode < matchCode);
1078 matchCode = newMatchCode;
1079 if (unlikely(ip <= filledIp)) {
1080 /* We have already filled up to filledIp so if ip ends up less than filledIp
1081 * we have positions in the hash table beyond the current position. This is
1082 * a problem if we reuse the hash table. So we have to remove these positions
1083 * from the hash table.
1084 */
1085 const BYTE *ptr;
1086 DEBUGLOG(5, "Clearing %u positions", (U32)(filledIp - ip));
1087 for (ptr = ip; ptr <= filledIp; ++ptr) {
1088 U32 const h = LZ4_hashPosition(ptr, tableType);
1089 LZ4_clearHash(h, cctx->hashTable, tableType);
1092 } else {
1093 assert(outputDirective == limitedOutput);
1094 return 0; /* cannot compress within `dst` budget. Stored indexes in hash table are nonetheless fine */
1097 if (matchCode >= ML_MASK) {
1098 *token += ML_MASK;
1099 matchCode -= ML_MASK;
1100 LZ4_write32(op, 0xFFFFFFFF);
1101 while (matchCode >= 4 * 255) {
1102 op += 4;
1103 LZ4_write32(op, 0xFFFFFFFF);
1104 matchCode -= 4 * 255;
1106 op += matchCode / 255;
1107 *op++ = (BYTE)(matchCode % 255);
1108 } else
1109 *token += (BYTE)(matchCode);
1111 /* Ensure we have enough space for the last literals. */
1112 assert(!(outputDirective == fillOutput && op + 1 + LASTLITERALS > olimit));
1114 anchor = ip;
1116 /* Test end of chunk */
1117 if (ip >= mflimitPlusOne) break;
1119 /* Fill table */
1120 LZ4_putPosition(ip - 2, cctx->hashTable, tableType, base);
1122 /* Test next position */
1123 if (tableType == byPtr) {
1125 match = LZ4_getPosition(ip, cctx->hashTable, tableType, base);
1126 LZ4_putPosition(ip, cctx->hashTable, tableType, base);
1127 if ((match + LZ4_DISTANCE_MAX >= ip)
1128 && (LZ4_read32(match) == LZ4_read32(ip)))
1129 { token = op++; *token = 0; goto _next_match; }
1131 } else { /* byU32, byU16 */
1133 U32 const h = LZ4_hashPosition(ip, tableType);
1134 U32 const current = (U32)(ip - base);
1135 U32 matchIndex = LZ4_getIndexOnHash(h, cctx->hashTable, tableType);
1136 assert(matchIndex < current);
1137 if (dictDirective == usingDictCtx) {
1138 if (matchIndex < startIndex) {
1139 /* there was no match, try the dictionary */
1140 matchIndex = LZ4_getIndexOnHash(h, dictCtx->hashTable, byU32);
1141 match = dictBase + matchIndex;
1142 lowLimit = dictionary; /* required for match length counter */
1143 matchIndex += dictDelta;
1144 } else {
1145 match = base + matchIndex;
1146 lowLimit = (const BYTE *)src; /* required for match length counter */
1148 } else if (dictDirective == usingExtDict) {
1149 if (matchIndex < startIndex) {
1150 match = dictBase + matchIndex;
1151 lowLimit = dictionary; /* required for match length counter */
1152 } else {
1153 match = base + matchIndex;
1154 lowLimit = (const BYTE *)src; /* required for match length counter */
1156 } else { /* single memory segment */
1157 match = base + matchIndex;
1159 LZ4_putIndexOnHash(current, h, cctx->hashTable, tableType);
1160 assert(matchIndex < current);
1161 if (((dictIssue == dictSmall) ? (matchIndex >= prefixIdxLimit) : 1)
1162 && (((tableType == byU16) && (LZ4_DISTANCE_MAX == LZ4_DISTANCE_ABSOLUTE_MAX)) ? 1 : (matchIndex + LZ4_DISTANCE_MAX >= current))
1163 && (LZ4_read32(match) == LZ4_read32(ip))) {
1164 token = op++;
1165 *token = 0;
1166 if (maybe_extMem) offset = current - matchIndex;
1167 DEBUGLOG(6, "seq.start:%i, literals=%u, match.start:%i",
1168 (int)(anchor - (const BYTE *)src), 0, (int)(ip - (const BYTE *)src));
1169 goto _next_match;
1173 /* Prepare next loop */
1174 forwardH = LZ4_hashPosition(++ip, tableType);
1178 _last_literals:
1179 /* Encode Last Literals */
1181 size_t lastRun = (size_t)(iend - anchor);
1182 if ((outputDirective) && /* Check output buffer overflow */
1183 (op + lastRun + 1 + ((lastRun + 255 - RUN_MASK) / 255) > olimit)) {
1184 if (outputDirective == fillOutput) {
1185 /* adapt lastRun to fill 'dst' */
1186 assert(olimit >= op);
1187 lastRun = (size_t)(olimit - op) - 1/*token*/;
1188 lastRun -= (lastRun + 256 - RUN_MASK) / 256; /*additional length tokens*/
1189 } else {
1190 assert(outputDirective == limitedOutput);
1191 return 0; /* cannot compress within `dst` budget. Stored indexes in hash table are nonetheless fine */
1194 DEBUGLOG(6, "Final literal run : %i literals", (int)lastRun);
1195 if (lastRun >= RUN_MASK) {
1196 size_t accumulator = lastRun - RUN_MASK;
1197 *op++ = RUN_MASK << ML_BITS;
1198 for (; accumulator >= 255 ; accumulator -= 255) * op++ = 255;
1199 *op++ = (BYTE) accumulator;
1200 } else {
1201 *op++ = (BYTE)(lastRun << ML_BITS);
1203 LZ4_memcpy(op, anchor, lastRun);
1204 ip = anchor + lastRun;
1205 op += lastRun;
1208 if (outputDirective == fillOutput) {
1209 *inputConsumed = (int)(((const char *)ip) - src);
1211 result = (int)(((char *)op) - dst);
1212 assert(result > 0);
1213 DEBUGLOG(5, "LZ4_compress_generic: compressed %i bytes into %i bytes", srcSize, result);
1214 return result;
1217 /** LZ4_compress_generic() :
1218 * inlined, to ensure branches are decided at compilation time;
1219 * takes care of src == (NULL, 0)
1220 * and forwards the rest to LZ4_compress_generic_validated */
1221 LZ4_FORCE_INLINE int LZ4_compress_generic(
1222 LZ4_stream_t_internal *const cctx,
1223 const char *const src,
1224 char *const dst,
1225 const int srcSize,
1226 int *inputConsumed, /* only written when outputDirective == fillOutput */
1227 const int dstCapacity,
1228 const limitedOutput_directive outputDirective,
1229 const tableType_t tableType,
1230 const dict_directive dictDirective,
1231 const dictIssue_directive dictIssue,
1232 const int acceleration) {
1233 DEBUGLOG(5, "LZ4_compress_generic: srcSize=%i, dstCapacity=%i",
1234 srcSize, dstCapacity);
1236 if ((U32)srcSize > (U32)LZ4_MAX_INPUT_SIZE) { return 0; } /* Unsupported srcSize, too large (or negative) */
1237 if (srcSize == 0) { /* src == NULL supported if srcSize == 0 */
1238 if (outputDirective != notLimited && dstCapacity <= 0) return 0; /* no output, can't write anything */
1239 DEBUGLOG(5, "Generating an empty block");
1240 assert(outputDirective == notLimited || dstCapacity >= 1);
1241 assert(dst != NULL);
1242 dst[0] = 0;
1243 if (outputDirective == fillOutput) {
1244 assert(inputConsumed != NULL);
1245 *inputConsumed = 0;
1247 return 1;
1249 assert(src != NULL);
1251 return LZ4_compress_generic_validated(cctx, src, dst, srcSize,
1252 inputConsumed, /* only written into if outputDirective == fillOutput */
1253 dstCapacity, outputDirective,
1254 tableType, dictDirective, dictIssue, acceleration);
1258 int LZ4_compress_fast_extState(void *state, const char *src, char *dst, int srcSize, int dstCapacity, int acceleration) {
1259 LZ4_stream_t_internal *const ctx = & LZ4_initStream(state, sizeof(LZ4_stream_t)) -> internal_donotuse;
1260 assert(ctx != NULL);
1261 if (acceleration < 1) acceleration = LZ4_ACCELERATION_DEFAULT;
1262 if (acceleration > LZ4_ACCELERATION_MAX) acceleration = LZ4_ACCELERATION_MAX;
1263 if (dstCapacity >= LZ4_compressBound(srcSize)) {
1264 if (srcSize < LZ4_64Klimit) {
1265 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, byU16, noDict, noDictIssue, acceleration);
1266 } else {
1267 const tableType_t tableType = ((sizeof(void *) == 4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32;
1268 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, noDictIssue, acceleration);
1270 } else {
1271 if (srcSize < LZ4_64Klimit) {
1272 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, byU16, noDict, noDictIssue, acceleration);
1273 } else {
1274 const tableType_t tableType = ((sizeof(void *) == 4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32;
1275 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, noDictIssue, acceleration);
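/* Illustrative usage of the _extState entry point above (a sketch; names are placeholders):
 * the caller owns the state, so repeated compressions avoid heap allocation entirely.
 * LZ4_sizeofState() gives the required size for a caller-allocated buffer; an LZ4_stream_t
 * declared directly is always suitably sized and aligned.
 *
 *     LZ4_stream_t state;   // caller-owned working memory
 *     int csize = LZ4_compress_fast_extState(&state, src, dst,
 *                                            srcSize, dstCapacity, 1);
 */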
1280 /**
1281 * LZ4_compress_fast_extState_fastReset() :
1282 * A variant of LZ4_compress_fast_extState().
1284 * Using this variant avoids an expensive initialization step. It is only safe
1285 * to call if the state buffer is known to be correctly initialized already
1286 * (see comment in lz4.h on LZ4_resetStream_fast() for a definition of
1287 * "correctly initialized").
1289 int LZ4_compress_fast_extState_fastReset(void *state, const char *src, char *dst, int srcSize, int dstCapacity, int acceleration) {
1290 LZ4_stream_t_internal *ctx = &((LZ4_stream_t *)state)->internal_donotuse;
1291 if (acceleration < 1) acceleration = LZ4_ACCELERATION_DEFAULT;
1292 if (acceleration > LZ4_ACCELERATION_MAX) acceleration = LZ4_ACCELERATION_MAX;
1294 if (dstCapacity >= LZ4_compressBound(srcSize)) {
1295 if (srcSize < LZ4_64Klimit) {
1296 const tableType_t tableType = byU16;
1297 LZ4_prepareTable(ctx, srcSize, tableType);
1298 if (ctx->currentOffset) {
1299 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, dictSmall, acceleration);
1300 } else {
1301 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, noDictIssue, acceleration);
1303 } else {
1304 const tableType_t tableType = ((sizeof(void *) == 4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32;
1305 LZ4_prepareTable(ctx, srcSize, tableType);
1306 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, noDictIssue, acceleration);
1308 } else {
1309 if (srcSize < LZ4_64Klimit) {
1310 const tableType_t tableType = byU16;
1311 LZ4_prepareTable(ctx, srcSize, tableType);
1312 if (ctx->currentOffset) {
1313 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, dictSmall, acceleration);
1314 } else {
1315 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, noDictIssue, acceleration);
1317 } else {
1318 const tableType_t tableType = ((sizeof(void *) == 4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32;
1319 LZ4_prepareTable(ctx, srcSize, tableType);
1320 return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, noDictIssue, acceleration);
1326 int LZ4_compress_fast(const char *src, char *dst, int srcSize, int dstCapacity, int acceleration) {
1327 int result;
1328 #if (LZ4_HEAPMODE)
1329 LZ4_stream_t *ctxPtr = ALLOC(sizeof(LZ4_stream_t)); /* malloc-calloc always properly aligned */
1330 if (ctxPtr == NULL) return 0;
1331 #else
1332 LZ4_stream_t ctx;
1333 LZ4_stream_t *const ctxPtr = &ctx;
1334 #endif
1335 result = LZ4_compress_fast_extState(ctxPtr, src, dst, srcSize, dstCapacity, acceleration);
1337 #if (LZ4_HEAPMODE)
1338 FREEMEM(ctxPtr);
1339 #endif
1340 return result;
1344 int LZ4_compress_default(const char *src, char *dst, int srcSize, int dstCapacity) {
1345 return LZ4_compress_fast(src, dst, srcSize, dstCapacity, 1);
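/* Illustrative round trip through the default entry point above (a sketch; SRC_SIZE and
 * src are placeholders, and LZ4_decompress_safe() is declared in lz4.h and defined in
 * the decompression half of this file):
 *
 *     char compressed[LZ4_COMPRESSBOUND(SRC_SIZE)];
 *     int csize = LZ4_compress_default(src, compressed, SRC_SIZE, (int)sizeof(compressed));
 *
 *     char restored[SRC_SIZE];
 *     int dsize = LZ4_decompress_safe(compressed, restored, csize, SRC_SIZE);
 *     // on success, dsize == SRC_SIZE and restored matches src byte for byte
 */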
1349 /* Note!: This function leaves the stream in an unclean/broken state!
1350 * It is not safe to subsequently use the same state with a _fastReset() or
1351 * _continue() call without resetting it. */
1352 static int LZ4_compress_destSize_extState(LZ4_stream_t *state, const char *src, char *dst, int *srcSizePtr, int targetDstSize) {
1353 void *const s = LZ4_initStream(state, sizeof(*state));
1354 assert(s != NULL);
1355 (void)s;
1357 if (targetDstSize >= LZ4_compressBound(*srcSizePtr)) { /* compression success is guaranteed */
1358 return LZ4_compress_fast_extState(state, src, dst, *srcSizePtr, targetDstSize, 1);
1359 } else {
1360 if (*srcSizePtr < LZ4_64Klimit) {
1361 return LZ4_compress_generic(&state->internal_donotuse, src, dst, *srcSizePtr, srcSizePtr, targetDstSize, fillOutput, byU16, noDict, noDictIssue, 1);
1362 } else {
1363 tableType_t const addrMode = ((sizeof(void *) == 4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32;
1364 return LZ4_compress_generic(&state->internal_donotuse, src, dst, *srcSizePtr, srcSizePtr, targetDstSize, fillOutput, addrMode, noDict, noDictIssue, 1);
1370 int LZ4_compress_destSize(const char *src, char *dst, int *srcSizePtr, int targetDstSize) {
1371 #if (LZ4_HEAPMODE)
1372 LZ4_stream_t *ctx = (LZ4_stream_t *)ALLOC(sizeof(LZ4_stream_t)); /* malloc-calloc always properly aligned */
1373 if (ctx == NULL) return 0;
1374 #else
1375 LZ4_stream_t ctxBody;
1376 LZ4_stream_t *ctx = &ctxBody;
1377 #endif
1379 int result = LZ4_compress_destSize_extState(ctx, src, dst, srcSizePtr, targetDstSize);
1381 #if (LZ4_HEAPMODE)
1382 FREEMEM(ctx);
1383 #endif
1384 return result;
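/* Illustrative sketch of the fill-the-buffer variant above (names are placeholders):
 * *srcSizePtr is an in/out parameter; on return it holds how many input bytes were
 * actually consumed to fill at most targetDstSize output bytes.
 *
 *     int srcSize = inputLen;   // in: bytes available at src
 *     int csize = LZ4_compress_destSize(src, dst, &srcSize, dstCapacity);
 *     // out: csize   = compressed bytes written (<= dstCapacity)
 *     //      srcSize = input bytes consumed to produce them
 */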
1389 /*-******************************
1390 * Streaming functions
1391 ********************************/
1393 LZ4_stream_t *LZ4_createStream(void) {
1394 LZ4_stream_t *const lz4s = (LZ4_stream_t *)ALLOC(sizeof(LZ4_stream_t));
1395 LZ4_STATIC_ASSERT(LZ4_STREAMSIZE >= sizeof(LZ4_stream_t_internal)); /* A compilation error here means LZ4_STREAMSIZE is not large enough */
1396 DEBUGLOG(4, "LZ4_createStream %p", lz4s);
1397 if (lz4s == NULL) return NULL;
1398 LZ4_initStream(lz4s, sizeof(*lz4s));
1399 return lz4s;
1402 #ifndef _MSC_VER /* for some reason, Visual fails the alignment test on 32-bit x86 :
1403 it reports an alignment of 8 bytes,
1404 while actually aligning LZ4_stream_t on 4 bytes. */
1405 static size_t LZ4_stream_t_alignment(void) {
1406 typedef struct { char c; LZ4_stream_t t; } t_a;
1407 return sizeof(t_a) - sizeof(LZ4_stream_t);
1409 #endif
1411 LZ4_stream_t *LZ4_initStream(void *buffer, size_t size) {
1412 DEBUGLOG(5, "LZ4_initStream");
1413 if (buffer == NULL) { return NULL; }
1414 if (size < sizeof(LZ4_stream_t)) { return NULL; }
1415 #ifndef _MSC_VER /* for some reason, Visual fails the alignment test on 32-bit x86 :
1416 it reports an alignment of 8 bytes,
1417 while actually aligning LZ4_stream_t on 4 bytes. */
1418 if (((size_t)buffer) & (LZ4_stream_t_alignment() - 1)) { return NULL; } /* alignment check */
1419 #endif
1420 MEM_INIT(buffer, 0, sizeof(LZ4_stream_t));
1421 return (LZ4_stream_t *)buffer;
1424 /* resetStream is now deprecated,
1425 * prefer initStream() which is more general */
1426 void LZ4_resetStream(LZ4_stream_t *LZ4_stream) {
1427 DEBUGLOG(5, "LZ4_resetStream (ctx:%p)", LZ4_stream);
1428 MEM_INIT(LZ4_stream, 0, sizeof(LZ4_stream_t));
1431 void LZ4_resetStream_fast(LZ4_stream_t *ctx) {
1432 LZ4_prepareTable(&(ctx->internal_donotuse), 0, byU32);
1435 int LZ4_freeStream(LZ4_stream_t *LZ4_stream) {
1436 if (!LZ4_stream) return 0; /* support free on NULL */
1437 DEBUGLOG(5, "LZ4_freeStream %p", LZ4_stream);
1438 FREEMEM(LZ4_stream);
1439 return (0);
1443 #define HASH_UNIT sizeof(reg_t)
1444 int LZ4_loadDict(LZ4_stream_t *LZ4_dict, const char *dictionary, int dictSize) {
1445 LZ4_stream_t_internal *dict = &LZ4_dict->internal_donotuse;
1446 const tableType_t tableType = byU32;
1447 const BYTE *p = (const BYTE *)dictionary;
1448 const BYTE *const dictEnd = p + dictSize;
1449 const BYTE *base;
1451 DEBUGLOG(4, "LZ4_loadDict (%i bytes from %p into %p)", dictSize, dictionary, LZ4_dict);
1453 /* It's necessary to reset the context,
1454 * and not just continue it with prepareTable()
1455 * to avoid any risk of generating overflowing matchIndex
1456 * when compressing using this dictionary */
1457 LZ4_resetStream(LZ4_dict);
1459 /* We always increment the offset by 64 KB, since, if the dict is longer,
1460 * we truncate it to the last 64k, and if it's shorter, we still want to
1461 * advance by a whole window length so we can provide the guarantee that
1462 * there are only valid offsets in the window, which allows an optimization
1463 * in LZ4_compress_fast_continue() where it uses noDictIssue even when the
1464 * dictionary isn't a full 64k. */
1465 dict->currentOffset += 64 KB;
1467 if (dictSize < (int)HASH_UNIT) {
1468 return 0;
1471 if ((dictEnd - p) > 64 KB) p = dictEnd - 64 KB;
1472 base = dictEnd - dict->currentOffset;
1473 dict->dictionary = p;
1474 dict->dictSize = (U32)(dictEnd - p);
1475 dict->tableType = (U32)tableType;
1477 while (p <= dictEnd - HASH_UNIT) {
1478 LZ4_putPosition(p, dict->hashTable, tableType, base);
1479 p += 3;
1482 return (int)dict->dictSize;
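/* Illustrative sketch of the classic LZ4_loadDict() + LZ4_compress_fast_continue()
 * pattern (buffer names are placeholders): the dictionary primes the hash table, and
 * each subsequent block may reference both the dictionary and previously compressed
 * blocks. The decompression side pairs with LZ4_decompress_safe_usingDict().
 *
 *     LZ4_stream_t *s = LZ4_createStream();
 *     LZ4_loadDict(s, dictBuf, dictLen);   // only the last 64 KB is retained
 *
 *     int csize = LZ4_compress_fast_continue(s, block, dst, blockSize, dstCapacity, 1);
 *     // decoder side:
 *     //   LZ4_decompress_safe_usingDict(dst, out, csize, outCapacity, dictBuf, dictLen);
 *     LZ4_freeStream(s);
 */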
1485 void LZ4_attach_dictionary(LZ4_stream_t *workingStream, const LZ4_stream_t *dictionaryStream) {
1486 const LZ4_stream_t_internal *dictCtx = dictionaryStream == NULL ? NULL :
1487 &(dictionaryStream->internal_donotuse);
1489 DEBUGLOG(4, "LZ4_attach_dictionary (%p, %p, size %u)",
1490 workingStream, dictionaryStream,
1491 dictCtx != NULL ? dictCtx->dictSize : 0);
1493 if (dictCtx != NULL) {
1494 /* If the current offset is zero, we will never look in the
1495 * external dictionary context, since there is no value a table
1496 * entry can take that indicates a miss. In that case, we need
1497 * to bump the offset to something non-zero.
1498 */
1499 if (workingStream->internal_donotuse.currentOffset == 0) {
1500 workingStream->internal_donotuse.currentOffset = 64 KB;
1501 }
1503 /* Don't actually attach an empty dictionary.
1504 */
1505 if (dictCtx->dictSize == 0) {
1506 dictCtx = NULL;
1507 }
1508 }
1509 workingStream->internal_donotuse.dictCtx = dictCtx;
1510 }
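/* Usage sketch (illustrative only; buffer names are placeholders) : share one loaded
 * dictionary across several working streams without re-hashing it each time :
 *
 *   LZ4_stream_t dictStream, work;
 *   LZ4_initStream(&dictStream, sizeof(dictStream));
 *   LZ4_loadDict(&dictStream, dictBuf, dictLen);
 *   LZ4_initStream(&work, sizeof(work));
 *   LZ4_attach_dictionary(&work, &dictStream);
 *   LZ4_compress_fast_continue(&work, src, dst, srcLen, dstCapacity, 1);
 */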
1513 static void LZ4_renormDictT(LZ4_stream_t_internal *LZ4_dict, int nextSize) {
1514 assert(nextSize >= 0);
1515 if (LZ4_dict->currentOffset + (unsigned)nextSize > 0x80000000) { /* potential ptrdiff_t overflow (32-bits mode) */
1516 /* rescale hash table */
1517 U32 const delta = LZ4_dict->currentOffset - 64 KB;
1518 const BYTE *dictEnd = LZ4_dict->dictionary + LZ4_dict->dictSize;
1519 int i;
1520 DEBUGLOG(4, "LZ4_renormDictT");
1521 for (i = 0; i < LZ4_HASH_SIZE_U32; i++) {
1522 if (LZ4_dict->hashTable[i] < delta) LZ4_dict->hashTable[i] = 0;
1523 else LZ4_dict->hashTable[i] -= delta;
1524 }
1525 LZ4_dict->currentOffset = 64 KB;
1526 if (LZ4_dict->dictSize > 64 KB) LZ4_dict->dictSize = 64 KB;
1527 LZ4_dict->dictionary = dictEnd - LZ4_dict->dictSize;
1528 }
1529 }
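/* Worked illustration of the rescale above (numbers are hypothetical) :
 * with currentOffset = 0x7FFFF000 and nextSize = 0x2000 the sum crosses 0x80000000,
 * so every hash-table entry below delta = currentOffset - 64 KB is dropped to 0,
 * the remaining entries are rebased by -delta, and currentOffset restarts at 64 KB. */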
1532 int LZ4_compress_fast_continue(LZ4_stream_t *LZ4_stream,
1533 const char *src, char *dst,
1534 int srcSize, int dstCapacity,
1535 int acceleration) {
1536 const tableType_t tableType = byU32;
1537 LZ4_stream_t_internal *streamPtr = &LZ4_stream->internal_donotuse;
1538 const BYTE *dictEnd = streamPtr->dictionary + streamPtr->dictSize;
1540 DEBUGLOG(5, "LZ4_compress_fast_continue (srcSize=%i)", srcSize);
1542 LZ4_renormDictT(streamPtr, srcSize); /* avoid index overflow */
1543 if (acceleration < 1) acceleration = LZ4_ACCELERATION_DEFAULT;
1544 if (acceleration > LZ4_ACCELERATION_MAX) acceleration = LZ4_ACCELERATION_MAX;
1546 /* invalidate tiny dictionaries */
1547 if ((streamPtr->dictSize - 1 < 4 - 1) /* intentional underflow */
1548 && (dictEnd != (const BYTE *)src)) {
1549 DEBUGLOG(5, "LZ4_compress_fast_continue: dictSize(%u) at addr:%p is too small", streamPtr->dictSize, streamPtr->dictionary);
1550 streamPtr->dictSize = 0;
1551 streamPtr->dictionary = (const BYTE *)src;
1552 dictEnd = (const BYTE *)src;
1553 }
1555 /* Check overlapping input/dictionary space */
1556 {
1557 const BYTE *srcEnd = (const BYTE *) src + srcSize;
1558 if ((srcEnd > streamPtr->dictionary) && (srcEnd < dictEnd)) {
1559 streamPtr->dictSize = (U32)(dictEnd - srcEnd);
1560 if (streamPtr->dictSize > 64 KB) streamPtr->dictSize = 64 KB;
1561 if (streamPtr->dictSize < 4) streamPtr->dictSize = 0;
1562 streamPtr->dictionary = dictEnd - streamPtr->dictSize;
1563 }
1564 }
1566 /* prefix mode : source data follows dictionary */
1567 if (dictEnd == (const BYTE *)src) {
1568 if ((streamPtr->dictSize < 64 KB) && (streamPtr->dictSize < streamPtr->currentOffset))
1569 return LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, withPrefix64k, dictSmall, acceleration);
1570 else
1571 return LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, withPrefix64k, noDictIssue, acceleration);
1572 }
1574 /* external dictionary mode */
1575 {
1576 int result;
1577 if (streamPtr->dictCtx) {
1578 /* We depend here on the fact that dictCtx'es (produced by
1579 * LZ4_loadDict) guarantee that their tables contain no references
1580 * to offsets between dictCtx->currentOffset - 64 KB and
1581 * dictCtx->currentOffset - dictCtx->dictSize. This makes it safe
1582 * to use noDictIssue even when the dict isn't a full 64 KB.
1583 */
1584 if (srcSize > 4 KB) {
1585 /* For compressing large blobs, it is faster to pay the setup
1586 * cost to copy the dictionary's tables into the active context,
1587 * so that the compression loop is only looking into one table.
1588 */
1589 LZ4_memcpy(streamPtr, streamPtr->dictCtx, sizeof(*streamPtr));
1590 result = LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, usingExtDict, noDictIssue, acceleration);
1591 } else {
1592 result = LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, usingDictCtx, noDictIssue, acceleration);
1593 }
1594 } else {
1595 if ((streamPtr->dictSize < 64 KB) && (streamPtr->dictSize < streamPtr->currentOffset)) {
1596 result = LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, usingExtDict, dictSmall, acceleration);
1597 } else {
1598 result = LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, usingExtDict, noDictIssue, acceleration);
1599 }
1600 }
1601 streamPtr->dictionary = (const BYTE *)src;
1602 streamPtr->dictSize = (U32)srcSize;
1603 return result;
1604 }
1605 }
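/* Usage sketch (illustrative only; next_block(), send() and the buffer names are placeholders) :
 * compress a sequence of dependent blocks, saving the tail of each block so the next call
 * can keep matching into it even if the source buffer is reused :
 *
 *   LZ4_stream_t ctx;
 *   char window[64 * 1024];
 *   LZ4_initStream(&ctx, sizeof(ctx));
 *   while (next_block(&src, &srcLen)) {
 *       int cSize = LZ4_compress_fast_continue(&ctx, src, dst, srcLen, dstCapacity, 1);
 *       send(dst, cSize);
 *       LZ4_saveDict(&ctx, window, (int)sizeof(window));
 *   }
 */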
1608 /* Hidden debug function, to force-test external dictionary mode */
1609 int LZ4_compress_forceExtDict(LZ4_stream_t *LZ4_dict, const char *src, char *dst, int srcSize) {
1610 LZ4_stream_t_internal *streamPtr = &LZ4_dict->internal_donotuse;
1611 int result;
1613 LZ4_renormDictT(streamPtr, srcSize);
1615 if ((streamPtr->dictSize < 64 KB) && (streamPtr->dictSize < streamPtr->currentOffset)) {
1616 result = LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, 0, notLimited, byU32, usingExtDict, dictSmall, 1);
1617 } else {
1618 result = LZ4_compress_generic(streamPtr, src, dst, srcSize, NULL, 0, notLimited, byU32, usingExtDict, noDictIssue, 1);
1619 }
1621 streamPtr->dictionary = (const BYTE *)src;
1622 streamPtr->dictSize = (U32)srcSize;
1624 return result;
1625 }
1628 /*! LZ4_saveDict() :
1629 * If the previously compressed data block is not guaranteed to remain available at its memory location,
1630 * save it into a safer place (char* safeBuffer).
1631 * Note : you don't need to call LZ4_loadDict() afterwards,
1632 * the dictionary is immediately usable, so you can call LZ4_compress_fast_continue() directly.
1633 * Return : saved dictionary size in bytes (necessarily <= dictSize), or 0 if error.
1634 */
1635 int LZ4_saveDict(LZ4_stream_t *LZ4_dict, char *safeBuffer, int dictSize) {
1636 LZ4_stream_t_internal *const dict = &LZ4_dict->internal_donotuse;
1637 const BYTE *const previousDictEnd = dict->dictionary + dict->dictSize;
1639 if ((U32)dictSize > 64 KB) { dictSize = 64 KB; } /* useless to define a dictionary > 64 KB */
1640 if ((U32)dictSize > dict->dictSize) { dictSize = (int)dict->dictSize; }
1642 memmove(safeBuffer, previousDictEnd - dictSize, dictSize);
1644 dict->dictionary = (const BYTE *)safeBuffer;
1645 dict->dictSize = (U32)dictSize;
1647 return dictSize;
1648 }
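/* Usage sketch (illustrative only) : preserve the last <= 64 KB of history before the
 * just-compressed block's memory gets recycled :
 *
 *   char safeBuffer[64 * 1024];
 *   int saved = LZ4_saveDict(&ctx, safeBuffer, (int)sizeof(safeBuffer));
 *   // the next LZ4_compress_fast_continue() call can still match into safeBuffer[0..saved-1]
 */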
1652 /*-*******************************
1653 * Decompression functions
1654 ********************************/
1656 typedef enum { endOnOutputSize = 0, endOnInputSize = 1 } endCondition_directive;
1657 typedef enum { decode_full_block = 0, partial_decode = 1 } earlyEnd_directive;
1659 #undef MIN
1660 #define MIN(a,b) ( (a) < (b) ? (a) : (b) )
1662 /* Read the variable-length literal or match length.
1664 * ip - pointer to use as input.
1665 * lencheck - end-of-input pointer. An error is returned if ip advances >= lencheck.
1666 * loop_check - check ip >= lencheck inside the loop body. Returns loop_error if so.
1667 * initial_check - check ip >= lencheck before the loop starts. Returns initial_error if so.
1668 * error (output) - error code. Should be set to 0 (ok) before the call.
1669 */
1670 typedef enum { loop_error = -2, initial_error = -1, ok = 0 } variable_length_error;
1671 LZ4_FORCE_INLINE unsigned
1672 read_variable_length(const BYTE **ip, const BYTE *lencheck,
1673 int loop_check, int initial_check,
1674 variable_length_error *error) {
1675 U32 length = 0;
1676 U32 s;
1677 if (initial_check && unlikely((*ip) >= lencheck)) { /* overflow detection */
1678 *error = initial_error;
1679 return length;
1680 }
1681 do {
1682 s = **ip;
1683 (*ip)++;
1684 length += s;
1685 if (loop_check && unlikely((*ip) >= lencheck)) { /* overflow detection */
1686 *error = loop_error;
1687 return length;
1688 }
1689 } while (s == 255);
1691 return length;
1692 }
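/* Worked example : a literal run of 537 bytes is encoded as token nibble 15 (RUN_MASK)
 * followed by the extension bytes 255, 255, 12 ; this helper returns 255 + 255 + 12 = 522,
 * and the caller adds it to the 15 already taken from the token. */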
1694 int LZ4_decompress_generic(const char *const src, char *const dst, int srcSize, int outputSize, endCondition_directive endOnInput, earlyEnd_directive partialDecoding,
1695 dict_directive dict, const BYTE *const lowPrefix, const BYTE *const dictStart, const size_t dictSize);
1697 /*! LZ4_decompress_generic() :
1698 * This generic decompression function covers all use cases.
1699 * It shall be instantiated several times, using different sets of directives.
1700 * Note that it is important for performance that this function really gets inlined,
1701 * in order to remove useless branches during compilation optimization.
1702 */
1703 LZ4_FORCE_INLINE int
1704 LZ4_decompress_generic(
1705 const char *const src,
1706 char *const dst,
1707 int srcSize,
1708 int outputSize, /* If endOnInput==endOnInputSize, this value is `dstCapacity` */
1710 endCondition_directive endOnInput, /* endOnOutputSize, endOnInputSize */
1711 earlyEnd_directive partialDecoding, /* full, partial */
1712 dict_directive dict, /* noDict, withPrefix64k, usingExtDict */
1713 const BYTE *const lowPrefix, /* always <= dst, == dst when no prefix */
1714 const BYTE *const dictStart, /* only if dict==usingExtDict */
1715 const size_t dictSize /* note : = 0 if noDict */
1716 ) {
1717 if (src == NULL) { return -1; }
1719 {
1720 const BYTE *ip = (const BYTE *) src;
1721 const BYTE *const iend = ip + srcSize;
1723 BYTE *op = (BYTE *) dst;
1724 BYTE *const oend = op + outputSize;
1725 BYTE *cpy;
1727 const BYTE *const dictEnd = (dictStart == NULL) ? NULL : dictStart + dictSize;
1729 const int safeDecode = (endOnInput == endOnInputSize);
1730 const int checkOffset = ((safeDecode) && (dictSize < (int)(64 KB)));
1733 /* Set up the "end" pointers for the shortcut. */
1734 const BYTE *const shortiend = iend - (endOnInput ? 14 : 8) /*maxLL*/ - 2 /*offset*/;
1735 const BYTE *const shortoend = oend - (endOnInput ? 14 : 8) /*maxLL*/ - 18 /*maxML*/;
1737 const BYTE *match;
1738 size_t offset;
1739 unsigned token;
1740 size_t length;
1743 DEBUGLOG(5, "LZ4_decompress_generic (srcSize:%i, dstSize:%i)", srcSize, outputSize);
1745 /* Special cases */
1746 assert(lowPrefix <= op);
1747 if ((endOnInput) && (unlikely(outputSize == 0))) {
1748 /* Empty output buffer */
1749 if (partialDecoding) return 0;
1750 return ((srcSize == 1) && (*ip == 0)) ? 0 : -1;
1751 }
1752 if ((!endOnInput) && (unlikely(outputSize == 0))) { return (*ip == 0 ? 1 : -1); }
1753 if ((endOnInput) && unlikely(srcSize == 0)) { return -1; }
1755 /* Currently the fast loop shows a regression on qualcomm arm chips. */
1756 #if LZ4_FAST_DEC_LOOP
1757 if ((oend - op) < FASTLOOP_SAFE_DISTANCE) {
1758 DEBUGLOG(6, "skip fast decode loop");
1759 goto safe_decode;
1760 }
1762 /* Fast loop : decode sequences as long as output < iend-FASTLOOP_SAFE_DISTANCE */
1763 while (1) {
1764 /* Main fastloop assertion: We can always wildcopy FASTLOOP_SAFE_DISTANCE */
1765 assert(oend - op >= FASTLOOP_SAFE_DISTANCE);
1766 if (endOnInput) { assert(ip < iend); }
1767 token = *ip++;
1768 length = token >> ML_BITS; /* literal length */
1770 assert(!endOnInput || ip <= iend); /* ip < iend before the increment */
1772 /* decode literal length */
1773 if (length == RUN_MASK) {
1774 variable_length_error error = ok;
1775 length += read_variable_length(&ip, iend - RUN_MASK, (int)endOnInput, (int)endOnInput, &error);
1776 if (error == initial_error) { goto _output_error; }
1777 if ((safeDecode) && unlikely((uptrval)(op) + length < (uptrval)(op))) { goto _output_error; } /* overflow detection */
1778 if ((safeDecode) && unlikely((uptrval)(ip) + length < (uptrval)(ip))) { goto _output_error; } /* overflow detection */
1780 /* copy literals */
1781 cpy = op + length;
1782 LZ4_STATIC_ASSERT(MFLIMIT >= WILDCOPYLENGTH);
1783 if (endOnInput) { /* LZ4_decompress_safe() */
1784 if ((cpy > oend - 32) || (ip + length > iend - 32)) { goto safe_literal_copy; }
1785 LZ4_wildCopy32(op, ip, cpy);
1786 } else { /* LZ4_decompress_fast() */
1787 if (cpy > oend - 8) { goto safe_literal_copy; }
1788 LZ4_wildCopy8(op, ip, cpy); /* LZ4_decompress_fast() cannot copy more than 8 bytes at a time :
1789 * it doesn't know input length, and only relies on end-of-block properties */
1790 }
1791 ip += length;
1792 op = cpy;
1793 } else {
1794 cpy = op + length;
1795 if (endOnInput) { /* LZ4_decompress_safe() */
1796 DEBUGLOG(7, "copy %u bytes in a 16-bytes stripe", (unsigned)length);
1797 /* We don't need to check oend, since we check it once for each loop below */
1798 if (ip > iend - (16 + 1/*max lit + offset + nextToken*/)) { goto safe_literal_copy; }
1799 /* Literal length can only be up to 14 here, but we hope the fixed 16-byte copy lets compilers generate wide register moves */
1800 LZ4_memcpy(op, ip, 16);
1801 } else { /* LZ4_decompress_fast() */
1802 /* LZ4_decompress_fast() cannot copy more than 8 bytes at a time :
1803 * it doesn't know input length, and relies on end-of-block properties */
1804 LZ4_memcpy(op, ip, 8);
1805 if (length > 8) { LZ4_memcpy(op + 8, ip + 8, 8); }
1806 }
1807 ip += length;
1808 op = cpy;
1809 }
1811 /* get offset */
1812 offset = LZ4_readLE16(ip);
1813 ip += 2;
1814 match = op - offset;
1815 assert(match <= op);
1817 /* get matchlength */
1818 length = token & ML_MASK;
1820 if (length == ML_MASK) {
1821 variable_length_error error = ok;
1822 if ((checkOffset) && (unlikely(match + dictSize < lowPrefix))) { goto _output_error; } /* Error : offset outside buffers */
1823 length += read_variable_length(&ip, iend - LASTLITERALS + 1, (int)endOnInput, 0, &error);
1824 if (error != ok) { goto _output_error; }
1825 if ((safeDecode) && unlikely((uptrval)(op) + length < (uptrval)op)) { goto _output_error; } /* overflow detection */
1826 length += MINMATCH;
1827 if (op + length >= oend - FASTLOOP_SAFE_DISTANCE) {
1828 goto safe_match_copy;
1829 }
1830 } else {
1831 length += MINMATCH;
1832 if (op + length >= oend - FASTLOOP_SAFE_DISTANCE) {
1833 goto safe_match_copy;
1834 }
1836 /* Fastpath check: Avoids a branch in LZ4_wildCopy32 if true */
1837 if ((dict == withPrefix64k) || (match >= lowPrefix)) {
1838 if (offset >= 8) {
1839 assert(match >= lowPrefix);
1840 assert(match <= op);
1841 assert(op + 18 <= oend);
1843 LZ4_memcpy(op, match, 8);
1844 LZ4_memcpy(op + 8, match + 8, 8);
1845 LZ4_memcpy(op + 16, match + 16, 2);
1846 op += length;
1847 continue;
1848 }
1849 }
1850 }
1852 if (checkOffset && (unlikely(match + dictSize < lowPrefix))) { goto _output_error; } /* Error : offset outside buffers */
1853 /* match starting within external dictionary */
1854 if ((dict == usingExtDict) && (match < lowPrefix)) {
1855 if (unlikely(op + length > oend - LASTLITERALS)) {
1856 if (partialDecoding) {
1857 DEBUGLOG(7, "partialDecoding: dictionary match, close to dstEnd");
1858 length = MIN(length, (size_t)(oend - op));
1859 } else {
1860 goto _output_error; /* end-of-block condition violated */
1861 }
1862 }
1864 if (length <= (size_t)(lowPrefix - match)) {
1865 /* match fits entirely within external dictionary : just copy */
1866 memmove(op, dictEnd - (lowPrefix - match), length);
1867 op += length;
1868 } else {
1869 /* match stretches into both external dictionary and current block */
1870 size_t const copySize = (size_t)(lowPrefix - match);
1871 size_t const restSize = length - copySize;
1872 LZ4_memcpy(op, dictEnd - copySize, copySize);
1873 op += copySize;
1874 if (restSize > (size_t)(op - lowPrefix)) { /* overlap copy */
1875 BYTE *const endOfMatch = op + restSize;
1876 const BYTE *copyFrom = lowPrefix;
1877 while (op < endOfMatch) { *op++ = *copyFrom++; }
1878 } else {
1879 LZ4_memcpy(op, lowPrefix, restSize);
1880 op += restSize;
1881 }
1882 }
1883 continue;
1884 }
1886 /* copy match within block */
1887 cpy = op + length;
1889 assert((op <= oend) && (oend - op >= 32));
1890 if (unlikely(offset < 16)) {
1891 LZ4_memcpy_using_offset(op, match, cpy, offset);
1892 } else {
1893 LZ4_wildCopy32(op, match, cpy);
1894 }
1896 op = cpy; /* wildcopy correction */
1897 }
1898 safe_decode:
1899 #endif
1901 /* Main Loop : decode remaining sequences where output < FASTLOOP_SAFE_DISTANCE */
1902 while (1) {
1903 token = *ip++;
1904 length = token >> ML_BITS; /* literal length */
1906 assert(!endOnInput || ip <= iend); /* ip < iend before the increment */
1908 /* A two-stage shortcut for the most common case:
1909 * 1) If the literal length is 0..14, and there is enough space,
1910 * enter the shortcut and copy 16 bytes on behalf of the literals
1911 * (in the fast mode, only 8 bytes can be safely copied this way).
1912 * 2) Further if the match length is 4..18, copy 18 bytes in a similar
1913 * manner; but we ensure that there's enough space in the output for
1914 * those 18 bytes earlier, upon entering the shortcut (in other words,
1915 * there is a combined check for both stages).
1916 */
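/* Worked example : token 0x54 has literal-length nibble 5 (<= 14, so stage 1 applies)
 * and match-length nibble 4 (!= ML_MASK), i.e. a 4 + MINMATCH = 8 byte match,
 * so both stages can run : 16 literal bytes and 18 match bytes are copied speculatively,
 * then op and ip are advanced by the true lengths. */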
1917 if ((endOnInput ? length != RUN_MASK : length <= 8)
1918 /* strictly "less than" on input, to re-enter the loop with at least one byte */
1919 && likely((endOnInput ? ip < shortiend : 1) & (op <= shortoend))) {
1920 /* Copy the literals */
1921 LZ4_memcpy(op, ip, endOnInput ? 16 : 8);
1922 op += length;
1923 ip += length;
1925 /* The second stage: prepare for match copying, decode full info.
1926 * If it doesn't work out, the info won't be wasted. */
1927 length = token & ML_MASK; /* match length */
1928 offset = LZ4_readLE16(ip);
1929 ip += 2;
1930 match = op - offset;
1931 assert(match <= op); /* check overflow */
1933 /* Do not deal with overlapping matches. */
1934 if ((length != ML_MASK)
1935 && (offset >= 8)
1936 && (dict == withPrefix64k || match >= lowPrefix)) {
1937 /* Copy the match. */
1938 LZ4_memcpy(op + 0, match + 0, 8);
1939 LZ4_memcpy(op + 8, match + 8, 8);
1940 LZ4_memcpy(op + 16, match + 16, 2);
1941 op += length + MINMATCH;
1942 /* Both stages worked, load the next token. */
1943 continue;
1944 }
1946 /* The second stage didn't work out, but the info is ready.
1947 * Propel it right to the point of match copying. */
1948 goto _copy_match;
1949 }
1951 /* decode literal length */
1952 if (length == RUN_MASK) {
1953 variable_length_error error = ok;
1954 length += read_variable_length(&ip, iend - RUN_MASK, (int)endOnInput, (int)endOnInput, &error);
1955 if (error == initial_error) { goto _output_error; }
1956 if ((safeDecode) && unlikely((uptrval)(op) + length < (uptrval)(op))) { goto _output_error; } /* overflow detection */
1957 if ((safeDecode) && unlikely((uptrval)(ip) + length < (uptrval)(ip))) { goto _output_error; } /* overflow detection */
1958 }
1960 /* copy literals */
1961 cpy = op + length;
1962 #if LZ4_FAST_DEC_LOOP
1963 safe_literal_copy:
1964 #endif
1965 LZ4_STATIC_ASSERT(MFLIMIT >= WILDCOPYLENGTH);
1966 if (((endOnInput) && ((cpy > oend - MFLIMIT) || (ip + length > iend - (2 + 1 + LASTLITERALS))))
1967 || ((!endOnInput) && (cpy > oend - WILDCOPYLENGTH))) {
1968 /* We've either hit the input parsing restriction or the output parsing restriction.
1969 * In the normal scenario, decoding a full block, it must be the last sequence,
1970 * otherwise it's an error (invalid input or dimensions).
1971 * In partialDecoding scenario, it's necessary to ensure there is no buffer overflow.
1972 */
1973 if (partialDecoding) {
1974 /* Since we are partial decoding we may be in this block because of the output parsing
1975 * restriction, which is not valid since the output buffer is allowed to be undersized.
1976 */
1977 assert(endOnInput);
1978 DEBUGLOG(7, "partialDecoding: copying literals, close to input or output end")
1979 DEBUGLOG(7, "partialDecoding: literal length = %u", (unsigned)length);
1980 DEBUGLOG(7, "partialDecoding: remaining space in dstBuffer : %i", (int)(oend - op));
1981 DEBUGLOG(7, "partialDecoding: remaining space in srcBuffer : %i", (int)(iend - ip));
1982 /* Finishing in the middle of a literals segment,
1983 * due to lack of input.
1984 */
1985 if (ip + length > iend) {
1986 length = (size_t)(iend - ip);
1987 cpy = op + length;
1988 }
1989 /* Finishing in the middle of a literals segment,
1990 * due to lack of output space.
1991 */
1992 if (cpy > oend) {
1993 cpy = oend;
1994 assert(op <= oend);
1995 length = (size_t)(oend - op);
1996 }
1997 } else {
1998 /* We must be on the last sequence because of the parsing limitations so check
1999 * that we exactly regenerate the original size (must be exact when !endOnInput).
2000 */
2001 if ((!endOnInput) && (cpy != oend)) { goto _output_error; }
2002 /* We must be on the last sequence (or invalid) because of the parsing limitations
2003 * so check that we exactly consume the input and don't overrun the output buffer.
2004 */
2005 if ((endOnInput) && ((ip + length != iend) || (cpy > oend))) {
2006 DEBUGLOG(6, "should have been last run of literals")
2007 DEBUGLOG(6, "ip(%p) + length(%i) = %p != iend (%p)", ip, (int)length, ip + length, iend);
2008 DEBUGLOG(6, "or cpy(%p) > oend(%p)", cpy, oend);
2009 goto _output_error;
2010 }
2011 }
2012 memmove(op, ip, length); /* supports overlapping memory regions; only matters for in-place decompression scenarios */
2013 ip += length;
2014 op += length;
2015 /* Necessarily EOF when !partialDecoding.
2016 * When partialDecoding, it is EOF if we've either
2017 * filled the output buffer or
2018 * can't proceed with reading an offset for following match.
2019 */
2020 if (!partialDecoding || (cpy == oend) || (ip >= (iend - 2))) {
2021 break;
2022 }
2023 } else {
2024 LZ4_wildCopy8(op, ip, cpy); /* may overwrite up to WILDCOPYLENGTH beyond cpy */
2025 ip += length;
2026 op = cpy;
2027 }
2029 /* get offset */
2030 offset = LZ4_readLE16(ip);
2031 ip += 2;
2032 match = op - offset;
2034 /* get matchlength */
2035 length = token & ML_MASK;
2037 _copy_match:
2038 if (length == ML_MASK) {
2039 variable_length_error error = ok;
2040 length += read_variable_length(&ip, iend - LASTLITERALS + 1, (int)endOnInput, 0, &error);
2041 if (error != ok) goto _output_error;
2042 if ((safeDecode) && unlikely((uptrval)(op) + length < (uptrval)op)) goto _output_error; /* overflow detection */
2043 }
2044 length += MINMATCH;
2046 #if LZ4_FAST_DEC_LOOP
2047 safe_match_copy:
2048 #endif
2049 if ((checkOffset) && (unlikely(match + dictSize < lowPrefix))) goto _output_error; /* Error : offset outside buffers */
2050 /* match starting within external dictionary */
2051 if ((dict == usingExtDict) && (match < lowPrefix)) {
2052 if (unlikely(op + length > oend - LASTLITERALS)) {
2053 if (partialDecoding) length = MIN(length, (size_t)(oend - op));
2054 else goto _output_error; /* doesn't respect parsing restriction */
2055 }
2057 if (length <= (size_t)(lowPrefix - match)) {
2058 /* match fits entirely within external dictionary : just copy */
2059 memmove(op, dictEnd - (lowPrefix - match), length);
2060 op += length;
2061 } else {
2062 /* match stretches into both external dictionary and current block */
2063 size_t const copySize = (size_t)(lowPrefix - match);
2064 size_t const restSize = length - copySize;
2065 LZ4_memcpy(op, dictEnd - copySize, copySize);
2066 op += copySize;
2067 if (restSize > (size_t)(op - lowPrefix)) { /* overlap copy */
2068 BYTE *const endOfMatch = op + restSize;
2069 const BYTE *copyFrom = lowPrefix;
2070 while (op < endOfMatch) *op++ = *copyFrom++;
2071 } else {
2072 LZ4_memcpy(op, lowPrefix, restSize);
2073 op += restSize;
2074 }
2075 }
2076 continue;
2077 }
2078 assert(match >= lowPrefix);
2080 /* copy match within block */
2081 cpy = op + length;
2083 /* partialDecoding : may end anywhere within the block */
2084 assert(op <= oend);
2085 if (partialDecoding && (cpy > oend - MATCH_SAFEGUARD_DISTANCE)) {
2086 size_t const mlen = MIN(length, (size_t)(oend - op));
2087 const BYTE *const matchEnd = match + mlen;
2088 BYTE *const copyEnd = op + mlen;
2089 if (matchEnd > op) { /* overlap copy */
2090 while (op < copyEnd) { *op++ = *match++; }
2091 } else {
2092 LZ4_memcpy(op, match, mlen);
2094 op = copyEnd;
2095 if (op == oend) { break; }
2096 continue;
2097 }
2099 if (unlikely(offset < 8)) {
2100 LZ4_write32(op, 0); /* silence msan warning when offset==0 */
2101 op[0] = match[0];
2102 op[1] = match[1];
2103 op[2] = match[2];
2104 op[3] = match[3];
2105 match += inc32table[offset];
2106 LZ4_memcpy(op + 4, match, 4);
2107 match -= dec64table[offset];
2108 } else {
2109 LZ4_memcpy(op, match, 8);
2110 match += 8;
2111 }
2112 op += 8;
2114 if (unlikely(cpy > oend - MATCH_SAFEGUARD_DISTANCE)) {
2115 BYTE *const oCopyLimit = oend - (WILDCOPYLENGTH - 1);
2116 if (cpy > oend - LASTLITERALS) { goto _output_error; } /* Error : last LASTLITERALS bytes must be literals (uncompressed) */
2117 if (op < oCopyLimit) {
2118 LZ4_wildCopy8(op, match, oCopyLimit);
2119 match += oCopyLimit - op;
2120 op = oCopyLimit;
2121 }
2122 while (op < cpy) { *op++ = *match++; }
2123 } else {
2124 LZ4_memcpy(op, match, 8);
2125 if (length > 16) { LZ4_wildCopy8(op + 8, match + 8, cpy); }
2126 }
2127 op = cpy; /* wildcopy correction */
2128 }
2130 /* end of decoding */
2131 if (endOnInput) {
2132 DEBUGLOG(5, "decoded %i bytes", (int)(((char *)op) - dst));
2133 return (int)(((char *)op) - dst); /* Nb of output bytes decoded */
2134 } else {
2135 return (int)(((const char *)ip) - src); /* Nb of input bytes read */
2136 }
2138 /* Overflow error detected */
2139 _output_error:
2140 return (int)(-(((const char *)ip) - src)) - 1;
2141 }
2142 }
2145 /*===== Instantiate the API decoding functions. =====*/
2147 LZ4_FORCE_O2_GCC_PPC64LE
2148 int LZ4_decompress_safe(const char *src, char *dst, int compressedSize, int maxDecompressedSize) {
2149 return LZ4_decompress_generic(src, dst, compressedSize, maxDecompressedSize,
2150 endOnInputSize, decode_full_block, noDict,
2151 (BYTE *)dst, NULL, 0);
2152 }
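/* Usage sketch (illustrative only; cmpBuf, outBuf and handle_corrupt_input() are placeholders) :
 *
 *   int n = LZ4_decompress_safe(cmpBuf, outBuf, cmpSize, (int)sizeof(outBuf));
 *   if (n < 0) { handle_corrupt_input(); }   // a negative return means malformed input
 */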
2154 LZ4_FORCE_O2_GCC_PPC64LE
2155 int LZ4_decompress_safe_partial(const char *src, char *dst, int compressedSize, int targetOutputSize, int dstCapacity) {
2156 dstCapacity = MIN(targetOutputSize, dstCapacity);
2157 return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity,
2158 endOnInputSize, partial_decode,
2159 noDict, (BYTE *)dst, NULL, 0);
2160 }
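/* Usage sketch (illustrative only) : decode only the first 512 bytes of a block,
 * e.g. to peek at a header, without decompressing the rest :
 *
 *   int got = LZ4_decompress_safe_partial(cmpBuf, outBuf, cmpSize, 512, (int)sizeof(outBuf));
 *   // got is <= 512 ; it can be smaller if the block itself ends earlier
 */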
2162 LZ4_FORCE_O2_GCC_PPC64LE
2163 int LZ4_decompress_fast(const char *src, char *dst, int originalSize) {
2164 return LZ4_decompress_generic(src, dst, 0, originalSize,
2165 endOnOutputSize, decode_full_block, withPrefix64k,
2166 (BYTE *)dst - 64 KB, NULL, 0);
2167 }
2169 /*===== Instantiate a few more decoding cases, used more than once. =====*/
2171 LZ4_FORCE_O2_GCC_PPC64LE /* Exported, an obsolete API function. */
2172 int LZ4_decompress_safe_withPrefix64k(const char *src, char *dst, int compressedSize, int dstCapacity) {
2173 return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity,
2174 endOnInputSize, decode_full_block, withPrefix64k,
2175 (BYTE *)dst - 64 KB, NULL, 0);
2176 }
2178 /* Another obsolete API function, paired with the previous one. */
2179 int LZ4_decompress_fast_withPrefix64k(const char *src, char *dst, int originalSize) {
2180 /* LZ4_decompress_fast doesn't validate match offsets,
2181 * and thus serves well with any prefixed dictionary. */
2182 return LZ4_decompress_fast(src, dst, originalSize);
2183 }
2185 LZ4_FORCE_O2_GCC_PPC64LE
2186 static int LZ4_decompress_safe_withSmallPrefix(const char *src, char *dst, int compressedSize, int dstCapacity,
2187 size_t prefixSize) {
2188 return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity,
2189 endOnInputSize, decode_full_block, noDict,
2190 (BYTE *)dst - prefixSize, NULL, 0);
2191 }
2193 LZ4_FORCE_O2_GCC_PPC64LE
2194 int LZ4_decompress_safe_forceExtDict(const char *src, char *dst,
2195 int compressedSize, int dstCapacity,
2196 const void *dictStart, size_t dictSize) {
2197 return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity,
2198 endOnInputSize, decode_full_block, usingExtDict,
2199 (BYTE *)dst, (const BYTE *)dictStart, dictSize);
2200 }
2202 LZ4_FORCE_O2_GCC_PPC64LE
2203 static int LZ4_decompress_fast_extDict(const char *src, char *dst, int originalSize,
2204 const void *dictStart, size_t dictSize) {
2205 return LZ4_decompress_generic(src, dst, 0, originalSize,
2206 endOnOutputSize, decode_full_block, usingExtDict,
2207 (BYTE *)dst, (const BYTE *)dictStart, dictSize);
2208 }
2210 /* The "double dictionary" mode, for use with e.g. ring buffers: the first part
2211 * of the dictionary is passed as prefix, and the second via dictStart + dictSize.
2212 * These routines are used only once, in LZ4_decompress_*_continue().
2213 */
2214 LZ4_FORCE_INLINE
2215 int LZ4_decompress_safe_doubleDict(const char *src, char *dst, int compressedSize, int dstCapacity,
2216 size_t prefixSize, const void *dictStart, size_t dictSize) {
2217 return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity,
2218 endOnInputSize, decode_full_block, usingExtDict,
2219 (BYTE *)dst - prefixSize, (const BYTE *)dictStart, dictSize);
2220 }
2222 LZ4_FORCE_INLINE
2223 int LZ4_decompress_fast_doubleDict(const char *src, char *dst, int originalSize,
2224 size_t prefixSize, const void *dictStart, size_t dictSize) {
2225 return LZ4_decompress_generic(src, dst, 0, originalSize,
2226 endOnOutputSize, decode_full_block, usingExtDict,
2227 (BYTE *)dst - prefixSize, (const BYTE *)dictStart, dictSize);
2228 }
2230 /*===== streaming decompression functions =====*/
2232 LZ4_streamDecode_t *LZ4_createStreamDecode(void) {
2233 LZ4_streamDecode_t *lz4s = (LZ4_streamDecode_t *) ALLOC_AND_ZERO(sizeof(LZ4_streamDecode_t));
2234 LZ4_STATIC_ASSERT(LZ4_STREAMDECODESIZE >= sizeof(LZ4_streamDecode_t_internal)); /* A compilation error here means LZ4_STREAMDECODESIZE is not large enough */
2235 return lz4s;
2236 }
2238 int LZ4_freeStreamDecode(LZ4_streamDecode_t *LZ4_stream) {
2239 if (LZ4_stream == NULL) { return 0; } /* support free on NULL */
2240 FREEMEM(LZ4_stream);
2241 return 0;
2242 }
2244 /*! LZ4_setStreamDecode() :
2245 * Use this function to tell the decoder where to find the dictionary.
2246 * This function is not necessary if previously decoded data is still available where it was decoded.
2247 * Loading a size of 0 is allowed (same effect as no dictionary).
2248 * @return : 1 if OK, 0 if error
2249 */
2250 int LZ4_setStreamDecode(LZ4_streamDecode_t *LZ4_streamDecode, const char *dictionary, int dictSize) {
2251 LZ4_streamDecode_t_internal *lz4sd = &LZ4_streamDecode->internal_donotuse;
2252 lz4sd->prefixSize = (size_t) dictSize;
2253 lz4sd->prefixEnd = (const BYTE *) dictionary + dictSize;
2254 lz4sd->externalDict = NULL;
2255 lz4sd->extDictSize = 0;
2256 return 1;
2257 }
2259 /*! LZ4_decoderRingBufferSize() :
2260 * when setting a ring buffer for streaming decompression (optional scenario),
2261 * provides the minimum size of this ring buffer
2262 * to be compatible with any source respecting the maxBlockSize condition.
2263 * Note : in a ring buffer scenario,
2264 * blocks are presumed decompressed next to each other.
2265 * When not enough space remains for next block (remainingSize < maxBlockSize),
2266 * decoding resumes from beginning of ring buffer.
2267 * @return : minimum ring buffer size,
2268 * or 0 if there is an error (invalid maxBlockSize).
2269 */
2270 int LZ4_decoderRingBufferSize(int maxBlockSize) {
2271 if (maxBlockSize < 0) return 0;
2272 if (maxBlockSize > LZ4_MAX_INPUT_SIZE) return 0;
2273 if (maxBlockSize < 16) maxBlockSize = 16;
2274 return LZ4_DECODER_RING_BUFFER_SIZE(maxBlockSize);
2275 }
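/* Usage sketch (illustrative only) : size a decode ring buffer for 4 KB blocks :
 *
 *   int rbSize = LZ4_decoderRingBufferSize(4 * 1024);   // enough for 64 KB of history plus one block, per the note above
 *   char *ring = (char *)malloc((size_t)rbSize);
 */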
2277 /*
2278 *_continue() :
2279 These decoding functions allow decompression of multiple blocks in "streaming" mode.
2280 Previously decoded blocks must still be available at the memory position where they were decoded.
2281 If it's not possible, save the relevant part of decoded data into a safe buffer,
2282 and indicate where it stands using LZ4_setStreamDecode()
2283 */
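/* Usage sketch (illustrative only; recv_block(), cmp, cmpSize, BLOCK_MAX, ring and rbSize are
 * placeholders; the caller must keep the last 64 KB of decoded data unmodified, here by
 * decoding into a ring buffer sized with LZ4_decoderRingBufferSize()) :
 *
 *   LZ4_streamDecode_t sd;
 *   LZ4_setStreamDecode(&sd, NULL, 0);
 *   char *decPtr = ring;
 *   while (recv_block(cmp, &cmpSize)) {
 *       int n = LZ4_decompress_safe_continue(&sd, cmp, decPtr, cmpSize, BLOCK_MAX);
 *       if (n < 0) break;
 *       decPtr += n;
 *       if (decPtr + BLOCK_MAX > ring + rbSize) decPtr = ring;   // wrap when the next block no longer fits
 *   }
 */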
2284 LZ4_FORCE_O2_GCC_PPC64LE
2285 int LZ4_decompress_safe_continue(LZ4_streamDecode_t *LZ4_streamDecode, const char *src, char *dst, int compressedSize, int dstCapacity) {
2286 LZ4_streamDecode_t_internal *lz4sd = &LZ4_streamDecode->internal_donotuse;
2287 int result;
2289 if (lz4sd->prefixSize == 0) {
2290 /* The first call, no dictionary yet. */
2291 assert(lz4sd->extDictSize == 0);
2292 result = LZ4_decompress_safe(src, dst, compressedSize, dstCapacity);
2293 if (result <= 0) return result;
2294 lz4sd->prefixSize = (size_t)result;
2295 lz4sd->prefixEnd = (BYTE *)dst + result;
2296 } else if (lz4sd->prefixEnd == (BYTE *)dst) {
2297 /* They're rolling the current segment. */
2298 if (lz4sd->prefixSize >= 64 KB - 1)
2299 result = LZ4_decompress_safe_withPrefix64k(src, dst, compressedSize, dstCapacity);
2300 else if (lz4sd->extDictSize == 0)
2301 result = LZ4_decompress_safe_withSmallPrefix(src, dst, compressedSize, dstCapacity,
2302 lz4sd->prefixSize);
2303 else
2304 result = LZ4_decompress_safe_doubleDict(src, dst, compressedSize, dstCapacity,
2305 lz4sd->prefixSize, lz4sd->externalDict, lz4sd->extDictSize);
2306 if (result <= 0) return result;
2307 lz4sd->prefixSize += (size_t)result;
2308 lz4sd->prefixEnd += result;
2309 } else {
2310 /* The buffer wraps around, or they're switching to another buffer. */
2311 lz4sd->extDictSize = lz4sd->prefixSize;
2312 lz4sd->externalDict = lz4sd->prefixEnd - lz4sd->extDictSize;
2313 result = LZ4_decompress_safe_forceExtDict(src, dst, compressedSize, dstCapacity,
2314 lz4sd->externalDict, lz4sd->extDictSize);
2315 if (result <= 0) return result;
2316 lz4sd->prefixSize = (size_t)result;
2317 lz4sd->prefixEnd = (BYTE *)dst + result;
2318 }
2320 return result;
2321 }
2323 LZ4_FORCE_O2_GCC_PPC64LE
2324 int LZ4_decompress_fast_continue(LZ4_streamDecode_t *LZ4_streamDecode, const char *src, char *dst, int originalSize) {
2325 LZ4_streamDecode_t_internal *lz4sd = &LZ4_streamDecode->internal_donotuse;
2326 int result;
2327 assert(originalSize >= 0);
2329 if (lz4sd->prefixSize == 0) {
2330 assert(lz4sd->extDictSize == 0);
2331 result = LZ4_decompress_fast(src, dst, originalSize);
2332 if (result <= 0) return result;
2333 lz4sd->prefixSize = (size_t)originalSize;
2334 lz4sd->prefixEnd = (BYTE *)dst + originalSize;
2335 } else if (lz4sd->prefixEnd == (BYTE *)dst) {
2336 if (lz4sd->prefixSize >= 64 KB - 1 || lz4sd->extDictSize == 0)
2337 result = LZ4_decompress_fast(src, dst, originalSize);
2338 else
2339 result = LZ4_decompress_fast_doubleDict(src, dst, originalSize,
2340 lz4sd->prefixSize, lz4sd->externalDict, lz4sd->extDictSize);
2341 if (result <= 0) return result;
2342 lz4sd->prefixSize += (size_t)originalSize;
2343 lz4sd->prefixEnd += originalSize;
2344 } else {
2345 lz4sd->extDictSize = lz4sd->prefixSize;
2346 lz4sd->externalDict = lz4sd->prefixEnd - lz4sd->extDictSize;
2347 result = LZ4_decompress_fast_extDict(src, dst, originalSize,
2348 lz4sd->externalDict, lz4sd->extDictSize);
2349 if (result <= 0) return result;
2350 lz4sd->prefixSize = (size_t)originalSize;
2351 lz4sd->prefixEnd = (BYTE *)dst + originalSize;
2352 }
2354 return result;
2355 }
2358 /*
2359 Advanced decoding functions :
2360 *_usingDict() :
2361 These decoding functions work the same as the "_continue" ones,
2362 except that the dictionary must be provided explicitly as a parameter.
2363 */
2365 int LZ4_decompress_safe_usingDict(const char *src, char *dst, int compressedSize, int dstCapacity, const char *dictStart, int dictSize) {
2366 if (dictSize == 0)
2367 return LZ4_decompress_safe(src, dst, compressedSize, dstCapacity);
2368 if (dictStart + dictSize == dst) {
2369 if (dictSize >= 64 KB - 1) {
2370 return LZ4_decompress_safe_withPrefix64k(src, dst, compressedSize, dstCapacity);
2371 }
2372 assert(dictSize >= 0);
2373 return LZ4_decompress_safe_withSmallPrefix(src, dst, compressedSize, dstCapacity, (size_t)dictSize);
2374 }
2375 assert(dictSize >= 0);
2376 return LZ4_decompress_safe_forceExtDict(src, dst, compressedSize, dstCapacity, dictStart, (size_t)dictSize);
2377 }
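/* Usage sketch (illustrative only; buffer names are placeholders) : one-shot decompression
 * against an external dictionary :
 *
 *   int n = LZ4_decompress_safe_usingDict(cmpBuf, outBuf, cmpSize, (int)sizeof(outBuf),
 *                                         dictBuf, dictLen);
 *
 * Performance is best when outBuf directly follows the dictionary in memory
 * (dictStart + dictSize == dst), which selects the prefix fast path above. */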
2379 int LZ4_decompress_fast_usingDict(const char *src, char *dst, int originalSize, const char *dictStart, int dictSize) {
2380 if (dictSize == 0 || dictStart + dictSize == dst)
2381 return LZ4_decompress_fast(src, dst, originalSize);
2382 assert(dictSize >= 0);
2383 return LZ4_decompress_fast_extDict(src, dst, originalSize, dictStart, (size_t)dictSize);
2384 }
2387 /*=*************************************************
2388 * Obsolete Functions
2389 ***************************************************/
2390 /* obsolete compression functions */
2391 int LZ4_compress_limitedOutput(const char *src, char *dst, int srcSize, int dstCapacity) {
2392 return LZ4_compress_default(src, dst, srcSize, dstCapacity);
2393 }
2394 int LZ4_compress(const char *src, char *dst, int srcSize) {
2395 return LZ4_compress_default(src, dst, srcSize, LZ4_compressBound(srcSize));
2396 }
2397 int LZ4_compress_limitedOutput_withState(void *state, const char *src, char *dst, int srcSize, int dstSize) {
2398 return LZ4_compress_fast_extState(state, src, dst, srcSize, dstSize, 1);
2399 }
2400 int LZ4_compress_withState(void *state, const char *src, char *dst, int srcSize) {
2401 return LZ4_compress_fast_extState(state, src, dst, srcSize, LZ4_compressBound(srcSize), 1);
2402 }
2403 int LZ4_compress_limitedOutput_continue(LZ4_stream_t *LZ4_stream, const char *src, char *dst, int srcSize, int dstCapacity) {
2404 return LZ4_compress_fast_continue(LZ4_stream, src, dst, srcSize, dstCapacity, 1);
2405 }
2406 int LZ4_compress_continue(LZ4_stream_t *LZ4_stream, const char *src, char *dst, int srcSize) {
2407 return LZ4_compress_fast_continue(LZ4_stream, src, dst, srcSize, LZ4_compressBound(srcSize), 1);
2408 }
2410 /*
2411 These decompression functions are deprecated and should no longer be used.
2412 They are only provided here for compatibility with older user programs.
2413 - LZ4_uncompress is totally equivalent to LZ4_decompress_fast
2414 - LZ4_uncompress_unknownOutputSize is totally equivalent to LZ4_decompress_safe
2415 */
2416 int LZ4_uncompress(const char *src, char *dst, int outputSize) {
2417 return LZ4_decompress_fast(src, dst, outputSize);
2418 }
2419 int LZ4_uncompress_unknownOutputSize(const char *src, char *dst, int isize, int dstCapacity) {
2420 return LZ4_decompress_safe(src, dst, isize, dstCapacity);
2421 }
2423 /* Obsolete Streaming functions */
2425 int LZ4_sizeofStreamState(void) { return LZ4_STREAMSIZE; }
2427 int LZ4_resetStreamState(void *state, char *inputBuffer) {
2428 (void)inputBuffer;
2429 LZ4_resetStream((LZ4_stream_t *)state);
2430 return 0;
2431 }
2433 void *LZ4_create(char *inputBuffer) {
2434 (void)inputBuffer;
2435 return LZ4_createStream();
2436 }
2438 char *LZ4_slideInputBuffer(void *state) {
2439 /* avoid const char * -> char * conversion warning */
2440 return (char *)(uptrval)((LZ4_stream_t *)state)->internal_donotuse.dictionary;
2441 }
2443 #endif /* LZ4_COMMONDEFS_ONLY */