2 * Huffman encoder, part of New Generation Entropy library
3 * Copyright (C) 2013-2016, Yann Collet.
5 * BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions are
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above
14 * copyright notice, this list of conditions and the following disclaimer
15 * in the documentation and/or other materials provided with the
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30 * This program is free software; you can redistribute it and/or modify it under
31 * the terms of the GNU General Public License version 2 as published by the
32 * Free Software Foundation. This program is dual-licensed; you may select
33 * either version 2 of the GNU General Public License ("GPL") or BSD license
36 * You can contact the author at :
37 * - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
40 /* **************************************************************
42 ****************************************************************/
43 #include "bitstream.h"
44 #include "fse.h" /* header compression */
46 #include <linux/kernel.h>
47 #include <linux/string.h> /* memcpy, memset */
49 /* **************************************************************
51 ****************************************************************/
52 #define HUF_STATIC_ASSERT(c) \
54 enum { HUF_static_assert = 1 / (int)(!!(c)) }; \
55 } /* use only *after* variable declarations */
56 #define CHECK_V_F(e, f) \
62 CHECK_V_F(_var_err__, f); \
65 /* **************************************************************
67 ****************************************************************/
68 unsigned HUF_optimalTableLog(unsigned maxTableLog
, size_t srcSize
, unsigned maxSymbolValue
)
70 return FSE_optimalTableLog_internal(maxTableLog
, srcSize
, maxSymbolValue
, 1);
73 /* *******************************************************
74 * HUF : Huffman block compression
75 *********************************************************/
76 /* HUF_compressWeights() :
77 * Same as FSE_compress(), but dedicated to huff0's weights compression.
78 * The use case needs much less stack memory.
79 * Note : all elements within weightTable are supposed to be <= HUF_TABLELOG_MAX.
81 #define MAX_FSE_TABLELOG_FOR_HUFF_HEADER 6
82 size_t HUF_compressWeights_wksp(void *dst
, size_t dstSize
, const void *weightTable
, size_t wtSize
, void *workspace
, size_t workspaceSize
)
84 BYTE
*const ostart
= (BYTE
*)dst
;
86 BYTE
*const oend
= ostart
+ dstSize
;
88 U32 maxSymbolValue
= HUF_TABLELOG_MAX
;
89 U32 tableLog
= MAX_FSE_TABLELOG_FOR_HUFF_HEADER
;
94 size_t spaceUsed32
= 0;
96 HUF_STATIC_ASSERT(sizeof(FSE_CTable
) == sizeof(U32
));
98 CTable
= (FSE_CTable
*)((U32
*)workspace
+ spaceUsed32
);
99 spaceUsed32
+= FSE_CTABLE_SIZE_U32(MAX_FSE_TABLELOG_FOR_HUFF_HEADER
, HUF_TABLELOG_MAX
);
100 count
= (U32
*)workspace
+ spaceUsed32
;
101 spaceUsed32
+= HUF_TABLELOG_MAX
+ 1;
102 norm
= (S16
*)((U32
*)workspace
+ spaceUsed32
);
103 spaceUsed32
+= ALIGN(sizeof(S16
) * (HUF_TABLELOG_MAX
+ 1), sizeof(U32
)) >> 2;
105 if ((spaceUsed32
<< 2) > workspaceSize
)
106 return ERROR(tableLog_tooLarge
);
107 workspace
= (U32
*)workspace
+ spaceUsed32
;
108 workspaceSize
-= (spaceUsed32
<< 2);
110 /* init conditions */
112 return 0; /* Not compressible */
114 /* Scan input and build symbol stats */
116 CHECK_V_F(maxCount
, FSE_count_simple(count
, &maxSymbolValue
, weightTable
, wtSize
));
117 if (maxCount
== wtSize
)
118 return 1; /* only a single symbol in src : rle */
120 return 0; /* each symbol present maximum once => not compressible */
123 tableLog
= FSE_optimalTableLog(tableLog
, wtSize
, maxSymbolValue
);
124 CHECK_F(FSE_normalizeCount(norm
, tableLog
, count
, wtSize
, maxSymbolValue
));
126 /* Write table description header */
128 CHECK_V_F(hSize
, FSE_writeNCount(op
, oend
- op
, norm
, maxSymbolValue
, tableLog
));
133 CHECK_F(FSE_buildCTable_wksp(CTable
, norm
, maxSymbolValue
, tableLog
, workspace
, workspaceSize
));
135 CHECK_V_F(cSize
, FSE_compress_usingCTable(op
, oend
- op
, weightTable
, wtSize
, CTable
));
137 return 0; /* not enough space for compressed data */
147 }; /* typedef'd to HUF_CElt within "huf.h" */
149 /*! HUF_writeCTable_wksp() :
150 `CTable` : Huffman tree to save, using huf representation.
151 @return : size of saved CTable */
152 size_t HUF_writeCTable_wksp(void *dst
, size_t maxDstSize
, const HUF_CElt
*CTable
, U32 maxSymbolValue
, U32 huffLog
, void *workspace
, size_t workspaceSize
)
154 BYTE
*op
= (BYTE
*)dst
;
159 size_t spaceUsed32
= 0;
161 bitsToWeight
= (BYTE
*)((U32
*)workspace
+ spaceUsed32
);
162 spaceUsed32
+= ALIGN(HUF_TABLELOG_MAX
+ 1, sizeof(U32
)) >> 2;
163 huffWeight
= (BYTE
*)((U32
*)workspace
+ spaceUsed32
);
164 spaceUsed32
+= ALIGN(HUF_SYMBOLVALUE_MAX
, sizeof(U32
)) >> 2;
166 if ((spaceUsed32
<< 2) > workspaceSize
)
167 return ERROR(tableLog_tooLarge
);
168 workspace
= (U32
*)workspace
+ spaceUsed32
;
169 workspaceSize
-= (spaceUsed32
<< 2);
171 /* check conditions */
172 if (maxSymbolValue
> HUF_SYMBOLVALUE_MAX
)
173 return ERROR(maxSymbolValue_tooLarge
);
175 /* convert to weight */
177 for (n
= 1; n
< huffLog
+ 1; n
++)
178 bitsToWeight
[n
] = (BYTE
)(huffLog
+ 1 - n
);
179 for (n
= 0; n
< maxSymbolValue
; n
++)
180 huffWeight
[n
] = bitsToWeight
[CTable
[n
].nbBits
];
182 /* attempt weights compression by FSE */
184 CHECK_V_F(hSize
, HUF_compressWeights_wksp(op
+ 1, maxDstSize
- 1, huffWeight
, maxSymbolValue
, workspace
, workspaceSize
));
185 if ((hSize
> 1) & (hSize
< maxSymbolValue
/ 2)) { /* FSE compressed */
191 /* write raw values as 4-bits (max : 15) */
192 if (maxSymbolValue
> (256 - 128))
193 return ERROR(GENERIC
); /* should not happen : likely means source cannot be compressed */
194 if (((maxSymbolValue
+ 1) / 2) + 1 > maxDstSize
)
195 return ERROR(dstSize_tooSmall
); /* not enough space within dst buffer */
196 op
[0] = (BYTE
)(128 /*special case*/ + (maxSymbolValue
- 1));
197 huffWeight
[maxSymbolValue
] = 0; /* to be sure it doesn't cause msan issue in final combination */
198 for (n
= 0; n
< maxSymbolValue
; n
+= 2)
199 op
[(n
/ 2) + 1] = (BYTE
)((huffWeight
[n
] << 4) + huffWeight
[n
+ 1]);
200 return ((maxSymbolValue
+ 1) / 2) + 1;
203 size_t HUF_readCTable_wksp(HUF_CElt
*CTable
, U32 maxSymbolValue
, const void *src
, size_t srcSize
, void *workspace
, size_t workspaceSize
)
210 size_t spaceUsed32
= 0;
212 rankVal
= (U32
*)workspace
+ spaceUsed32
;
213 spaceUsed32
+= HUF_TABLELOG_ABSOLUTEMAX
+ 1;
214 huffWeight
= (BYTE
*)((U32
*)workspace
+ spaceUsed32
);
215 spaceUsed32
+= ALIGN(HUF_SYMBOLVALUE_MAX
+ 1, sizeof(U32
)) >> 2;
217 if ((spaceUsed32
<< 2) > workspaceSize
)
218 return ERROR(tableLog_tooLarge
);
219 workspace
= (U32
*)workspace
+ spaceUsed32
;
220 workspaceSize
-= (spaceUsed32
<< 2);
222 /* get symbol weights */
223 readSize
= HUF_readStats_wksp(huffWeight
, HUF_SYMBOLVALUE_MAX
+ 1, rankVal
, &nbSymbols
, &tableLog
, src
, srcSize
, workspace
, workspaceSize
);
224 if (ERR_isError(readSize
))
228 if (tableLog
> HUF_TABLELOG_MAX
)
229 return ERROR(tableLog_tooLarge
);
230 if (nbSymbols
> maxSymbolValue
+ 1)
231 return ERROR(maxSymbolValue_tooSmall
);
233 /* Prepare base value per rank */
235 U32 n
, nextRankStart
= 0;
236 for (n
= 1; n
<= tableLog
; n
++) {
237 U32 curr
= nextRankStart
;
238 nextRankStart
+= (rankVal
[n
] << (n
- 1));
246 for (n
= 0; n
< nbSymbols
; n
++) {
247 const U32 w
= huffWeight
[n
];
248 CTable
[n
].nbBits
= (BYTE
)(tableLog
+ 1 - w
);
254 U16 nbPerRank
[HUF_TABLELOG_MAX
+ 2] = {0}; /* support w=0=>n=tableLog+1 */
255 U16 valPerRank
[HUF_TABLELOG_MAX
+ 2] = {0};
258 for (n
= 0; n
< nbSymbols
; n
++)
259 nbPerRank
[CTable
[n
].nbBits
]++;
261 /* determine stating value per rank */
262 valPerRank
[tableLog
+ 1] = 0; /* for w==0 */
266 for (n
= tableLog
; n
> 0; n
--) { /* start at n=tablelog <-> w=1 */
267 valPerRank
[n
] = min
; /* get starting value within each rank */
272 /* assign value within rank, symbol order */
275 for (n
= 0; n
<= maxSymbolValue
; n
++)
276 CTable
[n
].val
= valPerRank
[CTable
[n
].nbBits
]++;
283 typedef struct nodeElt_s
{
290 static U32
HUF_setMaxHeight(nodeElt
*huffNode
, U32 lastNonNull
, U32 maxNbBits
)
292 const U32 largestBits
= huffNode
[lastNonNull
].nbBits
;
293 if (largestBits
<= maxNbBits
)
294 return largestBits
; /* early exit : no elt > maxNbBits */
296 /* there are several too large elements (at least >= 2) */
299 const U32 baseCost
= 1 << (largestBits
- maxNbBits
);
302 while (huffNode
[n
].nbBits
> maxNbBits
) {
303 totalCost
+= baseCost
- (1 << (largestBits
- huffNode
[n
].nbBits
));
304 huffNode
[n
].nbBits
= (BYTE
)maxNbBits
;
306 } /* n stops at huffNode[n].nbBits <= maxNbBits */
307 while (huffNode
[n
].nbBits
== maxNbBits
)
308 n
--; /* n end at index of smallest symbol using < maxNbBits */
310 /* renorm totalCost */
311 totalCost
>>= (largestBits
- maxNbBits
); /* note : totalCost is necessarily a multiple of baseCost */
313 /* repay normalized cost */
315 U32
const noSymbol
= 0xF0F0F0F0;
316 U32 rankLast
[HUF_TABLELOG_MAX
+ 2];
319 /* Get pos of last (smallest) symbol per rank */
320 memset(rankLast
, 0xF0, sizeof(rankLast
));
322 U32 currNbBits
= maxNbBits
;
323 for (pos
= n
; pos
>= 0; pos
--) {
324 if (huffNode
[pos
].nbBits
>= currNbBits
)
326 currNbBits
= huffNode
[pos
].nbBits
; /* < maxNbBits */
327 rankLast
[maxNbBits
- currNbBits
] = pos
;
331 while (totalCost
> 0) {
332 U32 nBitsToDecrease
= BIT_highbit32(totalCost
) + 1;
333 for (; nBitsToDecrease
> 1; nBitsToDecrease
--) {
334 U32 highPos
= rankLast
[nBitsToDecrease
];
335 U32 lowPos
= rankLast
[nBitsToDecrease
- 1];
336 if (highPos
== noSymbol
)
338 if (lowPos
== noSymbol
)
341 U32
const highTotal
= huffNode
[highPos
].count
;
342 U32
const lowTotal
= 2 * huffNode
[lowPos
].count
;
343 if (highTotal
<= lowTotal
)
347 /* only triggered when no more rank 1 symbol left => find closest one (note : there is necessarily at least one !) */
348 /* HUF_MAX_TABLELOG test just to please gcc 5+; but it should not be necessary */
349 while ((nBitsToDecrease
<= HUF_TABLELOG_MAX
) && (rankLast
[nBitsToDecrease
] == noSymbol
))
351 totalCost
-= 1 << (nBitsToDecrease
- 1);
352 if (rankLast
[nBitsToDecrease
- 1] == noSymbol
)
353 rankLast
[nBitsToDecrease
- 1] = rankLast
[nBitsToDecrease
]; /* this rank is no longer empty */
354 huffNode
[rankLast
[nBitsToDecrease
]].nbBits
++;
355 if (rankLast
[nBitsToDecrease
] == 0) /* special case, reached largest symbol */
356 rankLast
[nBitsToDecrease
] = noSymbol
;
358 rankLast
[nBitsToDecrease
]--;
359 if (huffNode
[rankLast
[nBitsToDecrease
]].nbBits
!= maxNbBits
- nBitsToDecrease
)
360 rankLast
[nBitsToDecrease
] = noSymbol
; /* this rank is now empty */
362 } /* while (totalCost > 0) */
364 while (totalCost
< 0) { /* Sometimes, cost correction overshoot */
365 if (rankLast
[1] == noSymbol
) { /* special case : no rank 1 symbol (using maxNbBits-1); let's create one from largest rank 0
367 while (huffNode
[n
].nbBits
== maxNbBits
)
369 huffNode
[n
+ 1].nbBits
--;
374 huffNode
[rankLast
[1] + 1].nbBits
--;
379 } /* there are several too large elements (at least >= 2) */
389 static void HUF_sort(nodeElt
*huffNode
, const U32
*count
, U32 maxSymbolValue
)
394 memset(rank
, 0, sizeof(rank
));
395 for (n
= 0; n
<= maxSymbolValue
; n
++) {
396 U32 r
= BIT_highbit32(count
[n
] + 1);
399 for (n
= 30; n
> 0; n
--)
400 rank
[n
- 1].base
+= rank
[n
].base
;
401 for (n
= 0; n
< 32; n
++)
402 rank
[n
].curr
= rank
[n
].base
;
403 for (n
= 0; n
<= maxSymbolValue
; n
++) {
404 U32
const c
= count
[n
];
405 U32
const r
= BIT_highbit32(c
+ 1) + 1;
406 U32 pos
= rank
[r
].curr
++;
407 while ((pos
> rank
[r
].base
) && (c
> huffNode
[pos
- 1].count
))
408 huffNode
[pos
] = huffNode
[pos
- 1], pos
--;
409 huffNode
[pos
].count
= c
;
410 huffNode
[pos
].byte
= (BYTE
)n
;
414 /** HUF_buildCTable_wksp() :
415 * Same as HUF_buildCTable(), but using externally allocated scratch buffer.
416 * `workSpace` must be aligned on 4-bytes boundaries, and be at least as large as a table of 1024 unsigned.
418 #define STARTNODE (HUF_SYMBOLVALUE_MAX + 1)
419 typedef nodeElt huffNodeTable
[2 * HUF_SYMBOLVALUE_MAX
+ 1 + 1];
420 size_t HUF_buildCTable_wksp(HUF_CElt
*tree
, const U32
*count
, U32 maxSymbolValue
, U32 maxNbBits
, void *workSpace
, size_t wkspSize
)
422 nodeElt
*const huffNode0
= (nodeElt
*)workSpace
;
423 nodeElt
*const huffNode
= huffNode0
+ 1;
426 U16 nodeNb
= STARTNODE
;
430 if (wkspSize
< sizeof(huffNodeTable
))
431 return ERROR(GENERIC
); /* workSpace is not large enough */
433 maxNbBits
= HUF_TABLELOG_DEFAULT
;
434 if (maxSymbolValue
> HUF_SYMBOLVALUE_MAX
)
435 return ERROR(GENERIC
);
436 memset(huffNode0
, 0, sizeof(huffNodeTable
));
438 /* sort, decreasing order */
439 HUF_sort(huffNode
, count
, maxSymbolValue
);
441 /* init for parents */
442 nonNullRank
= maxSymbolValue
;
443 while (huffNode
[nonNullRank
].count
== 0)
446 nodeRoot
= nodeNb
+ lowS
- 1;
448 huffNode
[nodeNb
].count
= huffNode
[lowS
].count
+ huffNode
[lowS
- 1].count
;
449 huffNode
[lowS
].parent
= huffNode
[lowS
- 1].parent
= nodeNb
;
452 for (n
= nodeNb
; n
<= nodeRoot
; n
++)
453 huffNode
[n
].count
= (U32
)(1U << 30);
454 huffNode0
[0].count
= (U32
)(1U << 31); /* fake entry, strong barrier */
457 while (nodeNb
<= nodeRoot
) {
458 U32 n1
= (huffNode
[lowS
].count
< huffNode
[lowN
].count
) ? lowS
-- : lowN
++;
459 U32 n2
= (huffNode
[lowS
].count
< huffNode
[lowN
].count
) ? lowS
-- : lowN
++;
460 huffNode
[nodeNb
].count
= huffNode
[n1
].count
+ huffNode
[n2
].count
;
461 huffNode
[n1
].parent
= huffNode
[n2
].parent
= nodeNb
;
465 /* distribute weights (unlimited tree height) */
466 huffNode
[nodeRoot
].nbBits
= 0;
467 for (n
= nodeRoot
- 1; n
>= STARTNODE
; n
--)
468 huffNode
[n
].nbBits
= huffNode
[huffNode
[n
].parent
].nbBits
+ 1;
469 for (n
= 0; n
<= nonNullRank
; n
++)
470 huffNode
[n
].nbBits
= huffNode
[huffNode
[n
].parent
].nbBits
+ 1;
472 /* enforce maxTableLog */
473 maxNbBits
= HUF_setMaxHeight(huffNode
, nonNullRank
, maxNbBits
);
475 /* fill result into tree (val, nbBits) */
477 U16 nbPerRank
[HUF_TABLELOG_MAX
+ 1] = {0};
478 U16 valPerRank
[HUF_TABLELOG_MAX
+ 1] = {0};
479 if (maxNbBits
> HUF_TABLELOG_MAX
)
480 return ERROR(GENERIC
); /* check fit into table */
481 for (n
= 0; n
<= nonNullRank
; n
++)
482 nbPerRank
[huffNode
[n
].nbBits
]++;
483 /* determine stating value per rank */
486 for (n
= maxNbBits
; n
> 0; n
--) {
487 valPerRank
[n
] = min
; /* get starting value within each rank */
492 for (n
= 0; n
<= maxSymbolValue
; n
++)
493 tree
[huffNode
[n
].byte
].nbBits
= huffNode
[n
].nbBits
; /* push nbBits per symbol, symbol order */
494 for (n
= 0; n
<= maxSymbolValue
; n
++)
495 tree
[n
].val
= valPerRank
[tree
[n
].nbBits
]++; /* assign value within rank, symbol order */
501 static size_t HUF_estimateCompressedSize(HUF_CElt
*CTable
, const unsigned *count
, unsigned maxSymbolValue
)
505 for (s
= 0; s
<= (int)maxSymbolValue
; ++s
) {
506 nbBits
+= CTable
[s
].nbBits
* count
[s
];
511 static int HUF_validateCTable(const HUF_CElt
*CTable
, const unsigned *count
, unsigned maxSymbolValue
)
515 for (s
= 0; s
<= (int)maxSymbolValue
; ++s
) {
516 bad
|= (count
[s
] != 0) & (CTable
[s
].nbBits
== 0);
521 static void HUF_encodeSymbol(BIT_CStream_t
*bitCPtr
, U32 symbol
, const HUF_CElt
*CTable
)
523 BIT_addBitsFast(bitCPtr
, CTable
[symbol
].val
, CTable
[symbol
].nbBits
);
526 size_t HUF_compressBound(size_t size
) { return HUF_COMPRESSBOUND(size
); }
528 #define HUF_FLUSHBITS(s) BIT_flushBits(s)
530 #define HUF_FLUSHBITS_1(stream) \
531 if (sizeof((stream)->bitContainer) * 8 < HUF_TABLELOG_MAX * 2 + 7) \
532 HUF_FLUSHBITS(stream)
534 #define HUF_FLUSHBITS_2(stream) \
535 if (sizeof((stream)->bitContainer) * 8 < HUF_TABLELOG_MAX * 4 + 7) \
536 HUF_FLUSHBITS(stream)
538 size_t HUF_compress1X_usingCTable(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, const HUF_CElt
*CTable
)
540 const BYTE
*ip
= (const BYTE
*)src
;
541 BYTE
*const ostart
= (BYTE
*)dst
;
542 BYTE
*const oend
= ostart
+ dstSize
;
549 return 0; /* not enough space to compress */
551 size_t const initErr
= BIT_initCStream(&bitC
, op
, oend
- op
);
552 if (HUF_isError(initErr
))
556 n
= srcSize
& ~3; /* join to mod 4 */
557 switch (srcSize
& 3) {
558 case 3: HUF_encodeSymbol(&bitC
, ip
[n
+ 2], CTable
); HUF_FLUSHBITS_2(&bitC
);
560 case 2: HUF_encodeSymbol(&bitC
, ip
[n
+ 1], CTable
); HUF_FLUSHBITS_1(&bitC
);
562 case 1: HUF_encodeSymbol(&bitC
, ip
[n
+ 0], CTable
); HUF_FLUSHBITS(&bitC
);
568 for (; n
> 0; n
-= 4) { /* note : n&3==0 at this stage */
569 HUF_encodeSymbol(&bitC
, ip
[n
- 1], CTable
);
570 HUF_FLUSHBITS_1(&bitC
);
571 HUF_encodeSymbol(&bitC
, ip
[n
- 2], CTable
);
572 HUF_FLUSHBITS_2(&bitC
);
573 HUF_encodeSymbol(&bitC
, ip
[n
- 3], CTable
);
574 HUF_FLUSHBITS_1(&bitC
);
575 HUF_encodeSymbol(&bitC
, ip
[n
- 4], CTable
);
576 HUF_FLUSHBITS(&bitC
);
579 return BIT_closeCStream(&bitC
);
582 size_t HUF_compress4X_usingCTable(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, const HUF_CElt
*CTable
)
584 size_t const segmentSize
= (srcSize
+ 3) / 4; /* first 3 segments */
585 const BYTE
*ip
= (const BYTE
*)src
;
586 const BYTE
*const iend
= ip
+ srcSize
;
587 BYTE
*const ostart
= (BYTE
*)dst
;
588 BYTE
*const oend
= ostart
+ dstSize
;
591 if (dstSize
< 6 + 1 + 1 + 1 + 8)
592 return 0; /* minimum space to compress successfully */
594 return 0; /* no saving possible : too small input */
595 op
+= 6; /* jumpTable */
598 CHECK_V_F(cSize
, HUF_compress1X_usingCTable(op
, oend
- op
, ip
, segmentSize
, CTable
));
601 ZSTD_writeLE16(ostart
, (U16
)cSize
);
607 CHECK_V_F(cSize
, HUF_compress1X_usingCTable(op
, oend
- op
, ip
, segmentSize
, CTable
));
610 ZSTD_writeLE16(ostart
+ 2, (U16
)cSize
);
616 CHECK_V_F(cSize
, HUF_compress1X_usingCTable(op
, oend
- op
, ip
, segmentSize
, CTable
));
619 ZSTD_writeLE16(ostart
+ 4, (U16
)cSize
);
625 CHECK_V_F(cSize
, HUF_compress1X_usingCTable(op
, oend
- op
, ip
, iend
- ip
, CTable
));
634 static size_t HUF_compressCTable_internal(BYTE
*const ostart
, BYTE
*op
, BYTE
*const oend
, const void *src
, size_t srcSize
, unsigned singleStream
,
635 const HUF_CElt
*CTable
)
638 singleStream
? HUF_compress1X_usingCTable(op
, oend
- op
, src
, srcSize
, CTable
) : HUF_compress4X_usingCTable(op
, oend
- op
, src
, srcSize
, CTable
);
639 if (HUF_isError(cSize
)) {
644 } /* uncompressible */
646 /* check compressibility */
647 if ((size_t)(op
- ostart
) >= srcSize
- 1) {
653 /* `workSpace` must a table of at least 1024 unsigned */
654 static size_t HUF_compress_internal(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, unsigned maxSymbolValue
, unsigned huffLog
,
655 unsigned singleStream
, void *workSpace
, size_t wkspSize
, HUF_CElt
*oldHufTable
, HUF_repeat
*repeat
, int preferRepeat
)
657 BYTE
*const ostart
= (BYTE
*)dst
;
658 BYTE
*const oend
= ostart
+ dstSize
;
662 size_t const countSize
= sizeof(U32
) * (HUF_SYMBOLVALUE_MAX
+ 1);
664 size_t const CTableSize
= sizeof(HUF_CElt
) * (HUF_SYMBOLVALUE_MAX
+ 1);
667 if (wkspSize
< sizeof(huffNodeTable
) + countSize
+ CTableSize
)
668 return ERROR(GENERIC
);
670 return 0; /* Uncompressed (note : 1 means rle, so first byte must be correct) */
672 return 0; /* cannot fit within dst budget */
673 if (srcSize
> HUF_BLOCKSIZE_MAX
)
674 return ERROR(srcSize_wrong
); /* curr block size limit */
675 if (huffLog
> HUF_TABLELOG_MAX
)
676 return ERROR(tableLog_tooLarge
);
678 maxSymbolValue
= HUF_SYMBOLVALUE_MAX
;
680 huffLog
= HUF_TABLELOG_DEFAULT
;
682 count
= (U32
*)workSpace
;
683 workSpace
= (BYTE
*)workSpace
+ countSize
;
684 wkspSize
-= countSize
;
685 CTable
= (HUF_CElt
*)workSpace
;
686 workSpace
= (BYTE
*)workSpace
+ CTableSize
;
687 wkspSize
-= CTableSize
;
689 /* Heuristic : If we don't need to check the validity of the old table use the old table for small inputs */
690 if (preferRepeat
&& repeat
&& *repeat
== HUF_repeat_valid
) {
691 return HUF_compressCTable_internal(ostart
, op
, oend
, src
, srcSize
, singleStream
, oldHufTable
);
694 /* Scan input and build symbol stats */
696 CHECK_V_F(largest
, FSE_count_wksp(count
, &maxSymbolValue
, (const BYTE
*)src
, srcSize
, (U32
*)workSpace
));
697 if (largest
== srcSize
) {
698 *ostart
= ((const BYTE
*)src
)[0];
700 } /* single symbol, rle */
701 if (largest
<= (srcSize
>> 7) + 1)
702 return 0; /* Fast heuristic : not compressible enough */
705 /* Check validity of previous table */
706 if (repeat
&& *repeat
== HUF_repeat_check
&& !HUF_validateCTable(oldHufTable
, count
, maxSymbolValue
)) {
707 *repeat
= HUF_repeat_none
;
709 /* Heuristic : use existing table for small inputs */
710 if (preferRepeat
&& repeat
&& *repeat
!= HUF_repeat_none
) {
711 return HUF_compressCTable_internal(ostart
, op
, oend
, src
, srcSize
, singleStream
, oldHufTable
);
714 /* Build Huffman Tree */
715 huffLog
= HUF_optimalTableLog(huffLog
, srcSize
, maxSymbolValue
);
717 CHECK_V_F(maxBits
, HUF_buildCTable_wksp(CTable
, count
, maxSymbolValue
, huffLog
, workSpace
, wkspSize
));
718 huffLog
= (U32
)maxBits
;
719 /* Zero the unused symbols so we can check it for validity */
720 memset(CTable
+ maxSymbolValue
+ 1, 0, CTableSize
- (maxSymbolValue
+ 1) * sizeof(HUF_CElt
));
723 /* Write table description header */
725 CHECK_V_F(hSize
, HUF_writeCTable_wksp(op
, dstSize
, CTable
, maxSymbolValue
, huffLog
, workSpace
, wkspSize
));
726 /* Check if using the previous table will be beneficial */
727 if (repeat
&& *repeat
!= HUF_repeat_none
) {
728 size_t const oldSize
= HUF_estimateCompressedSize(oldHufTable
, count
, maxSymbolValue
);
729 size_t const newSize
= HUF_estimateCompressedSize(CTable
, count
, maxSymbolValue
);
730 if (oldSize
<= hSize
+ newSize
|| hSize
+ 12 >= srcSize
) {
731 return HUF_compressCTable_internal(ostart
, op
, oend
, src
, srcSize
, singleStream
, oldHufTable
);
734 /* Use the new table */
735 if (hSize
+ 12ul >= srcSize
) {
740 *repeat
= HUF_repeat_none
;
743 memcpy(oldHufTable
, CTable
, CTableSize
);
744 } /* Save the new table */
746 return HUF_compressCTable_internal(ostart
, op
, oend
, src
, srcSize
, singleStream
, CTable
);
749 size_t HUF_compress1X_wksp(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, unsigned maxSymbolValue
, unsigned huffLog
, void *workSpace
,
752 return HUF_compress_internal(dst
, dstSize
, src
, srcSize
, maxSymbolValue
, huffLog
, 1 /* single stream */, workSpace
, wkspSize
, NULL
, NULL
, 0);
755 size_t HUF_compress1X_repeat(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, unsigned maxSymbolValue
, unsigned huffLog
, void *workSpace
,
756 size_t wkspSize
, HUF_CElt
*hufTable
, HUF_repeat
*repeat
, int preferRepeat
)
758 return HUF_compress_internal(dst
, dstSize
, src
, srcSize
, maxSymbolValue
, huffLog
, 1 /* single stream */, workSpace
, wkspSize
, hufTable
, repeat
,
762 size_t HUF_compress4X_wksp(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, unsigned maxSymbolValue
, unsigned huffLog
, void *workSpace
,
765 return HUF_compress_internal(dst
, dstSize
, src
, srcSize
, maxSymbolValue
, huffLog
, 0 /* 4 streams */, workSpace
, wkspSize
, NULL
, NULL
, 0);
768 size_t HUF_compress4X_repeat(void *dst
, size_t dstSize
, const void *src
, size_t srcSize
, unsigned maxSymbolValue
, unsigned huffLog
, void *workSpace
,
769 size_t wkspSize
, HUF_CElt
*hufTable
, HUF_repeat
*repeat
, int preferRepeat
)
771 return HUF_compress_internal(dst
, dstSize
, src
, srcSize
, maxSymbolValue
, huffLog
, 0 /* 4 streams */, workSpace
, wkspSize
, hufTable
, repeat
,