Coverage Report

Created: 2026-01-10 07:04

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/zstd/lib/legacy/zstd_v02.c
Line
Count
Source
1
/*
2
 * Copyright (c) Yann Collet, Meta Platforms, Inc. and affiliates.
3
 * All rights reserved.
4
 *
5
 * This source code is licensed under both the BSD-style license (found in the
6
 * LICENSE file in the root directory of this source tree) and the GPLv2 (found
7
 * in the COPYING file in the root directory of this source tree).
8
 * You may select, at your option, one of the above-listed licenses.
9
 */
10
11
12
#include <stddef.h>    /* size_t, ptrdiff_t */
13
#include "zstd_v02.h"
14
#include "../common/compiler.h"
15
#include "../common/error_private.h"
16
17
18
/******************************************
19
*  Compiler-specific
20
******************************************/
21
#if defined(_MSC_VER)   /* Visual Studio */
22
#   include <stdlib.h>  /* _byteswap_ulong */
23
#   include <intrin.h>  /* _byteswap_* */
24
#endif
25
26
27
/* ******************************************************************
28
   mem.h
29
   low-level memory access routines
30
   Copyright (C) 2013-2015, Yann Collet.
31
32
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
33
34
   Redistribution and use in source and binary forms, with or without
35
   modification, are permitted provided that the following conditions are
36
   met:
37
38
       * Redistributions of source code must retain the above copyright
39
   notice, this list of conditions and the following disclaimer.
40
       * Redistributions in binary form must reproduce the above
41
   copyright notice, this list of conditions and the following disclaimer
42
   in the documentation and/or other materials provided with the
43
   distribution.
44
45
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
46
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
47
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
48
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
49
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
50
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
51
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
52
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
53
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
54
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
55
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
56
57
    You can contact the author at :
58
    - FSE source repository : https://github.com/Cyan4973/FiniteStateEntropy
59
    - Public forum : https://groups.google.com/forum/#!forum/lz4c
60
****************************************************************** */
61
#ifndef MEM_H_MODULE
62
#define MEM_H_MODULE
63
64
#if defined (__cplusplus)
65
extern "C" {
66
#endif
67
68
/******************************************
69
*  Includes
70
******************************************/
71
#include <stddef.h>    /* size_t, ptrdiff_t */
72
#include <string.h>    /* memcpy */
73
74
75
/****************************************************************
76
*  Basic Types
77
*****************************************************************/
78
#if defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
79
# if defined(_AIX)
80
#  include <inttypes.h>
81
# else
82
#  include <stdint.h> /* intptr_t */
83
# endif
84
  typedef  uint8_t BYTE;
85
  typedef uint16_t U16;
86
  typedef  int16_t S16;
87
  typedef uint32_t U32;
88
  typedef  int32_t S32;
89
  typedef uint64_t U64;
90
  typedef  int64_t S64;
91
#else
92
  typedef unsigned char       BYTE;
93
  typedef unsigned short      U16;
94
  typedef   signed short      S16;
95
  typedef unsigned int        U32;
96
  typedef   signed int        S32;
97
  typedef unsigned long long  U64;
98
  typedef   signed long long  S64;
99
#endif
100
101
102
/****************************************************************
103
*  Memory I/O
104
*****************************************************************/
105
106
535k
MEM_STATIC unsigned MEM_32bits(void) { return sizeof(void*)==4; }
107
1.38M
MEM_STATIC unsigned MEM_64bits(void) { return sizeof(void*)==8; }
108
109
MEM_STATIC unsigned MEM_isLittleEndian(void)
110
676k
{
111
676k
    const union { U32 u; BYTE c[4]; } one = { 1 };   /* don't use static : performance detrimental  */
112
676k
    return one.c[0];
113
676k
}
114
115
MEM_STATIC U16 MEM_read16(const void* memPtr)
116
9.51k
{
117
9.51k
    U16 val; memcpy(&val, memPtr, sizeof(val)); return val;
118
9.51k
}
119
120
MEM_STATIC U32 MEM_read32(const void* memPtr)
121
102k
{
122
102k
    U32 val; memcpy(&val, memPtr, sizeof(val)); return val;
123
102k
}
124
125
MEM_STATIC U64 MEM_read64(const void* memPtr)
126
489k
{
127
489k
    U64 val; memcpy(&val, memPtr, sizeof(val)); return val;
128
489k
}
129
130
MEM_STATIC void MEM_write16(void* memPtr, U16 value)
131
75.3k
{
132
75.3k
    memcpy(memPtr, &value, sizeof(value));
133
75.3k
}
134
135
MEM_STATIC U16 MEM_readLE16(const void* memPtr)
136
9.51k
{
137
9.51k
    if (MEM_isLittleEndian())
138
9.51k
        return MEM_read16(memPtr);
139
0
    else
140
0
    {
141
0
        const BYTE* p = (const BYTE*)memPtr;
142
0
        return (U16)(p[0] + (p[1]<<8));
143
0
    }
144
9.51k
}
145
146
MEM_STATIC void MEM_writeLE16(void* memPtr, U16 val)
147
75.3k
{
148
75.3k
    if (MEM_isLittleEndian())
149
75.3k
    {
150
75.3k
        MEM_write16(memPtr, val);
151
75.3k
    }
152
0
    else
153
0
    {
154
0
        BYTE* p = (BYTE*)memPtr;
155
0
        p[0] = (BYTE)val;
156
0
        p[1] = (BYTE)(val>>8);
157
0
    }
158
75.3k
}
159
160
MEM_STATIC U32 MEM_readLE24(const void* memPtr)
161
259
{
162
259
    return MEM_readLE16(memPtr) + (((const BYTE*)memPtr)[2] << 16);
163
259
}
164
165
MEM_STATIC U32 MEM_readLE32(const void* memPtr)
166
102k
{
167
102k
    if (MEM_isLittleEndian())
168
102k
        return MEM_read32(memPtr);
169
0
    else
170
0
    {
171
0
        const BYTE* p = (const BYTE*)memPtr;
172
0
        return (U32)((U32)p[0] + ((U32)p[1]<<8) + ((U32)p[2]<<16) + ((U32)p[3]<<24));
173
0
    }
174
102k
}
175
176
177
MEM_STATIC U64 MEM_readLE64(const void* memPtr)
178
489k
{
179
489k
    if (MEM_isLittleEndian())
180
489k
        return MEM_read64(memPtr);
181
0
    else
182
0
    {
183
0
        const BYTE* p = (const BYTE*)memPtr;
184
0
        return (U64)((U64)p[0] + ((U64)p[1]<<8) + ((U64)p[2]<<16) + ((U64)p[3]<<24)
185
0
                     + ((U64)p[4]<<32) + ((U64)p[5]<<40) + ((U64)p[6]<<48) + ((U64)p[7]<<56));
186
0
    }
187
489k
}
188
189
190
MEM_STATIC size_t MEM_readLEST(const void* memPtr)
191
489k
{
192
489k
    if (MEM_32bits())
193
0
        return (size_t)MEM_readLE32(memPtr);
194
489k
    else
195
489k
        return (size_t)MEM_readLE64(memPtr);
196
489k
}
197
198
#if defined (__cplusplus)
199
}
200
#endif
201
202
#endif /* MEM_H_MODULE */
203
204
205
/* ******************************************************************
206
   bitstream
207
   Part of NewGen Entropy library
208
   header file (to include)
209
   Copyright (C) 2013-2015, Yann Collet.
210
211
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
212
213
   Redistribution and use in source and binary forms, with or without
214
   modification, are permitted provided that the following conditions are
215
   met:
216
217
       * Redistributions of source code must retain the above copyright
218
   notice, this list of conditions and the following disclaimer.
219
       * Redistributions in binary form must reproduce the above
220
   copyright notice, this list of conditions and the following disclaimer
221
   in the documentation and/or other materials provided with the
222
   distribution.
223
224
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
225
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
226
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
227
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
228
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
229
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
230
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
231
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
232
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
233
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
234
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
235
236
   You can contact the author at :
237
   - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
238
   - Public forum : https://groups.google.com/forum/#!forum/lz4c
239
****************************************************************** */
240
#ifndef BITSTREAM_H_MODULE
241
#define BITSTREAM_H_MODULE
242
243
#if defined (__cplusplus)
244
extern "C" {
245
#endif
246
247
248
/*
249
*  This API consists of small unitary functions, which highly benefit from being inlined.
250
*  Since link-time-optimization is not available for all compilers,
251
*  these functions are defined into a .h to be included.
252
*/
253
254
255
/**********************************************
256
*  bitStream decompression API (read backward)
257
**********************************************/
258
typedef struct
259
{
260
    size_t   bitContainer;
261
    unsigned bitsConsumed;
262
    const char* ptr;
263
    const char* start;
264
} BIT_DStream_t;
265
266
typedef enum { BIT_DStream_unfinished = 0,
267
               BIT_DStream_endOfBuffer = 1,
268
               BIT_DStream_completed = 2,
269
               BIT_DStream_overflow = 3 } BIT_DStream_status;  /* result of BIT_reloadDStream() */
270
               /* 1,2,4,8 would be better for bitmap combinations, but slows down performance a bit ... :( */
271
272
MEM_STATIC size_t   BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize);
273
MEM_STATIC size_t   BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits);
274
MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD);
275
MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* bitD);
276
277
278
/******************************************
279
*  unsafe API
280
******************************************/
281
MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits);
282
/* faster, but works only if nbBits >= 1 */
283
284
285
286
/****************************************************************
287
*  Helper functions
288
****************************************************************/
289
MEM_STATIC unsigned BIT_highbit32 (U32 val)
290
502k
{
291
#   if defined(_MSC_VER)   /* Visual */
292
    unsigned long r;
293
    return _BitScanReverse(&r, val) ? (unsigned)r : 0;
294
#   elif defined(__GNUC__) && (__GNUC__ >= 3)   /* Use GCC Intrinsic */
295
    return __builtin_clz (val) ^ 31;
296
#   else   /* Software version */
297
    static const unsigned DeBruijnClz[32] = { 0, 9, 1, 10, 13, 21, 2, 29, 11, 14, 16, 18, 22, 25, 3, 30, 8, 12, 20, 28, 15, 17, 24, 7, 19, 27, 23, 6, 26, 5, 4, 31 };
298
    U32 v = val;
299
    unsigned r;
300
    v |= v >> 1;
301
    v |= v >> 2;
302
    v |= v >> 4;
303
    v |= v >> 8;
304
    v |= v >> 16;
305
    r = DeBruijnClz[ (U32) (v * 0x07C4ACDDU) >> 27];
306
    return r;
307
#   endif
308
502k
}
309
310
311
312
/**********************************************************
313
* bitStream decoding
314
**********************************************************/
315
316
/*!BIT_initDStream
317
*  Initialize a BIT_DStream_t.
318
*  @bitD : a pointer to an already allocated BIT_DStream_t structure
319
*  @srcBuffer must point at the beginning of a bitStream
320
*  @srcSize must be the exact size of the bitStream
321
*  @result : size of stream (== srcSize) or an errorCode if a problem is detected
322
*/
323
MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize)
324
9.83k
{
325
9.83k
    if (srcSize < 1) { memset(bitD, 0, sizeof(*bitD)); return ERROR(srcSize_wrong); }
326
327
9.78k
    if (srcSize >=  sizeof(size_t))   /* normal case */
328
1.82k
    {
329
1.82k
        U32 contain32;
330
1.82k
        bitD->start = (const char*)srcBuffer;
331
1.82k
        bitD->ptr   = (const char*)srcBuffer + srcSize - sizeof(size_t);
332
1.82k
        bitD->bitContainer = MEM_readLEST(bitD->ptr);
333
1.82k
        contain32 = ((const BYTE*)srcBuffer)[srcSize-1];
334
1.82k
        if (contain32 == 0) return ERROR(GENERIC);   /* endMark not present */
335
1.76k
        bitD->bitsConsumed = 8 - BIT_highbit32(contain32);
336
1.76k
    }
337
7.96k
    else
338
7.96k
    {
339
7.96k
        U32 contain32;
340
7.96k
        bitD->start = (const char*)srcBuffer;
341
7.96k
        bitD->ptr   = bitD->start;
342
7.96k
        bitD->bitContainer = *(const BYTE*)(bitD->start);
343
7.96k
        switch(srcSize)
344
7.96k
        {
345
48
            case 7: bitD->bitContainer += (size_t)(((const BYTE*)(bitD->start))[6]) << (sizeof(size_t)*8 - 16);
346
                    /* fallthrough */
347
292
            case 6: bitD->bitContainer += (size_t)(((const BYTE*)(bitD->start))[5]) << (sizeof(size_t)*8 - 24);
348
                    /* fallthrough */
349
514
            case 5: bitD->bitContainer += (size_t)(((const BYTE*)(bitD->start))[4]) << (sizeof(size_t)*8 - 32);
350
                    /* fallthrough */
351
1.29k
            case 4: bitD->bitContainer += (size_t)(((const BYTE*)(bitD->start))[3]) << 24;
352
                    /* fallthrough */
353
3.87k
            case 3: bitD->bitContainer += (size_t)(((const BYTE*)(bitD->start))[2]) << 16;
354
                    /* fallthrough */
355
5.20k
            case 2: bitD->bitContainer += (size_t)(((const BYTE*)(bitD->start))[1]) <<  8;
356
                    /* fallthrough */
357
7.96k
            default:;
358
7.96k
        }
359
7.96k
        contain32 = ((const BYTE*)srcBuffer)[srcSize-1];
360
7.96k
        if (contain32 == 0) return ERROR(GENERIC);   /* endMark not present */
361
7.91k
        bitD->bitsConsumed = 8 - BIT_highbit32(contain32);
362
7.91k
        bitD->bitsConsumed += (U32)(sizeof(size_t) - srcSize)*8;
363
7.91k
    }
364
365
9.67k
    return srcSize;
366
9.78k
}
367
368
MEM_STATIC size_t BIT_lookBits(BIT_DStream_t* bitD, U32 nbBits)
369
136k
{
370
136k
    const U32 bitMask = sizeof(bitD->bitContainer)*8 - 1;
371
136k
    return ((bitD->bitContainer << (bitD->bitsConsumed & bitMask)) >> 1) >> ((bitMask-nbBits) & bitMask);
372
136k
}
373
374
/*! BIT_lookBitsFast :
375
*   unsafe version; only works if nbBits >= 1 */
376
MEM_STATIC size_t BIT_lookBitsFast(BIT_DStream_t* bitD, U32 nbBits)
377
9.57M
{
378
9.57M
    const U32 bitMask = sizeof(bitD->bitContainer)*8 - 1;
379
9.57M
    return (bitD->bitContainer << (bitD->bitsConsumed & bitMask)) >> (((bitMask+1)-nbBits) & bitMask);
380
9.57M
}
381
382
MEM_STATIC void BIT_skipBits(BIT_DStream_t* bitD, U32 nbBits)
383
9.70M
{
384
9.70M
    bitD->bitsConsumed += nbBits;
385
9.70M
}
386
387
MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, U32 nbBits)
388
136k
{
389
136k
    size_t value = BIT_lookBits(bitD, nbBits);
390
136k
    BIT_skipBits(bitD, nbBits);
391
136k
    return value;
392
136k
}
393
394
/*!BIT_readBitsFast :
395
*  unsafe version; only works if nbBits >= 1 */
396
MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, U32 nbBits)
397
4.03k
{
398
4.03k
    size_t value = BIT_lookBitsFast(bitD, nbBits);
399
4.03k
    BIT_skipBits(bitD, nbBits);
400
4.03k
    return value;
401
4.03k
}
402
403
MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD)
404
535k
{
405
535k
    if (bitD->bitsConsumed > (sizeof(bitD->bitContainer)*8))  /* should never happen */
406
129
        return BIT_DStream_overflow;
407
408
535k
    if (bitD->ptr >= bitD->start + sizeof(bitD->bitContainer))
409
480k
    {
410
480k
        bitD->ptr -= bitD->bitsConsumed >> 3;
411
480k
        bitD->bitsConsumed &= 7;
412
480k
        bitD->bitContainer = MEM_readLEST(bitD->ptr);
413
480k
        return BIT_DStream_unfinished;
414
480k
    }
415
55.3k
    if (bitD->ptr == bitD->start)
416
47.6k
    {
417
47.6k
        if (bitD->bitsConsumed < sizeof(bitD->bitContainer)*8) return BIT_DStream_endOfBuffer;
418
12.9k
        return BIT_DStream_completed;
419
47.6k
    }
420
7.64k
    {
421
7.64k
        U32 nbBytes = bitD->bitsConsumed >> 3;
422
7.64k
        BIT_DStream_status result = BIT_DStream_unfinished;
423
7.64k
        if (bitD->ptr - nbBytes < bitD->start)
424
743
        {
425
743
            nbBytes = (U32)(bitD->ptr - bitD->start);  /* ptr > start */
426
743
            result = BIT_DStream_endOfBuffer;
427
743
        }
428
7.64k
        bitD->ptr -= nbBytes;
429
7.64k
        bitD->bitsConsumed -= nbBytes*8;
430
7.64k
        bitD->bitContainer = MEM_readLEST(bitD->ptr);   /* reminder : srcSize > sizeof(bitD) */
431
7.64k
        return result;
432
55.3k
    }
433
55.3k
}
434
435
/*! BIT_endOfDStream
436
*   @return Tells if DStream has reached its exact end
437
*/
438
MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* DStream)
439
20.5k
{
440
20.5k
    return ((DStream->ptr == DStream->start) && (DStream->bitsConsumed == sizeof(DStream->bitContainer)*8));
441
20.5k
}
442
443
#if defined (__cplusplus)
444
}
445
#endif
446
447
#endif /* BITSTREAM_H_MODULE */
448
/* ******************************************************************
449
   Error codes and messages
450
   Copyright (C) 2013-2015, Yann Collet
451
452
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
453
454
   Redistribution and use in source and binary forms, with or without
455
   modification, are permitted provided that the following conditions are
456
   met:
457
458
       * Redistributions of source code must retain the above copyright
459
   notice, this list of conditions and the following disclaimer.
460
       * Redistributions in binary form must reproduce the above
461
   copyright notice, this list of conditions and the following disclaimer
462
   in the documentation and/or other materials provided with the
463
   distribution.
464
465
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
466
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
467
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
468
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
469
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
470
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
471
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
472
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
473
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
474
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
475
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
476
477
   You can contact the author at :
478
   - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
479
   - Public forum : https://groups.google.com/forum/#!forum/lz4c
480
****************************************************************** */
481
#ifndef ERROR_H_MODULE
482
#define ERROR_H_MODULE
483
484
#if defined (__cplusplus)
485
extern "C" {
486
#endif
487
488
489
/******************************************
490
*  Compiler-specific
491
******************************************/
492
#if defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
493
#  define ERR_STATIC static inline
494
#elif defined(_MSC_VER)
495
#  define ERR_STATIC static __inline
496
#elif defined(__GNUC__)
497
#  define ERR_STATIC static __attribute__((unused))
498
#else
499
#  define ERR_STATIC static  /* this version may generate warnings for unused static functions; disable the relevant warning */
500
#endif
501
502
503
/******************************************
504
*  Error Management
505
******************************************/
506
#define PREFIX(name) ZSTD_error_##name
507
508
#define ERROR(name) (size_t)-PREFIX(name)
509
510
#define ERROR_LIST(ITEM) \
511
        ITEM(PREFIX(No_Error)) ITEM(PREFIX(GENERIC)) \
512
        ITEM(PREFIX(dstSize_tooSmall)) ITEM(PREFIX(srcSize_wrong)) \
513
        ITEM(PREFIX(prefix_unknown)) ITEM(PREFIX(corruption_detected)) \
514
        ITEM(PREFIX(tableLog_tooLarge)) ITEM(PREFIX(maxSymbolValue_tooLarge)) ITEM(PREFIX(maxSymbolValue_tooSmall)) \
515
        ITEM(PREFIX(maxCode))
516
517
#define ERROR_GENERATE_ENUM(ENUM) ENUM,
518
typedef enum { ERROR_LIST(ERROR_GENERATE_ENUM) } ERR_codes;  /* enum is exposed, to detect & handle specific errors; compare function result to -enum value */
519
520
#define ERROR_CONVERTTOSTRING(STRING) #STRING,
521
#define ERROR_GENERATE_STRING(EXPR) ERROR_CONVERTTOSTRING(EXPR)
522
static const char* ERR_strings[] = { ERROR_LIST(ERROR_GENERATE_STRING) };
523
524
ERR_STATIC unsigned ERR_isError(size_t code) { return (code > ERROR(maxCode)); }
525
526
ERR_STATIC const char* ERR_getErrorName(size_t code)
527
{
528
    static const char* codeError = "Unspecified error code";
529
    if (ERR_isError(code)) return ERR_strings[-(int)(code)];
530
    return codeError;
531
}
532
533
534
#if defined (__cplusplus)
535
}
536
#endif
537
538
#endif /* ERROR_H_MODULE */
539
/*
540
Constructor and Destructor of type FSE_CTable
541
    Note that its size depends on 'tableLog' and 'maxSymbolValue' */
542
typedef unsigned FSE_CTable;   /* don't allocate that. It's just a way to be more restrictive than void* */
543
typedef unsigned FSE_DTable;   /* don't allocate that. It's just a way to be more restrictive than void* */
544
545
546
/* ******************************************************************
547
   FSE : Finite State Entropy coder
548
   header file for static linking (only)
549
   Copyright (C) 2013-2015, Yann Collet
550
551
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
552
553
   Redistribution and use in source and binary forms, with or without
554
   modification, are permitted provided that the following conditions are
555
   met:
556
557
       * Redistributions of source code must retain the above copyright
558
   notice, this list of conditions and the following disclaimer.
559
       * Redistributions in binary form must reproduce the above
560
   copyright notice, this list of conditions and the following disclaimer
561
   in the documentation and/or other materials provided with the
562
   distribution.
563
564
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
565
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
566
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
567
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
568
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
569
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
570
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
571
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
572
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
573
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
574
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
575
576
   You can contact the author at :
577
   - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
578
   - Public forum : https://groups.google.com/forum/#!forum/lz4c
579
****************************************************************** */
580
#if defined (__cplusplus)
581
extern "C" {
582
#endif
583
584
585
/******************************************
586
*  Static allocation
587
******************************************/
588
/* FSE buffer bounds */
589
#define FSE_NCOUNTBOUND 512
590
#define FSE_BLOCKBOUND(size) (size + (size>>7))
591
#define FSE_COMPRESSBOUND(size) (FSE_NCOUNTBOUND + FSE_BLOCKBOUND(size))   /* Macro version, useful for static allocation */
592
593
/* You can statically allocate FSE CTable/DTable as a table of unsigned using below macro */
594
#define FSE_CTABLE_SIZE_U32(maxTableLog, maxSymbolValue)   (1 + (1<<(maxTableLog-1)) + ((maxSymbolValue+1)*2))
595
#define FSE_DTABLE_SIZE_U32(maxTableLog)                   (1 + (1<<maxTableLog))
596
597
598
/******************************************
599
*  FSE advanced API
600
******************************************/
601
static size_t FSE_buildDTable_raw (FSE_DTable* dt, unsigned nbBits);
602
/* build a fake FSE_DTable, designed to read an uncompressed bitstream where each symbol uses nbBits */
603
604
static size_t FSE_buildDTable_rle (FSE_DTable* dt, unsigned char symbolValue);
605
/* build a fake FSE_DTable, designed to always generate the same symbolValue */
606
607
608
/******************************************
609
*  FSE symbol decompression API
610
******************************************/
611
typedef struct
612
{
613
    size_t      state;
614
    const void* table;   /* precise table may vary, depending on U16 */
615
} FSE_DState_t;
616
617
618
static void     FSE_initDState(FSE_DState_t* DStatePtr, BIT_DStream_t* bitD, const FSE_DTable* dt);
619
620
static unsigned char FSE_decodeSymbol(FSE_DState_t* DStatePtr, BIT_DStream_t* bitD);
621
622
static unsigned FSE_endOfDState(const FSE_DState_t* DStatePtr);
623
624
625
/******************************************
626
*  FSE unsafe API
627
******************************************/
628
static unsigned char FSE_decodeSymbolFast(FSE_DState_t* DStatePtr, BIT_DStream_t* bitD);
629
/* faster, but works only if nbBits is always >= 1 (otherwise, result will be corrupted) */
630
631
632
/******************************************
633
*  Implementation of inline functions
634
******************************************/
635
636
/* decompression */
637
638
typedef struct {
639
    U16 tableLog;
640
    U16 fastMode;
641
} FSE_DTableHeader;   /* sizeof U32 */
642
643
typedef struct
644
{
645
    unsigned short newState;
646
    unsigned char  symbol;
647
    unsigned char  nbBits;
648
} FSE_decode_t;   /* size == U32 */
649
650
MEM_STATIC void FSE_initDState(FSE_DState_t* DStatePtr, BIT_DStream_t* bitD, const FSE_DTable* dt)
651
19.8k
{
652
19.8k
    FSE_DTableHeader DTableH;
653
19.8k
    memcpy(&DTableH, dt, sizeof(DTableH));
654
19.8k
    DStatePtr->state = BIT_readBits(bitD, DTableH.tableLog);
655
19.8k
    BIT_reloadDStream(bitD);
656
19.8k
    DStatePtr->table = dt + 1;
657
19.8k
}
658
659
MEM_STATIC BYTE FSE_decodeSymbol(FSE_DState_t* DStatePtr, BIT_DStream_t* bitD)
660
93.1k
{
661
93.1k
    const FSE_decode_t DInfo = ((const FSE_decode_t*)(DStatePtr->table))[DStatePtr->state];
662
93.1k
    const U32  nbBits = DInfo.nbBits;
663
93.1k
    BYTE symbol = DInfo.symbol;
664
93.1k
    size_t lowBits = BIT_readBits(bitD, nbBits);
665
666
93.1k
    DStatePtr->state = DInfo.newState + lowBits;
667
93.1k
    return symbol;
668
93.1k
}
669
670
MEM_STATIC BYTE FSE_decodeSymbolFast(FSE_DState_t* DStatePtr, BIT_DStream_t* bitD)
671
4.03k
{
672
4.03k
    const FSE_decode_t DInfo = ((const FSE_decode_t*)(DStatePtr->table))[DStatePtr->state];
673
4.03k
    const U32 nbBits = DInfo.nbBits;
674
4.03k
    BYTE symbol = DInfo.symbol;
675
4.03k
    size_t lowBits = BIT_readBitsFast(bitD, nbBits);
676
677
4.03k
    DStatePtr->state = DInfo.newState + lowBits;
678
4.03k
    return symbol;
679
4.03k
}
680
681
MEM_STATIC unsigned FSE_endOfDState(const FSE_DState_t* DStatePtr)
682
1.82k
{
683
1.82k
    return DStatePtr->state == 0;
684
1.82k
}
685
686
687
#if defined (__cplusplus)
688
}
689
#endif
690
/* ******************************************************************
691
   Huff0 : Huffman coder, part of New Generation Entropy library
692
   header file for static linking (only)
693
   Copyright (C) 2013-2015, Yann Collet
694
695
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
696
697
   Redistribution and use in source and binary forms, with or without
698
   modification, are permitted provided that the following conditions are
699
   met:
700
701
       * Redistributions of source code must retain the above copyright
702
   notice, this list of conditions and the following disclaimer.
703
       * Redistributions in binary form must reproduce the above
704
   copyright notice, this list of conditions and the following disclaimer
705
   in the documentation and/or other materials provided with the
706
   distribution.
707
708
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
709
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
710
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
711
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
712
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
713
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
714
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
715
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
716
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
717
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
718
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
719
720
   You can contact the author at :
721
   - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
722
   - Public forum : https://groups.google.com/forum/#!forum/lz4c
723
****************************************************************** */
724
725
#if defined (__cplusplus)
726
extern "C" {
727
#endif
728
729
/******************************************
730
*  Static allocation macros
731
******************************************/
732
/* Huff0 buffer bounds */
733
#define HUF_CTABLEBOUND 129
734
#define HUF_BLOCKBOUND(size) (size + (size>>8) + 8)   /* only true if incompressible pre-filtered with fast heuristic */
735
#define HUF_COMPRESSBOUND(size) (HUF_CTABLEBOUND + HUF_BLOCKBOUND(size))   /* Macro version, useful for static allocation */
736
737
/* static allocation of Huff0's DTable */
738
#define HUF_DTABLE_SIZE(maxTableLog)   (1 + (1<<maxTableLog))  /* nb Cells; use unsigned short for X2, unsigned int for X4 */
739
#define HUF_CREATE_STATIC_DTABLEX2(DTable, maxTableLog) \
740
800
        unsigned short DTable[HUF_DTABLE_SIZE(maxTableLog)] = { maxTableLog }
741
#define HUF_CREATE_STATIC_DTABLEX4(DTable, maxTableLog) \
742
156
        unsigned int DTable[HUF_DTABLE_SIZE(maxTableLog)] = { maxTableLog }
743
#define HUF_CREATE_STATIC_DTABLEX6(DTable, maxTableLog) \
744
151
        unsigned int DTable[HUF_DTABLE_SIZE(maxTableLog) * 3 / 2] = { maxTableLog }
745
746
747
/******************************************
748
*  Advanced functions
749
******************************************/
750
static size_t HUF_decompress4X2 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize);   /* single-symbol decoder */
751
static size_t HUF_decompress4X4 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize);   /* double-symbols decoder */
752
static size_t HUF_decompress4X6 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize);   /* quad-symbols decoder */
753
754
755
#if defined (__cplusplus)
756
}
757
#endif
758
759
/*
760
    zstd - standard compression library
761
    Header File
762
    Copyright (C) 2014-2015, Yann Collet.
763
764
    BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
765
766
    Redistribution and use in source and binary forms, with or without
767
    modification, are permitted provided that the following conditions are
768
    met:
769
    * Redistributions of source code must retain the above copyright
770
    notice, this list of conditions and the following disclaimer.
771
    * Redistributions in binary form must reproduce the above
772
    copyright notice, this list of conditions and the following disclaimer
773
    in the documentation and/or other materials provided with the
774
    distribution.
775
    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
776
    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
777
    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
778
    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
779
    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
780
    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
781
    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
782
    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
783
    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
784
    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
785
    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
786
787
    You can contact the author at :
788
    - zstd source repository : https://github.com/Cyan4973/zstd
789
    - ztsd public forum : https://groups.google.com/forum/#!forum/lz4c
790
*/
791
792
#if defined (__cplusplus)
793
extern "C" {
794
#endif
795
796
/* *************************************
797
*  Includes
798
***************************************/
799
#include <stddef.h>   /* size_t */
800
801
802
/* *************************************
803
*  Version
804
***************************************/
805
#define ZSTD_VERSION_MAJOR    0    /* for breaking interface changes  */
806
#define ZSTD_VERSION_MINOR    2    /* for new (non-breaking) interface capabilities */
807
#define ZSTD_VERSION_RELEASE  2    /* for tweaks, bug-fixes, or development */
808
#define ZSTD_VERSION_NUMBER  (ZSTD_VERSION_MAJOR *100*100 + ZSTD_VERSION_MINOR *100 + ZSTD_VERSION_RELEASE)
809
810
811
/* *************************************
812
*  Advanced functions
813
***************************************/
814
typedef struct ZSTD_CCtx_s ZSTD_CCtx;   /* incomplete type */
815
816
#if defined (__cplusplus)
817
}
818
#endif
819
/*
820
    zstd - standard compression library
821
    Header File for static linking only
822
    Copyright (C) 2014-2015, Yann Collet.
823
824
    BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
825
826
    Redistribution and use in source and binary forms, with or without
827
    modification, are permitted provided that the following conditions are
828
    met:
829
    * Redistributions of source code must retain the above copyright
830
    notice, this list of conditions and the following disclaimer.
831
    * Redistributions in binary form must reproduce the above
832
    copyright notice, this list of conditions and the following disclaimer
833
    in the documentation and/or other materials provided with the
834
    distribution.
835
    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
836
    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
837
    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
838
    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
839
    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
840
    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
841
    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
842
    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
843
    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
844
    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
845
    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
846
847
    You can contact the author at :
848
    - zstd source repository : https://github.com/Cyan4973/zstd
849
    - ztsd public forum : https://groups.google.com/forum/#!forum/lz4c
850
*/
851
852
/* The objects defined into this file should be considered experimental.
853
 * They are not labelled stable, as their prototype may change in the future.
854
 * You can use them for tests, provide feedback, or if you can endure risk of future changes.
855
 */
856
857
#if defined (__cplusplus)
858
extern "C" {
859
#endif
860
861
/* *************************************
862
*  Streaming functions
863
***************************************/
864
865
typedef struct ZSTDv02_Dctx_s ZSTD_DCtx;
866
867
/*
868
  Use above functions alternatively.
869
  ZSTD_nextSrcSizeToDecompress() tells how much bytes to provide as 'srcSize' to ZSTD_decompressContinue().
870
  ZSTD_decompressContinue() will use previous data blocks to improve compression if they are located prior to current block.
871
  Result is the number of bytes regenerated within 'dst'.
872
  It can be zero, which is not an error; it just means ZSTD_decompressContinue() has decoded some header.
873
*/
874
875
/* *************************************
876
*  Prefix - version detection
877
***************************************/
878
4.98k
#define ZSTD_magicNumber 0xFD2FB522   /* v0.2 (current)*/
879
880
881
#if defined (__cplusplus)
882
}
883
#endif
884
/* ******************************************************************
885
   FSE : Finite State Entropy coder
886
   Copyright (C) 2013-2015, Yann Collet.
887
888
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
889
890
   Redistribution and use in source and binary forms, with or without
891
   modification, are permitted provided that the following conditions are
892
   met:
893
894
       * Redistributions of source code must retain the above copyright
895
   notice, this list of conditions and the following disclaimer.
896
       * Redistributions in binary form must reproduce the above
897
   copyright notice, this list of conditions and the following disclaimer
898
   in the documentation and/or other materials provided with the
899
   distribution.
900
901
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
902
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
903
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
904
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
905
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
906
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
907
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
908
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
909
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
910
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
911
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
912
913
    You can contact the author at :
914
    - FSE source repository : https://github.com/Cyan4973/FiniteStateEntropy
915
    - Public forum : https://groups.google.com/forum/#!forum/lz4c
916
****************************************************************** */
917
918
#ifndef FSE_COMMONDEFS_ONLY
919
920
/****************************************************************
921
*  Tuning parameters
922
****************************************************************/
923
/* MEMORY_USAGE :
924
*  Memory usage formula : N->2^N Bytes (examples : 10 -> 1KB; 12 -> 4KB ; 16 -> 64KB; 20 -> 1MB; etc.)
925
*  Increasing memory usage improves compression ratio
926
*  Reduced memory usage can improve speed, due to cache effect
927
*  Recommended max value is 14, for 16KB, which nicely fits into Intel x86 L1 cache */
928
17.2k
#define FSE_MAX_MEMORY_USAGE 14
929
#define FSE_DEFAULT_MEMORY_USAGE 13
930
931
/* FSE_MAX_SYMBOL_VALUE :
932
*  Maximum symbol value authorized.
933
*  Required for proper stack allocation */
934
5.29k
#define FSE_MAX_SYMBOL_VALUE 255
935
936
937
/****************************************************************
938
*  template functions type & suffix
939
****************************************************************/
940
490k
#define FSE_FUNCTION_TYPE BYTE
941
#define FSE_FUNCTION_EXTENSION
942
943
944
/****************************************************************
945
*  Byte symbol type
946
****************************************************************/
947
#endif   /* !FSE_COMMONDEFS_ONLY */
948
949
950
/****************************************************************
951
*  Compiler specifics
952
****************************************************************/
953
#ifdef _MSC_VER    /* Visual Studio */
954
#  define FORCE_INLINE static __forceinline
955
#  include <intrin.h>                    /* For Visual 2005 */
956
#  pragma warning(disable : 4127)        /* disable: C4127: conditional expression is constant */
957
#  pragma warning(disable : 4214)        /* disable: C4214: non-int bitfields */
958
#else
959
#  if defined (__cplusplus) || defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L   /* C99 */
960
#    ifdef __GNUC__
961
#      define FORCE_INLINE static inline __attribute__((always_inline))
962
#    else
963
#      define FORCE_INLINE static inline
964
#    endif
965
#  else
966
#    define FORCE_INLINE static
967
#  endif /* __STDC_VERSION__ */
968
#endif
969
970
971
/****************************************************************
972
*  Includes
973
****************************************************************/
974
#include <stdlib.h>     /* malloc, free, qsort */
975
#include <string.h>     /* memcpy, memset */
976
#include <stdio.h>      /* printf (debug) */
977
978
/****************************************************************
979
*  Constants
980
*****************************************************************/
981
17.2k
#define FSE_MAX_TABLELOG  (FSE_MAX_MEMORY_USAGE-2)
982
#define FSE_MAX_TABLESIZE (1U<<FSE_MAX_TABLELOG)
983
#define FSE_MAXTABLESIZE_MASK (FSE_MAX_TABLESIZE-1)
984
#define FSE_DEFAULT_TABLELOG (FSE_DEFAULT_MEMORY_USAGE-2)
985
5.11k
#define FSE_MIN_TABLELOG 5
986
987
5.11k
#define FSE_TABLELOG_ABSOLUTE_MAX 15
988
#if FSE_MAX_TABLELOG > FSE_TABLELOG_ABSOLUTE_MAX
989
#error "FSE_MAX_TABLELOG > FSE_TABLELOG_ABSOLUTE_MAX is not supported"
990
#endif
991
992
993
/****************************************************************
994
*  Error Management
995
****************************************************************/
996
#define FSE_STATIC_ASSERT(c) { enum { FSE_static_assert = 1/(int)(!!(c)) }; }   /* use only *after* variable declarations */
997
998
999
/****************************************************************
1000
*  Complex types
1001
****************************************************************/
1002
typedef U32 DTable_max_t[FSE_DTABLE_SIZE_U32(FSE_MAX_TABLELOG)];
1003
1004
1005
/****************************************************************
1006
*  Templates
1007
****************************************************************/
1008
/*
1009
  designed to be included
1010
  for type-specific functions (template emulation in C)
1011
  Objective is to write these functions only once, for improved maintenance
1012
*/
1013
1014
/* safety checks */
1015
#ifndef FSE_FUNCTION_EXTENSION
1016
#  error "FSE_FUNCTION_EXTENSION must be defined"
1017
#endif
1018
#ifndef FSE_FUNCTION_TYPE
1019
#  error "FSE_FUNCTION_TYPE must be defined"
1020
#endif
1021
1022
/* Function names */
1023
#define FSE_CAT(X,Y) X##Y
1024
#define FSE_FUNCTION_NAME(X,Y) FSE_CAT(X,Y)
1025
#define FSE_TYPE_NAME(X,Y) FSE_CAT(X,Y)
1026
1027
1028
/* Function templates */
1029
1030
5.02k
#define FSE_DECODE_TYPE FSE_decode_t
1031
1032
5.02k
static U32 FSE_tableStep(U32 tableSize) { return (tableSize>>1) + (tableSize>>3) + 3; }
1033
1034
static size_t FSE_buildDTable
1035
(FSE_DTable* dt, const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog)
1036
5.02k
{
1037
5.02k
    void* ptr = dt+1;
1038
5.02k
    FSE_DECODE_TYPE* const tableDecode = (FSE_DECODE_TYPE*)ptr;
1039
5.02k
    FSE_DTableHeader DTableH;
1040
5.02k
    const U32 tableSize = 1 << tableLog;
1041
5.02k
    const U32 tableMask = tableSize-1;
1042
5.02k
    const U32 step = FSE_tableStep(tableSize);
1043
5.02k
    U16 symbolNext[FSE_MAX_SYMBOL_VALUE+1];
1044
5.02k
    U32 position = 0;
1045
5.02k
    U32 highThreshold = tableSize-1;
1046
5.02k
    const S16 largeLimit= (S16)(1 << (tableLog-1));
1047
5.02k
    U32 noLarge = 1;
1048
5.02k
    U32 s;
1049
1050
    /* Sanity Checks */
1051
5.02k
    if (maxSymbolValue > FSE_MAX_SYMBOL_VALUE) return ERROR(maxSymbolValue_tooLarge);
1052
5.02k
    if (tableLog > FSE_MAX_TABLELOG) return ERROR(tableLog_tooLarge);
1053
1054
    /* Init, lay down lowprob symbols */
1055
5.02k
    DTableH.tableLog = (U16)tableLog;
1056
53.2k
    for (s=0; s<=maxSymbolValue; s++)
1057
48.2k
    {
1058
48.2k
        if (normalizedCounter[s]==-1)
1059
13.9k
        {
1060
13.9k
            tableDecode[highThreshold--].symbol = (FSE_FUNCTION_TYPE)s;
1061
13.9k
            symbolNext[s] = 1;
1062
13.9k
        }
1063
34.3k
        else
1064
34.3k
        {
1065
34.3k
            if (normalizedCounter[s] >= largeLimit) noLarge=0;
1066
34.3k
            symbolNext[s] = normalizedCounter[s];
1067
34.3k
        }
1068
48.2k
    }
1069
1070
    /* Spread symbols */
1071
53.2k
    for (s=0; s<=maxSymbolValue; s++)
1072
48.2k
    {
1073
48.2k
        int i;
1074
524k
        for (i=0; i<normalizedCounter[s]; i++)
1075
476k
        {
1076
476k
            tableDecode[position].symbol = (FSE_FUNCTION_TYPE)s;
1077
476k
            position = (position + step) & tableMask;
1078
489k
            while (position > highThreshold) position = (position + step) & tableMask;   /* lowprob area */
1079
476k
        }
1080
48.2k
    }
1081
1082
5.02k
    if (position!=0) return ERROR(GENERIC);   /* position must reach all cells once, otherwise normalizedCounter is incorrect */
1083
1084
    /* Build Decoding table */
1085
5.02k
    {
1086
5.02k
        U32 i;
1087
495k
        for (i=0; i<tableSize; i++)
1088
490k
        {
1089
490k
            FSE_FUNCTION_TYPE symbol = (FSE_FUNCTION_TYPE)(tableDecode[i].symbol);
1090
490k
            U16 nextState = symbolNext[symbol]++;
1091
490k
            tableDecode[i].nbBits = (BYTE) (tableLog - BIT_highbit32 ((U32)nextState) );
1092
490k
            tableDecode[i].newState = (U16) ( (nextState << tableDecode[i].nbBits) - tableSize);
1093
490k
        }
1094
5.02k
    }
1095
1096
5.02k
    DTableH.fastMode = (U16)noLarge;
1097
5.02k
    memcpy(dt, &DTableH, sizeof(DTableH));   /* memcpy(), to avoid strict aliasing warnings */
1098
5.02k
    return 0;
1099
5.02k
}
1100
1101
1102
#ifndef FSE_COMMONDEFS_ONLY
1103
/******************************************
1104
*  FSE helper functions
1105
******************************************/
1106
5.84k
static unsigned FSE_isError(size_t code) { return ERR_isError(code); }
1107
1108
1109
/****************************************************************
1110
*  FSE NCount encoding-decoding
1111
****************************************************************/
1112
static short FSE_abs(short a)
1113
35.9k
{
1114
35.9k
    return (short)(a<0 ? -a : a);
1115
35.9k
}
1116
1117
static size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
1118
                 const void* headerBuffer, size_t hbSize)
1119
5.13k
{
1120
5.13k
    const BYTE* const istart = (const BYTE*) headerBuffer;
1121
5.13k
    const BYTE* const iend = istart + hbSize;
1122
5.13k
    const BYTE* ip = istart;
1123
5.13k
    int nbBits;
1124
5.13k
    int remaining;
1125
5.13k
    int threshold;
1126
5.13k
    U32 bitStream;
1127
5.13k
    int bitCount;
1128
5.13k
    unsigned charnum = 0;
1129
5.13k
    int previous0 = 0;
1130
1131
5.13k
    if (hbSize < 4) return ERROR(srcSize_wrong);
1132
5.11k
    bitStream = MEM_readLE32(ip);
1133
5.11k
    nbBits = (bitStream & 0xF) + FSE_MIN_TABLELOG;   /* extract tableLog */
1134
5.11k
    if (nbBits > FSE_TABLELOG_ABSOLUTE_MAX) return ERROR(tableLog_tooLarge);
1135
5.10k
    bitStream >>= 4;
1136
5.10k
    bitCount = 4;
1137
5.10k
    *tableLogPtr = nbBits;
1138
5.10k
    remaining = (1<<nbBits)+1;
1139
5.10k
    threshold = 1<<nbBits;
1140
5.10k
    nbBits++;
1141
1142
41.0k
    while ((remaining>1) && (charnum<=*maxSVPtr))
1143
35.9k
    {
1144
35.9k
        if (previous0)
1145
4.64k
        {
1146
4.64k
            unsigned n0 = charnum;
1147
49.2k
            while ((bitStream & 0xFFFF) == 0xFFFF)
1148
44.5k
            {
1149
44.5k
                n0+=24;
1150
44.5k
                if (ip < iend-5)
1151
44.4k
                {
1152
44.4k
                    ip+=2;
1153
44.4k
                    bitStream = MEM_readLE32(ip) >> bitCount;
1154
44.4k
                }
1155
70
                else
1156
70
                {
1157
70
                    bitStream >>= 16;
1158
70
                    bitCount+=16;
1159
70
                }
1160
44.5k
            }
1161
6.17k
            while ((bitStream & 3) == 3)
1162
1.52k
            {
1163
1.52k
                n0+=3;
1164
1.52k
                bitStream>>=2;
1165
1.52k
                bitCount+=2;
1166
1.52k
            }
1167
4.64k
            n0 += bitStream & 3;
1168
4.64k
            bitCount += 2;
1169
4.64k
            if (n0 > *maxSVPtr) return ERROR(maxSymbolValue_tooSmall);
1170
23.2k
            while (charnum < n0) normalizedCounter[charnum++] = 0;
1171
4.63k
            if ((ip <= iend-7) || (ip + (bitCount>>3) <= iend-4))
1172
2.95k
            {
1173
2.95k
                ip += bitCount>>3;
1174
2.95k
                bitCount &= 7;
1175
2.95k
                bitStream = MEM_readLE32(ip) >> bitCount;
1176
2.95k
            }
1177
1.68k
            else
1178
1.68k
                bitStream >>= 2;
1179
4.63k
        }
1180
35.9k
        {
1181
35.9k
            const short max = (short)((2*threshold-1)-remaining);
1182
35.9k
            short count;
1183
1184
35.9k
            if ((bitStream & (threshold-1)) < (U32)max)
1185
21.8k
            {
1186
21.8k
                count = (short)(bitStream & (threshold-1));
1187
21.8k
                bitCount   += nbBits-1;
1188
21.8k
            }
1189
14.1k
            else
1190
14.1k
            {
1191
14.1k
                count = (short)(bitStream & (2*threshold-1));
1192
14.1k
                if (count >= threshold) count -= max;
1193
14.1k
                bitCount   += nbBits;
1194
14.1k
            }
1195
1196
35.9k
            count--;   /* extra accuracy */
1197
35.9k
            remaining -= FSE_abs(count);
1198
35.9k
            normalizedCounter[charnum++] = count;
1199
35.9k
            previous0 = !count;
1200
64.5k
            while (remaining < threshold)
1201
28.6k
            {
1202
28.6k
                nbBits--;
1203
28.6k
                threshold >>= 1;
1204
28.6k
            }
1205
1206
35.9k
            {
1207
35.9k
                if ((ip <= iend-7) || (ip + (bitCount>>3) <= iend-4))
1208
30.3k
                {
1209
30.3k
                    ip += bitCount>>3;
1210
30.3k
                    bitCount &= 7;
1211
30.3k
                }
1212
5.58k
                else
1213
5.58k
                {
1214
5.58k
                    bitCount -= (int)(8 * (iend - 4 - ip));
1215
5.58k
                    ip = iend - 4;
1216
5.58k
                }
1217
35.9k
                bitStream = MEM_readLE32(ip) >> (bitCount & 31);
1218
35.9k
            }
1219
35.9k
        }
1220
35.9k
    }
1221
5.08k
    if (remaining != 1) return ERROR(GENERIC);
1222
5.07k
    *maxSVPtr = charnum-1;
1223
1224
5.07k
    ip += (bitCount+7)>>3;
1225
5.07k
    if ((size_t)(ip-istart) > hbSize) return ERROR(srcSize_wrong);
1226
5.04k
    return ip-istart;
1227
5.07k
}
1228
1229
1230
/*********************************************************
1231
*  Decompression (Byte symbols)
1232
*********************************************************/
1233
static size_t FSE_buildDTable_rle (FSE_DTable* dt, BYTE symbolValue)
1234
4.07k
{
1235
4.07k
    void* ptr = dt;
1236
4.07k
    FSE_DTableHeader* const DTableH = (FSE_DTableHeader*)ptr;
1237
4.07k
    FSE_decode_t* const cell = (FSE_decode_t*)(ptr) + 1;   /* because dt is unsigned */
1238
1239
4.07k
    DTableH->tableLog = 0;
1240
4.07k
    DTableH->fastMode = 0;
1241
1242
4.07k
    cell->newState = 0;
1243
4.07k
    cell->symbol = symbolValue;
1244
4.07k
    cell->nbBits = 0;
1245
1246
4.07k
    return 0;
1247
4.07k
}
1248
1249
1250
static size_t FSE_buildDTable_raw (FSE_DTable* dt, unsigned nbBits)
1251
10.7k
{
1252
10.7k
    void* ptr = dt;
1253
10.7k
    FSE_DTableHeader* const DTableH = (FSE_DTableHeader*)ptr;
1254
10.7k
    FSE_decode_t* const dinfo = (FSE_decode_t*)(ptr) + 1;   /* because dt is unsigned */
1255
10.7k
    const unsigned tableSize = 1 << nbBits;
1256
10.7k
    const unsigned tableMask = tableSize - 1;
1257
10.7k
    const unsigned maxSymbolValue = tableMask;
1258
10.7k
    unsigned s;
1259
1260
    /* Sanity checks */
1261
10.7k
    if (nbBits < 1) return ERROR(GENERIC);         /* min size */
1262
1263
    /* Build Decoding Table */
1264
10.7k
    DTableH->tableLog = (U16)nbBits;
1265
10.7k
    DTableH->fastMode = 1;
1266
869k
    for (s=0; s<=maxSymbolValue; s++)
1267
858k
    {
1268
858k
        dinfo[s].newState = 0;
1269
858k
        dinfo[s].symbol = (BYTE)s;
1270
858k
        dinfo[s].nbBits = (BYTE)nbBits;
1271
858k
    }
1272
1273
10.7k
    return 0;
1274
10.7k
}
1275
1276
FORCE_INLINE size_t FSE_decompress_usingDTable_generic(
1277
          void* dst, size_t maxDstSize,
1278
    const void* cSrc, size_t cSrcSize,
1279
    const FSE_DTable* dt, const unsigned fast)
1280
220
{
1281
220
    BYTE* const ostart = (BYTE*) dst;
1282
220
    BYTE* op = ostart;
1283
220
    BYTE* const omax = op + maxDstSize;
1284
220
    BYTE* const olimit = omax-3;
1285
1286
220
    BIT_DStream_t bitD;
1287
220
    FSE_DState_t state1;
1288
220
    FSE_DState_t state2;
1289
220
    size_t errorCode;
1290
1291
    /* Init */
1292
220
    errorCode = BIT_initDStream(&bitD, cSrc, cSrcSize);   /* replaced last arg by maxCompressed Size */
1293
220
    if (FSE_isError(errorCode)) return errorCode;
1294
1295
206
    FSE_initDState(&state1, &bitD, dt);
1296
206
    FSE_initDState(&state2, &bitD, dt);
1297
1298
27.4k
#define FSE_GETSYMBOL(statePtr) fast ? FSE_decodeSymbolFast(statePtr, &bitD) : FSE_decodeSymbol(statePtr, &bitD)
1299
1300
    /* 4 symbols per loop */
1301
4.26k
    for ( ; (BIT_reloadDStream(&bitD)==BIT_DStream_unfinished) && (op<olimit) ; op+=4)
1302
4.06k
    {
1303
4.06k
        op[0] = FSE_GETSYMBOL(&state1);
1304
1305
4.06k
        if (FSE_MAX_TABLELOG*2+7 > sizeof(bitD.bitContainer)*8)    /* This test must be static */
1306
0
            BIT_reloadDStream(&bitD);
1307
1308
4.06k
        op[1] = FSE_GETSYMBOL(&state2);
1309
1310
4.06k
        if (FSE_MAX_TABLELOG*4+7 > sizeof(bitD.bitContainer)*8)    /* This test must be static */
1311
0
            { if (BIT_reloadDStream(&bitD) > BIT_DStream_unfinished) { op+=2; break; } }
1312
1313
4.06k
        op[2] = FSE_GETSYMBOL(&state1);
1314
1315
4.06k
        if (FSE_MAX_TABLELOG*2+7 > sizeof(bitD.bitContainer)*8)    /* This test must be static */
1316
0
            BIT_reloadDStream(&bitD);
1317
1318
4.06k
        op[3] = FSE_GETSYMBOL(&state2);
1319
4.06k
    }
1320
1321
    /* tail */
1322
    /* note : BIT_reloadDStream(&bitD) >= FSE_DStream_partiallyFilled; Ends at exactly BIT_DStream_completed */
1323
5.73k
    while (1)
1324
5.73k
    {
1325
5.73k
        if ( (BIT_reloadDStream(&bitD)>BIT_DStream_completed) || (op==omax) || (BIT_endOfDStream(&bitD) && (fast || FSE_endOfDState(&state1))) )
1326
95
            break;
1327
1328
5.64k
        *op++ = FSE_GETSYMBOL(&state1);
1329
1330
5.64k
        if ( (BIT_reloadDStream(&bitD)>BIT_DStream_completed) || (op==omax) || (BIT_endOfDStream(&bitD) && (fast || FSE_endOfDState(&state2))) )
1331
111
            break;
1332
1333
5.53k
        *op++ = FSE_GETSYMBOL(&state2);
1334
5.53k
    }
1335
1336
    /* end ? */
1337
206
    if (BIT_endOfDStream(&bitD) && FSE_endOfDState(&state1) && FSE_endOfDState(&state2))
1338
91
        return op-ostart;
1339
1340
115
    if (op==omax) return ERROR(dstSize_tooSmall);   /* dst buffer is full, but cSrc unfinished */
1341
1342
83
    return ERROR(corruption_detected);
1343
115
}
1344
1345
1346
static size_t FSE_decompress_usingDTable(void* dst, size_t originalSize,
1347
                            const void* cSrc, size_t cSrcSize,
1348
                            const FSE_DTable* dt)
1349
220
{
1350
220
    FSE_DTableHeader DTableH;
1351
220
    memcpy(&DTableH, dt, sizeof(DTableH));
1352
1353
    /* select fast mode (static) */
1354
220
    if (DTableH.fastMode) return FSE_decompress_usingDTable_generic(dst, originalSize, cSrc, cSrcSize, dt, 1);
1355
159
    return FSE_decompress_usingDTable_generic(dst, originalSize, cSrc, cSrcSize, dt, 0);
1356
220
}
1357
1358
1359
static size_t FSE_decompress(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize)
1360
265
{
1361
265
    const BYTE* const istart = (const BYTE*)cSrc;
1362
265
    const BYTE* ip = istart;
1363
265
    short counting[FSE_MAX_SYMBOL_VALUE+1];
1364
265
    DTable_max_t dt;   /* Static analyzer seems unable to understand this table will be properly initialized later */
1365
265
    unsigned tableLog;
1366
265
    unsigned maxSymbolValue = FSE_MAX_SYMBOL_VALUE;
1367
265
    size_t errorCode;
1368
1369
265
    if (cSrcSize<2) return ERROR(srcSize_wrong);   /* too small input size */
1370
1371
    /* normal FSE decoding mode */
1372
255
    errorCode = FSE_readNCount (counting, &maxSymbolValue, &tableLog, istart, cSrcSize);
1373
255
    if (FSE_isError(errorCode)) return errorCode;
1374
224
    if (errorCode >= cSrcSize) return ERROR(srcSize_wrong);   /* too small input size */
1375
221
    ip += errorCode;
1376
221
    cSrcSize -= errorCode;
1377
1378
221
    errorCode = FSE_buildDTable (dt, counting, maxSymbolValue, tableLog);
1379
221
    if (FSE_isError(errorCode)) return errorCode;
1380
1381
    /* always return, even if it is an error code */
1382
220
    return FSE_decompress_usingDTable (dst, maxDstSize, ip, cSrcSize, dt);
1383
221
}
1384
1385
1386
1387
#endif   /* FSE_COMMONDEFS_ONLY */
1388
/* ******************************************************************
1389
   Huff0 : Huffman coder, part of New Generation Entropy library
1390
   Copyright (C) 2013-2015, Yann Collet.
1391
1392
   BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
1393
1394
   Redistribution and use in source and binary forms, with or without
1395
   modification, are permitted provided that the following conditions are
1396
   met:
1397
1398
       * Redistributions of source code must retain the above copyright
1399
   notice, this list of conditions and the following disclaimer.
1400
       * Redistributions in binary form must reproduce the above
1401
   copyright notice, this list of conditions and the following disclaimer
1402
   in the documentation and/or other materials provided with the
1403
   distribution.
1404
1405
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
1406
   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
1407
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
1408
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
1409
   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
1410
   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
1411
   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
1412
   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
1413
   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
1414
   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
1415
   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
1416
1417
    You can contact the author at :
1418
    - FSE+Huff0 source repository : https://github.com/Cyan4973/FiniteStateEntropy
1419
    - Public forum : https://groups.google.com/forum/#!forum/lz4c
1420
****************************************************************** */
1421
1422
/****************************************************************
1423
*  Compiler specifics
1424
****************************************************************/
1425
#if defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
1426
/* inline is defined */
1427
#elif defined(_MSC_VER)
1428
#  define inline __inline
1429
#else
1430
#  define inline /* disable inline */
1431
#endif
1432
1433
1434
#ifdef _MSC_VER    /* Visual Studio */
1435
#  pragma warning(disable : 4127)        /* disable: C4127: conditional expression is constant */
1436
#endif
1437
1438
1439
/****************************************************************
1440
*  Includes
1441
****************************************************************/
1442
#include <stdlib.h>     /* malloc, free, qsort */
1443
#include <string.h>     /* memcpy, memset */
1444
#include <stdio.h>      /* printf (debug) */
1445
1446
/****************************************************************
1447
*  Error Management
1448
****************************************************************/
1449
956
#define HUF_STATIC_ASSERT(c) { enum { HUF_static_assert = 1/(int)(!!(c)) }; }   /* use only *after* variable declarations */
1450
1451
1452
/******************************************
1453
*  Helper functions
1454
******************************************/
1455
6.85k
static unsigned HUF_isError(size_t code) { return ERR_isError(code); }
1456
1457
92.6k
#define HUF_ABSOLUTEMAX_TABLELOG  16   /* absolute limit of HUF_MAX_TABLELOG. Beyond that value, code does not work */
1458
0
#define HUF_MAX_TABLELOG  12           /* max configured tableLog (for static allocation); can be modified up to HUF_ABSOLUTEMAX_TABLELOG */
1459
#define HUF_DEFAULT_TABLELOG  HUF_MAX_TABLELOG   /* tableLog by default, when not specified */
1460
1.10k
#define HUF_MAX_SYMBOL_VALUE 255
1461
#if (HUF_MAX_TABLELOG > HUF_ABSOLUTEMAX_TABLELOG)
1462
#  error "HUF_MAX_TABLELOG is too large !"
1463
#endif
1464
1465
1466
1467
/*********************************************************
1468
*  Huff0 : Huffman block decompression
1469
*********************************************************/
1470
typedef struct { BYTE byte; BYTE nbBits; } HUF_DEltX2;   /* single-symbol decoding */
1471
1472
typedef struct { U16 sequence; BYTE nbBits; BYTE length; } HUF_DEltX4;  /* double-symbols decoding */
1473
1474
typedef struct { BYTE symbol; BYTE weight; } sortedSymbol_t;
1475
1476
/*! HUF_readStats
1477
    Read compact Huffman tree, saved by HUF_writeCTable
1478
    @huffWeight : destination buffer
1479
    @return : size read from `src`
1480
*/
1481
static size_t HUF_readStats(BYTE* huffWeight, size_t hwSize, U32* rankStats,
1482
                            U32* nbSymbolsPtr, U32* tableLogPtr,
1483
                            const void* src, size_t srcSize)
1484
1.10k
{
1485
1.10k
    U32 weightTotal;
1486
1.10k
    U32 tableLog;
1487
1.10k
    const BYTE* ip = (const BYTE*) src;
1488
1.10k
    size_t iSize;
1489
1.10k
    size_t oSize;
1490
1.10k
    U32 n;
1491
1492
1.10k
    if (!srcSize) return ERROR(srcSize_wrong);
1493
1.10k
    iSize = ip[0];
1494
    //memset(huffWeight, 0, hwSize);   /* is not necessary, even though some analyzer complain ... */
1495
1496
1.10k
    if (iSize >= 128)  /* special header */
1497
838
    {
1498
838
        if (iSize >= (242))   /* RLE */
1499
724
        {
1500
724
            static int l[14] = { 1, 2, 3, 4, 7, 8, 15, 16, 31, 32, 63, 64, 127, 128 };
1501
724
            oSize = l[iSize-242];
1502
724
            memset(huffWeight, 1, hwSize);
1503
724
            iSize = 0;
1504
724
        }
1505
114
        else   /* Incompressible */
1506
114
        {
1507
114
            oSize = iSize - 127;
1508
114
            iSize = ((oSize+1)/2);
1509
114
            if (iSize+1 > srcSize) return ERROR(srcSize_wrong);
1510
112
            if (oSize >= hwSize) return ERROR(corruption_detected);
1511
112
            ip += 1;
1512
3.68k
            for (n=0; n<oSize; n+=2)
1513
3.57k
            {
1514
3.57k
                huffWeight[n]   = ip[n/2] >> 4;
1515
3.57k
                huffWeight[n+1] = ip[n/2] & 15;
1516
3.57k
            }
1517
112
        }
1518
838
    }
1519
266
    else  /* header compressed with FSE (normal case) */
1520
266
    {
1521
266
        if (iSize+1 > srcSize) return ERROR(srcSize_wrong);
1522
265
        oSize = FSE_decompress(huffWeight, hwSize-1, ip+1, iSize);   /* max (hwSize-1) values decoded, as last one is implied */
1523
265
        if (FSE_isError(oSize)) return oSize;
1524
265
    }
1525
1526
    /* collect weight stats */
1527
927
    memset(rankStats, 0, (HUF_ABSOLUTEMAX_TABLELOG + 1) * sizeof(U32));
1528
927
    weightTotal = 0;
1529
91.4k
    for (n=0; n<oSize; n++)
1530
90.5k
    {
1531
90.5k
        if (huffWeight[n] >= HUF_ABSOLUTEMAX_TABLELOG) return ERROR(corruption_detected);
1532
90.5k
        rankStats[huffWeight[n]]++;
1533
90.5k
        weightTotal += (1 << huffWeight[n]) >> 1;
1534
90.5k
    }
1535
926
    if (weightTotal == 0) return ERROR(corruption_detected);
1536
1537
    /* get last non-null symbol weight (implied, total must be 2^n) */
1538
922
    tableLog = BIT_highbit32(weightTotal) + 1;
1539
922
    if (tableLog > HUF_ABSOLUTEMAX_TABLELOG) return ERROR(corruption_detected);
1540
916
    {
1541
916
        U32 total = 1 << tableLog;
1542
916
        U32 rest = total - weightTotal;
1543
916
        U32 verif = 1 << BIT_highbit32(rest);
1544
916
        U32 lastWeight = BIT_highbit32(rest) + 1;
1545
916
        if (verif != rest) return ERROR(corruption_detected);    /* last value must be a clean power of 2 */
1546
911
        huffWeight[oSize] = (BYTE)lastWeight;
1547
911
        rankStats[lastWeight]++;
1548
911
    }
1549
1550
    /* check tree construction validity */
1551
911
    if ((rankStats[1] < 2) || (rankStats[1] & 1)) return ERROR(corruption_detected);   /* by construction : at least 2 elts of rank 1, must be even */
1552
1553
    /* results */
1554
910
    *nbSymbolsPtr = (U32)(oSize+1);
1555
910
    *tableLogPtr = tableLog;
1556
910
    return iSize+1;
1557
911
}
1558
1559
1560
/**************************/
1561
/* single-symbol decoding */
1562
/**************************/
1563
1564
static size_t HUF_readDTableX2 (U16* DTable, const void* src, size_t srcSize)
1565
800
{
1566
800
    BYTE huffWeight[HUF_MAX_SYMBOL_VALUE + 1];
1567
800
    U32 rankVal[HUF_ABSOLUTEMAX_TABLELOG + 1];   /* large enough for values from 0 to 16 */
1568
800
    U32 tableLog = 0;
1569
800
    const BYTE* ip = (const BYTE*) src;
1570
800
    size_t iSize = ip[0];
1571
800
    U32 nbSymbols = 0;
1572
800
    U32 n;
1573
800
    U32 nextRankStart;
1574
800
    void* ptr = DTable+1;
1575
800
    HUF_DEltX2* const dt = (HUF_DEltX2*)ptr;
1576
1577
800
    HUF_STATIC_ASSERT(sizeof(HUF_DEltX2) == sizeof(U16));   /* if compilation fails here, assertion is false */
1578
    //memset(huffWeight, 0, sizeof(huffWeight));   /* is not necessary, even though some analyzer complain ... */
1579
1580
800
    iSize = HUF_readStats(huffWeight, HUF_MAX_SYMBOL_VALUE + 1, rankVal, &nbSymbols, &tableLog, src, srcSize);
1581
800
    if (HUF_isError(iSize)) return iSize;
1582
1583
    /* check result */
1584
613
    if (tableLog > DTable[0]) return ERROR(tableLog_tooLarge);   /* DTable is too small */
1585
612
    DTable[0] = (U16)tableLog;   /* maybe should separate sizeof DTable, as allocated, from used size of DTable, in case of DTable re-use */
1586
1587
    /* Prepare ranks */
1588
612
    nextRankStart = 0;
1589
4.86k
    for (n=1; n<=tableLog; n++)
1590
4.25k
    {
1591
4.25k
        U32 current = nextRankStart;
1592
4.25k
        nextRankStart += (rankVal[n] << (n-1));
1593
4.25k
        rankVal[n] = current;
1594
4.25k
    }
1595
1596
    /* fill DTable */
1597
58.7k
    for (n=0; n<nbSymbols; n++)
1598
58.1k
    {
1599
58.1k
        const U32 w = huffWeight[n];
1600
58.1k
        const U32 length = (1 << w) >> 1;
1601
58.1k
        U32 i;
1602
58.1k
        HUF_DEltX2 D;
1603
58.1k
        D.byte = (BYTE)n; D.nbBits = (BYTE)(tableLog + 1 - w);
1604
196k
        for (i = rankVal[w]; i < rankVal[w] + length; i++)
1605
138k
            dt[i] = D;
1606
58.1k
        rankVal[w] += length;
1607
58.1k
    }
1608
1609
612
    return iSize;
1610
613
}
1611
1612
static BYTE HUF_decodeSymbolX2(BIT_DStream_t* Dstream, const HUF_DEltX2* dt, const U32 dtLog)
1613
7.17M
{
1614
7.17M
        const size_t val = BIT_lookBitsFast(Dstream, dtLog); /* note : dtLog >= 1 */
1615
7.17M
        const BYTE c = dt[val].byte;
1616
7.17M
        BIT_skipBits(Dstream, dt[val].nbBits);
1617
7.17M
        return c;
1618
7.17M
}
1619
1620
#define HUF_DECODE_SYMBOLX2_0(ptr, DStreamPtr) \
1621
7.17M
    *ptr++ = HUF_decodeSymbolX2(DStreamPtr, dt, dtLog)
1622
1623
#define HUF_DECODE_SYMBOLX2_1(ptr, DStreamPtr) \
1624
155k
    if (MEM_64bits() || (HUF_MAX_TABLELOG<=12)) \
1625
155k
        HUF_DECODE_SYMBOLX2_0(ptr, DStreamPtr)
1626
1627
#define HUF_DECODE_SYMBOLX2_2(ptr, DStreamPtr) \
1628
311k
    if (MEM_64bits()) \
1629
311k
        HUF_DECODE_SYMBOLX2_0(ptr, DStreamPtr)
1630
1631
static inline size_t HUF_decodeStreamX2(BYTE* p, BIT_DStream_t* const bitDPtr, BYTE* const pEnd, const HUF_DEltX2* const dt, const U32 dtLog)
1632
2.11k
{
1633
2.11k
    BYTE* const pStart = p;
1634
1635
    /* up to 4 symbols at a time */
1636
92.3k
    while ((BIT_reloadDStream(bitDPtr) == BIT_DStream_unfinished) && (p <= pEnd-4))
1637
90.2k
    {
1638
90.2k
        HUF_DECODE_SYMBOLX2_2(p, bitDPtr);
1639
90.2k
        HUF_DECODE_SYMBOLX2_1(p, bitDPtr);
1640
90.2k
        HUF_DECODE_SYMBOLX2_2(p, bitDPtr);
1641
90.2k
        HUF_DECODE_SYMBOLX2_0(p, bitDPtr);
1642
90.2k
    }
1643
1644
    /* closer to the end */
1645
2.25k
    while ((BIT_reloadDStream(bitDPtr) == BIT_DStream_unfinished) && (p < pEnd))
1646
135
        HUF_DECODE_SYMBOLX2_0(p, bitDPtr);
1647
1648
    /* no more data to retrieve from bitstream, hence no need to reload */
1649
6.55M
    while (p < pEnd)
1650
6.55M
        HUF_DECODE_SYMBOLX2_0(p, bitDPtr);
1651
1652
2.11k
    return pEnd-pStart;
1653
2.11k
}
1654
1655
1656
static size_t HUF_decompress4X2_usingDTable(
1657
          void* dst,  size_t dstSize,
1658
    const void* cSrc, size_t cSrcSize,
1659
    const U16* DTable)
1660
600
{
1661
600
    if (cSrcSize < 10) return ERROR(corruption_detected);   /* strict minimum : jump table + 1 byte per stream */
1662
1663
581
    {
1664
581
        const BYTE* const istart = (const BYTE*) cSrc;
1665
581
        BYTE* const ostart = (BYTE*) dst;
1666
581
        BYTE* const oend = ostart + dstSize;
1667
1668
581
        const void* ptr = DTable;
1669
581
        const HUF_DEltX2* const dt = ((const HUF_DEltX2*)ptr) +1;
1670
581
        const U32 dtLog = DTable[0];
1671
581
        size_t errorCode;
1672
1673
        /* Init */
1674
581
        BIT_DStream_t bitD1;
1675
581
        BIT_DStream_t bitD2;
1676
581
        BIT_DStream_t bitD3;
1677
581
        BIT_DStream_t bitD4;
1678
581
        const size_t length1 = MEM_readLE16(istart);
1679
581
        const size_t length2 = MEM_readLE16(istart+2);
1680
581
        const size_t length3 = MEM_readLE16(istart+4);
1681
581
        size_t length4;
1682
581
        const BYTE* const istart1 = istart + 6;  /* jumpTable */
1683
581
        const BYTE* const istart2 = istart1 + length1;
1684
581
        const BYTE* const istart3 = istart2 + length2;
1685
581
        const BYTE* const istart4 = istart3 + length3;
1686
581
        const size_t segmentSize = (dstSize+3) / 4;
1687
581
        BYTE* const opStart2 = ostart + segmentSize;
1688
581
        BYTE* const opStart3 = opStart2 + segmentSize;
1689
581
        BYTE* const opStart4 = opStart3 + segmentSize;
1690
581
        BYTE* op1 = ostart;
1691
581
        BYTE* op2 = opStart2;
1692
581
        BYTE* op3 = opStart3;
1693
581
        BYTE* op4 = opStart4;
1694
581
        U32 endSignal;
1695
1696
581
        length4 = cSrcSize - (length1 + length2 + length3 + 6);
1697
581
        if (length4 > cSrcSize) return ERROR(corruption_detected);   /* overflow */
1698
577
        errorCode = BIT_initDStream(&bitD1, istart1, length1);
1699
577
        if (HUF_isError(errorCode)) return errorCode;
1700
572
        errorCode = BIT_initDStream(&bitD2, istart2, length2);
1701
572
        if (HUF_isError(errorCode)) return errorCode;
1702
556
        errorCode = BIT_initDStream(&bitD3, istart3, length3);
1703
556
        if (HUF_isError(errorCode)) return errorCode;
1704
540
        errorCode = BIT_initDStream(&bitD4, istart4, length4);
1705
540
        if (HUF_isError(errorCode)) return errorCode;
1706
1707
        /* 16-32 symbols per loop (4-8 symbols per stream) */
1708
529
        endSignal = BIT_reloadDStream(&bitD1) | BIT_reloadDStream(&bitD2) | BIT_reloadDStream(&bitD3) | BIT_reloadDStream(&bitD4);
1709
16.8k
        for ( ; (endSignal==BIT_DStream_unfinished) && (op4<(oend-7)) ; )
1710
16.3k
        {
1711
16.3k
            HUF_DECODE_SYMBOLX2_2(op1, &bitD1);
1712
16.3k
            HUF_DECODE_SYMBOLX2_2(op2, &bitD2);
1713
16.3k
            HUF_DECODE_SYMBOLX2_2(op3, &bitD3);
1714
16.3k
            HUF_DECODE_SYMBOLX2_2(op4, &bitD4);
1715
16.3k
            HUF_DECODE_SYMBOLX2_1(op1, &bitD1);
1716
16.3k
            HUF_DECODE_SYMBOLX2_1(op2, &bitD2);
1717
16.3k
            HUF_DECODE_SYMBOLX2_1(op3, &bitD3);
1718
16.3k
            HUF_DECODE_SYMBOLX2_1(op4, &bitD4);
1719
16.3k
            HUF_DECODE_SYMBOLX2_2(op1, &bitD1);
1720
16.3k
            HUF_DECODE_SYMBOLX2_2(op2, &bitD2);
1721
16.3k
            HUF_DECODE_SYMBOLX2_2(op3, &bitD3);
1722
16.3k
            HUF_DECODE_SYMBOLX2_2(op4, &bitD4);
1723
16.3k
            HUF_DECODE_SYMBOLX2_0(op1, &bitD1);
1724
16.3k
            HUF_DECODE_SYMBOLX2_0(op2, &bitD2);
1725
16.3k
            HUF_DECODE_SYMBOLX2_0(op3, &bitD3);
1726
16.3k
            HUF_DECODE_SYMBOLX2_0(op4, &bitD4);
1727
1728
16.3k
            endSignal = BIT_reloadDStream(&bitD1) | BIT_reloadDStream(&bitD2) | BIT_reloadDStream(&bitD3) | BIT_reloadDStream(&bitD4);
1729
16.3k
        }
1730
1731
        /* check corruption */
1732
529
        if (op1 > opStart2) return ERROR(corruption_detected);
1733
529
        if (op2 > opStart3) return ERROR(corruption_detected);
1734
529
        if (op3 > opStart4) return ERROR(corruption_detected);
1735
        /* note : op4 supposed already verified within main loop */
1736
1737
        /* finish bitStreams one by one */
1738
529
        HUF_decodeStreamX2(op1, &bitD1, opStart2, dt, dtLog);
1739
529
        HUF_decodeStreamX2(op2, &bitD2, opStart3, dt, dtLog);
1740
529
        HUF_decodeStreamX2(op3, &bitD3, opStart4, dt, dtLog);
1741
529
        HUF_decodeStreamX2(op4, &bitD4, oend,     dt, dtLog);
1742
1743
        /* check */
1744
529
        endSignal = BIT_endOfDStream(&bitD1) & BIT_endOfDStream(&bitD2) & BIT_endOfDStream(&bitD3) & BIT_endOfDStream(&bitD4);
1745
529
        if (!endSignal) return ERROR(corruption_detected);
1746
1747
        /* decoded size */
1748
379
        return dstSize;
1749
529
    }
1750
529
}
1751
1752
1753
static size_t HUF_decompress4X2 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize)
1754
800
{
1755
800
    HUF_CREATE_STATIC_DTABLEX2(DTable, HUF_MAX_TABLELOG);
1756
800
    const BYTE* ip = (const BYTE*) cSrc;
1757
800
    size_t errorCode;
1758
1759
800
    errorCode = HUF_readDTableX2 (DTable, cSrc, cSrcSize);
1760
800
    if (HUF_isError(errorCode)) return errorCode;
1761
612
    if (errorCode >= cSrcSize) return ERROR(srcSize_wrong);
1762
600
    ip += errorCode;
1763
600
    cSrcSize -= errorCode;
1764
1765
600
    return HUF_decompress4X2_usingDTable (dst, dstSize, ip, cSrcSize, DTable);
1766
612
}
1767
1768
1769
/***************************/
1770
/* double-symbols decoding */
1771
/***************************/
1772
1773
static void HUF_fillDTableX4Level2(HUF_DEltX4* DTable, U32 sizeLog, const U32 consumed,
1774
                           const U32* rankValOrigin, const int minWeight,
1775
                           const sortedSymbol_t* sortedSymbols, const U32 sortedListSize,
1776
                           U32 nbBitsBaseline, U16 baseSeq)
1777
12.4k
{
1778
12.4k
    HUF_DEltX4 DElt;
1779
12.4k
    U32 rankVal[HUF_ABSOLUTEMAX_TABLELOG + 1];
1780
12.4k
    U32 s;
1781
1782
    /* get pre-calculated rankVal */
1783
12.4k
    memcpy(rankVal, rankValOrigin, sizeof(rankVal));
1784
1785
    /* fill skipped values */
1786
12.4k
    if (minWeight>1)
1787
11.7k
    {
1788
11.7k
        U32 i, skipSize = rankVal[minWeight];
1789
11.7k
        MEM_writeLE16(&(DElt.sequence), baseSeq);
1790
11.7k
        DElt.nbBits   = (BYTE)(consumed);
1791
11.7k
        DElt.length   = 1;
1792
117k
        for (i = 0; i < skipSize; i++)
1793
105k
            DTable[i] = DElt;
1794
11.7k
    }
1795
1796
    /* fill DTable */
1797
72.9k
    for (s=0; s<sortedListSize; s++)   /* note : sortedSymbols already skipped */
1798
60.5k
    {
1799
60.5k
        const U32 symbol = sortedSymbols[s].symbol;
1800
60.5k
        const U32 weight = sortedSymbols[s].weight;
1801
60.5k
        const U32 nbBits = nbBitsBaseline - weight;
1802
60.5k
        const U32 length = 1 << (sizeLog-nbBits);
1803
60.5k
        const U32 start = rankVal[weight];
1804
60.5k
        U32 i = start;
1805
60.5k
        const U32 end = start + length;
1806
1807
60.5k
        MEM_writeLE16(&(DElt.sequence), (U16)(baseSeq + (symbol << 8)));
1808
60.5k
        DElt.nbBits = (BYTE)(nbBits + consumed);
1809
60.5k
        DElt.length = 2;
1810
450k
        do { DTable[i++] = DElt; } while (i<end);   /* since length >= 1 */
1811
1812
60.5k
        rankVal[weight] += length;
1813
60.5k
    }
1814
12.4k
}
1815
1816
typedef U32 rankVal_t[HUF_ABSOLUTEMAX_TABLELOG][HUF_ABSOLUTEMAX_TABLELOG + 1];
1817
1818
static void HUF_fillDTableX4(HUF_DEltX4* DTable, const U32 targetLog,
1819
                           const sortedSymbol_t* sortedList, const U32 sortedListSize,
1820
                           const U32* rankStart, rankVal_t rankValOrigin, const U32 maxWeight,
1821
                           const U32 nbBitsBaseline)
1822
150
{
1823
150
    U32 rankVal[HUF_ABSOLUTEMAX_TABLELOG + 1];
1824
150
    const int scaleLog = nbBitsBaseline - targetLog;   /* note : targetLog >= srcLog, hence scaleLog <= 1 */
1825
150
    const U32 minBits  = nbBitsBaseline - maxWeight;
1826
150
    U32 s;
1827
1828
150
    memcpy(rankVal, rankValOrigin, sizeof(rankVal));
1829
1830
    /* fill DTable */
1831
15.5k
    for (s=0; s<sortedListSize; s++)
1832
15.4k
    {
1833
15.4k
        const U16 symbol = sortedList[s].symbol;
1834
15.4k
        const U32 weight = sortedList[s].weight;
1835
15.4k
        const U32 nbBits = nbBitsBaseline - weight;
1836
15.4k
        const U32 start = rankVal[weight];
1837
15.4k
        const U32 length = 1 << (targetLog-nbBits);
1838
1839
15.4k
        if (targetLog-nbBits >= minBits)   /* enough room for a second symbol */
1840
12.4k
        {
1841
12.4k
            U32 sortedRank;
1842
12.4k
            int minWeight = nbBits + scaleLog;
1843
12.4k
            if (minWeight < 1) minWeight = 1;
1844
12.4k
            sortedRank = rankStart[minWeight];
1845
12.4k
            HUF_fillDTableX4Level2(DTable+start, targetLog-nbBits, nbBits,
1846
12.4k
                           rankValOrigin[nbBits], minWeight,
1847
12.4k
                           sortedList+sortedRank, sortedListSize-sortedRank,
1848
12.4k
                           nbBitsBaseline, symbol);
1849
12.4k
        }
1850
3.01k
        else
1851
3.01k
        {
1852
3.01k
            U32 i;
1853
3.01k
            const U32 end = start + length;
1854
3.01k
            HUF_DEltX4 DElt;
1855
1856
3.01k
            MEM_writeLE16(&(DElt.sequence), symbol);
1857
3.01k
            DElt.nbBits   = (BYTE)(nbBits);
1858
3.01k
            DElt.length   = 1;
1859
61.4k
            for (i = start; i < end; i++)
1860
58.4k
                DTable[i] = DElt;
1861
3.01k
        }
1862
15.4k
        rankVal[weight] += length;
1863
15.4k
    }
1864
150
}
1865
1866
static size_t HUF_readDTableX4 (U32* DTable, const void* src, size_t srcSize)
1867
156
{
1868
156
    BYTE weightList[HUF_MAX_SYMBOL_VALUE + 1];
1869
156
    sortedSymbol_t sortedSymbol[HUF_MAX_SYMBOL_VALUE + 1];
1870
156
    U32 rankStats[HUF_ABSOLUTEMAX_TABLELOG + 1] = { 0 };
1871
156
    U32 rankStart0[HUF_ABSOLUTEMAX_TABLELOG + 2] = { 0 };
1872
156
    U32* const rankStart = rankStart0+1;
1873
156
    rankVal_t rankVal;
1874
156
    U32 tableLog, maxW, sizeOfSort, nbSymbols;
1875
156
    const U32 memLog = DTable[0];
1876
156
    const BYTE* ip = (const BYTE*) src;
1877
156
    size_t iSize = ip[0];
1878
156
    void* ptr = DTable;
1879
156
    HUF_DEltX4* const dt = ((HUF_DEltX4*)ptr) + 1;
1880
1881
156
    HUF_STATIC_ASSERT(sizeof(HUF_DEltX4) == sizeof(U32));   /* if compilation fails here, assertion is false */
1882
156
    if (memLog > HUF_ABSOLUTEMAX_TABLELOG) return ERROR(tableLog_tooLarge);
1883
    //memset(weightList, 0, sizeof(weightList));   /* is not necessary, even though some analyzer complain ... */
1884
1885
156
    iSize = HUF_readStats(weightList, HUF_MAX_SYMBOL_VALUE + 1, rankStats, &nbSymbols, &tableLog, src, srcSize);
1886
156
    if (HUF_isError(iSize)) return iSize;
1887
1888
    /* check result */
1889
151
    if (tableLog > memLog) return ERROR(tableLog_tooLarge);   /* DTable can't fit code depth */
1890
1891
    /* find maxWeight */
1892
300
    for (maxW = tableLog; rankStats[maxW]==0; maxW--)
1893
150
        {if (!maxW) return ERROR(GENERIC); }  /* necessarily finds a solution before maxW==0 */
1894
1895
    /* Get start index of each weight */
1896
150
    {
1897
150
        U32 w, nextRankStart = 0;
1898
1.15k
        for (w=1; w<=maxW; w++)
1899
1.00k
        {
1900
1.00k
            U32 current = nextRankStart;
1901
1.00k
            nextRankStart += rankStats[w];
1902
1.00k
            rankStart[w] = current;
1903
1.00k
        }
1904
150
        rankStart[0] = nextRankStart;   /* put all 0w symbols at the end of sorted list*/
1905
150
        sizeOfSort = nextRankStart;
1906
150
    }
1907
1908
    /* sort symbols by weight */
1909
150
    {
1910
150
        U32 s;
1911
19.6k
        for (s=0; s<nbSymbols; s++)
1912
19.4k
        {
1913
19.4k
            U32 w = weightList[s];
1914
19.4k
            U32 r = rankStart[w]++;
1915
19.4k
            sortedSymbol[r].symbol = (BYTE)s;
1916
19.4k
            sortedSymbol[r].weight = (BYTE)w;
1917
19.4k
        }
1918
150
        rankStart[0] = 0;   /* forget 0w symbols; this is beginning of weight(1) */
1919
150
    }
1920
1921
    /* Build rankVal */
1922
150
    {
1923
150
        const U32 minBits = tableLog+1 - maxW;
1924
150
        U32 nextRankVal = 0;
1925
150
        U32 w, consumed;
1926
150
        const int rescale = (memLog-tableLog) - 1;   /* tableLog <= memLog */
1927
150
        U32* rankVal0 = rankVal[0];
1928
1.15k
        for (w=1; w<=maxW; w++)
1929
1.00k
        {
1930
1.00k
            U32 current = nextRankVal;
1931
1.00k
            nextRankVal += rankStats[w] << (w+rescale);
1932
1.00k
            rankVal0[w] = current;
1933
1.00k
        }
1934
1.50k
        for (consumed = minBits; consumed <= memLog - minBits; consumed++)
1935
1.35k
        {
1936
1.35k
            U32* rankValPtr = rankVal[consumed];
1937
11.3k
            for (w = 1; w <= maxW; w++)
1938
10.0k
            {
1939
10.0k
                rankValPtr[w] = rankVal0[w] >> consumed;
1940
10.0k
            }
1941
1.35k
        }
1942
150
    }
1943
1944
150
    HUF_fillDTableX4(dt, memLog,
1945
150
                   sortedSymbol, sizeOfSort,
1946
150
                   rankStart0, rankVal, maxW,
1947
150
                   tableLog+1);
1948
1949
150
    return iSize;
1950
150
}
1951
1952
1953
static U32 HUF_decodeSymbolX4(void* op, BIT_DStream_t* DStream, const HUF_DEltX4* dt, const U32 dtLog)
1954
1.35M
{
1955
1.35M
    const size_t val = BIT_lookBitsFast(DStream, dtLog);   /* note : dtLog >= 1 */
1956
1.35M
    memcpy(op, dt+val, 2);
1957
1.35M
    BIT_skipBits(DStream, dt[val].nbBits);
1958
1.35M
    return dt[val].length;
1959
1.35M
}
1960
1961
static U32 HUF_decodeLastSymbolX4(void* op, BIT_DStream_t* DStream, const HUF_DEltX4* dt, const U32 dtLog)
1962
221
{
1963
221
    const size_t val = BIT_lookBitsFast(DStream, dtLog);   /* note : dtLog >= 1 */
1964
221
    memcpy(op, dt+val, 1);
1965
221
    if (dt[val].length==1) BIT_skipBits(DStream, dt[val].nbBits);
1966
127
    else
1967
127
    {
1968
127
        if (DStream->bitsConsumed < (sizeof(DStream->bitContainer)*8))
1969
66
        {
1970
66
            BIT_skipBits(DStream, dt[val].nbBits);
1971
66
            if (DStream->bitsConsumed > (sizeof(DStream->bitContainer)*8))
1972
13
                DStream->bitsConsumed = (sizeof(DStream->bitContainer)*8);   /* ugly hack; works only because it's the last symbol. Note : can't easily extract nbBits from just this symbol */
1973
66
        }
1974
127
    }
1975
221
    return 1;
1976
221
}
1977
1978
1979
#define HUF_DECODE_SYMBOLX4_0(ptr, DStreamPtr) \
1980
693k
    ptr += HUF_decodeSymbolX4(ptr, DStreamPtr, dt, dtLog)
1981
1982
#define HUF_DECODE_SYMBOLX4_1(ptr, DStreamPtr) \
1983
221k
    if (MEM_64bits() || (HUF_MAX_TABLELOG<=12)) \
1984
221k
        ptr += HUF_decodeSymbolX4(ptr, DStreamPtr, dt, dtLog)
1985
1986
#define HUF_DECODE_SYMBOLX4_2(ptr, DStreamPtr) \
1987
443k
    if (MEM_64bits()) \
1988
443k
        ptr += HUF_decodeSymbolX4(ptr, DStreamPtr, dt, dtLog)
1989
1990
static inline size_t HUF_decodeStreamX4(BYTE* p, BIT_DStream_t* bitDPtr, BYTE* const pEnd, const HUF_DEltX4* const dt, const U32 dtLog)
1991
372
{
1992
372
    BYTE* const pStart = p;
1993
1994
    /* up to 8 symbols at a time */
1995
157k
    while ((BIT_reloadDStream(bitDPtr) == BIT_DStream_unfinished) && (p < pEnd-7))
1996
157k
    {
1997
157k
        HUF_DECODE_SYMBOLX4_2(p, bitDPtr);
1998
157k
        HUF_DECODE_SYMBOLX4_1(p, bitDPtr);
1999
157k
        HUF_DECODE_SYMBOLX4_2(p, bitDPtr);
2000
157k
        HUF_DECODE_SYMBOLX4_0(p, bitDPtr);
2001
157k
    }
2002
2003
    /* closer to the end */
2004
590
    while ((BIT_reloadDStream(bitDPtr) == BIT_DStream_unfinished) && (p <= pEnd-2))
2005
218
        HUF_DECODE_SYMBOLX4_0(p, bitDPtr);
2006
2007
471k
    while (p <= pEnd-2)
2008
471k
        HUF_DECODE_SYMBOLX4_0(p, bitDPtr);   /* no need to reload : reached the end of DStream */
2009
2010
372
    if (p < pEnd)
2011
221
        p += HUF_decodeLastSymbolX4(p, bitDPtr, dt, dtLog);
2012
2013
372
    return p-pStart;
2014
372
}
2015
2016
2017
2018
static size_t HUF_decompress4X4_usingDTable(
2019
          void* dst,  size_t dstSize,
2020
    const void* cSrc, size_t cSrcSize,
2021
    const U32* DTable)
2022
150
{
2023
150
    if (cSrcSize < 10) return ERROR(corruption_detected);   /* strict minimum : jump table + 1 byte per stream */
2024
2025
150
    {
2026
150
        const BYTE* const istart = (const BYTE*) cSrc;
2027
150
        BYTE* const ostart = (BYTE*) dst;
2028
150
        BYTE* const oend = ostart + dstSize;
2029
2030
150
        const void* ptr = DTable;
2031
150
        const HUF_DEltX4* const dt = ((const HUF_DEltX4*)ptr) +1;
2032
150
        const U32 dtLog = DTable[0];
2033
150
        size_t errorCode;
2034
2035
        /* Init */
2036
150
        BIT_DStream_t bitD1;
2037
150
        BIT_DStream_t bitD2;
2038
150
        BIT_DStream_t bitD3;
2039
150
        BIT_DStream_t bitD4;
2040
150
        const size_t length1 = MEM_readLE16(istart);
2041
150
        const size_t length2 = MEM_readLE16(istart+2);
2042
150
        const size_t length3 = MEM_readLE16(istart+4);
2043
150
        size_t length4;
2044
150
        const BYTE* const istart1 = istart + 6;  /* jumpTable */
2045
150
        const BYTE* const istart2 = istart1 + length1;
2046
150
        const BYTE* const istart3 = istart2 + length2;
2047
150
        const BYTE* const istart4 = istart3 + length3;
2048
150
        const size_t segmentSize = (dstSize+3) / 4;
2049
150
        BYTE* const opStart2 = ostart + segmentSize;
2050
150
        BYTE* const opStart3 = opStart2 + segmentSize;
2051
150
        BYTE* const opStart4 = opStart3 + segmentSize;
2052
150
        BYTE* op1 = ostart;
2053
150
        BYTE* op2 = opStart2;
2054
150
        BYTE* op3 = opStart3;
2055
150
        BYTE* op4 = opStart4;
2056
150
        U32 endSignal;
2057
2058
150
        length4 = cSrcSize - (length1 + length2 + length3 + 6);
2059
150
        if (length4 > cSrcSize) return ERROR(corruption_detected);   /* overflow */
2060
121
        errorCode = BIT_initDStream(&bitD1, istart1, length1);
2061
121
        if (HUF_isError(errorCode)) return errorCode;
2062
115
        errorCode = BIT_initDStream(&bitD2, istart2, length2);
2063
115
        if (HUF_isError(errorCode)) return errorCode;
2064
108
        errorCode = BIT_initDStream(&bitD3, istart3, length3);
2065
108
        if (HUF_isError(errorCode)) return errorCode;
2066
102
        errorCode = BIT_initDStream(&bitD4, istart4, length4);
2067
102
        if (HUF_isError(errorCode)) return errorCode;
2068
2069
        /* 16-32 symbols per loop (4-8 symbols per stream) */
2070
96
        endSignal = BIT_reloadDStream(&bitD1) | BIT_reloadDStream(&bitD2) | BIT_reloadDStream(&bitD3) | BIT_reloadDStream(&bitD4);
2071
16.2k
        for ( ; (endSignal==BIT_DStream_unfinished) && (op4<(oend-7)) ; )
2072
16.1k
        {
2073
16.1k
            HUF_DECODE_SYMBOLX4_2(op1, &bitD1);
2074
16.1k
            HUF_DECODE_SYMBOLX4_2(op2, &bitD2);
2075
16.1k
            HUF_DECODE_SYMBOLX4_2(op3, &bitD3);
2076
16.1k
            HUF_DECODE_SYMBOLX4_2(op4, &bitD4);
2077
16.1k
            HUF_DECODE_SYMBOLX4_1(op1, &bitD1);
2078
16.1k
            HUF_DECODE_SYMBOLX4_1(op2, &bitD2);
2079
16.1k
            HUF_DECODE_SYMBOLX4_1(op3, &bitD3);
2080
16.1k
            HUF_DECODE_SYMBOLX4_1(op4, &bitD4);
2081
16.1k
            HUF_DECODE_SYMBOLX4_2(op1, &bitD1);
2082
16.1k
            HUF_DECODE_SYMBOLX4_2(op2, &bitD2);
2083
16.1k
            HUF_DECODE_SYMBOLX4_2(op3, &bitD3);
2084
16.1k
            HUF_DECODE_SYMBOLX4_2(op4, &bitD4);
2085
16.1k
            HUF_DECODE_SYMBOLX4_0(op1, &bitD1);
2086
16.1k
            HUF_DECODE_SYMBOLX4_0(op2, &bitD2);
2087
16.1k
            HUF_DECODE_SYMBOLX4_0(op3, &bitD3);
2088
16.1k
            HUF_DECODE_SYMBOLX4_0(op4, &bitD4);
2089
2090
16.1k
            endSignal = BIT_reloadDStream(&bitD1) | BIT_reloadDStream(&bitD2) | BIT_reloadDStream(&bitD3) | BIT_reloadDStream(&bitD4);
2091
16.1k
        }
2092
2093
        /* check corruption */
2094
96
        if (op1 > opStart2) return ERROR(corruption_detected);
2095
95
        if (op2 > opStart3) return ERROR(corruption_detected);
2096
94
        if (op3 > opStart4) return ERROR(corruption_detected);
2097
        /* note : op4 supposed already verified within main loop */
2098
2099
        /* finish bitStreams one by one */
2100
93
        HUF_decodeStreamX4(op1, &bitD1, opStart2, dt, dtLog);
2101
93
        HUF_decodeStreamX4(op2, &bitD2, opStart3, dt, dtLog);
2102
93
        HUF_decodeStreamX4(op3, &bitD3, opStart4, dt, dtLog);
2103
93
        HUF_decodeStreamX4(op4, &bitD4, oend,     dt, dtLog);
2104
2105
        /* check */
2106
93
        endSignal = BIT_endOfDStream(&bitD1) & BIT_endOfDStream(&bitD2) & BIT_endOfDStream(&bitD3) & BIT_endOfDStream(&bitD4);
2107
93
        if (!endSignal) return ERROR(corruption_detected);
2108
2109
        /* decoded size */
2110
1
        return dstSize;
2111
93
    }
2112
93
}
2113
2114
2115
static size_t HUF_decompress4X4 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize)
2116
156
{
2117
156
    HUF_CREATE_STATIC_DTABLEX4(DTable, HUF_MAX_TABLELOG);
2118
156
    const BYTE* ip = (const BYTE*) cSrc;
2119
2120
156
    size_t hSize = HUF_readDTableX4 (DTable, cSrc, cSrcSize);
2121
156
    if (HUF_isError(hSize)) return hSize;
2122
150
    if (hSize >= cSrcSize) return ERROR(srcSize_wrong);
2123
150
    ip += hSize;
2124
150
    cSrcSize -= hSize;
2125
2126
150
    return HUF_decompress4X4_usingDTable (dst, dstSize, ip, cSrcSize, DTable);
2127
150
}
2128
2129
2130
/**********************************/
2131
/* quad-symbol decoding           */
2132
/**********************************/
2133
typedef struct { BYTE nbBits; BYTE nbBytes; } HUF_DDescX6;
2134
typedef union { BYTE byte[4]; U32 sequence; } HUF_DSeqX6;
2135
2136
/* recursive, up to level 3; may benefit from <template>-like strategy to nest each level inline */
2137
static void HUF_fillDTableX6LevelN(HUF_DDescX6* DDescription, HUF_DSeqX6* DSequence, int sizeLog,
2138
                           const rankVal_t rankValOrigin, const U32 consumed, const int minWeight, const U32 maxWeight,
2139
                           const sortedSymbol_t* sortedSymbols, const U32 sortedListSize, const U32* rankStart,
2140
                           const U32 nbBitsBaseline, HUF_DSeqX6 baseSeq, HUF_DDescX6 DDesc)
2141
18.1k
{
2142
18.1k
    const int scaleLog = nbBitsBaseline - sizeLog;   /* note : targetLog >= (nbBitsBaseline-1), hence scaleLog <= 1 */
2143
18.1k
    const int minBits  = nbBitsBaseline - maxWeight;
2144
18.1k
    const U32 level = DDesc.nbBytes;
2145
18.1k
    U32 rankVal[HUF_ABSOLUTEMAX_TABLELOG + 1];
2146
18.1k
    U32 symbolStartPos, s;
2147
2148
    /* local rankVal, will be modified */
2149
18.1k
    memcpy(rankVal, rankValOrigin[consumed], sizeof(rankVal));
2150
2151
    /* fill skipped values */
2152
18.1k
    if (minWeight>1)
2153
16.2k
    {
2154
16.2k
        U32 i;
2155
16.2k
        const U32 skipSize = rankVal[minWeight];
2156
149k
        for (i = 0; i < skipSize; i++)
2157
133k
        {
2158
133k
            DSequence[i] = baseSeq;
2159
133k
            DDescription[i] = DDesc;
2160
133k
        }
2161
16.2k
    }
2162
2163
    /* fill DTable */
2164
18.1k
    DDesc.nbBytes++;
2165
18.1k
    symbolStartPos = rankStart[minWeight];
2166
94.7k
    for (s=symbolStartPos; s<sortedListSize; s++)
2167
76.6k
    {
2168
76.6k
        const BYTE symbol = sortedSymbols[s].symbol;
2169
76.6k
        const U32  weight = sortedSymbols[s].weight;   /* >= 1 (sorted) */
2170
76.6k
        const int  nbBits = nbBitsBaseline - weight;   /* >= 1 (by construction) */
2171
76.6k
        const int  totalBits = consumed+nbBits;
2172
76.6k
        const U32  start  = rankVal[weight];
2173
76.6k
        const U32  length = 1 << (sizeLog-nbBits);
2174
76.6k
        baseSeq.byte[level] = symbol;
2175
76.6k
        DDesc.nbBits = (BYTE)totalBits;
2176
2177
76.6k
        if ((level<3) && (sizeLog-totalBits >= minBits))   /* enough room for another symbol */
2178
17.9k
        {
2179
17.9k
            int nextMinWeight = totalBits + scaleLog;
2180
17.9k
            if (nextMinWeight < 1) nextMinWeight = 1;
2181
17.9k
            HUF_fillDTableX6LevelN(DDescription+start, DSequence+start, sizeLog-nbBits,
2182
17.9k
                           rankValOrigin, totalBits, nextMinWeight, maxWeight,
2183
17.9k
                           sortedSymbols, sortedListSize, rankStart,
2184
17.9k
                           nbBitsBaseline, baseSeq, DDesc);   /* recursive (max : level 3) */
2185
17.9k
        }
2186
58.6k
        else
2187
58.6k
        {
2188
58.6k
            U32 i;
2189
58.6k
            const U32 end = start + length;
2190
519k
            for (i = start; i < end; i++)
2191
460k
            {
2192
460k
                DDescription[i] = DDesc;
2193
460k
                DSequence[i] = baseSeq;
2194
460k
            }
2195
58.6k
        }
2196
76.6k
        rankVal[weight] += length;
2197
76.6k
    }
2198
18.1k
}
2199
2200
2201
/* note : same preparation as X4 */
2202
static size_t HUF_readDTableX6 (U32* DTable, const void* src, size_t srcSize)
2203
151
{
2204
151
    BYTE weightList[HUF_MAX_SYMBOL_VALUE + 1];
2205
151
    sortedSymbol_t sortedSymbol[HUF_MAX_SYMBOL_VALUE + 1];
2206
151
    U32 rankStats[HUF_ABSOLUTEMAX_TABLELOG + 1] = { 0 };
2207
151
    U32 rankStart0[HUF_ABSOLUTEMAX_TABLELOG + 2] = { 0 };
2208
151
    U32* const rankStart = rankStart0+1;
2209
151
    U32 tableLog, maxW, sizeOfSort, nbSymbols;
2210
151
    rankVal_t rankVal;
2211
151
    const U32 memLog = DTable[0];
2212
151
    const BYTE* ip = (const BYTE*) src;
2213
151
    size_t iSize = ip[0];
2214
2215
151
    if (memLog > HUF_ABSOLUTEMAX_TABLELOG) return ERROR(tableLog_tooLarge);
2216
    //memset(weightList, 0, sizeof(weightList));   /* is not necessary, even though some analyzer complain ... */
2217
2218
151
    iSize = HUF_readStats(weightList, HUF_MAX_SYMBOL_VALUE + 1, rankStats, &nbSymbols, &tableLog, src, srcSize);
2219
151
    if (HUF_isError(iSize)) return iSize;
2220
2221
    /* check result */
2222
146
    if (tableLog > memLog) return ERROR(tableLog_tooLarge);   /* DTable is too small */
2223
2224
    /* find maxWeight */
2225
232
    for (maxW = tableLog; rankStats[maxW]==0; maxW--)
2226
87
        { if (!maxW) return ERROR(GENERIC); }  /* necessarily finds a solution before maxW==0 */
2227
2228
2229
    /* Get start index of each weight */
2230
145
    {
2231
145
        U32 w, nextRankStart = 0;
2232
1.10k
        for (w=1; w<=maxW; w++)
2233
956
        {
2234
956
            U32 current = nextRankStart;
2235
956
            nextRankStart += rankStats[w];
2236
956
            rankStart[w] = current;
2237
956
        }
2238
145
        rankStart[0] = nextRankStart;   /* put all 0w symbols at the end of sorted list*/
2239
145
        sizeOfSort = nextRankStart;
2240
145
    }
2241
2242
    /* sort symbols by weight */
2243
145
    {
2244
145
        U32 s;
2245
13.1k
        for (s=0; s<nbSymbols; s++)
2246
12.9k
        {
2247
12.9k
            U32 w = weightList[s];
2248
12.9k
            U32 r = rankStart[w]++;
2249
12.9k
            sortedSymbol[r].symbol = (BYTE)s;
2250
12.9k
            sortedSymbol[r].weight = (BYTE)w;
2251
12.9k
        }
2252
145
        rankStart[0] = 0;   /* forget 0w symbols; this is beginning of weight(1) */
2253
145
    }
2254
2255
    /* Build rankVal */
2256
145
    {
2257
145
        const U32 minBits = tableLog+1 - maxW;
2258
145
        U32 nextRankVal = 0;
2259
145
        U32 w, consumed;
2260
145
        const int rescale = (memLog-tableLog) - 1;   /* tableLog <= memLog */
2261
145
        U32* rankVal0 = rankVal[0];
2262
1.10k
        for (w=1; w<=maxW; w++)
2263
956
        {
2264
956
            U32 current = nextRankVal;
2265
956
            nextRankVal += rankStats[w] << (w+rescale);
2266
956
            rankVal0[w] = current;
2267
956
        }
2268
1.56k
        for (consumed = minBits; consumed <= memLog - minBits; consumed++)
2269
1.42k
        {
2270
1.42k
            U32* rankValPtr = rankVal[consumed];
2271
11.4k
            for (w = 1; w <= maxW; w++)
2272
9.99k
            {
2273
9.99k
                rankValPtr[w] = rankVal0[w] >> consumed;
2274
9.99k
            }
2275
1.42k
        }
2276
145
    }
2277
2278
2279
    /* fill tables */
2280
145
    {
2281
145
        void* ptr = DTable+1;
2282
145
        HUF_DDescX6* DDescription = (HUF_DDescX6*)(ptr);
2283
145
        void* dSeqStart = DTable + 1 + ((size_t)1<<(memLog-1));
2284
145
        HUF_DSeqX6* DSequence = (HUF_DSeqX6*)(dSeqStart);
2285
145
        HUF_DSeqX6 DSeq;
2286
145
        HUF_DDescX6 DDesc;
2287
145
        DSeq.sequence = 0;
2288
145
        DDesc.nbBits = 0;
2289
145
        DDesc.nbBytes = 0;
2290
145
        HUF_fillDTableX6LevelN(DDescription, DSequence, memLog,
2291
145
                       (const U32 (*)[HUF_ABSOLUTEMAX_TABLELOG + 1])rankVal, 0, 1, maxW,
2292
145
                       sortedSymbol, sizeOfSort, rankStart0,
2293
145
                       tableLog+1, DSeq, DDesc);
2294
145
    }
2295
2296
145
    return iSize;
2297
145
}
2298
2299
2300
static U32 HUF_decodeSymbolX6(void* op, BIT_DStream_t* DStream, const HUF_DDescX6* dd, const HUF_DSeqX6* ds, const U32 dtLog)
2301
1.03M
{
2302
1.03M
    const size_t val = BIT_lookBitsFast(DStream, dtLog);   /* note : dtLog >= 1 */
2303
1.03M
    memcpy(op, ds+val, sizeof(HUF_DSeqX6));
2304
1.03M
    BIT_skipBits(DStream, dd[val].nbBits);
2305
1.03M
    return dd[val].nbBytes;
2306
1.03M
}
2307
2308
static U32 HUF_decodeLastSymbolsX6(void* op, const U32 maxL, BIT_DStream_t* DStream,
2309
                                  const HUF_DDescX6* dd, const HUF_DSeqX6* ds, const U32 dtLog)
2310
442
{
2311
442
    const size_t val = BIT_lookBitsFast(DStream, dtLog);   /* note : dtLog >= 1 */
2312
442
    U32 length = dd[val].nbBytes;
2313
442
    if (length <= maxL)
2314
273
    {
2315
273
        memcpy(op, ds+val, length);
2316
273
        BIT_skipBits(DStream, dd[val].nbBits);
2317
273
        return length;
2318
273
    }
2319
169
    memcpy(op, ds+val, maxL);
2320
169
    if (DStream->bitsConsumed < (sizeof(DStream->bitContainer)*8))
2321
69
    {
2322
69
        BIT_skipBits(DStream, dd[val].nbBits);
2323
69
        if (DStream->bitsConsumed > (sizeof(DStream->bitContainer)*8))
2324
15
            DStream->bitsConsumed = (sizeof(DStream->bitContainer)*8);   /* ugly hack; works only because it's the last symbol. Note : can't easily extract nbBits from just this symbol */
2325
69
    }
2326
169
    return maxL;
2327
442
}
2328
2329
2330
#define HUF_DECODE_SYMBOLX6_0(ptr, DStreamPtr) \
2331
1.28M
    ptr += HUF_decodeSymbolX6(ptr, DStreamPtr, dd, ds, dtLog)
2332
2333
#define HUF_DECODE_SYMBOLX6_1(ptr, DStreamPtr) \
2334
84.0k
    if (MEM_64bits() || (HUF_MAX_TABLELOG<=12)) \
2335
84.0k
        HUF_DECODE_SYMBOLX6_0(ptr, DStreamPtr)
2336
2337
#define HUF_DECODE_SYMBOLX6_2(ptr, DStreamPtr) \
2338
168k
    if (MEM_64bits()) \
2339
168k
        HUF_DECODE_SYMBOLX6_0(ptr, DStreamPtr)
2340
2341
static inline size_t HUF_decodeStreamX6(BYTE* p, BIT_DStream_t* bitDPtr, BYTE* const pEnd, const U32* DTable, const U32 dtLog)
2342
328
{
2343
328
    const void* ddPtr = DTable+1;
2344
328
    const HUF_DDescX6* dd = (const HUF_DDescX6*)(ddPtr);
2345
328
    const void* dsPtr = DTable + 1 + ((size_t)1<<(dtLog-1));
2346
328
    const HUF_DSeqX6* ds = (const HUF_DSeqX6*)(dsPtr);
2347
328
    BYTE* const pStart = p;
2348
2349
    /* up to 16 symbols at a time */
2350
72.6k
    while ((BIT_reloadDStream(bitDPtr) == BIT_DStream_unfinished) && (p <= pEnd-16))
2351
72.3k
    {
2352
72.3k
        HUF_DECODE_SYMBOLX6_2(p, bitDPtr);
2353
72.3k
        HUF_DECODE_SYMBOLX6_1(p, bitDPtr);
2354
72.3k
        HUF_DECODE_SYMBOLX6_2(p, bitDPtr);
2355
72.3k
        HUF_DECODE_SYMBOLX6_0(p, bitDPtr);
2356
72.3k
    }
2357
2358
    /* closer to the end, up to 4 symbols at a time */
2359
541
    while ((BIT_reloadDStream(bitDPtr) == BIT_DStream_unfinished) && (p <= pEnd-4))
2360
213
        HUF_DECODE_SYMBOLX6_0(p, bitDPtr);
2361
2362
694k
    while (p <= pEnd-4)
2363
693k
        HUF_DECODE_SYMBOLX6_0(p, bitDPtr);   /* no need to reload : reached the end of DStream */
2364
2365
770
    while (p < pEnd)
2366
442
        p += HUF_decodeLastSymbolsX6(p, (U32)(pEnd-p), bitDPtr, dd, ds, dtLog);
2367
2368
328
    return p-pStart;
2369
328
}
2370
2371
2372
2373
static size_t HUF_decompress4X6_usingDTable(
2374
          void* dst,  size_t dstSize,
2375
    const void* cSrc, size_t cSrcSize,
2376
    const U32* DTable)
2377
145
{
2378
145
    if (cSrcSize < 10) return ERROR(corruption_detected);   /* strict minimum : jump table + 1 byte per stream */
2379
2380
145
    {
2381
145
        const BYTE* const istart = (const BYTE*) cSrc;
2382
145
        BYTE* const ostart = (BYTE*) dst;
2383
145
        BYTE* const oend = ostart + dstSize;
2384
2385
145
        const U32 dtLog = DTable[0];
2386
145
        const void* ddPtr = DTable+1;
2387
145
        const HUF_DDescX6* dd = (const HUF_DDescX6*)(ddPtr);
2388
145
        const void* dsPtr = DTable + 1 + ((size_t)1<<(dtLog-1));
2389
145
        const HUF_DSeqX6* ds = (const HUF_DSeqX6*)(dsPtr);
2390
145
        size_t errorCode;
2391
2392
        /* Init */
2393
145
        BIT_DStream_t bitD1;
2394
145
        BIT_DStream_t bitD2;
2395
145
        BIT_DStream_t bitD3;
2396
145
        BIT_DStream_t bitD4;
2397
145
        const size_t length1 = MEM_readLE16(istart);
2398
145
        const size_t length2 = MEM_readLE16(istart+2);
2399
145
        const size_t length3 = MEM_readLE16(istart+4);
2400
145
        size_t length4;
2401
145
        const BYTE* const istart1 = istart + 6;  /* jumpTable */
2402
145
        const BYTE* const istart2 = istart1 + length1;
2403
145
        const BYTE* const istart3 = istart2 + length2;
2404
145
        const BYTE* const istart4 = istart3 + length3;
2405
145
        const size_t segmentSize = (dstSize+3) / 4;
2406
145
        BYTE* const opStart2 = ostart + segmentSize;
2407
145
        BYTE* const opStart3 = opStart2 + segmentSize;
2408
145
        BYTE* const opStart4 = opStart3 + segmentSize;
2409
145
        BYTE* op1 = ostart;
2410
145
        BYTE* op2 = opStart2;
2411
145
        BYTE* op3 = opStart3;
2412
145
        BYTE* op4 = opStart4;
2413
145
        U32 endSignal;
2414
2415
145
        length4 = cSrcSize - (length1 + length2 + length3 + 6);
2416
145
        if (length4 > cSrcSize) return ERROR(corruption_detected);   /* overflow */
2417
113
        errorCode = BIT_initDStream(&bitD1, istart1, length1);
2418
113
        if (HUF_isError(errorCode)) return errorCode;
2419
106
        errorCode = BIT_initDStream(&bitD2, istart2, length2);
2420
106
        if (HUF_isError(errorCode)) return errorCode;
2421
100
        errorCode = BIT_initDStream(&bitD3, istart3, length3);
2422
100
        if (HUF_isError(errorCode)) return errorCode;
2423
92
        errorCode = BIT_initDStream(&bitD4, istart4, length4);
2424
92
        if (HUF_isError(errorCode)) return errorCode;
2425
2426
        /* 16-64 symbols per loop (4-16 symbols per stream) */
2427
85
        endSignal = BIT_reloadDStream(&bitD1) | BIT_reloadDStream(&bitD2) | BIT_reloadDStream(&bitD3) | BIT_reloadDStream(&bitD4);
2428
3.00k
        for ( ; (op3 <= opStart4) && (endSignal==BIT_DStream_unfinished) && (op4<=(oend-16)) ; )
2429
2.92k
        {
2430
2.92k
            HUF_DECODE_SYMBOLX6_2(op1, &bitD1);
2431
2.92k
            HUF_DECODE_SYMBOLX6_2(op2, &bitD2);
2432
2.92k
            HUF_DECODE_SYMBOLX6_2(op3, &bitD3);
2433
2.92k
            HUF_DECODE_SYMBOLX6_2(op4, &bitD4);
2434
2.92k
            HUF_DECODE_SYMBOLX6_1(op1, &bitD1);
2435
2.92k
            HUF_DECODE_SYMBOLX6_1(op2, &bitD2);
2436
2.92k
            HUF_DECODE_SYMBOLX6_1(op3, &bitD3);
2437
2.92k
            HUF_DECODE_SYMBOLX6_1(op4, &bitD4);
2438
2.92k
            HUF_DECODE_SYMBOLX6_2(op1, &bitD1);
2439
2.92k
            HUF_DECODE_SYMBOLX6_2(op2, &bitD2);
2440
2.92k
            HUF_DECODE_SYMBOLX6_2(op3, &bitD3);
2441
2.92k
            HUF_DECODE_SYMBOLX6_2(op4, &bitD4);
2442
2.92k
            HUF_DECODE_SYMBOLX6_0(op1, &bitD1);
2443
2.92k
            HUF_DECODE_SYMBOLX6_0(op2, &bitD2);
2444
2.92k
            HUF_DECODE_SYMBOLX6_0(op3, &bitD3);
2445
2.92k
            HUF_DECODE_SYMBOLX6_0(op4, &bitD4);
2446
2447
2.92k
            endSignal = BIT_reloadDStream(&bitD1) | BIT_reloadDStream(&bitD2) | BIT_reloadDStream(&bitD3) | BIT_reloadDStream(&bitD4);
2448
2.92k
        }
2449
2450
        /* check corruption */
2451
85
        if (op1 > opStart2) return ERROR(corruption_detected);
2452
84
        if (op2 > opStart3) return ERROR(corruption_detected);
2453
83
        if (op3 > opStart4) return ERROR(corruption_detected);
2454
        /* note : op4 supposed already verified within main loop */
2455
2456
        /* finish bitStreams one by one */
2457
82
        HUF_decodeStreamX6(op1, &bitD1, opStart2, DTable, dtLog);
2458
82
        HUF_decodeStreamX6(op2, &bitD2, opStart3, DTable, dtLog);
2459
82
        HUF_decodeStreamX6(op3, &bitD3, opStart4, DTable, dtLog);
2460
82
        HUF_decodeStreamX6(op4, &bitD4, oend,     DTable, dtLog);
2461
2462
        /* check */
2463
82
        endSignal = BIT_endOfDStream(&bitD1) & BIT_endOfDStream(&bitD2) & BIT_endOfDStream(&bitD3) & BIT_endOfDStream(&bitD4);
2464
82
        if (!endSignal) return ERROR(corruption_detected);
2465
2466
        /* decoded size */
2467
2
        return dstSize;
2468
82
    }
2469
82
}
2470
2471
2472
static size_t HUF_decompress4X6 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize)
2473
151
{
2474
151
    HUF_CREATE_STATIC_DTABLEX6(DTable, HUF_MAX_TABLELOG);
2475
151
    const BYTE* ip = (const BYTE*) cSrc;
2476
2477
151
    size_t hSize = HUF_readDTableX6 (DTable, cSrc, cSrcSize);
2478
151
    if (HUF_isError(hSize)) return hSize;
2479
145
    if (hSize >= cSrcSize) return ERROR(srcSize_wrong);
2480
145
    ip += hSize;
2481
145
    cSrcSize -= hSize;
2482
2483
145
    return HUF_decompress4X6_usingDTable (dst, dstSize, ip, cSrcSize, DTable);
2484
145
}
2485
2486
2487
/**********************************/
2488
/* Generic decompression selector */
2489
/**********************************/
2490
2491
typedef struct { U32 tableTime; U32 decode256Time; } algo_time_t;
2492
static const algo_time_t algoTime[16 /* Quantization */][3 /* single, double, quad */] =
2493
{
2494
    /* single, double, quad */
2495
    {{0,0}, {1,1}, {2,2}},  /* Q==0 : impossible */
2496
    {{0,0}, {1,1}, {2,2}},  /* Q==1 : impossible */
2497
    {{  38,130}, {1313, 74}, {2151, 38}},   /* Q == 2 : 12-18% */
2498
    {{ 448,128}, {1353, 74}, {2238, 41}},   /* Q == 3 : 18-25% */
2499
    {{ 556,128}, {1353, 74}, {2238, 47}},   /* Q == 4 : 25-32% */
2500
    {{ 714,128}, {1418, 74}, {2436, 53}},   /* Q == 5 : 32-38% */
2501
    {{ 883,128}, {1437, 74}, {2464, 61}},   /* Q == 6 : 38-44% */
2502
    {{ 897,128}, {1515, 75}, {2622, 68}},   /* Q == 7 : 44-50% */
2503
    {{ 926,128}, {1613, 75}, {2730, 75}},   /* Q == 8 : 50-56% */
2504
    {{ 947,128}, {1729, 77}, {3359, 77}},   /* Q == 9 : 56-62% */
2505
    {{1107,128}, {2083, 81}, {4006, 84}},   /* Q ==10 : 62-69% */
2506
    {{1177,128}, {2379, 87}, {4785, 88}},   /* Q ==11 : 69-75% */
2507
    {{1242,128}, {2415, 93}, {5155, 84}},   /* Q ==12 : 75-81% */
2508
    {{1349,128}, {2644,106}, {5260,106}},   /* Q ==13 : 81-87% */
2509
    {{1455,128}, {2422,124}, {4174,124}},   /* Q ==14 : 87-93% */
2510
    {{ 722,128}, {1891,145}, {1936,146}},   /* Q ==15 : 93-99% */
2511
};
2512
2513
typedef size_t (*decompressionAlgo)(void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize);
2514
2515
static size_t HUF_decompress (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize)
2516
1.53k
{
2517
1.53k
    static const decompressionAlgo decompress[3] = { HUF_decompress4X2, HUF_decompress4X4, HUF_decompress4X6 };
2518
    /* estimate decompression time */
2519
1.53k
    U32 Q;
2520
1.53k
    const U32 D256 = (U32)(dstSize >> 8);
2521
1.53k
    U32 Dtime[3];
2522
1.53k
    U32 algoNb = 0;
2523
1.53k
    int n;
2524
2525
    /* validation checks */
2526
1.53k
    if (dstSize == 0) return ERROR(dstSize_tooSmall);
2527
1.53k
    if (cSrcSize > dstSize) return ERROR(corruption_detected);   /* invalid */
2528
1.52k
    if (cSrcSize == dstSize) { memcpy(dst, cSrc, dstSize); return dstSize; }   /* not compressed */
2529
1.32k
    if (cSrcSize == 1) { memset(dst, *(const BYTE*)cSrc, dstSize); return dstSize; }   /* RLE */
2530
2531
    /* decoder timing evaluation */
2532
1.10k
    Q = (U32)(cSrcSize * 16 / dstSize);   /* Q < 16 since dstSize > cSrcSize */
2533
4.42k
    for (n=0; n<3; n++)
2534
3.32k
        Dtime[n] = algoTime[Q][n].tableTime + (algoTime[Q][n].decode256Time * D256);
2535
2536
1.10k
    Dtime[1] += Dtime[1] >> 4; Dtime[2] += Dtime[2] >> 3; /* advantage to algorithms using less memory, for cache eviction */
2537
2538
1.10k
    if (Dtime[1] < Dtime[0]) algoNb = 1;
2539
1.10k
    if (Dtime[2] < Dtime[algoNb]) algoNb = 2;
2540
2541
1.10k
    return decompress[algoNb](dst, dstSize, cSrc, cSrcSize);
2542
2543
    //return HUF_decompress4X2(dst, dstSize, cSrc, cSrcSize);   /* multi-streams single-symbol decoding */
2544
    //return HUF_decompress4X4(dst, dstSize, cSrc, cSrcSize);   /* multi-streams double-symbols decoding */
2545
    //return HUF_decompress4X6(dst, dstSize, cSrc, cSrcSize);   /* multi-streams quad-symbols decoding */
2546
1.32k
}
2547
/*
2548
    zstd - standard compression library
2549
    Copyright (C) 2014-2015, Yann Collet.
2550
2551
    BSD 2-Clause License (https://opensource.org/licenses/bsd-license.php)
2552
2553
    Redistribution and use in source and binary forms, with or without
2554
    modification, are permitted provided that the following conditions are
2555
    met:
2556
    * Redistributions of source code must retain the above copyright
2557
    notice, this list of conditions and the following disclaimer.
2558
    * Redistributions in binary form must reproduce the above
2559
    copyright notice, this list of conditions and the following disclaimer
2560
    in the documentation and/or other materials provided with the
2561
    distribution.
2562
    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
2563
    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
2564
    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
2565
    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
2566
    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
2567
    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
2568
    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
2569
    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
2570
    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
2571
    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
2572
    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
2573
2574
    You can contact the author at :
2575
    - zstd source repository : https://github.com/Cyan4973/zstd
2576
    - ztsd public forum : https://groups.google.com/forum/#!forum/lz4c
2577
*/
2578
2579
/* ***************************************************************
2580
*  Tuning parameters
2581
*****************************************************************/
2582
/*!
2583
*  MEMORY_USAGE :
2584
*  Memory usage formula : N->2^N Bytes (examples : 10 -> 1KB; 12 -> 4KB ; 16 -> 64KB; 20 -> 1MB; etc.)
2585
*  Increasing memory usage improves compression ratio
2586
*  Reduced memory usage can improve speed, due to cache effect
2587
*/
2588
#define ZSTD_MEMORY_USAGE 17
2589
2590
/*!
2591
 * HEAPMODE :
2592
 * Select how default compression functions will allocate memory for their hash table,
2593
 * in memory stack (0, fastest), or in memory heap (1, requires malloc())
2594
 * Note that compression context is fairly large, as a consequence heap memory is recommended.
2595
 */
2596
#ifndef ZSTD_HEAPMODE
2597
#  define ZSTD_HEAPMODE 1
2598
#endif /* ZSTD_HEAPMODE */
2599
2600
/*!
2601
*  LEGACY_SUPPORT :
2602
*  decompressor can decode older formats (starting from Zstd 0.1+)
2603
*/
2604
#ifndef ZSTD_LEGACY_SUPPORT
2605
#  define ZSTD_LEGACY_SUPPORT 1
2606
#endif
2607
2608
2609
/* *******************************************************
2610
*  Includes
2611
*********************************************************/
2612
#include <stdlib.h>      /* calloc */
2613
#include <string.h>      /* memcpy, memmove */
2614
#include <stdio.h>       /* debug : printf */
2615
2616
2617
/* *******************************************************
2618
*  Compiler specifics
2619
*********************************************************/
2620
#ifdef __AVX2__
2621
#  include <immintrin.h>   /* AVX2 intrinsics */
2622
#endif
2623
2624
#ifdef _MSC_VER    /* Visual Studio */
2625
#  include <intrin.h>                    /* For Visual 2005 */
2626
#  pragma warning(disable : 4127)        /* disable: C4127: conditional expression is constant */
2627
#  pragma warning(disable : 4324)        /* disable: C4324: padded structure */
2628
#endif
2629
2630
2631
/* *******************************************************
2632
*  Constants
2633
*********************************************************/
2634
#define HASH_LOG (ZSTD_MEMORY_USAGE - 2)
2635
#define HASH_TABLESIZE (1 << HASH_LOG)
2636
#define HASH_MASK (HASH_TABLESIZE - 1)
2637
2638
#define KNUTH 2654435761
2639
2640
#define BIT7 128
2641
#define BIT6  64
2642
#define BIT5  32
2643
#define BIT4  16
2644
2.41k
#define BIT1   2
2645
3.47k
#define BIT0   1
2646
2647
6.52k
#define KB *(1 <<10)
2648
#define MB *(1 <<20)
2649
#define GB *(1U<<30)
2650
2651
6.52k
#define BLOCKSIZE (128 KB)                 /* define, for static allocation */
2652
7.79k
#define MIN_SEQUENCES_SIZE (2 /*seqNb*/ + 2 /*dumps*/ + 3 /*seqTables*/ + 1 /*bitStream*/)
2653
7.79k
#define MIN_CBLOCK_SIZE (3 /*litCSize*/ + MIN_SEQUENCES_SIZE)
2654
3.47k
#define IS_RAW BIT0
2655
2.41k
#define IS_RLE BIT1
2656
2657
#define WORKPLACESIZE (BLOCKSIZE*3)
2658
46.1k
#define MINMATCH 4
2659
32.5k
#define MLbits   7
2660
33.1k
#define LLbits   6
2661
5.24k
#define Offbits  5
2662
24.6k
#define MaxML  ((1<<MLbits )-1)
2663
24.7k
#define MaxLL  ((1<<LLbits )-1)
2664
3.95k
#define MaxOff   31
2665
#define LitFSELog  11
2666
1.42k
#define MLFSELog   10
2667
1.50k
#define LLFSELog   10
2668
1.88k
#define OffFSELog   9
2669
#define MAX(a,b) ((a)<(b)?(b):(a))
2670
#define MaxSeq MAX(MaxLL, MaxML)
2671
2672
#define LITERAL_NOENTROPY 63
2673
#define COMMAND_NOENTROPY 7   /* to remove */
2674
2675
82
#define ZSTD_CONTENTSIZE_ERROR   (0ULL - 2)
2676
2677
static const size_t ZSTD_blockHeaderSize = 3;
2678
static const size_t ZSTD_frameHeaderSize = 4;
2679
2680
2681
/* *******************************************************
2682
*  Memory operations
2683
**********************************************************/
2684
11.0k
static void   ZSTD_copy4(void* dst, const void* src) { memcpy(dst, src, 4); }
2685
2686
1.61M
static void   ZSTD_copy8(void* dst, const void* src) { memcpy(dst, src, 8); }
2687
2688
1.60M
#define COPY8(d,s) { ZSTD_copy8(d,s); d+=8; s+=8; }
2689
2690
/*! ZSTD_wildcopy : custom version of memcpy(), can copy up to 7-8 bytes too many */
2691
static void ZSTD_wildcopy(void* dst, const void* src, ptrdiff_t length)
2692
45.8k
{
2693
45.8k
    const BYTE* ip = (const BYTE*)src;
2694
45.8k
    BYTE* op = (BYTE*)dst;
2695
45.8k
    BYTE* const oend = op + length;
2696
1.60M
    do COPY8(op, ip) while (op < oend);
2697
45.8k
}
2698
2699
2700
/* **************************************
2701
*  Local structures
2702
****************************************/
2703
typedef enum { bt_compressed, bt_raw, bt_rle, bt_end } blockType_t;
2704
2705
typedef struct
2706
{
2707
    blockType_t blockType;
2708
    U32 origSize;
2709
} blockProperties_t;
2710
2711
typedef struct {
2712
    void* buffer;
2713
    U32*  offsetStart;
2714
    U32*  offset;
2715
    BYTE* offCodeStart;
2716
    BYTE* offCode;
2717
    BYTE* litStart;
2718
    BYTE* lit;
2719
    BYTE* litLengthStart;
2720
    BYTE* litLength;
2721
    BYTE* matchLengthStart;
2722
    BYTE* matchLength;
2723
    BYTE* dumpsStart;
2724
    BYTE* dumps;
2725
} SeqStore_t;
2726
2727
2728
/* *************************************
2729
*  Error Management
2730
***************************************/
2731
/*! ZSTD_isError
2732
*   tells if a return value is an error code */
2733
66.5k
static unsigned ZSTD_isError(size_t code) { return ERR_isError(code); }
2734
2735
2736
2737
/* *************************************************************
2738
*   Decompression section
2739
***************************************************************/
2740
struct ZSTDv02_Dctx_s
2741
{
2742
    U32 LLTable[FSE_DTABLE_SIZE_U32(LLFSELog)];
2743
    U32 OffTable[FSE_DTABLE_SIZE_U32(OffFSELog)];
2744
    U32 MLTable[FSE_DTABLE_SIZE_U32(MLFSELog)];
2745
    void* previousDstEnd;
2746
    void* base;
2747
    size_t expected;
2748
    blockType_t bType;
2749
    U32 phase;
2750
    const BYTE* litPtr;
2751
    size_t litSize;
2752
    BYTE litBuffer[BLOCKSIZE + 8 /* margin for wildcopy */];
2753
};   /* typedef'd to ZSTD_Dctx within "zstd_static.h" */
2754
2755
2756
static size_t ZSTD_getcBlockSize(const void* src, size_t srcSize, blockProperties_t* bpPtr)
2757
20.6k
{
2758
20.6k
    const BYTE* const in = (const BYTE* const)src;
2759
20.6k
    BYTE headerFlags;
2760
20.6k
    U32 cSize;
2761
2762
20.6k
    if (srcSize < 3) return ERROR(srcSize_wrong);
2763
2764
20.6k
    headerFlags = *in;
2765
20.6k
    cSize = in[2] + (in[1]<<8) + ((in[0] & 7)<<16);
2766
2767
20.6k
    bpPtr->blockType = (blockType_t)(headerFlags >> 6);
2768
20.6k
    bpPtr->origSize = (bpPtr->blockType == bt_rle) ? cSize : 0;
2769
2770
20.6k
    if (bpPtr->blockType == bt_end) return 0;
2771
18.7k
    if (bpPtr->blockType == bt_rle) return 1;
2772
18.1k
    return cSize;
2773
18.7k
}
2774
2775
static size_t ZSTD_copyUncompressedBlock(void* dst, size_t maxDstSize, const void* src, size_t srcSize)
2776
1.01k
{
2777
1.01k
    if (srcSize > maxDstSize) return ERROR(dstSize_tooSmall);
2778
1.00k
    if (srcSize > 0) {
2779
689
        memcpy(dst, src, srcSize);
2780
689
    }
2781
1.00k
    return srcSize;
2782
1.01k
}
2783
2784
2785
/** ZSTD_decompressLiterals
2786
    @return : nb of bytes read from src, or an error code*/
2787
static size_t ZSTD_decompressLiterals(void* dst, size_t* maxDstSizePtr,
2788
                                const void* src, size_t srcSize)
2789
1.56k
{
2790
1.56k
    const BYTE* ip = (const BYTE*)src;
2791
2792
1.56k
    const size_t litSize = (MEM_readLE32(src) & 0x1FFFFF) >> 2;   /* no buffer issue : srcSize >= MIN_CBLOCK_SIZE */
2793
1.56k
    const size_t litCSize = (MEM_readLE32(ip+2) & 0xFFFFFF) >> 5;   /* no buffer issue : srcSize >= MIN_CBLOCK_SIZE */
2794
2795
1.56k
    if (litSize > *maxDstSizePtr) return ERROR(corruption_detected);
2796
1.55k
    if (litCSize + 5 > srcSize) return ERROR(corruption_detected);
2797
2798
1.53k
    if (HUF_isError(HUF_decompress(dst, litSize, ip+5, litCSize))) return ERROR(corruption_detected);
2799
2800
796
    *maxDstSizePtr = litSize;
2801
796
    return litCSize + 5;
2802
1.53k
}
2803
2804
2805
/** ZSTD_decodeLiteralsBlock
2806
    @return : nb of bytes read from src (< srcSize )*/
2807
static size_t ZSTD_decodeLiteralsBlock(void* ctx,
2808
                          const void* src, size_t srcSize)
2809
7.79k
{
2810
7.79k
    ZSTD_DCtx* dctx = (ZSTD_DCtx*)ctx;
2811
7.79k
    const BYTE* const istart = (const BYTE* const)src;
2812
2813
    /* any compressed block with literals segment must be at least this size */
2814
7.79k
    if (srcSize < MIN_CBLOCK_SIZE) return ERROR(corruption_detected);
2815
2816
7.44k
    switch(*istart & 3)
2817
7.44k
    {
2818
312
    default:
2819
1.56k
    case 0:
2820
1.56k
        {
2821
1.56k
            size_t litSize = BLOCKSIZE;
2822
1.56k
            const size_t readSize = ZSTD_decompressLiterals(dctx->litBuffer, &litSize, src, srcSize);
2823
1.56k
            dctx->litPtr = dctx->litBuffer;
2824
1.56k
            dctx->litSize = litSize;
2825
1.56k
            memset(dctx->litBuffer + dctx->litSize, 0, 8);
2826
1.56k
            return readSize;   /* works if it's an error too */
2827
312
        }
2828
3.47k
    case IS_RAW:
2829
3.47k
        {
2830
3.47k
            const size_t litSize = (MEM_readLE32(istart) & 0xFFFFFF) >> 2;   /* no buffer issue : srcSize >= MIN_CBLOCK_SIZE */
2831
3.47k
            if (litSize > srcSize-11)   /* risk of reading too far with wildcopy */
2832
96
            {
2833
96
                if (litSize > BLOCKSIZE) return ERROR(corruption_detected);
2834
88
                if (litSize > srcSize-3) return ERROR(corruption_detected);
2835
72
                memcpy(dctx->litBuffer, istart, litSize);
2836
72
                dctx->litPtr = dctx->litBuffer;
2837
72
                dctx->litSize = litSize;
2838
72
                memset(dctx->litBuffer + dctx->litSize, 0, 8);
2839
72
                return litSize+3;
2840
88
            }
2841
            /* direct reference into compressed stream */
2842
3.37k
            dctx->litPtr = istart+3;
2843
3.37k
            dctx->litSize = litSize;
2844
3.37k
            return litSize+3;
2845
3.47k
        }
2846
2.41k
    case IS_RLE:
2847
2.41k
        {
2848
2.41k
            const size_t litSize = (MEM_readLE32(istart) & 0xFFFFFF) >> 2;   /* no buffer issue : srcSize >= MIN_CBLOCK_SIZE */
2849
2.41k
            if (litSize > BLOCKSIZE) return ERROR(corruption_detected);
2850
2.40k
            memset(dctx->litBuffer, istart[3], litSize + 8);
2851
2.40k
            dctx->litPtr = dctx->litBuffer;
2852
2.40k
            dctx->litSize = litSize;
2853
2.40k
            return 4;
2854
2.41k
        }
2855
7.44k
    }
2856
7.44k
}
2857
2858
2859
static size_t ZSTD_decodeSeqHeaders(int* nbSeq, const BYTE** dumpsPtr, size_t* dumpsLengthPtr,
2860
                         FSE_DTable* DTableLL, FSE_DTable* DTableML, FSE_DTable* DTableOffb,
2861
                         const void* src, size_t srcSize)
2862
6.64k
{
2863
6.64k
    const BYTE* const istart = (const BYTE* const)src;
2864
6.64k
    const BYTE* ip = istart;
2865
6.64k
    const BYTE* const iend = istart + srcSize;
2866
6.64k
    U32 LLtype, Offtype, MLtype;
2867
6.64k
    U32 LLlog, Offlog, MLlog;
2868
6.64k
    size_t dumpsLength;
2869
2870
    /* check */
2871
6.64k
    if (srcSize < 5) return ERROR(srcSize_wrong);
2872
2873
    /* SeqHead */
2874
6.62k
    *nbSeq = MEM_readLE16(ip); ip+=2;
2875
6.62k
    LLtype  = *ip >> 6;
2876
6.62k
    Offtype = (*ip >> 4) & 3;
2877
6.62k
    MLtype  = (*ip >> 2) & 3;
2878
6.62k
    if (*ip & 2)
2879
3.30k
    {
2880
3.30k
        dumpsLength  = ip[2];
2881
3.30k
        dumpsLength += ip[1] << 8;
2882
3.30k
        ip += 3;
2883
3.30k
    }
2884
3.32k
    else
2885
3.32k
    {
2886
3.32k
        dumpsLength  = ip[1];
2887
3.32k
        dumpsLength += (ip[0] & 1) << 8;
2888
3.32k
        ip += 2;
2889
3.32k
    }
2890
6.62k
    *dumpsPtr = ip;
2891
6.62k
    ip += dumpsLength;
2892
6.62k
    *dumpsLengthPtr = dumpsLength;
2893
2894
    /* check */
2895
6.62k
    if (ip > iend-3) return ERROR(srcSize_wrong); /* min : all 3 are "raw", hence no header, but at least xxLog bits per type */
2896
2897
    /* sequences */
2898
6.60k
    {
2899
6.60k
        S16 norm[MaxML+1];    /* assumption : MaxML >= MaxLL and MaxOff */
2900
6.60k
        size_t headerSize;
2901
2902
        /* Build DTables */
2903
6.60k
        switch(LLtype)
2904
6.60k
        {
2905
876
        case bt_rle :
2906
876
            LLlog = 0;
2907
876
            FSE_buildDTable_rle(DTableLL, *ip++); break;
2908
4.19k
        case bt_raw :
2909
4.19k
            LLlog = LLbits;
2910
4.19k
            FSE_buildDTable_raw(DTableLL, LLbits); break;
2911
1.52k
        default :
2912
1.52k
            {   U32 max = MaxLL;
2913
1.52k
                headerSize = FSE_readNCount(norm, &max, &LLlog, ip, iend-ip);
2914
1.52k
                if (FSE_isError(headerSize)) return ERROR(GENERIC);
2915
1.50k
                if (LLlog > LLFSELog) return ERROR(corruption_detected);
2916
1.50k
                ip += headerSize;
2917
1.50k
                FSE_buildDTable(DTableLL, norm, max, LLlog);
2918
1.50k
        }   }
2919
2920
6.57k
        switch(Offtype)
2921
6.57k
        {
2922
2.04k
        case bt_rle :
2923
2.04k
            Offlog = 0;
2924
2.04k
            if (ip > iend-2) return ERROR(srcSize_wrong);   /* min : "raw", hence no header, but at least xxLog bits */
2925
2.04k
            FSE_buildDTable_rle(DTableOffb, *ip++ & MaxOff); /* if *ip > MaxOff, data is corrupted */
2926
2.04k
            break;
2927
2.62k
        case bt_raw :
2928
2.62k
            Offlog = Offbits;
2929
2.62k
            FSE_buildDTable_raw(DTableOffb, Offbits); break;
2930
1.90k
        default :
2931
1.90k
            {   U32 max = MaxOff;
2932
1.90k
                headerSize = FSE_readNCount(norm, &max, &Offlog, ip, iend-ip);
2933
1.90k
                if (FSE_isError(headerSize)) return ERROR(GENERIC);
2934
1.88k
                if (Offlog > OffFSELog) return ERROR(corruption_detected);
2935
1.88k
                ip += headerSize;
2936
1.88k
                FSE_buildDTable(DTableOffb, norm, max, Offlog);
2937
1.88k
        }   }
2938
2939
6.55k
        switch(MLtype)
2940
6.55k
        {
2941
1.15k
        case bt_rle :
2942
1.15k
            MLlog = 0;
2943
1.15k
            if (ip > iend-2) return ERROR(srcSize_wrong); /* min : "raw", hence no header, but at least xxLog bits */
2944
1.15k
            FSE_buildDTable_rle(DTableML, *ip++); break;
2945
3.95k
        case bt_raw :
2946
3.95k
            MLlog = MLbits;
2947
3.95k
            FSE_buildDTable_raw(DTableML, MLbits); break;
2948
1.44k
        default :
2949
1.44k
            {   U32 max = MaxML;
2950
1.44k
                headerSize = FSE_readNCount(norm, &max, &MLlog, ip, iend-ip);
2951
1.44k
                if (FSE_isError(headerSize)) return ERROR(GENERIC);
2952
1.42k
                if (MLlog > MLFSELog) return ERROR(corruption_detected);
2953
1.41k
                ip += headerSize;
2954
1.41k
                FSE_buildDTable(DTableML, norm, max, MLlog);
2955
1.41k
    }   }   }
2956
2957
6.51k
    return ip-istart;
2958
6.55k
}
2959
2960
2961
typedef struct {
2962
    size_t litLength;
2963
    size_t offset;
2964
    size_t matchLength;
2965
} seq_t;
2966
2967
typedef struct {
2968
    BIT_DStream_t DStream;
2969
    FSE_DState_t stateLL;
2970
    FSE_DState_t stateOffb;
2971
    FSE_DState_t stateML;
2972
    size_t prevOffset;
2973
    const BYTE* dumps;
2974
    const BYTE* dumpsEnd;
2975
} seqState_t;
2976
2977
2978
static void ZSTD_decodeSequence(seq_t* seq, seqState_t* seqState)
2979
23.2k
{
2980
23.2k
    size_t litLength;
2981
23.2k
    size_t prevOffset;
2982
23.2k
    size_t offset;
2983
23.2k
    size_t matchLength;
2984
23.2k
    const BYTE* dumps = seqState->dumps;
2985
23.2k
    const BYTE* const de = seqState->dumpsEnd;
2986
2987
    /* Literal length */
2988
23.2k
    litLength = FSE_decodeSymbol(&(seqState->stateLL), &(seqState->DStream));
2989
23.2k
    prevOffset = litLength ? seq->offset : seqState->prevOffset;
2990
23.2k
    seqState->prevOffset = seq->offset;
2991
23.2k
    if (litLength == MaxLL)
2992
2.01k
    {
2993
2.01k
        const U32 add = dumps<de ? *dumps++ : 0;
2994
2.01k
        if (add < 255) litLength += add;
2995
308
        else if (dumps + 3 <= de)
2996
112
        {
2997
112
            litLength = MEM_readLE24(dumps);
2998
112
            dumps += 3;
2999
112
        }
3000
2.01k
        if (dumps >= de) dumps = de-1;   /* late correction, to avoid read overflow (data is now corrupted anyway) */
3001
2.01k
    }
3002
3003
    /* Offset */
3004
23.2k
    {
3005
23.2k
        static const size_t offsetPrefix[MaxOff+1] = {  /* note : size_t faster than U32 */
3006
23.2k
                1 /*fake*/, 1, 2, 4, 8, 16, 32, 64, 128, 256,
3007
23.2k
                512, 1024, 2048, 4096, 8192, 16384, 32768, 65536, 131072, 262144,
3008
23.2k
                524288, 1048576, 2097152, 4194304, 8388608, 16777216, 33554432, /*fake*/ 1, 1, 1, 1, 1 };
3009
23.2k
        U32 offsetCode, nbBits;
3010
23.2k
        offsetCode = FSE_decodeSymbol(&(seqState->stateOffb), &(seqState->DStream));   /* <= maxOff, by table construction */
3011
23.2k
        if (MEM_32bits()) BIT_reloadDStream(&(seqState->DStream));
3012
23.2k
        nbBits = offsetCode - 1;
3013
23.2k
        if (offsetCode==0) nbBits = 0;   /* cmove */
3014
23.2k
        offset = offsetPrefix[offsetCode] + BIT_readBits(&(seqState->DStream), nbBits);
3015
23.2k
        if (MEM_32bits()) BIT_reloadDStream(&(seqState->DStream));
3016
23.2k
        if (offsetCode==0) offset = prevOffset;   /* cmove */
3017
23.2k
    }
3018
3019
    /* MatchLength */
3020
23.2k
    matchLength = FSE_decodeSymbol(&(seqState->stateML), &(seqState->DStream));
3021
23.2k
    if (matchLength == MaxML)
3022
2.56k
    {
3023
2.56k
        const U32 add = dumps<de ? *dumps++ : 0;
3024
2.56k
        if (add < 255) matchLength += add;
3025
345
        else if (dumps + 3 <= de)
3026
147
        {
3027
147
            matchLength = MEM_readLE24(dumps);
3028
147
            dumps += 3;
3029
147
        }
3030
2.56k
        if (dumps >= de) dumps = de-1;   /* late correction, to avoid read overflow (data is now corrupted anyway) */
3031
2.56k
    }
3032
23.2k
    matchLength += MINMATCH;
3033
3034
    /* save result */
3035
23.2k
    seq->litLength = litLength;
3036
23.2k
    seq->offset = offset;
3037
23.2k
    seq->matchLength = matchLength;
3038
23.2k
    seqState->dumps = dumps;
3039
23.2k
}
3040
3041
3042
static size_t ZSTD_execSequence(BYTE* op,
3043
                                seq_t sequence,
3044
                                const BYTE** litPtr, const BYTE* const litLimit,
3045
                                BYTE* const base, BYTE* const oend)
3046
23.2k
{
3047
23.2k
    static const int dec32table[] = {0, 1, 2, 1, 4, 4, 4, 4};   /* added */
3048
23.2k
    static const int dec64table[] = {8, 8, 8, 7, 8, 9,10,11};   /* subtracted */
3049
23.2k
    const BYTE* const ostart = op;
3050
23.2k
    BYTE* const oLitEnd = op + sequence.litLength;
3051
23.2k
    BYTE* const oMatchEnd = op + sequence.litLength + sequence.matchLength;   /* risk : address space overflow (32-bits) */
3052
23.2k
    BYTE* const oend_8 = oend-8;
3053
23.2k
    const BYTE* const litEnd = *litPtr + sequence.litLength;
3054
3055
    /* checks */
3056
23.2k
    size_t const seqLength = sequence.litLength + sequence.matchLength;
3057
3058
23.2k
    if (seqLength > (size_t)(oend - op)) return ERROR(dstSize_tooSmall);
3059
23.0k
    if (sequence.litLength > (size_t)(litLimit - *litPtr)) return ERROR(corruption_detected);
3060
    /* Now we know there are no overflow in literal nor match lengths, can use the pointer check */
3061
23.0k
    if (oLitEnd > oend_8) return ERROR(dstSize_tooSmall);
3062
22.9k
    if (sequence.offset > (U32)(oLitEnd - base)) return ERROR(corruption_detected);
3063
3064
22.9k
    if (oMatchEnd > oend) return ERROR(dstSize_tooSmall);   /* overwrite beyond dst buffer */
3065
22.9k
    if (litEnd > litLimit) return ERROR(corruption_detected);   /* overRead beyond lit buffer */
3066
3067
    /* copy Literals */
3068
22.9k
    ZSTD_wildcopy(op, *litPtr, (ptrdiff_t)sequence.litLength);   /* note : oLitEnd <= oend-8 : no risk of overwrite beyond oend */
3069
22.9k
    op = oLitEnd;
3070
22.9k
    *litPtr = litEnd;   /* update for next sequence */
3071
3072
    /* copy Match */
3073
22.9k
    {
3074
22.9k
        const BYTE* match = op - sequence.offset;
3075
3076
        /* check */
3077
22.9k
        if (sequence.offset > (size_t)op) return ERROR(corruption_detected);   /* address space overflow test (this test seems kept by clang optimizer) */
3078
        //if (match > op) return ERROR(corruption_detected);   /* address space overflow test (is clang optimizer removing this test ?) */
3079
22.9k
        if (match < base) return ERROR(corruption_detected);
3080
3081
        /* close range match, overlap */
3082
22.9k
        if (sequence.offset < 8)
3083
11.0k
        {
3084
11.0k
            const int dec64 = dec64table[sequence.offset];
3085
11.0k
            op[0] = match[0];
3086
11.0k
            op[1] = match[1];
3087
11.0k
            op[2] = match[2];
3088
11.0k
            op[3] = match[3];
3089
11.0k
            match += dec32table[sequence.offset];
3090
11.0k
            ZSTD_copy4(op+4, match);
3091
11.0k
            match -= dec64;
3092
11.0k
        }
3093
11.8k
        else
3094
11.8k
        {
3095
11.8k
            ZSTD_copy8(op, match);
3096
11.8k
        }
3097
22.9k
        op += 8; match += 8;
3098
3099
22.9k
        if (oMatchEnd > oend-(16-MINMATCH))
3100
90
        {
3101
90
            if (op < oend_8)
3102
34
            {
3103
34
                ZSTD_wildcopy(op, match, oend_8 - op);
3104
34
                match += oend_8 - op;
3105
34
                op = oend_8;
3106
34
            }
3107
211
            while (op < oMatchEnd) *op++ = *match++;
3108
90
        }
3109
22.8k
        else
3110
22.8k
        {
3111
22.8k
            ZSTD_wildcopy(op, match, (ptrdiff_t)sequence.matchLength-8);   /* works even if matchLength < 8 */
3112
22.8k
        }
3113
22.9k
    }
3114
3115
0
    return oMatchEnd - ostart;
3116
22.9k
}
3117
3118
static size_t ZSTD_decompressSequences(
3119
                               void* ctx,
3120
                               void* dst, size_t maxDstSize,
3121
                         const void* seqStart, size_t seqSize)
3122
6.64k
{
3123
6.64k
    ZSTD_DCtx* dctx = (ZSTD_DCtx*)ctx;
3124
6.64k
    const BYTE* ip = (const BYTE*)seqStart;
3125
6.64k
    const BYTE* const iend = ip + seqSize;
3126
6.64k
    BYTE* const ostart = (BYTE* const)dst;
3127
6.64k
    BYTE* op = ostart;
3128
6.64k
    BYTE* const oend = ostart + maxDstSize;
3129
6.64k
    size_t errorCode, dumpsLength;
3130
6.64k
    const BYTE* litPtr = dctx->litPtr;
3131
6.64k
    const BYTE* const litEnd = litPtr + dctx->litSize;
3132
6.64k
    int nbSeq;
3133
6.64k
    const BYTE* dumps;
3134
6.64k
    U32* DTableLL = dctx->LLTable;
3135
6.64k
    U32* DTableML = dctx->MLTable;
3136
6.64k
    U32* DTableOffb = dctx->OffTable;
3137
6.64k
    BYTE* const base = (BYTE*) (dctx->base);
3138
3139
    /* Build Decoding Tables */
3140
6.64k
    errorCode = ZSTD_decodeSeqHeaders(&nbSeq, &dumps, &dumpsLength,
3141
6.64k
                                      DTableLL, DTableML, DTableOffb,
3142
6.64k
                                      ip, iend-ip);
3143
6.64k
    if (ZSTD_isError(errorCode)) return errorCode;
3144
6.51k
    ip += errorCode;
3145
3146
    /* Regen sequences */
3147
6.51k
    {
3148
6.51k
        seq_t sequence;
3149
6.51k
        seqState_t seqState;
3150
3151
6.51k
        memset(&sequence, 0, sizeof(sequence));
3152
6.51k
        seqState.dumps = dumps;
3153
6.51k
        seqState.dumpsEnd = dumps + dumpsLength;
3154
6.51k
        seqState.prevOffset = 1;
3155
6.51k
        errorCode = BIT_initDStream(&(seqState.DStream), ip, iend-ip);
3156
6.51k
        if (ERR_isError(errorCode)) return ERROR(corruption_detected);
3157
6.47k
        FSE_initDState(&(seqState.stateLL), &(seqState.DStream), DTableLL);
3158
6.47k
        FSE_initDState(&(seqState.stateOffb), &(seqState.DStream), DTableOffb);
3159
6.47k
        FSE_initDState(&(seqState.stateML), &(seqState.DStream), DTableML);
3160
3161
29.4k
        for ( ; (BIT_reloadDStream(&(seqState.DStream)) <= BIT_DStream_completed) && (nbSeq>0) ; )
3162
23.2k
        {
3163
23.2k
            size_t oneSeqSize;
3164
23.2k
            nbSeq--;
3165
23.2k
            ZSTD_decodeSequence(&sequence, &seqState);
3166
23.2k
            oneSeqSize = ZSTD_execSequence(op, sequence, &litPtr, litEnd, base, oend);
3167
23.2k
            if (ZSTD_isError(oneSeqSize)) return oneSeqSize;
3168
22.9k
            op += oneSeqSize;
3169
22.9k
        }
3170
3171
        /* check if reached exact end */
3172
6.18k
        if ( !BIT_endOfDStream(&(seqState.DStream)) ) return ERROR(corruption_detected);   /* requested too much : data is corrupted */
3173
6.09k
        if (nbSeq<0) return ERROR(corruption_detected);   /* requested too many sequences : data is corrupted */
3174
3175
        /* last literal segment */
3176
6.09k
        {
3177
6.09k
            size_t lastLLSize = litEnd - litPtr;
3178
6.09k
            if (litPtr > litEnd) return ERROR(corruption_detected);
3179
6.09k
            if (op+lastLLSize > oend) return ERROR(dstSize_tooSmall);
3180
6.08k
            if (lastLLSize > 0) {
3181
2.82k
                if (op != litPtr) memmove(op, litPtr, lastLLSize);
3182
2.82k
                op += lastLLSize;
3183
2.82k
            }
3184
6.08k
        }
3185
6.08k
    }
3186
3187
0
    return op-ostart;
3188
6.09k
}
3189
3190
3191
static size_t ZSTD_decompressBlock(
3192
                            void* ctx,
3193
                            void* dst, size_t maxDstSize,
3194
                      const void* src, size_t srcSize)
3195
7.79k
{
3196
    /* blockType == blockCompressed */
3197
7.79k
    const BYTE* ip = (const BYTE*)src;
3198
3199
    /* Decode literals sub-block */
3200
7.79k
    size_t litCSize = ZSTD_decodeLiteralsBlock(ctx, src, srcSize);
3201
7.79k
    if (ZSTD_isError(litCSize)) return litCSize;
3202
6.64k
    ip += litCSize;
3203
6.64k
    srcSize -= litCSize;
3204
3205
6.64k
    return ZSTD_decompressSequences(ctx, dst, maxDstSize, ip, srcSize);
3206
7.79k
}
3207
3208
3209
static size_t ZSTD_decompressDCtx(void* ctx, void* dst, size_t maxDstSize, const void* src, size_t srcSize)
3210
2.45k
{
3211
2.45k
    const BYTE* ip = (const BYTE*)src;
3212
2.45k
    const BYTE* iend = ip + srcSize;
3213
2.45k
    BYTE* const ostart = (BYTE* const)dst;
3214
2.45k
    BYTE* op = ostart;
3215
2.45k
    BYTE* const oend = ostart + maxDstSize;
3216
2.45k
    size_t remainingSize = srcSize;
3217
2.45k
    U32 magicNumber;
3218
2.45k
    blockProperties_t blockProperties;
3219
3220
    /* Frame Header */
3221
2.45k
    if (srcSize < ZSTD_frameHeaderSize+ZSTD_blockHeaderSize) return ERROR(srcSize_wrong);
3222
2.45k
    magicNumber = MEM_readLE32(src);
3223
2.45k
    if (magicNumber != ZSTD_magicNumber) return ERROR(prefix_unknown);
3224
2.45k
    ip += ZSTD_frameHeaderSize; remainingSize -= ZSTD_frameHeaderSize;
3225
3226
    /* Loop on each block */
3227
9.23k
    while (1)
3228
9.23k
    {
3229
9.23k
        size_t decodedSize=0;
3230
9.23k
        size_t cBlockSize = ZSTD_getcBlockSize(ip, iend-ip, &blockProperties);
3231
9.23k
        if (ZSTD_isError(cBlockSize)) return cBlockSize;
3232
3233
9.23k
        ip += ZSTD_blockHeaderSize;
3234
9.23k
        remainingSize -= ZSTD_blockHeaderSize;
3235
9.23k
        if (cBlockSize > remainingSize) return ERROR(srcSize_wrong);
3236
3237
9.23k
        switch(blockProperties.blockType)
3238
9.23k
        {
3239
7.79k
        case bt_compressed:
3240
7.79k
            decodedSize = ZSTD_decompressBlock(ctx, op, oend-op, ip, cBlockSize);
3241
7.79k
            break;
3242
1.01k
        case bt_raw :
3243
1.01k
            decodedSize = ZSTD_copyUncompressedBlock(op, oend-op, ip, cBlockSize);
3244
1.01k
            break;
3245
4
        case bt_rle :
3246
4
            return ERROR(GENERIC);   /* not yet supported */
3247
0
            break;
3248
418
        case bt_end :
3249
            /* end of frame */
3250
418
            if (remainingSize) return ERROR(srcSize_wrong);
3251
418
            break;
3252
418
        default:
3253
0
            return ERROR(GENERIC);   /* impossible */
3254
9.23k
        }
3255
9.22k
        if (cBlockSize == 0) break;   /* bt_end */
3256
3257
8.14k
        if (ZSTD_isError(decodedSize)) return decodedSize;
3258
6.77k
        op += decodedSize;
3259
6.77k
        ip += cBlockSize;
3260
6.77k
        remainingSize -= cBlockSize;
3261
6.77k
    }
3262
3263
1.08k
    return op-ostart;
3264
2.45k
}
3265
3266
static size_t ZSTD_decompress(void* dst, size_t maxDstSize, const void* src, size_t srcSize)
3267
2.45k
{
3268
2.45k
    ZSTD_DCtx ctx;
3269
2.45k
    ctx.base = dst;
3270
2.45k
    return ZSTD_decompressDCtx(&ctx, dst, maxDstSize, src, srcSize);
3271
2.45k
}
3272
3273
/* ZSTD_errorFrameSizeInfoLegacy() :
3274
   assumes `cSize` and `dBound` are _not_ NULL */
3275
static void ZSTD_errorFrameSizeInfoLegacy(size_t* cSize, unsigned long long* dBound, size_t ret)
3276
82
{
3277
82
    *cSize = ret;
3278
82
    *dBound = ZSTD_CONTENTSIZE_ERROR;
3279
82
}
3280
3281
void ZSTDv02_findFrameSizeInfoLegacy(const void *src, size_t srcSize, size_t* cSize, unsigned long long* dBound)
3282
2.53k
{
3283
2.53k
    const BYTE* ip = (const BYTE*)src;
3284
2.53k
    size_t remainingSize = srcSize;
3285
2.53k
    size_t nbBlocks = 0;
3286
2.53k
    U32 magicNumber;
3287
2.53k
    blockProperties_t blockProperties;
3288
3289
    /* Frame Header */
3290
2.53k
    if (srcSize < ZSTD_frameHeaderSize+ZSTD_blockHeaderSize) {
3291
8
        ZSTD_errorFrameSizeInfoLegacy(cSize, dBound, ERROR(srcSize_wrong));
3292
8
        return;
3293
8
    }
3294
2.52k
    magicNumber = MEM_readLE32(src);
3295
2.52k
    if (magicNumber != ZSTD_magicNumber) {
3296
0
        ZSTD_errorFrameSizeInfoLegacy(cSize, dBound, ERROR(prefix_unknown));
3297
0
        return;
3298
0
    }
3299
2.52k
    ip += ZSTD_frameHeaderSize; remainingSize -= ZSTD_frameHeaderSize;
3300
3301
    /* Loop on each block */
3302
11.4k
    while (1)
3303
11.4k
    {
3304
11.4k
        size_t cBlockSize = ZSTD_getcBlockSize(ip, remainingSize, &blockProperties);
3305
11.4k
        if (ZSTD_isError(cBlockSize)) {
3306
21
            ZSTD_errorFrameSizeInfoLegacy(cSize, dBound, cBlockSize);
3307
21
            return;
3308
21
        }
3309
3310
11.4k
        ip += ZSTD_blockHeaderSize;
3311
11.4k
        remainingSize -= ZSTD_blockHeaderSize;
3312
11.4k
        if (cBlockSize > remainingSize) {
3313
53
            ZSTD_errorFrameSizeInfoLegacy(cSize, dBound, ERROR(srcSize_wrong));
3314
53
            return;
3315
53
        }
3316
3317
11.3k
        if (cBlockSize == 0) break;   /* bt_end */
3318
3319
8.92k
        ip += cBlockSize;
3320
8.92k
        remainingSize -= cBlockSize;
3321
8.92k
        nbBlocks++;
3322
8.92k
    }
3323
3324
2.45k
    *cSize = ip - (const BYTE*)src;
3325
2.45k
    *dBound = nbBlocks * BLOCKSIZE;
3326
2.45k
}
3327
3328
/*******************************
3329
*  Streaming Decompression API
3330
*******************************/
3331
3332
static size_t ZSTD_resetDCtx(ZSTD_DCtx* dctx)
3333
0
{
3334
0
    dctx->expected = ZSTD_frameHeaderSize;
3335
0
    dctx->phase = 0;
3336
0
    dctx->previousDstEnd = NULL;
3337
0
    dctx->base = NULL;
3338
0
    return 0;
3339
0
}
3340
3341
static ZSTD_DCtx* ZSTD_createDCtx(void)
3342
0
{
3343
0
    ZSTD_DCtx* dctx = (ZSTD_DCtx*)malloc(sizeof(ZSTD_DCtx));
3344
0
    if (dctx==NULL) return NULL;
3345
0
    ZSTD_resetDCtx(dctx);
3346
0
    return dctx;
3347
0
}
3348
3349
static size_t ZSTD_freeDCtx(ZSTD_DCtx* dctx)
3350
0
{
3351
0
    free(dctx);
3352
0
    return 0;
3353
0
}
3354
3355
static size_t ZSTD_nextSrcSizeToDecompress(ZSTD_DCtx* dctx)
3356
0
{
3357
0
    return dctx->expected;
3358
0
}
3359
3360
static size_t ZSTD_decompressContinue(ZSTD_DCtx* ctx, void* dst, size_t maxDstSize, const void* src, size_t srcSize)
3361
0
{
3362
    /* Sanity check */
3363
0
    if (srcSize != ctx->expected) return ERROR(srcSize_wrong);
3364
0
    if (dst != ctx->previousDstEnd)  /* not contiguous */
3365
0
        ctx->base = dst;
3366
3367
    /* Decompress : frame header */
3368
0
    if (ctx->phase == 0)
3369
0
    {
3370
        /* Check frame magic header */
3371
0
        U32 magicNumber = MEM_readLE32(src);
3372
0
        if (magicNumber != ZSTD_magicNumber) return ERROR(prefix_unknown);
3373
0
        ctx->phase = 1;
3374
0
        ctx->expected = ZSTD_blockHeaderSize;
3375
0
        return 0;
3376
0
    }
3377
3378
    /* Decompress : block header */
3379
0
    if (ctx->phase == 1)
3380
0
    {
3381
0
        blockProperties_t bp;
3382
0
        size_t blockSize = ZSTD_getcBlockSize(src, ZSTD_blockHeaderSize, &bp);
3383
0
        if (ZSTD_isError(blockSize)) return blockSize;
3384
0
        if (bp.blockType == bt_end)
3385
0
        {
3386
0
            ctx->expected = 0;
3387
0
            ctx->phase = 0;
3388
0
        }
3389
0
        else
3390
0
        {
3391
0
            ctx->expected = blockSize;
3392
0
            ctx->bType = bp.blockType;
3393
0
            ctx->phase = 2;
3394
0
        }
3395
3396
0
        return 0;
3397
0
    }
3398
3399
    /* Decompress : block content */
3400
0
    {
3401
0
        size_t rSize;
3402
0
        switch(ctx->bType)
3403
0
        {
3404
0
        case bt_compressed:
3405
0
            rSize = ZSTD_decompressBlock(ctx, dst, maxDstSize, src, srcSize);
3406
0
            break;
3407
0
        case bt_raw :
3408
0
            rSize = ZSTD_copyUncompressedBlock(dst, maxDstSize, src, srcSize);
3409
0
            break;
3410
0
        case bt_rle :
3411
0
            return ERROR(GENERIC);   /* not yet handled */
3412
0
            break;
3413
0
        case bt_end :   /* should never happen (filtered at phase 1) */
3414
0
            rSize = 0;
3415
0
            break;
3416
0
        default:
3417
0
            return ERROR(GENERIC);
3418
0
        }
3419
0
        ctx->phase = 1;
3420
0
        ctx->expected = ZSTD_blockHeaderSize;
3421
0
        if (ZSTD_isError(rSize)) return rSize;
3422
0
        ctx->previousDstEnd = (void*)( ((char*)dst) + rSize);
3423
0
        return rSize;
3424
0
    }
3425
3426
0
}
3427
3428
3429
/* wrapper layer */
3430
3431
unsigned ZSTDv02_isError(size_t code)
3432
0
{
3433
0
    return ZSTD_isError(code);
3434
0
}
3435
3436
size_t ZSTDv02_decompress( void* dst, size_t maxOriginalSize,
3437
                     const void* src, size_t compressedSize)
3438
2.45k
{
3439
2.45k
    return ZSTD_decompress(dst, maxOriginalSize, src, compressedSize);
3440
2.45k
}
3441
3442
ZSTDv02_Dctx* ZSTDv02_createDCtx(void)
3443
0
{
3444
0
    return (ZSTDv02_Dctx*)ZSTD_createDCtx();
3445
0
}
3446
3447
size_t ZSTDv02_freeDCtx(ZSTDv02_Dctx* dctx)
3448
0
{
3449
0
    return ZSTD_freeDCtx((ZSTD_DCtx*)dctx);
3450
0
}
3451
3452
size_t ZSTDv02_resetDCtx(ZSTDv02_Dctx* dctx)
3453
0
{
3454
0
    return ZSTD_resetDCtx((ZSTD_DCtx*)dctx);
3455
0
}
3456
3457
size_t ZSTDv02_nextSrcSizeToDecompress(ZSTDv02_Dctx* dctx)
3458
0
{
3459
0
    return ZSTD_nextSrcSizeToDecompress((ZSTD_DCtx*)dctx);
3460
0
}
3461
3462
size_t ZSTDv02_decompressContinue(ZSTDv02_Dctx* dctx, void* dst, size_t maxDstSize, const void* src, size_t srcSize)
3463
0
{
3464
0
    return ZSTD_decompressContinue((ZSTD_DCtx*)dctx, dst, maxDstSize, src, srcSize);
3465
0
}