Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | LZ4 - Fast LZ compression algorithm |
3 | | Copyright (c) Yann Collet. All rights reserved. |
4 | | |
5 | | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) |
6 | | |
7 | | Redistribution and use in source and binary forms, with or without |
8 | | modification, are permitted provided that the following conditions are |
9 | | met: |
10 | | |
11 | | * Redistributions of source code must retain the above copyright |
12 | | notice, this list of conditions and the following disclaimer. |
13 | | * Redistributions in binary form must reproduce the above |
14 | | copyright notice, this list of conditions and the following disclaimer |
15 | | in the documentation and/or other materials provided with the |
16 | | distribution. |
17 | | |
18 | | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
19 | | "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
20 | | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
21 | | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
22 | | OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
23 | | SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
24 | | LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
25 | | DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
26 | | THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
27 | | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
28 | | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
29 | | |
30 | | You can contact the author at : |
31 | | - LZ4 homepage : http://www.lz4.org |
32 | | - LZ4 source repository : https://github.com/lz4/lz4 |
33 | | */ |
34 | | |
35 | | /*-************************************ |
36 | | * Tuning parameters |
37 | | **************************************/ |
38 | | /* |
39 | | * LZ4_HEAPMODE : |
40 | | * Select how stateless compression functions like `LZ4_compress_default()` |
41 | | * allocate memory for their hash table, |
42 | | * in memory stack (0:default, fastest), or in memory heap (1:requires malloc()). |
43 | | */ |
44 | | #ifndef LZ4_HEAPMODE |
45 | | # define LZ4_HEAPMODE 0 |
46 | | #endif |
47 | | |
48 | | /* |
49 | | * LZ4_ACCELERATION_DEFAULT : |
50 | | * Select "acceleration" for LZ4_compress_fast() when parameter value <= 0 |
51 | | */ |
52 | 0 | #define LZ4_ACCELERATION_DEFAULT 1 |
53 | | /* |
54 | | * LZ4_ACCELERATION_MAX : |
55 | | * Any "acceleration" value higher than this threshold |
56 | | * get treated as LZ4_ACCELERATION_MAX instead (fix #876) |
57 | | */ |
58 | 4.00k | #define LZ4_ACCELERATION_MAX 65537 |
59 | | |
60 | | |
61 | | /*-************************************ |
62 | | * CPU Feature Detection |
63 | | **************************************/ |
64 | | /* LZ4_FORCE_MEMORY_ACCESS |
65 | | * By default, access to unaligned memory is controlled by `memcpy()`, which is safe and portable. |
66 | | * Unfortunately, on some target/compiler combinations, the generated assembly is sub-optimal. |
67 | | * The below switch allow to select different access method for improved performance. |
68 | | * Method 0 (default) : use `memcpy()`. Safe and portable. |
69 | | * Method 1 : `__packed` statement. It depends on compiler extension (ie, not portable). |
70 | | * This method is safe if your compiler supports it, and *generally* as fast or faster than `memcpy`. |
71 | | * Method 2 : direct access. This method is portable but violate C standard. |
72 | | * It can generate buggy code on targets which assembly generation depends on alignment. |
73 | | * But in some circumstances, it's the only known way to get the most performance (ie GCC + ARMv6) |
74 | | * See https://fastcompression.blogspot.fr/2015/08/accessing-unaligned-memory.html for details. |
75 | | * Prefer these methods in priority order (0 > 1 > 2) |
76 | | */ |
77 | | #ifndef LZ4_FORCE_MEMORY_ACCESS /* can be defined externally */ |
78 | | # if defined(__GNUC__) && \ |
79 | | ( defined(__ARM_ARCH_6__) || defined(__ARM_ARCH_6J__) || defined(__ARM_ARCH_6K__) \ |
80 | | || defined(__ARM_ARCH_6Z__) || defined(__ARM_ARCH_6ZK__) || defined(__ARM_ARCH_6T2__) ) |
81 | | # define LZ4_FORCE_MEMORY_ACCESS 2 |
82 | | # elif (defined(__INTEL_COMPILER) && !defined(_WIN32)) || defined(__GNUC__) || defined(_MSC_VER) |
83 | | # define LZ4_FORCE_MEMORY_ACCESS 1 |
84 | | # endif |
85 | | #endif |
86 | | |
87 | | /* |
88 | | * LZ4_FORCE_SW_BITCOUNT |
89 | | * Define this parameter if your target system or compiler does not support hardware bit count |
90 | | */ |
91 | | #if defined(_MSC_VER) && defined(_WIN32_WCE) /* Visual Studio for WinCE doesn't support Hardware bit count */ |
92 | | # undef LZ4_FORCE_SW_BITCOUNT /* avoid double def */ |
93 | | # define LZ4_FORCE_SW_BITCOUNT |
94 | | #endif |
95 | | |
96 | | |
97 | | |
98 | | /*-************************************ |
99 | | * Dependency |
100 | | **************************************/ |
101 | | /* |
102 | | * LZ4_SRC_INCLUDED: |
103 | | * Amalgamation flag, whether lz4.c is included |
104 | | */ |
105 | | #ifndef LZ4_SRC_INCLUDED |
106 | | # define LZ4_SRC_INCLUDED 1 |
107 | | #endif |
108 | | |
109 | | #ifndef LZ4_DISABLE_DEPRECATE_WARNINGS |
110 | | # define LZ4_DISABLE_DEPRECATE_WARNINGS /* due to LZ4_decompress_safe_withPrefix64k */ |
111 | | #endif |
112 | | |
113 | | #ifndef LZ4_STATIC_LINKING_ONLY |
114 | | # define LZ4_STATIC_LINKING_ONLY |
115 | | #endif |
116 | | #include "lz4.h" |
117 | | /* see also "memory routines" below */ |
118 | | |
119 | | |
120 | | /*-************************************ |
121 | | * Compiler Options |
122 | | **************************************/ |
123 | | #if defined(_MSC_VER) && (_MSC_VER >= 1400) /* Visual Studio 2005+ */ |
124 | | # include <intrin.h> /* only present in VS2005+ */ |
125 | | # pragma warning(disable : 4127) /* disable: C4127: conditional expression is constant */ |
126 | | # pragma warning(disable : 6237) /* disable: C6237: conditional expression is always 0 */ |
127 | | # pragma warning(disable : 6239) /* disable: C6239: (<non-zero constant> && <expression>) always evaluates to the result of <expression> */ |
128 | | # pragma warning(disable : 6240) /* disable: C6240: (<expression> && <non-zero constant>) always evaluates to the result of <expression> */ |
129 | | # pragma warning(disable : 6326) /* disable: C6326: Potential comparison of a constant with another constant */ |
130 | | #endif /* _MSC_VER */ |
131 | | |
132 | | #ifndef LZ4_FORCE_INLINE |
133 | | # if defined (_MSC_VER) && !defined (__clang__) /* MSVC */ |
134 | | # define LZ4_FORCE_INLINE static __forceinline |
135 | | # else |
136 | | # if defined (__cplusplus) || defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L /* C99 */ |
137 | | # if defined (__GNUC__) || defined (__clang__) |
138 | | # define LZ4_FORCE_INLINE static inline __attribute__((always_inline)) |
139 | | # else |
140 | | # define LZ4_FORCE_INLINE static inline |
141 | | # endif |
142 | | # else |
143 | | # define LZ4_FORCE_INLINE static |
144 | | # endif /* __STDC_VERSION__ */ |
145 | | # endif /* _MSC_VER */ |
146 | | #endif /* LZ4_FORCE_INLINE */ |
147 | | |
148 | | /* LZ4_FORCE_O2 and LZ4_FORCE_INLINE |
149 | | * gcc on ppc64le generates an unrolled SIMDized loop for LZ4_wildCopy8, |
150 | | * together with a simple 8-byte copy loop as a fall-back path. |
151 | | * However, this optimization hurts the decompression speed by >30%, |
152 | | * because the execution does not go to the optimized loop |
153 | | * for typical compressible data, and all of the preamble checks |
154 | | * before going to the fall-back path become useless overhead. |
155 | | * This optimization happens only with the -O3 flag, and -O2 generates |
156 | | * a simple 8-byte copy loop. |
157 | | * With gcc on ppc64le, all of the LZ4_decompress_* and LZ4_wildCopy8 |
158 | | * functions are annotated with __attribute__((optimize("O2"))), |
159 | | * and also LZ4_wildCopy8 is forcibly inlined, so that the O2 attribute |
160 | | * of LZ4_wildCopy8 does not affect the compression speed. |
161 | | */ |
162 | | #if defined(__PPC64__) && defined(__LITTLE_ENDIAN__) && defined(__GNUC__) && !defined(__clang__) |
163 | | # define LZ4_FORCE_O2 __attribute__((optimize("O2"))) |
164 | | # undef LZ4_FORCE_INLINE |
165 | | # define LZ4_FORCE_INLINE static __inline __attribute__((optimize("O2"),always_inline)) |
166 | | #else |
167 | | # define LZ4_FORCE_O2 |
168 | | #endif |
169 | | |
170 | | #if (defined(__GNUC__) && (__GNUC__ >= 3)) || (defined(__INTEL_COMPILER) && (__INTEL_COMPILER >= 800)) || defined(__clang__) |
171 | 2.33G | # define expect(expr,value) (__builtin_expect ((expr),(value)) ) |
172 | | #else |
173 | | # define expect(expr,value) (expr) |
174 | | #endif |
175 | | |
176 | | #ifndef likely |
177 | 68.2M | #define likely(expr) expect((expr) != 0, 1) |
178 | | #endif |
179 | | #ifndef unlikely |
180 | 34.4M | #define unlikely(expr) expect((expr) != 0, 0) |
181 | | #endif |
182 | | |
183 | | /* Should the alignment test prove unreliable, for some reason, |
184 | | * it can be disabled by setting LZ4_ALIGN_TEST to 0 */ |
185 | | #ifndef LZ4_ALIGN_TEST /* can be externally provided */ |
186 | | # define LZ4_ALIGN_TEST 1 |
187 | | #endif |
188 | | |
189 | | |
190 | | /*-************************************ |
191 | | * Memory routines |
192 | | **************************************/ |
193 | | |
194 | | /*! LZ4_STATIC_LINKING_ONLY_DISABLE_MEMORY_ALLOCATION : |
195 | | * Disable relatively high-level LZ4/HC functions that use dynamic memory |
196 | | * allocation functions (malloc(), calloc(), free()). |
197 | | * |
198 | | * Note that this is a compile-time switch. And since it disables |
199 | | * public/stable LZ4 v1 API functions, we don't recommend using this |
200 | | * symbol to generate a library for distribution. |
201 | | * |
202 | | * The following public functions are removed when this symbol is defined. |
203 | | * - lz4 : LZ4_createStream, LZ4_freeStream, |
204 | | * LZ4_createStreamDecode, LZ4_freeStreamDecode, LZ4_create (deprecated) |
205 | | * - lz4hc : LZ4_createStreamHC, LZ4_freeStreamHC, |
206 | | * LZ4_createHC (deprecated), LZ4_freeHC (deprecated) |
207 | | * - lz4frame, lz4file : All LZ4F_* functions |
208 | | */ |
209 | | #if defined(LZ4_STATIC_LINKING_ONLY_DISABLE_MEMORY_ALLOCATION) |
210 | | # define ALLOC(s) lz4_error_memory_allocation_is_disabled |
211 | | # define ALLOC_AND_ZERO(s) lz4_error_memory_allocation_is_disabled |
212 | | # define FREEMEM(p) lz4_error_memory_allocation_is_disabled |
213 | | #elif defined(LZ4_USER_MEMORY_FUNCTIONS) |
214 | | /* memory management functions can be customized by user project. |
215 | | * Below functions must exist somewhere in the Project |
216 | | * and be available at link time */ |
217 | | void* LZ4_malloc(size_t s); |
218 | | void* LZ4_calloc(size_t n, size_t s); |
219 | | void LZ4_free(void* p); |
220 | | # define ALLOC(s) LZ4_malloc(s) |
221 | | # define ALLOC_AND_ZERO(s) LZ4_calloc(1,s) |
222 | | # define FREEMEM(p) LZ4_free(p) |
223 | | #else |
224 | | # include <stdlib.h> /* malloc, calloc, free */ |
225 | 5.28k | # define ALLOC(s) malloc(s) |
226 | 0 | # define ALLOC_AND_ZERO(s) calloc(1,s) |
227 | 5.28k | # define FREEMEM(p) free(p) |
228 | | #endif |
229 | | |
230 | | #if ! LZ4_FREESTANDING |
231 | | # include <string.h> /* memset, memcpy */ |
232 | | #endif |
233 | | #if !defined(LZ4_memset) |
234 | 113k | # define LZ4_memset(p,v,s) memset((p),(v),(s)) |
235 | | #endif |
236 | 113k | #define MEM_INIT(p,v,s) LZ4_memset((p),(v),(s)) |
237 | | |
238 | | |
239 | | /*-************************************ |
240 | | * Common Constants |
241 | | **************************************/ |
242 | 1.08G | #define MINMATCH 4 |
243 | | |
244 | 4.72k | #define WILDCOPYLENGTH 8 |
245 | 16.1M | #define LASTLITERALS 5 /* see ../doc/lz4_Block_format.md#parsing-restrictions */ |
246 | 47.9k | #define MFLIMIT 12 /* see ../doc/lz4_Block_format.md#parsing-restrictions */ |
247 | 0 | #define MATCH_SAFEGUARD_DISTANCE ((2*WILDCOPYLENGTH) - MINMATCH) /* ensure it's possible to write 2 x wildcopyLength without overflowing output buffer */ |
248 | 10.2M | #define FASTLOOP_SAFE_DISTANCE 64 |
249 | | static const int LZ4_minLength = (MFLIMIT+1); |
250 | | |
251 | 31.9k | #define KB *(1 <<10) |
252 | | #define MB *(1 <<20) |
253 | 13.5k | #define GB *(1U<<30) |
254 | | |
255 | 5.75M | #define LZ4_DISTANCE_ABSOLUTE_MAX 65535 |
256 | | #if (LZ4_DISTANCE_MAX > LZ4_DISTANCE_ABSOLUTE_MAX) /* max supported by LZ4 format */ |
257 | | # error "LZ4_DISTANCE_MAX is too big : must be <= 65535" |
258 | | #endif |
259 | | |
260 | 476M | #define ML_BITS 4 |
261 | 261M | #define ML_MASK ((1U<<ML_BITS)-1) |
262 | 195M | #define RUN_BITS (8-ML_BITS) |
263 | 195M | #define RUN_MASK ((1U<<RUN_BITS)-1) |
264 | | |
265 | | |
266 | | /*-************************************ |
267 | | * Error detection |
268 | | **************************************/ |
269 | | #if defined(LZ4_DEBUG) && (LZ4_DEBUG>=1) |
270 | | # include <assert.h> |
271 | | #else |
272 | | # ifndef assert |
273 | | # define assert(condition) ((void)0) |
274 | | # endif |
275 | | #endif |
276 | | |
277 | 26.1M | #define LZ4_STATIC_ASSERT(c) { enum { LZ4_static_assert = 1/(int)(!!(c)) }; } /* use after variable declarations */ |
278 | | |
279 | | #if defined(LZ4_DEBUG) && (LZ4_DEBUG>=2) |
280 | | # include <stdio.h> |
281 | | static int g_debuglog_enable = 1; |
282 | | # define DEBUGLOG(l, ...) { \ |
283 | | if ((g_debuglog_enable) && (l<=LZ4_DEBUG)) { \ |
284 | | fprintf(stderr, __FILE__ " %i: ", __LINE__); \ |
285 | | fprintf(stderr, __VA_ARGS__); \ |
286 | | fprintf(stderr, " \n"); \ |
287 | | } } |
288 | | #else |
289 | 597M | # define DEBUGLOG(l, ...) {} /* disabled */ |
290 | | #endif |
291 | | |
292 | | static int LZ4_isAligned(const void* ptr, size_t alignment) |
293 | 20.0k | { |
294 | 20.0k | return ((size_t)ptr & (alignment -1)) == 0; |
295 | 20.0k | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_isAligned Unexecuted instantiation: lz4_helpers.c:LZ4_isAligned Unexecuted instantiation: fuzz_data_producer.c:LZ4_isAligned Line | Count | Source | 293 | 1.61k | { | 294 | 1.61k | return ((size_t)ptr & (alignment -1)) == 0; | 295 | 1.61k | } |
Line | Count | Source | 293 | 18.4k | { | 294 | 18.4k | return ((size_t)ptr & (alignment -1)) == 0; | 295 | 18.4k | } |
|
296 | | |
297 | | |
298 | | /*-************************************ |
299 | | * Types |
300 | | **************************************/ |
301 | | #include <limits.h> |
302 | | #if defined(__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */) |
303 | | # include <stdint.h> |
304 | | typedef unsigned char BYTE; /*uint8_t not necessarily blessed to alias arbitrary type*/ |
305 | | typedef uint16_t U16; |
306 | | typedef uint32_t U32; |
307 | | typedef int32_t S32; |
308 | | typedef uint64_t U64; |
309 | | typedef uintptr_t uptrval; |
310 | | #else |
311 | | # if UINT_MAX != 4294967295UL |
312 | | # error "LZ4 code (when not C++ or C99) assumes that sizeof(int) == 4" |
313 | | # endif |
314 | | typedef unsigned char BYTE; |
315 | | typedef unsigned short U16; |
316 | | typedef unsigned int U32; |
317 | | typedef signed int S32; |
318 | | typedef unsigned long long U64; |
319 | | typedef size_t uptrval; /* generally true, except OpenVMS-64 */ |
320 | | #endif |
321 | | |
322 | | #if defined(__x86_64__) |
323 | | typedef U64 reg_t; /* 64-bits in x32 mode */ |
324 | | #else |
325 | | typedef size_t reg_t; /* 32-bits in x32 mode */ |
326 | | #endif |
327 | | |
328 | | typedef enum { |
329 | | notLimited = 0, |
330 | | limitedOutput = 1, |
331 | | fillOutput = 2 |
332 | | } limitedOutput_directive; |
333 | | |
334 | | |
335 | | /*-************************************ |
336 | | * Reading and writing into memory |
337 | | **************************************/ |
338 | | |
339 | | /** |
340 | | * LZ4 relies on memcpy with a constant size being inlined. In freestanding |
341 | | * environments, the compiler can't assume the implementation of memcpy() is |
342 | | * standard compliant, so it can't apply its specialized memcpy() inlining |
343 | | * logic. When possible, use __builtin_memcpy() to tell the compiler to analyze |
344 | | * memcpy() as if it were standard compliant, so it can inline it in freestanding |
345 | | * environments. This is needed when decompressing the Linux Kernel, for example. |
346 | | */ |
347 | | #if !defined(LZ4_memcpy) |
348 | | # if defined(__GNUC__) && (__GNUC__ >= 4) |
349 | 111M | # define LZ4_memcpy(dst, src, size) __builtin_memcpy(dst, src, size) |
350 | | # else |
351 | | # define LZ4_memcpy(dst, src, size) memcpy(dst, src, size) |
352 | | # endif |
353 | | #endif |
354 | | |
355 | | #if !defined(LZ4_memmove) |
356 | | # if defined(__GNUC__) && (__GNUC__ >= 4) |
357 | 51.1k | # define LZ4_memmove __builtin_memmove |
358 | | # else |
359 | | # define LZ4_memmove memmove |
360 | | # endif |
361 | | #endif |
362 | | |
363 | | static unsigned LZ4_isLittleEndian(void) |
364 | 186M | { |
365 | 186M | const union { U32 u; BYTE c[4]; } one = { 1 }; /* don't use static : performance detrimental */ |
366 | 186M | return one.c[0]; |
367 | 186M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_isLittleEndian Unexecuted instantiation: lz4_helpers.c:LZ4_isLittleEndian Unexecuted instantiation: fuzz_data_producer.c:LZ4_isLittleEndian Line | Count | Source | 364 | 31.3M | { | 365 | 31.3M | const union { U32 u; BYTE c[4]; } one = { 1 }; /* don't use static : performance detrimental */ | 366 | 31.3M | return one.c[0]; | 367 | 31.3M | } |
lz4hc.c:LZ4_isLittleEndian Line | Count | Source | 364 | 155M | { | 365 | 155M | const union { U32 u; BYTE c[4]; } one = { 1 }; /* don't use static : performance detrimental */ | 366 | 155M | return one.c[0]; | 367 | 155M | } |
|
368 | | |
369 | | #if defined(__GNUC__) || defined(__INTEL_COMPILER) |
370 | | #define LZ4_PACK( __Declaration__ ) __Declaration__ __attribute__((__packed__)) |
371 | | #elif defined(_MSC_VER) |
372 | | #define LZ4_PACK( __Declaration__ ) __pragma( pack(push, 1) ) __Declaration__ __pragma( pack(pop)) |
373 | | #endif |
374 | | |
375 | | #if defined(LZ4_FORCE_MEMORY_ACCESS) && (LZ4_FORCE_MEMORY_ACCESS==2) |
376 | | /* lie to the compiler about data alignment; use with caution */ |
377 | | |
378 | | static U16 LZ4_read16(const void* memPtr) { return *(const U16*) memPtr; } |
379 | | static U32 LZ4_read32(const void* memPtr) { return *(const U32*) memPtr; } |
380 | | static reg_t LZ4_read_ARCH(const void* memPtr) { return *(const reg_t*) memPtr; } |
381 | | |
382 | | static void LZ4_write16(void* memPtr, U16 value) { *(U16*)memPtr = value; } |
383 | | static void LZ4_write32(void* memPtr, U32 value) { *(U32*)memPtr = value; } |
384 | | |
385 | | #elif defined(LZ4_FORCE_MEMORY_ACCESS) && (LZ4_FORCE_MEMORY_ACCESS==1) |
386 | | |
387 | | /* __pack instructions are safer, but compiler specific, hence potentially problematic for some compilers */ |
388 | | /* currently only defined for gcc and icc */ |
389 | | LZ4_PACK(typedef struct { U16 u16; }) LZ4_unalign16; |
390 | | LZ4_PACK(typedef struct { U32 u32; }) LZ4_unalign32; |
391 | | LZ4_PACK(typedef struct { reg_t uArch; }) LZ4_unalignST; |
392 | | |
393 | 1.09G | static U16 LZ4_read16(const void* ptr) { return ((const LZ4_unalign16*)ptr)->u16; } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_read16 Unexecuted instantiation: lz4_helpers.c:LZ4_read16 Unexecuted instantiation: fuzz_data_producer.c:LZ4_read16 Line | Count | Source | 393 | 10.2M | static U16 LZ4_read16(const void* ptr) { return ((const LZ4_unalign16*)ptr)->u16; } |
Line | Count | Source | 393 | 1.08G | static U16 LZ4_read16(const void* ptr) { return ((const LZ4_unalign16*)ptr)->u16; } |
|
394 | 2.24G | static U32 LZ4_read32(const void* ptr) { return ((const LZ4_unalign32*)ptr)->u32; } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_read32 Unexecuted instantiation: lz4_helpers.c:LZ4_read32 Unexecuted instantiation: fuzz_data_producer.c:LZ4_read32 Line | Count | Source | 394 | 41.0M | static U32 LZ4_read32(const void* ptr) { return ((const LZ4_unalign32*)ptr)->u32; } |
Line | Count | Source | 394 | 2.20G | static U32 LZ4_read32(const void* ptr) { return ((const LZ4_unalign32*)ptr)->u32; } |
|
395 | 1.52G | static reg_t LZ4_read_ARCH(const void* ptr) { return ((const LZ4_unalignST*)ptr)->uArch; } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_read_ARCH Unexecuted instantiation: lz4_helpers.c:LZ4_read_ARCH Unexecuted instantiation: fuzz_data_producer.c:LZ4_read_ARCH Line | Count | Source | 395 | 57.3M | static reg_t LZ4_read_ARCH(const void* ptr) { return ((const LZ4_unalignST*)ptr)->uArch; } |
Line | Count | Source | 395 | 1.47G | static reg_t LZ4_read_ARCH(const void* ptr) { return ((const LZ4_unalignST*)ptr)->uArch; } |
|
396 | | |
397 | 10.2M | static void LZ4_write16(void* memPtr, U16 value) { ((LZ4_unalign16*)memPtr)->u16 = value; } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_write16 Unexecuted instantiation: lz4_helpers.c:LZ4_write16 Unexecuted instantiation: fuzz_data_producer.c:LZ4_write16 Line | Count | Source | 397 | 2.97M | static void LZ4_write16(void* memPtr, U16 value) { ((LZ4_unalign16*)memPtr)->u16 = value; } |
Line | Count | Source | 397 | 7.28M | static void LZ4_write16(void* memPtr, U16 value) { ((LZ4_unalign16*)memPtr)->u16 = value; } |
|
398 | 1.00M | static void LZ4_write32(void* memPtr, U32 value) { ((LZ4_unalign32*)memPtr)->u32 = value; } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_write32 Unexecuted instantiation: lz4_helpers.c:LZ4_write32 Unexecuted instantiation: fuzz_data_producer.c:LZ4_write32 Line | Count | Source | 398 | 1.00M | static void LZ4_write32(void* memPtr, U32 value) { ((LZ4_unalign32*)memPtr)->u32 = value; } |
Unexecuted instantiation: lz4hc.c:LZ4_write32 |
399 | | |
400 | | #else /* safe and portable access using memcpy() */ |
401 | | |
402 | | static U16 LZ4_read16(const void* memPtr) |
403 | | { |
404 | | U16 val; LZ4_memcpy(&val, memPtr, sizeof(val)); return val; |
405 | | } |
406 | | |
407 | | static U32 LZ4_read32(const void* memPtr) |
408 | | { |
409 | | U32 val; LZ4_memcpy(&val, memPtr, sizeof(val)); return val; |
410 | | } |
411 | | |
412 | | static reg_t LZ4_read_ARCH(const void* memPtr) |
413 | | { |
414 | | reg_t val; LZ4_memcpy(&val, memPtr, sizeof(val)); return val; |
415 | | } |
416 | | |
417 | | static void LZ4_write16(void* memPtr, U16 value) |
418 | | { |
419 | | LZ4_memcpy(memPtr, &value, sizeof(value)); |
420 | | } |
421 | | |
422 | | static void LZ4_write32(void* memPtr, U32 value) |
423 | | { |
424 | | LZ4_memcpy(memPtr, &value, sizeof(value)); |
425 | | } |
426 | | |
427 | | #endif /* LZ4_FORCE_MEMORY_ACCESS */ |
428 | | |
429 | | |
430 | | static U16 LZ4_readLE16(const void* memPtr) |
431 | 10.2M | { |
432 | 10.2M | if (LZ4_isLittleEndian()) { |
433 | 10.2M | return LZ4_read16(memPtr); |
434 | 10.2M | } else { |
435 | 0 | const BYTE* p = (const BYTE*)memPtr; |
436 | 0 | return (U16)((U16)p[0] | (p[1]<<8)); |
437 | 0 | } |
438 | 10.2M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_readLE16 Unexecuted instantiation: lz4_helpers.c:LZ4_readLE16 Unexecuted instantiation: fuzz_data_producer.c:LZ4_readLE16 Line | Count | Source | 431 | 10.2M | { | 432 | 10.2M | if (LZ4_isLittleEndian()) { | 433 | 10.2M | return LZ4_read16(memPtr); | 434 | 10.2M | } else { | 435 | 0 | const BYTE* p = (const BYTE*)memPtr; | 436 | 0 | return (U16)((U16)p[0] | (p[1]<<8)); | 437 | 0 | } | 438 | 10.2M | } |
Unexecuted instantiation: lz4hc.c:LZ4_readLE16 |
439 | | |
440 | | #ifdef LZ4_STATIC_LINKING_ONLY_ENDIANNESS_INDEPENDENT_OUTPUT |
441 | | static U32 LZ4_readLE32(const void* memPtr) |
442 | | { |
443 | | if (LZ4_isLittleEndian()) { |
444 | | return LZ4_read32(memPtr); |
445 | | } else { |
446 | | const BYTE* p = (const BYTE*)memPtr; |
447 | | return (U32)p[0] | (p[1]<<8) | (p[2]<<16) | (p[3]<<24); |
448 | | } |
449 | | } |
450 | | #endif |
451 | | |
452 | | static void LZ4_writeLE16(void* memPtr, U16 value) |
453 | 10.2M | { |
454 | 10.2M | if (LZ4_isLittleEndian()) { |
455 | 10.2M | LZ4_write16(memPtr, value); |
456 | 10.2M | } else { |
457 | 0 | BYTE* p = (BYTE*)memPtr; |
458 | 0 | p[0] = (BYTE) value; |
459 | 0 | p[1] = (BYTE)(value>>8); |
460 | 0 | } |
461 | 10.2M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_writeLE16 Unexecuted instantiation: lz4_helpers.c:LZ4_writeLE16 Unexecuted instantiation: fuzz_data_producer.c:LZ4_writeLE16 Line | Count | Source | 453 | 2.97M | { | 454 | 2.97M | if (LZ4_isLittleEndian()) { | 455 | 2.97M | LZ4_write16(memPtr, value); | 456 | 2.97M | } else { | 457 | 0 | BYTE* p = (BYTE*)memPtr; | 458 | 0 | p[0] = (BYTE) value; | 459 | 0 | p[1] = (BYTE)(value>>8); | 460 | 0 | } | 461 | 2.97M | } |
Line | Count | Source | 453 | 7.28M | { | 454 | 7.28M | if (LZ4_isLittleEndian()) { | 455 | 7.28M | LZ4_write16(memPtr, value); | 456 | 7.28M | } else { | 457 | 0 | BYTE* p = (BYTE*)memPtr; | 458 | 0 | p[0] = (BYTE) value; | 459 | 0 | p[1] = (BYTE)(value>>8); | 460 | 0 | } | 461 | 7.28M | } |
|
462 | | |
463 | | /* customized variant of memcpy, which can overwrite up to 8 bytes beyond dstEnd */ |
464 | | LZ4_FORCE_INLINE |
465 | | void LZ4_wildCopy8(void* dstPtr, const void* srcPtr, void* dstEnd) |
466 | 8.82M | { |
467 | 8.82M | BYTE* d = (BYTE*)dstPtr; |
468 | 8.82M | const BYTE* s = (const BYTE*)srcPtr; |
469 | 8.82M | BYTE* const e = (BYTE*)dstEnd; |
470 | | |
471 | 38.5M | do { LZ4_memcpy(d,s,8); d+=8; s+=8; } while (d<e); |
472 | 8.82M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_wildCopy8 Unexecuted instantiation: lz4_helpers.c:LZ4_wildCopy8 Unexecuted instantiation: fuzz_data_producer.c:LZ4_wildCopy8 Line | Count | Source | 466 | 1.53M | { | 467 | 1.53M | BYTE* d = (BYTE*)dstPtr; | 468 | 1.53M | const BYTE* s = (const BYTE*)srcPtr; | 469 | 1.53M | BYTE* const e = (BYTE*)dstEnd; | 470 | | | 471 | 17.5M | do { LZ4_memcpy(d,s,8); d+=8; s+=8; } while (d<e); | 472 | 1.53M | } |
Line | Count | Source | 466 | 7.28M | { | 467 | 7.28M | BYTE* d = (BYTE*)dstPtr; | 468 | 7.28M | const BYTE* s = (const BYTE*)srcPtr; | 469 | 7.28M | BYTE* const e = (BYTE*)dstEnd; | 470 | | | 471 | 20.9M | do { LZ4_memcpy(d,s,8); d+=8; s+=8; } while (d<e); | 472 | 7.28M | } |
|
473 | | |
474 | | static const unsigned inc32table[8] = {0, 1, 2, 1, 0, 4, 4, 4}; |
475 | | static const int dec64table[8] = {0, 0, 0, -1, -4, 1, 2, 3}; |
476 | | |
477 | | |
478 | | #ifndef LZ4_FAST_DEC_LOOP |
479 | | # if defined __i386__ || defined _M_IX86 || defined __x86_64__ || defined _M_X64 |
480 | | # define LZ4_FAST_DEC_LOOP 1 |
481 | | # elif defined(__aarch64__) |
482 | | # if defined(__clang__) && defined(__ANDROID__) |
483 | | /* On Android aarch64, we disable this optimization for clang because |
484 | | * on certain mobile chipsets, performance is reduced with clang. For |
485 | | * more information refer to https://github.com/lz4/lz4/pull/707 */ |
486 | | # define LZ4_FAST_DEC_LOOP 0 |
487 | | # else |
488 | | # define LZ4_FAST_DEC_LOOP 1 |
489 | | # endif |
490 | | # else |
491 | | # define LZ4_FAST_DEC_LOOP 0 |
492 | | # endif |
493 | | #endif |
494 | | |
495 | | #if LZ4_FAST_DEC_LOOP |
496 | | |
497 | | LZ4_FORCE_INLINE void |
498 | | LZ4_memcpy_using_offset_base(BYTE* dstPtr, const BYTE* srcPtr, BYTE* dstEnd, const size_t offset) |
499 | 116k | { |
500 | 116k | assert(srcPtr + offset == dstPtr); |
501 | 116k | if (offset < 8) { |
502 | 98.1k | LZ4_write32(dstPtr, 0); /* silence an msan warning when offset==0 */ |
503 | 98.1k | dstPtr[0] = srcPtr[0]; |
504 | 98.1k | dstPtr[1] = srcPtr[1]; |
505 | 98.1k | dstPtr[2] = srcPtr[2]; |
506 | 98.1k | dstPtr[3] = srcPtr[3]; |
507 | 98.1k | srcPtr += inc32table[offset]; |
508 | 98.1k | LZ4_memcpy(dstPtr+4, srcPtr, 4); |
509 | 98.1k | srcPtr -= dec64table[offset]; |
510 | 98.1k | dstPtr += 8; |
511 | 98.1k | } else { |
512 | 18.1k | LZ4_memcpy(dstPtr, srcPtr, 8); |
513 | 18.1k | dstPtr += 8; |
514 | 18.1k | srcPtr += 8; |
515 | 18.1k | } |
516 | | |
517 | 116k | LZ4_wildCopy8(dstPtr, srcPtr, dstEnd); |
518 | 116k | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_memcpy_using_offset_base Unexecuted instantiation: lz4_helpers.c:LZ4_memcpy_using_offset_base Unexecuted instantiation: fuzz_data_producer.c:LZ4_memcpy_using_offset_base lz4.c:LZ4_memcpy_using_offset_base Line | Count | Source | 499 | 116k | { | 500 | 116k | assert(srcPtr + offset == dstPtr); | 501 | 116k | if (offset < 8) { | 502 | 98.1k | LZ4_write32(dstPtr, 0); /* silence an msan warning when offset==0 */ | 503 | 98.1k | dstPtr[0] = srcPtr[0]; | 504 | 98.1k | dstPtr[1] = srcPtr[1]; | 505 | 98.1k | dstPtr[2] = srcPtr[2]; | 506 | 98.1k | dstPtr[3] = srcPtr[3]; | 507 | 98.1k | srcPtr += inc32table[offset]; | 508 | 98.1k | LZ4_memcpy(dstPtr+4, srcPtr, 4); | 509 | 98.1k | srcPtr -= dec64table[offset]; | 510 | 98.1k | dstPtr += 8; | 511 | 98.1k | } else { | 512 | 18.1k | LZ4_memcpy(dstPtr, srcPtr, 8); | 513 | 18.1k | dstPtr += 8; | 514 | 18.1k | srcPtr += 8; | 515 | 18.1k | } | 516 | | | 517 | 116k | LZ4_wildCopy8(dstPtr, srcPtr, dstEnd); | 518 | 116k | } |
Unexecuted instantiation: lz4hc.c:LZ4_memcpy_using_offset_base |
519 | | |
520 | | /* customized variant of memcpy, which can overwrite up to 32 bytes beyond dstEnd |
521 | | * this version copies two times 16 bytes (instead of one time 32 bytes) |
522 | | * because it must be compatible with offsets >= 16. */ |
523 | | LZ4_FORCE_INLINE void |
524 | | LZ4_wildCopy32(void* dstPtr, const void* srcPtr, void* dstEnd) |
525 | 2.07M | { |
526 | 2.07M | BYTE* d = (BYTE*)dstPtr; |
527 | 2.07M | const BYTE* s = (const BYTE*)srcPtr; |
528 | 2.07M | BYTE* const e = (BYTE*)dstEnd; |
529 | | |
530 | 12.1M | do { LZ4_memcpy(d,s,16); LZ4_memcpy(d+16,s+16,16); d+=32; s+=32; } while (d<e); |
531 | 2.07M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_wildCopy32 Unexecuted instantiation: lz4_helpers.c:LZ4_wildCopy32 Unexecuted instantiation: fuzz_data_producer.c:LZ4_wildCopy32 Line | Count | Source | 525 | 2.07M | { | 526 | 2.07M | BYTE* d = (BYTE*)dstPtr; | 527 | 2.07M | const BYTE* s = (const BYTE*)srcPtr; | 528 | 2.07M | BYTE* const e = (BYTE*)dstEnd; | 529 | | | 530 | 12.1M | do { LZ4_memcpy(d,s,16); LZ4_memcpy(d+16,s+16,16); d+=32; s+=32; } while (d<e); | 531 | 2.07M | } |
Unexecuted instantiation: lz4hc.c:LZ4_wildCopy32 |
532 | | |
533 | | /* LZ4_memcpy_using_offset() presumes : |
534 | | * - dstEnd >= dstPtr + MINMATCH |
535 | | * - there is at least 12 bytes available to write after dstEnd */ |
536 | | LZ4_FORCE_INLINE void |
537 | | LZ4_memcpy_using_offset(BYTE* dstPtr, const BYTE* srcPtr, BYTE* dstEnd, const size_t offset) |
538 | 595k | { |
539 | 595k | BYTE v[8]; |
540 | | |
541 | 595k | assert(dstEnd >= dstPtr + MINMATCH); |
542 | | |
543 | 595k | switch(offset) { |
544 | 102k | case 1: |
545 | 102k | MEM_INIT(v, *srcPtr, 8); |
546 | 102k | break; |
547 | 332k | case 2: |
548 | 332k | LZ4_memcpy(v, srcPtr, 2); |
549 | 332k | LZ4_memcpy(&v[2], srcPtr, 2); |
550 | | #if defined(_MSC_VER) && (_MSC_VER <= 1937) /* MSVC 2022 ver 17.7 or earlier */ |
551 | | # pragma warning(push) |
552 | | # pragma warning(disable : 6385) /* warning C6385: Reading invalid data from 'v'. */ |
553 | | #endif |
554 | 332k | LZ4_memcpy(&v[4], v, 4); |
555 | | #if defined(_MSC_VER) && (_MSC_VER <= 1937) /* MSVC 2022 ver 17.7 or earlier */ |
556 | | # pragma warning(pop) |
557 | | #endif |
558 | 332k | break; |
559 | 44.4k | case 4: |
560 | 44.4k | LZ4_memcpy(v, srcPtr, 4); |
561 | 44.4k | LZ4_memcpy(&v[4], srcPtr, 4); |
562 | 44.4k | break; |
563 | 116k | default: |
564 | 116k | LZ4_memcpy_using_offset_base(dstPtr, srcPtr, dstEnd, offset); |
565 | 116k | return; |
566 | 595k | } |
567 | | |
568 | 479k | LZ4_memcpy(dstPtr, v, 8); |
569 | 479k | dstPtr += 8; |
570 | 13.1M | while (dstPtr < dstEnd) { |
571 | 12.6M | LZ4_memcpy(dstPtr, v, 8); |
572 | 12.6M | dstPtr += 8; |
573 | 12.6M | } |
574 | 479k | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_memcpy_using_offset Unexecuted instantiation: lz4_helpers.c:LZ4_memcpy_using_offset Unexecuted instantiation: fuzz_data_producer.c:LZ4_memcpy_using_offset lz4.c:LZ4_memcpy_using_offset Line | Count | Source | 538 | 595k | { | 539 | 595k | BYTE v[8]; | 540 | | | 541 | 595k | assert(dstEnd >= dstPtr + MINMATCH); | 542 | | | 543 | 595k | switch(offset) { | 544 | 102k | case 1: | 545 | 102k | MEM_INIT(v, *srcPtr, 8); | 546 | 102k | break; | 547 | 332k | case 2: | 548 | 332k | LZ4_memcpy(v, srcPtr, 2); | 549 | 332k | LZ4_memcpy(&v[2], srcPtr, 2); | 550 | | #if defined(_MSC_VER) && (_MSC_VER <= 1937) /* MSVC 2022 ver 17.7 or earlier */ | 551 | | # pragma warning(push) | 552 | | # pragma warning(disable : 6385) /* warning C6385: Reading invalid data from 'v'. */ | 553 | | #endif | 554 | 332k | LZ4_memcpy(&v[4], v, 4); | 555 | | #if defined(_MSC_VER) && (_MSC_VER <= 1937) /* MSVC 2022 ver 17.7 or earlier */ | 556 | | # pragma warning(pop) | 557 | | #endif | 558 | 332k | break; | 559 | 44.4k | case 4: | 560 | 44.4k | LZ4_memcpy(v, srcPtr, 4); | 561 | 44.4k | LZ4_memcpy(&v[4], srcPtr, 4); | 562 | 44.4k | break; | 563 | 116k | default: | 564 | 116k | LZ4_memcpy_using_offset_base(dstPtr, srcPtr, dstEnd, offset); | 565 | 116k | return; | 566 | 595k | } | 567 | | | 568 | 479k | LZ4_memcpy(dstPtr, v, 8); | 569 | 479k | dstPtr += 8; | 570 | 13.1M | while (dstPtr < dstEnd) { | 571 | 12.6M | LZ4_memcpy(dstPtr, v, 8); | 572 | 12.6M | dstPtr += 8; | 573 | 12.6M | } | 574 | 479k | } |
Unexecuted instantiation: lz4hc.c:LZ4_memcpy_using_offset |
575 | | #endif |
576 | | |
577 | | |
578 | | /*-************************************ |
579 | | * Common functions |
580 | | **************************************/ |
581 | | static unsigned LZ4_NbCommonBytes (reg_t val) |
582 | 111M | { |
583 | 111M | assert(val != 0); |
584 | 111M | if (LZ4_isLittleEndian()) { |
585 | 111M | if (sizeof(val) == 8) { |
586 | | # if defined(_MSC_VER) && (_MSC_VER >= 1800) && (defined(_M_AMD64) && !defined(_M_ARM64EC)) && !defined(LZ4_FORCE_SW_BITCOUNT) |
587 | | /*-************************************************************************************************* |
588 | | * ARM64EC is a Microsoft-designed ARM64 ABI compatible with AMD64 applications on ARM64 Windows 11. |
589 | | * The ARM64EC ABI does not support AVX/AVX2/AVX512 instructions, nor their relevant intrinsics |
590 | | * including _tzcnt_u64. Therefore, we need to neuter the _tzcnt_u64 code path for ARM64EC. |
591 | | ****************************************************************************************************/ |
592 | | # if defined(__clang__) && (__clang_major__ < 10) |
593 | | /* Avoid undefined clang-cl intrinsics issue. |
594 | | * See https://github.com/lz4/lz4/pull/1017 for details. */ |
595 | | return (unsigned)__builtin_ia32_tzcnt_u64(val) >> 3; |
596 | | # else |
597 | | /* x64 CPUS without BMI support interpret `TZCNT` as `REP BSF` */ |
598 | | return (unsigned)_tzcnt_u64(val) >> 3; |
599 | | # endif |
600 | | # elif defined(_MSC_VER) && defined(_WIN64) && !defined(LZ4_FORCE_SW_BITCOUNT) |
601 | | unsigned long r = 0; |
602 | | _BitScanForward64(&r, (U64)val); |
603 | | return (unsigned)r >> 3; |
604 | | # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ |
605 | | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ |
606 | | !defined(LZ4_FORCE_SW_BITCOUNT) |
607 | | return (unsigned)__builtin_ctzll((U64)val) >> 3; |
608 | | # else |
609 | | const U64 m = 0x0101010101010101ULL; |
610 | | val ^= val - 1; |
611 | | return (unsigned)(((U64)((val & (m - 1)) * m)) >> 56); |
612 | | # endif |
613 | 111M | } else /* 32 bits */ { |
614 | | # if defined(_MSC_VER) && (_MSC_VER >= 1400) && !defined(LZ4_FORCE_SW_BITCOUNT) |
615 | | unsigned long r; |
616 | | _BitScanForward(&r, (U32)val); |
617 | | return (unsigned)r >> 3; |
618 | | # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ |
619 | | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ |
620 | | !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT) |
621 | | return (unsigned)__builtin_ctz((U32)val) >> 3; |
622 | | # else |
623 | | const U32 m = 0x01010101; |
624 | | return (unsigned)((((val - 1) ^ val) & (m - 1)) * m) >> 24; |
625 | | # endif |
626 | 0 | } |
627 | 111M | } else /* Big Endian CPU */ { |
628 | 0 | if (sizeof(val)==8) { |
629 | 0 | # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ |
630 | 0 | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ |
631 | 0 | !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT) |
632 | 0 | return (unsigned)__builtin_clzll((U64)val) >> 3; |
633 | | # else |
634 | | #if 1 |
635 | | /* this method is probably faster, |
636 | | * but adds a 128 bytes lookup table */ |
637 | | static const unsigned char ctz7_tab[128] = { |
638 | | 7, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
639 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
640 | | 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
641 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
642 | | 6, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
643 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
644 | | 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
645 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, |
646 | | }; |
647 | | U64 const mask = 0x0101010101010101ULL; |
648 | | U64 const t = (((val >> 8) - mask) | val) & mask; |
649 | | return ctz7_tab[(t * 0x0080402010080402ULL) >> 57]; |
650 | | #else |
651 | | /* this method doesn't consume memory space like the previous one, |
652 | | * but it contains several branches, |
653 | | * that may end up slowing execution */ |
654 | | static const U32 by32 = sizeof(val)*4; /* 32 on 64 bits (goal), 16 on 32 bits. |
655 | | Just to avoid some static analyzer complaining about shift by 32 on 32-bits target. |
656 | | Note that this code path is never triggered in 32-bits mode. */ |
657 | | unsigned r; |
658 | | if (!(val>>by32)) { r=4; } else { r=0; val>>=by32; } |
659 | | if (!(val>>16)) { r+=2; val>>=8; } else { val>>=24; } |
660 | | r += (!val); |
661 | | return r; |
662 | | #endif |
663 | | # endif |
664 | 0 | } else /* 32 bits */ { |
665 | 0 | # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ |
666 | 0 | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ |
667 | 0 | !defined(LZ4_FORCE_SW_BITCOUNT) |
668 | 0 | return (unsigned)__builtin_clz((U32)val) >> 3; |
669 | | # else |
670 | | val >>= 8; |
671 | | val = ((((val + 0x00FFFF00) | 0x00FFFFFF) + val) | |
672 | | (val + 0x00FF0000)) >> 24; |
673 | | return (unsigned)val ^ 3; |
674 | | # endif |
675 | 0 | } |
676 | 0 | } |
677 | 111M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_NbCommonBytes Unexecuted instantiation: lz4_helpers.c:LZ4_NbCommonBytes Unexecuted instantiation: fuzz_data_producer.c:LZ4_NbCommonBytes Line | Count | Source | 582 | 2.97M | { | 583 | 2.97M | assert(val != 0); | 584 | 2.97M | if (LZ4_isLittleEndian()) { | 585 | 2.97M | if (sizeof(val) == 8) { | 586 | | # if defined(_MSC_VER) && (_MSC_VER >= 1800) && (defined(_M_AMD64) && !defined(_M_ARM64EC)) && !defined(LZ4_FORCE_SW_BITCOUNT) | 587 | | /*-************************************************************************************************* | 588 | | * ARM64EC is a Microsoft-designed ARM64 ABI compatible with AMD64 applications on ARM64 Windows 11. | 589 | | * The ARM64EC ABI does not support AVX/AVX2/AVX512 instructions, nor their relevant intrinsics | 590 | | * including _tzcnt_u64. Therefore, we need to neuter the _tzcnt_u64 code path for ARM64EC. | 591 | | ****************************************************************************************************/ | 592 | | # if defined(__clang__) && (__clang_major__ < 10) | 593 | | /* Avoid undefined clang-cl intrinsics issue. | 594 | | * See https://github.com/lz4/lz4/pull/1017 for details. */ | 595 | | return (unsigned)__builtin_ia32_tzcnt_u64(val) >> 3; | 596 | | # else | 597 | | /* x64 CPUS without BMI support interpret `TZCNT` as `REP BSF` */ | 598 | | return (unsigned)_tzcnt_u64(val) >> 3; | 599 | | # endif | 600 | | # elif defined(_MSC_VER) && defined(_WIN64) && !defined(LZ4_FORCE_SW_BITCOUNT) | 601 | | unsigned long r = 0; | 602 | | _BitScanForward64(&r, (U64)val); | 603 | | return (unsigned)r >> 3; | 604 | | # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 605 | | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 606 | | !defined(LZ4_FORCE_SW_BITCOUNT) | 607 | | return (unsigned)__builtin_ctzll((U64)val) >> 3; | 608 | | # else | 609 | | const U64 m = 0x0101010101010101ULL; | 610 | | val ^= val - 1; | 611 | | return (unsigned)(((U64)((val & (m - 1)) * m)) >> 56); | 612 | | # endif | 613 | 2.97M | } else /* 32 bits */ { | 614 | | # if defined(_MSC_VER) && (_MSC_VER >= 1400) && !defined(LZ4_FORCE_SW_BITCOUNT) | 615 | | unsigned long r; | 616 | | _BitScanForward(&r, (U32)val); | 617 | | return (unsigned)r >> 3; | 618 | | # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 619 | | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 620 | | !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT) | 621 | | return (unsigned)__builtin_ctz((U32)val) >> 3; | 622 | | # else | 623 | | const U32 m = 0x01010101; | 624 | | return (unsigned)((((val - 1) ^ val) & (m - 1)) * m) >> 24; | 625 | | # endif | 626 | 0 | } | 627 | 2.97M | } else /* Big Endian CPU */ { | 628 | 0 | if (sizeof(val)==8) { | 629 | 0 | # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 630 | 0 | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 631 | 0 | !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT) | 632 | 0 | return (unsigned)__builtin_clzll((U64)val) >> 3; | 633 | | # else | 634 | | #if 1 | 635 | | /* this method is probably faster, | 636 | | * but adds a 128 bytes lookup table */ | 637 | | static const unsigned char ctz7_tab[128] = { | 638 | | 7, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 639 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 640 | | 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 641 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 642 | | 6, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 643 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 644 | | 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 645 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 646 | | }; | 647 | | U64 const mask = 0x0101010101010101ULL; | 648 | | U64 const t = (((val >> 8) - mask) | val) & mask; | 649 | | return ctz7_tab[(t * 0x0080402010080402ULL) >> 57]; | 650 | | #else | 651 | | /* this method doesn't consume memory space like the previous one, | 652 | | * but it contains several branches, | 653 | | * that may end up slowing execution */ | 654 | | static const U32 by32 = sizeof(val)*4; /* 32 on 64 bits (goal), 16 on 32 bits. | 655 | | Just to avoid some static analyzer complaining about shift by 32 on 32-bits target. | 656 | | Note that this code path is never triggered in 32-bits mode. */ | 657 | | unsigned r; | 658 | | if (!(val>>by32)) { r=4; } else { r=0; val>>=by32; } | 659 | | if (!(val>>16)) { r+=2; val>>=8; } else { val>>=24; } | 660 | | r += (!val); | 661 | | return r; | 662 | | #endif | 663 | | # endif | 664 | 0 | } else /* 32 bits */ { | 665 | 0 | # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 666 | 0 | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 667 | 0 | !defined(LZ4_FORCE_SW_BITCOUNT) | 668 | 0 | return (unsigned)__builtin_clz((U32)val) >> 3; | 669 | | # else | 670 | | val >>= 8; | 671 | | val = ((((val + 0x00FFFF00) | 0x00FFFFFF) + val) | | 672 | | (val + 0x00FF0000)) >> 24; | 673 | | return (unsigned)val ^ 3; | 674 | | # endif | 675 | 0 | } | 676 | 0 | } | 677 | 2.97M | } |
lz4hc.c:LZ4_NbCommonBytes Line | Count | Source | 582 | 108M | { | 583 | 108M | assert(val != 0); | 584 | 108M | if (LZ4_isLittleEndian()) { | 585 | 108M | if (sizeof(val) == 8) { | 586 | | # if defined(_MSC_VER) && (_MSC_VER >= 1800) && (defined(_M_AMD64) && !defined(_M_ARM64EC)) && !defined(LZ4_FORCE_SW_BITCOUNT) | 587 | | /*-************************************************************************************************* | 588 | | * ARM64EC is a Microsoft-designed ARM64 ABI compatible with AMD64 applications on ARM64 Windows 11. | 589 | | * The ARM64EC ABI does not support AVX/AVX2/AVX512 instructions, nor their relevant intrinsics | 590 | | * including _tzcnt_u64. Therefore, we need to neuter the _tzcnt_u64 code path for ARM64EC. | 591 | | ****************************************************************************************************/ | 592 | | # if defined(__clang__) && (__clang_major__ < 10) | 593 | | /* Avoid undefined clang-cl intrinsics issue. | 594 | | * See https://github.com/lz4/lz4/pull/1017 for details. */ | 595 | | return (unsigned)__builtin_ia32_tzcnt_u64(val) >> 3; | 596 | | # else | 597 | | /* x64 CPUS without BMI support interpret `TZCNT` as `REP BSF` */ | 598 | | return (unsigned)_tzcnt_u64(val) >> 3; | 599 | | # endif | 600 | | # elif defined(_MSC_VER) && defined(_WIN64) && !defined(LZ4_FORCE_SW_BITCOUNT) | 601 | | unsigned long r = 0; | 602 | | _BitScanForward64(&r, (U64)val); | 603 | | return (unsigned)r >> 3; | 604 | | # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 605 | | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 606 | | !defined(LZ4_FORCE_SW_BITCOUNT) | 607 | | return (unsigned)__builtin_ctzll((U64)val) >> 3; | 608 | | # else | 609 | | const U64 m = 0x0101010101010101ULL; | 610 | | val ^= val - 1; | 611 | | return (unsigned)(((U64)((val & (m - 1)) * m)) >> 56); | 612 | | # endif | 613 | 108M | } else /* 32 bits */ { | 614 | | # if defined(_MSC_VER) && (_MSC_VER >= 1400) && !defined(LZ4_FORCE_SW_BITCOUNT) | 615 | | unsigned long r; | 616 | | _BitScanForward(&r, (U32)val); | 617 | | return (unsigned)r >> 3; | 618 | | # elif (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 619 | | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 620 | | !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT) | 621 | | return (unsigned)__builtin_ctz((U32)val) >> 3; | 622 | | # else | 623 | | const U32 m = 0x01010101; | 624 | | return (unsigned)((((val - 1) ^ val) & (m - 1)) * m) >> 24; | 625 | | # endif | 626 | 0 | } | 627 | 108M | } else /* Big Endian CPU */ { | 628 | 0 | if (sizeof(val)==8) { | 629 | 0 | # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 630 | 0 | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 631 | 0 | !defined(__TINYC__) && !defined(LZ4_FORCE_SW_BITCOUNT) | 632 | 0 | return (unsigned)__builtin_clzll((U64)val) >> 3; | 633 | | # else | 634 | | #if 1 | 635 | | /* this method is probably faster, | 636 | | * but adds a 128 bytes lookup table */ | 637 | | static const unsigned char ctz7_tab[128] = { | 638 | | 7, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 639 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 640 | | 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 641 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 642 | | 6, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 643 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 644 | | 5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 645 | | 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, | 646 | | }; | 647 | | U64 const mask = 0x0101010101010101ULL; | 648 | | U64 const t = (((val >> 8) - mask) | val) & mask; | 649 | | return ctz7_tab[(t * 0x0080402010080402ULL) >> 57]; | 650 | | #else | 651 | | /* this method doesn't consume memory space like the previous one, | 652 | | * but it contains several branches, | 653 | | * that may end up slowing execution */ | 654 | | static const U32 by32 = sizeof(val)*4; /* 32 on 64 bits (goal), 16 on 32 bits. | 655 | | Just to avoid some static analyzer complaining about shift by 32 on 32-bits target. | 656 | | Note that this code path is never triggered in 32-bits mode. */ | 657 | | unsigned r; | 658 | | if (!(val>>by32)) { r=4; } else { r=0; val>>=by32; } | 659 | | if (!(val>>16)) { r+=2; val>>=8; } else { val>>=24; } | 660 | | r += (!val); | 661 | | return r; | 662 | | #endif | 663 | | # endif | 664 | 0 | } else /* 32 bits */ { | 665 | 0 | # if (defined(__clang__) || (defined(__GNUC__) && ((__GNUC__ > 3) || \ | 666 | 0 | ((__GNUC__ == 3) && (__GNUC_MINOR__ >= 4))))) && \ | 667 | 0 | !defined(LZ4_FORCE_SW_BITCOUNT) | 668 | 0 | return (unsigned)__builtin_clz((U32)val) >> 3; | 669 | | # else | 670 | | val >>= 8; | 671 | | val = ((((val + 0x00FFFF00) | 0x00FFFFFF) + val) | | 672 | | (val + 0x00FF0000)) >> 24; | 673 | | return (unsigned)val ^ 3; | 674 | | # endif | 675 | 0 | } | 676 | 0 | } | 677 | 108M | } |
|
678 | | |
679 | | |
680 | 1.26G | #define STEPSIZE sizeof(reg_t) |
681 | | LZ4_FORCE_INLINE |
682 | | unsigned LZ4_count(const BYTE* pIn, const BYTE* pMatch, const BYTE* pInLimit) |
683 | 63.1M | { |
684 | 63.1M | const BYTE* const pStart = pIn; |
685 | | |
686 | 63.1M | if (likely(pIn < pInLimit-(STEPSIZE-1))) { |
687 | 63.0M | reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn); |
688 | 63.0M | if (!diff) { |
689 | 12.8M | pIn+=STEPSIZE; pMatch+=STEPSIZE; |
690 | 50.1M | } else { |
691 | 50.1M | return LZ4_NbCommonBytes(diff); |
692 | 50.1M | } } |
693 | | |
694 | 631M | while (likely(pIn < pInLimit-(STEPSIZE-1))) { |
695 | 631M | reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn); |
696 | 631M | if (!diff) { pIn+=STEPSIZE; pMatch+=STEPSIZE; continue; } |
697 | 12.3M | pIn += LZ4_NbCommonBytes(diff); |
698 | 12.3M | return (unsigned)(pIn - pStart); |
699 | 631M | } |
700 | | |
701 | 636k | if ((STEPSIZE==8) && (pIn<(pInLimit-3)) && (LZ4_read32(pMatch) == LZ4_read32(pIn))) { pIn+=4; pMatch+=4; } |
702 | 636k | if ((pIn<(pInLimit-1)) && (LZ4_read16(pMatch) == LZ4_read16(pIn))) { pIn+=2; pMatch+=2; } |
703 | 636k | if ((pIn<pInLimit) && (*pMatch == *pIn)) pIn++; |
704 | 636k | return (unsigned)(pIn - pStart); |
705 | 12.9M | } Unexecuted instantiation: round_trip_frame_fuzzer.c:LZ4_count Unexecuted instantiation: lz4_helpers.c:LZ4_count Unexecuted instantiation: fuzz_data_producer.c:LZ4_count Line | Count | Source | 683 | 2.97M | { | 684 | 2.97M | const BYTE* const pStart = pIn; | 685 | | | 686 | 2.97M | if (likely(pIn < pInLimit-(STEPSIZE-1))) { | 687 | 2.97M | reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn); | 688 | 2.97M | if (!diff) { | 689 | 1.05M | pIn+=STEPSIZE; pMatch+=STEPSIZE; | 690 | 1.91M | } else { | 691 | 1.91M | return LZ4_NbCommonBytes(diff); | 692 | 1.91M | } } | 693 | | | 694 | 18.1M | while (likely(pIn < pInLimit-(STEPSIZE-1))) { | 695 | 18.1M | reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn); | 696 | 18.1M | if (!diff) { pIn+=STEPSIZE; pMatch+=STEPSIZE; continue; } | 697 | 1.05M | pIn += LZ4_NbCommonBytes(diff); | 698 | 1.05M | return (unsigned)(pIn - pStart); | 699 | 18.1M | } | 700 | | | 701 | 2.58k | if ((STEPSIZE==8) && (pIn<(pInLimit-3)) && (LZ4_read32(pMatch) == LZ4_read32(pIn))) { pIn+=4; pMatch+=4; } | 702 | 2.58k | if ((pIn<(pInLimit-1)) && (LZ4_read16(pMatch) == LZ4_read16(pIn))) { pIn+=2; pMatch+=2; } | 703 | 2.58k | if ((pIn<pInLimit) && (*pMatch == *pIn)) pIn++; | 704 | 2.58k | return (unsigned)(pIn - pStart); | 705 | 1.05M | } |
Line | Count | Source | 683 | 60.1M | { | 684 | 60.1M | const BYTE* const pStart = pIn; | 685 | | | 686 | 60.1M | if (likely(pIn < pInLimit-(STEPSIZE-1))) { | 687 | 60.0M | reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn); | 688 | 60.0M | if (!diff) { | 689 | 11.7M | pIn+=STEPSIZE; pMatch+=STEPSIZE; | 690 | 48.2M | } else { | 691 | 48.2M | return LZ4_NbCommonBytes(diff); | 692 | 48.2M | } } | 693 | | | 694 | 613M | while (likely(pIn < pInLimit-(STEPSIZE-1))) { | 695 | 613M | reg_t const diff = LZ4_read_ARCH(pMatch) ^ LZ4_read_ARCH(pIn); | 696 | 613M | if (!diff) { pIn+=STEPSIZE; pMatch+=STEPSIZE; continue; } | 697 | 11.2M | pIn += LZ4_NbCommonBytes(diff); | 698 | 11.2M | return (unsigned)(pIn - pStart); | 699 | 613M | } | 700 | | | 701 | 633k | if ((STEPSIZE==8) && (pIn<(pInLimit-3)) && (LZ4_read32(pMatch) == LZ4_read32(pIn))) { pIn+=4; pMatch+=4; } | 702 | 633k | if ((pIn<(pInLimit-1)) && (LZ4_read16(pMatch) == LZ4_read16(pIn))) { pIn+=2; pMatch+=2; } | 703 | 633k | if ((pIn<pInLimit) && (*pMatch == *pIn)) pIn++; | 704 | 633k | return (unsigned)(pIn - pStart); | 705 | 11.8M | } |
|
706 | | |
707 | | |
708 | | #ifndef LZ4_COMMONDEFS_ONLY |
709 | | /*-************************************ |
710 | | * Local Constants |
711 | | **************************************/ |
712 | | static const int LZ4_64Klimit = ((64 KB) + (MFLIMIT-1)); |
713 | | static const U32 LZ4_skipTrigger = 6; /* Increase this value ==> compression run slower on incompressible data */ |
714 | | |
715 | | |
716 | | /*-************************************ |
717 | | * Local Structures and types |
718 | | **************************************/ |
719 | | typedef enum { clearedTable = 0, byPtr, byU32, byU16 } tableType_t; |
720 | | |
721 | | /** |
722 | | * This enum distinguishes several different modes of accessing previous |
723 | | * content in the stream. |
724 | | * |
725 | | * - noDict : There is no preceding content. |
726 | | * - withPrefix64k : Table entries up to ctx->dictSize before the current blob |
727 | | * blob being compressed are valid and refer to the preceding |
728 | | * content (of length ctx->dictSize), which is available |
729 | | * contiguously preceding in memory the content currently |
730 | | * being compressed. |
731 | | * - usingExtDict : Like withPrefix64k, but the preceding content is somewhere |
732 | | * else in memory, starting at ctx->dictionary with length |
733 | | * ctx->dictSize. |
734 | | * - usingDictCtx : Everything concerning the preceding content is |
735 | | * in a separate context, pointed to by ctx->dictCtx. |
736 | | * ctx->dictionary, ctx->dictSize, and table entries |
737 | | * in the current context that refer to positions |
738 | | * preceding the beginning of the current compression are |
739 | | * ignored. Instead, ctx->dictCtx->dictionary and ctx->dictCtx |
740 | | * ->dictSize describe the location and size of the preceding |
741 | | * content, and matches are found by looking in the ctx |
742 | | * ->dictCtx->hashTable. |
743 | | */ |
744 | | typedef enum { noDict = 0, withPrefix64k, usingExtDict, usingDictCtx } dict_directive; |
745 | | typedef enum { noDictIssue = 0, dictSmall } dictIssue_directive; |
746 | | |
747 | | |
748 | | /*-************************************ |
749 | | * Local Utils |
750 | | **************************************/ |
751 | 0 | int LZ4_versionNumber (void) { return LZ4_VERSION_NUMBER; } |
752 | 0 | const char* LZ4_versionString(void) { return LZ4_VERSION_STRING; } |
753 | 24.9k | int LZ4_compressBound(int isize) { return LZ4_COMPRESSBOUND(isize); } |
754 | 3.23k | int LZ4_sizeofState(void) { return sizeof(LZ4_stream_t); } |
755 | | |
756 | | |
757 | | /*-**************************************** |
758 | | * Internal Definitions, used only in Tests |
759 | | *******************************************/ |
760 | | #if defined (__cplusplus) |
761 | | extern "C" { |
762 | | #endif |
763 | | |
764 | | int LZ4_compress_forceExtDict (LZ4_stream_t* LZ4_dict, const char* source, char* dest, int srcSize); |
765 | | |
766 | | int LZ4_decompress_safe_forceExtDict(const char* source, char* dest, |
767 | | int compressedSize, int maxOutputSize, |
768 | | const void* dictStart, size_t dictSize); |
769 | | int LZ4_decompress_safe_partial_forceExtDict(const char* source, char* dest, |
770 | | int compressedSize, int targetOutputSize, int dstCapacity, |
771 | | const void* dictStart, size_t dictSize); |
772 | | #if defined (__cplusplus) |
773 | | } |
774 | | #endif |
775 | | |
776 | | /*-****************************** |
777 | | * Compression functions |
778 | | ********************************/ |
779 | | LZ4_FORCE_INLINE U32 LZ4_hash4(U32 sequence, tableType_t const tableType) |
780 | 7.31M | { |
781 | 7.31M | if (tableType == byU16) |
782 | 7.31M | return ((sequence * 2654435761U) >> ((MINMATCH*8)-(LZ4_HASHLOG+1))); |
783 | 0 | else |
784 | 0 | return ((sequence * 2654435761U) >> ((MINMATCH*8)-LZ4_HASHLOG)); |
785 | 7.31M | } |
786 | | |
787 | | LZ4_FORCE_INLINE U32 LZ4_hash5(U64 sequence, tableType_t const tableType) |
788 | 15.1M | { |
789 | 15.1M | const U32 hashLog = (tableType == byU16) ? LZ4_HASHLOG+1 : LZ4_HASHLOG; |
790 | 15.1M | if (LZ4_isLittleEndian()) { |
791 | 15.1M | const U64 prime5bytes = 889523592379ULL; |
792 | 15.1M | return (U32)(((sequence << 24) * prime5bytes) >> (64 - hashLog)); |
793 | 15.1M | } else { |
794 | 0 | const U64 prime8bytes = 11400714785074694791ULL; |
795 | 0 | return (U32)(((sequence >> 24) * prime8bytes) >> (64 - hashLog)); |
796 | 0 | } |
797 | 15.1M | } |
798 | | |
799 | | LZ4_FORCE_INLINE U32 LZ4_hashPosition(const void* const p, tableType_t const tableType) |
800 | 22.4M | { |
801 | 22.4M | if ((sizeof(reg_t)==8) && (tableType != byU16)) return LZ4_hash5(LZ4_read_ARCH(p), tableType); |
802 | | |
803 | | #ifdef LZ4_STATIC_LINKING_ONLY_ENDIANNESS_INDEPENDENT_OUTPUT |
804 | | return LZ4_hash4(LZ4_readLE32(p), tableType); |
805 | | #else |
806 | 7.31M | return LZ4_hash4(LZ4_read32(p), tableType); |
807 | 22.4M | #endif |
808 | 22.4M | } |
809 | | |
810 | | LZ4_FORCE_INLINE void LZ4_clearHash(U32 h, void* tableBase, tableType_t const tableType) |
811 | 0 | { |
812 | 0 | switch (tableType) |
813 | 0 | { |
814 | 0 | default: /* fallthrough */ |
815 | 0 | case clearedTable: { /* illegal! */ assert(0); return; } |
816 | 0 | case byPtr: { const BYTE** hashTable = (const BYTE**)tableBase; hashTable[h] = NULL; return; } |
817 | 0 | case byU32: { U32* hashTable = (U32*) tableBase; hashTable[h] = 0; return; } |
818 | 0 | case byU16: { U16* hashTable = (U16*) tableBase; hashTable[h] = 0; return; } |
819 | 0 | } |
820 | 0 | } |
821 | | |
822 | | LZ4_FORCE_INLINE void LZ4_putIndexOnHash(U32 idx, U32 h, void* tableBase, tableType_t const tableType) |
823 | 21.0M | { |
824 | 21.0M | switch (tableType) |
825 | 21.0M | { |
826 | 0 | default: /* fallthrough */ |
827 | 0 | case clearedTable: /* fallthrough */ |
828 | 0 | case byPtr: { /* illegal! */ assert(0); return; } |
829 | 14.1M | case byU32: { U32* hashTable = (U32*) tableBase; hashTable[h] = idx; return; } |
830 | 6.94M | case byU16: { U16* hashTable = (U16*) tableBase; assert(idx < 65536); hashTable[h] = (U16)idx; return; } |
831 | 21.0M | } |
832 | 21.0M | } |
833 | | |
834 | | /* LZ4_putPosition*() : only used in byPtr mode */ |
835 | | LZ4_FORCE_INLINE void LZ4_putPositionOnHash(const BYTE* p, U32 h, |
836 | | void* tableBase, tableType_t const tableType) |
837 | 0 | { |
838 | 0 | const BYTE** const hashTable = (const BYTE**)tableBase; |
839 | 0 | assert(tableType == byPtr); (void)tableType; |
840 | 0 | hashTable[h] = p; |
841 | 0 | } |
842 | | |
843 | | LZ4_FORCE_INLINE void LZ4_putPosition(const BYTE* p, void* tableBase, tableType_t tableType) |
844 | 0 | { |
845 | 0 | U32 const h = LZ4_hashPosition(p, tableType); |
846 | 0 | LZ4_putPositionOnHash(p, h, tableBase, tableType); |
847 | 0 | } |
848 | | |
849 | | /* LZ4_getIndexOnHash() : |
850 | | * Index of match position registered in hash table. |
851 | | * hash position must be calculated by using base+index, or dictBase+index. |
852 | | * Assumption 1 : only valid if tableType == byU32 or byU16. |
853 | | * Assumption 2 : h is presumed valid (within limits of hash table) |
854 | | */ |
855 | | LZ4_FORCE_INLINE U32 LZ4_getIndexOnHash(U32 h, const void* tableBase, tableType_t tableType) |
856 | 18.1M | { |
857 | 18.1M | LZ4_STATIC_ASSERT(LZ4_MEMORY_USAGE > 2); |
858 | 18.1M | if (tableType == byU32) { |
859 | 12.3M | const U32* const hashTable = (const U32*) tableBase; |
860 | 12.3M | assert(h < (1U << (LZ4_MEMORY_USAGE-2))); |
861 | 12.3M | return hashTable[h]; |
862 | 12.3M | } |
863 | 5.75M | if (tableType == byU16) { |
864 | 5.75M | const U16* const hashTable = (const U16*) tableBase; |
865 | 5.75M | assert(h < (1U << (LZ4_MEMORY_USAGE-1))); |
866 | 5.75M | return hashTable[h]; |
867 | 5.75M | } |
868 | 0 | assert(0); return 0; /* forbidden case */ |
869 | 0 | } |
870 | | |
871 | | static const BYTE* LZ4_getPositionOnHash(U32 h, const void* tableBase, tableType_t tableType) |
872 | 0 | { |
873 | 0 | assert(tableType == byPtr); (void)tableType; |
874 | 0 | { const BYTE* const* hashTable = (const BYTE* const*) tableBase; return hashTable[h]; } |
875 | 0 | } |
876 | | |
877 | | LZ4_FORCE_INLINE const BYTE* |
878 | | LZ4_getPosition(const BYTE* p, |
879 | | const void* tableBase, tableType_t tableType) |
880 | 0 | { |
881 | 0 | U32 const h = LZ4_hashPosition(p, tableType); |
882 | 0 | return LZ4_getPositionOnHash(h, tableBase, tableType); |
883 | 0 | } |
884 | | |
885 | | LZ4_FORCE_INLINE void |
886 | | LZ4_prepareTable(LZ4_stream_t_internal* const cctx, |
887 | | const int inputSize, |
888 | 2.51k | const tableType_t tableType) { |
889 | | /* If the table hasn't been used, it's guaranteed to be zeroed out, and is |
890 | | * therefore safe to use no matter what mode we're in. Otherwise, we figure |
891 | | * out if it's safe to leave as is or whether it needs to be reset. |
892 | | */ |
893 | 2.51k | if ((tableType_t)cctx->tableType != clearedTable) { |
894 | 915 | assert(inputSize >= 0); |
895 | 915 | if ((tableType_t)cctx->tableType != tableType |
896 | 915 | || ((tableType == byU16) && cctx->currentOffset + (unsigned)inputSize >= 0xFFFFU) |
897 | 915 | || ((tableType == byU32) && cctx->currentOffset > 1 GB) |
898 | 915 | || tableType == byPtr |
899 | 915 | || inputSize >= 4 KB) |
900 | 915 | { |
901 | 915 | DEBUGLOG(4, "LZ4_prepareTable: Resetting table in %p", (void*)cctx); |
902 | 915 | MEM_INIT(cctx->hashTable, 0, LZ4_HASHTABLESIZE); |
903 | 915 | cctx->currentOffset = 0; |
904 | 915 | cctx->tableType = (U32)clearedTable; |
905 | 915 | } else { |
906 | 0 | DEBUGLOG(4, "LZ4_prepareTable: Re-use hash table (no reset)"); |
907 | 0 | } |
908 | 915 | } |
909 | | |
910 | | /* Adding a gap, so all previous entries are > LZ4_DISTANCE_MAX back, |
911 | | * is faster than compressing without a gap. |
912 | | * However, compressing with currentOffset == 0 is faster still, |
913 | | * so we preserve that case. |
914 | | */ |
915 | 2.51k | if (cctx->currentOffset != 0 && tableType == byU32) { |
916 | 0 | DEBUGLOG(5, "LZ4_prepareTable: adding 64KB to currentOffset"); |
917 | 0 | cctx->currentOffset += 64 KB; |
918 | 0 | } |
919 | | |
920 | | /* Finally, clear history */ |
921 | 2.51k | cctx->dictCtx = NULL; |
922 | 2.51k | cctx->dictionary = NULL; |
923 | 2.51k | cctx->dictSize = 0; |
924 | 2.51k | } |
925 | | |
926 | | /** LZ4_compress_generic_validated() : |
927 | | * inlined, to ensure branches are decided at compilation time. |
928 | | * The following conditions are presumed already validated: |
929 | | * - source != NULL |
930 | | * - inputSize > 0 |
931 | | */ |
932 | | LZ4_FORCE_INLINE int LZ4_compress_generic_validated( |
933 | | LZ4_stream_t_internal* const cctx, |
934 | | const char* const source, |
935 | | char* const dest, |
936 | | const int inputSize, |
937 | | int* inputConsumed, /* only written when outputDirective == fillOutput */ |
938 | | const int maxOutputSize, |
939 | | const limitedOutput_directive outputDirective, |
940 | | const tableType_t tableType, |
941 | | const dict_directive dictDirective, |
942 | | const dictIssue_directive dictIssue, |
943 | | const int acceleration) |
944 | 4.00k | { |
945 | 4.00k | int result; |
946 | 4.00k | const BYTE* ip = (const BYTE*)source; |
947 | | |
948 | 4.00k | U32 const startIndex = cctx->currentOffset; |
949 | 4.00k | const BYTE* base = (const BYTE*)source - startIndex; |
950 | 4.00k | const BYTE* lowLimit; |
951 | | |
952 | 4.00k | const LZ4_stream_t_internal* dictCtx = (const LZ4_stream_t_internal*) cctx->dictCtx; |
953 | 4.00k | const BYTE* const dictionary = |
954 | 4.00k | dictDirective == usingDictCtx ? dictCtx->dictionary : cctx->dictionary; |
955 | 4.00k | const U32 dictSize = |
956 | 4.00k | dictDirective == usingDictCtx ? dictCtx->dictSize : cctx->dictSize; |
957 | 4.00k | const U32 dictDelta = |
958 | 4.00k | (dictDirective == usingDictCtx) ? startIndex - dictCtx->currentOffset : 0; /* make indexes in dictCtx comparable with indexes in current context */ |
959 | | |
960 | 4.00k | int const maybe_extMem = (dictDirective == usingExtDict) || (dictDirective == usingDictCtx); |
961 | 4.00k | U32 const prefixIdxLimit = startIndex - dictSize; /* used when dictDirective == dictSmall */ |
962 | 4.00k | const BYTE* const dictEnd = dictionary ? dictionary + dictSize : dictionary; |
963 | 4.00k | const BYTE* anchor = (const BYTE*) source; |
964 | 4.00k | const BYTE* const iend = ip + inputSize; |
965 | 4.00k | const BYTE* const mflimitPlusOne = iend - MFLIMIT + 1; |
966 | 4.00k | const BYTE* const matchlimit = iend - LASTLITERALS; |
967 | | |
968 | | /* the dictCtx currentOffset is indexed on the start of the dictionary, |
969 | | * while a dictionary in the current context precedes the currentOffset */ |
970 | 4.00k | const BYTE* dictBase = (dictionary == NULL) ? NULL : |
971 | 4.00k | (dictDirective == usingDictCtx) ? |
972 | 0 | dictionary + dictSize - dictCtx->currentOffset : |
973 | 1.99k | dictionary + dictSize - startIndex; |
974 | | |
975 | 4.00k | BYTE* op = (BYTE*) dest; |
976 | 4.00k | BYTE* const olimit = op + maxOutputSize; |
977 | | |
978 | 4.00k | U32 offset = 0; |
979 | 4.00k | U32 forwardH; |
980 | | |
981 | 4.00k | DEBUGLOG(5, "LZ4_compress_generic_validated: srcSize=%i, tableType=%u", inputSize, tableType); |
982 | 4.00k | assert(ip != NULL); |
983 | 4.00k | if (tableType == byU16) assert(inputSize<LZ4_64Klimit); /* Size too large (not within 64K limit) */ |
984 | 4.00k | if (tableType == byPtr) assert(dictDirective==noDict); /* only supported use case with byPtr */ |
985 | | /* If init conditions are not met, we don't have to mark stream |
986 | | * as having dirty context, since no action was taken yet */ |
987 | 4.00k | if (outputDirective == fillOutput && maxOutputSize < 1) { return 0; } /* Impossible to store anything */ |
988 | 4.00k | assert(acceleration >= 1); |
989 | | |
990 | 4.00k | lowLimit = (const BYTE*)source - (dictDirective == withPrefix64k ? dictSize : 0); |
991 | | |
992 | | /* Update context state */ |
993 | 4.00k | if (dictDirective == usingDictCtx) { |
994 | | /* Subsequent linked blocks can't use the dictionary. */ |
995 | | /* Instead, they use the block we just compressed. */ |
996 | 0 | cctx->dictCtx = NULL; |
997 | 0 | cctx->dictSize = (U32)inputSize; |
998 | 4.00k | } else { |
999 | 4.00k | cctx->dictSize += (U32)inputSize; |
1000 | 4.00k | } |
1001 | 4.00k | cctx->currentOffset += (U32)inputSize; |
1002 | 4.00k | cctx->tableType = (U32)tableType; |
1003 | | |
1004 | 4.00k | if (inputSize<LZ4_minLength) goto _last_literals; /* Input too small, no compression (all literals) */ |
1005 | | |
1006 | | /* First Byte */ |
1007 | 3.87k | { U32 const h = LZ4_hashPosition(ip, tableType); |
1008 | 3.87k | if (tableType == byPtr) { |
1009 | 0 | LZ4_putPositionOnHash(ip, h, cctx->hashTable, byPtr); |
1010 | 3.87k | } else { |
1011 | 3.87k | LZ4_putIndexOnHash(startIndex, h, cctx->hashTable, tableType); |
1012 | 3.87k | } } |
1013 | 3.87k | ip++; forwardH = LZ4_hashPosition(ip, tableType); |
1014 | | |
1015 | | /* Main Loop */ |
1016 | 1.39M | for ( ; ; ) { |
1017 | 1.39M | const BYTE* match; |
1018 | 1.39M | BYTE* token; |
1019 | 1.39M | const BYTE* filledIp; |
1020 | | |
1021 | | /* Find a match */ |
1022 | 1.39M | if (tableType == byPtr) { |
1023 | 0 | const BYTE* forwardIp = ip; |
1024 | 0 | int step = 1; |
1025 | 0 | int searchMatchNb = acceleration << LZ4_skipTrigger; |
1026 | 0 | do { |
1027 | 0 | U32 const h = forwardH; |
1028 | 0 | ip = forwardIp; |
1029 | 0 | forwardIp += step; |
1030 | 0 | step = (searchMatchNb++ >> LZ4_skipTrigger); |
1031 | |
|
1032 | 0 | if (unlikely(forwardIp > mflimitPlusOne)) goto _last_literals; |
1033 | 0 | assert(ip < mflimitPlusOne); |
1034 | | |
1035 | 0 | match = LZ4_getPositionOnHash(h, cctx->hashTable, tableType); |
1036 | 0 | forwardH = LZ4_hashPosition(forwardIp, tableType); |
1037 | 0 | LZ4_putPositionOnHash(ip, h, cctx->hashTable, tableType); |
1038 | |
|
1039 | 0 | } while ( (match+LZ4_DISTANCE_MAX < ip) |
1040 | 0 | || (LZ4_read32(match) != LZ4_read32(ip)) ); |
1041 | |
|
1042 | 1.39M | } else { /* byU32, byU16 */ |
1043 | | |
1044 | 1.39M | const BYTE* forwardIp = ip; |
1045 | 1.39M | int step = 1; |
1046 | 1.39M | int searchMatchNb = acceleration << LZ4_skipTrigger; |
1047 | 15.1M | do { |
1048 | 15.1M | U32 const h = forwardH; |
1049 | 15.1M | U32 const current = (U32)(forwardIp - base); |
1050 | 15.1M | U32 matchIndex = LZ4_getIndexOnHash(h, cctx->hashTable, tableType); |
1051 | 15.1M | assert(matchIndex <= current); |
1052 | 15.1M | assert(forwardIp - base < (ptrdiff_t)(2 GB - 1)); |
1053 | 15.1M | ip = forwardIp; |
1054 | 15.1M | forwardIp += step; |
1055 | 15.1M | step = (searchMatchNb++ >> LZ4_skipTrigger); |
1056 | | |
1057 | 15.1M | if (unlikely(forwardIp > mflimitPlusOne)) goto _last_literals; |
1058 | 15.1M | assert(ip < mflimitPlusOne); |
1059 | | |
1060 | 15.1M | if (dictDirective == usingDictCtx) { |
1061 | 0 | if (matchIndex < startIndex) { |
1062 | | /* there was no match, try the dictionary */ |
1063 | 0 | assert(tableType == byU32); |
1064 | 0 | matchIndex = LZ4_getIndexOnHash(h, dictCtx->hashTable, byU32); |
1065 | 0 | match = dictBase + matchIndex; |
1066 | 0 | matchIndex += dictDelta; /* make dictCtx index comparable with current context */ |
1067 | 0 | lowLimit = dictionary; |
1068 | 0 | } else { |
1069 | 0 | match = base + matchIndex; |
1070 | 0 | lowLimit = (const BYTE*)source; |
1071 | 0 | } |
1072 | 15.1M | } else if (dictDirective == usingExtDict) { |
1073 | 0 | if (matchIndex < startIndex) { |
1074 | 0 | DEBUGLOG(7, "extDict candidate: matchIndex=%5u < startIndex=%5u", matchIndex, startIndex); |
1075 | 0 | assert(startIndex - matchIndex >= MINMATCH); |
1076 | 0 | assert(dictBase); |
1077 | 0 | match = dictBase + matchIndex; |
1078 | 0 | lowLimit = dictionary; |
1079 | 0 | } else { |
1080 | 0 | match = base + matchIndex; |
1081 | 0 | lowLimit = (const BYTE*)source; |
1082 | 0 | } |
1083 | 15.1M | } else { /* single continuous memory segment */ |
1084 | 15.1M | match = base + matchIndex; |
1085 | 15.1M | } |
1086 | 15.1M | forwardH = LZ4_hashPosition(forwardIp, tableType); |
1087 | 15.1M | LZ4_putIndexOnHash(current, h, cctx->hashTable, tableType); |
1088 | | |
1089 | 15.1M | DEBUGLOG(7, "candidate at pos=%u (offset=%u \n", matchIndex, current - matchIndex); |
1090 | 15.1M | if ((dictIssue == dictSmall) && (matchIndex < prefixIdxLimit)) { continue; } /* match outside of valid area */ |
1091 | 15.1M | assert(matchIndex < current); |
1092 | 15.1M | if ( ((tableType != byU16) || (LZ4_DISTANCE_MAX < LZ4_DISTANCE_ABSOLUTE_MAX)) |
1093 | 15.1M | && (matchIndex+LZ4_DISTANCE_MAX < current)) { |
1094 | 1.08M | continue; |
1095 | 1.08M | } /* too far */ |
1096 | 14.0M | assert((current - matchIndex) <= LZ4_DISTANCE_MAX); /* match now expected within distance */ |
1097 | | |
1098 | 14.0M | if (LZ4_read32(match) == LZ4_read32(ip)) { |
1099 | 1.39M | if (maybe_extMem) offset = current - matchIndex; |
1100 | 1.39M | break; /* match found */ |
1101 | 1.39M | } |
1102 | | |
1103 | 14.0M | } while(1); |
1104 | 1.39M | } |
1105 | | |
1106 | | /* Catch up */ |
1107 | 1.39M | filledIp = ip; |
1108 | 1.39M | assert(ip > anchor); /* this is always true as ip has been advanced before entering the main loop */ |
1109 | 1.39M | if ((match > lowLimit) && unlikely(ip[-1] == match[-1])) { |
1110 | 1.12M | do { ip--; match--; } while (((ip > anchor) & (match > lowLimit)) && (unlikely(ip[-1] == match[-1]))); |
1111 | 371k | } |
1112 | | |
1113 | | /* Encode Literals */ |
1114 | 1.39M | { unsigned const litLength = (unsigned)(ip - anchor); |
1115 | 1.39M | token = op++; |
1116 | 1.39M | if ((outputDirective == limitedOutput) && /* Check output buffer overflow */ |
1117 | 1.39M | (unlikely(op + litLength + (2 + 1 + LASTLITERALS) + (litLength/255) > olimit)) ) { |
1118 | 44 | return 0; /* cannot compress within `dst` budget. Stored indexes in hash table are nonetheless fine */ |
1119 | 44 | } |
1120 | 1.39M | if ((outputDirective == fillOutput) && |
1121 | 1.39M | (unlikely(op + (litLength+240)/255 /* litlen */ + litLength /* literals */ + 2 /* offset */ + 1 /* token */ + MFLIMIT - MINMATCH /* min last literals so last match is <= end - MFLIMIT */ > olimit))) { |
1122 | 0 | op--; |
1123 | 0 | goto _last_literals; |
1124 | 0 | } |
1125 | 1.39M | if (litLength >= RUN_MASK) { |
1126 | 217k | unsigned len = litLength - RUN_MASK; |
1127 | 217k | *token = (RUN_MASK<<ML_BITS); |
1128 | 382k | for(; len >= 255 ; len-=255) *op++ = 255; |
1129 | 217k | *op++ = (BYTE)len; |
1130 | 217k | } |
1131 | 1.17M | else *token = (BYTE)(litLength<<ML_BITS); |
1132 | | |
1133 | | /* Copy Literals */ |
1134 | 1.39M | LZ4_wildCopy8(op, anchor, op+litLength); |
1135 | 1.39M | op+=litLength; |
1136 | 1.39M | DEBUGLOG(6, "seq.start:%i, literals=%u, match.start:%i", |
1137 | 1.39M | (int)(anchor-(const BYTE*)source), litLength, (int)(ip-(const BYTE*)source)); |
1138 | 1.39M | } |
1139 | | |
1140 | 2.97M | _next_match: |
1141 | | /* at this stage, the following variables must be correctly set : |
1142 | | * - ip : at start of LZ operation |
1143 | | * - match : at start of previous pattern occurrence; can be within current prefix, or within extDict |
1144 | | * - offset : if maybe_ext_memSegment==1 (constant) |
1145 | | * - lowLimit : must be == dictionary to mean "match is within extDict"; must be == source otherwise |
1146 | | * - token and *token : position to write 4-bits for match length; higher 4-bits for literal length supposed already written |
1147 | | */ |
1148 | | |
1149 | 2.97M | if ((outputDirective == fillOutput) && |
1150 | 2.97M | (op + 2 /* offset */ + 1 /* token */ + MFLIMIT - MINMATCH /* min last literals so last match is <= end - MFLIMIT */ > olimit)) { |
1151 | | /* the match was too close to the end, rewind and go to last literals */ |
1152 | 0 | op = token; |
1153 | 0 | goto _last_literals; |
1154 | 0 | } |
1155 | | |
1156 | | /* Encode Offset */ |
1157 | 2.97M | if (maybe_extMem) { /* static test */ |
1158 | 0 | DEBUGLOG(6, " with offset=%u (ext if > %i)", offset, (int)(ip - (const BYTE*)source)); |
1159 | 0 | assert(offset <= LZ4_DISTANCE_MAX && offset > 0); |
1160 | 0 | LZ4_writeLE16(op, (U16)offset); op+=2; |
1161 | 2.97M | } else { |
1162 | 2.97M | DEBUGLOG(6, " with offset=%u (same segment)", (U32)(ip - match)); |
1163 | 2.97M | assert(ip-match <= LZ4_DISTANCE_MAX); |
1164 | 2.97M | LZ4_writeLE16(op, (U16)(ip - match)); op+=2; |
1165 | 2.97M | } |
1166 | | |
1167 | | /* Encode MatchLength */ |
1168 | 2.97M | { unsigned matchCode; |
1169 | | |
1170 | 2.97M | if ( (dictDirective==usingExtDict || dictDirective==usingDictCtx) |
1171 | 2.97M | && (lowLimit==dictionary) /* match within extDict */ ) { |
1172 | 0 | const BYTE* limit = ip + (dictEnd-match); |
1173 | 0 | assert(dictEnd > match); |
1174 | 0 | if (limit > matchlimit) limit = matchlimit; |
1175 | 0 | matchCode = LZ4_count(ip+MINMATCH, match+MINMATCH, limit); |
1176 | 0 | ip += (size_t)matchCode + MINMATCH; |
1177 | 0 | if (ip==limit) { |
1178 | 0 | unsigned const more = LZ4_count(limit, (const BYTE*)source, matchlimit); |
1179 | 0 | matchCode += more; |
1180 | 0 | ip += more; |
1181 | 0 | } |
1182 | 0 | DEBUGLOG(6, " with matchLength=%u starting in extDict", matchCode+MINMATCH); |
1183 | 2.97M | } else { |
1184 | 2.97M | matchCode = LZ4_count(ip+MINMATCH, match+MINMATCH, matchlimit); |
1185 | 2.97M | ip += (size_t)matchCode + MINMATCH; |
1186 | 2.97M | DEBUGLOG(6, " with matchLength=%u", matchCode+MINMATCH); |
1187 | 2.97M | } |
1188 | | |
1189 | 2.97M | if ((outputDirective) && /* Check output buffer overflow */ |
1190 | 2.97M | (unlikely(op + (1 + LASTLITERALS) + (matchCode+240)/255 > olimit)) ) { |
1191 | 14 | if (outputDirective == fillOutput) { |
1192 | | /* Match description too long : reduce it */ |
1193 | 0 | U32 newMatchCode = 15 /* in token */ - 1 /* to avoid needing a zero byte */ + ((U32)(olimit - op) - 1 - LASTLITERALS) * 255; |
1194 | 0 | ip -= matchCode - newMatchCode; |
1195 | 0 | assert(newMatchCode < matchCode); |
1196 | 0 | matchCode = newMatchCode; |
1197 | 0 | if (unlikely(ip <= filledIp)) { |
1198 | | /* We have already filled up to filledIp so if ip ends up less than filledIp |
1199 | | * we have positions in the hash table beyond the current position. This is |
1200 | | * a problem if we reuse the hash table. So we have to remove these positions |
1201 | | * from the hash table. |
1202 | | */ |
1203 | 0 | const BYTE* ptr; |
1204 | 0 | DEBUGLOG(5, "Clearing %u positions", (U32)(filledIp - ip)); |
1205 | 0 | for (ptr = ip; ptr <= filledIp; ++ptr) { |
1206 | 0 | U32 const h = LZ4_hashPosition(ptr, tableType); |
1207 | 0 | LZ4_clearHash(h, cctx->hashTable, tableType); |
1208 | 0 | } |
1209 | 0 | } |
1210 | 14 | } else { |
1211 | 14 | assert(outputDirective == limitedOutput); |
1212 | 14 | return 0; /* cannot compress within `dst` budget. Stored indexes in hash table are nonetheless fine */ |
1213 | 14 | } |
1214 | 14 | } |
1215 | 2.97M | if (matchCode >= ML_MASK) { |
1216 | 808k | *token += ML_MASK; |
1217 | 808k | matchCode -= ML_MASK; |
1218 | 808k | LZ4_write32(op, 0xFFFFFFFF); |
1219 | 894k | while (matchCode >= 4*255) { |
1220 | 85.9k | op+=4; |
1221 | 85.9k | LZ4_write32(op, 0xFFFFFFFF); |
1222 | 85.9k | matchCode -= 4*255; |
1223 | 85.9k | } |
1224 | 808k | op += matchCode / 255; |
1225 | 808k | *op++ = (BYTE)(matchCode % 255); |
1226 | 808k | } else |
1227 | 2.16M | *token += (BYTE)(matchCode); |
1228 | 2.97M | } |
1229 | | /* Ensure we have enough space for the last literals. */ |
1230 | 0 | assert(!(outputDirective == fillOutput && op + 1 + LASTLITERALS > olimit)); |
1231 | | |
1232 | 2.97M | anchor = ip; |
1233 | | |
1234 | | /* Test end of chunk */ |
1235 | 2.97M | if (ip >= mflimitPlusOne) break; |
1236 | | |
1237 | | /* Fill table */ |
1238 | 2.97M | { U32 const h = LZ4_hashPosition(ip-2, tableType); |
1239 | 2.97M | if (tableType == byPtr) { |
1240 | 0 | LZ4_putPositionOnHash(ip-2, h, cctx->hashTable, byPtr); |
1241 | 2.97M | } else { |
1242 | 2.97M | U32 const idx = (U32)((ip-2) - base); |
1243 | 2.97M | LZ4_putIndexOnHash(idx, h, cctx->hashTable, tableType); |
1244 | 2.97M | } } |
1245 | | |
1246 | | /* Test next position */ |
1247 | 2.97M | if (tableType == byPtr) { |
1248 | |
|
1249 | 0 | match = LZ4_getPosition(ip, cctx->hashTable, tableType); |
1250 | 0 | LZ4_putPosition(ip, cctx->hashTable, tableType); |
1251 | 0 | if ( (match+LZ4_DISTANCE_MAX >= ip) |
1252 | 0 | && (LZ4_read32(match) == LZ4_read32(ip)) ) |
1253 | 0 | { token=op++; *token=0; goto _next_match; } |
1254 | |
|
1255 | 2.97M | } else { /* byU32, byU16 */ |
1256 | | |
1257 | 2.97M | U32 const h = LZ4_hashPosition(ip, tableType); |
1258 | 2.97M | U32 const current = (U32)(ip-base); |
1259 | 2.97M | U32 matchIndex = LZ4_getIndexOnHash(h, cctx->hashTable, tableType); |
1260 | 2.97M | assert(matchIndex < current); |
1261 | 2.97M | if (dictDirective == usingDictCtx) { |
1262 | 0 | if (matchIndex < startIndex) { |
1263 | | /* there was no match, try the dictionary */ |
1264 | 0 | assert(tableType == byU32); |
1265 | 0 | matchIndex = LZ4_getIndexOnHash(h, dictCtx->hashTable, byU32); |
1266 | 0 | match = dictBase + matchIndex; |
1267 | 0 | lowLimit = dictionary; /* required for match length counter */ |
1268 | 0 | matchIndex += dictDelta; |
1269 | 0 | } else { |
1270 | 0 | match = base + matchIndex; |
1271 | 0 | lowLimit = (const BYTE*)source; /* required for match length counter */ |
1272 | 0 | } |
1273 | 2.97M | } else if (dictDirective==usingExtDict) { |
1274 | 0 | if (matchIndex < startIndex) { |
1275 | 0 | assert(dictBase); |
1276 | 0 | match = dictBase + matchIndex; |
1277 | 0 | lowLimit = dictionary; /* required for match length counter */ |
1278 | 0 | } else { |
1279 | 0 | match = base + matchIndex; |
1280 | 0 | lowLimit = (const BYTE*)source; /* required for match length counter */ |
1281 | 0 | } |
1282 | 2.97M | } else { /* single memory segment */ |
1283 | 2.97M | match = base + matchIndex; |
1284 | 2.97M | } |
1285 | 2.97M | LZ4_putIndexOnHash(current, h, cctx->hashTable, tableType); |
1286 | 2.97M | assert(matchIndex < current); |
1287 | 2.97M | if ( ((dictIssue==dictSmall) ? (matchIndex >= prefixIdxLimit) : 1) |
1288 | 2.97M | && (((tableType==byU16) && (LZ4_DISTANCE_MAX == LZ4_DISTANCE_ABSOLUTE_MAX)) ? 1 : (matchIndex+LZ4_DISTANCE_MAX >= current)) |
1289 | 2.97M | && (LZ4_read32(match) == LZ4_read32(ip)) ) { |
1290 | 1.57M | token=op++; |
1291 | 1.57M | *token=0; |
1292 | 1.57M | if (maybe_extMem) offset = current - matchIndex; |
1293 | 1.57M | DEBUGLOG(6, "seq.start:%i, literals=%u, match.start:%i", |
1294 | 1.57M | (int)(anchor-(const BYTE*)source), 0, (int)(ip-(const BYTE*)source)); |
1295 | 1.57M | goto _next_match; |
1296 | 1.57M | } |
1297 | 2.97M | } |
1298 | | |
1299 | | /* Prepare next loop */ |
1300 | 1.39M | forwardH = LZ4_hashPosition(++ip, tableType); |
1301 | | |
1302 | 1.39M | } |
1303 | | |
1304 | 3.94k | _last_literals: |
1305 | | /* Encode Last Literals */ |
1306 | 3.94k | { size_t lastRun = (size_t)(iend - anchor); |
1307 | 3.94k | if ( (outputDirective) && /* Check output buffer overflow */ |
1308 | 3.94k | (op + lastRun + 1 + ((lastRun+255-RUN_MASK)/255) > olimit)) { |
1309 | 524 | if (outputDirective == fillOutput) { |
1310 | | /* adapt lastRun to fill 'dst' */ |
1311 | 0 | assert(olimit >= op); |
1312 | 0 | lastRun = (size_t)(olimit-op) - 1/*token*/; |
1313 | 0 | lastRun -= (lastRun + 256 - RUN_MASK) / 256; /*additional length tokens*/ |
1314 | 524 | } else { |
1315 | 524 | assert(outputDirective == limitedOutput); |
1316 | 524 | return 0; /* cannot compress within `dst` budget. Stored indexes in hash table are nonetheless fine */ |
1317 | 524 | } |
1318 | 524 | } |
1319 | 3.42k | DEBUGLOG(6, "Final literal run : %i literals", (int)lastRun); |
1320 | 3.42k | if (lastRun >= RUN_MASK) { |
1321 | 722 | size_t accumulator = lastRun - RUN_MASK; |
1322 | 722 | *op++ = RUN_MASK << ML_BITS; |
1323 | 25.9k | for(; accumulator >= 255 ; accumulator-=255) *op++ = 255; |
1324 | 722 | *op++ = (BYTE) accumulator; |
1325 | 2.70k | } else { |
1326 | 2.70k | *op++ = (BYTE)(lastRun<<ML_BITS); |
1327 | 2.70k | } |
1328 | 3.42k | LZ4_memcpy(op, anchor, lastRun); |
1329 | 3.42k | ip = anchor + lastRun; |
1330 | 3.42k | op += lastRun; |
1331 | 3.42k | } |
1332 | | |
1333 | 3.42k | if (outputDirective == fillOutput) { |
1334 | 0 | *inputConsumed = (int) (((const char*)ip)-source); |
1335 | 0 | } |
1336 | 3.42k | result = (int)(((char*)op) - dest); |
1337 | 3.42k | assert(result > 0); |
1338 | 3.42k | DEBUGLOG(5, "LZ4_compress_generic: compressed %i bytes into %i bytes", inputSize, result); |
1339 | 3.42k | return result; |
1340 | 3.42k | } |
1341 | | |
1342 | | /** LZ4_compress_generic() : |
1343 | | * inlined, to ensure branches are decided at compilation time; |
1344 | | * takes care of src == (NULL, 0) |
1345 | | * and forward the rest to LZ4_compress_generic_validated */ |
1346 | | LZ4_FORCE_INLINE int LZ4_compress_generic( |
1347 | | LZ4_stream_t_internal* const cctx, |
1348 | | const char* const src, |
1349 | | char* const dst, |
1350 | | const int srcSize, |
1351 | | int *inputConsumed, /* only written when outputDirective == fillOutput */ |
1352 | | const int dstCapacity, |
1353 | | const limitedOutput_directive outputDirective, |
1354 | | const tableType_t tableType, |
1355 | | const dict_directive dictDirective, |
1356 | | const dictIssue_directive dictIssue, |
1357 | | const int acceleration) |
1358 | 4.00k | { |
1359 | 4.00k | DEBUGLOG(5, "LZ4_compress_generic: srcSize=%i, dstCapacity=%i", |
1360 | 4.00k | srcSize, dstCapacity); |
1361 | | |
1362 | 4.00k | if ((U32)srcSize > (U32)LZ4_MAX_INPUT_SIZE) { return 0; } /* Unsupported srcSize, too large (or negative) */ |
1363 | 4.00k | if (srcSize == 0) { /* src == NULL supported if srcSize == 0 */ |
1364 | 0 | if (outputDirective != notLimited && dstCapacity <= 0) return 0; /* no output, can't write anything */ |
1365 | 0 | DEBUGLOG(5, "Generating an empty block"); |
1366 | 0 | assert(outputDirective == notLimited || dstCapacity >= 1); |
1367 | 0 | assert(dst != NULL); |
1368 | 0 | dst[0] = 0; |
1369 | 0 | if (outputDirective == fillOutput) { |
1370 | 0 | assert (inputConsumed != NULL); |
1371 | 0 | *inputConsumed = 0; |
1372 | 0 | } |
1373 | 0 | return 1; |
1374 | 0 | } |
1375 | 4.00k | assert(src != NULL); |
1376 | | |
1377 | 4.00k | return LZ4_compress_generic_validated(cctx, src, dst, srcSize, |
1378 | 4.00k | inputConsumed, /* only written into if outputDirective == fillOutput */ |
1379 | 4.00k | dstCapacity, outputDirective, |
1380 | 4.00k | tableType, dictDirective, dictIssue, acceleration); |
1381 | 4.00k | } |
1382 | | |
1383 | | |
1384 | | int LZ4_compress_fast_extState(void* state, const char* source, char* dest, int inputSize, int maxOutputSize, int acceleration) |
1385 | 0 | { |
1386 | 0 | LZ4_stream_t_internal* const ctx = & LZ4_initStream(state, sizeof(LZ4_stream_t)) -> internal_donotuse; |
1387 | 0 | assert(ctx != NULL); |
1388 | 0 | if (acceleration < 1) acceleration = LZ4_ACCELERATION_DEFAULT; |
1389 | 0 | if (acceleration > LZ4_ACCELERATION_MAX) acceleration = LZ4_ACCELERATION_MAX; |
1390 | 0 | if (maxOutputSize >= LZ4_compressBound(inputSize)) { |
1391 | 0 | if (inputSize < LZ4_64Klimit) { |
1392 | 0 | return LZ4_compress_generic(ctx, source, dest, inputSize, NULL, 0, notLimited, byU16, noDict, noDictIssue, acceleration); |
1393 | 0 | } else { |
1394 | 0 | const tableType_t tableType = ((sizeof(void*)==4) && ((uptrval)source > LZ4_DISTANCE_MAX)) ? byPtr : byU32; |
1395 | 0 | return LZ4_compress_generic(ctx, source, dest, inputSize, NULL, 0, notLimited, tableType, noDict, noDictIssue, acceleration); |
1396 | 0 | } |
1397 | 0 | } else { |
1398 | 0 | if (inputSize < LZ4_64Klimit) { |
1399 | 0 | return LZ4_compress_generic(ctx, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, byU16, noDict, noDictIssue, acceleration); |
1400 | 0 | } else { |
1401 | 0 | const tableType_t tableType = ((sizeof(void*)==4) && ((uptrval)source > LZ4_DISTANCE_MAX)) ? byPtr : byU32; |
1402 | 0 | return LZ4_compress_generic(ctx, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, noDict, noDictIssue, acceleration); |
1403 | 0 | } |
1404 | 0 | } |
1405 | 0 | } |
1406 | | |
1407 | | /** |
1408 | | * LZ4_compress_fast_extState_fastReset() : |
1409 | | * A variant of LZ4_compress_fast_extState(). |
1410 | | * |
1411 | | * Using this variant avoids an expensive initialization step. It is only safe |
1412 | | * to call if the state buffer is known to be correctly initialized already |
1413 | | * (see comment in lz4.h on LZ4_resetStream_fast() for a definition of |
1414 | | * "correctly initialized"). |
1415 | | */ |
1416 | | int LZ4_compress_fast_extState_fastReset(void* state, const char* src, char* dst, int srcSize, int dstCapacity, int acceleration) |
1417 | 2.00k | { |
1418 | 2.00k | LZ4_stream_t_internal* const ctx = &((LZ4_stream_t*)state)->internal_donotuse; |
1419 | 2.00k | if (acceleration < 1) acceleration = LZ4_ACCELERATION_DEFAULT; |
1420 | 2.00k | if (acceleration > LZ4_ACCELERATION_MAX) acceleration = LZ4_ACCELERATION_MAX; |
1421 | 2.00k | assert(ctx != NULL); |
1422 | | |
1423 | 2.00k | if (dstCapacity >= LZ4_compressBound(srcSize)) { |
1424 | 0 | if (srcSize < LZ4_64Klimit) { |
1425 | 0 | const tableType_t tableType = byU16; |
1426 | 0 | LZ4_prepareTable(ctx, srcSize, tableType); |
1427 | 0 | if (ctx->currentOffset) { |
1428 | 0 | return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, dictSmall, acceleration); |
1429 | 0 | } else { |
1430 | 0 | return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, noDictIssue, acceleration); |
1431 | 0 | } |
1432 | 0 | } else { |
1433 | 0 | const tableType_t tableType = ((sizeof(void*)==4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32; |
1434 | 0 | LZ4_prepareTable(ctx, srcSize, tableType); |
1435 | 0 | return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, 0, notLimited, tableType, noDict, noDictIssue, acceleration); |
1436 | 0 | } |
1437 | 2.00k | } else { |
1438 | 2.00k | if (srcSize < LZ4_64Klimit) { |
1439 | 1.71k | const tableType_t tableType = byU16; |
1440 | 1.71k | LZ4_prepareTable(ctx, srcSize, tableType); |
1441 | 1.71k | if (ctx->currentOffset) { |
1442 | 0 | return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, dictSmall, acceleration); |
1443 | 1.71k | } else { |
1444 | 1.71k | return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, noDictIssue, acceleration); |
1445 | 1.71k | } |
1446 | 1.71k | } else { |
1447 | 297 | const tableType_t tableType = ((sizeof(void*)==4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32; |
1448 | 297 | LZ4_prepareTable(ctx, srcSize, tableType); |
1449 | 297 | return LZ4_compress_generic(ctx, src, dst, srcSize, NULL, dstCapacity, limitedOutput, tableType, noDict, noDictIssue, acceleration); |
1450 | 297 | } |
1451 | 2.00k | } |
1452 | 2.00k | } |
1453 | | |
1454 | | |
1455 | | int LZ4_compress_fast(const char* src, char* dest, int srcSize, int dstCapacity, int acceleration) |
1456 | 0 | { |
1457 | 0 | int result; |
1458 | | #if (LZ4_HEAPMODE) |
1459 | | LZ4_stream_t* const ctxPtr = (LZ4_stream_t*)ALLOC(sizeof(LZ4_stream_t)); /* malloc-calloc always properly aligned */ |
1460 | | if (ctxPtr == NULL) return 0; |
1461 | | #else |
1462 | 0 | LZ4_stream_t ctx; |
1463 | 0 | LZ4_stream_t* const ctxPtr = &ctx; |
1464 | 0 | #endif |
1465 | 0 | result = LZ4_compress_fast_extState(ctxPtr, src, dest, srcSize, dstCapacity, acceleration); |
1466 | |
|
1467 | | #if (LZ4_HEAPMODE) |
1468 | | FREEMEM(ctxPtr); |
1469 | | #endif |
1470 | 0 | return result; |
1471 | 0 | } |
1472 | | |
1473 | | |
1474 | | int LZ4_compress_default(const char* src, char* dst, int srcSize, int dstCapacity) |
1475 | 0 | { |
1476 | 0 | return LZ4_compress_fast(src, dst, srcSize, dstCapacity, 1); |
1477 | 0 | } |
1478 | | |
1479 | | |
1480 | | /* Note!: This function leaves the stream in an unclean/broken state! |
1481 | | * It is not safe to subsequently use the same state with a _fastReset() or |
1482 | | * _continue() call without resetting it. */ |
1483 | | static int LZ4_compress_destSize_extState_internal(LZ4_stream_t* state, const char* src, char* dst, int* srcSizePtr, int targetDstSize, int acceleration) |
1484 | 0 | { |
1485 | 0 | void* const s = LZ4_initStream(state, sizeof (*state)); |
1486 | 0 | assert(s != NULL); (void)s; |
1487 | |
|
1488 | 0 | if (targetDstSize >= LZ4_compressBound(*srcSizePtr)) { /* compression success is guaranteed */ |
1489 | 0 | return LZ4_compress_fast_extState(state, src, dst, *srcSizePtr, targetDstSize, acceleration); |
1490 | 0 | } else { |
1491 | 0 | if (*srcSizePtr < LZ4_64Klimit) { |
1492 | 0 | return LZ4_compress_generic(&state->internal_donotuse, src, dst, *srcSizePtr, srcSizePtr, targetDstSize, fillOutput, byU16, noDict, noDictIssue, acceleration); |
1493 | 0 | } else { |
1494 | 0 | tableType_t const addrMode = ((sizeof(void*)==4) && ((uptrval)src > LZ4_DISTANCE_MAX)) ? byPtr : byU32; |
1495 | 0 | return LZ4_compress_generic(&state->internal_donotuse, src, dst, *srcSizePtr, srcSizePtr, targetDstSize, fillOutput, addrMode, noDict, noDictIssue, acceleration); |
1496 | 0 | } } |
1497 | 0 | } |
1498 | | |
1499 | | int LZ4_compress_destSize_extState(void* state, const char* src, char* dst, int* srcSizePtr, int targetDstSize, int acceleration) |
1500 | 0 | { |
1501 | 0 | int const r = LZ4_compress_destSize_extState_internal((LZ4_stream_t*)state, src, dst, srcSizePtr, targetDstSize, acceleration); |
1502 | | /* clean the state on exit */ |
1503 | 0 | LZ4_initStream(state, sizeof (LZ4_stream_t)); |
1504 | 0 | return r; |
1505 | 0 | } |
1506 | | |
1507 | | |
1508 | | int LZ4_compress_destSize(const char* src, char* dst, int* srcSizePtr, int targetDstSize) |
1509 | 0 | { |
1510 | | #if (LZ4_HEAPMODE) |
1511 | | LZ4_stream_t* const ctx = (LZ4_stream_t*)ALLOC(sizeof(LZ4_stream_t)); /* malloc-calloc always properly aligned */ |
1512 | | if (ctx == NULL) return 0; |
1513 | | #else |
1514 | 0 | LZ4_stream_t ctxBody; |
1515 | 0 | LZ4_stream_t* const ctx = &ctxBody; |
1516 | 0 | #endif |
1517 | |
|
1518 | 0 | int result = LZ4_compress_destSize_extState_internal(ctx, src, dst, srcSizePtr, targetDstSize, 1); |
1519 | |
|
1520 | | #if (LZ4_HEAPMODE) |
1521 | | FREEMEM(ctx); |
1522 | | #endif |
1523 | 0 | return result; |
1524 | 0 | } |
1525 | | |
1526 | | |
1527 | | |
1528 | | /*-****************************** |
1529 | | * Streaming functions |
1530 | | ********************************/ |
1531 | | |
1532 | | #if !defined(LZ4_STATIC_LINKING_ONLY_DISABLE_MEMORY_ALLOCATION) |
1533 | | LZ4_stream_t* LZ4_createStream(void) |
1534 | 0 | { |
1535 | 0 | LZ4_stream_t* const lz4s = (LZ4_stream_t*)ALLOC(sizeof(LZ4_stream_t)); |
1536 | 0 | LZ4_STATIC_ASSERT(sizeof(LZ4_stream_t) >= sizeof(LZ4_stream_t_internal)); |
1537 | 0 | DEBUGLOG(4, "LZ4_createStream %p", (void*)lz4s); |
1538 | 0 | if (lz4s == NULL) return NULL; |
1539 | 0 | LZ4_initStream(lz4s, sizeof(*lz4s)); |
1540 | 0 | return lz4s; |
1541 | 0 | } |
1542 | | #endif |
1543 | | |
1544 | | static size_t LZ4_stream_t_alignment(void) |
1545 | 1.61k | { |
1546 | 1.61k | #if LZ4_ALIGN_TEST |
1547 | 1.61k | typedef struct { char c; LZ4_stream_t t; } t_a; |
1548 | 1.61k | return sizeof(t_a) - sizeof(LZ4_stream_t); |
1549 | | #else |
1550 | | return 1; /* effectively disabled */ |
1551 | | #endif |
1552 | 1.61k | } |
1553 | | |
1554 | | LZ4_stream_t* LZ4_initStream (void* buffer, size_t size) |
1555 | 1.61k | { |
1556 | 1.61k | DEBUGLOG(5, "LZ4_initStream"); |
1557 | 1.61k | if (buffer == NULL) { return NULL; } |
1558 | 1.61k | if (size < sizeof(LZ4_stream_t)) { return NULL; } |
1559 | 1.61k | if (!LZ4_isAligned(buffer, LZ4_stream_t_alignment())) return NULL; |
1560 | 1.61k | MEM_INIT(buffer, 0, sizeof(LZ4_stream_t_internal)); |
1561 | 1.61k | return (LZ4_stream_t*)buffer; |
1562 | 1.61k | } |
1563 | | |
1564 | | /* resetStream is now deprecated, |
1565 | | * prefer initStream() which is more general */ |
1566 | | void LZ4_resetStream (LZ4_stream_t* LZ4_stream) |
1567 | 0 | { |
1568 | 0 | DEBUGLOG(5, "LZ4_resetStream (ctx:%p)", (void*)LZ4_stream); |
1569 | 0 | MEM_INIT(LZ4_stream, 0, sizeof(LZ4_stream_t_internal)); |
1570 | 0 | } |
1571 | | |
1572 | 503 | void LZ4_resetStream_fast(LZ4_stream_t* ctx) { |
1573 | 503 | LZ4_prepareTable(&(ctx->internal_donotuse), 0, byU32); |
1574 | 503 | } |
1575 | | |
1576 | | #if !defined(LZ4_STATIC_LINKING_ONLY_DISABLE_MEMORY_ALLOCATION) |
1577 | | int LZ4_freeStream (LZ4_stream_t* LZ4_stream) |
1578 | 0 | { |
1579 | 0 | if (!LZ4_stream) return 0; /* support free on NULL */ |
1580 | 0 | DEBUGLOG(5, "LZ4_freeStream %p", (void*)LZ4_stream); |
1581 | 0 | FREEMEM(LZ4_stream); |
1582 | 0 | return (0); |
1583 | 0 | } |
1584 | | #endif |
1585 | | |
1586 | | |
1587 | | typedef enum { _ld_fast, _ld_slow } LoadDict_mode_e; |
1588 | 0 | #define HASH_UNIT sizeof(reg_t) |
1589 | | int LZ4_loadDict_internal(LZ4_stream_t* LZ4_dict, |
1590 | | const char* dictionary, int dictSize, |
1591 | | LoadDict_mode_e _ld) |
1592 | 0 | { |
1593 | 0 | LZ4_stream_t_internal* const dict = &LZ4_dict->internal_donotuse; |
1594 | 0 | const tableType_t tableType = byU32; |
1595 | 0 | const BYTE* p = (const BYTE*)dictionary; |
1596 | 0 | const BYTE* const dictEnd = p + dictSize; |
1597 | 0 | U32 idx32; |
1598 | |
|
1599 | 0 | DEBUGLOG(4, "LZ4_loadDict (%i bytes from %p into %p)", dictSize, (void*)dictionary, (void*)LZ4_dict); |
1600 | | |
1601 | | /* It's necessary to reset the context, |
1602 | | * and not just continue it with prepareTable() |
1603 | | * to avoid any risk of generating overflowing matchIndex |
1604 | | * when compressing using this dictionary */ |
1605 | 0 | LZ4_resetStream(LZ4_dict); |
1606 | | |
1607 | | /* We always increment the offset by 64 KB, since, if the dict is longer, |
1608 | | * we truncate it to the last 64k, and if it's shorter, we still want to |
1609 | | * advance by a whole window length so we can provide the guarantee that |
1610 | | * there are only valid offsets in the window, which allows an optimization |
1611 | | * in LZ4_compress_fast_continue() where it uses noDictIssue even when the |
1612 | | * dictionary isn't a full 64k. */ |
1613 | 0 | dict->currentOffset += 64 KB; |
1614 | |
|
1615 | 0 | if (dictSize < (int)HASH_UNIT) { |
1616 | 0 | return 0; |
1617 | 0 | } |
1618 | | |
1619 | 0 | if ((dictEnd - p) > 64 KB) p = dictEnd - 64 KB; |
1620 | 0 | dict->dictionary = p; |
1621 | 0 | dict->dictSize = (U32)(dictEnd - p); |
1622 | 0 | dict->tableType = (U32)tableType; |
1623 | 0 | idx32 = dict->currentOffset - dict->dictSize; |
1624 | |
|
1625 | 0 | while (p <= dictEnd-HASH_UNIT) { |
1626 | 0 | U32 const h = LZ4_hashPosition(p, tableType); |
1627 | | /* Note: overwriting => favors positions end of dictionary */ |
1628 | 0 | LZ4_putIndexOnHash(idx32, h, dict->hashTable, tableType); |
1629 | 0 | p+=3; idx32+=3; |
1630 | 0 | } |
1631 | |
|
1632 | 0 | if (_ld == _ld_slow) { |
1633 | | /* Fill hash table with additional references, to improve compression capability */ |
1634 | 0 | p = dict->dictionary; |
1635 | 0 | idx32 = dict->currentOffset - dict->dictSize; |
1636 | 0 | while (p <= dictEnd-HASH_UNIT) { |
1637 | 0 | U32 const h = LZ4_hashPosition(p, tableType); |
1638 | 0 | U32 const limit = dict->currentOffset - 64 KB; |
1639 | 0 | if (LZ4_getIndexOnHash(h, dict->hashTable, tableType) <= limit) { |
1640 | | /* Note: not overwriting => favors positions beginning of dictionary */ |
1641 | 0 | LZ4_putIndexOnHash(idx32, h, dict->hashTable, tableType); |
1642 | 0 | } |
1643 | 0 | p++; idx32++; |
1644 | 0 | } |
1645 | 0 | } |
1646 | |
|
1647 | 0 | return (int)dict->dictSize; |
1648 | 0 | } |
1649 | | |
1650 | | int LZ4_loadDict(LZ4_stream_t* LZ4_dict, const char* dictionary, int dictSize) |
1651 | 0 | { |
1652 | 0 | return LZ4_loadDict_internal(LZ4_dict, dictionary, dictSize, _ld_fast); |
1653 | 0 | } |
1654 | | |
1655 | | int LZ4_loadDictSlow(LZ4_stream_t* LZ4_dict, const char* dictionary, int dictSize) |
1656 | 0 | { |
1657 | 0 | return LZ4_loadDict_internal(LZ4_dict, dictionary, dictSize, _ld_slow); |
1658 | 0 | } |
1659 | | |
1660 | | void LZ4_attach_dictionary(LZ4_stream_t* workingStream, const LZ4_stream_t* dictionaryStream) |
1661 | 0 | { |
1662 | 0 | const LZ4_stream_t_internal* dictCtx = (dictionaryStream == NULL) ? NULL : |
1663 | 0 | &(dictionaryStream->internal_donotuse); |
1664 | |
|
1665 | 0 | DEBUGLOG(4, "LZ4_attach_dictionary (%p, %p, size %u)", |
1666 | 0 | (void*)workingStream, (void*)dictionaryStream, |
1667 | 0 | dictCtx != NULL ? dictCtx->dictSize : 0); |
1668 | |
|
1669 | 0 | if (dictCtx != NULL) { |
1670 | | /* If the current offset is zero, we will never look in the |
1671 | | * external dictionary context, since there is no value a table |
1672 | | * entry can take that indicate a miss. In that case, we need |
1673 | | * to bump the offset to something non-zero. |
1674 | | */ |
1675 | 0 | if (workingStream->internal_donotuse.currentOffset == 0) { |
1676 | 0 | workingStream->internal_donotuse.currentOffset = 64 KB; |
1677 | 0 | } |
1678 | | |
1679 | | /* Don't actually attach an empty dictionary. |
1680 | | */ |
1681 | 0 | if (dictCtx->dictSize == 0) { |
1682 | 0 | dictCtx = NULL; |
1683 | 0 | } |
1684 | 0 | } |
1685 | 0 | workingStream->internal_donotuse.dictCtx = dictCtx; |
1686 | 0 | } |
1687 | | |
1688 | | |
1689 | | static void LZ4_renormDictT(LZ4_stream_t_internal* LZ4_dict, int nextSize) |
1690 | 1.99k | { |
1691 | 1.99k | assert(nextSize >= 0); |
1692 | 1.99k | if (LZ4_dict->currentOffset + (unsigned)nextSize > 0x80000000) { /* potential ptrdiff_t overflow (32-bits mode) */ |
1693 | | /* rescale hash table */ |
1694 | 0 | U32 const delta = LZ4_dict->currentOffset - 64 KB; |
1695 | 0 | const BYTE* dictEnd = LZ4_dict->dictionary + LZ4_dict->dictSize; |
1696 | 0 | int i; |
1697 | 0 | DEBUGLOG(4, "LZ4_renormDictT"); |
1698 | 0 | for (i=0; i<LZ4_HASH_SIZE_U32; i++) { |
1699 | 0 | if (LZ4_dict->hashTable[i] < delta) LZ4_dict->hashTable[i]=0; |
1700 | 0 | else LZ4_dict->hashTable[i] -= delta; |
1701 | 0 | } |
1702 | 0 | LZ4_dict->currentOffset = 64 KB; |
1703 | 0 | if (LZ4_dict->dictSize > 64 KB) LZ4_dict->dictSize = 64 KB; |
1704 | 0 | LZ4_dict->dictionary = dictEnd - LZ4_dict->dictSize; |
1705 | 0 | } |
1706 | 1.99k | } |
1707 | | |
1708 | | |
1709 | | int LZ4_compress_fast_continue (LZ4_stream_t* LZ4_stream, |
1710 | | const char* source, char* dest, |
1711 | | int inputSize, int maxOutputSize, |
1712 | | int acceleration) |
1713 | 1.99k | { |
1714 | 1.99k | const tableType_t tableType = byU32; |
1715 | 1.99k | LZ4_stream_t_internal* const streamPtr = &LZ4_stream->internal_donotuse; |
1716 | 1.99k | const char* dictEnd = streamPtr->dictSize ? (const char*)streamPtr->dictionary + streamPtr->dictSize : NULL; |
1717 | | |
1718 | 1.99k | DEBUGLOG(5, "LZ4_compress_fast_continue (inputSize=%i, dictSize=%u)", inputSize, streamPtr->dictSize); |
1719 | | |
1720 | 1.99k | LZ4_renormDictT(streamPtr, inputSize); /* fix index overflow */ |
1721 | 1.99k | if (acceleration < 1) acceleration = LZ4_ACCELERATION_DEFAULT; |
1722 | 1.99k | if (acceleration > LZ4_ACCELERATION_MAX) acceleration = LZ4_ACCELERATION_MAX; |
1723 | | |
1724 | | /* invalidate tiny dictionaries */ |
1725 | 1.99k | if ( (streamPtr->dictSize < 4) /* tiny dictionary : not enough for a hash */ |
1726 | 1.99k | && (dictEnd != source) /* prefix mode */ |
1727 | 1.99k | && (inputSize > 0) /* tolerance : don't lose history, in case next invocation would use prefix mode */ |
1728 | 1.99k | && (streamPtr->dictCtx == NULL) /* usingDictCtx */ |
1729 | 1.99k | ) { |
1730 | 503 | DEBUGLOG(5, "LZ4_compress_fast_continue: dictSize(%u) at addr:%p is too small", streamPtr->dictSize, (void*)streamPtr->dictionary); |
1731 | | /* remove dictionary existence from history, to employ faster prefix mode */ |
1732 | 503 | streamPtr->dictSize = 0; |
1733 | 503 | streamPtr->dictionary = (const BYTE*)source; |
1734 | 503 | dictEnd = source; |
1735 | 503 | } |
1736 | | |
1737 | | /* Check overlapping input/dictionary space */ |
1738 | 1.99k | { const char* const sourceEnd = source + inputSize; |
1739 | 1.99k | if ((sourceEnd > (const char*)streamPtr->dictionary) && (sourceEnd < dictEnd)) { |
1740 | 0 | streamPtr->dictSize = (U32)(dictEnd - sourceEnd); |
1741 | 0 | if (streamPtr->dictSize > 64 KB) streamPtr->dictSize = 64 KB; |
1742 | 0 | if (streamPtr->dictSize < 4) streamPtr->dictSize = 0; |
1743 | 0 | streamPtr->dictionary = (const BYTE*)dictEnd - streamPtr->dictSize; |
1744 | 0 | } |
1745 | 1.99k | } |
1746 | | |
1747 | | /* prefix mode : source data follows dictionary */ |
1748 | 1.99k | if (dictEnd == source) { |
1749 | 1.99k | if ((streamPtr->dictSize < 64 KB) && (streamPtr->dictSize < streamPtr->currentOffset)) |
1750 | 0 | return LZ4_compress_generic(streamPtr, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, withPrefix64k, dictSmall, acceleration); |
1751 | 1.99k | else |
1752 | 1.99k | return LZ4_compress_generic(streamPtr, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, withPrefix64k, noDictIssue, acceleration); |
1753 | 1.99k | } |
1754 | | |
1755 | | /* external dictionary mode */ |
1756 | 0 | { int result; |
1757 | 0 | if (streamPtr->dictCtx) { |
1758 | | /* We depend here on the fact that dictCtx'es (produced by |
1759 | | * LZ4_loadDict) guarantee that their tables contain no references |
1760 | | * to offsets between dictCtx->currentOffset - 64 KB and |
1761 | | * dictCtx->currentOffset - dictCtx->dictSize. This makes it safe |
1762 | | * to use noDictIssue even when the dict isn't a full 64 KB. |
1763 | | */ |
1764 | 0 | if (inputSize > 4 KB) { |
1765 | | /* For compressing large blobs, it is faster to pay the setup |
1766 | | * cost to copy the dictionary's tables into the active context, |
1767 | | * so that the compression loop is only looking into one table. |
1768 | | */ |
1769 | 0 | LZ4_memcpy(streamPtr, streamPtr->dictCtx, sizeof(*streamPtr)); |
1770 | 0 | result = LZ4_compress_generic(streamPtr, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, usingExtDict, noDictIssue, acceleration); |
1771 | 0 | } else { |
1772 | 0 | result = LZ4_compress_generic(streamPtr, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, usingDictCtx, noDictIssue, acceleration); |
1773 | 0 | } |
1774 | 0 | } else { /* small data <= 4 KB */ |
1775 | 0 | if ((streamPtr->dictSize < 64 KB) && (streamPtr->dictSize < streamPtr->currentOffset)) { |
1776 | 0 | result = LZ4_compress_generic(streamPtr, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, usingExtDict, dictSmall, acceleration); |
1777 | 0 | } else { |
1778 | 0 | result = LZ4_compress_generic(streamPtr, source, dest, inputSize, NULL, maxOutputSize, limitedOutput, tableType, usingExtDict, noDictIssue, acceleration); |
1779 | 0 | } |
1780 | 0 | } |
1781 | 0 | streamPtr->dictionary = (const BYTE*)source; |
1782 | 0 | streamPtr->dictSize = (U32)inputSize; |
1783 | 0 | return result; |
1784 | 1.99k | } |
1785 | 1.99k | } |
1786 | | |
1787 | | |
1788 | | /* Hidden debug function, to force-test external dictionary mode */ |
1789 | | int LZ4_compress_forceExtDict (LZ4_stream_t* LZ4_dict, const char* source, char* dest, int srcSize) |
1790 | 0 | { |
1791 | 0 | LZ4_stream_t_internal* const streamPtr = &LZ4_dict->internal_donotuse; |
1792 | 0 | int result; |
1793 | |
|
1794 | 0 | LZ4_renormDictT(streamPtr, srcSize); |
1795 | |
|
1796 | 0 | if ((streamPtr->dictSize < 64 KB) && (streamPtr->dictSize < streamPtr->currentOffset)) { |
1797 | 0 | result = LZ4_compress_generic(streamPtr, source, dest, srcSize, NULL, 0, notLimited, byU32, usingExtDict, dictSmall, 1); |
1798 | 0 | } else { |
1799 | 0 | result = LZ4_compress_generic(streamPtr, source, dest, srcSize, NULL, 0, notLimited, byU32, usingExtDict, noDictIssue, 1); |
1800 | 0 | } |
1801 | |
|
1802 | 0 | streamPtr->dictionary = (const BYTE*)source; |
1803 | 0 | streamPtr->dictSize = (U32)srcSize; |
1804 | |
|
1805 | 0 | return result; |
1806 | 0 | } |
1807 | | |
1808 | | |
1809 | | /*! LZ4_saveDict() : |
1810 | | * If previously compressed data block is not guaranteed to remain available at its memory location, |
1811 | | * save it into a safer place (char* safeBuffer). |
1812 | | * Note : no need to call LZ4_loadDict() afterwards, dictionary is immediately usable, |
1813 | | * one can therefore call LZ4_compress_fast_continue() right after. |
1814 | | * @return : saved dictionary size in bytes (necessarily <= dictSize), or 0 if error. |
1815 | | */ |
1816 | | int LZ4_saveDict (LZ4_stream_t* LZ4_dict, char* safeBuffer, int dictSize) |
1817 | 0 | { |
1818 | 0 | LZ4_stream_t_internal* const dict = &LZ4_dict->internal_donotuse; |
1819 | |
|
1820 | 0 | DEBUGLOG(5, "LZ4_saveDict : dictSize=%i, safeBuffer=%p", dictSize, (void*)safeBuffer); |
1821 | |
|
1822 | 0 | if ((U32)dictSize > 64 KB) { dictSize = 64 KB; } /* useless to define a dictionary > 64 KB */ |
1823 | 0 | if ((U32)dictSize > dict->dictSize) { dictSize = (int)dict->dictSize; } |
1824 | |
|
1825 | 0 | if (safeBuffer == NULL) assert(dictSize == 0); |
1826 | 0 | if (dictSize > 0) { |
1827 | 0 | const BYTE* const previousDictEnd = dict->dictionary + dict->dictSize; |
1828 | 0 | assert(dict->dictionary); |
1829 | 0 | LZ4_memmove(safeBuffer, previousDictEnd - dictSize, (size_t)dictSize); |
1830 | 0 | } |
1831 | | |
1832 | 0 | dict->dictionary = (const BYTE*)safeBuffer; |
1833 | 0 | dict->dictSize = (U32)dictSize; |
1834 | |
|
1835 | 0 | return dictSize; |
1836 | 0 | } |
1837 | | |
1838 | | |
1839 | | |
1840 | | /*-******************************* |
1841 | | * Decompression functions |
1842 | | ********************************/ |
1843 | | |
1844 | | typedef enum { decode_full_block = 0, partial_decode = 1 } earlyEnd_directive; |
1845 | | |
1846 | | #undef MIN |
1847 | 0 | #define MIN(a,b) ( (a) < (b) ? (a) : (b) ) |
1848 | | |
1849 | | |
1850 | | /* variant for decompress_unsafe() |
1851 | | * does not know end of input |
1852 | | * presumes input is well formed |
1853 | | * note : will consume at least one byte */ |
1854 | | static size_t read_long_length_no_check(const BYTE** pp) |
1855 | 0 | { |
1856 | 0 | size_t b, l = 0; |
1857 | 0 | do { b = **pp; (*pp)++; l += b; } while (b==255); |
1858 | 0 | DEBUGLOG(6, "read_long_length_no_check: +length=%zu using %zu input bytes", l, l/255 + 1) |
1859 | 0 | return l; |
1860 | 0 | } |
1861 | | |
1862 | | /* core decoder variant for LZ4_decompress_fast*() |
1863 | | * for legacy support only : these entry points are deprecated. |
1864 | | * - Presumes input is correctly formed (no defense vs malformed inputs) |
1865 | | * - Does not know input size (presume input buffer is "large enough") |
1866 | | * - Decompress a full block (only) |
1867 | | * @return : nb of bytes read from input. |
1868 | | * Note : this variant is not optimized for speed, just for maintenance. |
1869 | | * the goal is to remove support of decompress_fast*() variants by v2.0 |
1870 | | **/ |
1871 | | LZ4_FORCE_INLINE int |
1872 | | LZ4_decompress_unsafe_generic( |
1873 | | const BYTE* const istart, |
1874 | | BYTE* const ostart, |
1875 | | int decompressedSize, |
1876 | | |
1877 | | size_t prefixSize, |
1878 | | const BYTE* const dictStart, /* only if dict==usingExtDict */ |
1879 | | const size_t dictSize /* note: =0 if dictStart==NULL */ |
1880 | | ) |
1881 | 0 | { |
1882 | 0 | const BYTE* ip = istart; |
1883 | 0 | BYTE* op = (BYTE*)ostart; |
1884 | 0 | BYTE* const oend = ostart + decompressedSize; |
1885 | 0 | const BYTE* const prefixStart = ostart - prefixSize; |
1886 | |
|
1887 | 0 | DEBUGLOG(5, "LZ4_decompress_unsafe_generic"); |
1888 | 0 | if (dictStart == NULL) assert(dictSize == 0); |
1889 | | |
1890 | 0 | while (1) { |
1891 | | /* start new sequence */ |
1892 | 0 | unsigned token = *ip++; |
1893 | | |
1894 | | /* literals */ |
1895 | 0 | { size_t ll = token >> ML_BITS; |
1896 | 0 | if (ll==15) { |
1897 | | /* long literal length */ |
1898 | 0 | ll += read_long_length_no_check(&ip); |
1899 | 0 | } |
1900 | 0 | if ((size_t)(oend-op) < ll) return -1; /* output buffer overflow */ |
1901 | 0 | LZ4_memmove(op, ip, ll); /* support in-place decompression */ |
1902 | 0 | op += ll; |
1903 | 0 | ip += ll; |
1904 | 0 | if ((size_t)(oend-op) < MFLIMIT) { |
1905 | 0 | if (op==oend) break; /* end of block */ |
1906 | 0 | DEBUGLOG(5, "invalid: literals end at distance %zi from end of block", oend-op); |
1907 | | /* incorrect end of block : |
1908 | | * last match must start at least MFLIMIT==12 bytes before end of output block */ |
1909 | 0 | return -1; |
1910 | 0 | } } |
1911 | | |
1912 | | /* match */ |
1913 | 0 | { size_t ml = token & 15; |
1914 | 0 | size_t const offset = LZ4_readLE16(ip); |
1915 | 0 | ip+=2; |
1916 | |
|
1917 | 0 | if (ml==15) { |
1918 | | /* long literal length */ |
1919 | 0 | ml += read_long_length_no_check(&ip); |
1920 | 0 | } |
1921 | 0 | ml += MINMATCH; |
1922 | |
|
1923 | 0 | if ((size_t)(oend-op) < ml) return -1; /* output buffer overflow */ |
1924 | | |
1925 | 0 | { const BYTE* match = op - offset; |
1926 | | |
1927 | | /* out of range */ |
1928 | 0 | if (offset > (size_t)(op - prefixStart) + dictSize) { |
1929 | 0 | DEBUGLOG(6, "offset out of range"); |
1930 | 0 | return -1; |
1931 | 0 | } |
1932 | | |
1933 | | /* check special case : extDict */ |
1934 | 0 | if (offset > (size_t)(op - prefixStart)) { |
1935 | | /* extDict scenario */ |
1936 | 0 | const BYTE* const dictEnd = dictStart + dictSize; |
1937 | 0 | const BYTE* extMatch = dictEnd - (offset - (size_t)(op-prefixStart)); |
1938 | 0 | size_t const extml = (size_t)(dictEnd - extMatch); |
1939 | 0 | if (extml > ml) { |
1940 | | /* match entirely within extDict */ |
1941 | 0 | LZ4_memmove(op, extMatch, ml); |
1942 | 0 | op += ml; |
1943 | 0 | ml = 0; |
1944 | 0 | } else { |
1945 | | /* match split between extDict & prefix */ |
1946 | 0 | LZ4_memmove(op, extMatch, extml); |
1947 | 0 | op += extml; |
1948 | 0 | ml -= extml; |
1949 | 0 | } |
1950 | 0 | match = prefixStart; |
1951 | 0 | } |
1952 | | |
1953 | | /* match copy - slow variant, supporting overlap copy */ |
1954 | 0 | { size_t u; |
1955 | 0 | for (u=0; u<ml; u++) { |
1956 | 0 | op[u] = match[u]; |
1957 | 0 | } } } |
1958 | 0 | op += ml; |
1959 | 0 | if ((size_t)(oend-op) < LASTLITERALS) { |
1960 | 0 | DEBUGLOG(5, "invalid: match ends at distance %zi from end of block", oend-op); |
1961 | | /* incorrect end of block : |
1962 | | * last match must stop at least LASTLITERALS==5 bytes before end of output block */ |
1963 | 0 | return -1; |
1964 | 0 | } |
1965 | 0 | } /* match */ |
1966 | 0 | } /* main loop */ |
1967 | 0 | return (int)(ip - istart); |
1968 | 0 | } |
1969 | | |
1970 | | |
1971 | | /* Read the variable-length literal or match length. |
1972 | | * |
1973 | | * @ip : input pointer |
1974 | | * @ilimit : position after which if length is not decoded, the input is necessarily corrupted. |
1975 | | * @initial_check - check ip >= ipmax before start of loop. Returns initial_error if so. |
1976 | | * @error (output) - error code. Must be set to 0 before call. |
1977 | | **/ |
1978 | | typedef size_t Rvl_t; |
1979 | | static const Rvl_t rvl_error = (Rvl_t)(-1); |
1980 | | LZ4_FORCE_INLINE Rvl_t |
1981 | | read_variable_length(const BYTE** ip, const BYTE* ilimit, |
1982 | | int initial_check) |
1983 | 2.27M | { |
1984 | 2.27M | Rvl_t s, length = 0; |
1985 | 2.27M | assert(ip != NULL); |
1986 | 2.27M | assert(*ip != NULL); |
1987 | 2.27M | assert(ilimit != NULL); |
1988 | 2.27M | if (initial_check && unlikely((*ip) >= ilimit)) { /* read limit reached */ |
1989 | 0 | return rvl_error; |
1990 | 0 | } |
1991 | 2.27M | s = **ip; |
1992 | 2.27M | (*ip)++; |
1993 | 2.27M | length += s; |
1994 | 2.27M | if (unlikely((*ip) > ilimit)) { /* read limit reached */ |
1995 | 0 | return rvl_error; |
1996 | 0 | } |
1997 | | /* accumulator overflow detection (32-bit mode only) */ |
1998 | 2.27M | if ((sizeof(length) < 8) && unlikely(length > ((Rvl_t)(-1)/2)) ) { |
1999 | 0 | return rvl_error; |
2000 | 0 | } |
2001 | 2.27M | if (likely(s != 255)) return length; |
2002 | 1.62M | do { |
2003 | 1.62M | s = **ip; |
2004 | 1.62M | (*ip)++; |
2005 | 1.62M | length += s; |
2006 | 1.62M | if (unlikely((*ip) > ilimit)) { /* read limit reached */ |
2007 | 0 | return rvl_error; |
2008 | 0 | } |
2009 | | /* accumulator overflow detection (32-bit mode only) */ |
2010 | 1.62M | if ((sizeof(length) < 8) && unlikely(length > ((Rvl_t)(-1)/2)) ) { |
2011 | 0 | return rvl_error; |
2012 | 0 | } |
2013 | 1.62M | } while (s == 255); |
2014 | | |
2015 | 214k | return length; |
2016 | 214k | } |
2017 | | |
2018 | | /*! LZ4_decompress_generic() : |
2019 | | * This generic decompression function covers all use cases. |
2020 | | * It shall be instantiated several times, using different sets of directives. |
2021 | | * Note that it is important for performance that this function really get inlined, |
2022 | | * in order to remove useless branches during compilation optimization. |
2023 | | */ |
2024 | | LZ4_FORCE_INLINE int |
2025 | | LZ4_decompress_generic( |
2026 | | const char* const src, |
2027 | | char* const dst, |
2028 | | int srcSize, |
2029 | | int outputSize, /* If endOnInput==endOnInputSize, this value is `dstCapacity` */ |
2030 | | |
2031 | | earlyEnd_directive partialDecoding, /* full, partial */ |
2032 | | dict_directive dict, /* noDict, withPrefix64k, usingExtDict */ |
2033 | | const BYTE* const lowPrefix, /* always <= dst, == dst when no prefix */ |
2034 | | const BYTE* const dictStart, /* only if dict==usingExtDict */ |
2035 | | const size_t dictSize /* note : = 0 if noDict */ |
2036 | | ) |
2037 | 14.5k | { |
2038 | 14.5k | if ((src == NULL) || (outputSize < 0)) { return -1; } |
2039 | | |
2040 | 14.5k | { const BYTE* ip = (const BYTE*) src; |
2041 | 14.5k | const BYTE* const iend = ip + srcSize; |
2042 | | |
2043 | 14.5k | BYTE* op = (BYTE*) dst; |
2044 | 14.5k | BYTE* const oend = op + outputSize; |
2045 | 14.5k | BYTE* cpy; |
2046 | | |
2047 | 14.5k | const BYTE* const dictEnd = (dictStart == NULL) ? NULL : dictStart + dictSize; |
2048 | | |
2049 | 14.5k | const int checkOffset = (dictSize < (int)(64 KB)); |
2050 | | |
2051 | | |
2052 | | /* Set up the "end" pointers for the shortcut. */ |
2053 | 14.5k | const BYTE* const shortiend = iend - 14 /*maxLL*/ - 2 /*offset*/; |
2054 | 14.5k | const BYTE* const shortoend = oend - 14 /*maxLL*/ - 18 /*maxML*/; |
2055 | | |
2056 | 14.5k | const BYTE* match; |
2057 | 14.5k | size_t offset; |
2058 | 14.5k | unsigned token; |
2059 | 14.5k | size_t length; |
2060 | | |
2061 | | |
2062 | 14.5k | DEBUGLOG(5, "LZ4_decompress_generic (srcSize:%i, dstSize:%i)", srcSize, outputSize); |
2063 | | |
2064 | | /* Special cases */ |
2065 | 14.5k | assert(lowPrefix <= op); |
2066 | 14.5k | if (unlikely(outputSize==0)) { |
2067 | | /* Empty output buffer */ |
2068 | 0 | if (partialDecoding) return 0; |
2069 | 0 | return ((srcSize==1) && (*ip==0)) ? 0 : -1; |
2070 | 0 | } |
2071 | 14.5k | if (unlikely(srcSize==0)) { return -1; } |
2072 | | |
2073 | | /* LZ4_FAST_DEC_LOOP: |
2074 | | * designed for modern OoO performance cpus, |
2075 | | * where copying reliably 32-bytes is preferable to an unpredictable branch. |
2076 | | * note : fast loop may show a regression for some client arm chips. */ |
2077 | 14.5k | #if LZ4_FAST_DEC_LOOP |
2078 | 14.5k | if ((oend - op) < FASTLOOP_SAFE_DISTANCE) { |
2079 | 0 | DEBUGLOG(6, "move to safe decode loop"); |
2080 | 0 | goto safe_decode; |
2081 | 0 | } |
2082 | | |
2083 | | /* Fast loop : decode sequences as long as output < oend-FASTLOOP_SAFE_DISTANCE */ |
2084 | 14.5k | DEBUGLOG(6, "using fast decode loop"); |
2085 | 10.2M | while (1) { |
2086 | | /* Main fastloop assertion: We can always wildcopy FASTLOOP_SAFE_DISTANCE */ |
2087 | 10.2M | assert(oend - op >= FASTLOOP_SAFE_DISTANCE); |
2088 | 10.2M | assert(ip < iend); |
2089 | 10.2M | token = *ip++; |
2090 | 10.2M | length = token >> ML_BITS; /* literal length */ |
2091 | 10.2M | DEBUGLOG(7, "blockPos%6u: litLength token = %u", (unsigned)(op-(BYTE*)dst), (unsigned)length); |
2092 | | |
2093 | | /* decode literal length */ |
2094 | 10.2M | if (length == RUN_MASK) { |
2095 | 760k | size_t const addl = read_variable_length(&ip, iend-RUN_MASK, 1); |
2096 | 760k | if (addl == rvl_error) { |
2097 | 0 | DEBUGLOG(6, "error reading long literal length"); |
2098 | 0 | goto _output_error; |
2099 | 0 | } |
2100 | 760k | length += addl; |
2101 | 760k | if (unlikely((uptrval)(op)+length<(uptrval)(op))) { goto _output_error; } /* overflow detection */ |
2102 | 760k | if (unlikely((uptrval)(ip)+length<(uptrval)(ip))) { goto _output_error; } /* overflow detection */ |
2103 | | |
2104 | | /* copy literals */ |
2105 | 760k | LZ4_STATIC_ASSERT(MFLIMIT >= WILDCOPYLENGTH); |
2106 | 760k | if ((op+length>oend-32) || (ip+length>iend-32)) { goto safe_literal_copy; } |
2107 | 757k | LZ4_wildCopy32(op, ip, op+length); |
2108 | 757k | ip += length; op += length; |
2109 | 9.47M | } else if (ip <= iend-(16 + 1/*max lit + offset + nextToken*/)) { |
2110 | | /* We don't need to check oend, since we check it once for each loop below */ |
2111 | 9.46M | DEBUGLOG(7, "copy %u bytes in a 16-bytes stripe", (unsigned)length); |
2112 | | /* Literals can only be <= 14, but hope compilers optimize better when copy by a register size */ |
2113 | 9.46M | LZ4_memcpy(op, ip, 16); |
2114 | 9.46M | ip += length; op += length; |
2115 | 9.46M | } else { |
2116 | 8.34k | goto safe_literal_copy; |
2117 | 8.34k | } |
2118 | | |
2119 | | /* get offset */ |
2120 | 10.2M | offset = LZ4_readLE16(ip); ip+=2; |
2121 | 10.2M | DEBUGLOG(6, "blockPos%6u: offset = %u", (unsigned)(op-(BYTE*)dst), (unsigned)offset); |
2122 | 10.2M | match = op - offset; |
2123 | 10.2M | assert(match <= op); /* overflow check */ |
2124 | | |
2125 | | /* get matchlength */ |
2126 | 10.2M | length = token & ML_MASK; |
2127 | 10.2M | DEBUGLOG(7, " match length token = %u (len==%u)", (unsigned)length, (unsigned)length+MINMATCH); |
2128 | | |
2129 | 10.2M | if (length == ML_MASK) { |
2130 | 1.50M | size_t const addl = read_variable_length(&ip, iend - LASTLITERALS + 1, 0); |
2131 | 1.50M | if (addl == rvl_error) { |
2132 | 0 | DEBUGLOG(5, "error reading long match length"); |
2133 | 0 | goto _output_error; |
2134 | 0 | } |
2135 | 1.50M | length += addl; |
2136 | 1.50M | length += MINMATCH; |
2137 | 1.50M | DEBUGLOG(7, " long match length == %u", (unsigned)length); |
2138 | 1.50M | if (unlikely((uptrval)(op)+length<(uptrval)op)) { goto _output_error; } /* overflow detection */ |
2139 | 1.50M | if (op + length >= oend - FASTLOOP_SAFE_DISTANCE) { |
2140 | 2.32k | goto safe_match_copy; |
2141 | 2.32k | } |
2142 | 8.71M | } else { |
2143 | 8.71M | length += MINMATCH; |
2144 | 8.71M | if (op + length >= oend - FASTLOOP_SAFE_DISTANCE) { |
2145 | 1.17k | DEBUGLOG(7, "moving to safe_match_copy (ml==%u)", (unsigned)length); |
2146 | 1.17k | goto safe_match_copy; |
2147 | 1.17k | } |
2148 | | |
2149 | | /* Fastpath check: skip LZ4_wildCopy32 when true */ |
2150 | 8.71M | if ((dict == withPrefix64k) || (match >= lowPrefix)) { |
2151 | 8.68M | if (offset >= 8) { |
2152 | 8.26M | assert(match >= lowPrefix); |
2153 | 8.26M | assert(match <= op); |
2154 | 8.26M | assert(op + 18 <= oend); |
2155 | | |
2156 | 8.26M | LZ4_memcpy(op, match, 8); |
2157 | 8.26M | LZ4_memcpy(op+8, match+8, 8); |
2158 | 8.26M | LZ4_memcpy(op+16, match+16, 2); |
2159 | 8.26M | op += length; |
2160 | 8.26M | continue; |
2161 | 8.26M | } } } |
2162 | | |
2163 | 1.95M | if ( checkOffset && (unlikely(match + dictSize < lowPrefix)) ) { |
2164 | 0 | DEBUGLOG(5, "Error : pos=%zi, offset=%zi => outside buffers", op-lowPrefix, op-match); |
2165 | 0 | goto _output_error; |
2166 | 0 | } |
2167 | | /* match starting within external dictionary */ |
2168 | 1.95M | if ((dict==usingExtDict) && (match < lowPrefix)) { |
2169 | 36.6k | assert(dictEnd != NULL); |
2170 | 36.6k | if (unlikely(op+length > oend-LASTLITERALS)) { |
2171 | 0 | if (partialDecoding) { |
2172 | 0 | DEBUGLOG(7, "partialDecoding: dictionary match, close to dstEnd"); |
2173 | 0 | length = MIN(length, (size_t)(oend-op)); |
2174 | 0 | } else { |
2175 | 0 | DEBUGLOG(6, "end-of-block condition violated") |
2176 | 0 | goto _output_error; |
2177 | 0 | } } |
2178 | | |
2179 | 36.6k | if (length <= (size_t)(lowPrefix-match)) { |
2180 | | /* match fits entirely within external dictionary : just copy */ |
2181 | 36.1k | LZ4_memmove(op, dictEnd - (lowPrefix-match), length); |
2182 | 36.1k | op += length; |
2183 | 36.1k | } else { |
2184 | | /* match stretches into both external dictionary and current block */ |
2185 | 423 | size_t const copySize = (size_t)(lowPrefix - match); |
2186 | 423 | size_t const restSize = length - copySize; |
2187 | 423 | LZ4_memcpy(op, dictEnd - copySize, copySize); |
2188 | 423 | op += copySize; |
2189 | 423 | if (restSize > (size_t)(op - lowPrefix)) { /* overlap copy */ |
2190 | 190 | BYTE* const endOfMatch = op + restSize; |
2191 | 190 | const BYTE* copyFrom = lowPrefix; |
2192 | 1.49M | while (op < endOfMatch) { *op++ = *copyFrom++; } |
2193 | 233 | } else { |
2194 | 233 | LZ4_memcpy(op, lowPrefix, restSize); |
2195 | 233 | op += restSize; |
2196 | 233 | } } |
2197 | 36.6k | continue; |
2198 | 36.6k | } |
2199 | | |
2200 | | /* copy match within block */ |
2201 | 1.91M | cpy = op + length; |
2202 | | |
2203 | 1.91M | assert((op <= oend) && (oend-op >= 32)); |
2204 | 1.91M | if (unlikely(offset<16)) { |
2205 | 595k | LZ4_memcpy_using_offset(op, match, cpy, offset); |
2206 | 1.32M | } else { |
2207 | 1.32M | LZ4_wildCopy32(op, match, cpy); |
2208 | 1.32M | } |
2209 | | |
2210 | 1.91M | op = cpy; /* wildcopy correction */ |
2211 | 1.91M | } |
2212 | 0 | safe_decode: |
2213 | 0 | #endif |
2214 | | |
2215 | | /* Main Loop : decode remaining sequences where output < FASTLOOP_SAFE_DISTANCE */ |
2216 | 0 | DEBUGLOG(6, "using safe decode loop"); |
2217 | 25.2k | while (1) { |
2218 | 25.2k | assert(ip < iend); |
2219 | 25.2k | token = *ip++; |
2220 | 25.2k | length = token >> ML_BITS; /* literal length */ |
2221 | 25.2k | DEBUGLOG(7, "blockPos%6u: litLength token = %u", (unsigned)(op-(BYTE*)dst), (unsigned)length); |
2222 | | |
2223 | | /* A two-stage shortcut for the most common case: |
2224 | | * 1) If the literal length is 0..14, and there is enough space, |
2225 | | * enter the shortcut and copy 16 bytes on behalf of the literals |
2226 | | * (in the fast mode, only 8 bytes can be safely copied this way). |
2227 | | * 2) Further if the match length is 4..18, copy 18 bytes in a similar |
2228 | | * manner; but we ensure that there's enough space in the output for |
2229 | | * those 18 bytes earlier, upon entering the shortcut (in other words, |
2230 | | * there is a combined check for both stages). |
2231 | | */ |
2232 | 25.2k | if ( (length != RUN_MASK) |
2233 | | /* strictly "less than" on input, to re-enter the loop with at least one byte */ |
2234 | 25.2k | && likely((ip < shortiend) & (op <= shortoend)) ) { |
2235 | | /* Copy the literals */ |
2236 | 5.07k | LZ4_memcpy(op, ip, 16); |
2237 | 5.07k | op += length; ip += length; |
2238 | | |
2239 | | /* The second stage: prepare for match copying, decode full info. |
2240 | | * If it doesn't work out, the info won't be wasted. */ |
2241 | 5.07k | length = token & ML_MASK; /* match length */ |
2242 | 5.07k | DEBUGLOG(7, "blockPos%6u: matchLength token = %u (len=%u)", (unsigned)(op-(BYTE*)dst), (unsigned)length, (unsigned)length + 4); |
2243 | 5.07k | offset = LZ4_readLE16(ip); ip += 2; |
2244 | 5.07k | match = op - offset; |
2245 | 5.07k | assert(match <= op); /* check overflow */ |
2246 | | |
2247 | | /* Do not deal with overlapping matches. */ |
2248 | 5.07k | if ( (length != ML_MASK) |
2249 | 5.07k | && (offset >= 8) |
2250 | 5.07k | && (dict==withPrefix64k || match >= lowPrefix) ) { |
2251 | | /* Copy the match. */ |
2252 | 3.85k | LZ4_memcpy(op + 0, match + 0, 8); |
2253 | 3.85k | LZ4_memcpy(op + 8, match + 8, 8); |
2254 | 3.85k | LZ4_memcpy(op +16, match +16, 2); |
2255 | 3.85k | op += length + MINMATCH; |
2256 | | /* Both stages worked, load the next token. */ |
2257 | 3.85k | continue; |
2258 | 3.85k | } |
2259 | | |
2260 | | /* The second stage didn't work out, but the info is ready. |
2261 | | * Propel it right to the point of match copying. */ |
2262 | 1.22k | goto _copy_match; |
2263 | 5.07k | } |
2264 | | |
2265 | | /* decode literal length */ |
2266 | 20.1k | if (length == RUN_MASK) { |
2267 | 742 | size_t const addl = read_variable_length(&ip, iend-RUN_MASK, 1); |
2268 | 742 | if (addl == rvl_error) { goto _output_error; } |
2269 | 742 | length += addl; |
2270 | 742 | if (unlikely((uptrval)(op)+length<(uptrval)(op))) { goto _output_error; } /* overflow detection */ |
2271 | 742 | if (unlikely((uptrval)(ip)+length<(uptrval)(ip))) { goto _output_error; } /* overflow detection */ |
2272 | 742 | } |
2273 | | |
2274 | 20.1k | #if LZ4_FAST_DEC_LOOP |
2275 | 31.2k | safe_literal_copy: |
2276 | 31.2k | #endif |
2277 | | /* copy literals */ |
2278 | 31.2k | cpy = op+length; |
2279 | | |
2280 | 31.2k | LZ4_STATIC_ASSERT(MFLIMIT >= WILDCOPYLENGTH); |
2281 | 31.2k | if ((cpy>oend-MFLIMIT) || (ip+length>iend-(2+1+LASTLITERALS))) { |
2282 | | /* We've either hit the input parsing restriction or the output parsing restriction. |
2283 | | * In the normal scenario, decoding a full block, it must be the last sequence, |
2284 | | * otherwise it's an error (invalid input or dimensions). |
2285 | | * In partialDecoding scenario, it's necessary to ensure there is no buffer overflow. |
2286 | | */ |
2287 | 14.5k | if (partialDecoding) { |
2288 | | /* Since we are partial decoding we may be in this block because of the output parsing |
2289 | | * restriction, which is not valid since the output buffer is allowed to be undersized. |
2290 | | */ |
2291 | 0 | DEBUGLOG(7, "partialDecoding: copying literals, close to input or output end") |
2292 | 0 | DEBUGLOG(7, "partialDecoding: literal length = %u", (unsigned)length); |
2293 | 0 | DEBUGLOG(7, "partialDecoding: remaining space in dstBuffer : %i", (int)(oend - op)); |
2294 | 0 | DEBUGLOG(7, "partialDecoding: remaining space in srcBuffer : %i", (int)(iend - ip)); |
2295 | | /* Finishing in the middle of a literals segment, |
2296 | | * due to lack of input. |
2297 | | */ |
2298 | 0 | if (ip+length > iend) { |
2299 | 0 | length = (size_t)(iend-ip); |
2300 | 0 | cpy = op + length; |
2301 | 0 | } |
2302 | | /* Finishing in the middle of a literals segment, |
2303 | | * due to lack of output space. |
2304 | | */ |
2305 | 0 | if (cpy > oend) { |
2306 | 0 | cpy = oend; |
2307 | 0 | assert(op<=oend); |
2308 | 0 | length = (size_t)(oend-op); |
2309 | 0 | } |
2310 | 14.5k | } else { |
2311 | | /* We must be on the last sequence (or invalid) because of the parsing limitations |
2312 | | * so check that we exactly consume the input and don't overrun the output buffer. |
2313 | | */ |
2314 | 14.5k | if ((ip+length != iend) || (cpy > oend)) { |
2315 | 0 | DEBUGLOG(5, "should have been last run of literals") |
2316 | 0 | DEBUGLOG(5, "ip(%p) + length(%i) = %p != iend (%p)", (void*)ip, (int)length, (void*)(ip+length), (void*)iend); |
2317 | 0 | DEBUGLOG(5, "or cpy(%p) > (oend-MFLIMIT)(%p)", (void*)cpy, (void*)(oend-MFLIMIT)); |
2318 | 0 | DEBUGLOG(5, "after writing %u bytes / %i bytes available", (unsigned)(op-(BYTE*)dst), outputSize); |
2319 | 0 | goto _output_error; |
2320 | 0 | } |
2321 | 14.5k | } |
2322 | 14.5k | LZ4_memmove(op, ip, length); /* supports overlapping memory regions, for in-place decompression scenarios */ |
2323 | 14.5k | ip += length; |
2324 | 14.5k | op += length; |
2325 | | /* Necessarily EOF when !partialDecoding. |
2326 | | * When partialDecoding, it is EOF if we've either |
2327 | | * filled the output buffer or |
2328 | | * can't proceed with reading an offset for following match. |
2329 | | */ |
2330 | 14.5k | if (!partialDecoding || (cpy == oend) || (ip >= (iend-2))) { |
2331 | 14.5k | break; |
2332 | 14.5k | } |
2333 | 16.6k | } else { |
2334 | 16.6k | LZ4_wildCopy8(op, ip, cpy); /* can overwrite up to 8 bytes beyond cpy */ |
2335 | 16.6k | ip += length; op = cpy; |
2336 | 16.6k | } |
2337 | | |
2338 | | /* get offset */ |
2339 | 16.6k | offset = LZ4_readLE16(ip); ip+=2; |
2340 | 16.6k | match = op - offset; |
2341 | | |
2342 | | /* get matchlength */ |
2343 | 16.6k | length = token & ML_MASK; |
2344 | 16.6k | DEBUGLOG(7, "blockPos%6u: matchLength token = %u", (unsigned)(op-(BYTE*)dst), (unsigned)length); |
2345 | | |
2346 | 17.9k | _copy_match: |
2347 | 17.9k | if (length == ML_MASK) { |
2348 | 5.30k | size_t const addl = read_variable_length(&ip, iend - LASTLITERALS + 1, 0); |
2349 | 5.30k | if (addl == rvl_error) { goto _output_error; } |
2350 | 5.30k | length += addl; |
2351 | 5.30k | if (unlikely((uptrval)(op)+length<(uptrval)op)) goto _output_error; /* overflow detection */ |
2352 | 5.30k | } |
2353 | 17.9k | length += MINMATCH; |
2354 | | |
2355 | 17.9k | #if LZ4_FAST_DEC_LOOP |
2356 | 21.3k | safe_match_copy: |
2357 | 21.3k | #endif |
2358 | 21.3k | if ((checkOffset) && (unlikely(match + dictSize < lowPrefix))) goto _output_error; /* Error : offset outside buffers */ |
2359 | | /* match starting within external dictionary */ |
2360 | 21.3k | if ((dict==usingExtDict) && (match < lowPrefix)) { |
2361 | 551 | assert(dictEnd != NULL); |
2362 | 551 | if (unlikely(op+length > oend-LASTLITERALS)) { |
2363 | 0 | if (partialDecoding) length = MIN(length, (size_t)(oend-op)); |
2364 | 0 | else goto _output_error; /* doesn't respect parsing restriction */ |
2365 | 0 | } |
2366 | | |
2367 | 551 | if (length <= (size_t)(lowPrefix-match)) { |
2368 | | /* match fits entirely within external dictionary : just copy */ |
2369 | 389 | LZ4_memmove(op, dictEnd - (lowPrefix-match), length); |
2370 | 389 | op += length; |
2371 | 389 | } else { |
2372 | | /* match stretches into both external dictionary and current block */ |
2373 | 162 | size_t const copySize = (size_t)(lowPrefix - match); |
2374 | 162 | size_t const restSize = length - copySize; |
2375 | 162 | LZ4_memcpy(op, dictEnd - copySize, copySize); |
2376 | 162 | op += copySize; |
2377 | 162 | if (restSize > (size_t)(op - lowPrefix)) { /* overlap copy */ |
2378 | 119 | BYTE* const endOfMatch = op + restSize; |
2379 | 119 | const BYTE* copyFrom = lowPrefix; |
2380 | 2.05M | while (op < endOfMatch) *op++ = *copyFrom++; |
2381 | 119 | } else { |
2382 | 43 | LZ4_memcpy(op, lowPrefix, restSize); |
2383 | 43 | op += restSize; |
2384 | 43 | } } |
2385 | 551 | continue; |
2386 | 551 | } |
2387 | 20.8k | assert(match >= lowPrefix); |
2388 | | |
2389 | | /* copy match within block */ |
2390 | 20.8k | cpy = op + length; |
2391 | | |
2392 | | /* partialDecoding : may end anywhere within the block */ |
2393 | 20.8k | assert(op<=oend); |
2394 | 20.8k | if (partialDecoding && (cpy > oend-MATCH_SAFEGUARD_DISTANCE)) { |
2395 | 0 | size_t const mlen = MIN(length, (size_t)(oend-op)); |
2396 | 0 | const BYTE* const matchEnd = match + mlen; |
2397 | 0 | BYTE* const copyEnd = op + mlen; |
2398 | 0 | if (matchEnd > op) { /* overlap copy */ |
2399 | 0 | while (op < copyEnd) { *op++ = *match++; } |
2400 | 0 | } else { |
2401 | 0 | LZ4_memcpy(op, match, mlen); |
2402 | 0 | } |
2403 | 0 | op = copyEnd; |
2404 | 0 | if (op == oend) { break; } |
2405 | 0 | continue; |
2406 | 0 | } |
2407 | | |
2408 | 20.8k | if (unlikely(offset<8)) { |
2409 | 7.41k | LZ4_write32(op, 0); /* silence msan warning when offset==0 */ |
2410 | 7.41k | op[0] = match[0]; |
2411 | 7.41k | op[1] = match[1]; |
2412 | 7.41k | op[2] = match[2]; |
2413 | 7.41k | op[3] = match[3]; |
2414 | 7.41k | match += inc32table[offset]; |
2415 | 7.41k | LZ4_memcpy(op+4, match, 4); |
2416 | 7.41k | match -= dec64table[offset]; |
2417 | 13.4k | } else { |
2418 | 13.4k | LZ4_memcpy(op, match, 8); |
2419 | 13.4k | match += 8; |
2420 | 13.4k | } |
2421 | 20.8k | op += 8; |
2422 | | |
2423 | 20.8k | if (unlikely(cpy > oend-MATCH_SAFEGUARD_DISTANCE)) { |
2424 | 4.72k | BYTE* const oCopyLimit = oend - (WILDCOPYLENGTH-1); |
2425 | 4.72k | if (cpy > oend-LASTLITERALS) { goto _output_error; } /* Error : last LASTLITERALS bytes must be literals (uncompressed) */ |
2426 | 4.72k | if (op < oCopyLimit) { |
2427 | 4.03k | LZ4_wildCopy8(op, match, oCopyLimit); |
2428 | 4.03k | match += oCopyLimit - op; |
2429 | 4.03k | op = oCopyLimit; |
2430 | 4.03k | } |
2431 | 12.2k | while (op < cpy) { *op++ = *match++; } |
2432 | 16.1k | } else { |
2433 | 16.1k | LZ4_memcpy(op, match, 8); |
2434 | 16.1k | if (length > 16) { LZ4_wildCopy8(op+8, match+8, cpy); } |
2435 | 16.1k | } |
2436 | 20.8k | op = cpy; /* wildcopy correction */ |
2437 | 20.8k | } |
2438 | | |
2439 | | /* end of decoding */ |
2440 | 14.5k | DEBUGLOG(5, "decoded %i bytes", (int) (((char*)op)-dst)); |
2441 | 14.5k | return (int) (((char*)op)-dst); /* Nb of output bytes decoded */ |
2442 | | |
2443 | | /* Overflow error detected */ |
2444 | 0 | _output_error: |
2445 | 0 | return (int) (-(((const char*)ip)-src))-1; |
2446 | 0 | } |
2447 | 0 | } |
2448 | | |
2449 | | |
2450 | | /*===== Instantiate the API decoding functions. =====*/ |
2451 | | |
2452 | | LZ4_FORCE_O2 |
2453 | | int LZ4_decompress_safe(const char* source, char* dest, int compressedSize, int maxDecompressedSize) |
2454 | 11.1k | { |
2455 | 11.1k | return LZ4_decompress_generic(source, dest, compressedSize, maxDecompressedSize, |
2456 | 11.1k | decode_full_block, noDict, |
2457 | 11.1k | (BYTE*)dest, NULL, 0); |
2458 | 11.1k | } |
2459 | | |
2460 | | LZ4_FORCE_O2 |
2461 | | int LZ4_decompress_safe_partial(const char* src, char* dst, int compressedSize, int targetOutputSize, int dstCapacity) |
2462 | 0 | { |
2463 | 0 | dstCapacity = MIN(targetOutputSize, dstCapacity); |
2464 | 0 | return LZ4_decompress_generic(src, dst, compressedSize, dstCapacity, |
2465 | 0 | partial_decode, |
2466 | 0 | noDict, (BYTE*)dst, NULL, 0); |
2467 | 0 | } |
2468 | | |
2469 | | LZ4_FORCE_O2 |
2470 | | int LZ4_decompress_fast(const char* source, char* dest, int originalSize) |
2471 | 0 | { |
2472 | 0 | DEBUGLOG(5, "LZ4_decompress_fast"); |
2473 | 0 | return LZ4_decompress_unsafe_generic( |
2474 | 0 | (const BYTE*)source, (BYTE*)dest, originalSize, |
2475 | 0 | 0, NULL, 0); |
2476 | 0 | } |
2477 | | |
2478 | | /*===== Instantiate a few more decoding cases, used more than once. =====*/ |
2479 | | |
2480 | | LZ4_FORCE_O2 /* Exported, an obsolete API function. */ |
2481 | | int LZ4_decompress_safe_withPrefix64k(const char* source, char* dest, int compressedSize, int maxOutputSize) |
2482 | 2.48k | { |
2483 | 2.48k | return LZ4_decompress_generic(source, dest, compressedSize, maxOutputSize, |
2484 | 2.48k | decode_full_block, withPrefix64k, |
2485 | 2.48k | (BYTE*)dest - 64 KB, NULL, 0); |
2486 | 2.48k | } |
2487 | | |
2488 | | LZ4_FORCE_O2 |
2489 | | static int LZ4_decompress_safe_partial_withPrefix64k(const char* source, char* dest, int compressedSize, int targetOutputSize, int dstCapacity) |
2490 | 0 | { |
2491 | 0 | dstCapacity = MIN(targetOutputSize, dstCapacity); |
2492 | 0 | return LZ4_decompress_generic(source, dest, compressedSize, dstCapacity, |
2493 | 0 | partial_decode, withPrefix64k, |
2494 | 0 | (BYTE*)dest - 64 KB, NULL, 0); |
2495 | 0 | } |
2496 | | |
2497 | | /* Another obsolete API function, paired with the previous one. */ |
2498 | | int LZ4_decompress_fast_withPrefix64k(const char* source, char* dest, int originalSize) |
2499 | 0 | { |
2500 | 0 | return LZ4_decompress_unsafe_generic( |
2501 | 0 | (const BYTE*)source, (BYTE*)dest, originalSize, |
2502 | 0 | 64 KB, NULL, 0); |
2503 | 0 | } |
2504 | | |
2505 | | LZ4_FORCE_O2 |
2506 | | static int LZ4_decompress_safe_withSmallPrefix(const char* source, char* dest, int compressedSize, int maxOutputSize, |
2507 | | size_t prefixSize) |
2508 | 0 | { |
2509 | 0 | return LZ4_decompress_generic(source, dest, compressedSize, maxOutputSize, |
2510 | 0 | decode_full_block, noDict, |
2511 | 0 | (BYTE*)dest-prefixSize, NULL, 0); |
2512 | 0 | } |
2513 | | |
2514 | | LZ4_FORCE_O2 |
2515 | | static int LZ4_decompress_safe_partial_withSmallPrefix(const char* source, char* dest, int compressedSize, int targetOutputSize, int dstCapacity, |
2516 | | size_t prefixSize) |
2517 | 0 | { |
2518 | 0 | dstCapacity = MIN(targetOutputSize, dstCapacity); |
2519 | 0 | return LZ4_decompress_generic(source, dest, compressedSize, dstCapacity, |
2520 | 0 | partial_decode, noDict, |
2521 | 0 | (BYTE*)dest-prefixSize, NULL, 0); |
2522 | 0 | } |
2523 | | |
2524 | | LZ4_FORCE_O2 |
2525 | | int LZ4_decompress_safe_forceExtDict(const char* source, char* dest, |
2526 | | int compressedSize, int maxOutputSize, |
2527 | | const void* dictStart, size_t dictSize) |
2528 | 944 | { |
2529 | 944 | DEBUGLOG(5, "LZ4_decompress_safe_forceExtDict"); |
2530 | 944 | return LZ4_decompress_generic(source, dest, compressedSize, maxOutputSize, |
2531 | 944 | decode_full_block, usingExtDict, |
2532 | 944 | (BYTE*)dest, (const BYTE*)dictStart, dictSize); |
2533 | 944 | } |
2534 | | |
2535 | | LZ4_FORCE_O2 |
2536 | | int LZ4_decompress_safe_partial_forceExtDict(const char* source, char* dest, |
2537 | | int compressedSize, int targetOutputSize, int dstCapacity, |
2538 | | const void* dictStart, size_t dictSize) |
2539 | 0 | { |
2540 | 0 | dstCapacity = MIN(targetOutputSize, dstCapacity); |
2541 | 0 | return LZ4_decompress_generic(source, dest, compressedSize, dstCapacity, |
2542 | 0 | partial_decode, usingExtDict, |
2543 | 0 | (BYTE*)dest, (const BYTE*)dictStart, dictSize); |
2544 | 0 | } |
2545 | | |
2546 | | LZ4_FORCE_O2 |
2547 | | static int LZ4_decompress_fast_extDict(const char* source, char* dest, int originalSize, |
2548 | | const void* dictStart, size_t dictSize) |
2549 | 0 | { |
2550 | 0 | return LZ4_decompress_unsafe_generic( |
2551 | 0 | (const BYTE*)source, (BYTE*)dest, originalSize, |
2552 | 0 | 0, (const BYTE*)dictStart, dictSize); |
2553 | 0 | } |
2554 | | |
2555 | | /* The "double dictionary" mode, for use with e.g. ring buffers: the first part |
2556 | | * of the dictionary is passed as prefix, and the second via dictStart + dictSize. |
2557 | | * These routines are used only once, in LZ4_decompress_*_continue(). |
2558 | | */ |
2559 | | LZ4_FORCE_INLINE |
2560 | | int LZ4_decompress_safe_doubleDict(const char* source, char* dest, int compressedSize, int maxOutputSize, |
2561 | | size_t prefixSize, const void* dictStart, size_t dictSize) |
2562 | 0 | { |
2563 | 0 | return LZ4_decompress_generic(source, dest, compressedSize, maxOutputSize, |
2564 | 0 | decode_full_block, usingExtDict, |
2565 | 0 | (BYTE*)dest-prefixSize, (const BYTE*)dictStart, dictSize); |
2566 | 0 | } |
2567 | | |
2568 | | /*===== streaming decompression functions =====*/ |
2569 | | |
2570 | | #if !defined(LZ4_STATIC_LINKING_ONLY_DISABLE_MEMORY_ALLOCATION) |
2571 | | LZ4_streamDecode_t* LZ4_createStreamDecode(void) |
2572 | 0 | { |
2573 | 0 | LZ4_STATIC_ASSERT(sizeof(LZ4_streamDecode_t) >= sizeof(LZ4_streamDecode_t_internal)); |
2574 | 0 | return (LZ4_streamDecode_t*) ALLOC_AND_ZERO(sizeof(LZ4_streamDecode_t)); |
2575 | 0 | } |
2576 | | |
2577 | | int LZ4_freeStreamDecode (LZ4_streamDecode_t* LZ4_stream) |
2578 | 0 | { |
2579 | 0 | if (LZ4_stream == NULL) { return 0; } /* support free on NULL */ |
2580 | 0 | FREEMEM(LZ4_stream); |
2581 | 0 | return 0; |
2582 | 0 | } |
2583 | | #endif |
2584 | | |
2585 | | /*! LZ4_setStreamDecode() : |
2586 | | * Use this function to instruct where to find the dictionary. |
2587 | | * This function is not necessary if previous data is still available where it was decoded. |
2588 | | * Loading a size of 0 is allowed (same effect as no dictionary). |
2589 | | * @return : 1 if OK, 0 if error |
2590 | | */ |
2591 | | int LZ4_setStreamDecode (LZ4_streamDecode_t* LZ4_streamDecode, const char* dictionary, int dictSize) |
2592 | 0 | { |
2593 | 0 | LZ4_streamDecode_t_internal* lz4sd = &LZ4_streamDecode->internal_donotuse; |
2594 | 0 | lz4sd->prefixSize = (size_t)dictSize; |
2595 | 0 | if (dictSize) { |
2596 | 0 | assert(dictionary != NULL); |
2597 | 0 | lz4sd->prefixEnd = (const BYTE*) dictionary + dictSize; |
2598 | 0 | } else { |
2599 | 0 | lz4sd->prefixEnd = (const BYTE*) dictionary; |
2600 | 0 | } |
2601 | 0 | lz4sd->externalDict = NULL; |
2602 | 0 | lz4sd->extDictSize = 0; |
2603 | 0 | return 1; |
2604 | 0 | } |
2605 | | |
2606 | | /*! LZ4_decoderRingBufferSize() : |
2607 | | * when setting a ring buffer for streaming decompression (optional scenario), |
2608 | | * provides the minimum size of this ring buffer |
2609 | | * to be compatible with any source respecting maxBlockSize condition. |
2610 | | * Note : in a ring buffer scenario, |
2611 | | * blocks are presumed decompressed next to each other. |
2612 | | * When not enough space remains for next block (remainingSize < maxBlockSize), |
2613 | | * decoding resumes from beginning of ring buffer. |
2614 | | * @return : minimum ring buffer size, |
2615 | | * or 0 if there is an error (invalid maxBlockSize). |
2616 | | */ |
2617 | | int LZ4_decoderRingBufferSize(int maxBlockSize) |
2618 | 0 | { |
2619 | 0 | if (maxBlockSize < 0) return 0; |
2620 | 0 | if (maxBlockSize > LZ4_MAX_INPUT_SIZE) return 0; |
2621 | 0 | if (maxBlockSize < 16) maxBlockSize = 16; |
2622 | 0 | return LZ4_DECODER_RING_BUFFER_SIZE(maxBlockSize); |
2623 | 0 | } |
2624 | | |
2625 | | /* |
2626 | | *_continue() : |
2627 | | These decoding functions allow decompression of multiple blocks in "streaming" mode. |
2628 | | Previously decoded blocks must still be available at the memory position where they were decoded. |
2629 | | If it's not possible, save the relevant part of decoded data into a safe buffer, |
2630 | | and indicate where it stands using LZ4_setStreamDecode() |
2631 | | */ |
2632 | | LZ4_FORCE_O2 |
2633 | | int LZ4_decompress_safe_continue (LZ4_streamDecode_t* LZ4_streamDecode, const char* source, char* dest, int compressedSize, int maxOutputSize) |
2634 | 0 | { |
2635 | 0 | LZ4_streamDecode_t_internal* lz4sd = &LZ4_streamDecode->internal_donotuse; |
2636 | 0 | int result; |
2637 | |
|
2638 | 0 | if (lz4sd->prefixSize == 0) { |
2639 | | /* The first call, no dictionary yet. */ |
2640 | 0 | assert(lz4sd->extDictSize == 0); |
2641 | 0 | result = LZ4_decompress_safe(source, dest, compressedSize, maxOutputSize); |
2642 | 0 | if (result <= 0) return result; |
2643 | 0 | lz4sd->prefixSize = (size_t)result; |
2644 | 0 | lz4sd->prefixEnd = (BYTE*)dest + result; |
2645 | 0 | } else if (lz4sd->prefixEnd == (BYTE*)dest) { |
2646 | | /* They're rolling the current segment. */ |
2647 | 0 | if (lz4sd->prefixSize >= 64 KB - 1) |
2648 | 0 | result = LZ4_decompress_safe_withPrefix64k(source, dest, compressedSize, maxOutputSize); |
2649 | 0 | else if (lz4sd->extDictSize == 0) |
2650 | 0 | result = LZ4_decompress_safe_withSmallPrefix(source, dest, compressedSize, maxOutputSize, |
2651 | 0 | lz4sd->prefixSize); |
2652 | 0 | else |
2653 | 0 | result = LZ4_decompress_safe_doubleDict(source, dest, compressedSize, maxOutputSize, |
2654 | 0 | lz4sd->prefixSize, lz4sd->externalDict, lz4sd->extDictSize); |
2655 | 0 | if (result <= 0) return result; |
2656 | 0 | lz4sd->prefixSize += (size_t)result; |
2657 | 0 | lz4sd->prefixEnd += result; |
2658 | 0 | } else { |
2659 | | /* The buffer wraps around, or they're switching to another buffer. */ |
2660 | 0 | lz4sd->extDictSize = lz4sd->prefixSize; |
2661 | 0 | lz4sd->externalDict = lz4sd->prefixEnd - lz4sd->extDictSize; |
2662 | 0 | result = LZ4_decompress_safe_forceExtDict(source, dest, compressedSize, maxOutputSize, |
2663 | 0 | lz4sd->externalDict, lz4sd->extDictSize); |
2664 | 0 | if (result <= 0) return result; |
2665 | 0 | lz4sd->prefixSize = (size_t)result; |
2666 | 0 | lz4sd->prefixEnd = (BYTE*)dest + result; |
2667 | 0 | } |
2668 | | |
2669 | 0 | return result; |
2670 | 0 | } |
2671 | | |
2672 | | LZ4_FORCE_O2 int |
2673 | | LZ4_decompress_fast_continue (LZ4_streamDecode_t* LZ4_streamDecode, |
2674 | | const char* source, char* dest, int originalSize) |
2675 | 0 | { |
2676 | 0 | LZ4_streamDecode_t_internal* const lz4sd = |
2677 | 0 | (assert(LZ4_streamDecode!=NULL), &LZ4_streamDecode->internal_donotuse); |
2678 | 0 | int result; |
2679 | |
|
2680 | 0 | DEBUGLOG(5, "LZ4_decompress_fast_continue (toDecodeSize=%i)", originalSize); |
2681 | 0 | assert(originalSize >= 0); |
2682 | | |
2683 | 0 | if (lz4sd->prefixSize == 0) { |
2684 | 0 | DEBUGLOG(5, "first invocation : no prefix nor extDict"); |
2685 | 0 | assert(lz4sd->extDictSize == 0); |
2686 | 0 | result = LZ4_decompress_fast(source, dest, originalSize); |
2687 | 0 | if (result <= 0) return result; |
2688 | 0 | lz4sd->prefixSize = (size_t)originalSize; |
2689 | 0 | lz4sd->prefixEnd = (BYTE*)dest + originalSize; |
2690 | 0 | } else if (lz4sd->prefixEnd == (BYTE*)dest) { |
2691 | 0 | DEBUGLOG(5, "continue using existing prefix"); |
2692 | 0 | result = LZ4_decompress_unsafe_generic( |
2693 | 0 | (const BYTE*)source, (BYTE*)dest, originalSize, |
2694 | 0 | lz4sd->prefixSize, |
2695 | 0 | lz4sd->externalDict, lz4sd->extDictSize); |
2696 | 0 | if (result <= 0) return result; |
2697 | 0 | lz4sd->prefixSize += (size_t)originalSize; |
2698 | 0 | lz4sd->prefixEnd += originalSize; |
2699 | 0 | } else { |
2700 | 0 | DEBUGLOG(5, "prefix becomes extDict"); |
2701 | 0 | lz4sd->extDictSize = lz4sd->prefixSize; |
2702 | 0 | lz4sd->externalDict = lz4sd->prefixEnd - lz4sd->extDictSize; |
2703 | 0 | result = LZ4_decompress_fast_extDict(source, dest, originalSize, |
2704 | 0 | lz4sd->externalDict, lz4sd->extDictSize); |
2705 | 0 | if (result <= 0) return result; |
2706 | 0 | lz4sd->prefixSize = (size_t)originalSize; |
2707 | 0 | lz4sd->prefixEnd = (BYTE*)dest + originalSize; |
2708 | 0 | } |
2709 | | |
2710 | 0 | return result; |
2711 | 0 | } |
2712 | | |
2713 | | |
2714 | | /* |
2715 | | Advanced decoding functions : |
2716 | | *_usingDict() : |
2717 | | These decoding functions work the same as "_continue" ones, |
2718 | | the dictionary must be explicitly provided within parameters |
2719 | | */ |
2720 | | |
2721 | | int LZ4_decompress_safe_usingDict(const char* source, char* dest, int compressedSize, int maxOutputSize, const char* dictStart, int dictSize) |
2722 | 14.5k | { |
2723 | 14.5k | if (dictSize==0) |
2724 | 11.1k | return LZ4_decompress_safe(source, dest, compressedSize, maxOutputSize); |
2725 | 3.42k | if (dictStart+dictSize == dest) { |
2726 | 2.48k | if (dictSize >= 64 KB - 1) { |
2727 | 2.48k | return LZ4_decompress_safe_withPrefix64k(source, dest, compressedSize, maxOutputSize); |
2728 | 2.48k | } |
2729 | 0 | assert(dictSize >= 0); |
2730 | 0 | return LZ4_decompress_safe_withSmallPrefix(source, dest, compressedSize, maxOutputSize, (size_t)dictSize); |
2731 | 0 | } |
2732 | 944 | assert(dictSize >= 0); |
2733 | 944 | return LZ4_decompress_safe_forceExtDict(source, dest, compressedSize, maxOutputSize, dictStart, (size_t)dictSize); |
2734 | 944 | } |
2735 | | |
2736 | | int LZ4_decompress_safe_partial_usingDict(const char* source, char* dest, int compressedSize, int targetOutputSize, int dstCapacity, const char* dictStart, int dictSize) |
2737 | 0 | { |
2738 | 0 | if (dictSize==0) |
2739 | 0 | return LZ4_decompress_safe_partial(source, dest, compressedSize, targetOutputSize, dstCapacity); |
2740 | 0 | if (dictStart+dictSize == dest) { |
2741 | 0 | if (dictSize >= 64 KB - 1) { |
2742 | 0 | return LZ4_decompress_safe_partial_withPrefix64k(source, dest, compressedSize, targetOutputSize, dstCapacity); |
2743 | 0 | } |
2744 | 0 | assert(dictSize >= 0); |
2745 | 0 | return LZ4_decompress_safe_partial_withSmallPrefix(source, dest, compressedSize, targetOutputSize, dstCapacity, (size_t)dictSize); |
2746 | 0 | } |
2747 | 0 | assert(dictSize >= 0); |
2748 | 0 | return LZ4_decompress_safe_partial_forceExtDict(source, dest, compressedSize, targetOutputSize, dstCapacity, dictStart, (size_t)dictSize); |
2749 | 0 | } |
2750 | | |
2751 | | int LZ4_decompress_fast_usingDict(const char* source, char* dest, int originalSize, const char* dictStart, int dictSize) |
2752 | 0 | { |
2753 | 0 | if (dictSize==0 || dictStart+dictSize == dest) |
2754 | 0 | return LZ4_decompress_unsafe_generic( |
2755 | 0 | (const BYTE*)source, (BYTE*)dest, originalSize, |
2756 | 0 | (size_t)dictSize, NULL, 0); |
2757 | 0 | assert(dictSize >= 0); |
2758 | 0 | return LZ4_decompress_fast_extDict(source, dest, originalSize, dictStart, (size_t)dictSize); |
2759 | 0 | } |
2760 | | |
2761 | | |
2762 | | /*=************************************************* |
2763 | | * Obsolete Functions |
2764 | | ***************************************************/ |
2765 | | /* obsolete compression functions */ |
2766 | | int LZ4_compress_limitedOutput(const char* source, char* dest, int inputSize, int maxOutputSize) |
2767 | 0 | { |
2768 | 0 | return LZ4_compress_default(source, dest, inputSize, maxOutputSize); |
2769 | 0 | } |
2770 | | int LZ4_compress(const char* src, char* dest, int srcSize) |
2771 | 0 | { |
2772 | 0 | return LZ4_compress_default(src, dest, srcSize, LZ4_compressBound(srcSize)); |
2773 | 0 | } |
2774 | | int LZ4_compress_limitedOutput_withState (void* state, const char* src, char* dst, int srcSize, int dstSize) |
2775 | 0 | { |
2776 | 0 | return LZ4_compress_fast_extState(state, src, dst, srcSize, dstSize, 1); |
2777 | 0 | } |
2778 | | int LZ4_compress_withState (void* state, const char* src, char* dst, int srcSize) |
2779 | 0 | { |
2780 | 0 | return LZ4_compress_fast_extState(state, src, dst, srcSize, LZ4_compressBound(srcSize), 1); |
2781 | 0 | } |
2782 | | int LZ4_compress_limitedOutput_continue (LZ4_stream_t* LZ4_stream, const char* src, char* dst, int srcSize, int dstCapacity) |
2783 | 0 | { |
2784 | 0 | return LZ4_compress_fast_continue(LZ4_stream, src, dst, srcSize, dstCapacity, 1); |
2785 | 0 | } |
2786 | | int LZ4_compress_continue (LZ4_stream_t* LZ4_stream, const char* source, char* dest, int inputSize) |
2787 | 0 | { |
2788 | 0 | return LZ4_compress_fast_continue(LZ4_stream, source, dest, inputSize, LZ4_compressBound(inputSize), 1); |
2789 | 0 | } |
2790 | | |
2791 | | /* |
2792 | | These decompression functions are deprecated and should no longer be used. |
2793 | | They are only provided here for compatibility with older user programs. |
2794 | | - LZ4_uncompress is totally equivalent to LZ4_decompress_fast |
2795 | | - LZ4_uncompress_unknownOutputSize is totally equivalent to LZ4_decompress_safe |
2796 | | */ |
2797 | | int LZ4_uncompress (const char* source, char* dest, int outputSize) |
2798 | 0 | { |
2799 | 0 | return LZ4_decompress_fast(source, dest, outputSize); |
2800 | 0 | } |
2801 | | int LZ4_uncompress_unknownOutputSize (const char* source, char* dest, int isize, int maxOutputSize) |
2802 | 0 | { |
2803 | 0 | return LZ4_decompress_safe(source, dest, isize, maxOutputSize); |
2804 | 0 | } |
2805 | | |
2806 | | /* Obsolete Streaming functions */ |
2807 | | |
2808 | 0 | int LZ4_sizeofStreamState(void) { return sizeof(LZ4_stream_t); } |
2809 | | |
2810 | | int LZ4_resetStreamState(void* state, char* inputBuffer) |
2811 | 0 | { |
2812 | 0 | (void)inputBuffer; |
2813 | 0 | LZ4_resetStream((LZ4_stream_t*)state); |
2814 | 0 | return 0; |
2815 | 0 | } |
2816 | | |
2817 | | #if !defined(LZ4_STATIC_LINKING_ONLY_DISABLE_MEMORY_ALLOCATION) |
2818 | | void* LZ4_create (char* inputBuffer) |
2819 | 0 | { |
2820 | 0 | (void)inputBuffer; |
2821 | 0 | return LZ4_createStream(); |
2822 | 0 | } |
2823 | | #endif |
2824 | | |
2825 | | char* LZ4_slideInputBuffer (void* state) |
2826 | 0 | { |
2827 | | /* avoid const char * -> char * conversion warning */ |
2828 | 0 | return (char *)(uptrval)((LZ4_stream_t*)state)->internal_donotuse.dictionary; |
2829 | 0 | } |
2830 | | |
2831 | | #endif /* LZ4_COMMONDEFS_ONLY */ |