Coverage Report

Created: 2025-08-26 06:35

/src/lzma-fuzz/sdk/C/LzFind.c
Line
Count
Source (jump to first uncovered line)
1
/* LzFind.c -- Match finder for LZ algorithms
2
2018-07-08 : Igor Pavlov : Public domain */
3
4
#include "Precomp.h"
5
6
#include <string.h>
7
8
#include "LzFind.h"
9
#include "LzHash.h"
10
11
59.8G
#define kEmptyHashValue 0
12
5.11M
#define kMaxValForNormalize ((UInt32)0xFFFFFFFF)
13
0
#define kNormalizeStepMin (1 << 10) /* it must be power of 2 */
14
0
#define kNormalizeMask (~(UInt32)(kNormalizeStepMin - 1))
15
22.1k
#define kMaxHistorySize ((UInt32)7 << 29)
16
17
#define kStartMaxLen 3
18
19
static void LzInWindow_Free(CMatchFinder *p, ISzAllocPtr alloc)
20
44.3k
{
21
44.3k
  if (!p->directInput)
22
44.3k
  {
23
44.3k
    ISzAlloc_Free(alloc, p->bufferBase);
24
44.3k
    p->bufferBase = NULL;
25
44.3k
  }
26
44.3k
}
27
28
/* keepSizeBefore + keepSizeAfter + keepSizeReserv must be < 4G) */
29
30
static int LzInWindow_Create(CMatchFinder *p, UInt32 keepSizeReserv, ISzAllocPtr alloc)
31
22.1k
{
32
22.1k
  UInt32 blockSize = p->keepSizeBefore + p->keepSizeAfter + keepSizeReserv;
33
22.1k
  if (p->directInput)
34
0
  {
35
0
    p->blockSize = blockSize;
36
0
    return 1;
37
0
  }
38
22.1k
  if (!p->bufferBase || p->blockSize != blockSize)
39
22.1k
  {
40
22.1k
    LzInWindow_Free(p, alloc);
41
22.1k
    p->blockSize = blockSize;
42
22.1k
    p->bufferBase = (Byte *)ISzAlloc_Alloc(alloc, (size_t)blockSize);
43
22.1k
  }
44
22.1k
  return (p->bufferBase != NULL);
45
22.1k
}
46
47
528M
Byte *MatchFinder_GetPointerToCurrentPos(CMatchFinder *p) { return p->buffer; }
48
49
505M
UInt32 MatchFinder_GetNumAvailableBytes(CMatchFinder *p) { return p->streamPos - p->pos; }
50
51
void MatchFinder_ReduceOffsets(CMatchFinder *p, UInt32 subValue)
52
0
{
53
0
  p->posLimit -= subValue;
54
0
  p->pos -= subValue;
55
0
  p->streamPos -= subValue;
56
0
}
57
58
static void MatchFinder_ReadBlock(CMatchFinder *p)
59
28.0k
{
60
28.0k
  if (p->streamEndWasReached || p->result != SZ_OK)
61
0
    return;
62
63
  /* We use (p->streamPos - p->pos) value. (p->streamPos < p->pos) is allowed. */
64
65
28.0k
  if (p->directInput)
66
0
  {
67
0
    UInt32 curSize = 0xFFFFFFFF - (p->streamPos - p->pos);
68
0
    if (curSize > p->directInputRem)
69
0
      curSize = (UInt32)p->directInputRem;
70
0
    p->directInputRem -= curSize;
71
0
    p->streamPos += curSize;
72
0
    if (p->directInputRem == 0)
73
0
      p->streamEndWasReached = 1;
74
0
    return;
75
0
  }
76
  
77
28.0k
  for (;;)
78
45.8k
  {
79
45.8k
    Byte *dest = p->buffer + (p->streamPos - p->pos);
80
45.8k
    size_t size = (p->bufferBase + p->blockSize - dest);
81
45.8k
    if (size == 0)
82
0
      return;
83
84
45.8k
    p->result = ISeqInStream_Read(p->stream, dest, &size);
85
45.8k
    if (p->result != SZ_OK)
86
0
      return;
87
45.8k
    if (size == 0)
88
22.1k
    {
89
22.1k
      p->streamEndWasReached = 1;
90
22.1k
      return;
91
22.1k
    }
92
23.6k
    p->streamPos += (UInt32)size;
93
23.6k
    if (p->streamPos - p->pos > p->keepSizeAfter)
94
5.91k
      return;
95
23.6k
  }
96
28.0k
}
97
98
void MatchFinder_MoveBlock(CMatchFinder *p)
99
0
{
100
0
  memmove(p->bufferBase,
101
0
      p->buffer - p->keepSizeBefore,
102
0
      (size_t)(p->streamPos - p->pos) + p->keepSizeBefore);
103
0
  p->buffer = p->bufferBase + p->keepSizeBefore;
104
0
}
105
106
int MatchFinder_NeedMove(CMatchFinder *p)
107
5.91k
{
108
5.91k
  if (p->directInput)
109
0
    return 0;
110
  /* if (p->streamEndWasReached) return 0; */
111
5.91k
  return ((size_t)(p->bufferBase + p->blockSize - p->buffer) <= p->keepSizeAfter);
112
5.91k
}
113
114
void MatchFinder_ReadIfRequired(CMatchFinder *p)
115
0
{
116
0
  if (p->streamEndWasReached)
117
0
    return;
118
0
  if (p->keepSizeAfter >= p->streamPos - p->pos)
119
0
    MatchFinder_ReadBlock(p);
120
0
}
121
122
static void MatchFinder_CheckAndMoveAndRead(CMatchFinder *p)
123
5.91k
{
124
5.91k
  if (MatchFinder_NeedMove(p))
125
0
    MatchFinder_MoveBlock(p);
126
5.91k
  MatchFinder_ReadBlock(p);
127
5.91k
}
128
129
static void MatchFinder_SetDefaultSettings(CMatchFinder *p)
130
22.1k
{
131
22.1k
  p->cutValue = 32;
132
22.1k
  p->btMode = 1;
133
22.1k
  p->numHashBytes = 4;
134
22.1k
  p->bigHash = 0;
135
22.1k
}
136
137
45.3M
#define kCrcPoly 0xEDB88320
138
139
void MatchFinder_Construct(CMatchFinder *p)
140
22.1k
{
141
22.1k
  unsigned i;
142
22.1k
  p->bufferBase = NULL;
143
22.1k
  p->directInput = 0;
144
22.1k
  p->hash = NULL;
145
22.1k
  p->expectedDataSize = (UInt64)(Int64)-1;
146
22.1k
  MatchFinder_SetDefaultSettings(p);
147
148
5.69M
  for (i = 0; i < 256; i++)
149
5.67M
  {
150
5.67M
    UInt32 r = (UInt32)i;
151
5.67M
    unsigned j;
152
51.0M
    for (j = 0; j < 8; j++)
153
45.3M
      r = (r >> 1) ^ (kCrcPoly & ((UInt32)0 - (r & 1)));
154
5.67M
    p->crc[i] = r;
155
5.67M
  }
156
22.1k
}
157
158
static void MatchFinder_FreeThisClassMemory(CMatchFinder *p, ISzAllocPtr alloc)
159
44.3k
{
160
44.3k
  ISzAlloc_Free(alloc, p->hash);
161
44.3k
  p->hash = NULL;
162
44.3k
}
163
164
void MatchFinder_Free(CMatchFinder *p, ISzAllocPtr alloc)
165
22.1k
{
166
22.1k
  MatchFinder_FreeThisClassMemory(p, alloc);
167
22.1k
  LzInWindow_Free(p, alloc);
168
22.1k
}
169
170
static CLzRef* AllocRefs(size_t num, ISzAllocPtr alloc)
171
22.1k
{
172
22.1k
  size_t sizeInBytes = (size_t)num * sizeof(CLzRef);
173
22.1k
  if (sizeInBytes / sizeof(CLzRef) != num)
174
0
    return NULL;
175
22.1k
  return (CLzRef *)ISzAlloc_Alloc(alloc, sizeInBytes);
176
22.1k
}
177
178
int MatchFinder_Create(CMatchFinder *p, UInt32 historySize,
179
    UInt32 keepAddBufferBefore, UInt32 matchMaxLen, UInt32 keepAddBufferAfter,
180
    ISzAllocPtr alloc)
181
22.1k
{
182
22.1k
  UInt32 sizeReserv;
183
  
184
22.1k
  if (historySize > kMaxHistorySize)
185
0
  {
186
0
    MatchFinder_Free(p, alloc);
187
0
    return 0;
188
0
  }
189
  
190
22.1k
  sizeReserv = historySize >> 1;
191
22.1k
       if (historySize >= ((UInt32)3 << 30)) sizeReserv = historySize >> 3;
192
22.1k
  else if (historySize >= ((UInt32)2 << 30)) sizeReserv = historySize >> 2;
193
  
194
22.1k
  sizeReserv += (keepAddBufferBefore + matchMaxLen + keepAddBufferAfter) / 2 + (1 << 19);
195
196
22.1k
  p->keepSizeBefore = historySize + keepAddBufferBefore + 1;
197
22.1k
  p->keepSizeAfter = matchMaxLen + keepAddBufferAfter;
198
  
199
  /* we need one additional byte, since we use MoveBlock after pos++ and before dictionary using */
200
  
201
22.1k
  if (LzInWindow_Create(p, sizeReserv, alloc))
202
22.1k
  {
203
22.1k
    UInt32 newCyclicBufferSize = historySize + 1;
204
22.1k
    UInt32 hs;
205
22.1k
    p->matchMaxLen = matchMaxLen;
206
22.1k
    {
207
22.1k
      p->fixedHashSize = 0;
208
22.1k
      if (p->numHashBytes == 2)
209
6.82k
        hs = (1 << 16) - 1;
210
15.3k
      else
211
15.3k
      {
212
15.3k
        hs = historySize;
213
15.3k
        if (hs > p->expectedDataSize)
214
8.45k
          hs = (UInt32)p->expectedDataSize;
215
15.3k
        if (hs != 0)
216
15.3k
          hs--;
217
15.3k
        hs |= (hs >> 1);
218
15.3k
        hs |= (hs >> 2);
219
15.3k
        hs |= (hs >> 4);
220
15.3k
        hs |= (hs >> 8);
221
15.3k
        hs >>= 1;
222
15.3k
        hs |= 0xFFFF; /* don't change it! It's required for Deflate */
223
15.3k
        if (hs > (1 << 24))
224
0
        {
225
0
          if (p->numHashBytes == 3)
226
0
            hs = (1 << 24) - 1;
227
0
          else
228
0
            hs >>= 1;
229
          /* if (bigHash) mode, GetHeads4b() in LzFindMt.c needs (hs >= ((1 << 24) - 1))) */
230
0
        }
231
15.3k
      }
232
22.1k
      p->hashMask = hs;
233
22.1k
      hs++;
234
22.1k
      if (p->numHashBytes > 2) p->fixedHashSize += kHash2Size;
235
22.1k
      if (p->numHashBytes > 3) p->fixedHashSize += kHash3Size;
236
22.1k
      if (p->numHashBytes > 4) p->fixedHashSize += kHash4Size;
237
22.1k
      hs += p->fixedHashSize;
238
22.1k
    }
239
240
22.1k
    {
241
22.1k
      size_t newSize;
242
22.1k
      size_t numSons;
243
22.1k
      p->historySize = historySize;
244
22.1k
      p->hashSizeSum = hs;
245
22.1k
      p->cyclicBufferSize = newCyclicBufferSize;
246
      
247
22.1k
      numSons = newCyclicBufferSize;
248
22.1k
      if (p->btMode)
249
19.1k
        numSons <<= 1;
250
22.1k
      newSize = hs + numSons;
251
252
22.1k
      if (p->hash && p->numRefs == newSize)
253
0
        return 1;
254
      
255
22.1k
      MatchFinder_FreeThisClassMemory(p, alloc);
256
22.1k
      p->numRefs = newSize;
257
22.1k
      p->hash = AllocRefs(newSize, alloc);
258
      
259
22.1k
      if (p->hash)
260
22.1k
      {
261
22.1k
        p->son = p->hash + p->hashSizeSum;
262
22.1k
        return 1;
263
22.1k
      }
264
22.1k
    }
265
22.1k
  }
266
267
0
  MatchFinder_Free(p, alloc);
268
0
  return 0;
269
22.1k
}
270
271
static void MatchFinder_SetLimits(CMatchFinder *p)
272
2.56M
{
273
2.56M
  UInt32 limit = kMaxValForNormalize - p->pos;
274
2.56M
  UInt32 limit2 = p->cyclicBufferSize - p->cyclicBufferPos;
275
  
276
2.56M
  if (limit2 < limit)
277
2.56M
    limit = limit2;
278
2.56M
  limit2 = p->streamPos - p->pos;
279
  
280
2.56M
  if (limit2 <= p->keepSizeAfter)
281
2.56M
  {
282
2.56M
    if (limit2 > 0)
283
2.54M
      limit2 = 1;
284
2.56M
  }
285
5.91k
  else
286
5.91k
    limit2 -= p->keepSizeAfter;
287
  
288
2.56M
  if (limit2 < limit)
289
2.56M
    limit = limit2;
290
  
291
2.56M
  {
292
2.56M
    UInt32 lenLimit = p->streamPos - p->pos;
293
2.56M
    if (lenLimit > p->matchMaxLen)
294
1.78M
      lenLimit = p->matchMaxLen;
295
2.56M
    p->lenLimit = lenLimit;
296
2.56M
  }
297
2.56M
  p->posLimit = p->pos + limit;
298
2.56M
}
299
300
301
void MatchFinder_Init_LowHash(CMatchFinder *p)
302
22.1k
{
303
22.1k
  size_t i;
304
22.1k
  CLzRef *items = p->hash;
305
22.1k
  size_t numItems = p->fixedHashSize;
306
832M
  for (i = 0; i < numItems; i++)
307
832M
    items[i] = kEmptyHashValue;
308
22.1k
}
309
310
311
void MatchFinder_Init_HighHash(CMatchFinder *p)
312
22.1k
{
313
22.1k
  size_t i;
314
22.1k
  CLzRef *items = p->hash + p->fixedHashSize;
315
22.1k
  size_t numItems = (size_t)p->hashMask + 1;
316
58.6G
  for (i = 0; i < numItems; i++)
317
58.6G
    items[i] = kEmptyHashValue;
318
22.1k
}
319
320
321
void MatchFinder_Init_3(CMatchFinder *p, int readData)
322
22.1k
{
323
22.1k
  p->cyclicBufferPos = 0;
324
22.1k
  p->buffer = p->bufferBase;
325
22.1k
  p->pos =
326
22.1k
  p->streamPos = p->cyclicBufferSize;
327
22.1k
  p->result = SZ_OK;
328
22.1k
  p->streamEndWasReached = 0;
329
  
330
22.1k
  if (readData)
331
22.1k
    MatchFinder_ReadBlock(p);
332
  
333
22.1k
  MatchFinder_SetLimits(p);
334
22.1k
}
335
336
337
void MatchFinder_Init(CMatchFinder *p)
338
22.1k
{
339
22.1k
  MatchFinder_Init_HighHash(p);
340
22.1k
  MatchFinder_Init_LowHash(p);
341
22.1k
  MatchFinder_Init_3(p, True);
342
22.1k
}
343
344
  
345
static UInt32 MatchFinder_GetSubValue(CMatchFinder *p)
346
0
{
347
0
  return (p->pos - p->historySize - 1) & kNormalizeMask;
348
0
}
349
350
void MatchFinder_Normalize3(UInt32 subValue, CLzRef *items, size_t numItems)
351
0
{
352
0
  size_t i;
353
0
  for (i = 0; i < numItems; i++)
354
0
  {
355
0
    UInt32 value = items[i];
356
0
    if (value <= subValue)
357
0
      value = kEmptyHashValue;
358
0
    else
359
0
      value -= subValue;
360
0
    items[i] = value;
361
0
  }
362
0
}
363
364
static void MatchFinder_Normalize(CMatchFinder *p)
365
0
{
366
0
  UInt32 subValue = MatchFinder_GetSubValue(p);
367
0
  MatchFinder_Normalize3(subValue, p->hash, p->numRefs);
368
0
  MatchFinder_ReduceOffsets(p, subValue);
369
0
}
370
371
372
MY_NO_INLINE
373
static void MatchFinder_CheckLimits(CMatchFinder *p)
374
2.54M
{
375
2.54M
  if (p->pos == kMaxValForNormalize)
376
0
    MatchFinder_Normalize(p);
377
2.54M
  if (!p->streamEndWasReached && p->keepSizeAfter == p->streamPos - p->pos)
378
5.91k
    MatchFinder_CheckAndMoveAndRead(p);
379
2.54M
  if (p->cyclicBufferPos == p->cyclicBufferSize)
380
0
    p->cyclicBufferPos = 0;
381
2.54M
  MatchFinder_SetLimits(p);
382
2.54M
}
383
384
385
/*
386
  (lenLimit > maxLen)
387
*/
388
MY_FORCE_INLINE
389
static UInt32 * Hc_GetMatchesSpec(unsigned lenLimit, UInt32 curMatch, UInt32 pos, const Byte *cur, CLzRef *son,
390
    UInt32 _cyclicBufferPos, UInt32 _cyclicBufferSize, UInt32 cutValue,
391
    UInt32 *distances, unsigned maxLen)
392
1.58M
{
393
  /*
394
  son[_cyclicBufferPos] = curMatch;
395
  for (;;)
396
  {
397
    UInt32 delta = pos - curMatch;
398
    if (cutValue-- == 0 || delta >= _cyclicBufferSize)
399
      return distances;
400
    {
401
      const Byte *pb = cur - delta;
402
      curMatch = son[_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)];
403
      if (pb[maxLen] == cur[maxLen] && *pb == *cur)
404
      {
405
        UInt32 len = 0;
406
        while (++len != lenLimit)
407
          if (pb[len] != cur[len])
408
            break;
409
        if (maxLen < len)
410
        {
411
          maxLen = len;
412
          *distances++ = len;
413
          *distances++ = delta - 1;
414
          if (len == lenLimit)
415
            return distances;
416
        }
417
      }
418
    }
419
  }
420
  */
421
422
1.58M
  const Byte *lim = cur + lenLimit;
423
1.58M
  son[_cyclicBufferPos] = curMatch;
424
1.58M
  do
425
11.2M
  {
426
11.2M
    UInt32 delta = pos - curMatch;
427
11.2M
    if (delta >= _cyclicBufferSize)
428
1.13M
      break;
429
10.1M
    {
430
10.1M
      ptrdiff_t diff;
431
10.1M
      curMatch = son[_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)];
432
10.1M
      diff = (ptrdiff_t)0 - delta;
433
10.1M
      if (cur[maxLen] == cur[maxLen + diff])
434
1.93M
      {
435
1.93M
        const Byte *c = cur;
436
32.8M
        while (*c == c[diff])
437
30.9M
        {
438
30.9M
          if (++c == lim)
439
39.0k
          {
440
39.0k
            distances[0] = (UInt32)(lim - cur);
441
39.0k
            distances[1] = delta - 1;
442
39.0k
            return distances + 2;
443
39.0k
          }
444
30.9M
        }
445
1.89M
        {
446
1.89M
          unsigned len = (unsigned)(c - cur);
447
1.89M
          if (maxLen < len)
448
268k
          {
449
268k
            maxLen = len;
450
268k
            distances[0] = (UInt32)len;
451
268k
            distances[1] = delta - 1;
452
268k
            distances += 2;
453
268k
          }
454
1.89M
        }
455
1.89M
      }
456
10.1M
    }
457
10.1M
  }
458
10.1M
  while (--cutValue);
459
  
460
1.54M
  return distances;
461
1.58M
}
462
463
464
MY_FORCE_INLINE
465
UInt32 * GetMatchesSpec1(UInt32 lenLimit, UInt32 curMatch, UInt32 pos, const Byte *cur, CLzRef *son,
466
    UInt32 _cyclicBufferPos, UInt32 _cyclicBufferSize, UInt32 cutValue,
467
    UInt32 *distances, UInt32 maxLen)
468
302M
{
469
302M
  CLzRef *ptr0 = son + ((size_t)_cyclicBufferPos << 1) + 1;
470
302M
  CLzRef *ptr1 = son + ((size_t)_cyclicBufferPos << 1);
471
302M
  unsigned len0 = 0, len1 = 0;
472
302M
  for (;;)
473
637M
  {
474
637M
    UInt32 delta = pos - curMatch;
475
637M
    if (cutValue-- == 0 || delta >= _cyclicBufferSize)
476
301M
    {
477
301M
      *ptr0 = *ptr1 = kEmptyHashValue;
478
301M
      return distances;
479
301M
    }
480
336M
    {
481
336M
      CLzRef *pair = son + ((size_t)(_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)) << 1);
482
336M
      const Byte *pb = cur - delta;
483
336M
      unsigned len = (len0 < len1 ? len0 : len1);
484
336M
      UInt32 pair0 = pair[0];
485
336M
      if (pb[len] == cur[len])
486
142M
      {
487
142M
        if (++len != lenLimit && pb[len] == cur[len])
488
694M
          while (++len != lenLimit)
489
693M
            if (pb[len] != cur[len])
490
116M
              break;
491
142M
        if (maxLen < len)
492
47.9M
        {
493
47.9M
          maxLen = (UInt32)len;
494
47.9M
          *distances++ = (UInt32)len;
495
47.9M
          *distances++ = delta - 1;
496
47.9M
          if (len == lenLimit)
497
646k
          {
498
646k
            *ptr1 = pair0;
499
646k
            *ptr0 = pair[1];
500
646k
            return distances;
501
646k
          }
502
47.9M
        }
503
142M
      }
504
335M
      if (pb[len] < cur[len])
505
113M
      {
506
113M
        *ptr1 = curMatch;
507
113M
        ptr1 = pair + 1;
508
113M
        curMatch = *ptr1;
509
113M
        len1 = len;
510
113M
      }
511
222M
      else
512
222M
      {
513
222M
        *ptr0 = curMatch;
514
222M
        ptr0 = pair;
515
222M
        curMatch = *ptr0;
516
222M
        len0 = len;
517
222M
      }
518
335M
    }
519
335M
  }
520
302M
}
521
522
static void SkipMatchesSpec(UInt32 lenLimit, UInt32 curMatch, UInt32 pos, const Byte *cur, CLzRef *son,
523
    UInt32 _cyclicBufferPos, UInt32 _cyclicBufferSize, UInt32 cutValue)
524
152M
{
525
152M
  CLzRef *ptr0 = son + ((size_t)_cyclicBufferPos << 1) + 1;
526
152M
  CLzRef *ptr1 = son + ((size_t)_cyclicBufferPos << 1);
527
152M
  unsigned len0 = 0, len1 = 0;
528
152M
  for (;;)
529
655M
  {
530
655M
    UInt32 delta = pos - curMatch;
531
655M
    if (cutValue-- == 0 || delta >= _cyclicBufferSize)
532
25.1M
    {
533
25.1M
      *ptr0 = *ptr1 = kEmptyHashValue;
534
25.1M
      return;
535
25.1M
    }
536
630M
    {
537
630M
      CLzRef *pair = son + ((size_t)(_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)) << 1);
538
630M
      const Byte *pb = cur - delta;
539
630M
      unsigned len = (len0 < len1 ? len0 : len1);
540
630M
      if (pb[len] == cur[len])
541
390M
      {
542
5.64G
        while (++len != lenLimit)
543
5.51G
          if (pb[len] != cur[len])
544
263M
            break;
545
390M
        {
546
390M
          if (len == lenLimit)
547
127M
          {
548
127M
            *ptr1 = pair[0];
549
127M
            *ptr0 = pair[1];
550
127M
            return;
551
127M
          }
552
390M
        }
553
390M
      }
554
502M
      if (pb[len] < cur[len])
555
143M
      {
556
143M
        *ptr1 = curMatch;
557
143M
        ptr1 = pair + 1;
558
143M
        curMatch = *ptr1;
559
143M
        len1 = len;
560
143M
      }
561
358M
      else
562
358M
      {
563
358M
        *ptr0 = curMatch;
564
358M
        ptr0 = pair;
565
358M
        curMatch = *ptr0;
566
358M
        len0 = len;
567
358M
      }
568
502M
    }
569
502M
  }
570
152M
}
571
572
#define MOVE_POS \
573
460M
  ++p->cyclicBufferPos; \
574
460M
  p->buffer++; \
575
460M
  if (++p->pos == p->posLimit) MatchFinder_CheckLimits(p);
576
577
304M
#define MOVE_POS_RET MOVE_POS return (UInt32)offset;
578
579
49.7k
static void MatchFinder_MovePos(CMatchFinder *p) { MOVE_POS; }
580
581
#define GET_MATCHES_HEADER2(minLen, ret_op) \
582
460M
  unsigned lenLimit; UInt32 hv; const Byte *cur; UInt32 curMatch; \
583
460M
  lenLimit = (unsigned)p->lenLimit; { if (lenLimit < minLen) { MatchFinder_MovePos(p); ret_op; }} \
584
460M
  cur = p->buffer;
585
586
304M
#define GET_MATCHES_HEADER(minLen) GET_MATCHES_HEADER2(minLen, return 0)
587
156M
#define SKIP_HEADER(minLen)        GET_MATCHES_HEADER2(minLen, continue)
588
589
456M
#define MF_PARAMS(p) p->pos, p->buffer, p->son, p->cyclicBufferPos, p->cyclicBufferSize, p->cutValue
590
591
#define GET_MATCHES_FOOTER(offset, maxLen) \
592
302M
  offset = (unsigned)(GetMatchesSpec1((UInt32)lenLimit, curMatch, MF_PARAMS(p), \
593
302M
  distances + offset, (UInt32)maxLen) - distances); MOVE_POS_RET;
594
595
#define SKIP_FOOTER \
596
151M
  SkipMatchesSpec((UInt32)lenLimit, curMatch, MF_PARAMS(p)); MOVE_POS;
597
598
83.9M
#define UPDATE_maxLen { \
599
83.9M
    ptrdiff_t diff = (ptrdiff_t)0 - d2; \
600
83.9M
    const Byte *c = cur + maxLen; \
601
83.9M
    const Byte *lim = cur + lenLimit; \
602
253M
    for (; c != lim; c++) if (*(c + diff) != *c) break; \
603
83.9M
    maxLen = (unsigned)(c - cur); }
604
605
static UInt32 Bt2_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
606
9.24M
{
607
9.24M
  unsigned offset;
608
9.24M
  GET_MATCHES_HEADER(2)
609
9.23M
  HASH2_CALC;
610
9.23M
  curMatch = p->hash[hv];
611
9.23M
  p->hash[hv] = p->pos;
612
9.23M
  offset = 0;
613
9.23M
  GET_MATCHES_FOOTER(offset, 1)
614
0
}
615
616
UInt32 Bt3Zip_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
617
0
{
618
0
  unsigned offset;
619
0
  GET_MATCHES_HEADER(3)
620
0
  HASH_ZIP_CALC;
621
0
  curMatch = p->hash[hv];
622
0
  p->hash[hv] = p->pos;
623
0
  offset = 0;
624
0
  GET_MATCHES_FOOTER(offset, 2)
625
0
}
626
627
static UInt32 Bt3_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
628
4.77M
{
629
4.77M
  UInt32 h2, d2, pos;
630
4.77M
  unsigned maxLen, offset;
631
4.77M
  UInt32 *hash;
632
4.77M
  GET_MATCHES_HEADER(3)
633
634
4.77M
  HASH3_CALC;
635
636
4.77M
  hash = p->hash;
637
4.77M
  pos = p->pos;
638
639
4.77M
  d2 = pos - hash[h2];
640
641
4.77M
  curMatch = (hash + kFix3HashSize)[hv];
642
  
643
4.77M
  hash[h2] = pos;
644
4.77M
  (hash + kFix3HashSize)[hv] = pos;
645
646
4.77M
  maxLen = 2;
647
4.77M
  offset = 0;
648
649
4.77M
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
650
1.06M
  {
651
1.06M
    UPDATE_maxLen
652
1.06M
    distances[0] = (UInt32)maxLen;
653
1.06M
    distances[1] = d2 - 1;
654
1.06M
    offset = 2;
655
1.06M
    if (maxLen == lenLimit)
656
22.8k
    {
657
22.8k
      SkipMatchesSpec((UInt32)lenLimit, curMatch, MF_PARAMS(p));
658
22.8k
      MOVE_POS_RET;
659
0
    }
660
1.06M
  }
661
  
662
4.75M
  GET_MATCHES_FOOTER(offset, maxLen)
663
0
}
664
665
static UInt32 Bt4_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
666
288M
{
667
288M
  UInt32 h2, h3, d2, d3, pos;
668
288M
  unsigned maxLen, offset;
669
288M
  UInt32 *hash;
670
288M
  GET_MATCHES_HEADER(4)
671
672
288M
  HASH4_CALC;
673
674
288M
  hash = p->hash;
675
288M
  pos = p->pos;
676
677
288M
  d2 = pos - hash                  [h2];
678
288M
  d3 = pos - (hash + kFix3HashSize)[h3];
679
680
288M
  curMatch = (hash + kFix4HashSize)[hv];
681
682
288M
  hash                  [h2] = pos;
683
288M
  (hash + kFix3HashSize)[h3] = pos;
684
288M
  (hash + kFix4HashSize)[hv] = pos;
685
686
288M
  maxLen = 0;
687
288M
  offset = 0;
688
  
689
288M
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
690
66.7M
  {
691
66.7M
    maxLen = 2;
692
66.7M
    distances[0] = 2;
693
66.7M
    distances[1] = d2 - 1;
694
66.7M
    offset = 2;
695
66.7M
  }
696
  
697
288M
  if (d2 != d3 && d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
698
36.6M
  {
699
36.6M
    maxLen = 3;
700
36.6M
    distances[(size_t)offset + 1] = d3 - 1;
701
36.6M
    offset += 2;
702
36.6M
    d2 = d3;
703
36.6M
  }
704
  
705
288M
  if (offset != 0)
706
82.2M
  {
707
82.2M
    UPDATE_maxLen
708
82.2M
    distances[(size_t)offset - 2] = (UInt32)maxLen;
709
82.2M
    if (maxLen == lenLimit)
710
684k
    {
711
684k
      SkipMatchesSpec((UInt32)lenLimit, curMatch, MF_PARAMS(p));
712
684k
      MOVE_POS_RET;
713
0
    }
714
82.2M
  }
715
  
716
288M
  if (maxLen < 3)
717
224M
    maxLen = 3;
718
  
719
288M
  GET_MATCHES_FOOTER(offset, maxLen)
720
0
}
721
722
/*
723
static UInt32 Bt5_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
724
{
725
  UInt32 h2, h3, h4, d2, d3, d4, maxLen, offset, pos;
726
  UInt32 *hash;
727
  GET_MATCHES_HEADER(5)
728
729
  HASH5_CALC;
730
731
  hash = p->hash;
732
  pos = p->pos;
733
734
  d2 = pos - hash                  [h2];
735
  d3 = pos - (hash + kFix3HashSize)[h3];
736
  d4 = pos - (hash + kFix4HashSize)[h4];
737
738
  curMatch = (hash + kFix5HashSize)[hv];
739
740
  hash                  [h2] = pos;
741
  (hash + kFix3HashSize)[h3] = pos;
742
  (hash + kFix4HashSize)[h4] = pos;
743
  (hash + kFix5HashSize)[hv] = pos;
744
745
  maxLen = 0;
746
  offset = 0;
747
748
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
749
  {
750
    distances[0] = maxLen = 2;
751
    distances[1] = d2 - 1;
752
    offset = 2;
753
    if (*(cur - d2 + 2) == cur[2])
754
      distances[0] = maxLen = 3;
755
    else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
756
    {
757
      distances[2] = maxLen = 3;
758
      distances[3] = d3 - 1;
759
      offset = 4;
760
      d2 = d3;
761
    }
762
  }
763
  else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
764
  {
765
    distances[0] = maxLen = 3;
766
    distances[1] = d3 - 1;
767
    offset = 2;
768
    d2 = d3;
769
  }
770
  
771
  if (d2 != d4 && d4 < p->cyclicBufferSize
772
      && *(cur - d4) == *cur
773
      && *(cur - d4 + 3) == *(cur + 3))
774
  {
775
    maxLen = 4;
776
    distances[(size_t)offset + 1] = d4 - 1;
777
    offset += 2;
778
    d2 = d4;
779
  }
780
  
781
  if (offset != 0)
782
  {
783
    UPDATE_maxLen
784
    distances[(size_t)offset - 2] = maxLen;
785
    if (maxLen == lenLimit)
786
    {
787
      SkipMatchesSpec(lenLimit, curMatch, MF_PARAMS(p));
788
      MOVE_POS_RET;
789
    }
790
  }
791
792
  if (maxLen < 4)
793
    maxLen = 4;
794
  
795
  GET_MATCHES_FOOTER(offset, maxLen)
796
}
797
*/
798
799
static UInt32 Hc4_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
800
1.67M
{
801
1.67M
  UInt32 h2, h3, d2, d3, pos;
802
1.67M
  unsigned maxLen, offset;
803
1.67M
  UInt32 *hash;
804
1.67M
  GET_MATCHES_HEADER(4)
805
806
1.66M
  HASH4_CALC;
807
808
1.66M
  hash = p->hash;
809
1.66M
  pos = p->pos;
810
  
811
1.66M
  d2 = pos - hash                  [h2];
812
1.66M
  d3 = pos - (hash + kFix3HashSize)[h3];
813
1.66M
  curMatch = (hash + kFix4HashSize)[hv];
814
815
1.66M
  hash                  [h2] = pos;
816
1.66M
  (hash + kFix3HashSize)[h3] = pos;
817
1.66M
  (hash + kFix4HashSize)[hv] = pos;
818
819
1.66M
  maxLen = 0;
820
1.66M
  offset = 0;
821
822
1.66M
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
823
644k
  {
824
644k
    maxLen = 2;
825
644k
    distances[0] = 2;
826
644k
    distances[1] = d2 - 1;
827
644k
    offset = 2;
828
644k
  }
829
  
830
1.66M
  if (d2 != d3 && d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
831
289k
  {
832
289k
    maxLen = 3;
833
289k
    distances[(size_t)offset + 1] = d3 - 1;
834
289k
    offset += 2;
835
289k
    d2 = d3;
836
289k
  }
837
  
838
1.66M
  if (offset != 0)
839
672k
  {
840
672k
    UPDATE_maxLen
841
672k
    distances[(size_t)offset - 2] = (UInt32)maxLen;
842
672k
    if (maxLen == lenLimit)
843
84.4k
    {
844
84.4k
      p->son[p->cyclicBufferPos] = curMatch;
845
84.4k
      MOVE_POS_RET;
846
0
    }
847
672k
  }
848
  
849
1.58M
  if (maxLen < 3)
850
1.11M
    maxLen = 3;
851
852
1.58M
  offset = (unsigned)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
853
1.58M
      distances + offset, maxLen) - (distances));
854
1.58M
  MOVE_POS_RET
855
1.66M
}
856
857
/*
858
static UInt32 Hc5_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
859
{
860
  UInt32 h2, h3, h4, d2, d3, d4, maxLen, offset, pos
861
  UInt32 *hash;
862
  GET_MATCHES_HEADER(5)
863
864
  HASH5_CALC;
865
866
  hash = p->hash;
867
  pos = p->pos;
868
  
869
  d2 = pos - hash                  [h2];
870
  d3 = pos - (hash + kFix3HashSize)[h3];
871
  d4 = pos - (hash + kFix4HashSize)[h4];
872
873
  curMatch = (hash + kFix5HashSize)[hv];
874
875
  hash                  [h2] = pos;
876
  (hash + kFix3HashSize)[h3] = pos;
877
  (hash + kFix4HashSize)[h4] = pos;
878
  (hash + kFix5HashSize)[hv] = pos;
879
880
  maxLen = 0;
881
  offset = 0;
882
883
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
884
  {
885
    distances[0] = maxLen = 2;
886
    distances[1] = d2 - 1;
887
    offset = 2;
888
    if (*(cur - d2 + 2) == cur[2])
889
      distances[0] = maxLen = 3;
890
    else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
891
    {
892
      distances[2] = maxLen = 3;
893
      distances[3] = d3 - 1;
894
      offset = 4;
895
      d2 = d3;
896
    }
897
  }
898
  else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
899
  {
900
    distances[0] = maxLen = 3;
901
    distances[1] = d3 - 1;
902
    offset = 2;
903
    d2 = d3;
904
  }
905
  
906
  if (d2 != d4 && d4 < p->cyclicBufferSize
907
      && *(cur - d4) == *cur
908
      && *(cur - d4 + 3) == *(cur + 3))
909
  {
910
    maxLen = 4;
911
    distances[(size_t)offset + 1] = d4 - 1;
912
    offset += 2;
913
    d2 = d4;
914
  }
915
  
916
  if (offset != 0)
917
  {
918
    UPDATE_maxLen
919
    distances[(size_t)offset - 2] = maxLen;
920
    if (maxLen == lenLimit)
921
    {
922
      p->son[p->cyclicBufferPos] = curMatch;
923
      MOVE_POS_RET;
924
    }
925
  }
926
  
927
  if (maxLen < 4)
928
    maxLen = 4;
929
930
  offset = (UInt32)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
931
      distances + offset, maxLen) - (distances));
932
  MOVE_POS_RET
933
}
934
*/
935
936
UInt32 Hc3Zip_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
937
0
{
938
0
  unsigned offset;
939
0
  GET_MATCHES_HEADER(3)
940
0
  HASH_ZIP_CALC;
941
0
  curMatch = p->hash[hv];
942
0
  p->hash[hv] = p->pos;
943
0
  offset = (unsigned)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
944
0
      distances, 2) - (distances));
945
0
  MOVE_POS_RET
946
0
}
947
948
static void Bt2_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
949
200k
{
950
200k
  do
951
4.78M
  {
952
4.78M
    SKIP_HEADER(2)
953
4.77M
    HASH2_CALC;
954
4.77M
    curMatch = p->hash[hv];
955
4.77M
    p->hash[hv] = p->pos;
956
4.77M
    SKIP_FOOTER
957
4.77M
  }
958
4.78M
  while (--num != 0);
959
200k
}
960
961
void Bt3Zip_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
962
0
{
963
0
  do
964
0
  {
965
0
    SKIP_HEADER(3)
966
0
    HASH_ZIP_CALC;
967
0
    curMatch = p->hash[hv];
968
0
    p->hash[hv] = p->pos;
969
0
    SKIP_FOOTER
970
0
  }
971
0
  while (--num != 0);
972
0
}
973
974
static void Bt3_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
975
122k
{
976
122k
  do
977
4.15M
  {
978
4.15M
    UInt32 h2;
979
4.15M
    UInt32 *hash;
980
4.15M
    SKIP_HEADER(3)
981
4.15M
    HASH3_CALC;
982
4.15M
    hash = p->hash;
983
4.15M
    curMatch = (hash + kFix3HashSize)[hv];
984
4.15M
    hash[h2] =
985
4.15M
    (hash + kFix3HashSize)[hv] = p->pos;
986
4.15M
    SKIP_FOOTER
987
4.15M
  }
988
4.15M
  while (--num != 0);
989
122k
}
990
991
static void Bt4_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
992
1.22M
{
993
1.22M
  do
994
142M
  {
995
142M
    UInt32 h2, h3;
996
142M
    UInt32 *hash;
997
142M
    SKIP_HEADER(4)
998
142M
    HASH4_CALC;
999
142M
    hash = p->hash;
1000
142M
    curMatch = (hash + kFix4HashSize)[hv];
1001
142M
    hash                  [h2] =
1002
142M
    (hash + kFix3HashSize)[h3] =
1003
142M
    (hash + kFix4HashSize)[hv] = p->pos;
1004
142M
    SKIP_FOOTER
1005
142M
  }
1006
142M
  while (--num != 0);
1007
1.22M
}
1008
1009
/*
1010
static void Bt5_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1011
{
1012
  do
1013
  {
1014
    UInt32 h2, h3, h4;
1015
    UInt32 *hash;
1016
    SKIP_HEADER(5)
1017
    HASH5_CALC;
1018
    hash = p->hash;
1019
    curMatch = (hash + kFix5HashSize)[hv];
1020
    hash                  [h2] =
1021
    (hash + kFix3HashSize)[h3] =
1022
    (hash + kFix4HashSize)[h4] =
1023
    (hash + kFix5HashSize)[hv] = p->pos;
1024
    SKIP_FOOTER
1025
  }
1026
  while (--num != 0);
1027
}
1028
*/
1029
1030
static void Hc4_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1031
187k
{
1032
187k
  do
1033
4.38M
  {
1034
4.38M
    UInt32 h2, h3;
1035
4.38M
    UInt32 *hash;
1036
4.38M
    SKIP_HEADER(4)
1037
4.38M
    HASH4_CALC;
1038
4.38M
    hash = p->hash;
1039
4.38M
    curMatch = (hash + kFix4HashSize)[hv];
1040
4.38M
    hash                  [h2] =
1041
4.38M
    (hash + kFix3HashSize)[h3] =
1042
4.38M
    (hash + kFix4HashSize)[hv] = p->pos;
1043
4.38M
    p->son[p->cyclicBufferPos] = curMatch;
1044
4.38M
    MOVE_POS
1045
4.38M
  }
1046
4.38M
  while (--num != 0);
1047
187k
}
1048
1049
/*
1050
static void Hc5_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1051
{
1052
  do
1053
  {
1054
    UInt32 h2, h3, h4;
1055
    UInt32 *hash;
1056
    SKIP_HEADER(5)
1057
    HASH5_CALC;
1058
    hash = p->hash;
1059
    curMatch = hash + kFix5HashSize)[hv];
1060
    hash                  [h2] =
1061
    (hash + kFix3HashSize)[h3] =
1062
    (hash + kFix4HashSize)[h4] =
1063
    (hash + kFix5HashSize)[hv] = p->pos;
1064
    p->son[p->cyclicBufferPos] = curMatch;
1065
    MOVE_POS
1066
  }
1067
  while (--num != 0);
1068
}
1069
*/
1070
1071
void Hc3Zip_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1072
0
{
1073
0
  do
1074
0
  {
1075
0
    SKIP_HEADER(3)
1076
0
    HASH_ZIP_CALC;
1077
0
    curMatch = p->hash[hv];
1078
0
    p->hash[hv] = p->pos;
1079
0
    p->son[p->cyclicBufferPos] = curMatch;
1080
0
    MOVE_POS
1081
0
  }
1082
0
  while (--num != 0);
1083
0
}
1084
1085
void MatchFinder_CreateVTable(CMatchFinder *p, IMatchFinder *vTable)
1086
22.1k
{
1087
22.1k
  vTable->Init = (Mf_Init_Func)MatchFinder_Init;
1088
22.1k
  vTable->GetNumAvailableBytes = (Mf_GetNumAvailableBytes_Func)MatchFinder_GetNumAvailableBytes;
1089
22.1k
  vTable->GetPointerToCurrentPos = (Mf_GetPointerToCurrentPos_Func)MatchFinder_GetPointerToCurrentPos;
1090
22.1k
  if (!p->btMode)
1091
2.98k
  {
1092
    /* if (p->numHashBytes <= 4) */
1093
2.98k
    {
1094
2.98k
      vTable->GetMatches = (Mf_GetMatches_Func)Hc4_MatchFinder_GetMatches;
1095
2.98k
      vTable->Skip = (Mf_Skip_Func)Hc4_MatchFinder_Skip;
1096
2.98k
    }
1097
    /*
1098
    else
1099
    {
1100
      vTable->GetMatches = (Mf_GetMatches_Func)Hc5_MatchFinder_GetMatches;
1101
      vTable->Skip = (Mf_Skip_Func)Hc5_MatchFinder_Skip;
1102
    }
1103
    */
1104
2.98k
  }
1105
19.1k
  else if (p->numHashBytes == 2)
1106
6.82k
  {
1107
6.82k
    vTable->GetMatches = (Mf_GetMatches_Func)Bt2_MatchFinder_GetMatches;
1108
6.82k
    vTable->Skip = (Mf_Skip_Func)Bt2_MatchFinder_Skip;
1109
6.82k
  }
1110
12.3k
  else if (p->numHashBytes == 3)
1111
2.86k
  {
1112
2.86k
    vTable->GetMatches = (Mf_GetMatches_Func)Bt3_MatchFinder_GetMatches;
1113
2.86k
    vTable->Skip = (Mf_Skip_Func)Bt3_MatchFinder_Skip;
1114
2.86k
  }
1115
9.47k
  else /* if (p->numHashBytes == 4) */
1116
9.47k
  {
1117
9.47k
    vTable->GetMatches = (Mf_GetMatches_Func)Bt4_MatchFinder_GetMatches;
1118
9.47k
    vTable->Skip = (Mf_Skip_Func)Bt4_MatchFinder_Skip;
1119
9.47k
  }
1120
  /*
1121
  else
1122
  {
1123
    vTable->GetMatches = (Mf_GetMatches_Func)Bt5_MatchFinder_GetMatches;
1124
    vTable->Skip = (Mf_Skip_Func)Bt5_MatchFinder_Skip;
1125
  }
1126
  */
1127
22.1k
}