Coverage Report

Created: 2024-07-27 06:13

/src/lzma-fuzz/sdk/C/LzFind.c
Line
Count
Source (jump to first uncovered line)
1
/* LzFind.c -- Match finder for LZ algorithms
2
2018-07-08 : Igor Pavlov : Public domain */
3
4
#include "Precomp.h"
5
6
#include <string.h>
7
8
#include "LzFind.h"
9
#include "LzHash.h"
10
11
684M
#define kEmptyHashValue 0
12
1.70M
#define kMaxValForNormalize ((UInt32)0xFFFFFFFF)
13
0
#define kNormalizeStepMin (1 << 10) /* it must be power of 2 */
14
0
#define kNormalizeMask (~(UInt32)(kNormalizeStepMin - 1))
15
7.55k
#define kMaxHistorySize ((UInt32)7 << 29)
16
17
#define kStartMaxLen 3
18
19
static void LzInWindow_Free(CMatchFinder *p, ISzAllocPtr alloc)
20
15.1k
{
21
15.1k
  if (!p->directInput)
22
15.1k
  {
23
15.1k
    ISzAlloc_Free(alloc, p->bufferBase);
24
15.1k
    p->bufferBase = NULL;
25
15.1k
  }
26
15.1k
}
27
28
/* keepSizeBefore + keepSizeAfter + keepSizeReserv must be < 4G) */
29
30
static int LzInWindow_Create(CMatchFinder *p, UInt32 keepSizeReserv, ISzAllocPtr alloc)
31
7.55k
{
32
7.55k
  UInt32 blockSize = p->keepSizeBefore + p->keepSizeAfter + keepSizeReserv;
33
7.55k
  if (p->directInput)
34
0
  {
35
0
    p->blockSize = blockSize;
36
0
    return 1;
37
0
  }
38
7.55k
  if (!p->bufferBase || p->blockSize != blockSize)
39
7.55k
  {
40
7.55k
    LzInWindow_Free(p, alloc);
41
7.55k
    p->blockSize = blockSize;
42
7.55k
    p->bufferBase = (Byte *)ISzAlloc_Alloc(alloc, (size_t)blockSize);
43
7.55k
  }
44
7.55k
  return (p->bufferBase != NULL);
45
7.55k
}
46
47
8.30M
Byte *MatchFinder_GetPointerToCurrentPos(CMatchFinder *p) { return p->buffer; }
48
49
8.03M
UInt32 MatchFinder_GetNumAvailableBytes(CMatchFinder *p) { return p->streamPos - p->pos; }
50
51
void MatchFinder_ReduceOffsets(CMatchFinder *p, UInt32 subValue)
52
0
{
53
0
  p->posLimit -= subValue;
54
0
  p->pos -= subValue;
55
0
  p->streamPos -= subValue;
56
0
}
57
58
static void MatchFinder_ReadBlock(CMatchFinder *p)
59
8.99k
{
60
8.99k
  if (p->streamEndWasReached || p->result != SZ_OK)
61
0
    return;
62
63
  /* We use (p->streamPos - p->pos) value. (p->streamPos < p->pos) is allowed. */
64
65
8.99k
  if (p->directInput)
66
0
  {
67
0
    UInt32 curSize = 0xFFFFFFFF - (p->streamPos - p->pos);
68
0
    if (curSize > p->directInputRem)
69
0
      curSize = (UInt32)p->directInputRem;
70
0
    p->directInputRem -= curSize;
71
0
    p->streamPos += curSize;
72
0
    if (p->directInputRem == 0)
73
0
      p->streamEndWasReached = 1;
74
0
    return;
75
0
  }
76
  
77
8.99k
  for (;;)
78
15.1k
  {
79
15.1k
    Byte *dest = p->buffer + (p->streamPos - p->pos);
80
15.1k
    size_t size = (p->bufferBase + p->blockSize - dest);
81
15.1k
    if (size == 0)
82
0
      return;
83
84
15.1k
    p->result = ISeqInStream_Read(p->stream, dest, &size);
85
15.1k
    if (p->result != SZ_OK)
86
0
      return;
87
15.1k
    if (size == 0)
88
7.55k
    {
89
7.55k
      p->streamEndWasReached = 1;
90
7.55k
      return;
91
7.55k
    }
92
7.55k
    p->streamPos += (UInt32)size;
93
7.55k
    if (p->streamPos - p->pos > p->keepSizeAfter)
94
1.43k
      return;
95
7.55k
  }
96
8.99k
}
97
98
void MatchFinder_MoveBlock(CMatchFinder *p)
99
0
{
100
0
  memmove(p->bufferBase,
101
0
      p->buffer - p->keepSizeBefore,
102
0
      (size_t)(p->streamPos - p->pos) + p->keepSizeBefore);
103
0
  p->buffer = p->bufferBase + p->keepSizeBefore;
104
0
}
105
106
int MatchFinder_NeedMove(CMatchFinder *p)
107
1.43k
{
108
1.43k
  if (p->directInput)
109
0
    return 0;
110
  /* if (p->streamEndWasReached) return 0; */
111
1.43k
  return ((size_t)(p->bufferBase + p->blockSize - p->buffer) <= p->keepSizeAfter);
112
1.43k
}
113
114
void MatchFinder_ReadIfRequired(CMatchFinder *p)
115
0
{
116
0
  if (p->streamEndWasReached)
117
0
    return;
118
0
  if (p->keepSizeAfter >= p->streamPos - p->pos)
119
0
    MatchFinder_ReadBlock(p);
120
0
}
121
122
static void MatchFinder_CheckAndMoveAndRead(CMatchFinder *p)
123
1.43k
{
124
1.43k
  if (MatchFinder_NeedMove(p))
125
0
    MatchFinder_MoveBlock(p);
126
1.43k
  MatchFinder_ReadBlock(p);
127
1.43k
}
128
129
static void MatchFinder_SetDefaultSettings(CMatchFinder *p)
130
7.55k
{
131
7.55k
  p->cutValue = 32;
132
7.55k
  p->btMode = 1;
133
7.55k
  p->numHashBytes = 4;
134
7.55k
  p->bigHash = 0;
135
7.55k
}
136
137
15.4M
#define kCrcPoly 0xEDB88320
138
139
void MatchFinder_Construct(CMatchFinder *p)
140
7.55k
{
141
7.55k
  unsigned i;
142
7.55k
  p->bufferBase = NULL;
143
7.55k
  p->directInput = 0;
144
7.55k
  p->hash = NULL;
145
7.55k
  p->expectedDataSize = (UInt64)(Int64)-1;
146
7.55k
  MatchFinder_SetDefaultSettings(p);
147
148
1.94M
  for (i = 0; i < 256; i++)
149
1.93M
  {
150
1.93M
    UInt32 r = (UInt32)i;
151
1.93M
    unsigned j;
152
17.4M
    for (j = 0; j < 8; j++)
153
15.4M
      r = (r >> 1) ^ (kCrcPoly & ((UInt32)0 - (r & 1)));
154
1.93M
    p->crc[i] = r;
155
1.93M
  }
156
7.55k
}
157
158
static void MatchFinder_FreeThisClassMemory(CMatchFinder *p, ISzAllocPtr alloc)
159
15.1k
{
160
15.1k
  ISzAlloc_Free(alloc, p->hash);
161
15.1k
  p->hash = NULL;
162
15.1k
}
163
164
void MatchFinder_Free(CMatchFinder *p, ISzAllocPtr alloc)
165
7.55k
{
166
7.55k
  MatchFinder_FreeThisClassMemory(p, alloc);
167
7.55k
  LzInWindow_Free(p, alloc);
168
7.55k
}
169
170
static CLzRef* AllocRefs(size_t num, ISzAllocPtr alloc)
171
7.55k
{
172
7.55k
  size_t sizeInBytes = (size_t)num * sizeof(CLzRef);
173
7.55k
  if (sizeInBytes / sizeof(CLzRef) != num)
174
0
    return NULL;
175
7.55k
  return (CLzRef *)ISzAlloc_Alloc(alloc, sizeInBytes);
176
7.55k
}
177
178
int MatchFinder_Create(CMatchFinder *p, UInt32 historySize,
179
    UInt32 keepAddBufferBefore, UInt32 matchMaxLen, UInt32 keepAddBufferAfter,
180
    ISzAllocPtr alloc)
181
7.55k
{
182
7.55k
  UInt32 sizeReserv;
183
  
184
7.55k
  if (historySize > kMaxHistorySize)
185
0
  {
186
0
    MatchFinder_Free(p, alloc);
187
0
    return 0;
188
0
  }
189
  
190
7.55k
  sizeReserv = historySize >> 1;
191
7.55k
       if (historySize >= ((UInt32)3 << 30)) sizeReserv = historySize >> 3;
192
7.55k
  else if (historySize >= ((UInt32)2 << 30)) sizeReserv = historySize >> 2;
193
  
194
7.55k
  sizeReserv += (keepAddBufferBefore + matchMaxLen + keepAddBufferAfter) / 2 + (1 << 19);
195
196
7.55k
  p->keepSizeBefore = historySize + keepAddBufferBefore + 1;
197
7.55k
  p->keepSizeAfter = matchMaxLen + keepAddBufferAfter;
198
  
199
  /* we need one additional byte, since we use MoveBlock after pos++ and before dictionary using */
200
  
201
7.55k
  if (LzInWindow_Create(p, sizeReserv, alloc))
202
7.55k
  {
203
7.55k
    UInt32 newCyclicBufferSize = historySize + 1;
204
7.55k
    UInt32 hs;
205
7.55k
    p->matchMaxLen = matchMaxLen;
206
7.55k
    {
207
7.55k
      p->fixedHashSize = 0;
208
7.55k
      if (p->numHashBytes == 2)
209
3.39k
        hs = (1 << 16) - 1;
210
4.15k
      else
211
4.15k
      {
212
4.15k
        hs = historySize;
213
4.15k
        if (hs > p->expectedDataSize)
214
4.15k
          hs = (UInt32)p->expectedDataSize;
215
4.15k
        if (hs != 0)
216
4.15k
          hs--;
217
4.15k
        hs |= (hs >> 1);
218
4.15k
        hs |= (hs >> 2);
219
4.15k
        hs |= (hs >> 4);
220
4.15k
        hs |= (hs >> 8);
221
4.15k
        hs >>= 1;
222
4.15k
        hs |= 0xFFFF; /* don't change it! It's required for Deflate */
223
4.15k
        if (hs > (1 << 24))
224
0
        {
225
0
          if (p->numHashBytes == 3)
226
0
            hs = (1 << 24) - 1;
227
0
          else
228
0
            hs >>= 1;
229
          /* if (bigHash) mode, GetHeads4b() in LzFindMt.c needs (hs >= ((1 << 24) - 1))) */
230
0
        }
231
4.15k
      }
232
7.55k
      p->hashMask = hs;
233
7.55k
      hs++;
234
7.55k
      if (p->numHashBytes > 2) p->fixedHashSize += kHash2Size;
235
7.55k
      if (p->numHashBytes > 3) p->fixedHashSize += kHash3Size;
236
7.55k
      if (p->numHashBytes > 4) p->fixedHashSize += kHash4Size;
237
7.55k
      hs += p->fixedHashSize;
238
7.55k
    }
239
240
7.55k
    {
241
7.55k
      size_t newSize;
242
7.55k
      size_t numSons;
243
7.55k
      p->historySize = historySize;
244
7.55k
      p->hashSizeSum = hs;
245
7.55k
      p->cyclicBufferSize = newCyclicBufferSize;
246
      
247
7.55k
      numSons = newCyclicBufferSize;
248
7.55k
      if (p->btMode)
249
6.20k
        numSons <<= 1;
250
7.55k
      newSize = hs + numSons;
251
252
7.55k
      if (p->hash && p->numRefs == newSize)
253
0
        return 1;
254
      
255
7.55k
      MatchFinder_FreeThisClassMemory(p, alloc);
256
7.55k
      p->numRefs = newSize;
257
7.55k
      p->hash = AllocRefs(newSize, alloc);
258
      
259
7.55k
      if (p->hash)
260
7.55k
      {
261
7.55k
        p->son = p->hash + p->hashSizeSum;
262
7.55k
        return 1;
263
7.55k
      }
264
7.55k
    }
265
7.55k
  }
266
267
0
  MatchFinder_Free(p, alloc);
268
0
  return 0;
269
7.55k
}
270
271
static void MatchFinder_SetLimits(CMatchFinder *p)
272
855k
{
273
855k
  UInt32 limit = kMaxValForNormalize - p->pos;
274
855k
  UInt32 limit2 = p->cyclicBufferSize - p->cyclicBufferPos;
275
  
276
855k
  if (limit2 < limit)
277
855k
    limit = limit2;
278
855k
  limit2 = p->streamPos - p->pos;
279
  
280
855k
  if (limit2 <= p->keepSizeAfter)
281
854k
  {
282
854k
    if (limit2 > 0)
283
846k
      limit2 = 1;
284
854k
  }
285
1.43k
  else
286
1.43k
    limit2 -= p->keepSizeAfter;
287
  
288
855k
  if (limit2 < limit)
289
855k
    limit = limit2;
290
  
291
855k
  {
292
855k
    UInt32 lenLimit = p->streamPos - p->pos;
293
855k
    if (lenLimit > p->matchMaxLen)
294
513k
      lenLimit = p->matchMaxLen;
295
855k
    p->lenLimit = lenLimit;
296
855k
  }
297
855k
  p->posLimit = p->pos + limit;
298
855k
}
299
300
301
void MatchFinder_Init_LowHash(CMatchFinder *p)
302
7.55k
{
303
7.55k
  size_t i;
304
7.55k
  CLzRef *items = p->hash;
305
7.55k
  size_t numItems = p->fixedHashSize;
306
180M
  for (i = 0; i < numItems; i++)
307
180M
    items[i] = kEmptyHashValue;
308
7.55k
}
309
310
311
void MatchFinder_Init_HighHash(CMatchFinder *p)
312
7.55k
{
313
7.55k
  size_t i;
314
7.55k
  CLzRef *items = p->hash + p->fixedHashSize;
315
7.55k
  size_t numItems = (size_t)p->hashMask + 1;
316
495M
  for (i = 0; i < numItems; i++)
317
495M
    items[i] = kEmptyHashValue;
318
7.55k
}
319
320
321
void MatchFinder_Init_3(CMatchFinder *p, int readData)
322
7.55k
{
323
7.55k
  p->cyclicBufferPos = 0;
324
7.55k
  p->buffer = p->bufferBase;
325
7.55k
  p->pos =
326
7.55k
  p->streamPos = p->cyclicBufferSize;
327
7.55k
  p->result = SZ_OK;
328
7.55k
  p->streamEndWasReached = 0;
329
  
330
7.55k
  if (readData)
331
7.55k
    MatchFinder_ReadBlock(p);
332
  
333
7.55k
  MatchFinder_SetLimits(p);
334
7.55k
}
335
336
337
void MatchFinder_Init(CMatchFinder *p)
338
7.55k
{
339
7.55k
  MatchFinder_Init_HighHash(p);
340
7.55k
  MatchFinder_Init_LowHash(p);
341
7.55k
  MatchFinder_Init_3(p, True);
342
7.55k
}
343
344
  
345
static UInt32 MatchFinder_GetSubValue(CMatchFinder *p)
346
0
{
347
0
  return (p->pos - p->historySize - 1) & kNormalizeMask;
348
0
}
349
350
void MatchFinder_Normalize3(UInt32 subValue, CLzRef *items, size_t numItems)
351
0
{
352
0
  size_t i;
353
0
  for (i = 0; i < numItems; i++)
354
0
  {
355
0
    UInt32 value = items[i];
356
0
    if (value <= subValue)
357
0
      value = kEmptyHashValue;
358
0
    else
359
0
      value -= subValue;
360
0
    items[i] = value;
361
0
  }
362
0
}
363
364
static void MatchFinder_Normalize(CMatchFinder *p)
365
0
{
366
0
  UInt32 subValue = MatchFinder_GetSubValue(p);
367
0
  MatchFinder_Normalize3(subValue, p->hash, p->numRefs);
368
0
  MatchFinder_ReduceOffsets(p, subValue);
369
0
}
370
371
372
MY_NO_INLINE
373
static void MatchFinder_CheckLimits(CMatchFinder *p)
374
848k
{
375
848k
  if (p->pos == kMaxValForNormalize)
376
0
    MatchFinder_Normalize(p);
377
848k
  if (!p->streamEndWasReached && p->keepSizeAfter == p->streamPos - p->pos)
378
1.43k
    MatchFinder_CheckAndMoveAndRead(p);
379
848k
  if (p->cyclicBufferPos == p->cyclicBufferSize)
380
0
    p->cyclicBufferPos = 0;
381
848k
  MatchFinder_SetLimits(p);
382
848k
}
383
384
385
/*
386
  (lenLimit > maxLen)
387
*/
388
MY_FORCE_INLINE
389
static UInt32 * Hc_GetMatchesSpec(unsigned lenLimit, UInt32 curMatch, UInt32 pos, const Byte *cur, CLzRef *son,
390
    UInt32 _cyclicBufferPos, UInt32 _cyclicBufferSize, UInt32 cutValue,
391
    UInt32 *distances, unsigned maxLen)
392
384k
{
393
  /*
394
  son[_cyclicBufferPos] = curMatch;
395
  for (;;)
396
  {
397
    UInt32 delta = pos - curMatch;
398
    if (cutValue-- == 0 || delta >= _cyclicBufferSize)
399
      return distances;
400
    {
401
      const Byte *pb = cur - delta;
402
      curMatch = son[_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)];
403
      if (pb[maxLen] == cur[maxLen] && *pb == *cur)
404
      {
405
        UInt32 len = 0;
406
        while (++len != lenLimit)
407
          if (pb[len] != cur[len])
408
            break;
409
        if (maxLen < len)
410
        {
411
          maxLen = len;
412
          *distances++ = len;
413
          *distances++ = delta - 1;
414
          if (len == lenLimit)
415
            return distances;
416
        }
417
      }
418
    }
419
  }
420
  */
421
422
384k
  const Byte *lim = cur + lenLimit;
423
384k
  son[_cyclicBufferPos] = curMatch;
424
384k
  do
425
3.42M
  {
426
3.42M
    UInt32 delta = pos - curMatch;
427
3.42M
    if (delta >= _cyclicBufferSize)
428
268k
      break;
429
3.15M
    {
430
3.15M
      ptrdiff_t diff;
431
3.15M
      curMatch = son[_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)];
432
3.15M
      diff = (ptrdiff_t)0 - delta;
433
3.15M
      if (cur[maxLen] == cur[maxLen + diff])
434
420k
      {
435
420k
        const Byte *c = cur;
436
6.15M
        while (*c == c[diff])
437
5.74M
        {
438
5.74M
          if (++c == lim)
439
20.2k
          {
440
20.2k
            distances[0] = (UInt32)(lim - cur);
441
20.2k
            distances[1] = delta - 1;
442
20.2k
            return distances + 2;
443
20.2k
          }
444
5.74M
        }
445
400k
        {
446
400k
          unsigned len = (unsigned)(c - cur);
447
400k
          if (maxLen < len)
448
82.0k
          {
449
82.0k
            maxLen = len;
450
82.0k
            distances[0] = (UInt32)len;
451
82.0k
            distances[1] = delta - 1;
452
82.0k
            distances += 2;
453
82.0k
          }
454
400k
        }
455
400k
      }
456
3.15M
    }
457
3.15M
  }
458
3.13M
  while (--cutValue);
459
  
460
364k
  return distances;
461
384k
}
462
463
464
MY_FORCE_INLINE
465
UInt32 * GetMatchesSpec1(UInt32 lenLimit, UInt32 curMatch, UInt32 pos, const Byte *cur, CLzRef *son,
466
    UInt32 _cyclicBufferPos, UInt32 _cyclicBufferSize, UInt32 cutValue,
467
    UInt32 *distances, UInt32 maxLen)
468
5.72M
{
469
5.72M
  CLzRef *ptr0 = son + ((size_t)_cyclicBufferPos << 1) + 1;
470
5.72M
  CLzRef *ptr1 = son + ((size_t)_cyclicBufferPos << 1);
471
5.72M
  unsigned len0 = 0, len1 = 0;
472
5.72M
  for (;;)
473
15.4M
  {
474
15.4M
    UInt32 delta = pos - curMatch;
475
15.4M
    if (cutValue-- == 0 || delta >= _cyclicBufferSize)
476
5.61M
    {
477
5.61M
      *ptr0 = *ptr1 = kEmptyHashValue;
478
5.61M
      return distances;
479
5.61M
    }
480
9.87M
    {
481
9.87M
      CLzRef *pair = son + ((size_t)(_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)) << 1);
482
9.87M
      const Byte *pb = cur - delta;
483
9.87M
      unsigned len = (len0 < len1 ? len0 : len1);
484
9.87M
      UInt32 pair0 = pair[0];
485
9.87M
      if (pb[len] == cur[len])
486
8.94M
      {
487
8.94M
        if (++len != lenLimit && pb[len] == cur[len])
488
45.1M
          while (++len != lenLimit)
489
45.0M
            if (pb[len] != cur[len])
490
6.23M
              break;
491
8.94M
        if (maxLen < len)
492
5.03M
        {
493
5.03M
          maxLen = (UInt32)len;
494
5.03M
          *distances++ = (UInt32)len;
495
5.03M
          *distances++ = delta - 1;
496
5.03M
          if (len == lenLimit)
497
113k
          {
498
113k
            *ptr1 = pair0;
499
113k
            *ptr0 = pair[1];
500
113k
            return distances;
501
113k
          }
502
5.03M
        }
503
8.94M
      }
504
9.75M
      if (pb[len] < cur[len])
505
4.26M
      {
506
4.26M
        *ptr1 = curMatch;
507
4.26M
        ptr1 = pair + 1;
508
4.26M
        curMatch = *ptr1;
509
4.26M
        len1 = len;
510
4.26M
      }
511
5.49M
      else
512
5.49M
      {
513
5.49M
        *ptr0 = curMatch;
514
5.49M
        ptr0 = pair;
515
5.49M
        curMatch = *ptr0;
516
5.49M
        len0 = len;
517
5.49M
      }
518
9.75M
    }
519
9.75M
  }
520
5.72M
}
521
522
static void SkipMatchesSpec(UInt32 lenLimit, UInt32 curMatch, UInt32 pos, const Byte *cur, CLzRef *son,
523
    UInt32 _cyclicBufferPos, UInt32 _cyclicBufferSize, UInt32 cutValue)
524
8.05M
{
525
8.05M
  CLzRef *ptr0 = son + ((size_t)_cyclicBufferPos << 1) + 1;
526
8.05M
  CLzRef *ptr1 = son + ((size_t)_cyclicBufferPos << 1);
527
8.05M
  unsigned len0 = 0, len1 = 0;
528
8.05M
  for (;;)
529
27.3M
  {
530
27.3M
    UInt32 delta = pos - curMatch;
531
27.3M
    if (cutValue-- == 0 || delta >= _cyclicBufferSize)
532
3.88M
    {
533
3.88M
      *ptr0 = *ptr1 = kEmptyHashValue;
534
3.88M
      return;
535
3.88M
    }
536
23.5M
    {
537
23.5M
      CLzRef *pair = son + ((size_t)(_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)) << 1);
538
23.5M
      const Byte *pb = cur - delta;
539
23.5M
      unsigned len = (len0 < len1 ? len0 : len1);
540
23.5M
      if (pb[len] == cur[len])
541
20.8M
      {
542
321M
        while (++len != lenLimit)
543
317M
          if (pb[len] != cur[len])
544
16.7M
            break;
545
20.8M
        {
546
20.8M
          if (len == lenLimit)
547
4.17M
          {
548
4.17M
            *ptr1 = pair[0];
549
4.17M
            *ptr0 = pair[1];
550
4.17M
            return;
551
4.17M
          }
552
20.8M
        }
553
20.8M
      }
554
19.3M
      if (pb[len] < cur[len])
555
9.74M
      {
556
9.74M
        *ptr1 = curMatch;
557
9.74M
        ptr1 = pair + 1;
558
9.74M
        curMatch = *ptr1;
559
9.74M
        len1 = len;
560
9.74M
      }
561
9.59M
      else
562
9.59M
      {
563
9.59M
        *ptr0 = curMatch;
564
9.59M
        ptr0 = pair;
565
9.59M
        curMatch = *ptr0;
566
9.59M
        len0 = len;
567
9.59M
      }
568
19.3M
    }
569
19.3M
  }
570
8.05M
}
571
572
#define MOVE_POS \
573
15.8M
  ++p->cyclicBufferPos; \
574
15.8M
  p->buffer++; \
575
15.8M
  if (++p->pos == p->posLimit) MatchFinder_CheckLimits(p);
576
577
6.17M
#define MOVE_POS_RET MOVE_POS return (UInt32)offset;
578
579
14.2k
static void MatchFinder_MovePos(CMatchFinder *p) { MOVE_POS; }
580
581
#define GET_MATCHES_HEADER2(minLen, ret_op) \
582
15.8M
  unsigned lenLimit; UInt32 hv; const Byte *cur; UInt32 curMatch; \
583
15.8M
  lenLimit = (unsigned)p->lenLimit; { if (lenLimit < minLen) { MatchFinder_MovePos(p); ret_op; }} \
584
15.8M
  cur = p->buffer;
585
586
6.19M
#define GET_MATCHES_HEADER(minLen) GET_MATCHES_HEADER2(minLen, return 0)
587
9.70M
#define SKIP_HEADER(minLen)        GET_MATCHES_HEADER2(minLen, continue)
588
589
14.1M
#define MF_PARAMS(p) p->pos, p->buffer, p->son, p->cyclicBufferPos, p->cyclicBufferSize, p->cutValue
590
591
#define GET_MATCHES_FOOTER(offset, maxLen) \
592
5.72M
  offset = (unsigned)(GetMatchesSpec1((UInt32)lenLimit, curMatch, MF_PARAMS(p), \
593
5.72M
  distances + offset, (UInt32)maxLen) - distances); MOVE_POS_RET;
594
595
#define SKIP_FOOTER \
596
8.01M
  SkipMatchesSpec((UInt32)lenLimit, curMatch, MF_PARAMS(p)); MOVE_POS;
597
598
1.12M
#define UPDATE_maxLen { \
599
1.12M
    ptrdiff_t diff = (ptrdiff_t)0 - d2; \
600
1.12M
    const Byte *c = cur + maxLen; \
601
1.12M
    const Byte *lim = cur + lenLimit; \
602
8.72M
    for (; c != lim; c++) if (*(c + diff) != *c) break; \
603
1.12M
    maxLen = (unsigned)(c - cur); }
604
605
static UInt32 Bt2_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
606
4.48M
{
607
4.48M
  unsigned offset;
608
4.48M
  GET_MATCHES_HEADER(2)
609
4.48M
  HASH2_CALC;
610
4.48M
  curMatch = p->hash[hv];
611
4.48M
  p->hash[hv] = p->pos;
612
4.48M
  offset = 0;
613
4.48M
  GET_MATCHES_FOOTER(offset, 1)
614
0
}
615
616
UInt32 Bt3Zip_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
617
0
{
618
0
  unsigned offset;
619
0
  GET_MATCHES_HEADER(3)
620
0
  HASH_ZIP_CALC;
621
0
  curMatch = p->hash[hv];
622
0
  p->hash[hv] = p->pos;
623
0
  offset = 0;
624
0
  GET_MATCHES_FOOTER(offset, 2)
625
0
}
626
627
static UInt32 Bt3_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
628
696k
{
629
696k
  UInt32 h2, d2, pos;
630
696k
  unsigned maxLen, offset;
631
696k
  UInt32 *hash;
632
696k
  GET_MATCHES_HEADER(3)
633
634
694k
  HASH3_CALC;
635
636
694k
  hash = p->hash;
637
694k
  pos = p->pos;
638
639
694k
  d2 = pos - hash[h2];
640
641
694k
  curMatch = (hash + kFix3HashSize)[hv];
642
  
643
694k
  hash[h2] = pos;
644
694k
  (hash + kFix3HashSize)[hv] = pos;
645
646
694k
  maxLen = 2;
647
694k
  offset = 0;
648
649
694k
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
650
512k
  {
651
512k
    UPDATE_maxLen
652
512k
    distances[0] = (UInt32)maxLen;
653
512k
    distances[1] = d2 - 1;
654
512k
    offset = 2;
655
512k
    if (maxLen == lenLimit)
656
11.0k
    {
657
11.0k
      SkipMatchesSpec((UInt32)lenLimit, curMatch, MF_PARAMS(p));
658
11.0k
      MOVE_POS_RET;
659
0
    }
660
512k
  }
661
  
662
683k
  GET_MATCHES_FOOTER(offset, maxLen)
663
0
}
664
665
static UInt32 Bt4_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
666
586k
{
667
586k
  UInt32 h2, h3, d2, d3, pos;
668
586k
  unsigned maxLen, offset;
669
586k
  UInt32 *hash;
670
586k
  GET_MATCHES_HEADER(4)
671
672
583k
  HASH4_CALC;
673
674
583k
  hash = p->hash;
675
583k
  pos = p->pos;
676
677
583k
  d2 = pos - hash                  [h2];
678
583k
  d3 = pos - (hash + kFix3HashSize)[h3];
679
680
583k
  curMatch = (hash + kFix4HashSize)[hv];
681
682
583k
  hash                  [h2] = pos;
683
583k
  (hash + kFix3HashSize)[h3] = pos;
684
583k
  (hash + kFix4HashSize)[hv] = pos;
685
686
583k
  maxLen = 0;
687
583k
  offset = 0;
688
  
689
583k
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
690
354k
  {
691
354k
    maxLen = 2;
692
354k
    distances[0] = 2;
693
354k
    distances[1] = d2 - 1;
694
354k
    offset = 2;
695
354k
  }
696
  
697
583k
  if (d2 != d3 && d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
698
153k
  {
699
153k
    maxLen = 3;
700
153k
    distances[(size_t)offset + 1] = d3 - 1;
701
153k
    offset += 2;
702
153k
    d2 = d3;
703
153k
  }
704
  
705
583k
  if (offset != 0)
706
369k
  {
707
369k
    UPDATE_maxLen
708
369k
    distances[(size_t)offset - 2] = (UInt32)maxLen;
709
369k
    if (maxLen == lenLimit)
710
26.0k
    {
711
26.0k
      SkipMatchesSpec((UInt32)lenLimit, curMatch, MF_PARAMS(p));
712
26.0k
      MOVE_POS_RET;
713
0
    }
714
369k
  }
715
  
716
557k
  if (maxLen < 3)
717
283k
    maxLen = 3;
718
  
719
557k
  GET_MATCHES_FOOTER(offset, maxLen)
720
0
}
721
722
/*
723
static UInt32 Bt5_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
724
{
725
  UInt32 h2, h3, h4, d2, d3, d4, maxLen, offset, pos;
726
  UInt32 *hash;
727
  GET_MATCHES_HEADER(5)
728
729
  HASH5_CALC;
730
731
  hash = p->hash;
732
  pos = p->pos;
733
734
  d2 = pos - hash                  [h2];
735
  d3 = pos - (hash + kFix3HashSize)[h3];
736
  d4 = pos - (hash + kFix4HashSize)[h4];
737
738
  curMatch = (hash + kFix5HashSize)[hv];
739
740
  hash                  [h2] = pos;
741
  (hash + kFix3HashSize)[h3] = pos;
742
  (hash + kFix4HashSize)[h4] = pos;
743
  (hash + kFix5HashSize)[hv] = pos;
744
745
  maxLen = 0;
746
  offset = 0;
747
748
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
749
  {
750
    distances[0] = maxLen = 2;
751
    distances[1] = d2 - 1;
752
    offset = 2;
753
    if (*(cur - d2 + 2) == cur[2])
754
      distances[0] = maxLen = 3;
755
    else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
756
    {
757
      distances[2] = maxLen = 3;
758
      distances[3] = d3 - 1;
759
      offset = 4;
760
      d2 = d3;
761
    }
762
  }
763
  else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
764
  {
765
    distances[0] = maxLen = 3;
766
    distances[1] = d3 - 1;
767
    offset = 2;
768
    d2 = d3;
769
  }
770
  
771
  if (d2 != d4 && d4 < p->cyclicBufferSize
772
      && *(cur - d4) == *cur
773
      && *(cur - d4 + 3) == *(cur + 3))
774
  {
775
    maxLen = 4;
776
    distances[(size_t)offset + 1] = d4 - 1;
777
    offset += 2;
778
    d2 = d4;
779
  }
780
  
781
  if (offset != 0)
782
  {
783
    UPDATE_maxLen
784
    distances[(size_t)offset - 2] = maxLen;
785
    if (maxLen == lenLimit)
786
    {
787
      SkipMatchesSpec(lenLimit, curMatch, MF_PARAMS(p));
788
      MOVE_POS_RET;
789
    }
790
  }
791
792
  if (maxLen < 4)
793
    maxLen = 4;
794
  
795
  GET_MATCHES_FOOTER(offset, maxLen)
796
}
797
*/
798
799
static UInt32 Hc4_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
800
419k
{
801
419k
  UInt32 h2, h3, d2, d3, pos;
802
419k
  unsigned maxLen, offset;
803
419k
  UInt32 *hash;
804
419k
  GET_MATCHES_HEADER(4)
805
806
416k
  HASH4_CALC;
807
808
416k
  hash = p->hash;
809
416k
  pos = p->pos;
810
  
811
416k
  d2 = pos - hash                  [h2];
812
416k
  d3 = pos - (hash + kFix3HashSize)[h3];
813
416k
  curMatch = (hash + kFix4HashSize)[hv];
814
815
416k
  hash                  [h2] = pos;
816
416k
  (hash + kFix3HashSize)[h3] = pos;
817
416k
  (hash + kFix4HashSize)[hv] = pos;
818
819
416k
  maxLen = 0;
820
416k
  offset = 0;
821
822
416k
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
823
229k
  {
824
229k
    maxLen = 2;
825
229k
    distances[0] = 2;
826
229k
    distances[1] = d2 - 1;
827
229k
    offset = 2;
828
229k
  }
829
  
830
416k
  if (d2 != d3 && d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
831
103k
  {
832
103k
    maxLen = 3;
833
103k
    distances[(size_t)offset + 1] = d3 - 1;
834
103k
    offset += 2;
835
103k
    d2 = d3;
836
103k
  }
837
  
838
416k
  if (offset != 0)
839
238k
  {
840
238k
    UPDATE_maxLen
841
238k
    distances[(size_t)offset - 2] = (UInt32)maxLen;
842
238k
    if (maxLen == lenLimit)
843
32.1k
    {
844
32.1k
      p->son[p->cyclicBufferPos] = curMatch;
845
32.1k
      MOVE_POS_RET;
846
0
    }
847
238k
  }
848
  
849
384k
  if (maxLen < 3)
850
219k
    maxLen = 3;
851
852
384k
  offset = (unsigned)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
853
384k
      distances + offset, maxLen) - (distances));
854
384k
  MOVE_POS_RET
855
416k
}
856
857
/*
858
static UInt32 Hc5_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
859
{
860
  UInt32 h2, h3, h4, d2, d3, d4, maxLen, offset, pos
861
  UInt32 *hash;
862
  GET_MATCHES_HEADER(5)
863
864
  HASH5_CALC;
865
866
  hash = p->hash;
867
  pos = p->pos;
868
  
869
  d2 = pos - hash                  [h2];
870
  d3 = pos - (hash + kFix3HashSize)[h3];
871
  d4 = pos - (hash + kFix4HashSize)[h4];
872
873
  curMatch = (hash + kFix5HashSize)[hv];
874
875
  hash                  [h2] = pos;
876
  (hash + kFix3HashSize)[h3] = pos;
877
  (hash + kFix4HashSize)[h4] = pos;
878
  (hash + kFix5HashSize)[hv] = pos;
879
880
  maxLen = 0;
881
  offset = 0;
882
883
  if (d2 < p->cyclicBufferSize && *(cur - d2) == *cur)
884
  {
885
    distances[0] = maxLen = 2;
886
    distances[1] = d2 - 1;
887
    offset = 2;
888
    if (*(cur - d2 + 2) == cur[2])
889
      distances[0] = maxLen = 3;
890
    else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
891
    {
892
      distances[2] = maxLen = 3;
893
      distances[3] = d3 - 1;
894
      offset = 4;
895
      d2 = d3;
896
    }
897
  }
898
  else if (d3 < p->cyclicBufferSize && *(cur - d3) == *cur)
899
  {
900
    distances[0] = maxLen = 3;
901
    distances[1] = d3 - 1;
902
    offset = 2;
903
    d2 = d3;
904
  }
905
  
906
  if (d2 != d4 && d4 < p->cyclicBufferSize
907
      && *(cur - d4) == *cur
908
      && *(cur - d4 + 3) == *(cur + 3))
909
  {
910
    maxLen = 4;
911
    distances[(size_t)offset + 1] = d4 - 1;
912
    offset += 2;
913
    d2 = d4;
914
  }
915
  
916
  if (offset != 0)
917
  {
918
    UPDATE_maxLen
919
    distances[(size_t)offset - 2] = maxLen;
920
    if (maxLen == lenLimit)
921
    {
922
      p->son[p->cyclicBufferPos] = curMatch;
923
      MOVE_POS_RET;
924
    }
925
  }
926
  
927
  if (maxLen < 4)
928
    maxLen = 4;
929
930
  offset = (UInt32)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
931
      distances + offset, maxLen) - (distances));
932
  MOVE_POS_RET
933
}
934
*/
935
936
UInt32 Hc3Zip_MatchFinder_GetMatches(CMatchFinder *p, UInt32 *distances)
937
0
{
938
0
  unsigned offset;
939
0
  GET_MATCHES_HEADER(3)
940
0
  HASH_ZIP_CALC;
941
0
  curMatch = p->hash[hv];
942
0
  p->hash[hv] = p->pos;
943
0
  offset = (unsigned)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
944
0
      distances, 2) - (distances));
945
0
  MOVE_POS_RET
946
0
}
947
948
static void Bt2_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
949
153k
{
950
153k
  do
951
3.36M
  {
952
3.36M
    SKIP_HEADER(2)
953
3.36M
    HASH2_CALC;
954
3.36M
    curMatch = p->hash[hv];
955
3.36M
    p->hash[hv] = p->pos;
956
3.36M
    SKIP_FOOTER
957
3.36M
  }
958
3.36M
  while (--num != 0);
959
153k
}
960
961
void Bt3Zip_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
962
0
{
963
0
  do
964
0
  {
965
0
    SKIP_HEADER(3)
966
0
    HASH_ZIP_CALC;
967
0
    curMatch = p->hash[hv];
968
0
    p->hash[hv] = p->pos;
969
0
    SKIP_FOOTER
970
0
  }
971
0
  while (--num != 0);
972
0
}
973
974
static void Bt3_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
975
65.2k
{
976
65.2k
  do
977
2.21M
  {
978
2.21M
    UInt32 h2;
979
2.21M
    UInt32 *hash;
980
2.21M
    SKIP_HEADER(3)
981
2.21M
    HASH3_CALC;
982
2.21M
    hash = p->hash;
983
2.21M
    curMatch = (hash + kFix3HashSize)[hv];
984
2.21M
    hash[h2] =
985
2.21M
    (hash + kFix3HashSize)[hv] = p->pos;
986
2.21M
    SKIP_FOOTER
987
2.21M
  }
988
2.21M
  while (--num != 0);
989
65.2k
}
990
991
static void Bt4_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
992
69.2k
{
993
69.2k
  do
994
2.43M
  {
995
2.43M
    UInt32 h2, h3;
996
2.43M
    UInt32 *hash;
997
2.43M
    SKIP_HEADER(4)
998
2.43M
    HASH4_CALC;
999
2.43M
    hash = p->hash;
1000
2.43M
    curMatch = (hash + kFix4HashSize)[hv];
1001
2.43M
    hash                  [h2] =
1002
2.43M
    (hash + kFix3HashSize)[h3] =
1003
2.43M
    (hash + kFix4HashSize)[hv] = p->pos;
1004
2.43M
    SKIP_FOOTER
1005
2.43M
  }
1006
2.43M
  while (--num != 0);
1007
69.2k
}
1008
1009
/*
1010
static void Bt5_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1011
{
1012
  do
1013
  {
1014
    UInt32 h2, h3, h4;
1015
    UInt32 *hash;
1016
    SKIP_HEADER(5)
1017
    HASH5_CALC;
1018
    hash = p->hash;
1019
    curMatch = (hash + kFix5HashSize)[hv];
1020
    hash                  [h2] =
1021
    (hash + kFix3HashSize)[h3] =
1022
    (hash + kFix4HashSize)[h4] =
1023
    (hash + kFix5HashSize)[hv] = p->pos;
1024
    SKIP_FOOTER
1025
  }
1026
  while (--num != 0);
1027
}
1028
*/
1029
1030
static void Hc4_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1031
76.4k
{
1032
76.4k
  do
1033
1.68M
  {
1034
1.68M
    UInt32 h2, h3;
1035
1.68M
    UInt32 *hash;
1036
1.68M
    SKIP_HEADER(4)
1037
1.68M
    HASH4_CALC;
1038
1.68M
    hash = p->hash;
1039
1.68M
    curMatch = (hash + kFix4HashSize)[hv];
1040
1.68M
    hash                  [h2] =
1041
1.68M
    (hash + kFix3HashSize)[h3] =
1042
1.68M
    (hash + kFix4HashSize)[hv] = p->pos;
1043
1.68M
    p->son[p->cyclicBufferPos] = curMatch;
1044
1.68M
    MOVE_POS
1045
1.68M
  }
1046
1.68M
  while (--num != 0);
1047
76.4k
}
1048
1049
/*
1050
static void Hc5_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1051
{
1052
  do
1053
  {
1054
    UInt32 h2, h3, h4;
1055
    UInt32 *hash;
1056
    SKIP_HEADER(5)
1057
    HASH5_CALC;
1058
    hash = p->hash;
1059
    curMatch = hash + kFix5HashSize)[hv];
1060
    hash                  [h2] =
1061
    (hash + kFix3HashSize)[h3] =
1062
    (hash + kFix4HashSize)[h4] =
1063
    (hash + kFix5HashSize)[hv] = p->pos;
1064
    p->son[p->cyclicBufferPos] = curMatch;
1065
    MOVE_POS
1066
  }
1067
  while (--num != 0);
1068
}
1069
*/
1070
1071
void Hc3Zip_MatchFinder_Skip(CMatchFinder *p, UInt32 num)
1072
0
{
1073
0
  do
1074
0
  {
1075
0
    SKIP_HEADER(3)
1076
0
    HASH_ZIP_CALC;
1077
0
    curMatch = p->hash[hv];
1078
0
    p->hash[hv] = p->pos;
1079
0
    p->son[p->cyclicBufferPos] = curMatch;
1080
0
    MOVE_POS
1081
0
  }
1082
0
  while (--num != 0);
1083
0
}
1084
1085
void MatchFinder_CreateVTable(CMatchFinder *p, IMatchFinder *vTable)
1086
7.55k
{
1087
7.55k
  vTable->Init = (Mf_Init_Func)MatchFinder_Init;
1088
7.55k
  vTable->GetNumAvailableBytes = (Mf_GetNumAvailableBytes_Func)MatchFinder_GetNumAvailableBytes;
1089
7.55k
  vTable->GetPointerToCurrentPos = (Mf_GetPointerToCurrentPos_Func)MatchFinder_GetPointerToCurrentPos;
1090
7.55k
  if (!p->btMode)
1091
1.34k
  {
1092
    /* if (p->numHashBytes <= 4) */
1093
1.34k
    {
1094
1.34k
      vTable->GetMatches = (Mf_GetMatches_Func)Hc4_MatchFinder_GetMatches;
1095
1.34k
      vTable->Skip = (Mf_Skip_Func)Hc4_MatchFinder_Skip;
1096
1.34k
    }
1097
    /*
1098
    else
1099
    {
1100
      vTable->GetMatches = (Mf_GetMatches_Func)Hc5_MatchFinder_GetMatches;
1101
      vTable->Skip = (Mf_Skip_Func)Hc5_MatchFinder_Skip;
1102
    }
1103
    */
1104
1.34k
  }
1105
6.20k
  else if (p->numHashBytes == 2)
1106
3.39k
  {
1107
3.39k
    vTable->GetMatches = (Mf_GetMatches_Func)Bt2_MatchFinder_GetMatches;
1108
3.39k
    vTable->Skip = (Mf_Skip_Func)Bt2_MatchFinder_Skip;
1109
3.39k
  }
1110
2.81k
  else if (p->numHashBytes == 3)
1111
1.47k
  {
1112
1.47k
    vTable->GetMatches = (Mf_GetMatches_Func)Bt3_MatchFinder_GetMatches;
1113
1.47k
    vTable->Skip = (Mf_Skip_Func)Bt3_MatchFinder_Skip;
1114
1.47k
  }
1115
1.33k
  else /* if (p->numHashBytes == 4) */
1116
1.33k
  {
1117
1.33k
    vTable->GetMatches = (Mf_GetMatches_Func)Bt4_MatchFinder_GetMatches;
1118
1.33k
    vTable->Skip = (Mf_Skip_Func)Bt4_MatchFinder_Skip;
1119
1.33k
  }
1120
  /*
1121
  else
1122
  {
1123
    vTable->GetMatches = (Mf_GetMatches_Func)Bt5_MatchFinder_GetMatches;
1124
    vTable->Skip = (Mf_Skip_Func)Bt5_MatchFinder_Skip;
1125
  }
1126
  */
1127
7.55k
}