Coverage Report

Created: 2025-08-11 06:31

/src/lzma-fuzz/sdk/C/LzmaEnc.c
Line
Count
Source (jump to first uncovered line)
1
/* LzmaEnc.c -- LZMA Encoder
2
2019-01-10: Igor Pavlov : Public domain */
3
4
#include "Precomp.h"
5
6
#include <string.h>
7
8
/* #define SHOW_STAT */
9
/* #define SHOW_STAT2 */
10
11
#if defined(SHOW_STAT) || defined(SHOW_STAT2)
12
#include <stdio.h>
13
#endif
14
15
#include "LzmaEnc.h"
16
17
#include "LzFind.h"
18
#ifndef _7ZIP_ST
19
#include "LzFindMt.h"
20
#endif
21
22
#ifdef SHOW_STAT
23
static unsigned g_STAT_OFFSET = 0;
24
#endif
25
26
15.5k
#define kLzmaMaxHistorySize ((UInt32)3 << 29)
27
/* #define kLzmaMaxHistorySize ((UInt32)7 << 29) */
28
29
87.3M
#define kNumTopBits 24
30
87.3M
#define kTopValue ((UInt32)1 << kNumTopBits)
31
32
431M
#define kNumBitModelTotalBits 11
33
343M
#define kBitModelTotal (1 << kNumBitModelTotalBits)
34
234M
#define kNumMoveBits 5
35
146M
#define kProbInitValue (kBitModelTotal >> 1)
36
37
141M
#define kNumMoveReducingBits 4
38
2.82M
#define kNumBitPriceShiftBits 4
39
#define kBitPrice (1 << kNumBitPriceShiftBits)
40
41
26.4k
#define REP_LEN_COUNT 64
42
43
void LzmaEncProps_Init(CLzmaEncProps *p)
44
23.3k
{
45
23.3k
  p->level = 5;
46
23.3k
  p->dictSize = p->mc = 0;
47
23.3k
  p->reduceSize = (UInt64)(Int64)-1;
48
23.3k
  p->lc = p->lp = p->pb = p->algo = p->fb = p->btMode = p->numHashBytes = p->numThreads = -1;
49
23.3k
  p->writeEndMark = 0;
50
23.3k
}
51
52
void LzmaEncProps_Normalize(CLzmaEncProps *p)
53
77.8k
{
54
77.8k
  int level = p->level;
55
77.8k
  if (level < 0) level = 5;
56
77.8k
  p->level = level;
57
  
58
77.8k
  if (p->dictSize == 0) p->dictSize = (level <= 5 ? (1 << (level * 2 + 14)) : (level <= 7 ? (1 << 25) : (1 << 26)));
59
77.8k
  if (p->dictSize > p->reduceSize)
60
0
  {
61
0
    unsigned i;
62
0
    UInt32 reduceSize = (UInt32)p->reduceSize;
63
0
    for (i = 11; i <= 30; i++)
64
0
    {
65
0
      if (reduceSize <= ((UInt32)2 << i)) { p->dictSize = ((UInt32)2 << i); break; }
66
0
      if (reduceSize <= ((UInt32)3 << i)) { p->dictSize = ((UInt32)3 << i); break; }
67
0
    }
68
0
  }
69
70
77.8k
  if (p->lc < 0) p->lc = 3;
71
77.8k
  if (p->lp < 0) p->lp = 0;
72
77.8k
  if (p->pb < 0) p->pb = 2;
73
74
77.8k
  if (p->algo < 0) p->algo = (level < 5 ? 0 : 1);
75
77.8k
  if (p->fb < 0) p->fb = (level < 7 ? 32 : 64);
76
77.8k
  if (p->btMode < 0) p->btMode = (p->algo == 0 ? 0 : 1);
77
77.8k
  if (p->numHashBytes < 0) p->numHashBytes = 4;
78
77.8k
  if (p->mc == 0) p->mc = (16 + (p->fb >> 1)) >> (p->btMode ? 0 : 1);
79
  
80
77.8k
  if (p->numThreads < 0)
81
38.9k
    p->numThreads =
82
      #ifndef _7ZIP_ST
83
      ((p->btMode && p->algo) ? 2 : 1);
84
      #else
85
38.9k
      1;
86
77.8k
      #endif
87
77.8k
}
88
89
UInt32 LzmaEncProps_GetDictSize(const CLzmaEncProps *props2)
90
7.77k
{
91
7.77k
  CLzmaEncProps props = *props2;
92
7.77k
  LzmaEncProps_Normalize(&props);
93
7.77k
  return props.dictSize;
94
7.77k
}
95
96
#if (_MSC_VER >= 1400)
97
/* BSR code is fast for some new CPUs */
98
/* #define LZMA_LOG_BSR */
99
#endif
100
101
#ifdef LZMA_LOG_BSR
102
103
#define kDicLogSizeMaxCompress 32
104
105
#define BSR2_RET(pos, res) { unsigned long zz; _BitScanReverse(&zz, (pos)); res = (zz + zz) + ((pos >> (zz - 1)) & 1); }
106
107
static unsigned GetPosSlot1(UInt32 pos)
108
{
109
  unsigned res;
110
  BSR2_RET(pos, res);
111
  return res;
112
}
113
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
114
#define GetPosSlot(pos, res) { if (pos < 2) res = pos; else BSR2_RET(pos, res); }
115
116
#else
117
118
3.88M
#define kNumLogBits (9 + sizeof(size_t) / 2)
119
/* #define kNumLogBits (11 + sizeof(size_t) / 8 * 3) */
120
121
15.5k
#define kDicLogSizeMaxCompress ((kNumLogBits - 1) * 2 + 7)
122
123
static void LzmaEnc_FastPosInit(Byte *g_FastPos)
124
7.77k
{
125
7.77k
  unsigned slot;
126
7.77k
  g_FastPos[0] = 0;
127
7.77k
  g_FastPos[1] = 1;
128
7.77k
  g_FastPos += 2;
129
  
130
194k
  for (slot = 2; slot < kNumLogBits * 2; slot++)
131
186k
  {
132
186k
    size_t k = ((size_t)1 << ((slot >> 1) - 1));
133
186k
    size_t j;
134
63.8M
    for (j = 0; j < k; j++)
135
63.6M
      g_FastPos[j] = (Byte)slot;
136
186k
    g_FastPos += k;
137
186k
  }
138
7.77k
}
139
140
/* we can use ((limit - pos) >> 31) only if (pos < ((UInt32)1 << 31)) */
141
/*
142
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
143
  (0 - (((((UInt32)1 << (kNumLogBits + 6)) - 1) - pos) >> 31))); \
144
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
145
*/
146
147
/*
148
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
149
  (0 - (((((UInt32)1 << (kNumLogBits)) - 1) - (pos >> 6)) >> 31))); \
150
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
151
*/
152
153
3.67M
#define BSR2_RET(pos, res) { unsigned zz = (pos < (1 << (kNumLogBits + 6))) ? 6 : 6 + kNumLogBits - 1; \
154
3.67M
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
155
156
/*
157
#define BSR2_RET(pos, res) { res = (pos < (1 << (kNumLogBits + 6))) ? \
158
  p->g_FastPos[pos >> 6] + 12 : \
159
  p->g_FastPos[pos >> (6 + kNumLogBits - 1)] + (6 + (kNumLogBits - 1)) * 2; }
160
*/
161
162
7.86M
#define GetPosSlot1(pos) p->g_FastPos[pos]
163
3.54M
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
164
823k
#define GetPosSlot(pos, res) { if (pos < kNumFullDistances) res = p->g_FastPos[pos & (kNumFullDistances - 1)]; else BSR2_RET(pos, res); }
165
166
#endif
167
168
169
75.6M
#define LZMA_NUM_REPS 4
170
171
typedef UInt16 CState;
172
typedef UInt16 CExtra;
173
174
typedef struct
175
{
176
  UInt32 price;
177
  CState state;
178
  CExtra extra;
179
      // 0   : normal
180
      // 1   : LIT : MATCH
181
      // > 1 : MATCH (extra-1) : LIT : REP0 (len)
182
  UInt32 len;
183
  UInt32 dist;
184
  UInt32 reps[LZMA_NUM_REPS];
185
} COptimal;
186
187
188
// 18.06
189
59.3M
#define kNumOpts (1 << 11)
190
7.58M
#define kPackReserve (kNumOpts * 8)
191
// #define kNumOpts (1 << 12)
192
// #define kPackReserve (1 + kNumOpts * 2)
193
194
25.6M
#define kNumLenToPosStates 4
195
25.0M
#define kNumPosSlotBits 6
196
#define kDicLogSizeMin 0
197
139k
#define kDicLogSizeMax 32
198
#define kDistTableSizeMax (kDicLogSizeMax * 2)
199
200
4.49M
#define kNumAlignBits 4
201
4.09M
#define kAlignTableSize (1 << kNumAlignBits)
202
3.86M
#define kAlignMask (kAlignTableSize - 1)
203
204
848k
#define kStartPosModelIndex 4
205
37.1M
#define kEndPosModelIndex 14
206
37.7M
#define kNumFullDistances (1 << (kEndPosModelIndex >> 1))
207
208
typedef
209
#ifdef _LZMA_PROB32
210
  UInt32
211
#else
212
  UInt16
213
#endif
214
  CLzmaProb;
215
216
12.5M
#define LZMA_PB_MAX 4
217
31.0k
#define LZMA_LC_MAX 8
218
31.0k
#define LZMA_LP_MAX 4
219
220
12.5M
#define LZMA_NUM_PB_STATES_MAX (1 << LZMA_PB_MAX)
221
222
29.3M
#define kLenNumLowBits 3
223
18.7M
#define kLenNumLowSymbols (1 << kLenNumLowBits)
224
28.8M
#define kLenNumHighBits 8
225
24.4M
#define kLenNumHighSymbols (1 << kLenNumHighBits)
226
15.4M
#define kLenNumSymbolsTotal (kLenNumLowSymbols * 2 + kLenNumHighSymbols)
227
228
104M
#define LZMA_MATCH_LEN_MIN 2
229
15.4M
#define LZMA_MATCH_LEN_MAX (LZMA_MATCH_LEN_MIN + kLenNumSymbolsTotal - 1)
230
231
227k
#define kNumStates 12
232
233
234
typedef struct
235
{
236
  CLzmaProb low[LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1)];
237
  CLzmaProb high[kLenNumHighSymbols];
238
} CLenEnc;
239
240
241
typedef struct
242
{
243
  unsigned tableSize;
244
  UInt32 prices[LZMA_NUM_PB_STATES_MAX][kLenNumSymbolsTotal];
245
  // UInt32 prices1[LZMA_NUM_PB_STATES_MAX][kLenNumLowSymbols * 2];
246
  // UInt32 prices2[kLenNumSymbolsTotal];
247
} CLenPriceEnc;
248
249
#define GET_PRICE_LEN(p, posState, len) \
250
88.2M
    ((p)->prices[posState][(size_t)(len) - LZMA_MATCH_LEN_MIN])
251
252
/*
253
#define GET_PRICE_LEN(p, posState, len) \
254
    ((p)->prices2[(size_t)(len) - 2] + ((p)->prices1[posState][((len) - 2) & (kLenNumLowSymbols * 2 - 1)] & (((len) - 2 - kLenNumLowSymbols * 2) >> 9)))
255
*/
256
257
typedef struct
258
{
259
  UInt32 range;
260
  unsigned cache;
261
  UInt64 low;
262
  UInt64 cacheSize;
263
  Byte *buf;
264
  Byte *bufLim;
265
  Byte *bufBase;
266
  ISeqOutStream *outStream;
267
  UInt64 processed;
268
  SRes res;
269
} CRangeEnc;
270
271
272
typedef struct
273
{
274
  CLzmaProb *litProbs;
275
276
  unsigned state;
277
  UInt32 reps[LZMA_NUM_REPS];
278
279
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
280
  CLzmaProb isRep[kNumStates];
281
  CLzmaProb isRepG0[kNumStates];
282
  CLzmaProb isRepG1[kNumStates];
283
  CLzmaProb isRepG2[kNumStates];
284
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
285
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
286
287
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
288
  CLzmaProb posEncoders[kNumFullDistances];
289
  
290
  CLenEnc lenProbs;
291
  CLenEnc repLenProbs;
292
293
} CSaveState;
294
295
296
typedef UInt32 CProbPrice;
297
298
299
typedef struct
300
{
301
  void *matchFinderObj;
302
  IMatchFinder matchFinder;
303
304
  unsigned optCur;
305
  unsigned optEnd;
306
307
  unsigned longestMatchLen;
308
  unsigned numPairs;
309
  UInt32 numAvail;
310
311
  unsigned state;
312
  unsigned numFastBytes;
313
  unsigned additionalOffset;
314
  UInt32 reps[LZMA_NUM_REPS];
315
  unsigned lpMask, pbMask;
316
  CLzmaProb *litProbs;
317
  CRangeEnc rc;
318
319
  UInt32 backRes;
320
321
  unsigned lc, lp, pb;
322
  unsigned lclp;
323
324
  BoolInt fastMode;
325
  BoolInt writeEndMark;
326
  BoolInt finished;
327
  BoolInt multiThread;
328
  BoolInt needInit;
329
  // BoolInt _maxMode;
330
331
  UInt64 nowPos64;
332
  
333
  unsigned matchPriceCount;
334
  // unsigned alignPriceCount;
335
  int repLenEncCounter;
336
337
  unsigned distTableSize;
338
339
  UInt32 dictSize;
340
  SRes result;
341
342
  #ifndef _7ZIP_ST
343
  BoolInt mtMode;
344
  // begin of CMatchFinderMt is used in LZ thread
345
  CMatchFinderMt matchFinderMt;
346
  // end of CMatchFinderMt is used in BT and HASH threads
347
  #endif
348
349
  CMatchFinder matchFinderBase;
350
351
  #ifndef _7ZIP_ST
352
  Byte pad[128];
353
  #endif
354
  
355
  // LZ thread
356
  CProbPrice ProbPrices[kBitModelTotal >> kNumMoveReducingBits];
357
358
  UInt32 matches[LZMA_MATCH_LEN_MAX * 2 + 2 + 1];
359
360
  UInt32 alignPrices[kAlignTableSize];
361
  UInt32 posSlotPrices[kNumLenToPosStates][kDistTableSizeMax];
362
  UInt32 distancesPrices[kNumLenToPosStates][kNumFullDistances];
363
364
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
365
  CLzmaProb isRep[kNumStates];
366
  CLzmaProb isRepG0[kNumStates];
367
  CLzmaProb isRepG1[kNumStates];
368
  CLzmaProb isRepG2[kNumStates];
369
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
370
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
371
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
372
  CLzmaProb posEncoders[kNumFullDistances];
373
  
374
  CLenEnc lenProbs;
375
  CLenEnc repLenProbs;
376
377
  #ifndef LZMA_LOG_BSR
378
  Byte g_FastPos[1 << kNumLogBits];
379
  #endif
380
381
  CLenPriceEnc lenEnc;
382
  CLenPriceEnc repLenEnc;
383
384
  COptimal opt[kNumOpts];
385
386
  CSaveState saveState;
387
388
  #ifndef _7ZIP_ST
389
  Byte pad2[128];
390
  #endif
391
} CLzmaEnc;
392
393
394
395
176k
#define COPY_ARR(dest, src, arr) memcpy(dest->arr, src->arr, sizeof(src->arr));
396
397
void LzmaEnc_SaveState(CLzmaEncHandle pp)
398
15.6k
{
399
15.6k
  CLzmaEnc *p = (CLzmaEnc *)pp;
400
15.6k
  CSaveState *dest = &p->saveState;
401
  
402
15.6k
  dest->state = p->state;
403
  
404
15.6k
  dest->lenProbs = p->lenProbs;
405
15.6k
  dest->repLenProbs = p->repLenProbs;
406
407
15.6k
  COPY_ARR(dest, p, reps);
408
409
15.6k
  COPY_ARR(dest, p, posAlignEncoder);
410
15.6k
  COPY_ARR(dest, p, isRep);
411
15.6k
  COPY_ARR(dest, p, isRepG0);
412
15.6k
  COPY_ARR(dest, p, isRepG1);
413
15.6k
  COPY_ARR(dest, p, isRepG2);
414
15.6k
  COPY_ARR(dest, p, isMatch);
415
15.6k
  COPY_ARR(dest, p, isRep0Long);
416
15.6k
  COPY_ARR(dest, p, posSlotEncoder);
417
15.6k
  COPY_ARR(dest, p, posEncoders);
418
419
15.6k
  memcpy(dest->litProbs, p->litProbs, ((UInt32)0x300 << p->lclp) * sizeof(CLzmaProb));
420
15.6k
}
421
422
423
void LzmaEnc_RestoreState(CLzmaEncHandle pp)
424
1.97k
{
425
1.97k
  CLzmaEnc *dest = (CLzmaEnc *)pp;
426
1.97k
  const CSaveState *p = &dest->saveState;
427
428
1.97k
  dest->state = p->state;
429
430
1.97k
  dest->lenProbs = p->lenProbs;
431
1.97k
  dest->repLenProbs = p->repLenProbs;
432
  
433
1.97k
  COPY_ARR(dest, p, reps);
434
  
435
1.97k
  COPY_ARR(dest, p, posAlignEncoder);
436
1.97k
  COPY_ARR(dest, p, isRep);
437
1.97k
  COPY_ARR(dest, p, isRepG0);
438
1.97k
  COPY_ARR(dest, p, isRepG1);
439
1.97k
  COPY_ARR(dest, p, isRepG2);
440
1.97k
  COPY_ARR(dest, p, isMatch);
441
1.97k
  COPY_ARR(dest, p, isRep0Long);
442
1.97k
  COPY_ARR(dest, p, posSlotEncoder);
443
1.97k
  COPY_ARR(dest, p, posEncoders);
444
445
1.97k
  memcpy(dest->litProbs, p->litProbs, ((UInt32)0x300 << dest->lclp) * sizeof(CLzmaProb));
446
1.97k
}
447
448
449
450
SRes LzmaEnc_SetProps(CLzmaEncHandle pp, const CLzmaEncProps *props2)
451
15.5k
{
452
15.5k
  CLzmaEnc *p = (CLzmaEnc *)pp;
453
15.5k
  CLzmaEncProps props = *props2;
454
15.5k
  LzmaEncProps_Normalize(&props);
455
456
15.5k
  if (props.lc > LZMA_LC_MAX
457
15.5k
      || props.lp > LZMA_LP_MAX
458
15.5k
      || props.pb > LZMA_PB_MAX
459
15.5k
      || props.dictSize > ((UInt64)1 << kDicLogSizeMaxCompress)
460
15.5k
      || props.dictSize > kLzmaMaxHistorySize)
461
0
    return SZ_ERROR_PARAM;
462
463
15.5k
  p->dictSize = props.dictSize;
464
15.5k
  {
465
15.5k
    unsigned fb = props.fb;
466
15.5k
    if (fb < 5)
467
0
      fb = 5;
468
15.5k
    if (fb > LZMA_MATCH_LEN_MAX)
469
0
      fb = LZMA_MATCH_LEN_MAX;
470
15.5k
    p->numFastBytes = fb;
471
15.5k
  }
472
15.5k
  p->lc = props.lc;
473
15.5k
  p->lp = props.lp;
474
15.5k
  p->pb = props.pb;
475
15.5k
  p->fastMode = (props.algo == 0);
476
  // p->_maxMode = True;
477
15.5k
  p->matchFinderBase.btMode = (Byte)(props.btMode ? 1 : 0);
478
15.5k
  {
479
15.5k
    unsigned numHashBytes = 4;
480
15.5k
    if (props.btMode)
481
14.0k
    {
482
14.0k
      if (props.numHashBytes < 2)
483
0
        numHashBytes = 2;
484
14.0k
      else if (props.numHashBytes < 4)
485
4.92k
        numHashBytes = props.numHashBytes;
486
14.0k
    }
487
15.5k
    p->matchFinderBase.numHashBytes = numHashBytes;
488
15.5k
  }
489
490
15.5k
  p->matchFinderBase.cutValue = props.mc;
491
492
15.5k
  p->writeEndMark = props.writeEndMark;
493
494
  #ifndef _7ZIP_ST
495
  /*
496
  if (newMultiThread != _multiThread)
497
  {
498
    ReleaseMatchFinder();
499
    _multiThread = newMultiThread;
500
  }
501
  */
502
  p->multiThread = (props.numThreads > 1);
503
  #endif
504
505
15.5k
  return SZ_OK;
506
15.5k
}
507
508
509
void LzmaEnc_SetDataSize(CLzmaEncHandle pp, UInt64 expectedDataSiize)
510
7.77k
{
511
7.77k
  CLzmaEnc *p = (CLzmaEnc *)pp;
512
7.77k
  p->matchFinderBase.expectedDataSize = expectedDataSiize;
513
7.77k
}
514
515
516
7.77k
#define kState_Start 0
517
851k
#define kState_LitAfterMatch 4
518
1.76M
#define kState_LitAfterRep   5
519
0
#define kState_MatchAfterLit 7
520
44.5k
#define kState_RepAfterLit   8
521
522
static const Byte kLiteralNextStates[kNumStates] = {0, 0, 0, 0, 1, 2, 3, 4,  5,  6,   4, 5};
523
static const Byte kMatchNextStates[kNumStates]   = {7, 7, 7, 7, 7, 7, 7, 10, 10, 10, 10, 10};
524
static const Byte kRepNextStates[kNumStates]     = {8, 8, 8, 8, 8, 8, 8, 11, 11, 11, 11, 11};
525
static const Byte kShortRepNextStates[kNumStates]= {9, 9, 9, 9, 9, 9, 9, 11, 11, 11, 11, 11};
526
527
13.8M
#define IsLitState(s) ((s) < 7)
528
13.6M
#define GetLenToPosState2(len) (((len) < kNumLenToPosStates - 1) ? (len) : kNumLenToPosStates - 1)
529
1.44M
#define GetLenToPosState(len) (((len) < kNumLenToPosStates + 1) ? (len) - 2 : kNumLenToPosStates - 1)
530
531
48.9M
#define kInfinityPrice (1 << 30)
532
533
static void RangeEnc_Construct(CRangeEnc *p)
534
7.77k
{
535
7.77k
  p->outStream = NULL;
536
7.77k
  p->bufBase = NULL;
537
7.77k
}
538
539
#define RangeEnc_GetProcessed(p)       ((p)->processed + ((p)->buf - (p)->bufBase) + (p)->cacheSize)
540
7.58M
#define RangeEnc_GetProcessed_sizet(p) ((size_t)(p)->processed + ((p)->buf - (p)->bufBase) + (size_t)(p)->cacheSize)
541
542
7.77k
#define RC_BUF_SIZE (1 << 16)
543
544
static int RangeEnc_Alloc(CRangeEnc *p, ISzAllocPtr alloc)
545
7.77k
{
546
7.77k
  if (!p->bufBase)
547
7.77k
  {
548
7.77k
    p->bufBase = (Byte *)ISzAlloc_Alloc(alloc, RC_BUF_SIZE);
549
7.77k
    if (!p->bufBase)
550
0
      return 0;
551
7.77k
    p->bufLim = p->bufBase + RC_BUF_SIZE;
552
7.77k
  }
553
7.77k
  return 1;
554
7.77k
}
555
556
static void RangeEnc_Free(CRangeEnc *p, ISzAllocPtr alloc)
557
7.77k
{
558
7.77k
  ISzAlloc_Free(alloc, p->bufBase);
559
7.77k
  p->bufBase = 0;
560
7.77k
}
561
562
static void RangeEnc_Init(CRangeEnc *p)
563
33.1k
{
564
  /* Stream.Init(); */
565
33.1k
  p->range = 0xFFFFFFFF;
566
33.1k
  p->cache = 0;
567
33.1k
  p->low = 0;
568
33.1k
  p->cacheSize = 0;
569
570
33.1k
  p->buf = p->bufBase;
571
572
33.1k
  p->processed = 0;
573
33.1k
  p->res = SZ_OK;
574
33.1k
}
575
576
MY_NO_INLINE static void RangeEnc_FlushStream(CRangeEnc *p)
577
15.6k
{
578
15.6k
  size_t num;
579
15.6k
  if (p->res != SZ_OK)
580
0
    return;
581
15.6k
  num = p->buf - p->bufBase;
582
15.6k
  if (num != ISeqOutStream_Write(p->outStream, p->bufBase, num))
583
0
    p->res = SZ_ERROR_WRITE;
584
15.6k
  p->processed += num;
585
15.6k
  p->buf = p->bufBase;
586
15.6k
}
587
588
MY_NO_INLINE static void MY_FAST_CALL RangeEnc_ShiftLow(CRangeEnc *p)
589
9.12M
{
590
9.12M
  UInt32 low = (UInt32)p->low;
591
9.12M
  unsigned high = (unsigned)(p->low >> 32);
592
9.12M
  p->low = (UInt32)(low << 8);
593
9.12M
  if (low < (UInt32)0xFF000000 || high != 0)
594
9.08M
  {
595
9.08M
    {
596
9.08M
      Byte *buf = p->buf;
597
9.08M
      *buf++ = (Byte)(p->cache + high);
598
9.08M
      p->cache = (unsigned)(low >> 24);
599
9.08M
      p->buf = buf;
600
9.08M
      if (buf == p->bufLim)
601
0
        RangeEnc_FlushStream(p);
602
9.08M
      if (p->cacheSize == 0)
603
9.04M
        return;
604
9.08M
    }
605
36.1k
    high += 0xFF;
606
36.1k
    for (;;)
607
36.4k
    {
608
36.4k
      Byte *buf = p->buf;
609
36.4k
      *buf++ = (Byte)(high);
610
36.4k
      p->buf = buf;
611
36.4k
      if (buf == p->bufLim)
612
0
        RangeEnc_FlushStream(p);
613
36.4k
      if (--p->cacheSize == 0)
614
36.1k
        return;
615
36.4k
    }
616
36.1k
  }
617
36.4k
  p->cacheSize++;
618
36.4k
}
619
620
static void RangeEnc_FlushData(CRangeEnc *p)
621
15.6k
{
622
15.6k
  int i;
623
93.8k
  for (i = 0; i < 5; i++)
624
78.1k
    RangeEnc_ShiftLow(p);
625
15.6k
}
626
627
87.3M
#define RC_NORM(p) if (range < kTopValue) { range <<= 8; RangeEnc_ShiftLow(p); }
628
629
#define RC_BIT_PRE(p, prob) \
630
86.7M
  ttt = *(prob); \
631
86.7M
  newBound = (range >> kNumBitModelTotalBits) * ttt;
632
633
// #define _LZMA_ENC_USE_BRANCH
634
635
#ifdef _LZMA_ENC_USE_BRANCH
636
637
#define RC_BIT(p, prob, bit) { \
638
  RC_BIT_PRE(p, prob) \
639
  if (bit == 0) { range = newBound; ttt += (kBitModelTotal - ttt) >> kNumMoveBits; } \
640
  else { (p)->low += newBound; range -= newBound; ttt -= ttt >> kNumMoveBits; } \
641
  *(prob) = (CLzmaProb)ttt; \
642
  RC_NORM(p) \
643
  }
644
645
#else
646
647
73.6M
#define RC_BIT(p, prob, bit) { \
648
73.6M
  UInt32 mask; \
649
73.6M
  RC_BIT_PRE(p, prob) \
650
73.6M
  mask = 0 - (UInt32)bit; \
651
73.6M
  range &= mask; \
652
73.6M
  mask &= newBound; \
653
73.6M
  range -= mask; \
654
73.6M
  (p)->low += mask; \
655
73.6M
  mask = (UInt32)bit - 1; \
656
73.6M
  range += newBound & mask; \
657
73.6M
  mask &= (kBitModelTotal - ((1 << kNumMoveBits) - 1)); \
658
73.6M
  mask += ((1 << kNumMoveBits) - 1); \
659
73.6M
  ttt += (Int32)(mask - ttt) >> kNumMoveBits; \
660
73.6M
  *(prob) = (CLzmaProb)ttt; \
661
73.6M
  RC_NORM(p) \
662
73.6M
  }
663
664
#endif
665
666
667
668
669
#define RC_BIT_0_BASE(p, prob) \
670
10.3M
  range = newBound; *(prob) = (CLzmaProb)(ttt + ((kBitModelTotal - ttt) >> kNumMoveBits));
671
672
#define RC_BIT_1_BASE(p, prob) \
673
2.74M
  range -= newBound; (p)->low += newBound; *(prob) = (CLzmaProb)(ttt - (ttt >> kNumMoveBits)); \
674
675
#define RC_BIT_0(p, prob) \
676
10.0M
  RC_BIT_0_BASE(p, prob) \
677
10.0M
  RC_NORM(p)
678
679
#define RC_BIT_1(p, prob) \
680
2.57M
  RC_BIT_1_BASE(p, prob) \
681
2.57M
  RC_NORM(p)
682
683
static void RangeEnc_EncodeBit_0(CRangeEnc *p, CLzmaProb *prob)
684
7.77k
{
685
7.77k
  UInt32 range, ttt, newBound;
686
7.77k
  range = p->range;
687
7.77k
  RC_BIT_PRE(p, prob)
688
7.77k
  RC_BIT_0(p, prob)
689
7.77k
  p->range = range;
690
7.77k
}
691
692
static void LitEnc_Encode(CRangeEnc *p, CLzmaProb *probs, UInt32 sym)
693
7.64M
{
694
7.64M
  UInt32 range = p->range;
695
7.64M
  sym |= 0x100;
696
7.64M
  do
697
61.1M
  {
698
61.1M
    UInt32 ttt, newBound;
699
    // RangeEnc_EncodeBit(p, probs + (sym >> 8), (sym >> 7) & 1);
700
61.1M
    CLzmaProb *prob = probs + (sym >> 8);
701
61.1M
    UInt32 bit = (sym >> 7) & 1;
702
61.1M
    sym <<= 1;
703
61.1M
    RC_BIT(p, prob, bit);
704
61.1M
  }
705
61.1M
  while (sym < 0x10000);
706
7.64M
  p->range = range;
707
7.64M
}
708
709
static void LitEnc_EncodeMatched(CRangeEnc *p, CLzmaProb *probs, UInt32 sym, UInt32 matchByte)
710
326k
{
711
326k
  UInt32 range = p->range;
712
326k
  UInt32 offs = 0x100;
713
326k
  sym |= 0x100;
714
326k
  do
715
2.61M
  {
716
2.61M
    UInt32 ttt, newBound;
717
2.61M
    CLzmaProb *prob;
718
2.61M
    UInt32 bit;
719
2.61M
    matchByte <<= 1;
720
    // RangeEnc_EncodeBit(p, probs + (offs + (matchByte & offs) + (sym >> 8)), (sym >> 7) & 1);
721
2.61M
    prob = probs + (offs + (matchByte & offs) + (sym >> 8));
722
2.61M
    bit = (sym >> 7) & 1;
723
2.61M
    sym <<= 1;
724
2.61M
    offs &= ~(matchByte ^ sym);
725
2.61M
    RC_BIT(p, prob, bit);
726
2.61M
  }
727
2.61M
  while (sym < 0x10000);
728
326k
  p->range = range;
729
326k
}
730
731
732
733
static void LzmaEnc_InitPriceTables(CProbPrice *ProbPrices)
734
7.77k
{
735
7.77k
  UInt32 i;
736
1.00M
  for (i = 0; i < (kBitModelTotal >> kNumMoveReducingBits); i++)
737
994k
  {
738
994k
    const unsigned kCyclesBits = kNumBitPriceShiftBits;
739
994k
    UInt32 w = (i << kNumMoveReducingBits) + (1 << (kNumMoveReducingBits - 1));
740
994k
    unsigned bitCount = 0;
741
994k
    unsigned j;
742
4.97M
    for (j = 0; j < kCyclesBits; j++)
743
3.97M
    {
744
3.97M
      w = w * w;
745
3.97M
      bitCount <<= 1;
746
53.5M
      while (w >= ((UInt32)1 << 16))
747
49.6M
      {
748
49.6M
        w >>= 1;
749
49.6M
        bitCount++;
750
49.6M
      }
751
3.97M
    }
752
994k
    ProbPrices[i] = (CProbPrice)((kNumBitModelTotalBits << kCyclesBits) - 15 - bitCount);
753
    // printf("\n%3d: %5d", i, ProbPrices[i]);
754
994k
  }
755
7.77k
}
756
757
758
#define GET_PRICE(prob, bit) \
759
2.00M
  p->ProbPrices[((prob) ^ (unsigned)(((-(int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits];
760
761
#define GET_PRICEa(prob, bit) \
762
76.0M
     ProbPrices[((prob) ^ (unsigned)((-((int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits];
763
764
15.7M
#define GET_PRICE_0(prob) p->ProbPrices[(prob) >> kNumMoveReducingBits]
765
23.9M
#define GET_PRICE_1(prob) p->ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
766
767
10.1M
#define GET_PRICEa_0(prob) ProbPrices[(prob) >> kNumMoveReducingBits]
768
10.1M
#define GET_PRICEa_1(prob) ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
769
770
771
static UInt32 LitEnc_GetPrice(const CLzmaProb *probs, UInt32 sym, const CProbPrice *ProbPrices)
772
1.04M
{
773
1.04M
  UInt32 price = 0;
774
1.04M
  sym |= 0x100;
775
1.04M
  do
776
8.37M
  {
777
8.37M
    unsigned bit = sym & 1;
778
8.37M
    sym >>= 1;
779
8.37M
    price += GET_PRICEa(probs[sym], bit);
780
8.37M
  }
781
8.37M
  while (sym >= 2);
782
1.04M
  return price;
783
1.04M
}
784
785
786
static UInt32 LitEnc_Matched_GetPrice(const CLzmaProb *probs, UInt32 sym, UInt32 matchByte, const CProbPrice *ProbPrices)
787
3.41M
{
788
3.41M
  UInt32 price = 0;
789
3.41M
  UInt32 offs = 0x100;
790
3.41M
  sym |= 0x100;
791
3.41M
  do
792
27.3M
  {
793
27.3M
    matchByte <<= 1;
794
27.3M
    price += GET_PRICEa(probs[offs + (matchByte & offs) + (sym >> 8)], (sym >> 7) & 1);
795
27.3M
    sym <<= 1;
796
27.3M
    offs &= ~(matchByte ^ sym);
797
27.3M
  }
798
27.3M
  while (sym < 0x10000);
799
3.41M
  return price;
800
3.41M
}
801
802
803
static void RcTree_ReverseEncode(CRangeEnc *rc, CLzmaProb *probs, unsigned numBits, unsigned sym)
804
409k
{
805
409k
  UInt32 range = rc->range;
806
409k
  unsigned m = 1;
807
409k
  do
808
874k
  {
809
874k
    UInt32 ttt, newBound;
810
874k
    unsigned bit = sym & 1;
811
    // RangeEnc_EncodeBit(rc, probs + m, bit);
812
874k
    sym >>= 1;
813
874k
    RC_BIT(rc, probs + m, bit);
814
874k
    m = (m << 1) | bit;
815
874k
  }
816
874k
  while (--numBits);
817
409k
  rc->range = range;
818
409k
}
819
820
821
822
static void LenEnc_Init(CLenEnc *p)
823
35.0k
{
824
35.0k
  unsigned i;
825
8.99M
  for (i = 0; i < (LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1)); i++)
826
8.96M
    p->low[i] = kProbInitValue;
827
8.99M
  for (i = 0; i < kLenNumHighSymbols; i++)
828
8.96M
    p->high[i] = kProbInitValue;
829
35.0k
}
830
831
static void LenEnc_Encode(CLenEnc *p, CRangeEnc *rc, unsigned sym, unsigned posState)
832
1.26M
{
833
1.26M
  UInt32 range, ttt, newBound;
834
1.26M
  CLzmaProb *probs = p->low;
835
1.26M
  range = rc->range;
836
1.26M
  RC_BIT_PRE(rc, probs);
837
1.26M
  if (sym >= kLenNumLowSymbols)
838
135k
  {
839
135k
    RC_BIT_1(rc, probs);
840
135k
    probs += kLenNumLowSymbols;
841
135k
    RC_BIT_PRE(rc, probs);
842
135k
    if (sym >= kLenNumLowSymbols * 2)
843
88.5k
    {
844
88.5k
      RC_BIT_1(rc, probs);
845
88.5k
      rc->range = range;
846
      // RcTree_Encode(rc, p->high, kLenNumHighBits, sym - kLenNumLowSymbols * 2);
847
88.5k
      LitEnc_Encode(rc, p->high, sym - kLenNumLowSymbols * 2);
848
88.5k
      return;
849
88.5k
    }
850
47.0k
    sym -= kLenNumLowSymbols;
851
47.0k
  }
852
853
  // RcTree_Encode(rc, probs + (posState << kLenNumLowBits), kLenNumLowBits, sym);
854
1.17M
  {
855
1.17M
    unsigned m;
856
1.17M
    unsigned bit;
857
1.17M
    RC_BIT_0(rc, probs);
858
1.17M
    probs += (posState << (1 + kLenNumLowBits));
859
1.17M
    bit = (sym >> 2)    ; RC_BIT(rc, probs + 1, bit); m = (1 << 1) + bit;
860
1.17M
    bit = (sym >> 1) & 1; RC_BIT(rc, probs + m, bit); m = (m << 1) + bit;
861
1.17M
    bit =  sym       & 1; RC_BIT(rc, probs + m, bit);
862
1.17M
    rc->range = range;
863
1.17M
  }
864
1.17M
}
865
866
static void SetPrices_3(const CLzmaProb *probs, UInt32 startPrice, UInt32 *prices, const CProbPrice *ProbPrices)
867
915k
{
868
915k
  unsigned i;
869
4.57M
  for (i = 0; i < 8; i += 2)
870
3.66M
  {
871
3.66M
    UInt32 price = startPrice;
872
3.66M
    UInt32 prob;
873
3.66M
    price += GET_PRICEa(probs[1           ], (i >> 2));
874
3.66M
    price += GET_PRICEa(probs[2 + (i >> 2)], (i >> 1) & 1);
875
3.66M
    prob = probs[4 + (i >> 1)];
876
3.66M
    prices[i    ] = price + GET_PRICEa_0(prob);
877
3.66M
    prices[i + 1] = price + GET_PRICEa_1(prob);
878
3.66M
  }
879
915k
}
880
881
882
MY_NO_INLINE static void MY_FAST_CALL LenPriceEnc_UpdateTables(
883
    CLenPriceEnc *p,
884
    unsigned numPosStates,
885
    const CLenEnc *enc,
886
    const CProbPrice *ProbPrices)
887
59.0k
{
888
59.0k
  UInt32 b;
889
 
890
59.0k
  {
891
59.0k
    unsigned prob = enc->low[0];
892
59.0k
    UInt32 a, c;
893
59.0k
    unsigned posState;
894
59.0k
    b = GET_PRICEa_1(prob);
895
59.0k
    a = GET_PRICEa_0(prob);
896
59.0k
    c = b + GET_PRICEa_0(enc->low[kLenNumLowSymbols]);
897
516k
    for (posState = 0; posState < numPosStates; posState++)
898
457k
    {
899
457k
      UInt32 *prices = p->prices[posState];
900
457k
      const CLzmaProb *probs = enc->low + (posState << (1 + kLenNumLowBits));
901
457k
      SetPrices_3(probs, a, prices, ProbPrices);
902
457k
      SetPrices_3(probs + kLenNumLowSymbols, c, prices + kLenNumLowSymbols, ProbPrices);
903
457k
    }
904
59.0k
  }
905
906
  /*
907
  {
908
    unsigned i;
909
    UInt32 b;
910
    a = GET_PRICEa_0(enc->low[0]);
911
    for (i = 0; i < kLenNumLowSymbols; i++)
912
      p->prices2[i] = a;
913
    a = GET_PRICEa_1(enc->low[0]);
914
    b = a + GET_PRICEa_0(enc->low[kLenNumLowSymbols]);
915
    for (i = kLenNumLowSymbols; i < kLenNumLowSymbols * 2; i++)
916
      p->prices2[i] = b;
917
    a += GET_PRICEa_1(enc->low[kLenNumLowSymbols]);
918
  }
919
  */
920
 
921
  // p->counter = numSymbols;
922
  // p->counter = 64;
923
924
59.0k
  {
925
59.0k
    unsigned i = p->tableSize;
926
    
927
59.0k
    if (i > kLenNumLowSymbols * 2)
928
33.6k
    {
929
33.6k
      const CLzmaProb *probs = enc->high;
930
33.6k
      UInt32 *prices = p->prices[0] + kLenNumLowSymbols * 2;
931
33.6k
      i -= kLenNumLowSymbols * 2 - 1;
932
33.6k
      i >>= 1;
933
33.6k
      b += GET_PRICEa_1(enc->low[kLenNumLowSymbols]);
934
33.6k
      do
935
2.18M
      {
936
        /*
937
        p->prices2[i] = a +
938
        // RcTree_GetPrice(enc->high, kLenNumHighBits, i - kLenNumLowSymbols * 2, ProbPrices);
939
        LitEnc_GetPrice(probs, i - kLenNumLowSymbols * 2, ProbPrices);
940
        */
941
        // UInt32 price = a + RcTree_GetPrice(probs, kLenNumHighBits - 1, sym, ProbPrices);
942
2.18M
        unsigned sym = --i + (1 << (kLenNumHighBits - 1));
943
2.18M
        UInt32 price = b;
944
2.18M
        do
945
15.3M
        {
946
15.3M
          unsigned bit = sym & 1;
947
15.3M
          sym >>= 1;
948
15.3M
          price += GET_PRICEa(probs[sym], bit);
949
15.3M
        }
950
15.3M
        while (sym >= 2);
951
952
2.18M
        {
953
2.18M
          unsigned prob = probs[(size_t)i + (1 << (kLenNumHighBits - 1))];
954
2.18M
          prices[(size_t)i * 2    ] = price + GET_PRICEa_0(prob);
955
2.18M
          prices[(size_t)i * 2 + 1] = price + GET_PRICEa_1(prob);
956
2.18M
        }
957
2.18M
      }
958
2.18M
      while (i);
959
960
33.6k
      {
961
33.6k
        unsigned posState;
962
33.6k
        size_t num = (p->tableSize - kLenNumLowSymbols * 2) * sizeof(p->prices[0][0]);
963
318k
        for (posState = 1; posState < numPosStates; posState++)
964
284k
          memcpy(p->prices[posState] + kLenNumLowSymbols * 2, p->prices[0] + kLenNumLowSymbols * 2, num);
965
33.6k
      }
966
33.6k
    }
967
59.0k
  }
968
59.0k
}
969
970
/*
971
  #ifdef SHOW_STAT
972
  g_STAT_OFFSET += num;
973
  printf("\n MovePos %u", num);
974
  #endif
975
*/
976
  
977
278k
#define MOVE_POS(p, num) { \
978
278k
    p->additionalOffset += (num); \
979
278k
    p->matchFinder.Skip(p->matchFinderObj, (UInt32)(num)); }
980
981
982
static unsigned ReadMatchDistances(CLzmaEnc *p, unsigned *numPairsRes)
983
11.9M
{
984
11.9M
  unsigned numPairs;
985
  
986
11.9M
  p->additionalOffset++;
987
11.9M
  p->numAvail = p->matchFinder.GetNumAvailableBytes(p->matchFinderObj);
988
11.9M
  numPairs = p->matchFinder.GetMatches(p->matchFinderObj, p->matches);
989
11.9M
  *numPairsRes = numPairs;
990
  
991
  #ifdef SHOW_STAT
992
  printf("\n i = %u numPairs = %u    ", g_STAT_OFFSET, numPairs / 2);
993
  g_STAT_OFFSET++;
994
  {
995
    unsigned i;
996
    for (i = 0; i < numPairs; i += 2)
997
      printf("%2u %6u   | ", p->matches[i], p->matches[i + 1]);
998
  }
999
  #endif
1000
  
1001
11.9M
  if (numPairs == 0)
1002
6.98M
    return 0;
1003
4.92M
  {
1004
4.92M
    unsigned len = p->matches[(size_t)numPairs - 2];
1005
4.92M
    if (len != p->numFastBytes)
1006
4.75M
      return len;
1007
161k
    {
1008
161k
      UInt32 numAvail = p->numAvail;
1009
161k
      if (numAvail > LZMA_MATCH_LEN_MAX)
1010
150k
        numAvail = LZMA_MATCH_LEN_MAX;
1011
161k
      {
1012
161k
        const Byte *p1 = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1013
161k
        const Byte *p2 = p1 + len;
1014
161k
        ptrdiff_t dif = (ptrdiff_t)-1 - p->matches[(size_t)numPairs - 1];
1015
161k
        const Byte *lim = p1 + numAvail;
1016
4.51M
        for (; p2 != lim && *p2 == p2[dif]; p2++)
1017
4.35M
        {}
1018
161k
        return (unsigned)(p2 - p1);
1019
4.92M
      }
1020
4.92M
    }
1021
4.92M
  }
1022
4.92M
}
1023
1024
17.6M
#define MARK_LIT ((UInt32)(Int32)-1)
1025
1026
1.32M
#define MakeAs_Lit(p)       { (p)->dist = MARK_LIT; (p)->extra = 0; }
1027
109k
#define MakeAs_ShortRep(p)  { (p)->dist = 0; (p)->extra = 0; }
1028
1.04M
#define IsShortRep(p)       ((p)->dist == 0)
1029
1030
1031
#define GetPrice_ShortRep(p, state, posState) \
1032
134k
  ( GET_PRICE_0(p->isRepG0[state]) + GET_PRICE_0(p->isRep0Long[state][posState]))
1033
1034
2.72M
#define GetPrice_Rep_0(p, state, posState) ( \
1035
2.72M
    GET_PRICE_1(p->isMatch[state][posState]) \
1036
2.72M
  + GET_PRICE_1(p->isRep0Long[state][posState])) \
1037
2.72M
  + GET_PRICE_1(p->isRep[state]) \
1038
2.72M
  + GET_PRICE_0(p->isRepG0[state])
1039
  
1040
MY_FORCE_INLINE
1041
static UInt32 GetPrice_PureRep(const CLzmaEnc *p, unsigned repIndex, size_t state, size_t posState)
1042
4.58M
{
1043
4.58M
  UInt32 price;
1044
4.58M
  UInt32 prob = p->isRepG0[state];
1045
4.58M
  if (repIndex == 0)
1046
1.50M
  {
1047
1.50M
    price = GET_PRICE_0(prob);
1048
1.50M
    price += GET_PRICE_1(p->isRep0Long[state][posState]);
1049
1.50M
  }
1050
3.08M
  else
1051
3.08M
  {
1052
3.08M
    price = GET_PRICE_1(prob);
1053
3.08M
    prob = p->isRepG1[state];
1054
3.08M
    if (repIndex == 1)
1055
1.07M
      price += GET_PRICE_0(prob);
1056
2.00M
    else
1057
2.00M
    {
1058
2.00M
      price += GET_PRICE_1(prob);
1059
2.00M
      price += GET_PRICE(p->isRepG2[state], repIndex - 2);
1060
2.00M
    }
1061
3.08M
  }
1062
4.58M
  return price;
1063
4.58M
}
1064
1065
1066
static unsigned Backward(CLzmaEnc *p, unsigned cur)
1067
416k
{
1068
416k
  unsigned wr = cur + 1;
1069
416k
  p->optEnd = wr;
1070
1071
416k
  for (;;)
1072
1.90M
  {
1073
1.90M
    UInt32 dist = p->opt[cur].dist;
1074
1.90M
    unsigned len = (unsigned)p->opt[cur].len;
1075
1.90M
    unsigned extra = (unsigned)p->opt[cur].extra;
1076
1.90M
    cur -= len;
1077
1078
1.90M
    if (extra)
1079
22.0k
    {
1080
22.0k
      wr--;
1081
22.0k
      p->opt[wr].len = (UInt32)len;
1082
22.0k
      cur -= extra;
1083
22.0k
      len = extra;
1084
22.0k
      if (extra == 1)
1085
566
      {
1086
566
        p->opt[wr].dist = dist;
1087
566
        dist = MARK_LIT;
1088
566
      }
1089
21.4k
      else
1090
21.4k
      {
1091
21.4k
        p->opt[wr].dist = 0;
1092
21.4k
        len--;
1093
21.4k
        wr--;
1094
21.4k
        p->opt[wr].dist = MARK_LIT;
1095
21.4k
        p->opt[wr].len = 1;
1096
21.4k
      }
1097
22.0k
    }
1098
1099
1.90M
    if (cur == 0)
1100
416k
    {
1101
416k
      p->backRes = dist;
1102
416k
      p->optCur = wr;
1103
416k
      return len;
1104
416k
    }
1105
    
1106
1.48M
    wr--;
1107
1.48M
    p->opt[wr].dist = dist;
1108
1.48M
    p->opt[wr].len = (UInt32)len;
1109
1.48M
  }
1110
416k
}
1111
1112
1113
1114
#define LIT_PROBS(pos, prevByte) \
1115
12.3M
  (p->litProbs + (UInt32)3 * (((((pos) << 8) + (prevByte)) & p->lpMask) << p->lc))
1116
1117
1118
static unsigned GetOptimum(CLzmaEnc *p, UInt32 position)
1119
3.58M
{
1120
3.58M
  unsigned last, cur;
1121
3.58M
  UInt32 reps[LZMA_NUM_REPS];
1122
3.58M
  unsigned repLens[LZMA_NUM_REPS];
1123
3.58M
  UInt32 *matches;
1124
1125
3.58M
  {
1126
3.58M
    UInt32 numAvail;
1127
3.58M
    unsigned numPairs, mainLen, repMaxIndex, i, posState;
1128
3.58M
    UInt32 matchPrice, repMatchPrice;
1129
3.58M
    const Byte *data;
1130
3.58M
    Byte curByte, matchByte;
1131
    
1132
3.58M
    p->optCur = p->optEnd = 0;
1133
    
1134
3.58M
    if (p->additionalOffset == 0)
1135
3.55M
      mainLen = ReadMatchDistances(p, &numPairs);
1136
35.4k
    else
1137
35.4k
    {
1138
35.4k
      mainLen = p->longestMatchLen;
1139
35.4k
      numPairs = p->numPairs;
1140
35.4k
    }
1141
    
1142
3.58M
    numAvail = p->numAvail;
1143
3.58M
    if (numAvail < 2)
1144
1.89k
    {
1145
1.89k
      p->backRes = MARK_LIT;
1146
1.89k
      return 1;
1147
1.89k
    }
1148
3.58M
    if (numAvail > LZMA_MATCH_LEN_MAX)
1149
3.45M
      numAvail = LZMA_MATCH_LEN_MAX;
1150
    
1151
3.58M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1152
3.58M
    repMaxIndex = 0;
1153
    
1154
17.9M
    for (i = 0; i < LZMA_NUM_REPS; i++)
1155
14.3M
    {
1156
14.3M
      unsigned len;
1157
14.3M
      const Byte *data2;
1158
14.3M
      reps[i] = p->reps[i];
1159
14.3M
      data2 = data - reps[i];
1160
14.3M
      if (data[0] != data2[0] || data[1] != data2[1])
1161
14.1M
      {
1162
14.1M
        repLens[i] = 0;
1163
14.1M
        continue;
1164
14.1M
      }
1165
4.48M
      for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1166
4.32M
      {}
1167
157k
      repLens[i] = len;
1168
157k
      if (len > repLens[repMaxIndex])
1169
83.6k
        repMaxIndex = i;
1170
157k
    }
1171
    
1172
3.58M
    if (repLens[repMaxIndex] >= p->numFastBytes)
1173
53.0k
    {
1174
53.0k
      unsigned len;
1175
53.0k
      p->backRes = (UInt32)repMaxIndex;
1176
53.0k
      len = repLens[repMaxIndex];
1177
53.0k
      MOVE_POS(p, len - 1)
1178
53.0k
      return len;
1179
53.0k
    }
1180
    
1181
3.53M
    matches = p->matches;
1182
    
1183
3.53M
    if (mainLen >= p->numFastBytes)
1184
50.5k
    {
1185
50.5k
      p->backRes = matches[(size_t)numPairs - 1] + LZMA_NUM_REPS;
1186
50.5k
      MOVE_POS(p, mainLen - 1)
1187
50.5k
      return mainLen;
1188
50.5k
    }
1189
    
1190
3.48M
    curByte = *data;
1191
3.48M
    matchByte = *(data - reps[0]);
1192
1193
3.48M
    last = repLens[repMaxIndex];
1194
3.48M
    if (last <= mainLen)
1195
3.48M
      last = mainLen;
1196
    
1197
3.48M
    if (last < 2 && curByte != matchByte)
1198
3.03M
    {
1199
3.03M
      p->backRes = MARK_LIT;
1200
3.03M
      return 1;
1201
3.03M
    }
1202
    
1203
444k
    p->opt[0].state = (CState)p->state;
1204
    
1205
444k
    posState = (position & p->pbMask);
1206
    
1207
444k
    {
1208
444k
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1209
444k
      p->opt[1].price = GET_PRICE_0(p->isMatch[p->state][posState]) +
1210
444k
        (!IsLitState(p->state) ?
1211
62.6k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1212
444k
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1213
444k
    }
1214
1215
444k
    MakeAs_Lit(&p->opt[1]);
1216
    
1217
444k
    matchPrice = GET_PRICE_1(p->isMatch[p->state][posState]);
1218
444k
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[p->state]);
1219
    
1220
    // 18.06
1221
444k
    if (matchByte == curByte && repLens[0] == 0)
1222
38.2k
    {
1223
38.2k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, p->state, posState);
1224
38.2k
      if (shortRepPrice < p->opt[1].price)
1225
32.7k
      {
1226
32.7k
        p->opt[1].price = shortRepPrice;
1227
32.7k
        MakeAs_ShortRep(&p->opt[1]);
1228
32.7k
      }
1229
38.2k
      if (last < 2)
1230
28.7k
      {
1231
28.7k
        p->backRes = p->opt[1].dist;
1232
28.7k
        return 1;
1233
28.7k
      }
1234
38.2k
    }
1235
   
1236
416k
    p->opt[1].len = 1;
1237
    
1238
416k
    p->opt[0].reps[0] = reps[0];
1239
416k
    p->opt[0].reps[1] = reps[1];
1240
416k
    p->opt[0].reps[2] = reps[2];
1241
416k
    p->opt[0].reps[3] = reps[3];
1242
    
1243
    // ---------- REP ----------
1244
    
1245
2.08M
    for (i = 0; i < LZMA_NUM_REPS; i++)
1246
1.66M
    {
1247
1.66M
      unsigned repLen = repLens[i];
1248
1.66M
      UInt32 price;
1249
1.66M
      if (repLen < 2)
1250
1.60M
        continue;
1251
57.1k
      price = repMatchPrice + GetPrice_PureRep(p, i, p->state, posState);
1252
57.1k
      do
1253
313k
      {
1254
313k
        UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, repLen);
1255
313k
        COptimal *opt = &p->opt[repLen];
1256
313k
        if (price2 < opt->price)
1257
194k
        {
1258
194k
          opt->price = price2;
1259
194k
          opt->len = (UInt32)repLen;
1260
194k
          opt->dist = (UInt32)i;
1261
194k
          opt->extra = 0;
1262
194k
        }
1263
313k
      }
1264
313k
      while (--repLen >= 2);
1265
57.1k
    }
1266
    
1267
    
1268
    // ---------- MATCH ----------
1269
416k
    {
1270
416k
      unsigned len = repLens[0] + 1;
1271
416k
      if (len <= mainLen)
1272
406k
      {
1273
406k
        unsigned offs = 0;
1274
406k
        UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[p->state]);
1275
1276
406k
        if (len < 2)
1277
405k
          len = 2;
1278
1.16k
        else
1279
3.72k
          while (len > matches[offs])
1280
2.56k
            offs += 2;
1281
    
1282
406k
        for (; ; len++)
1283
622k
        {
1284
622k
          COptimal *opt;
1285
622k
          UInt32 dist = matches[(size_t)offs + 1];
1286
622k
          UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1287
622k
          unsigned lenToPosState = GetLenToPosState(len);
1288
       
1289
622k
          if (dist < kNumFullDistances)
1290
229k
            price += p->distancesPrices[lenToPosState][dist & (kNumFullDistances - 1)];
1291
393k
          else
1292
393k
          {
1293
393k
            unsigned slot;
1294
393k
            GetPosSlot2(dist, slot);
1295
393k
            price += p->alignPrices[dist & kAlignMask];
1296
393k
            price += p->posSlotPrices[lenToPosState][slot];
1297
393k
          }
1298
          
1299
622k
          opt = &p->opt[len];
1300
          
1301
622k
          if (price < opt->price)
1302
576k
          {
1303
576k
            opt->price = price;
1304
576k
            opt->len = (UInt32)len;
1305
576k
            opt->dist = dist + LZMA_NUM_REPS;
1306
576k
            opt->extra = 0;
1307
576k
          }
1308
          
1309
622k
          if (len == matches[offs])
1310
464k
          {
1311
464k
            offs += 2;
1312
464k
            if (offs == numPairs)
1313
406k
              break;
1314
464k
          }
1315
622k
        }
1316
406k
      }
1317
416k
    }
1318
    
1319
1320
416k
    cur = 0;
1321
1322
    #ifdef SHOW_STAT2
1323
    /* if (position >= 0) */
1324
    {
1325
      unsigned i;
1326
      printf("\n pos = %4X", position);
1327
      for (i = cur; i <= last; i++)
1328
      printf("\nprice[%4X] = %u", position - cur + i, p->opt[i].price);
1329
    }
1330
    #endif
1331
416k
  }
1332
1333
1334
  
1335
  // ---------- Optimal Parsing ----------
1336
1337
0
  for (;;)
1338
4.56M
  {
1339
4.56M
    unsigned numAvail;
1340
4.56M
    UInt32 numAvailFull;
1341
4.56M
    unsigned newLen, numPairs, prev, state, posState, startLen;
1342
4.56M
    UInt32 litPrice, matchPrice, repMatchPrice;
1343
4.56M
    BoolInt nextIsLit;
1344
4.56M
    Byte curByte, matchByte;
1345
4.56M
    const Byte *data;
1346
4.56M
    COptimal *curOpt, *nextOpt;
1347
1348
4.56M
    if (++cur == last)
1349
380k
      break;
1350
    
1351
    // 18.06
1352
4.18M
    if (cur >= kNumOpts - 64)
1353
402
    {
1354
402
      unsigned j, best;
1355
402
      UInt32 price = p->opt[cur].price;
1356
402
      best = cur;
1357
10.0k
      for (j = cur + 1; j <= last; j++)
1358
9.60k
      {
1359
9.60k
        UInt32 price2 = p->opt[j].price;
1360
9.60k
        if (price >= price2)
1361
862
        {
1362
862
          price = price2;
1363
862
          best = j;
1364
862
        }
1365
9.60k
      }
1366
402
      {
1367
402
        unsigned delta = best - cur;
1368
402
        if (delta != 0)
1369
244
        {
1370
244
          MOVE_POS(p, delta);
1371
244
        }
1372
402
      }
1373
402
      cur = best;
1374
402
      break;
1375
402
    }
1376
1377
4.18M
    newLen = ReadMatchDistances(p, &numPairs);
1378
    
1379
4.18M
    if (newLen >= p->numFastBytes)
1380
35.4k
    {
1381
35.4k
      p->numPairs = numPairs;
1382
35.4k
      p->longestMatchLen = newLen;
1383
35.4k
      break;
1384
35.4k
    }
1385
    
1386
4.14M
    curOpt = &p->opt[cur];
1387
1388
4.14M
    position++;
1389
1390
    // we need that check here, if skip_items in p->opt are possible
1391
    /*
1392
    if (curOpt->price >= kInfinityPrice)
1393
      continue;
1394
    */
1395
1396
4.14M
    prev = cur - curOpt->len;
1397
1398
4.14M
    if (curOpt->len == 1)
1399
1.04M
    {
1400
1.04M
      state = (unsigned)p->opt[prev].state;
1401
1.04M
      if (IsShortRep(curOpt))
1402
78.9k
        state = kShortRepNextStates[state];
1403
962k
      else
1404
962k
        state = kLiteralNextStates[state];
1405
1.04M
    }
1406
3.10M
    else
1407
3.10M
    {
1408
3.10M
      const COptimal *prevOpt;
1409
3.10M
      UInt32 b0;
1410
3.10M
      UInt32 dist = curOpt->dist;
1411
1412
3.10M
      if (curOpt->extra)
1413
43.7k
      {
1414
43.7k
        prev -= (unsigned)curOpt->extra;
1415
43.7k
        state = kState_RepAfterLit;
1416
43.7k
        if (curOpt->extra == 1)
1417
801
          state = (dist < LZMA_NUM_REPS ? kState_RepAfterLit : kState_MatchAfterLit);
1418
43.7k
      }
1419
3.06M
      else
1420
3.06M
      {
1421
3.06M
        state = (unsigned)p->opt[prev].state;
1422
3.06M
        if (dist < LZMA_NUM_REPS)
1423
1.41M
          state = kRepNextStates[state];
1424
1.64M
        else
1425
1.64M
          state = kMatchNextStates[state];
1426
3.06M
      }
1427
1428
3.10M
      prevOpt = &p->opt[prev];
1429
3.10M
      b0 = prevOpt->reps[0];
1430
1431
3.10M
      if (dist < LZMA_NUM_REPS)
1432
1.44M
      {
1433
1.44M
        if (dist == 0)
1434
330k
        {
1435
330k
          reps[0] = b0;
1436
330k
          reps[1] = prevOpt->reps[1];
1437
330k
          reps[2] = prevOpt->reps[2];
1438
330k
          reps[3] = prevOpt->reps[3];
1439
330k
        }
1440
1.11M
        else
1441
1.11M
        {
1442
1.11M
          reps[1] = b0;
1443
1.11M
          b0 = prevOpt->reps[1];
1444
1.11M
          if (dist == 1)
1445
650k
          {
1446
650k
            reps[0] = b0;
1447
650k
            reps[2] = prevOpt->reps[2];
1448
650k
            reps[3] = prevOpt->reps[3];
1449
650k
          }
1450
466k
          else
1451
466k
          {
1452
466k
            reps[2] = b0;
1453
466k
            reps[0] = prevOpt->reps[dist];
1454
466k
            reps[3] = prevOpt->reps[dist ^ 1];
1455
466k
          }
1456
1.11M
        }
1457
1.44M
      }
1458
1.65M
      else
1459
1.65M
      {
1460
1.65M
        reps[0] = (dist - LZMA_NUM_REPS + 1);
1461
1.65M
        reps[1] = b0;
1462
1.65M
        reps[2] = prevOpt->reps[1];
1463
1.65M
        reps[3] = prevOpt->reps[2];
1464
1.65M
      }
1465
3.10M
    }
1466
    
1467
4.14M
    curOpt->state = (CState)state;
1468
4.14M
    curOpt->reps[0] = reps[0];
1469
4.14M
    curOpt->reps[1] = reps[1];
1470
4.14M
    curOpt->reps[2] = reps[2];
1471
4.14M
    curOpt->reps[3] = reps[3];
1472
1473
4.14M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1474
4.14M
    curByte = *data;
1475
4.14M
    matchByte = *(data - reps[0]);
1476
1477
4.14M
    posState = (position & p->pbMask);
1478
1479
    /*
1480
    The order of Price checks:
1481
       <  LIT
1482
       <= SHORT_REP
1483
       <  LIT : REP_0
1484
       <  REP    [ : LIT : REP_0 ]
1485
       <  MATCH  [ : LIT : REP_0 ]
1486
    */
1487
1488
4.14M
    {
1489
4.14M
      UInt32 curPrice = curOpt->price;
1490
4.14M
      unsigned prob = p->isMatch[state][posState];
1491
4.14M
      matchPrice = curPrice + GET_PRICE_1(prob);
1492
4.14M
      litPrice = curPrice + GET_PRICE_0(prob);
1493
4.14M
    }
1494
1495
4.14M
    nextOpt = &p->opt[(size_t)cur + 1];
1496
4.14M
    nextIsLit = False;
1497
1498
    // here we can allow skip_items in p->opt, if we don't check (nextOpt->price < kInfinityPrice)
1499
    // 18.new.06
1500
4.14M
    if ((nextOpt->price < kInfinityPrice
1501
        // && !IsLitState(state)
1502
4.14M
        && matchByte == curByte)
1503
4.14M
        || litPrice > nextOpt->price
1504
4.14M
        )
1505
2.74M
      litPrice = 0;
1506
1.39M
    else
1507
1.39M
    {
1508
1.39M
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1509
1.39M
      litPrice += (!IsLitState(state) ?
1510
733k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1511
1.39M
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1512
      
1513
1.39M
      if (litPrice < nextOpt->price)
1514
879k
      {
1515
879k
        nextOpt->price = litPrice;
1516
879k
        nextOpt->len = 1;
1517
879k
        MakeAs_Lit(nextOpt);
1518
879k
        nextIsLit = True;
1519
879k
      }
1520
1.39M
    }
1521
1522
4.14M
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[state]);
1523
    
1524
4.14M
    numAvailFull = p->numAvail;
1525
4.14M
    {
1526
4.14M
      unsigned temp = kNumOpts - 1 - cur;
1527
4.14M
      if (numAvailFull > temp)
1528
3.32M
        numAvailFull = (UInt32)temp;
1529
4.14M
    }
1530
1531
    // 18.06
1532
    // ---------- SHORT_REP ----------
1533
4.14M
    if (IsLitState(state)) // 18.new
1534
962k
    if (matchByte == curByte)
1535
191k
    if (repMatchPrice < nextOpt->price) // 18.new
1536
    // if (numAvailFull < 2 || data[1] != *(data - reps[0] + 1))
1537
97.3k
    if (
1538
        // nextOpt->price >= kInfinityPrice ||
1539
97.3k
        nextOpt->len < 2   // we can check nextOpt->len, if skip items are not allowed in p->opt
1540
97.3k
        || (nextOpt->dist != 0
1541
            // && nextOpt->extra <= 1 // 17.old
1542
90.1k
            )
1543
97.3k
        )
1544
96.3k
    {
1545
96.3k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, state, posState);
1546
      // if (shortRepPrice <= nextOpt->price) // 17.old
1547
96.3k
      if (shortRepPrice < nextOpt->price)  // 18.new
1548
76.3k
      {
1549
76.3k
        nextOpt->price = shortRepPrice;
1550
76.3k
        nextOpt->len = 1;
1551
76.3k
        MakeAs_ShortRep(nextOpt);
1552
76.3k
        nextIsLit = False;
1553
76.3k
      }
1554
96.3k
    }
1555
    
1556
4.14M
    if (numAvailFull < 2)
1557
3.10k
      continue;
1558
4.14M
    numAvail = (numAvailFull <= p->numFastBytes ? numAvailFull : p->numFastBytes);
1559
1560
    // numAvail <= p->numFastBytes
1561
1562
    // ---------- LIT : REP_0 ----------
1563
1564
4.14M
    if (!nextIsLit
1565
4.14M
        && litPrice != 0 // 18.new
1566
4.14M
        && matchByte != curByte
1567
4.14M
        && numAvailFull > 2)
1568
517k
    {
1569
517k
      const Byte *data2 = data - reps[0];
1570
517k
      if (data[1] == data2[1] && data[2] == data2[2])
1571
103k
      {
1572
103k
        unsigned len;
1573
103k
        unsigned limit = p->numFastBytes + 1;
1574
103k
        if (limit > numAvailFull)
1575
4.98k
          limit = numAvailFull;
1576
267k
        for (len = 3; len < limit && data[len] == data2[len]; len++)
1577
164k
        {}
1578
        
1579
103k
        {
1580
103k
          unsigned state2 = kLiteralNextStates[state];
1581
103k
          unsigned posState2 = (position + 1) & p->pbMask;
1582
103k
          UInt32 price = litPrice + GetPrice_Rep_0(p, state2, posState2);
1583
103k
          {
1584
103k
            unsigned offset = cur + len;
1585
1586
103k
            if (last < offset)
1587
4.75k
              last = offset;
1588
          
1589
            // do
1590
103k
            {
1591
103k
              UInt32 price2;
1592
103k
              COptimal *opt;
1593
103k
              len--;
1594
              // price2 = price + GetPrice_Len_Rep_0(p, len, state2, posState2);
1595
103k
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len);
1596
1597
103k
              opt = &p->opt[offset];
1598
              // offset--;
1599
103k
              if (price2 < opt->price)
1600
7.52k
              {
1601
7.52k
                opt->price = price2;
1602
7.52k
                opt->len = (UInt32)len;
1603
7.52k
                opt->dist = 0;
1604
7.52k
                opt->extra = 1;
1605
7.52k
              }
1606
103k
            }
1607
            // while (len >= 3);
1608
103k
          }
1609
103k
        }
1610
103k
      }
1611
517k
    }
1612
    
1613
4.14M
    startLen = 2; /* speed optimization */
1614
1615
4.14M
    {
1616
      // ---------- REP ----------
1617
4.14M
      unsigned repIndex = 0; // 17.old
1618
      // unsigned repIndex = IsLitState(state) ? 0 : 1; // 18.notused
1619
20.7M
      for (; repIndex < LZMA_NUM_REPS; repIndex++)
1620
16.5M
      {
1621
16.5M
        unsigned len;
1622
16.5M
        UInt32 price;
1623
16.5M
        const Byte *data2 = data - reps[repIndex];
1624
16.5M
        if (data[0] != data2[0] || data[1] != data2[1])
1625
12.0M
          continue;
1626
        
1627
69.1M
        for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1628
64.6M
        {}
1629
        
1630
        // if (len < startLen) continue; // 18.new: speed optimization
1631
1632
4.53M
        {
1633
4.53M
          unsigned offset = cur + len;
1634
4.53M
          if (last < offset)
1635
196k
            last = offset;
1636
4.53M
        }
1637
4.53M
        {
1638
4.53M
          unsigned len2 = len;
1639
4.53M
          price = repMatchPrice + GetPrice_PureRep(p, repIndex, state, posState);
1640
4.53M
          do
1641
69.1M
          {
1642
69.1M
            UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, len2);
1643
69.1M
            COptimal *opt = &p->opt[cur + len2];
1644
69.1M
            if (price2 < opt->price)
1645
2.72M
            {
1646
2.72M
              opt->price = price2;
1647
2.72M
              opt->len = (UInt32)len2;
1648
2.72M
              opt->dist = (UInt32)repIndex;
1649
2.72M
              opt->extra = 0;
1650
2.72M
            }
1651
69.1M
          }
1652
69.1M
          while (--len2 >= 2);
1653
4.53M
        }
1654
        
1655
4.53M
        if (repIndex == 0) startLen = len + 1;  // 17.old
1656
        // startLen = len + 1; // 18.new
1657
1658
        /* if (_maxMode) */
1659
4.53M
        {
1660
          // ---------- REP : LIT : REP_0 ----------
1661
          // numFastBytes + 1 + numFastBytes
1662
1663
4.53M
          unsigned len2 = len + 1;
1664
4.53M
          unsigned limit = len2 + p->numFastBytes;
1665
4.53M
          if (limit > numAvailFull)
1666
372k
            limit = numAvailFull;
1667
          
1668
4.53M
          len2 += 2;
1669
4.53M
          if (len2 <= limit)
1670
4.44M
          if (data[len2 - 2] == data2[len2 - 2])
1671
2.55M
          if (data[len2 - 1] == data2[len2 - 1])
1672
1.76M
          {
1673
1.76M
            unsigned state2 = kRepNextStates[state];
1674
1.76M
            unsigned posState2 = (position + len) & p->pbMask;
1675
1.76M
            price += GET_PRICE_LEN(&p->repLenEnc, posState, len)
1676
1.76M
                + GET_PRICE_0(p->isMatch[state2][posState2])
1677
1.76M
                + LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1678
1.76M
                    data[len], data2[len], p->ProbPrices);
1679
            
1680
            // state2 = kLiteralNextStates[state2];
1681
1.76M
            state2 = kState_LitAfterRep;
1682
1.76M
            posState2 = (posState2 + 1) & p->pbMask;
1683
1684
1685
1.76M
            price += GetPrice_Rep_0(p, state2, posState2);
1686
1687
19.2M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1688
17.4M
          {}
1689
          
1690
1.76M
          len2 -= len;
1691
          // if (len2 >= 3)
1692
1.76M
          {
1693
1.76M
            {
1694
1.76M
              unsigned offset = cur + len + len2;
1695
1696
1.76M
              if (last < offset)
1697
510k
                last = offset;
1698
              // do
1699
1.76M
              {
1700
1.76M
                UInt32 price2;
1701
1.76M
                COptimal *opt;
1702
1.76M
                len2--;
1703
                // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1704
1.76M
                price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1705
1706
1.76M
                opt = &p->opt[offset];
1707
                // offset--;
1708
1.76M
                if (price2 < opt->price)
1709
613k
                {
1710
613k
                  opt->price = price2;
1711
613k
                  opt->len = (UInt32)len2;
1712
613k
                  opt->extra = (CExtra)(len + 1);
1713
613k
                  opt->dist = (UInt32)repIndex;
1714
613k
                }
1715
1.76M
              }
1716
              // while (len2 >= 3);
1717
1.76M
            }
1718
1.76M
          }
1719
1.76M
          }
1720
4.53M
        }
1721
4.53M
      }
1722
4.14M
    }
1723
1724
1725
    // ---------- MATCH ----------
1726
    /* for (unsigned len = 2; len <= newLen; len++) */
1727
4.14M
    if (newLen > numAvail)
1728
552
    {
1729
552
      newLen = numAvail;
1730
1.66k
      for (numPairs = 0; newLen > matches[numPairs]; numPairs += 2);
1731
552
      matches[numPairs] = (UInt32)newLen;
1732
552
      numPairs += 2;
1733
552
    }
1734
    
1735
    // startLen = 2; /* speed optimization */
1736
1737
4.14M
    if (newLen >= startLen)
1738
2.53M
    {
1739
2.53M
      UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[state]);
1740
2.53M
      UInt32 dist;
1741
2.53M
      unsigned offs, posSlot, len;
1742
      
1743
2.53M
      {
1744
2.53M
        unsigned offset = cur + newLen;
1745
2.53M
        if (last < offset)
1746
722k
          last = offset;
1747
2.53M
      }
1748
1749
2.53M
      offs = 0;
1750
2.83M
      while (startLen > matches[offs])
1751
297k
        offs += 2;
1752
2.53M
      dist = matches[(size_t)offs + 1];
1753
      
1754
      // if (dist >= kNumFullDistances)
1755
2.53M
      GetPosSlot2(dist, posSlot);
1756
      
1757
11.0M
      for (len = /*2*/ startLen; ; len++)
1758
13.6M
      {
1759
13.6M
        UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1760
13.6M
        {
1761
13.6M
          COptimal *opt;
1762
13.6M
          unsigned lenNorm = len - 2;
1763
13.6M
          lenNorm = GetLenToPosState2(lenNorm);
1764
13.6M
          if (dist < kNumFullDistances)
1765
10.1M
            price += p->distancesPrices[lenNorm][dist & (kNumFullDistances - 1)];
1766
3.47M
          else
1767
3.47M
            price += p->posSlotPrices[lenNorm][posSlot] + p->alignPrices[dist & kAlignMask];
1768
          
1769
13.6M
          opt = &p->opt[cur + len];
1770
13.6M
          if (price < opt->price)
1771
3.00M
          {
1772
3.00M
            opt->price = price;
1773
3.00M
            opt->len = (UInt32)len;
1774
3.00M
            opt->dist = dist + LZMA_NUM_REPS;
1775
3.00M
            opt->extra = 0;
1776
3.00M
          }
1777
13.6M
        }
1778
1779
13.6M
        if (len == matches[offs])
1780
3.14M
        {
1781
          // if (p->_maxMode) {
1782
          // MATCH : LIT : REP_0
1783
1784
3.14M
          const Byte *data2 = data - dist - 1;
1785
3.14M
          unsigned len2 = len + 1;
1786
3.14M
          unsigned limit = len2 + p->numFastBytes;
1787
3.14M
          if (limit > numAvailFull)
1788
126k
            limit = numAvailFull;
1789
          
1790
3.14M
          len2 += 2;
1791
3.14M
          if (len2 <= limit)
1792
3.13M
          if (data[len2 - 2] == data2[len2 - 2])
1793
1.33M
          if (data[len2 - 1] == data2[len2 - 1])
1794
851k
          {
1795
3.41M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1796
2.56M
          {}
1797
          
1798
851k
          len2 -= len;
1799
          
1800
          // if (len2 >= 3)
1801
851k
          {
1802
851k
            unsigned state2 = kMatchNextStates[state];
1803
851k
            unsigned posState2 = (position + len) & p->pbMask;
1804
851k
            unsigned offset;
1805
851k
            price += GET_PRICE_0(p->isMatch[state2][posState2]);
1806
851k
            price += LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1807
851k
                    data[len], data2[len], p->ProbPrices);
1808
1809
            // state2 = kLiteralNextStates[state2];
1810
851k
            state2 = kState_LitAfterMatch;
1811
1812
851k
            posState2 = (posState2 + 1) & p->pbMask;
1813
851k
            price += GetPrice_Rep_0(p, state2, posState2);
1814
1815
851k
            offset = cur + len + len2;
1816
1817
851k
            if (last < offset)
1818
109k
              last = offset;
1819
            // do
1820
851k
            {
1821
851k
              UInt32 price2;
1822
851k
              COptimal *opt;
1823
851k
              len2--;
1824
              // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1825
851k
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1826
851k
              opt = &p->opt[offset];
1827
              // offset--;
1828
851k
              if (price2 < opt->price)
1829
400k
              {
1830
400k
                opt->price = price2;
1831
400k
                opt->len = (UInt32)len2;
1832
400k
                opt->extra = (CExtra)(len + 1);
1833
400k
                opt->dist = dist + LZMA_NUM_REPS;
1834
400k
              }
1835
851k
            }
1836
            // while (len2 >= 3);
1837
851k
          }
1838
1839
851k
          }
1840
        
1841
3.14M
          offs += 2;
1842
3.14M
          if (offs == numPairs)
1843
2.53M
            break;
1844
613k
          dist = matches[(size_t)offs + 1];
1845
          // if (dist >= kNumFullDistances)
1846
613k
            GetPosSlot2(dist, posSlot);
1847
613k
        }
1848
13.6M
      }
1849
2.53M
    }
1850
4.14M
  }
1851
1852
416k
  do
1853
4.80M
    p->opt[last].price = kInfinityPrice;
1854
4.80M
  while (--last);
1855
1856
416k
  return Backward(p, cur);
1857
444k
}
1858
1859
1860
1861
94.8k
#define ChangePair(smallDist, bigDist) (((bigDist) >> 7) > (smallDist))
1862
1863
1864
1865
static unsigned GetOptimumFast(CLzmaEnc *p)
1866
4.08M
{
1867
4.08M
  UInt32 numAvail, mainDist;
1868
4.08M
  unsigned mainLen, numPairs, repIndex, repLen, i;
1869
4.08M
  const Byte *data;
1870
1871
4.08M
  if (p->additionalOffset == 0)
1872
4.03M
    mainLen = ReadMatchDistances(p, &numPairs);
1873
47.3k
  else
1874
47.3k
  {
1875
47.3k
    mainLen = p->longestMatchLen;
1876
47.3k
    numPairs = p->numPairs;
1877
47.3k
  }
1878
1879
4.08M
  numAvail = p->numAvail;
1880
4.08M
  p->backRes = MARK_LIT;
1881
4.08M
  if (numAvail < 2)
1882
1.27k
    return 1;
1883
  // if (mainLen < 2 && p->state == 0) return 1; // 18.06.notused
1884
4.08M
  if (numAvail > LZMA_MATCH_LEN_MAX)
1885
3.98M
    numAvail = LZMA_MATCH_LEN_MAX;
1886
4.08M
  data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1887
4.08M
  repLen = repIndex = 0;
1888
  
1889
20.3M
  for (i = 0; i < LZMA_NUM_REPS; i++)
1890
16.2M
  {
1891
16.2M
    unsigned len;
1892
16.2M
    const Byte *data2 = data - p->reps[i];
1893
16.2M
    if (data[0] != data2[0] || data[1] != data2[1])
1894
16.1M
      continue;
1895
2.79M
    for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1896
2.66M
    {}
1897
134k
    if (len >= p->numFastBytes)
1898
28.2k
    {
1899
28.2k
      p->backRes = (UInt32)i;
1900
28.2k
      MOVE_POS(p, len - 1)
1901
28.2k
      return len;
1902
28.2k
    }
1903
105k
    if (len > repLen)
1904
79.8k
    {
1905
79.8k
      repIndex = i;
1906
79.8k
      repLen = len;
1907
79.8k
    }
1908
105k
  }
1909
1910
4.05M
  if (mainLen >= p->numFastBytes)
1911
36.4k
  {
1912
36.4k
    p->backRes = p->matches[(size_t)numPairs - 1] + LZMA_NUM_REPS;
1913
36.4k
    MOVE_POS(p, mainLen - 1)
1914
36.4k
    return mainLen;
1915
36.4k
  }
1916
1917
4.01M
  mainDist = 0; /* for GCC */
1918
  
1919
4.01M
  if (mainLen >= 2)
1920
557k
  {
1921
557k
    mainDist = p->matches[(size_t)numPairs - 1];
1922
560k
    while (numPairs > 2)
1923
53.2k
    {
1924
53.2k
      UInt32 dist2;
1925
53.2k
      if (mainLen != p->matches[(size_t)numPairs - 4] + 1)
1926
17.2k
        break;
1927
35.9k
      dist2 = p->matches[(size_t)numPairs - 3];
1928
35.9k
      if (!ChangePair(dist2, mainDist))
1929
32.6k
        break;
1930
3.29k
      numPairs -= 2;
1931
3.29k
      mainLen--;
1932
3.29k
      mainDist = dist2;
1933
3.29k
    }
1934
557k
    if (mainLen == 2 && mainDist >= 0x80)
1935
368k
      mainLen = 1;
1936
557k
  }
1937
1938
4.01M
  if (repLen >= 2)
1939
64.2k
    if (    repLen + 1 >= mainLen
1940
64.2k
        || (repLen + 2 >= mainLen && mainDist >= (1 << 9))
1941
64.2k
        || (repLen + 3 >= mainLen && mainDist >= (1 << 15)))
1942
57.4k
  {
1943
57.4k
    p->backRes = (UInt32)repIndex;
1944
57.4k
    MOVE_POS(p, repLen - 1)
1945
57.4k
    return repLen;
1946
57.4k
  }
1947
  
1948
3.95M
  if (mainLen < 2 || numAvail <= 2)
1949
3.82M
    return 1;
1950
1951
132k
  {
1952
132k
    unsigned len1 = ReadMatchDistances(p, &p->numPairs);
1953
132k
    p->longestMatchLen = len1;
1954
  
1955
132k
    if (len1 >= 2)
1956
104k
    {
1957
104k
      UInt32 newDist = p->matches[(size_t)p->numPairs - 1];
1958
104k
      if (   (len1 >= mainLen && newDist < mainDist)
1959
104k
          || (len1 == mainLen + 1 && !ChangePair(mainDist, newDist))
1960
104k
          || (len1 >  mainLen + 1)
1961
104k
          || (len1 + 1 >= mainLen && mainLen >= 3 && ChangePair(newDist, mainDist)))
1962
39.6k
        return 1;
1963
104k
    }
1964
132k
  }
1965
  
1966
92.7k
  data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1967
  
1968
440k
  for (i = 0; i < LZMA_NUM_REPS; i++)
1969
354k
  {
1970
354k
    unsigned len, limit;
1971
354k
    const Byte *data2 = data - p->reps[i];
1972
354k
    if (data[0] != data2[0] || data[1] != data2[1])
1973
339k
      continue;
1974
15.8k
    limit = mainLen - 1;
1975
20.1k
    for (len = 2;; len++)
1976
35.9k
    {
1977
35.9k
      if (len >= limit)
1978
7.65k
        return 1;
1979
28.2k
      if (data[len] != data2[len])
1980
8.16k
        break;
1981
28.2k
    }
1982
15.8k
  }
1983
  
1984
85.1k
  p->backRes = mainDist + LZMA_NUM_REPS;
1985
85.1k
  if (mainLen != 2)
1986
52.6k
  {
1987
52.6k
    MOVE_POS(p, mainLen - 2)
1988
52.6k
  }
1989
85.1k
  return mainLen;
1990
92.7k
}
1991
1992
1993
1994
1995
static void WriteEndMarker(CLzmaEnc *p, unsigned posState)
1996
0
{
1997
0
  UInt32 range;
1998
0
  range = p->rc.range;
1999
0
  {
2000
0
    UInt32 ttt, newBound;
2001
0
    CLzmaProb *prob = &p->isMatch[p->state][posState];
2002
0
    RC_BIT_PRE(&p->rc, prob)
2003
0
    RC_BIT_1(&p->rc, prob)
2004
0
    prob = &p->isRep[p->state];
2005
0
    RC_BIT_PRE(&p->rc, prob)
2006
0
    RC_BIT_0(&p->rc, prob)
2007
0
  }
2008
0
  p->state = kMatchNextStates[p->state];
2009
  
2010
0
  p->rc.range = range;
2011
0
  LenEnc_Encode(&p->lenProbs, &p->rc, 0, posState);
2012
0
  range = p->rc.range;
2013
2014
0
  {
2015
    // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[0], (1 << kNumPosSlotBits) - 1);
2016
0
    CLzmaProb *probs = p->posSlotEncoder[0];
2017
0
    unsigned m = 1;
2018
0
    do
2019
0
    {
2020
0
      UInt32 ttt, newBound;
2021
0
      RC_BIT_PRE(p, probs + m)
2022
0
      RC_BIT_1(&p->rc, probs + m);
2023
0
      m = (m << 1) + 1;
2024
0
    }
2025
0
    while (m < (1 << kNumPosSlotBits));
2026
0
  }
2027
0
  {
2028
    // RangeEnc_EncodeDirectBits(&p->rc, ((UInt32)1 << (30 - kNumAlignBits)) - 1, 30 - kNumAlignBits);    UInt32 range = p->range;
2029
0
    unsigned numBits = 30 - kNumAlignBits;
2030
0
    do
2031
0
    {
2032
0
      range >>= 1;
2033
0
      p->rc.low += range;
2034
0
      RC_NORM(&p->rc)
2035
0
    }
2036
0
    while (--numBits);
2037
0
  }
2038
   
2039
0
  {
2040
    // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, kAlignMask);
2041
0
    CLzmaProb *probs = p->posAlignEncoder;
2042
0
    unsigned m = 1;
2043
0
    do
2044
0
    {
2045
0
      UInt32 ttt, newBound;
2046
0
      RC_BIT_PRE(p, probs + m)
2047
0
      RC_BIT_1(&p->rc, probs + m);
2048
0
      m = (m << 1) + 1;
2049
0
    }
2050
0
    while (m < kAlignTableSize);
2051
0
  }
2052
0
  p->rc.range = range;
2053
0
}
2054
2055
2056
static SRes CheckErrors(CLzmaEnc *p)
2057
31.2k
{
2058
31.2k
  if (p->result != SZ_OK)
2059
0
    return p->result;
2060
31.2k
  if (p->rc.res != SZ_OK)
2061
0
    p->result = SZ_ERROR_WRITE;
2062
31.2k
  if (p->matchFinderBase.result != SZ_OK)
2063
0
    p->result = SZ_ERROR_READ;
2064
31.2k
  if (p->result != SZ_OK)
2065
0
    p->finished = True;
2066
31.2k
  return p->result;
2067
31.2k
}
2068
2069
2070
MY_NO_INLINE static SRes Flush(CLzmaEnc *p, UInt32 nowPos)
2071
15.6k
{
2072
  /* ReleaseMFStream(); */
2073
15.6k
  p->finished = True;
2074
15.6k
  if (p->writeEndMark)
2075
0
    WriteEndMarker(p, nowPos & p->pbMask);
2076
15.6k
  RangeEnc_FlushData(&p->rc);
2077
15.6k
  RangeEnc_FlushStream(&p->rc);
2078
15.6k
  return CheckErrors(p);
2079
15.6k
}
2080
2081
2082
MY_NO_INLINE static void FillAlignPrices(CLzmaEnc *p)
2083
25.3k
{
2084
25.3k
  unsigned i;
2085
25.3k
  const CProbPrice *ProbPrices = p->ProbPrices;
2086
25.3k
  const CLzmaProb *probs = p->posAlignEncoder;
2087
  // p->alignPriceCount = 0;
2088
228k
  for (i = 0; i < kAlignTableSize / 2; i++)
2089
202k
  {
2090
202k
    UInt32 price = 0;
2091
202k
    unsigned sym = i;
2092
202k
    unsigned m = 1;
2093
202k
    unsigned bit;
2094
202k
    UInt32 prob;
2095
202k
    bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[m], bit); m = (m << 1) + bit;
2096
202k
    bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[m], bit); m = (m << 1) + bit;
2097
202k
    bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[m], bit); m = (m << 1) + bit;
2098
202k
    prob = probs[m];
2099
202k
    p->alignPrices[i    ] = price + GET_PRICEa_0(prob);
2100
202k
    p->alignPrices[i + 8] = price + GET_PRICEa_1(prob);
2101
    // p->alignPrices[i] = RcTree_ReverseGetPrice(p->posAlignEncoder, kNumAlignBits, i, p->ProbPrices);
2102
202k
  }
2103
25.3k
}
2104
2105
2106
MY_NO_INLINE static void FillDistancesPrices(CLzmaEnc *p)
2107
25.3k
{
2108
  // int y; for (y = 0; y < 100; y++) {
2109
2110
25.3k
  UInt32 tempPrices[kNumFullDistances];
2111
25.3k
  unsigned i, lps;
2112
2113
25.3k
  const CProbPrice *ProbPrices = p->ProbPrices;
2114
25.3k
  p->matchPriceCount = 0;
2115
2116
1.59M
  for (i = kStartPosModelIndex / 2; i < kNumFullDistances / 2; i++)
2117
1.57M
  {
2118
1.57M
    unsigned posSlot = GetPosSlot1(i);
2119
1.57M
    unsigned footerBits = (posSlot >> 1) - 1;
2120
1.57M
    unsigned base = ((2 | (posSlot & 1)) << footerBits);
2121
1.57M
    const CLzmaProb *probs = p->posEncoders + (size_t)base * 2;
2122
    // tempPrices[i] = RcTree_ReverseGetPrice(p->posEncoders + base, footerBits, i - base, p->ProbPrices);
2123
1.57M
    UInt32 price = 0;
2124
1.57M
    unsigned m = 1;
2125
1.57M
    unsigned sym = i;
2126
1.57M
    unsigned offset = (unsigned)1 << footerBits;
2127
1.57M
    base += i;
2128
    
2129
1.57M
    if (footerBits)
2130
1.52M
    do
2131
4.97M
    {
2132
4.97M
      unsigned bit = sym & 1;
2133
4.97M
      sym >>= 1;
2134
4.97M
      price += GET_PRICEa(probs[m], bit);
2135
4.97M
      m = (m << 1) + bit;
2136
4.97M
    }
2137
4.97M
    while (--footerBits);
2138
2139
1.57M
    {
2140
1.57M
      unsigned prob = probs[m];
2141
1.57M
      tempPrices[base         ] = price + GET_PRICEa_0(prob);
2142
1.57M
      tempPrices[base + offset] = price + GET_PRICEa_1(prob);
2143
1.57M
    }
2144
1.57M
  }
2145
2146
126k
  for (lps = 0; lps < kNumLenToPosStates; lps++)
2147
101k
  {
2148
101k
    unsigned slot;
2149
101k
    unsigned distTableSize2 = (p->distTableSize + 1) >> 1;
2150
101k
    UInt32 *posSlotPrices = p->posSlotPrices[lps];
2151
101k
    const CLzmaProb *probs = p->posSlotEncoder[lps];
2152
    
2153
2.53M
    for (slot = 0; slot < distTableSize2; slot++)
2154
2.43M
    {
2155
      // posSlotPrices[slot] = RcTree_GetPrice(encoder, kNumPosSlotBits, slot, p->ProbPrices);
2156
2.43M
      UInt32 price;
2157
2.43M
      unsigned bit;
2158
2.43M
      unsigned sym = slot + (1 << (kNumPosSlotBits - 1));
2159
2.43M
      unsigned prob;
2160
2.43M
      bit = sym & 1; sym >>= 1; price  = GET_PRICEa(probs[sym], bit);
2161
2.43M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2162
2.43M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2163
2.43M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2164
2.43M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2165
2.43M
      prob = probs[(size_t)slot + (1 << (kNumPosSlotBits - 1))];
2166
2.43M
      posSlotPrices[(size_t)slot * 2    ] = price + GET_PRICEa_0(prob);
2167
2.43M
      posSlotPrices[(size_t)slot * 2 + 1] = price + GET_PRICEa_1(prob);
2168
2.43M
    }
2169
    
2170
101k
    {
2171
101k
      UInt32 delta = ((UInt32)((kEndPosModelIndex / 2 - 1) - kNumAlignBits) << kNumBitPriceShiftBits);
2172
1.82M
      for (slot = kEndPosModelIndex / 2; slot < distTableSize2; slot++)
2173
1.72M
      {
2174
1.72M
        posSlotPrices[(size_t)slot * 2    ] += delta;
2175
1.72M
        posSlotPrices[(size_t)slot * 2 + 1] += delta;
2176
1.72M
        delta += ((UInt32)1 << kNumBitPriceShiftBits);
2177
1.72M
      }
2178
101k
    }
2179
2180
101k
    {
2181
101k
      UInt32 *dp = p->distancesPrices[lps];
2182
      
2183
101k
      dp[0] = posSlotPrices[0];
2184
101k
      dp[1] = posSlotPrices[1];
2185
101k
      dp[2] = posSlotPrices[2];
2186
101k
      dp[3] = posSlotPrices[3];
2187
2188
6.39M
      for (i = 4; i < kNumFullDistances; i += 2)
2189
6.29M
      {
2190
6.29M
        UInt32 slotPrice = posSlotPrices[GetPosSlot1(i)];
2191
6.29M
        dp[i    ] = slotPrice + tempPrices[i];
2192
6.29M
        dp[i + 1] = slotPrice + tempPrices[i + 1];
2193
6.29M
      }
2194
101k
    }
2195
101k
  }
2196
  // }
2197
25.3k
}
2198
2199
2200
2201
void LzmaEnc_Construct(CLzmaEnc *p)
2202
7.77k
{
2203
7.77k
  RangeEnc_Construct(&p->rc);
2204
7.77k
  MatchFinder_Construct(&p->matchFinderBase);
2205
  
2206
  #ifndef _7ZIP_ST
2207
  MatchFinderMt_Construct(&p->matchFinderMt);
2208
  p->matchFinderMt.MatchFinder = &p->matchFinderBase;
2209
  #endif
2210
2211
7.77k
  {
2212
7.77k
    CLzmaEncProps props;
2213
7.77k
    LzmaEncProps_Init(&props);
2214
7.77k
    LzmaEnc_SetProps(p, &props);
2215
7.77k
  }
2216
2217
7.77k
  #ifndef LZMA_LOG_BSR
2218
7.77k
  LzmaEnc_FastPosInit(p->g_FastPos);
2219
7.77k
  #endif
2220
2221
7.77k
  LzmaEnc_InitPriceTables(p->ProbPrices);
2222
7.77k
  p->litProbs = NULL;
2223
7.77k
  p->saveState.litProbs = NULL;
2224
2225
7.77k
}
2226
2227
CLzmaEncHandle LzmaEnc_Create(ISzAllocPtr alloc)
2228
7.77k
{
2229
7.77k
  void *p;
2230
7.77k
  p = ISzAlloc_Alloc(alloc, sizeof(CLzmaEnc));
2231
7.77k
  if (p)
2232
7.77k
    LzmaEnc_Construct((CLzmaEnc *)p);
2233
7.77k
  return p;
2234
7.77k
}
2235
2236
void LzmaEnc_FreeLits(CLzmaEnc *p, ISzAllocPtr alloc)
2237
15.5k
{
2238
15.5k
  ISzAlloc_Free(alloc, p->litProbs);
2239
15.5k
  ISzAlloc_Free(alloc, p->saveState.litProbs);
2240
15.5k
  p->litProbs = NULL;
2241
15.5k
  p->saveState.litProbs = NULL;
2242
15.5k
}
2243
2244
void LzmaEnc_Destruct(CLzmaEnc *p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2245
7.77k
{
2246
  #ifndef _7ZIP_ST
2247
  MatchFinderMt_Destruct(&p->matchFinderMt, allocBig);
2248
  #endif
2249
  
2250
7.77k
  MatchFinder_Free(&p->matchFinderBase, allocBig);
2251
7.77k
  LzmaEnc_FreeLits(p, alloc);
2252
7.77k
  RangeEnc_Free(&p->rc, alloc);
2253
7.77k
}
2254
2255
void LzmaEnc_Destroy(CLzmaEncHandle p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2256
7.77k
{
2257
7.77k
  LzmaEnc_Destruct((CLzmaEnc *)p, alloc, allocBig);
2258
7.77k
  ISzAlloc_Free(alloc, p);
2259
7.77k
}
2260
2261
2262
static SRes LzmaEnc_CodeOneBlock(CLzmaEnc *p, UInt32 maxPackSize, UInt32 maxUnpackSize)
2263
15.6k
{
2264
15.6k
  UInt32 nowPos32, startPos32;
2265
15.6k
  if (p->needInit)
2266
7.77k
  {
2267
7.77k
    p->matchFinder.Init(p->matchFinderObj);
2268
7.77k
    p->needInit = 0;
2269
7.77k
  }
2270
2271
15.6k
  if (p->finished)
2272
0
    return p->result;
2273
15.6k
  RINOK(CheckErrors(p));
2274
2275
15.6k
  nowPos32 = (UInt32)p->nowPos64;
2276
15.6k
  startPos32 = nowPos32;
2277
2278
15.6k
  if (p->nowPos64 == 0)
2279
7.77k
  {
2280
7.77k
    unsigned numPairs;
2281
7.77k
    Byte curByte;
2282
7.77k
    if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2283
0
      return Flush(p, nowPos32);
2284
7.77k
    ReadMatchDistances(p, &numPairs);
2285
7.77k
    RangeEnc_EncodeBit_0(&p->rc, &p->isMatch[kState_Start][0]);
2286
    // p->state = kLiteralNextStates[p->state];
2287
7.77k
    curByte = *(p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset);
2288
7.77k
    LitEnc_Encode(&p->rc, p->litProbs, curByte);
2289
7.77k
    p->additionalOffset--;
2290
7.77k
    nowPos32++;
2291
7.77k
  }
2292
2293
15.6k
  if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) != 0)
2294
  
2295
7.82k
  for (;;)
2296
9.20M
  {
2297
9.20M
    UInt32 dist;
2298
9.20M
    unsigned len, posState;
2299
9.20M
    UInt32 range, ttt, newBound;
2300
9.20M
    CLzmaProb *probs;
2301
  
2302
9.20M
    if (p->fastMode)
2303
4.08M
      len = GetOptimumFast(p);
2304
5.11M
    else
2305
5.11M
    {
2306
5.11M
      unsigned oci = p->optCur;
2307
5.11M
      if (p->optEnd == oci)
2308
3.58M
        len = GetOptimum(p, nowPos32);
2309
1.53M
      else
2310
1.53M
      {
2311
1.53M
        const COptimal *opt = &p->opt[oci];
2312
1.53M
        len = opt->len;
2313
1.53M
        p->backRes = opt->dist;
2314
1.53M
        p->optCur = oci + 1;
2315
1.53M
      }
2316
5.11M
    }
2317
2318
9.20M
    posState = (unsigned)nowPos32 & p->pbMask;
2319
9.20M
    range = p->rc.range;
2320
9.20M
    probs = &p->isMatch[p->state][posState];
2321
    
2322
9.20M
    RC_BIT_PRE(&p->rc, probs)
2323
    
2324
9.20M
    dist = p->backRes;
2325
2326
    #ifdef SHOW_STAT2
2327
    printf("\n pos = %6X, len = %3u  pos = %6u", nowPos32, len, dist);
2328
    #endif
2329
2330
9.20M
    if (dist == MARK_LIT)
2331
7.87M
    {
2332
7.87M
      Byte curByte;
2333
7.87M
      const Byte *data;
2334
7.87M
      unsigned state;
2335
2336
7.87M
      RC_BIT_0(&p->rc, probs);
2337
7.87M
      p->rc.range = range;
2338
7.87M
      data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset;
2339
7.87M
      probs = LIT_PROBS(nowPos32, *(data - 1));
2340
7.87M
      curByte = *data;
2341
7.87M
      state = p->state;
2342
7.87M
      p->state = kLiteralNextStates[state];
2343
7.87M
      if (IsLitState(state))
2344
7.55M
        LitEnc_Encode(&p->rc, probs, curByte);
2345
326k
      else
2346
326k
        LitEnc_EncodeMatched(&p->rc, probs, curByte, *(data - p->reps[0]));
2347
7.87M
    }
2348
1.32M
    else
2349
1.32M
    {
2350
1.32M
      RC_BIT_1(&p->rc, probs);
2351
1.32M
      probs = &p->isRep[p->state];
2352
1.32M
      RC_BIT_PRE(&p->rc, probs)
2353
      
2354
1.32M
      if (dist < LZMA_NUM_REPS)
2355
499k
      {
2356
499k
        RC_BIT_1(&p->rc, probs);
2357
499k
        probs = &p->isRepG0[p->state];
2358
499k
        RC_BIT_PRE(&p->rc, probs)
2359
499k
        if (dist == 0)
2360
159k
        {
2361
159k
          RC_BIT_0(&p->rc, probs);
2362
159k
          probs = &p->isRep0Long[p->state][posState];
2363
159k
          RC_BIT_PRE(&p->rc, probs)
2364
159k
          if (len != 1)
2365
97.9k
          {
2366
97.9k
            RC_BIT_1_BASE(&p->rc, probs);
2367
97.9k
          }
2368
61.2k
          else
2369
61.2k
          {
2370
61.2k
            RC_BIT_0_BASE(&p->rc, probs);
2371
61.2k
            p->state = kShortRepNextStates[p->state];
2372
61.2k
          }
2373
159k
        }
2374
340k
        else
2375
340k
        {
2376
340k
          RC_BIT_1(&p->rc, probs);
2377
340k
          probs = &p->isRepG1[p->state];
2378
340k
          RC_BIT_PRE(&p->rc, probs)
2379
340k
          if (dist == 1)
2380
151k
          {
2381
151k
            RC_BIT_0_BASE(&p->rc, probs);
2382
151k
            dist = p->reps[1];
2383
151k
          }
2384
188k
          else
2385
188k
          {
2386
188k
            RC_BIT_1(&p->rc, probs);
2387
188k
            probs = &p->isRepG2[p->state];
2388
188k
            RC_BIT_PRE(&p->rc, probs)
2389
188k
            if (dist == 2)
2390
118k
            {
2391
118k
              RC_BIT_0_BASE(&p->rc, probs);
2392
118k
              dist = p->reps[2];
2393
118k
            }
2394
69.9k
            else
2395
69.9k
            {
2396
69.9k
              RC_BIT_1_BASE(&p->rc, probs);
2397
69.9k
              dist = p->reps[3];
2398
69.9k
              p->reps[3] = p->reps[2];
2399
69.9k
            }
2400
188k
            p->reps[2] = p->reps[1];
2401
188k
          }
2402
340k
          p->reps[1] = p->reps[0];
2403
340k
          p->reps[0] = dist;
2404
340k
        }
2405
2406
499k
        RC_NORM(&p->rc)
2407
2408
499k
        p->rc.range = range;
2409
2410
499k
        if (len != 1)
2411
438k
        {
2412
438k
          LenEnc_Encode(&p->repLenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2413
438k
          --p->repLenEncCounter;
2414
438k
          p->state = kRepNextStates[p->state];
2415
438k
        }
2416
499k
      }
2417
823k
      else
2418
823k
      {
2419
823k
        unsigned posSlot;
2420
823k
        RC_BIT_0(&p->rc, probs);
2421
823k
        p->rc.range = range;
2422
823k
        p->state = kMatchNextStates[p->state];
2423
2424
823k
        LenEnc_Encode(&p->lenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2425
        // --p->lenEnc.counter;
2426
2427
823k
        dist -= LZMA_NUM_REPS;
2428
823k
        p->reps[3] = p->reps[2];
2429
823k
        p->reps[2] = p->reps[1];
2430
823k
        p->reps[1] = p->reps[0];
2431
823k
        p->reps[0] = dist + 1;
2432
        
2433
823k
        p->matchPriceCount++;
2434
823k
        GetPosSlot(dist, posSlot);
2435
        // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[GetLenToPosState(len)], posSlot);
2436
823k
        {
2437
823k
          UInt32 sym = (UInt32)posSlot + (1 << kNumPosSlotBits);
2438
823k
          range = p->rc.range;
2439
823k
          probs = p->posSlotEncoder[GetLenToPosState(len)];
2440
823k
          do
2441
4.94M
          {
2442
4.94M
            CLzmaProb *prob = probs + (sym >> kNumPosSlotBits);
2443
4.94M
            UInt32 bit = (sym >> (kNumPosSlotBits - 1)) & 1;
2444
4.94M
            sym <<= 1;
2445
4.94M
            RC_BIT(&p->rc, prob, bit);
2446
4.94M
          }
2447
4.94M
          while (sym < (1 << kNumPosSlotBits * 2));
2448
823k
          p->rc.range = range;
2449
823k
        }
2450
        
2451
823k
        if (dist >= kStartPosModelIndex)
2452
543k
        {
2453
543k
          unsigned footerBits = ((posSlot >> 1) - 1);
2454
2455
543k
          if (dist < kNumFullDistances)
2456
409k
          {
2457
409k
            unsigned base = ((2 | (posSlot & 1)) << footerBits);
2458
409k
            RcTree_ReverseEncode(&p->rc, p->posEncoders + base, footerBits, (unsigned)(dist /* - base */));
2459
409k
          }
2460
133k
          else
2461
133k
          {
2462
133k
            UInt32 pos2 = (dist | 0xF) << (32 - footerBits);
2463
133k
            range = p->rc.range;
2464
            // RangeEnc_EncodeDirectBits(&p->rc, posReduced >> kNumAlignBits, footerBits - kNumAlignBits);
2465
            /*
2466
            do
2467
            {
2468
              range >>= 1;
2469
              p->rc.low += range & (0 - ((dist >> --footerBits) & 1));
2470
              RC_NORM(&p->rc)
2471
            }
2472
            while (footerBits > kNumAlignBits);
2473
            */
2474
133k
            do
2475
572k
            {
2476
572k
              range >>= 1;
2477
572k
              p->rc.low += range & (0 - (pos2 >> 31));
2478
572k
              pos2 += pos2;
2479
572k
              RC_NORM(&p->rc)
2480
572k
            }
2481
572k
            while (pos2 != 0xF0000000);
2482
2483
2484
            // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, posReduced & kAlignMask);
2485
2486
133k
            {
2487
133k
              unsigned m = 1;
2488
133k
              unsigned bit;
2489
133k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2490
133k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2491
133k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2492
133k
              bit = dist & 1;             RC_BIT(&p->rc, p->posAlignEncoder + m, bit);
2493
133k
              p->rc.range = range;
2494
              // p->alignPriceCount++;
2495
133k
            }
2496
133k
          }
2497
543k
        }
2498
823k
      }
2499
1.32M
    }
2500
2501
9.20M
    nowPos32 += (UInt32)len;
2502
9.20M
    p->additionalOffset -= len;
2503
    
2504
9.20M
    if (p->additionalOffset == 0)
2505
7.58M
    {
2506
7.58M
      UInt32 processed;
2507
2508
7.58M
      if (!p->fastMode)
2509
3.55M
      {
2510
        /*
2511
        if (p->alignPriceCount >= 16) // kAlignTableSize
2512
          FillAlignPrices(p);
2513
        if (p->matchPriceCount >= 128)
2514
          FillDistancesPrices(p);
2515
        if (p->lenEnc.counter <= 0)
2516
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2517
        */
2518
3.55M
        if (p->matchPriceCount >= 64)
2519
9.16k
        {
2520
9.16k
          FillAlignPrices(p);
2521
          // { int y; for (y = 0; y < 100; y++) {
2522
9.16k
          FillDistancesPrices(p);
2523
          // }}
2524
9.16k
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2525
9.16k
        }
2526
3.55M
        if (p->repLenEncCounter <= 0)
2527
3.03k
        {
2528
3.03k
          p->repLenEncCounter = REP_LEN_COUNT;
2529
3.03k
          LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
2530
3.03k
        }
2531
3.55M
      }
2532
    
2533
7.58M
      if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2534
7.74k
        break;
2535
7.58M
      processed = nowPos32 - startPos32;
2536
      
2537
7.58M
      if (maxPackSize)
2538
7.58M
      {
2539
7.58M
        if (processed + kNumOpts + 300 >= maxUnpackSize
2540
7.58M
            || RangeEnc_GetProcessed_sizet(&p->rc) + kPackReserve >= maxPackSize)
2541
88
          break;
2542
7.58M
      }
2543
0
      else if (processed >= (1 << 17))
2544
0
      {
2545
0
        p->nowPos64 += nowPos32 - startPos32;
2546
0
        return CheckErrors(p);
2547
0
      }
2548
7.58M
    }
2549
9.20M
  }
2550
2551
15.6k
  p->nowPos64 += nowPos32 - startPos32;
2552
15.6k
  return Flush(p, nowPos32);
2553
15.6k
}
2554
2555
2556
2557
7.77k
#define kBigHashDicLimit ((UInt32)1 << 24)
2558
2559
static SRes LzmaEnc_Alloc(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2560
7.77k
{
2561
7.77k
  UInt32 beforeSize = kNumOpts;
2562
7.77k
  if (!RangeEnc_Alloc(&p->rc, alloc))
2563
0
    return SZ_ERROR_MEM;
2564
2565
  #ifndef _7ZIP_ST
2566
  p->mtMode = (p->multiThread && !p->fastMode && (p->matchFinderBase.btMode != 0));
2567
  #endif
2568
2569
7.77k
  {
2570
7.77k
    unsigned lclp = p->lc + p->lp;
2571
7.77k
    if (!p->litProbs || !p->saveState.litProbs || p->lclp != lclp)
2572
7.77k
    {
2573
7.77k
      LzmaEnc_FreeLits(p, alloc);
2574
7.77k
      p->litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, ((UInt32)0x300 << lclp) * sizeof(CLzmaProb));
2575
7.77k
      p->saveState.litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, ((UInt32)0x300 << lclp) * sizeof(CLzmaProb));
2576
7.77k
      if (!p->litProbs || !p->saveState.litProbs)
2577
0
      {
2578
0
        LzmaEnc_FreeLits(p, alloc);
2579
0
        return SZ_ERROR_MEM;
2580
0
      }
2581
7.77k
      p->lclp = lclp;
2582
7.77k
    }
2583
7.77k
  }
2584
2585
7.77k
  p->matchFinderBase.bigHash = (Byte)(p->dictSize > kBigHashDicLimit ? 1 : 0);
2586
2587
7.77k
  if (beforeSize + p->dictSize < keepWindowSize)
2588
0
    beforeSize = keepWindowSize - p->dictSize;
2589
2590
  #ifndef _7ZIP_ST
2591
  if (p->mtMode)
2592
  {
2593
    RINOK(MatchFinderMt_Create(&p->matchFinderMt, p->dictSize, beforeSize, p->numFastBytes,
2594
        LZMA_MATCH_LEN_MAX
2595
        + 1  /* 18.04 */
2596
        , allocBig));
2597
    p->matchFinderObj = &p->matchFinderMt;
2598
    p->matchFinderBase.bigHash = (Byte)(
2599
        (p->dictSize > kBigHashDicLimit && p->matchFinderBase.hashMask >= 0xFFFFFF) ? 1 : 0);
2600
    MatchFinderMt_CreateVTable(&p->matchFinderMt, &p->matchFinder);
2601
  }
2602
  else
2603
  #endif
2604
7.77k
  {
2605
7.77k
    if (!MatchFinder_Create(&p->matchFinderBase, p->dictSize, beforeSize, p->numFastBytes, LZMA_MATCH_LEN_MAX, allocBig))
2606
0
      return SZ_ERROR_MEM;
2607
7.77k
    p->matchFinderObj = &p->matchFinderBase;
2608
7.77k
    MatchFinder_CreateVTable(&p->matchFinderBase, &p->matchFinder);
2609
7.77k
  }
2610
  
2611
7.77k
  return SZ_OK;
2612
7.77k
}
2613
2614
void LzmaEnc_Init(CLzmaEnc *p)
2615
17.5k
{
2616
17.5k
  unsigned i;
2617
17.5k
  p->state = 0;
2618
17.5k
  p->reps[0] =
2619
17.5k
  p->reps[1] =
2620
17.5k
  p->reps[2] =
2621
17.5k
  p->reps[3] = 1;
2622
2623
17.5k
  RangeEnc_Init(&p->rc);
2624
2625
297k
  for (i = 0; i < (1 << kNumAlignBits); i++)
2626
280k
    p->posAlignEncoder[i] = kProbInitValue;
2627
2628
227k
  for (i = 0; i < kNumStates; i++)
2629
210k
  {
2630
210k
    unsigned j;
2631
3.57M
    for (j = 0; j < LZMA_NUM_PB_STATES_MAX; j++)
2632
3.36M
    {
2633
3.36M
      p->isMatch[i][j] = kProbInitValue;
2634
3.36M
      p->isRep0Long[i][j] = kProbInitValue;
2635
3.36M
    }
2636
210k
    p->isRep[i] = kProbInitValue;
2637
210k
    p->isRepG0[i] = kProbInitValue;
2638
210k
    p->isRepG1[i] = kProbInitValue;
2639
210k
    p->isRepG2[i] = kProbInitValue;
2640
210k
  }
2641
2642
17.5k
  {
2643
87.5k
    for (i = 0; i < kNumLenToPosStates; i++)
2644
70.0k
    {
2645
70.0k
      CLzmaProb *probs = p->posSlotEncoder[i];
2646
70.0k
      unsigned j;
2647
4.55M
      for (j = 0; j < (1 << kNumPosSlotBits); j++)
2648
4.48M
        probs[j] = kProbInitValue;
2649
70.0k
    }
2650
17.5k
  }
2651
17.5k
  {
2652
2.25M
    for (i = 0; i < kNumFullDistances; i++)
2653
2.24M
      p->posEncoders[i] = kProbInitValue;
2654
17.5k
  }
2655
2656
17.5k
  {
2657
17.5k
    UInt32 num = (UInt32)0x300 << (p->lp + p->lc);
2658
17.5k
    UInt32 k;
2659
17.5k
    CLzmaProb *probs = p->litProbs;
2660
113M
    for (k = 0; k < num; k++)
2661
113M
      probs[k] = kProbInitValue;
2662
17.5k
  }
2663
2664
2665
17.5k
  LenEnc_Init(&p->lenProbs);
2666
17.5k
  LenEnc_Init(&p->repLenProbs);
2667
2668
17.5k
  p->optEnd = 0;
2669
17.5k
  p->optCur = 0;
2670
2671
17.5k
  {
2672
35.8M
    for (i = 0; i < kNumOpts; i++)
2673
35.8M
      p->opt[i].price = kInfinityPrice;
2674
17.5k
  }
2675
2676
17.5k
  p->additionalOffset = 0;
2677
2678
17.5k
  p->pbMask = (1 << p->pb) - 1;
2679
17.5k
  p->lpMask = ((UInt32)0x100 << p->lp) - ((unsigned)0x100 >> p->lc);
2680
17.5k
}
2681
2682
2683
void LzmaEnc_InitPrices(CLzmaEnc *p)
2684
23.4k
{
2685
23.4k
  if (!p->fastMode)
2686
16.2k
  {
2687
16.2k
    FillDistancesPrices(p);
2688
16.2k
    FillAlignPrices(p);
2689
16.2k
  }
2690
2691
23.4k
  p->lenEnc.tableSize =
2692
23.4k
  p->repLenEnc.tableSize =
2693
23.4k
      p->numFastBytes + 1 - LZMA_MATCH_LEN_MIN;
2694
2695
23.4k
  p->repLenEncCounter = REP_LEN_COUNT;
2696
2697
23.4k
  LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2698
23.4k
  LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
2699
23.4k
}
2700
2701
static SRes LzmaEnc_AllocAndInit(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2702
7.77k
{
2703
7.77k
  unsigned i;
2704
139k
  for (i = kEndPosModelIndex / 2; i < kDicLogSizeMax; i++)
2705
139k
    if (p->dictSize <= ((UInt32)1 << i))
2706
7.77k
      break;
2707
7.77k
  p->distTableSize = i * 2;
2708
2709
7.77k
  p->finished = False;
2710
7.77k
  p->result = SZ_OK;
2711
7.77k
  RINOK(LzmaEnc_Alloc(p, keepWindowSize, alloc, allocBig));
2712
7.77k
  LzmaEnc_Init(p);
2713
7.77k
  LzmaEnc_InitPrices(p);
2714
7.77k
  p->nowPos64 = 0;
2715
7.77k
  return SZ_OK;
2716
7.77k
}
2717
2718
static SRes LzmaEnc_Prepare(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream,
2719
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2720
0
{
2721
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2722
0
  p->matchFinderBase.stream = inStream;
2723
0
  p->needInit = 1;
2724
0
  p->rc.outStream = outStream;
2725
0
  return LzmaEnc_AllocAndInit(p, 0, alloc, allocBig);
2726
0
}
2727
2728
SRes LzmaEnc_PrepareForLzma2(CLzmaEncHandle pp,
2729
    ISeqInStream *inStream, UInt32 keepWindowSize,
2730
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2731
7.77k
{
2732
7.77k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2733
7.77k
  p->matchFinderBase.stream = inStream;
2734
7.77k
  p->needInit = 1;
2735
7.77k
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2736
7.77k
}
2737
2738
static void LzmaEnc_SetInputBuf(CLzmaEnc *p, const Byte *src, SizeT srcLen)
2739
0
{
2740
0
  p->matchFinderBase.directInput = 1;
2741
0
  p->matchFinderBase.bufferBase = (Byte *)src;
2742
0
  p->matchFinderBase.directInputRem = srcLen;
2743
0
}
2744
2745
SRes LzmaEnc_MemPrepare(CLzmaEncHandle pp, const Byte *src, SizeT srcLen,
2746
    UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2747
0
{
2748
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2749
0
  LzmaEnc_SetInputBuf(p, src, srcLen);
2750
0
  p->needInit = 1;
2751
2752
0
  LzmaEnc_SetDataSize(pp, srcLen);
2753
0
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2754
0
}
2755
2756
void LzmaEnc_Finish(CLzmaEncHandle pp)
2757
7.77k
{
2758
  #ifndef _7ZIP_ST
2759
  CLzmaEnc *p = (CLzmaEnc *)pp;
2760
  if (p->mtMode)
2761
    MatchFinderMt_ReleaseStream(&p->matchFinderMt);
2762
  #else
2763
7.77k
  UNUSED_VAR(pp);
2764
7.77k
  #endif
2765
7.77k
}
2766
2767
2768
typedef struct
2769
{
2770
  ISeqOutStream vt;
2771
  Byte *data;
2772
  SizeT rem;
2773
  BoolInt overflow;
2774
} CLzmaEnc_SeqOutStreamBuf;
2775
2776
static size_t SeqOutStreamBuf_Write(const ISeqOutStream *pp, const void *data, size_t size)
2777
15.6k
{
2778
15.6k
  CLzmaEnc_SeqOutStreamBuf *p = CONTAINER_FROM_VTBL(pp, CLzmaEnc_SeqOutStreamBuf, vt);
2779
15.6k
  if (p->rem < size)
2780
0
  {
2781
0
    size = p->rem;
2782
0
    p->overflow = True;
2783
0
  }
2784
15.6k
  memcpy(p->data, data, size);
2785
15.6k
  p->rem -= size;
2786
15.6k
  p->data += size;
2787
15.6k
  return size;
2788
15.6k
}
2789
2790
2791
UInt32 LzmaEnc_GetNumAvailableBytes(CLzmaEncHandle pp)
2792
0
{
2793
0
  const CLzmaEnc *p = (CLzmaEnc *)pp;
2794
0
  return p->matchFinder.GetNumAvailableBytes(p->matchFinderObj);
2795
0
}
2796
2797
2798
const Byte *LzmaEnc_GetCurBuf(CLzmaEncHandle pp)
2799
1.97k
{
2800
1.97k
  const CLzmaEnc *p = (CLzmaEnc *)pp;
2801
1.97k
  return p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset;
2802
1.97k
}
2803
2804
2805
SRes LzmaEnc_CodeOneMemBlock(CLzmaEncHandle pp, BoolInt reInit,
2806
    Byte *dest, size_t *destLen, UInt32 desiredPackSize, UInt32 *unpackSize)
2807
15.6k
{
2808
15.6k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2809
15.6k
  UInt64 nowPos64;
2810
15.6k
  SRes res;
2811
15.6k
  CLzmaEnc_SeqOutStreamBuf outStream;
2812
2813
15.6k
  outStream.vt.Write = SeqOutStreamBuf_Write;
2814
15.6k
  outStream.data = dest;
2815
15.6k
  outStream.rem = *destLen;
2816
15.6k
  outStream.overflow = False;
2817
2818
15.6k
  p->writeEndMark = False;
2819
15.6k
  p->finished = False;
2820
15.6k
  p->result = SZ_OK;
2821
2822
15.6k
  if (reInit)
2823
9.72k
    LzmaEnc_Init(p);
2824
15.6k
  LzmaEnc_InitPrices(p);
2825
2826
15.6k
  nowPos64 = p->nowPos64;
2827
15.6k
  RangeEnc_Init(&p->rc);
2828
15.6k
  p->rc.outStream = &outStream.vt;
2829
2830
15.6k
  if (desiredPackSize == 0)
2831
0
    return SZ_ERROR_OUTPUT_EOF;
2832
2833
15.6k
  res = LzmaEnc_CodeOneBlock(p, desiredPackSize, *unpackSize);
2834
  
2835
15.6k
  *unpackSize = (UInt32)(p->nowPos64 - nowPos64);
2836
15.6k
  *destLen -= outStream.rem;
2837
15.6k
  if (outStream.overflow)
2838
0
    return SZ_ERROR_OUTPUT_EOF;
2839
2840
15.6k
  return res;
2841
15.6k
}
2842
2843
2844
static SRes LzmaEnc_Encode2(CLzmaEnc *p, ICompressProgress *progress)
2845
0
{
2846
0
  SRes res = SZ_OK;
2847
2848
  #ifndef _7ZIP_ST
2849
  Byte allocaDummy[0x300];
2850
  allocaDummy[0] = 0;
2851
  allocaDummy[1] = allocaDummy[0];
2852
  #endif
2853
2854
0
  for (;;)
2855
0
  {
2856
0
    res = LzmaEnc_CodeOneBlock(p, 0, 0);
2857
0
    if (res != SZ_OK || p->finished)
2858
0
      break;
2859
0
    if (progress)
2860
0
    {
2861
0
      res = ICompressProgress_Progress(progress, p->nowPos64, RangeEnc_GetProcessed(&p->rc));
2862
0
      if (res != SZ_OK)
2863
0
      {
2864
0
        res = SZ_ERROR_PROGRESS;
2865
0
        break;
2866
0
      }
2867
0
    }
2868
0
  }
2869
  
2870
0
  LzmaEnc_Finish(p);
2871
2872
  /*
2873
  if (res == SZ_OK && !Inline_MatchFinder_IsFinishedOK(&p->matchFinderBase))
2874
    res = SZ_ERROR_FAIL;
2875
  }
2876
  */
2877
2878
0
  return res;
2879
0
}
2880
2881
2882
SRes LzmaEnc_Encode(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream, ICompressProgress *progress,
2883
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2884
0
{
2885
0
  RINOK(LzmaEnc_Prepare(pp, outStream, inStream, alloc, allocBig));
2886
0
  return LzmaEnc_Encode2((CLzmaEnc *)pp, progress);
2887
0
}
2888
2889
2890
SRes LzmaEnc_WriteProperties(CLzmaEncHandle pp, Byte *props, SizeT *size)
2891
7.77k
{
2892
7.77k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2893
7.77k
  unsigned i;
2894
7.77k
  UInt32 dictSize = p->dictSize;
2895
7.77k
  if (*size < LZMA_PROPS_SIZE)
2896
0
    return SZ_ERROR_PARAM;
2897
7.77k
  *size = LZMA_PROPS_SIZE;
2898
7.77k
  props[0] = (Byte)((p->pb * 5 + p->lp) * 9 + p->lc);
2899
2900
7.77k
  if (dictSize >= ((UInt32)1 << 22))
2901
7.77k
  {
2902
7.77k
    UInt32 kDictMask = ((UInt32)1 << 20) - 1;
2903
7.77k
    if (dictSize < (UInt32)0xFFFFFFFF - kDictMask)
2904
7.77k
      dictSize = (dictSize + kDictMask) & ~kDictMask;
2905
7.77k
  }
2906
0
  else for (i = 11; i <= 30; i++)
2907
0
  {
2908
0
    if (dictSize <= ((UInt32)2 << i)) { dictSize = (2 << i); break; }
2909
0
    if (dictSize <= ((UInt32)3 << i)) { dictSize = (3 << i); break; }
2910
0
  }
2911
2912
38.8k
  for (i = 0; i < 4; i++)
2913
31.0k
    props[1 + i] = (Byte)(dictSize >> (8 * i));
2914
7.77k
  return SZ_OK;
2915
7.77k
}
2916
2917
2918
unsigned LzmaEnc_IsWriteEndMark(CLzmaEncHandle pp)
2919
0
{
2920
0
  return ((CLzmaEnc *)pp)->writeEndMark;
2921
0
}
2922
2923
2924
SRes LzmaEnc_MemEncode(CLzmaEncHandle pp, Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
2925
    int writeEndMark, ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2926
0
{
2927
0
  SRes res;
2928
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2929
2930
0
  CLzmaEnc_SeqOutStreamBuf outStream;
2931
2932
0
  outStream.vt.Write = SeqOutStreamBuf_Write;
2933
0
  outStream.data = dest;
2934
0
  outStream.rem = *destLen;
2935
0
  outStream.overflow = False;
2936
2937
0
  p->writeEndMark = writeEndMark;
2938
0
  p->rc.outStream = &outStream.vt;
2939
2940
0
  res = LzmaEnc_MemPrepare(pp, src, srcLen, 0, alloc, allocBig);
2941
  
2942
0
  if (res == SZ_OK)
2943
0
  {
2944
0
    res = LzmaEnc_Encode2(p, progress);
2945
0
    if (res == SZ_OK && p->nowPos64 != srcLen)
2946
0
      res = SZ_ERROR_FAIL;
2947
0
  }
2948
2949
0
  *destLen -= outStream.rem;
2950
0
  if (outStream.overflow)
2951
0
    return SZ_ERROR_OUTPUT_EOF;
2952
0
  return res;
2953
0
}
2954
2955
2956
SRes LzmaEncode(Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
2957
    const CLzmaEncProps *props, Byte *propsEncoded, SizeT *propsSize, int writeEndMark,
2958
    ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2959
0
{
2960
0
  CLzmaEnc *p = (CLzmaEnc *)LzmaEnc_Create(alloc);
2961
0
  SRes res;
2962
0
  if (!p)
2963
0
    return SZ_ERROR_MEM;
2964
2965
0
  res = LzmaEnc_SetProps(p, props);
2966
0
  if (res == SZ_OK)
2967
0
  {
2968
0
    res = LzmaEnc_WriteProperties(p, propsEncoded, propsSize);
2969
0
    if (res == SZ_OK)
2970
0
      res = LzmaEnc_MemEncode(p, dest, destLen, src, srcLen,
2971
0
          writeEndMark, progress, alloc, allocBig);
2972
0
  }
2973
2974
0
  LzmaEnc_Destroy(p, alloc, allocBig);
2975
0
  return res;
2976
0
}