Coverage Report

Created: 2024-07-27 06:12

/src/lzma-fuzz/sdk/C/LzmaEnc.c
Line
Count
Source (jump to first uncovered line)
1
/* LzmaEnc.c -- LZMA Encoder
2
2019-01-10: Igor Pavlov : Public domain */
3
4
#include "Precomp.h"
5
6
#include <string.h>
7
8
/* #define SHOW_STAT */
9
/* #define SHOW_STAT2 */
10
11
#if defined(SHOW_STAT) || defined(SHOW_STAT2)
12
#include <stdio.h>
13
#endif
14
15
#include "LzmaEnc.h"
16
17
#include "LzFind.h"
18
#ifndef _7ZIP_ST
19
#include "LzFindMt.h"
20
#endif
21
22
#ifdef SHOW_STAT
23
static unsigned g_STAT_OFFSET = 0;
24
#endif
25
26
16.4k
#define kLzmaMaxHistorySize ((UInt32)3 << 29)
27
/* #define kLzmaMaxHistorySize ((UInt32)7 << 29) */
28
29
78.6M
#define kNumTopBits 24
30
78.6M
#define kTopValue ((UInt32)1 << kNumTopBits)
31
32
429M
#define kNumBitModelTotalBits 11
33
350M
#define kBitModelTotal (1 << kNumBitModelTotalBits)
34
209M
#define kNumMoveBits 5
35
151M
#define kProbInitValue (kBitModelTotal >> 1)
36
37
154M
#define kNumMoveReducingBits 4
38
3.02M
#define kNumBitPriceShiftBits 4
39
#define kBitPrice (1 << kNumBitPriceShiftBits)
40
41
28.0k
#define REP_LEN_COUNT 64
42
43
/* Resets *p to its "not yet chosen" state.
   Zero (dictSize, mc) and negative values (all the int options) are the
   markers that LzmaEncProps_Normalize() replaces with concrete defaults. */
void LzmaEncProps_Init(CLzmaEncProps *p)
{
  p->level = 5;

  /* 0 = let Normalize() pick a value */
  p->mc = 0;
  p->dictSize = 0;

  /* all bits set */
  p->reduceSize = (UInt64)(Int64)-1;

  /* negative = let Normalize() pick a value */
  p->numThreads = -1;
  p->numHashBytes = -1;
  p->btMode = -1;
  p->fb = -1;
  p->algo = -1;
  p->pb = -1;
  p->lp = -1;
  p->lc = -1;

  p->writeEndMark = 0;
}
51
52
/* Replaces every "unset" field of *p (0 for dictSize / mc, negative for the
   int options) with a concrete default.  Most defaults depend on the
   compression level; a negative level is treated as level 5. */
void LzmaEncProps_Normalize(CLzmaEncProps *p)
{
  int level = p->level;
  if (level < 0)
    level = 5;
  p->level = level;

  if (p->dictSize == 0)
  {
    if (level <= 5)
      p->dictSize = (1 << (level * 2 + 14));
    else if (level <= 7)
      p->dictSize = (1 << 25);
    else
      p->dictSize = (1 << 26);
  }

  /* Shrink the dictionary to the first size of the form 2<<i or 3<<i
     (i = 11..30) that is not smaller than reduceSize. */
  if (p->dictSize > p->reduceSize)
  {
    const UInt32 reduceSize = (UInt32)p->reduceSize;
    unsigned i;
    for (i = 11; i <= 30; i++)
    {
      const UInt32 size2 = ((UInt32)2 << i);
      const UInt32 size3 = ((UInt32)3 << i);
      if (reduceSize <= size2)
      {
        p->dictSize = size2;
        break;
      }
      if (reduceSize <= size3)
      {
        p->dictSize = size3;
        break;
      }
    }
  }

  if (p->lc < 0)
    p->lc = 3;
  if (p->lp < 0)
    p->lp = 0;
  if (p->pb < 0)
    p->pb = 2;

  if (p->algo < 0)
    p->algo = (level < 5) ? 0 : 1;
  if (p->fb < 0)
    p->fb = (level < 7) ? 32 : 64;
  if (p->btMode < 0)
    p->btMode = (p->algo == 0) ? 0 : 1;
  if (p->numHashBytes < 0)
    p->numHashBytes = 4;

  if (p->mc == 0)
  {
    /* the cut value is halved when btMode is 0 */
    int mc = 16 + (p->fb >> 1);
    if (!p->btMode)
      mc >>= 1;
    p->mc = mc;
  }

  if (p->numThreads < 0)
  {
    #ifndef _7ZIP_ST
    p->numThreads = ((p->btMode && p->algo) ? 2 : 1);
    #else
    p->numThreads = 1;
    #endif
  }
}
88
89
UInt32 LzmaEncProps_GetDictSize(const CLzmaEncProps *props2)
90
8.23k
{
91
8.23k
  CLzmaEncProps props = *props2;
92
8.23k
  LzmaEncProps_Normalize(&props);
93
8.23k
  return props.dictSize;
94
8.23k
}
95
96
#if (_MSC_VER >= 1400)
97
/* BSR code is fast for some new CPUs */
98
/* #define LZMA_LOG_BSR */
99
#endif
100
101
#ifdef LZMA_LOG_BSR
102
103
#define kDicLogSizeMaxCompress 32
104
105
#define BSR2_RET(pos, res) { unsigned long zz; _BitScanReverse(&zz, (pos)); res = (zz + zz) + ((pos >> (zz - 1)) & 1); }
106
107
/* Function form of BSR2_RET: returns the slot value the macro computes for pos. */
static unsigned GetPosSlot1(UInt32 pos)
{
  unsigned slot;
  BSR2_RET(pos, slot);
  return slot;
}
113
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
114
#define GetPosSlot(pos, res) { if (pos < 2) res = pos; else BSR2_RET(pos, res); }
115
116
#else
117
118
4.53M
#define kNumLogBits (9 + sizeof(size_t) / 2)
119
/* #define kNumLogBits (11 + sizeof(size_t) / 8 * 3) */
120
121
16.4k
#define kDicLogSizeMaxCompress ((kNumLogBits - 1) * 2 + 7)
122
123
/* Fills the g_FastPos lookup table.
   Entries 0 and 1 hold their own index; after that, each slot value
   s = 2 .. kNumLogBits * 2 - 1 occupies a run of 1 << ((s >> 1) - 1)
   consecutive entries. */
static void LzmaEnc_FastPosInit(Byte *g_FastPos)
{
  Byte *cursor = g_FastPos;
  unsigned slot;

  *cursor++ = 0;
  *cursor++ = 1;

  for (slot = 2; slot < kNumLogBits * 2; slot++)
  {
    const size_t runLen = ((size_t)1 << ((slot >> 1) - 1));
    memset(cursor, (int)slot, runLen);
    cursor += runLen;
  }
}
139
140
/* we can use ((limit - pos) >> 31) only if (pos < ((UInt32)1 << 31)) */
141
/*
142
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
143
  (0 - (((((UInt32)1 << (kNumLogBits + 6)) - 1) - pos) >> 31))); \
144
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
145
*/
146
147
/*
148
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
149
  (0 - (((((UInt32)1 << (kNumLogBits)) - 1) - (pos >> 6)) >> 31))); \
150
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
151
*/
152
153
4.30M
#define BSR2_RET(pos, res) { unsigned zz = (pos < (1 << (kNumLogBits + 6))) ? 6 : 6 + kNumLogBits - 1; \
154
4.30M
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
155
156
/*
157
#define BSR2_RET(pos, res) { res = (pos < (1 << (kNumLogBits + 6))) ? \
158
  p->g_FastPos[pos >> 6] + 12 : \
159
  p->g_FastPos[pos >> (6 + kNumLogBits - 1)] + (6 + (kNumLogBits - 1)) * 2; }
160
*/
161
162
8.48M
#define GetPosSlot1(pos) p->g_FastPos[pos]
163
4.16M
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
164
909k
#define GetPosSlot(pos, res) { if (pos < kNumFullDistances) res = p->g_FastPos[pos & (kNumFullDistances - 1)]; else BSR2_RET(pos, res); }
165
166
#endif
167
168
169
75.3M
#define LZMA_NUM_REPS 4
170
171
typedef UInt16 CState;
172
typedef UInt16 CExtra;
173
174
typedef struct
175
{
176
  UInt32 price;
177
  CState state;
178
  CExtra extra;
179
      // 0   : normal
180
      // 1   : LIT : MATCH
181
      // > 1 : MATCH (extra-1) : LIT : REP0 (len)
182
  UInt32 len;
183
  UInt32 dist;
184
  UInt32 reps[LZMA_NUM_REPS];
185
} COptimal;
186
187
188
// 18.06
189
60.5M
#define kNumOpts (1 << 11)
190
6.39M
#define kPackReserve (kNumOpts * 8)
191
// #define kNumOpts (1 << 12)
192
// #define kPackReserve (1 + kNumOpts * 2)
193
194
31.5M
#define kNumLenToPosStates 4
195
27.3M
#define kNumPosSlotBits 6
196
#define kDicLogSizeMin 0
197
148k
#define kDicLogSizeMax 32
198
#define kDistTableSizeMax (kDicLogSizeMax * 2)
199
200
7.06M
#define kNumAlignBits 4
201
6.63M
#define kAlignTableSize (1 << kNumAlignBits)
202
6.39M
#define kAlignMask (kAlignTableSize - 1)
203
204
936k
#define kStartPosModelIndex 4
205
42.1M
#define kEndPosModelIndex 14
206
42.8M
#define kNumFullDistances (1 << (kEndPosModelIndex >> 1))
207
208
typedef
209
#ifdef _LZMA_PROB32
210
  UInt32
211
#else
212
  UInt16
213
#endif
214
  CLzmaProb;
215
216
13.3M
#define LZMA_PB_MAX 4
217
32.9k
#define LZMA_LC_MAX 8
218
32.9k
#define LZMA_LP_MAX 4
219
220
13.3M
#define LZMA_NUM_PB_STATES_MAX (1 << LZMA_PB_MAX)
221
222
27.9M
#define kLenNumLowBits 3
223
16.6M
#define kLenNumLowSymbols (1 << kLenNumLowBits)
224
27.3M
#define kLenNumHighBits 8
225
22.6M
#define kLenNumHighSymbols (1 << kLenNumHighBits)
226
13.0M
#define kLenNumSymbolsTotal (kLenNumLowSymbols * 2 + kLenNumHighSymbols)
227
228
114M
#define LZMA_MATCH_LEN_MIN 2
229
13.0M
#define LZMA_MATCH_LEN_MAX (LZMA_MATCH_LEN_MIN + kLenNumSymbolsTotal - 1)
230
231
241k
#define kNumStates 12
232
233
234
typedef struct
235
{
236
  CLzmaProb low[LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1)];
237
  CLzmaProb high[kLenNumHighSymbols];
238
} CLenEnc;
239
240
241
typedef struct
242
{
243
  unsigned tableSize;
244
  UInt32 prices[LZMA_NUM_PB_STATES_MAX][kLenNumSymbolsTotal];
245
  // UInt32 prices1[LZMA_NUM_PB_STATES_MAX][kLenNumLowSymbols * 2];
246
  // UInt32 prices2[kLenNumSymbolsTotal];
247
} CLenPriceEnc;
248
249
#define GET_PRICE_LEN(p, posState, len) \
250
100M
    ((p)->prices[posState][(size_t)(len) - LZMA_MATCH_LEN_MIN])
251
252
/*
253
#define GET_PRICE_LEN(p, posState, len) \
254
    ((p)->prices2[(size_t)(len) - 2] + ((p)->prices1[posState][((len) - 2) & (kLenNumLowSymbols * 2 - 1)] & (((len) - 2 - kLenNumLowSymbols * 2) >> 9)))
255
*/
256
257
typedef struct
258
{
259
  UInt32 range;
260
  unsigned cache;
261
  UInt64 low;
262
  UInt64 cacheSize;
263
  Byte *buf;
264
  Byte *bufLim;
265
  Byte *bufBase;
266
  ISeqOutStream *outStream;
267
  UInt64 processed;
268
  SRes res;
269
} CRangeEnc;
270
271
272
typedef struct
273
{
274
  CLzmaProb *litProbs;
275
276
  unsigned state;
277
  UInt32 reps[LZMA_NUM_REPS];
278
279
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
280
  CLzmaProb isRep[kNumStates];
281
  CLzmaProb isRepG0[kNumStates];
282
  CLzmaProb isRepG1[kNumStates];
283
  CLzmaProb isRepG2[kNumStates];
284
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
285
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
286
287
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
288
  CLzmaProb posEncoders[kNumFullDistances];
289
  
290
  CLenEnc lenProbs;
291
  CLenEnc repLenProbs;
292
293
} CSaveState;
294
295
296
typedef UInt32 CProbPrice;
297
298
299
typedef struct
300
{
301
  void *matchFinderObj;
302
  IMatchFinder matchFinder;
303
304
  unsigned optCur;
305
  unsigned optEnd;
306
307
  unsigned longestMatchLen;
308
  unsigned numPairs;
309
  UInt32 numAvail;
310
311
  unsigned state;
312
  unsigned numFastBytes;
313
  unsigned additionalOffset;
314
  UInt32 reps[LZMA_NUM_REPS];
315
  unsigned lpMask, pbMask;
316
  CLzmaProb *litProbs;
317
  CRangeEnc rc;
318
319
  UInt32 backRes;
320
321
  unsigned lc, lp, pb;
322
  unsigned lclp;
323
324
  BoolInt fastMode;
325
  BoolInt writeEndMark;
326
  BoolInt finished;
327
  BoolInt multiThread;
328
  BoolInt needInit;
329
  // BoolInt _maxMode;
330
331
  UInt64 nowPos64;
332
  
333
  unsigned matchPriceCount;
334
  // unsigned alignPriceCount;
335
  int repLenEncCounter;
336
337
  unsigned distTableSize;
338
339
  UInt32 dictSize;
340
  SRes result;
341
342
  #ifndef _7ZIP_ST
343
  BoolInt mtMode;
344
  // begin of CMatchFinderMt is used in LZ thread
345
  CMatchFinderMt matchFinderMt;
346
  // end of CMatchFinderMt is used in BT and HASH threads
347
  #endif
348
349
  CMatchFinder matchFinderBase;
350
351
  #ifndef _7ZIP_ST
352
  Byte pad[128];
353
  #endif
354
  
355
  // LZ thread
356
  CProbPrice ProbPrices[kBitModelTotal >> kNumMoveReducingBits];
357
358
  UInt32 matches[LZMA_MATCH_LEN_MAX * 2 + 2 + 1];
359
360
  UInt32 alignPrices[kAlignTableSize];
361
  UInt32 posSlotPrices[kNumLenToPosStates][kDistTableSizeMax];
362
  UInt32 distancesPrices[kNumLenToPosStates][kNumFullDistances];
363
364
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
365
  CLzmaProb isRep[kNumStates];
366
  CLzmaProb isRepG0[kNumStates];
367
  CLzmaProb isRepG1[kNumStates];
368
  CLzmaProb isRepG2[kNumStates];
369
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
370
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
371
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
372
  CLzmaProb posEncoders[kNumFullDistances];
373
  
374
  CLenEnc lenProbs;
375
  CLenEnc repLenProbs;
376
377
  #ifndef LZMA_LOG_BSR
378
  Byte g_FastPos[1 << kNumLogBits];
379
  #endif
380
381
  CLenPriceEnc lenEnc;
382
  CLenPriceEnc repLenEnc;
383
384
  COptimal opt[kNumOpts];
385
386
  CSaveState saveState;
387
388
  #ifndef _7ZIP_ST
389
  Byte pad2[128];
390
  #endif
391
} CLzmaEnc;
392
393
394
395
186k
/* Copies the array member `arr` from *src to *dest (both are pointers to
   structures that have a member of that name and size).
   The expansion is a single expression without a trailing semicolon, so
   the macro behaves like a function call and is safe as the body of an
   un-braced if / else.  Pointer arguments are parenthesized so that
   expressions such as `&obj` can be passed. */
#define COPY_ARR(dest, src, arr) memcpy((dest)->arr, (src)->arr, sizeof((src)->arr))
396
397
/* Copies the adaptive state of the encoder (state, reps, every probability
   model including the literal probabilities) into its embedded saveState.
   saveState.litProbs must already point to a buffer large enough for
   (0x300 << lclp) probabilities. */
void LzmaEnc_SaveState(CLzmaEncHandle pp)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  CSaveState *saved = &enc->saveState;

  saved->state = enc->state;
  COPY_ARR(saved, enc, reps);

  saved->lenProbs = enc->lenProbs;
  saved->repLenProbs = enc->repLenProbs;

  COPY_ARR(saved, enc, posAlignEncoder);
  COPY_ARR(saved, enc, isRep);
  COPY_ARR(saved, enc, isRepG0);
  COPY_ARR(saved, enc, isRepG1);
  COPY_ARR(saved, enc, isRepG2);
  COPY_ARR(saved, enc, isMatch);
  COPY_ARR(saved, enc, isRep0Long);
  COPY_ARR(saved, enc, posSlotEncoder);
  COPY_ARR(saved, enc, posEncoders);

  memcpy(saved->litProbs, enc->litProbs, ((UInt32)0x300 << enc->lclp) * sizeof(CLzmaProb));
}
421
422
423
/* Inverse of LzmaEnc_SaveState(): copies state, reps and every probability
   model from the embedded saveState back into the live encoder. */
void LzmaEnc_RestoreState(CLzmaEncHandle pp)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  const CSaveState *saved = &enc->saveState;

  enc->state = saved->state;
  COPY_ARR(enc, saved, reps);

  enc->lenProbs = saved->lenProbs;
  enc->repLenProbs = saved->repLenProbs;

  COPY_ARR(enc, saved, posAlignEncoder);
  COPY_ARR(enc, saved, isRep);
  COPY_ARR(enc, saved, isRepG0);
  COPY_ARR(enc, saved, isRepG1);
  COPY_ARR(enc, saved, isRepG2);
  COPY_ARR(enc, saved, isMatch);
  COPY_ARR(enc, saved, isRep0Long);
  COPY_ARR(enc, saved, posSlotEncoder);
  COPY_ARR(enc, saved, posEncoders);

  memcpy(enc->litProbs, saved->litProbs, ((UInt32)0x300 << enc->lclp) * sizeof(CLzmaProb));
}
447
448
449
450
/* Validates a normalized copy of *props2 and stores the settings in the
   encoder.
   Returns SZ_ERROR_PARAM when lc / lp / pb or the dictionary size exceed
   the supported limits, SZ_OK otherwise.  The caller's structure is not
   modified. */
SRes LzmaEnc_SetProps(CLzmaEncHandle pp, const CLzmaEncProps *props2)
{
  CLzmaEnc *p = (CLzmaEnc *)pp;
  CLzmaEncProps props = *props2;
  unsigned fb;
  unsigned numHashBytes;

  LzmaEncProps_Normalize(&props);

  if (props.lc > LZMA_LC_MAX)
    return SZ_ERROR_PARAM;
  if (props.lp > LZMA_LP_MAX)
    return SZ_ERROR_PARAM;
  if (props.pb > LZMA_PB_MAX)
    return SZ_ERROR_PARAM;
  if (props.dictSize > ((UInt64)1 << kDicLogSizeMaxCompress))
    return SZ_ERROR_PARAM;
  if (props.dictSize > kLzmaMaxHistorySize)
    return SZ_ERROR_PARAM;

  p->dictSize = props.dictSize;

  /* number of fast bytes is clamped to [5, LZMA_MATCH_LEN_MAX] */
  fb = props.fb;
  if (fb < 5)
    fb = 5;
  if (fb > LZMA_MATCH_LEN_MAX)
    fb = LZMA_MATCH_LEN_MAX;
  p->numFastBytes = fb;

  p->lc = props.lc;
  p->lp = props.lp;
  p->pb = props.pb;
  p->fastMode = (props.algo == 0);
  // p->_maxMode = True;
  p->matchFinderBase.btMode = (Byte)(props.btMode ? 1 : 0);

  /* 4 hash bytes unless btMode is set and fewer were requested;
     values below 2 are raised to 2 */
  numHashBytes = 4;
  if (props.btMode)
  {
    if (props.numHashBytes < 2)
      numHashBytes = 2;
    else if (props.numHashBytes < 4)
      numHashBytes = props.numHashBytes;
  }
  p->matchFinderBase.numHashBytes = numHashBytes;

  p->matchFinderBase.cutValue = props.mc;

  p->writeEndMark = props.writeEndMark;

  #ifndef _7ZIP_ST
  /*
  if (newMultiThread != _multiThread)
  {
    ReleaseMatchFinder();
    _multiThread = newMultiThread;
  }
  */
  p->multiThread = (props.numThreads > 1);
  #endif

  return SZ_OK;
}
507
508
509
/* Stores the expected input size in the encoder's base match finder. */
void LzmaEnc_SetDataSize(CLzmaEncHandle pp, UInt64 expectedDataSiize)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  CMatchFinder *mf = &enc->matchFinderBase;
  mf->expectedDataSize = expectedDataSiize;
}
514
515
516
8.23k
#define kState_Start 0
517
1.01M
#define kState_LitAfterMatch 4
518
1.87M
#define kState_LitAfterRep   5
519
0
#define kState_MatchAfterLit 7
520
58.3k
#define kState_RepAfterLit   8
521
522
static const Byte kLiteralNextStates[kNumStates] = {0, 0, 0, 0, 1, 2, 3, 4,  5,  6,   4, 5};
523
static const Byte kMatchNextStates[kNumStates]   = {7, 7, 7, 7, 7, 7, 7, 10, 10, 10, 10, 10};
524
static const Byte kRepNextStates[kNumStates]     = {8, 8, 8, 8, 8, 8, 8, 11, 11, 11, 11, 11};
525
static const Byte kShortRepNextStates[kNumStates]= {9, 9, 9, 9, 9, 9, 9, 11, 11, 11, 11, 11};
526
527
13.5M
#define IsLitState(s) ((s) < 7)
528
16.8M
#define GetLenToPosState2(len) (((len) < kNumLenToPosStates - 1) ? (len) : kNumLenToPosStates - 1)
529
1.60M
#define GetLenToPosState(len) (((len) < kNumLenToPosStates + 1) ? (len) - 2 : kNumLenToPosStates - 1)
530
531
53.3M
#define kInfinityPrice (1 << 30)
532
533
/* Puts the range coder into its "nothing allocated, no stream" state. */
static void RangeEnc_Construct(CRangeEnc *p)
{
  p->bufBase = NULL;
  p->outStream = NULL;
}
538
539
#define RangeEnc_GetProcessed(p)       ((p)->processed + ((p)->buf - (p)->bufBase) + (p)->cacheSize)
540
6.39M
#define RangeEnc_GetProcessed_sizet(p) ((size_t)(p)->processed + ((p)->buf - (p)->bufBase) + (size_t)(p)->cacheSize)
541
542
8.23k
#define RC_BUF_SIZE (1 << 16)
543
544
/* Allocates the RC_BUF_SIZE output buffer unless one already exists.
   Returns 1 on success (or if the buffer was already present), 0 if the
   allocator failed. */
static int RangeEnc_Alloc(CRangeEnc *p, ISzAllocPtr alloc)
{
  if (p->bufBase)
    return 1;

  p->bufBase = (Byte *)ISzAlloc_Alloc(alloc, RC_BUF_SIZE);
  if (!p->bufBase)
    return 0;

  p->bufLim = p->bufBase + RC_BUF_SIZE;
  return 1;
}
555
556
/* Releases the output buffer and clears the pointer, so that a later
   RangeEnc_Alloc() allocates a fresh one. */
static void RangeEnc_Free(CRangeEnc *p, ISzAllocPtr alloc)
{
  ISzAlloc_Free(alloc, p->bufBase);
  p->bufBase = NULL;
}
561
562
/* Resets the coder for a new stream: full range, empty carry cache,
   write position at the start of the buffer, no error recorded. */
static void RangeEnc_Init(CRangeEnc *p)
{
  /* Stream.Init(); */
  p->low = 0;
  p->range = 0xFFFFFFFF;
  p->cacheSize = 0;
  p->cache = 0;

  p->buf = p->bufBase;

  p->res = SZ_OK;
  p->processed = 0;
}
575
576
/* Writes the buffered bytes to outStream and rewinds the buffer.
   Does nothing once an error has been recorded.  A short write sets
   res to SZ_ERROR_WRITE; the byte counter and the buffer position are
   updated in either case. */
MY_NO_INLINE static void RangeEnc_FlushStream(CRangeEnc *p)
{
  size_t pending;
  size_t written;

  if (p->res != SZ_OK)
    return;

  pending = p->buf - p->bufBase;
  written = ISeqOutStream_Write(p->outStream, p->bufBase, pending);
  if (written != pending)
    p->res = SZ_ERROR_WRITE;

  p->processed += pending;
  p->buf = p->bufBase;
}
587
588
/* Shifts the top byte out of `low`.
   While the byte is 0xFF and no carry has occurred, the outcome of a
   future carry is still unknown, so the byte is only counted in
   cacheSize.  Otherwise the cached byte (plus carry) is emitted, followed
   by the counted pending bytes (0xFF plus carry, truncated to a byte),
   and the new top byte becomes the cache. */
MY_NO_INLINE static void MY_FAST_CALL RangeEnc_ShiftLow(CRangeEnc *p)
{
  const UInt32 low32 = (UInt32)p->low;
  unsigned carry = (unsigned)(p->low >> 32);

  p->low = (UInt32)(low32 << 8);

  if (low32 >= (UInt32)0xFF000000 && carry == 0)
  {
    /* cannot decide yet: postpone one more byte */
    p->cacheSize++;
    return;
  }

  *p->buf++ = (Byte)(p->cache + carry);
  p->cache = (unsigned)(low32 >> 24);
  if (p->buf == p->bufLim)
    RangeEnc_FlushStream(p);

  if (p->cacheSize == 0)
    return;

  /* flush the postponed bytes */
  carry += 0xFF;
  do
  {
    *p->buf++ = (Byte)(carry);
    if (p->buf == p->bufLim)
      RangeEnc_FlushStream(p);
  }
  while (--p->cacheSize != 0);
}
619
620
/* Pushes the remaining state of the coder out by shifting `low` five times. */
static void RangeEnc_FlushData(CRangeEnc *p)
{
  int remaining = 5;
  while (remaining-- > 0)
    RangeEnc_ShiftLow(p);
}
626
627
78.6M
#define RC_NORM(p) if (range < kTopValue) { range <<= 8; RangeEnc_ShiftLow(p); }
628
629
#define RC_BIT_PRE(p, prob) \
630
78.0M
  ttt = *(prob); \
631
78.0M
  newBound = (range >> kNumBitModelTotalBits) * ttt;
632
633
// #define _LZMA_ENC_USE_BRANCH
634
635
#ifdef _LZMA_ENC_USE_BRANCH
636
637
#define RC_BIT(p, prob, bit) { \
638
  RC_BIT_PRE(p, prob) \
639
  if (bit == 0) { range = newBound; ttt += (kBitModelTotal - ttt) >> kNumMoveBits; } \
640
  else { (p)->low += newBound; range -= newBound; ttt -= ttt >> kNumMoveBits; } \
641
  *(prob) = (CLzmaProb)ttt; \
642
  RC_NORM(p) \
643
  }
644
645
#else
646
647
65.4M
#define RC_BIT(p, prob, bit) { \
648
65.4M
  UInt32 mask; \
649
65.4M
  RC_BIT_PRE(p, prob) \
650
65.4M
  mask = 0 - (UInt32)bit; \
651
65.4M
  range &= mask; \
652
65.4M
  mask &= newBound; \
653
65.4M
  range -= mask; \
654
65.4M
  (p)->low += mask; \
655
65.4M
  mask = (UInt32)bit - 1; \
656
65.4M
  range += newBound & mask; \
657
65.4M
  mask &= (kBitModelTotal - ((1 << kNumMoveBits) - 1)); \
658
65.4M
  mask += ((1 << kNumMoveBits) - 1); \
659
65.4M
  ttt += (Int32)(mask - ttt) >> kNumMoveBits; \
660
65.4M
  *(prob) = (CLzmaProb)ttt; \
661
65.4M
  RC_NORM(p) \
662
65.4M
  }
663
664
#endif
665
666
667
668
669
#define RC_BIT_0_BASE(p, prob) \
670
9.48M
  range = newBound; *(prob) = (CLzmaProb)(ttt + ((kBitModelTotal - ttt) >> kNumMoveBits));
671
672
#define RC_BIT_1_BASE(p, prob) \
673
3.05M
  range -= newBound; (p)->low += newBound; *(prob) = (CLzmaProb)(ttt - (ttt >> kNumMoveBits)); \
674
675
#define RC_BIT_0(p, prob) \
676
9.13M
  RC_BIT_0_BASE(p, prob) \
677
9.13M
  RC_NORM(p)
678
679
#define RC_BIT_1(p, prob) \
680
2.85M
  RC_BIT_1_BASE(p, prob) \
681
2.85M
  RC_NORM(p)
682
683
/* Encodes a single 0 bit with the adaptive model *prob.
   The local names range / ttt / newBound are the ones the RC_* macros
   operate on. */
static void RangeEnc_EncodeBit_0(CRangeEnc *p, CLzmaProb *prob)
{
  UInt32 range = p->range;
  UInt32 ttt;
  UInt32 newBound;

  RC_BIT_PRE(p, prob)
  RC_BIT_0(p, prob)

  p->range = range;
}
691
692
/* Encodes sym with a bit tree rooted at probs[1], most significant bit
   first.  The 0x100 marker bit OR-ed into sym doubles as the tree-node
   prefix (sym >> 8) and as the loop terminator: the loop ends once the
   marker has been shifted up to bit 16. */
static void LitEnc_Encode(CRangeEnc *p, CLzmaProb *probs, UInt32 sym)
{
  UInt32 range = p->range;

  sym |= 0x100;
  for (;;)
  {
    UInt32 ttt, newBound;
    // RangeEnc_EncodeBit(p, probs + (sym >> 8), (sym >> 7) & 1);
    const UInt32 bit = (sym >> 7) & 1;
    CLzmaProb *prob = probs + (sym >> 8);
    sym <<= 1;
    RC_BIT(p, prob, bit);
    if (sym >= 0x10000)
      break;
  }

  p->range = range;
}
708
709
/* Encodes literal sym using matchByte as additional context.
   `offs` stays 0x100 while the bits of sym encoded so far equal the
   corresponding bits of matchByte, and selects the matchByte-dependent
   part of the probability table; after the first mismatch it becomes 0. */
static void LitEnc_EncodeMatched(CRangeEnc *p, CLzmaProb *probs, UInt32 sym, UInt32 matchByte)
{
  UInt32 range = p->range;
  UInt32 offs = 0x100;

  sym |= 0x100;
  for (;;)
  {
    UInt32 ttt, newBound;
    UInt32 bit;
    CLzmaProb *prob;

    matchByte <<= 1;
    // RangeEnc_EncodeBit(p, probs + (offs + (matchByte & offs) + (sym >> 8)), (sym >> 7) & 1);
    bit = (sym >> 7) & 1;
    prob = probs + (offs + (matchByte & offs) + (sym >> 8));
    sym <<= 1;
    offs &= ~(matchByte ^ sym);
    RC_BIT(p, prob, bit);

    if (sym >= 0x10000)
      break;
  }

  p->range = range;
}
730
731
732
733
/* Builds the probability -> price table.
   Entry i stands for the probability value at the middle of bucket i,
   w = (i << kNumMoveReducingBits) + half a bucket.  w is squared
   kNumBitPriceShiftBits times and renormalized below 1 << 16 after each
   squaring; the accumulated number of renormalization shifts is
   subtracted from a constant to give the price. */
static void LzmaEnc_InitPriceTables(CProbPrice *ProbPrices)
{
  UInt32 i;
  for (i = 0; i < (kBitModelTotal >> kNumMoveReducingBits); i++)
  {
    UInt32 w = (i << kNumMoveReducingBits) + (1 << (kNumMoveReducingBits - 1));
    unsigned bitCount = 0;
    unsigned round;

    for (round = kNumBitPriceShiftBits; round != 0; round--)
    {
      w = w * w;
      bitCount <<= 1;
      for (; w >= ((UInt32)1 << 16); w >>= 1)
        bitCount++;
    }

    ProbPrices[i] = (CProbPrice)((kNumBitModelTotalBits << kNumBitPriceShiftBits) - 15 - bitCount);
    // printf("\n%3d: %5d", i, ProbPrices[i]);
  }
}
756
757
758
/* Price lookups for coding one bit with probability model value `prob`.

   GET_PRICE*  read the table through the encoder pointer `p` that must be
               in scope at the point of use;
   GET_PRICEa* read a table pointer named `ProbPrices` that must be in
               scope at the point of use.

   For bit == 1 the probability is mirrored (XOR with kBitModelTotal - 1)
   before the table lookup.

   Every macro expands to a plain expression with no trailing semicolon,
   so it can be used as an operand inside a larger expression. */
#define GET_PRICE(prob, bit) \
  p->ProbPrices[((prob) ^ (unsigned)(((-(int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits]

#define GET_PRICEa(prob, bit) \
     ProbPrices[((prob) ^ (unsigned)((-((int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits]

#define GET_PRICE_0(prob) p->ProbPrices[(prob) >> kNumMoveReducingBits]
#define GET_PRICE_1(prob) p->ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]

#define GET_PRICEa_0(prob) ProbPrices[(prob) >> kNumMoveReducingBits]
#define GET_PRICEa_1(prob) ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
769
770
771
/* Returns the summed price of the 8 bit decisions of sym in the bit tree
   `probs`.  The tree is walked from the leaf towards the root: the low bit
   of the marked symbol is the decision, the remaining high bits are the
   index of the node that made it. */
static UInt32 LitEnc_GetPrice(const CLzmaProb *probs, UInt32 sym, const CProbPrice *ProbPrices)
{
  UInt32 total = 0;

  /* after this, sym >= 0x100, so the loop body runs at least once */
  sym |= 0x100;
  while (sym > 1)
  {
    const unsigned bit = sym & 1;
    sym >>= 1;
    total += GET_PRICEa(probs[sym], bit);
  }
  return total;
}
784
785
786
/* Price counterpart of LitEnc_EncodeMatched(): visits the same probability
   nodes in the same order and adds up the price of each bit of sym. */
static UInt32 LitEnc_Matched_GetPrice(const CLzmaProb *probs, UInt32 sym, UInt32 matchByte, const CProbPrice *ProbPrices)
{
  UInt32 total = 0;
  UInt32 offs = 0x100;

  sym |= 0x100;
  for (;;)
  {
    UInt32 node;
    UInt32 bit;

    matchByte <<= 1;
    node = offs + (matchByte & offs) + (sym >> 8);
    bit = (sym >> 7) & 1;
    total += GET_PRICEa(probs[node], bit);
    sym <<= 1;
    offs &= ~(matchByte ^ sym);

    if (sym >= 0x10000)
      break;
  }
  return total;
}
801
802
803
/* Encodes the numBits low bits of sym, least significant bit first, with a
   bit tree rooted at probs[1].  numBits must be at least 1. */
static void RcTree_ReverseEncode(CRangeEnc *rc, CLzmaProb *probs, unsigned numBits, unsigned sym)
{
  UInt32 range = rc->range;
  unsigned node = 1;

  for (;;)
  {
    UInt32 ttt, newBound;
    const unsigned bit = sym & 1;
    // RangeEnc_EncodeBit(rc, probs + node, bit);
    sym >>= 1;
    RC_BIT(rc, probs + node, bit);
    node = (node << 1) | bit;
    if (--numBits == 0)
      break;
  }

  rc->range = range;
}
819
820
821
822
/* Resets every probability of the length coder to kProbInitValue. */
static void LenEnc_Init(CLenEnc *p)
{
  CLzmaProb *prob;
  CLzmaProb *end;

  end = p->low + (LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1));
  for (prob = p->low; prob != end; prob++)
    *prob = kProbInitValue;

  end = p->high + kLenNumHighSymbols;
  for (prob = p->high; prob != end; prob++)
    *prob = kProbInitValue;
}
830
831
/* Encodes length symbol sym (length - LZMA_MATCH_LEN_MIN).
     sym <  8 : choice bit 0, then a 3-bit tree selected by posState
     sym < 16 : choice bits 1,0, then the second 3-bit tree for posState
     else     : choice bits 1,1, then an 8-bit tree over `high`
   The local names range / ttt / newBound are the ones the RC_* macros
   operate on. */
static void LenEnc_Encode(CLenEnc *p, CRangeEnc *rc, unsigned sym, unsigned posState)
{
  UInt32 range = rc->range;
  UInt32 ttt, newBound;
  CLzmaProb *probs = p->low;
  unsigned node;
  unsigned shift;

  RC_BIT_PRE(rc, probs);
  if (sym >= kLenNumLowSymbols)
  {
    RC_BIT_1(rc, probs);
    probs += kLenNumLowSymbols;
    RC_BIT_PRE(rc, probs);
    if (sym >= kLenNumLowSymbols * 2)
    {
      RC_BIT_1(rc, probs);
      rc->range = range;
      // RcTree_Encode(rc, p->high, kLenNumHighBits, sym - kLenNumLowSymbols * 2);
      LitEnc_Encode(rc, p->high, sym - kLenNumLowSymbols * 2);
      return;
    }
    sym -= kLenNumLowSymbols;
  }

  /* here sym is in [0, kLenNumLowSymbols) */
  // RcTree_Encode(rc, probs + (posState << kLenNumLowBits), kLenNumLowBits, sym);
  RC_BIT_0(rc, probs);
  probs += (posState << (1 + kLenNumLowBits));

  node = 1;
  for (shift = kLenNumLowBits; shift-- != 0;)
  {
    const unsigned bit = (sym >> shift) & 1;
    RC_BIT(rc, probs + node, bit);
    node = (node << 1) + bit;
  }

  rc->range = range;
}
865
866
/* Fills prices[0..7] with startPrice plus the price of coding each 3-bit
   symbol in the bit tree `probs` (root at probs[1]).  Symbols are handled
   in pairs that share the two upper bits and differ only in the leaf bit. */
static void SetPrices_3(const CLzmaProb *probs, UInt32 startPrice, UInt32 *prices, const CProbPrice *ProbPrices)
{
  unsigned pair;
  for (pair = 0; pair < 4; pair++)
  {
    const unsigned hiBit = pair >> 1;
    const unsigned midBit = pair & 1;
    const UInt32 leaf = probs[4 + pair];
    UInt32 prefix = startPrice;

    prefix += GET_PRICEa(probs[1], hiBit);
    prefix += GET_PRICEa(probs[2 + hiBit], midBit);

    prices[pair * 2    ] = prefix + GET_PRICEa_0(leaf);
    prices[pair * 2 + 1] = prefix + GET_PRICEa_1(leaf);
  }
}
880
881
882
/* Recomputes the length price table p->prices from the probabilities in enc.
   - For every posState below numPosStates, the 16 low symbols are priced
     with two SetPrices_3() calls.
   - If tableSize exceeds 16, the high symbols are priced once into
     prices[0] and then copied to the rows of the other posStates. */
MY_NO_INLINE static void MY_FAST_CALL LenPriceEnc_UpdateTables(
    CLenPriceEnc *p,
    unsigned numPosStates,
    const CLenEnc *enc,
    const CProbPrice *ProbPrices)
{
  const unsigned choice = enc->low[0];
  const UInt32 priceLow = GET_PRICEa_0(choice);
  UInt32 priceUpper = GET_PRICEa_1(choice);
  const UInt32 priceMid = priceUpper + GET_PRICEa_0(enc->low[kLenNumLowSymbols]);
  const CLzmaProb *highProbs;
  UInt32 *highPrices;
  unsigned posState;
  unsigned pairIndex;
  size_t tailBytes;

  for (posState = 0; posState < numPosStates; posState++)
  {
    const CLzmaProb *tree = enc->low + (posState << (1 + kLenNumLowBits));
    UInt32 *row = p->prices[posState];
    SetPrices_3(tree, priceLow, row, ProbPrices);
    SetPrices_3(tree + kLenNumLowSymbols, priceMid, row + kLenNumLowSymbols, ProbPrices);
  }

  // p->counter = numSymbols;
  // p->counter = 64;

  if (p->tableSize <= kLenNumLowSymbols * 2)
    return;

  highProbs = enc->high;
  highPrices = p->prices[0] + kLenNumLowSymbols * 2;

  /* number of (even, odd) symbol pairs to price, rounded up */
  pairIndex = (p->tableSize - (kLenNumLowSymbols * 2 - 1)) >> 1;

  /* both choice bits are 1 for the high symbols */
  priceUpper += GET_PRICEa_1(enc->low[kLenNumLowSymbols]);

  do
  {
    unsigned node;
    unsigned leaf;
    UInt32 price = priceUpper;

    pairIndex--;
    node = pairIndex + (1 << (kLenNumHighBits - 1));
    leaf = highProbs[(size_t)pairIndex + (1 << (kLenNumHighBits - 1))];

    /* price of the 7 upper bits, walking from the leaf's parent to the root */
    // UInt32 price = a + RcTree_GetPrice(probs, kLenNumHighBits - 1, sym, ProbPrices);
    do
    {
      const unsigned bit = node & 1;
      node >>= 1;
      price += GET_PRICEa(highProbs[node], bit);
    }
    while (node >= 2);

    highPrices[(size_t)pairIndex * 2    ] = price + GET_PRICEa_0(leaf);
    highPrices[(size_t)pairIndex * 2 + 1] = price + GET_PRICEa_1(leaf);
  }
  while (pairIndex != 0);

  /* high-symbol prices do not depend on posState: replicate row 0 */
  tailBytes = (p->tableSize - kLenNumLowSymbols * 2) * sizeof(p->prices[0][0]);
  for (posState = 1; posState < numPosStates; posState++)
    memcpy(p->prices[posState] + kLenNumLowSymbols * 2, p->prices[0] + kLenNumLowSymbols * 2, tailBytes);
}
969
970
/*
971
  #ifdef SHOW_STAT
972
  g_STAT_OFFSET += num;
973
  printf("\n MovePos %u", num);
974
  #endif
975
*/
976
  
977
278k
#define MOVE_POS(p, num) { \
978
278k
    p->additionalOffset += (num); \
979
278k
    p->matchFinder.Skip(p->matchFinderObj, (UInt32)(num)); }
980
981
982
/* Asks the match finder for the matches at the current position.
   Stores the number of entries written to p->matches in *numPairsRes and
   returns the length of the longest match (0 if there is none).
   When the longest reported match is exactly numFastBytes long, it is
   extended by direct byte comparison, up to
   min(numAvail, LZMA_MATCH_LEN_MAX). */
static unsigned ReadMatchDistances(CLzmaEnc *p, unsigned *numPairsRes)
{
  unsigned numPairs;
  unsigned len;
  UInt32 limit;
  ptrdiff_t back;
  const Byte *base;
  const Byte *scan;
  const Byte *end;

  p->additionalOffset++;
  p->numAvail = p->matchFinder.GetNumAvailableBytes(p->matchFinderObj);
  numPairs = p->matchFinder.GetMatches(p->matchFinderObj, p->matches);
  *numPairsRes = numPairs;

  #ifdef SHOW_STAT
  printf("\n i = %u numPairs = %u    ", g_STAT_OFFSET, numPairs / 2);
  g_STAT_OFFSET++;
  {
    unsigned i;
    for (i = 0; i < numPairs; i += 2)
      printf("%2u %6u   | ", p->matches[i], p->matches[i + 1]);
  }
  #endif

  if (numPairs == 0)
    return 0;

  /* the last pair holds the longest match */
  len = p->matches[(size_t)numPairs - 2];
  if (len != p->numFastBytes)
    return len;

  limit = p->numAvail;
  if (limit > LZMA_MATCH_LEN_MAX)
    limit = LZMA_MATCH_LEN_MAX;

  /* the finder has already advanced, hence the -1 */
  base = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
  back = (ptrdiff_t)-1 - p->matches[(size_t)numPairs - 1];
  end = base + limit;
  scan = base + len;

  while (scan != end && *scan == scan[back])
    scan++;

  return (unsigned)(scan - base);
}
1023
1024
15.5M
/* Value stored in a `dist` field (and in p->backRes) to mark a literal: all bits set. */
#define MARK_LIT ((UInt32)(Int32)-1)
1025
1026
1.41M
/* Tag node `p` as a literal: dist = MARK_LIT, extra = 0. Expands to a braced block. */
#define MakeAs_Lit(p)       { (p)->dist = MARK_LIT; (p)->extra = 0; }
1027
125k
/* Tag node `p` as a short rep: dist = 0, extra = 0. Expands to a braced block. */
#define MakeAs_ShortRep(p)  { (p)->dist = 0; (p)->extra = 0; }
1028
1.12M
/* Tests only dist == 0; the visible callers use it on nodes whose len is 1. */
#define IsShortRep(p)       ((p)->dist == 0)
1029
1030
1031
/*
  GetPrice_ShortRep: sum of the "0" prices of isRepG0[state] and
  isRep0Long[state][posState]. The isMatch / isRep bit prices are not
  included; the visible callers add them beforehand as repMatchPrice.
*/
#define GetPrice_ShortRep(p, state, posState) \
  ( GET_PRICE_0((p)->isRepG0[state]) + GET_PRICE_0((p)->isRep0Long[state][posState]))

/*
  GetPrice_Rep_0: sum of four bit prices:
  isMatch = 1, isRep0Long = 1, isRep = 1, isRepG0 = 0.

  The whole sum is wrapped in a single pair of parentheses so the macro can be
  used safely inside any larger expression. The previous form closed the
  parenthesis after the second term and was only correct in pure additions.
*/
#define GetPrice_Rep_0(p, state, posState) ( \
    GET_PRICE_1((p)->isMatch[state][posState]) \
  + GET_PRICE_1((p)->isRep0Long[state][posState]) \
  + GET_PRICE_1((p)->isRep[state]) \
  + GET_PRICE_0((p)->isRepG0[state]))
1039
  
1040
MY_FORCE_INLINE
1041
static UInt32 GetPrice_PureRep(const CLzmaEnc *p, unsigned repIndex, size_t state, size_t posState)
1042
5.10M
{
1043
5.10M
  UInt32 price;
1044
5.10M
  UInt32 prob = p->isRepG0[state];
1045
5.10M
  if (repIndex == 0)
1046
1.80M
  {
1047
1.80M
    price = GET_PRICE_0(prob);
1048
1.80M
    price += GET_PRICE_1(p->isRep0Long[state][posState]);
1049
1.80M
  }
1050
3.30M
  else
1051
3.30M
  {
1052
3.30M
    price = GET_PRICE_1(prob);
1053
3.30M
    prob = p->isRepG1[state];
1054
3.30M
    if (repIndex == 1)
1055
1.17M
      price += GET_PRICE_0(prob);
1056
2.12M
    else
1057
2.12M
    {
1058
2.12M
      price += GET_PRICE_1(prob);
1059
2.12M
      price += GET_PRICE(p->isRepG2[state], repIndex - 2);
1060
2.12M
    }
1061
3.30M
  }
1062
5.10M
  return price;
1063
5.10M
}
1064
1065
1066
/*
  Walk the chosen path backwards from node `cur` to node 0 and lay the steps
  out in forward order at the top of p->opt[].

  p->optEnd is set to cur + 1. Each step is written as a (dist, len) pair just
  below the previous write position. A node whose `extra` field is non-zero is
  expanded into its component steps:
    extra == 1 : a literal followed by the node's own step;
    extra  > 1 : a step of (extra - 1) bytes with the node's dist, a literal,
                 then a rep0 step (dist 0) of the node's len.

  The first step of the path is not stored in p->opt[]: its dist goes to
  p->backRes and its length is the return value. p->optCur is left pointing at
  the second step.
*/
static unsigned Backward(CLzmaEnc *p, unsigned cur)
{
  unsigned writeIdx = cur + 1;
  UInt32 stepDist;
  unsigned stepLen;

  p->optEnd = writeIdx;

  for (;;)
  {
    const COptimal *node = &p->opt[cur];
    COptimal *slot;
    unsigned tail;

    /* Read everything from the node before any slot is overwritten. */
    stepDist = node->dist;
    stepLen = (unsigned)node->len;
    tail = (unsigned)node->extra;

    cur -= stepLen;

    if (tail != 0)
    {
      slot = &p->opt[--writeIdx];
      slot->len = (UInt32)stepLen;
      cur -= tail;
      stepLen = tail;

      if (tail == 1)
      {
        slot->dist = stepDist;
        stepDist = MARK_LIT;
      }
      else
      {
        slot->dist = 0;
        stepLen--;
        slot = &p->opt[--writeIdx];
        slot->dist = MARK_LIT;
        slot->len = 1;
      }
    }

    if (cur == 0)
      break;

    slot = &p->opt[--writeIdx];
    slot->dist = stepDist;
    slot->len = (UInt32)stepLen;
  }

  p->backRes = stepDist;
  p->optCur = writeIdx;
  return stepLen;
}
1111
1112
1113
1114
/*
  Pointer into p->litProbs for the literal context formed from `pos` and
  `prevByte`: (((pos << 8) + prevByte) & p->lpMask) << p->lc, scaled by 3.
  Uses a variable named `p` from the enclosing scope (not a macro parameter).
*/
#define LIT_PROBS(pos, prevByte) \
1115
11.6M
  (p->litProbs + (UInt32)3 * (((((pos) << 8) + (prevByte)) & p->lpMask) << p->lc))
1116
1117
1118
/*
  Price-based selection of the next coding step(s), starting at `position`.

  Returns the length of the first step and stores its kind in p->backRes:
    MARK_LIT                 : literal (returned length is 1)
    0 .. LZMA_NUM_REPS - 1   : rep match with that index (0 with length 1 is a short rep)
    dist + LZMA_NUM_REPS     : normal match, `dist` as taken from p->matches

  Flow:
    1. Read matches for the current position (or reuse p->longestMatchLen /
       p->numPairs when p->additionalOffset != 0) and measure the four reps.
    2. Early exits: fewer than 2 bytes available; a rep or the main match that
       reaches p->numFastBytes; no candidate at all and curByte != matchByte.
    3. Otherwise seed p->opt[1..last] with literal / short-rep / rep / match
       prices and run the forward loop, which for every reachable `cur`
       rebuilds state and reps, then tries LIT, SHORT_REP, LIT:REP_0,
       REP[:LIT:REP_0] and MATCH[:LIT:REP_0] continuations.
    4. Reset the touched prices to kInfinityPrice and call Backward(), which
       returns the first step.
*/
static unsigned GetOptimum(CLzmaEnc *p, UInt32 position)
1119
3.34M
{
1120
3.34M
  unsigned last, cur;
1121
3.34M
  UInt32 reps[LZMA_NUM_REPS];
1122
3.34M
  unsigned repLens[LZMA_NUM_REPS];
1123
3.34M
  UInt32 *matches;
1124
1125
3.34M
  {
1126
3.34M
    UInt32 numAvail;
1127
3.34M
    unsigned numPairs, mainLen, repMaxIndex, i, posState;
1128
3.34M
    UInt32 matchPrice, repMatchPrice;
1129
3.34M
    const Byte *data;
1130
3.34M
    Byte curByte, matchByte;
1131
    
1132
3.34M
    p->optCur = p->optEnd = 0;
1133
    
1134
3.34M
    if (p->additionalOffset == 0)
1135
3.31M
      mainLen = ReadMatchDistances(p, &numPairs);
1136
32.8k
    else
1137
32.8k
    {
1138
32.8k
      mainLen = p->longestMatchLen;
1139
32.8k
      numPairs = p->numPairs;
1140
32.8k
    }
1141
    
1142
3.34M
    numAvail = p->numAvail;
1143
3.34M
    if (numAvail < 2)
1144
2.06k
    {
1145
2.06k
      p->backRes = MARK_LIT;
1146
2.06k
      return 1;
1147
2.06k
    }
1148
3.34M
    if (numAvail > LZMA_MATCH_LEN_MAX)
1149
3.20M
      numAvail = LZMA_MATCH_LEN_MAX;
1150
    
1151
3.34M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1152
3.34M
    repMaxIndex = 0;
1153
    
1154
16.7M
    for (i = 0; i < LZMA_NUM_REPS; i++)
1155
13.3M
    {
1156
13.3M
      unsigned len;
1157
13.3M
      const Byte *data2;
1158
13.3M
      reps[i] = p->reps[i];
1159
13.3M
      data2 = data - reps[i];
1160
13.3M
      if (data[0] != data2[0] || data[1] != data2[1])
1161
13.2M
      {
1162
13.2M
        repLens[i] = 0;
1163
13.2M
        continue;
1164
13.2M
      }
1165
4.80M
      for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1166
4.65M
      {}
1167
148k
      repLens[i] = len;
1168
148k
      if (len > repLens[repMaxIndex])
1169
71.3k
        repMaxIndex = i;
1170
148k
    }
1171
    
1172
3.34M
    if (repLens[repMaxIndex] >= p->numFastBytes)
1173
43.6k
    {
1174
43.6k
      unsigned len;
1175
43.6k
      p->backRes = (UInt32)repMaxIndex;
1176
43.6k
      len = repLens[repMaxIndex];
1177
43.6k
      MOVE_POS(p, len - 1)
1178
43.6k
      return len;
1179
43.6k
    }
1180
    
1181
3.30M
    matches = p->matches;
1182
    
1183
3.30M
    if (mainLen >= p->numFastBytes)
1184
43.6k
    {
1185
43.6k
      p->backRes = matches[(size_t)numPairs - 1] + LZMA_NUM_REPS;
1186
43.6k
      MOVE_POS(p, mainLen - 1)
1187
43.6k
      return mainLen;
1188
43.6k
    }
1189
    
1190
3.25M
    curByte = *data;
1191
3.25M
    matchByte = *(data - reps[0]);
1192
1193
3.25M
    last = repLens[repMaxIndex];
1194
3.25M
    if (last <= mainLen)
1195
3.25M
      last = mainLen;
1196
    
1197
3.25M
    if (last < 2 && curByte != matchByte)
1198
2.79M
    {
1199
2.79M
      p->backRes = MARK_LIT;
1200
2.79M
      return 1;
1201
2.79M
    }
1202
    
1203
463k
    p->opt[0].state = (CState)p->state;
1204
    
1205
463k
    posState = (position & p->pbMask);
1206
    
1207
463k
    {
1208
463k
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1209
463k
      p->opt[1].price = GET_PRICE_0(p->isMatch[p->state][posState]) +
1210
463k
        (!IsLitState(p->state) ?
1211
63.6k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1212
463k
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1213
463k
    }
1214
1215
463k
    MakeAs_Lit(&p->opt[1]);
1216
    
1217
463k
    matchPrice = GET_PRICE_1(p->isMatch[p->state][posState]);
1218
463k
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[p->state]);
1219
    
1220
    // 18.06
1221
463k
    if (matchByte == curByte && repLens[0] == 0)
1222
41.8k
    {
1223
41.8k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, p->state, posState);
1224
41.8k
      if (shortRepPrice < p->opt[1].price)
1225
35.4k
      {
1226
35.4k
        p->opt[1].price = shortRepPrice;
1227
35.4k
        MakeAs_ShortRep(&p->opt[1]);
1228
35.4k
      }
1229
41.8k
      if (last < 2)
1230
31.2k
      {
1231
31.2k
        p->backRes = p->opt[1].dist;
1232
31.2k
        return 1;
1233
31.2k
      }
1234
41.8k
    }
1235
   
1236
432k
    p->opt[1].len = 1;
1237
    
1238
432k
    p->opt[0].reps[0] = reps[0];
1239
432k
    p->opt[0].reps[1] = reps[1];
1240
432k
    p->opt[0].reps[2] = reps[2];
1241
432k
    p->opt[0].reps[3] = reps[3];
1242
    
1243
    // ---------- REP ----------
1244
    
1245
2.16M
    for (i = 0; i < LZMA_NUM_REPS; i++)
1246
1.72M
    {
1247
1.72M
      unsigned repLen = repLens[i];
1248
1.72M
      UInt32 price;
1249
1.72M
      if (repLen < 2)
1250
1.66M
        continue;
1251
61.0k
      price = repMatchPrice + GetPrice_PureRep(p, i, p->state, posState);
1252
61.0k
      do
1253
365k
      {
1254
365k
        UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, repLen);
1255
365k
        COptimal *opt = &p->opt[repLen];
1256
365k
        if (price2 < opt->price)
1257
241k
        {
1258
241k
          opt->price = price2;
1259
241k
          opt->len = (UInt32)repLen;
1260
241k
          opt->dist = (UInt32)i;
1261
241k
          opt->extra = 0;
1262
241k
        }
1263
365k
      }
1264
365k
      while (--repLen >= 2);
1265
61.0k
    }
1266
    
1267
    
1268
    // ---------- MATCH ----------
1269
432k
    {
1270
432k
      unsigned len = repLens[0] + 1;
1271
432k
      if (len <= mainLen)
1272
422k
      {
1273
422k
        unsigned offs = 0;
1274
422k
        UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[p->state]);
1275
1276
422k
        if (len < 2)
1277
420k
          len = 2;
1278
1.29k
        else
1279
4.01k
          while (len > matches[offs])
1280
2.72k
            offs += 2;
1281
    
1282
422k
        for (; ; len++)
1283
695k
        {
1284
695k
          COptimal *opt;
1285
695k
          UInt32 dist = matches[(size_t)offs + 1];
1286
695k
          UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1287
695k
          unsigned lenToPosState = GetLenToPosState(len);
1288
       
1289
695k
          if (dist < kNumFullDistances)
1290
243k
            price += p->distancesPrices[lenToPosState][dist & (kNumFullDistances - 1)];
1291
451k
          else
1292
451k
          {
1293
451k
            unsigned slot;
1294
451k
            GetPosSlot2(dist, slot);
1295
451k
            price += p->alignPrices[dist & kAlignMask];
1296
451k
            price += p->posSlotPrices[lenToPosState][slot];
1297
451k
          }
1298
          
1299
695k
          opt = &p->opt[len];
1300
          
1301
695k
          if (price < opt->price)
1302
639k
          {
1303
639k
            opt->price = price;
1304
639k
            opt->len = (UInt32)len;
1305
639k
            opt->dist = dist + LZMA_NUM_REPS;
1306
639k
            opt->extra = 0;
1307
639k
          }
1308
          
1309
695k
          if (len == matches[offs])
1310
476k
          {
1311
476k
            offs += 2;
1312
476k
            if (offs == numPairs)
1313
422k
              break;
1314
476k
          }
1315
695k
        }
1316
422k
      }
1317
432k
    }
1318
    
1319
1320
432k
    cur = 0;
1321
1322
    #ifdef SHOW_STAT2
1323
    /* if (position >= 0) */
1324
    {
1325
      unsigned i;
1326
      printf("\n pos = %4X", position);
1327
      for (i = cur; i <= last; i++)
1328
      printf("\nprice[%4X] = %u", position - cur + i, p->opt[i].price);
1329
    }
1330
    #endif
1331
432k
  }
1332
1333
1334
  
1335
  // ---------- Optimal Parsing ----------
1336
1337
0
  for (;;)
1338
5.23M
  {
1339
5.23M
    unsigned numAvail;
1340
5.23M
    UInt32 numAvailFull;
1341
5.23M
    unsigned newLen, numPairs, prev, state, posState, startLen;
1342
5.23M
    UInt32 litPrice, matchPrice, repMatchPrice;
1343
5.23M
    BoolInt nextIsLit;
1344
5.23M
    Byte curByte, matchByte;
1345
5.23M
    const Byte *data;
1346
5.23M
    COptimal *curOpt, *nextOpt;
1347
1348
5.23M
    if (++cur == last)
1349
398k
      break;
1350
    
1351
    // 18.06
    // Close to the end of the opt buffer: stop at the cheapest node in [cur, last]
    // (ties go to the later node) and skip the match finder forward to it.
1352
4.83M
    if (cur >= kNumOpts - 64)
1353
352
    {
1354
352
      unsigned j, best;
1355
352
      UInt32 price = p->opt[cur].price;
1356
352
      best = cur;
1357
6.55k
      for (j = cur + 1; j <= last; j++)
1358
6.20k
      {
1359
6.20k
        UInt32 price2 = p->opt[j].price;
1360
6.20k
        if (price >= price2)
1361
588
        {
1362
588
          price = price2;
1363
588
          best = j;
1364
588
        }
1365
6.20k
      }
1366
352
      {
1367
352
        unsigned delta = best - cur;
1368
352
        if (delta != 0)
1369
196
        {
1370
196
          MOVE_POS(p, delta);
1371
196
        }
1372
352
      }
1373
352
      cur = best;
1374
352
      break;
1375
352
    }
1376
1377
4.83M
    newLen = ReadMatchDistances(p, &numPairs);
1378
    
    // A match of at least numFastBytes: remember it for the next call and stop parsing here.
1379
4.83M
    if (newLen >= p->numFastBytes)
1380
32.8k
    {
1381
32.8k
      p->numPairs = numPairs;
1382
32.8k
      p->longestMatchLen = newLen;
1383
32.8k
      break;
1384
32.8k
    }
1385
    
1386
4.80M
    curOpt = &p->opt[cur];
1387
1388
4.80M
    position++;
1389
1390
    // we need that check here, if skip_items in p->opt are possible
1391
    /*
1392
    if (curOpt->price >= kInfinityPrice)
1393
      continue;
1394
    */
1395
1396
4.80M
    prev = cur - curOpt->len;
1397
1398
4.80M
    if (curOpt->len == 1)
1399
1.12M
    {
1400
1.12M
      state = (unsigned)p->opt[prev].state;
1401
1.12M
      if (IsShortRep(curOpt))
1402
91.6k
        state = kShortRepNextStates[state];
1403
1.03M
      else
1404
1.03M
        state = kLiteralNextStates[state];
1405
1.12M
    }
1406
3.67M
    else
1407
3.67M
    {
1408
3.67M
      const COptimal *prevOpt;
1409
3.67M
      UInt32 b0;
1410
3.67M
      UInt32 dist = curOpt->dist;
1411
1412
3.67M
      if (curOpt->extra)
1413
57.6k
      {
1414
57.6k
        prev -= (unsigned)curOpt->extra;
1415
57.6k
        state = kState_RepAfterLit;
1416
57.6k
        if (curOpt->extra == 1)
1417
716
          state = (dist < LZMA_NUM_REPS ? kState_RepAfterLit : kState_MatchAfterLit);
1418
57.6k
      }
1419
3.61M
      else
1420
3.61M
      {
1421
3.61M
        state = (unsigned)p->opt[prev].state;
1422
3.61M
        if (dist < LZMA_NUM_REPS)
1423
1.64M
          state = kRepNextStates[state];
1424
1.96M
        else
1425
1.96M
          state = kMatchNextStates[state];
1426
3.61M
      }
1427
1428
3.67M
      prevOpt = &p->opt[prev];
1429
3.67M
      b0 = prevOpt->reps[0];
1430
1431
3.67M
      if (dist < LZMA_NUM_REPS)
1432
1.69M
      {
1433
1.69M
        if (dist == 0)
1434
458k
        {
1435
458k
          reps[0] = b0;
1436
458k
          reps[1] = prevOpt->reps[1];
1437
458k
          reps[2] = prevOpt->reps[2];
1438
458k
          reps[3] = prevOpt->reps[3];
1439
458k
        }
1440
1.23M
        else
1441
1.23M
        {
1442
1.23M
          reps[1] = b0;
1443
1.23M
          b0 = prevOpt->reps[1];
1444
1.23M
          if (dist == 1)
1445
719k
          {
1446
719k
            reps[0] = b0;
1447
719k
            reps[2] = prevOpt->reps[2];
1448
719k
            reps[3] = prevOpt->reps[3];
1449
719k
          }
1450
518k
          else
1451
518k
          {
1452
518k
            reps[2] = b0;
1453
518k
            reps[0] = prevOpt->reps[dist];
1454
518k
            reps[3] = prevOpt->reps[dist ^ 1];
1455
518k
          }
1456
1.23M
        }
1457
1.69M
      }
1458
1.97M
      else
1459
1.97M
      {
1460
1.97M
        reps[0] = (dist - LZMA_NUM_REPS + 1);
1461
1.97M
        reps[1] = b0;
1462
1.97M
        reps[2] = prevOpt->reps[1];
1463
1.97M
        reps[3] = prevOpt->reps[2];
1464
1.97M
      }
1465
3.67M
    }
1466
    
1467
4.80M
    curOpt->state = (CState)state;
1468
4.80M
    curOpt->reps[0] = reps[0];
1469
4.80M
    curOpt->reps[1] = reps[1];
1470
4.80M
    curOpt->reps[2] = reps[2];
1471
4.80M
    curOpt->reps[3] = reps[3];
1472
1473
4.80M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1474
4.80M
    curByte = *data;
1475
4.80M
    matchByte = *(data - reps[0]);
1476
1477
4.80M
    posState = (position & p->pbMask);
1478
1479
    /*
1480
    The order of Price checks:
1481
       <  LIT
1482
       <= SHORT_REP
1483
       <  LIT : REP_0
1484
       <  REP    [ : LIT : REP_0 ]
1485
       <  MATCH  [ : LIT : REP_0 ]
1486
    */
1487
1488
4.80M
    {
1489
4.80M
      UInt32 curPrice = curOpt->price;
1490
4.80M
      unsigned prob = p->isMatch[state][posState];
1491
4.80M
      matchPrice = curPrice + GET_PRICE_1(prob);
1492
4.80M
      litPrice = curPrice + GET_PRICE_0(prob);
1493
4.80M
    }
1494
1495
4.80M
    nextOpt = &p->opt[(size_t)cur + 1];
1496
4.80M
    nextIsLit = False;
1497
1498
    // here we can allow skip_items in p->opt, if we don't check (nextOpt->price < kInfinityPrice)
1499
    // 18.new.06
    // litPrice == 0 is used below as the "literal not evaluated" marker (see LIT : REP_0).
1500
4.80M
    if ((nextOpt->price < kInfinityPrice
1501
        // && !IsLitState(state)
1502
4.80M
        && matchByte == curByte)
1503
4.80M
        || litPrice > nextOpt->price
1504
4.80M
        )
1505
3.26M
      litPrice = 0;
1506
1.53M
    else
1507
1.53M
    {
1508
1.53M
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1509
1.53M
      litPrice += (!IsLitState(state) ?
1510
827k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1511
1.53M
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1512
      
1513
1.53M
      if (litPrice < nextOpt->price)
1514
949k
      {
1515
949k
        nextOpt->price = litPrice;
1516
949k
        nextOpt->len = 1;
1517
949k
        MakeAs_Lit(nextOpt);
1518
949k
        nextIsLit = True;
1519
949k
      }
1520
1.53M
    }
1521
1522
4.80M
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[state]);
1523
    
1524
4.80M
    numAvailFull = p->numAvail;
1525
4.80M
    {
1526
4.80M
      unsigned temp = kNumOpts - 1 - cur;
1527
4.80M
      if (numAvailFull > temp)
1528
3.88M
        numAvailFull = (UInt32)temp;
1529
4.80M
    }
1530
1531
    // 18.06
1532
    // ---------- SHORT_REP ----------
1533
4.80M
    if (IsLitState(state)) // 18.new
1534
1.03M
    if (matchByte == curByte)
1535
213k
    if (repMatchPrice < nextOpt->price) // 18.new
1536
    // if (numAvailFull < 2 || data[1] != *(data - reps[0] + 1))
1537
115k
    if (
1538
        // nextOpt->price >= kInfinityPrice ||
1539
115k
        nextOpt->len < 2   // we can check nextOpt->len, if skip items are not allowed in p->opt
1540
115k
        || (nextOpt->dist != 0
1541
            // && nextOpt->extra <= 1 // 17.old
1542
105k
            )
1543
115k
        )
1544
114k
    {
1545
114k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, state, posState);
1546
      // if (shortRepPrice <= nextOpt->price) // 17.old
1547
114k
      if (shortRepPrice < nextOpt->price)  // 18.new
1548
89.5k
      {
1549
89.5k
        nextOpt->price = shortRepPrice;
1550
89.5k
        nextOpt->len = 1;
1551
89.5k
        MakeAs_ShortRep(nextOpt);
1552
89.5k
        nextIsLit = False;
1553
89.5k
      }
1554
114k
    }
1555
    
1556
4.80M
    if (numAvailFull < 2)
1557
3.20k
      continue;
1558
4.79M
    numAvail = (numAvailFull <= p->numFastBytes ? numAvailFull : p->numFastBytes);
1559
1560
    // numAvail <= p->numFastBytes
1561
1562
    // ---------- LIT : REP_0 ----------
1563
1564
4.79M
    if (!nextIsLit
1565
4.79M
        && litPrice != 0 // 18.new
1566
4.79M
        && matchByte != curByte
1567
4.79M
        && numAvailFull > 2)
1568
582k
    {
1569
582k
      const Byte *data2 = data - reps[0];
1570
582k
      if (data[1] == data2[1] && data[2] == data2[2])
1571
120k
      {
1572
120k
        unsigned len;
1573
120k
        unsigned limit = p->numFastBytes + 1;
1574
120k
        if (limit > numAvailFull)
1575
5.05k
          limit = numAvailFull;
1576
327k
        for (len = 3; len < limit && data[len] == data2[len]; len++)
1577
207k
        {}
1578
        
1579
120k
        {
1580
120k
          unsigned state2 = kLiteralNextStates[state];
1581
120k
          unsigned posState2 = (position + 1) & p->pbMask;
1582
120k
          UInt32 price = litPrice + GetPrice_Rep_0(p, state2, posState2);
1583
120k
          {
1584
120k
            unsigned offset = cur + len;
1585
1586
120k
            if (last < offset)
1587
4.96k
              last = offset;
1588
          
1589
            // do
1590
120k
            {
1591
120k
              UInt32 price2;
1592
120k
              COptimal *opt;
1593
120k
              len--;
1594
              // price2 = price + GetPrice_Len_Rep_0(p, len, state2, posState2);
1595
120k
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len);
1596
1597
120k
              opt = &p->opt[offset];
1598
              // offset--;
1599
120k
              if (price2 < opt->price)
1600
8.59k
              {
1601
8.59k
                opt->price = price2;
1602
8.59k
                opt->len = (UInt32)len;
1603
8.59k
                opt->dist = 0;
1604
8.59k
                opt->extra = 1;
1605
8.59k
              }
1606
120k
            }
1607
            // while (len >= 3);
1608
120k
          }
1609
120k
        }
1610
120k
      }
1611
582k
    }
1612
    
1613
4.79M
    startLen = 2; /* speed optimization */
1614
1615
4.79M
    {
1616
      // ---------- REP ----------
1617
4.79M
      unsigned repIndex = 0; // 17.old
1618
      // unsigned repIndex = IsLitState(state) ? 0 : 1; // 18.notused
1619
23.9M
      for (; repIndex < LZMA_NUM_REPS; repIndex++)
1620
19.1M
      {
1621
19.1M
        unsigned len;
1622
19.1M
        UInt32 price;
1623
19.1M
        const Byte *data2 = data - reps[repIndex];
1624
19.1M
        if (data[0] != data2[0] || data[1] != data2[1])
1625
14.1M
          continue;
1626
        
1627
77.3M
        for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1628
72.3M
        {}
1629
        
1630
        // if (len < startLen) continue; // 18.new: speed optimization
1631
1632
5.04M
        {
1633
5.04M
          unsigned offset = cur + len;
1634
5.04M
          if (last < offset)
1635
207k
            last = offset;
1636
5.04M
        }
1637
5.04M
        {
1638
5.04M
          unsigned len2 = len;
1639
5.04M
          price = repMatchPrice + GetPrice_PureRep(p, repIndex, state, posState);
1640
5.04M
          do
1641
77.3M
          {
1642
77.3M
            UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, len2);
1643
77.3M
            COptimal *opt = &p->opt[cur + len2];
1644
77.3M
            if (price2 < opt->price)
1645
3.21M
            {
1646
3.21M
              opt->price = price2;
1647
3.21M
              opt->len = (UInt32)len2;
1648
3.21M
              opt->dist = (UInt32)repIndex;
1649
3.21M
              opt->extra = 0;
1650
3.21M
            }
1651
77.3M
          }
1652
77.3M
          while (--len2 >= 2);
1653
5.04M
        }
1654
        
1655
5.04M
        if (repIndex == 0) startLen = len + 1;  // 17.old
1656
        // startLen = len + 1; // 18.new
1657
1658
        /* if (_maxMode) */
1659
5.04M
        {
1660
          // ---------- REP : LIT : REP_0 ----------
1661
          // numFastBytes + 1 + numFastBytes
1662
1663
5.04M
          unsigned len2 = len + 1;
1664
5.04M
          unsigned limit = len2 + p->numFastBytes;
1665
5.04M
          if (limit > numAvailFull)
1666
329k
            limit = numAvailFull;
1667
          
1668
5.04M
          len2 += 2;
1669
5.04M
          if (len2 <= limit)
1670
4.95M
          if (data[len2 - 2] == data2[len2 - 2])
1671
2.77M
          if (data[len2 - 1] == data2[len2 - 1])
1672
1.87M
          {
1673
1.87M
            unsigned state2 = kRepNextStates[state];
1674
1.87M
            unsigned posState2 = (position + len) & p->pbMask;
1675
1.87M
            price += GET_PRICE_LEN(&p->repLenEnc, posState, len)
1676
1.87M
                + GET_PRICE_0(p->isMatch[state2][posState2])
1677
1.87M
                + LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1678
1.87M
                    data[len], data2[len], p->ProbPrices);
1679
            
1680
            // state2 = kLiteralNextStates[state2];
1681
1.87M
            state2 = kState_LitAfterRep;
1682
1.87M
            posState2 = (posState2 + 1) & p->pbMask;
1683
1684
1685
1.87M
            price += GetPrice_Rep_0(p, state2, posState2);
1686
1687
26.5M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1688
24.6M
          {}
1689
          
1690
1.87M
          len2 -= len;
1691
          // if (len2 >= 3)
1692
1.87M
          {
1693
1.87M
            {
1694
1.87M
              unsigned offset = cur + len + len2;
1695
1696
1.87M
              if (last < offset)
1697
633k
                last = offset;
1698
              // do
1699
1.87M
              {
1700
1.87M
                UInt32 price2;
1701
1.87M
                COptimal *opt;
1702
1.87M
                len2--;
1703
                // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1704
1.87M
                price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1705
1706
1.87M
                opt = &p->opt[offset];
1707
                // offset--;
1708
1.87M
                if (price2 < opt->price)
1709
760k
                {
1710
760k
                  opt->price = price2;
1711
760k
                  opt->len = (UInt32)len2;
1712
760k
                  opt->extra = (CExtra)(len + 1);
1713
760k
                  opt->dist = (UInt32)repIndex;
1714
760k
                }
1715
1.87M
              }
1716
              // while (len2 >= 3);
1717
1.87M
            }
1718
1.87M
          }
1719
1.87M
          }
1720
5.04M
        }
1721
5.04M
      }
1722
4.79M
    }
1723
1724
1725
    // ---------- MATCH ----------
1726
    /* for (unsigned len = 2; len <= newLen; len++) */
    // Clamp the longest match to numAvail: cut the pair list at the first pair that
    // reaches the new length and overwrite that pair's length.
1727
4.79M
    if (newLen > numAvail)
1728
1.00k
    {
1729
1.00k
      newLen = numAvail;
1730
2.90k
      for (numPairs = 0; newLen > matches[numPairs]; numPairs += 2);
1731
1.00k
      matches[numPairs] = (UInt32)newLen;
1732
1.00k
      numPairs += 2;
1733
1.00k
    }
1734
    
1735
    // startLen = 2; /* speed optimization */
1736
1737
4.79M
    if (newLen >= startLen)
1738
2.95M
    {
1739
2.95M
      UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[state]);
1740
2.95M
      UInt32 dist;
1741
2.95M
      unsigned offs, posSlot, len;
1742
      
1743
2.95M
      {
1744
2.95M
        unsigned offset = cur + newLen;
1745
2.95M
        if (last < offset)
1746
791k
          last = offset;
1747
2.95M
      }
1748
1749
2.95M
      offs = 0;
1750
3.35M
      while (startLen > matches[offs])
1751
406k
        offs += 2;
1752
2.95M
      dist = matches[(size_t)offs + 1];
1753
      
1754
      // if (dist >= kNumFullDistances)
1755
2.95M
      GetPosSlot2(dist, posSlot);
1756
      
1757
13.8M
      for (len = /*2*/ startLen; ; len++)
1758
16.8M
      {
1759
16.8M
        UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1760
16.8M
        {
1761
16.8M
          COptimal *opt;
1762
16.8M
          unsigned lenNorm = len - 2;
1763
16.8M
          lenNorm = GetLenToPosState2(lenNorm);
1764
16.8M
          if (dist < kNumFullDistances)
1765
10.8M
            price += p->distancesPrices[lenNorm][dist & (kNumFullDistances - 1)];
1766
5.93M
          else
1767
5.93M
            price += p->posSlotPrices[lenNorm][posSlot] + p->alignPrices[dist & kAlignMask];
1768
          
1769
16.8M
          opt = &p->opt[cur + len];
1770
16.8M
          if (price < opt->price)
1771
3.51M
          {
1772
3.51M
            opt->price = price;
1773
3.51M
            opt->len = (UInt32)len;
1774
3.51M
            opt->dist = dist + LZMA_NUM_REPS;
1775
3.51M
            opt->extra = 0;
1776
3.51M
          }
1777
16.8M
        }
1778
1779
16.8M
        if (len == matches[offs])
1780
3.71M
        {
1781
          // if (p->_maxMode) {
1782
          // MATCH : LIT : REP_0
1783
1784
3.71M
          const Byte *data2 = data - dist - 1;
1785
3.71M
          unsigned len2 = len + 1;
1786
3.71M
          unsigned limit = len2 + p->numFastBytes;
1787
3.71M
          if (limit > numAvailFull)
1788
123k
            limit = numAvailFull;
1789
          
1790
3.71M
          len2 += 2;
1791
3.71M
          if (len2 <= limit)
1792
3.70M
          if (data[len2 - 2] == data2[len2 - 2])
1793
1.57M
          if (data[len2 - 1] == data2[len2 - 1])
1794
1.01M
          {
1795
4.75M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1796
3.74M
          {}
1797
          
1798
1.01M
          len2 -= len;
1799
          
1800
          // if (len2 >= 3)
1801
1.01M
          {
1802
1.01M
            unsigned state2 = kMatchNextStates[state];
1803
1.01M
            unsigned posState2 = (position + len) & p->pbMask;
1804
1.01M
            unsigned offset;
1805
1.01M
            price += GET_PRICE_0(p->isMatch[state2][posState2]);
1806
1.01M
            price += LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1807
1.01M
                    data[len], data2[len], p->ProbPrices);
1808
1809
            // state2 = kLiteralNextStates[state2];
1810
1.01M
            state2 = kState_LitAfterMatch;
1811
1812
1.01M
            posState2 = (posState2 + 1) & p->pbMask;
1813
1.01M
            price += GetPrice_Rep_0(p, state2, posState2);
1814
1815
1.01M
            offset = cur + len + len2;
1816
1817
1.01M
            if (last < offset)
1818
130k
              last = offset;
1819
            // do
1820
1.01M
            {
1821
1.01M
              UInt32 price2;
1822
1.01M
              COptimal *opt;
1823
1.01M
              len2--;
1824
              // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1825
1.01M
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1826
1.01M
              opt = &p->opt[offset];
1827
              // offset--;
1828
1.01M
              if (price2 < opt->price)
1829
476k
              {
1830
476k
                opt->price = price2;
1831
476k
                opt->len = (UInt32)len2;
1832
476k
                opt->extra = (CExtra)(len + 1);
1833
476k
                opt->dist = dist + LZMA_NUM_REPS;
1834
476k
              }
1835
1.01M
            }
1836
            // while (len2 >= 3);
1837
1.01M
          }
1838
1839
1.01M
          }
1840
        
1841
3.71M
          offs += 2;
1842
3.71M
          if (offs == numPairs)
1843
2.95M
            break;
1844
761k
          dist = matches[(size_t)offs + 1];
1845
          // if (dist >= kNumFullDistances)
1846
761k
            GetPosSlot2(dist, posSlot);
1847
761k
        }
1848
16.8M
      }
1849
2.95M
    }
1850
4.79M
  }
1851
1852
  // Reset the price of every slot in [1, last] to kInfinityPrice before returning.
432k
  do
1853
5.60M
    p->opt[last].price = kInfinityPrice;
1854
5.60M
  while (--last);
1855
1856
432k
  return Backward(p, cur);
1857
463k
}
1858
1859
1860
1861
115k
/* Non-zero when smallDist is less than bigDist / 128 (bigDist >> 7). */
#define ChangePair(smallDist, bigDist) ((smallDist) < ((bigDist) >> 7))
1862
1863
1864
1865
/*
  Heuristic (non price-based) choice of the next coding step.

  Returns the step length and stores its kind in p->backRes:
    MARK_LIT               : literal (return value 1)
    0 .. LZMA_NUM_REPS - 1 : rep match with that index
    dist + LZMA_NUM_REPS   : normal match

  Order of decisions:
    1. any rep, then the main match, that reaches p->numFastBytes is taken at once;
    2. the main match is swapped for a pair one byte shorter while ChangePair()
       says the shorter pair's distance is much smaller, and a 2-byte match
       with distance >= 0x80 is discarded;
    3. the best rep wins when it is at most 1 / 2 / 3 bytes shorter than the
       main match (the 2 and 3 byte allowances require distance >= 2^9 / 2^15);
    4. otherwise the matches at the next position are read; if they look
       better, or a rep at the next position covers at least mainLen - 1
       bytes, a literal is emitted instead.
*/
static unsigned GetOptimumFast(CLzmaEnc *p)
{
  const Byte *cur;
  UInt32 avail, bestDist;
  unsigned bestLen, pairCount, bestRep, bestRepLen, r;

  if (p->additionalOffset != 0)
  {
    /* Matches for this position were already read by the previous call. */
    bestLen = p->longestMatchLen;
    pairCount = p->numPairs;
  }
  else
    bestLen = ReadMatchDistances(p, &pairCount);

  avail = p->numAvail;
  p->backRes = MARK_LIT;
  if (avail < 2)
    return 1;
  // if (mainLen < 2 && p->state == 0) return 1; // 18.06.notused
  if (avail > LZMA_MATCH_LEN_MAX)
    avail = LZMA_MATCH_LEN_MAX;
  cur = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
  bestRep = 0;
  bestRepLen = 0;

  for (r = 0; r < LZMA_NUM_REPS; r++)
  {
    const Byte *ref = cur - p->reps[r];
    unsigned n;

    if (cur[0] != ref[0] || cur[1] != ref[1])
      continue;

    n = 2;
    while (n < avail && cur[n] == ref[n])
      n++;

    if (n >= p->numFastBytes)
    {
      p->backRes = (UInt32)r;
      MOVE_POS(p, n - 1)
      return n;
    }
    if (n > bestRepLen)
    {
      bestRep = r;
      bestRepLen = n;
    }
  }

  if (bestLen >= p->numFastBytes)
  {
    p->backRes = p->matches[(size_t)pairCount - 1] + LZMA_NUM_REPS;
    MOVE_POS(p, bestLen - 1)
    return bestLen;
  }

  bestDist = 0; /* for GCC */

  if (bestLen >= 2)
  {
    bestDist = p->matches[(size_t)pairCount - 1];

    while (pairCount > 2 && bestLen == p->matches[(size_t)pairCount - 4] + 1)
    {
      const UInt32 shorterDist = p->matches[(size_t)pairCount - 3];
      if (!ChangePair(shorterDist, bestDist))
        break;
      pairCount -= 2;
      bestLen--;
      bestDist = shorterDist;
    }

    if (bestLen == 2 && bestDist >= 0x80)
      bestLen = 1;
  }

  if (bestRepLen >= 2
      && (    bestRepLen + 1 >= bestLen
          || (bestRepLen + 2 >= bestLen && bestDist >= (1 << 9))
          || (bestRepLen + 3 >= bestLen && bestDist >= (1 << 15))))
  {
    p->backRes = (UInt32)bestRep;
    MOVE_POS(p, bestRepLen - 1)
    return bestRepLen;
  }

  if (bestLen < 2 || avail <= 2)
    return 1;

  {
    /* Look one position ahead; the result is kept for the next call. */
    const unsigned nextLen = ReadMatchDistances(p, &p->numPairs);
    p->longestMatchLen = nextLen;

    if (nextLen >= 2)
    {
      const UInt32 nextDist = p->matches[(size_t)p->numPairs - 1];
      if (   (nextLen >= bestLen && nextDist < bestDist)
          || (nextLen == bestLen + 1 && !ChangePair(bestDist, nextDist))
          || (nextLen >  bestLen + 1)
          || (nextLen + 1 >= bestLen && bestLen >= 3 && ChangePair(nextDist, bestDist)))
        return 1;
    }
  }

  cur = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;

  for (r = 0; r < LZMA_NUM_REPS; r++)
  {
    const Byte *ref = cur - p->reps[r];
    unsigned n, stop;

    if (cur[0] != ref[0] || cur[1] != ref[1])
      continue;

    stop = bestLen - 1;
    n = 2;
    while (n < stop && cur[n] == ref[n])
      n++;
    if (n >= stop)
      return 1;
  }

  p->backRes = bestDist + LZMA_NUM_REPS;
  if (bestLen != 2)
  {
    MOVE_POS(p, bestLen - 2)
  }
  return bestLen;
}
1991
1992
1993
1994
1995
/*
  Emits the end-of-stream marker through the range coder.

  The marker is coded as an ordinary (non-rep) match:
    - isMatch bit = 1, isRep bit = 0, state advanced via kMatchNextStates;
    - length symbol 0 (LenEnc_Encode with sym == 0);
    - a position slot made only of 1 bits (kNumPosSlotBits of them),
      taken from posSlotEncoder[0];
    - (30 - kNumAlignBits) direct bits, all 1;
    - the align-tree bits, all 1.

  p        : encoder state; p->rc and p->state are updated.
  posState : position state used to select the isMatch / length contexts.

  The RC_BIT_* macros work on the local variables `range`, `ttt` and
  `newBound`, so those names must stay as they are.
*/
static void WriteEndMarker(CLzmaEnc *p, unsigned posState)
{
  UInt32 range;
  range = p->rc.range;
  {
    UInt32 ttt, newBound;
    CLzmaProb *prob = &p->isMatch[p->state][posState];
    RC_BIT_PRE(&p->rc, prob)
    RC_BIT_1(&p->rc, prob)
    prob = &p->isRep[p->state];
    RC_BIT_PRE(&p->rc, prob)
    RC_BIT_0(&p->rc, prob)
  }
  p->state = kMatchNextStates[p->state];

  /* LenEnc_Encode reads and writes p->rc.range itself, so the cached value is synced around it. */
  p->rc.range = range;
  LenEnc_Encode(&p->lenProbs, &p->rc, 0, posState);
  range = p->rc.range;

  {
    /* Same as: RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[0], (1 << kNumPosSlotBits) - 1); */
    CLzmaProb *probs = p->posSlotEncoder[0];
    unsigned m = 1;
    do
    {
      UInt32 ttt, newBound;
      RC_BIT_PRE(&p->rc, probs + m)
      RC_BIT_1(&p->rc, probs + m);
      m = (m << 1) + 1;
    }
    while (m < (1 << kNumPosSlotBits));
  }
  {
    /* Same as: RangeEnc_EncodeDirectBits(&p->rc, ((UInt32)1 << (30 - kNumAlignBits)) - 1, 30 - kNumAlignBits); */
    unsigned numBits = 30 - kNumAlignBits;
    do
    {
      range >>= 1;
      p->rc.low += range;
      RC_NORM(&p->rc)
    }
    while (--numBits);
  }

  {
    /* Same as: RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, kAlignMask); */
    CLzmaProb *probs = p->posAlignEncoder;
    unsigned m = 1;
    do
    {
      UInt32 ttt, newBound;
      RC_BIT_PRE(&p->rc, probs + m)
      RC_BIT_1(&p->rc, probs + m);
      m = (m << 1) + 1;
    }
    while (m < kAlignTableSize);
  }
  p->rc.range = range;
}
2054
2055
2056
/*
  Folds the range-coder and match-finder status into p->result.

  If p->result already holds an error it is returned unchanged.
  Otherwise a write error in p->rc maps to SZ_ERROR_WRITE and a read error
  in p->matchFinderBase maps to SZ_ERROR_READ (the read error wins when
  both are set). Any error also marks the encoder as finished.

  Returns the resulting p->result.
*/
static SRes CheckErrors(CLzmaEnc *p)
{
  if (p->result == SZ_OK)
  {
    SRes status = SZ_OK;
    if (p->rc.res != SZ_OK)
      status = SZ_ERROR_WRITE;
    if (p->matchFinderBase.result != SZ_OK)
      status = SZ_ERROR_READ;
    if (status != SZ_OK)
    {
      p->result = status;
      p->finished = True;
    }
  }
  return p->result;
}
2068
2069
2070
/*
  Ends the current stream: marks the encoder finished, optionally writes
  the end marker (when p->writeEndMark is set), then flushes the range
  coder data and its output stream.

  nowPos : current position; only its low bits (masked with p->pbMask)
           are used, as the posState for the end marker.

  Returns the status reported by CheckErrors().
*/
MY_NO_INLINE static SRes Flush(CLzmaEnc *p, UInt32 nowPos)
{
  p->finished = True;
  if (p->writeEndMark)
  {
    const unsigned posState = nowPos & p->pbMask;
    WriteEndMarker(p, posState);
  }
  RangeEnc_FlushData(&p->rc);
  RangeEnc_FlushStream(&p->rc);
  return CheckErrors(p);
}
2080
2081
2082
/*
  Recomputes p->alignPrices from the current posAlignEncoder probabilities.

  Each loop iteration walks the three low bits of `i` through the
  reverse bit tree once, then stores two prices: entry i (final bit 0)
  and entry i + 8 (final bit 1).
*/
MY_NO_INLINE static void FillAlignPrices(CLzmaEnc *p)
{
  /* NOTE(review): this local is not used directly below; presumably the
     GET_PRICEa* macros refer to it by name, so it must not be renamed. */
  const CProbPrice *ProbPrices = p->ProbPrices;
  const CLzmaProb *probs = p->posAlignEncoder;
  unsigned i;

  for (i = 0; i < kAlignTableSize / 2; i++)
  {
    unsigned rest = i;
    unsigned node = 1;
    UInt32 sum = 0;
    UInt32 lastProb;
    unsigned step;

    for (step = 0; step < 3; step++)
    {
      unsigned bit = rest & 1;
      rest >>= 1;
      sum += GET_PRICEa(probs[node], bit);
      node = (node << 1) + bit;
    }

    lastProb = probs[node];
    p->alignPrices[i    ] = sum + GET_PRICEa_0(lastProb);
    p->alignPrices[i + 8] = sum + GET_PRICEa_1(lastProb);
  }
}
2104
2105
2106
/*
  Rebuilds the distance price tables from the current probabilities and
  resets p->matchPriceCount to 0.

  Step 1: fills tempPrices[] with the footer-bit prices taken from
          p->posEncoders, two entries per loop iteration.
  Step 2: for every length-to-position state (lps):
            a) fills p->posSlotPrices[lps] from p->posSlotEncoder[lps],
               two slots per iteration;
            b) adds a growing fixed cost to the slots starting at
               kEndPosModelIndex;
            c) fills p->distancesPrices[lps] as slot price + tempPrices.

  The local name ProbPrices is not referenced directly below; presumably the
  GET_PRICEa* macros use it by name (NOTE(review): confirm before renaming).
*/
MY_NO_INLINE static void FillDistancesPrices(CLzmaEnc *p)
2107
27.3k
{
2108
  // int y; for (y = 0; y < 100; y++) {
2109
2110
27.3k
  UInt32 tempPrices[kNumFullDistances];
2111
27.3k
  unsigned i, lps;
2112
2113
27.3k
  const CProbPrice *ProbPrices = p->ProbPrices;
2114
27.3k
  p->matchPriceCount = 0;
2115
2116
1.72M
  /* Step 1: i runs over half of the distance range; every iteration writes two tempPrices entries. */
  for (i = kStartPosModelIndex / 2; i < kNumFullDistances / 2; i++)
2117
1.69M
  {
2118
1.69M
    unsigned posSlot = GetPosSlot1(i);
2119
1.69M
    unsigned footerBits = (posSlot >> 1) - 1;
2120
1.69M
    unsigned base = ((2 | (posSlot & 1)) << footerBits);
2121
1.69M
    const CLzmaProb *probs = p->posEncoders + (size_t)base * 2;
2122
    // tempPrices[i] = RcTree_ReverseGetPrice(p->posEncoders + base, footerBits, i - base, p->ProbPrices);
2123
1.69M
    UInt32 price = 0;
2124
1.69M
    unsigned m = 1;
2125
1.69M
    unsigned sym = i;
2126
1.69M
    unsigned offset = (unsigned)1 << footerBits;
2127
1.69M
    /* From here on `base` is the tempPrices index of the first of the two entries. */
    base += i;
2128
    
2129
1.69M
    /* Price the low `footerBits` bits of i, least significant bit first. */
    if (footerBits)
2130
1.64M
    do
2131
5.36M
    {
2132
5.36M
      unsigned bit = sym & 1;
2133
5.36M
      sym >>= 1;
2134
5.36M
      price += GET_PRICEa(probs[m], bit);
2135
5.36M
      m = (m << 1) + bit;
2136
5.36M
    }
2137
5.36M
    while (--footerBits);
2138
2139
1.69M
    {
2140
1.69M
      /* The last tree node is priced for both bit values; the two results land `offset` apart. */
      unsigned prob = probs[m];
2141
1.69M
      tempPrices[base         ] = price + GET_PRICEa_0(prob);
2142
1.69M
      tempPrices[base + offset] = price + GET_PRICEa_1(prob);
2143
1.69M
    }
2144
1.69M
  }
2145
2146
136k
  /* Step 2: one pass per length-to-position state. */
  for (lps = 0; lps < kNumLenToPosStates; lps++)
2147
109k
  {
2148
109k
    unsigned slot;
2149
109k
    unsigned distTableSize2 = (p->distTableSize + 1) >> 1;
2150
109k
    UInt32 *posSlotPrices = p->posSlotPrices[lps];
2151
109k
    const CLzmaProb *probs = p->posSlotEncoder[lps];
2152
    
2153
2.73M
    /* 2a: slots 2*slot and 2*slot + 1 share the five upper tree nodes and differ only in the last bit. */
    for (slot = 0; slot < distTableSize2; slot++)
2154
2.62M
    {
2155
      // posSlotPrices[slot] = RcTree_GetPrice(encoder, kNumPosSlotBits, slot, p->ProbPrices);
2156
2.62M
      UInt32 price;
2157
2.62M
      unsigned bit;
2158
2.62M
      unsigned sym = slot + (1 << (kNumPosSlotBits - 1));
2159
2.62M
      unsigned prob;
2160
2.62M
      bit = sym & 1; sym >>= 1; price  = GET_PRICEa(probs[sym], bit);
2161
2.62M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2162
2.62M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2163
2.62M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2164
2.62M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2165
2.62M
      prob = probs[(size_t)slot + (1 << (kNumPosSlotBits - 1))];
2166
2.62M
      posSlotPrices[(size_t)slot * 2    ] = price + GET_PRICEa_0(prob);
2167
2.62M
      posSlotPrices[(size_t)slot * 2 + 1] = price + GET_PRICEa_1(prob);
2168
2.62M
    }
2169
    
2170
109k
    {
2171
109k
      /* 2b: delta grows by (1 << kNumBitPriceShiftBits) for each further slot pair.
         NOTE(review): presumably this is the cost of the direct bits, which are
         coded without a probability model - confirm against the encoder path. */
      UInt32 delta = ((UInt32)((kEndPosModelIndex / 2 - 1) - kNumAlignBits) << kNumBitPriceShiftBits);
2172
1.97M
      for (slot = kEndPosModelIndex / 2; slot < distTableSize2; slot++)
2173
1.86M
      {
2174
1.86M
        posSlotPrices[(size_t)slot * 2    ] += delta;
2175
1.86M
        posSlotPrices[(size_t)slot * 2 + 1] += delta;
2176
1.86M
        delta += ((UInt32)1 << kNumBitPriceShiftBits);
2177
1.86M
      }
2178
109k
    }
2179
2180
109k
    {
2181
109k
      /* 2c: the first four distances cost only their slot price; the rest add the footer price. */
      UInt32 *dp = p->distancesPrices[lps];
2182
      
2183
109k
      dp[0] = posSlotPrices[0];
2184
109k
      dp[1] = posSlotPrices[1];
2185
109k
      dp[2] = posSlotPrices[2];
2186
109k
      dp[3] = posSlotPrices[3];
2187
2188
6.89M
      for (i = 4; i < kNumFullDistances; i += 2)
2189
6.78M
      {
2190
6.78M
        UInt32 slotPrice = posSlotPrices[GetPosSlot1(i)];
2191
6.78M
        dp[i    ] = slotPrice + tempPrices[i];
2192
6.78M
        dp[i + 1] = slotPrice + tempPrices[i + 1];
2193
6.78M
      }
2194
109k
    }
2195
109k
  }
2196
  // }
2197
27.3k
}
2198
2199
2200
2201
/*
  Puts a freshly allocated CLzmaEnc into its initial state:
  constructs the range encoder and match finder(s), applies the default
  properties from LzmaEncProps_Init(), builds the fast-position table
  (unless LZMA_LOG_BSR is defined) and the price table, and clears the
  literal-probability pointers so no buffer is considered allocated.
*/
void LzmaEnc_Construct(CLzmaEnc *p)
{
  CLzmaEncProps defaultProps;

  RangeEnc_Construct(&p->rc);
  MatchFinder_Construct(&p->matchFinderBase);

  #ifndef _7ZIP_ST
  MatchFinderMt_Construct(&p->matchFinderMt);
  p->matchFinderMt.MatchFinder = &p->matchFinderBase;
  #endif

  LzmaEncProps_Init(&defaultProps);
  LzmaEnc_SetProps(p, &defaultProps);

  #ifndef LZMA_LOG_BSR
  LzmaEnc_FastPosInit(p->g_FastPos);
  #endif

  LzmaEnc_InitPriceTables(p->ProbPrices);

  p->saveState.litProbs = NULL;
  p->litProbs = NULL;
}
2226
2227
/*
  Allocates a CLzmaEnc with `alloc` and constructs it.
  Returns the new handle, or NULL when the allocation fails.
*/
CLzmaEncHandle LzmaEnc_Create(ISzAllocPtr alloc)
{
  CLzmaEnc *enc = (CLzmaEnc *)ISzAlloc_Alloc(alloc, sizeof(CLzmaEnc));
  if (enc == NULL)
    return NULL;
  LzmaEnc_Construct(enc);
  return (void *)enc;
}
2235
2236
/*
  Releases both literal-probability buffers (the live one and the one in
  saveState) through `alloc` and resets the pointers to NULL.
*/
void LzmaEnc_FreeLits(CLzmaEnc *p, ISzAllocPtr alloc)
{
  ISzAlloc_Free(alloc, p->litProbs);
  p->litProbs = NULL;

  ISzAlloc_Free(alloc, p->saveState.litProbs);
  p->saveState.litProbs = NULL;
}
2243
2244
/*
  Frees everything owned by the encoder object, but not the object itself.

  alloc    : allocator used for the literal tables and the range encoder.
  allocBig : allocator used for the match finder(s).
*/
void LzmaEnc_Destruct(CLzmaEnc *p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  #ifndef _7ZIP_ST
  /* the multithreaded match finder exists only in non-_7ZIP_ST builds */
  MatchFinderMt_Destruct(&p->matchFinderMt, allocBig);
  #endif

  MatchFinder_Free(&p->matchFinderBase, allocBig);

  LzmaEnc_FreeLits(p, alloc);
  RangeEnc_Free(&p->rc, alloc);
}
2254
2255
/*
  Destructs the encoder behind handle `p` and then frees the object
  itself with `alloc`.
*/
void LzmaEnc_Destroy(CLzmaEncHandle p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)p;
  LzmaEnc_Destruct(enc, alloc, allocBig);
  ISzAlloc_Free(alloc, p);
}
2260
2261
2262
/*
  Encodes one block of input through the range coder.

  maxPackSize   : when non-zero, the main loop stops once
                    processed + kNumOpts + 300 >= maxUnpackSize, or
                    RangeEnc_GetProcessed_sizet(&p->rc) + kPackReserve >= maxPackSize.
                  when zero, the function returns (without flushing) after at
                  least (1 << 17) input bytes have been processed.
  maxUnpackSize : see maxPackSize; only used when maxPackSize != 0.

  Returns:
    - p->result if the encoder was already finished;
    - the error from CheckErrors() if one is pending on entry;
    - CheckErrors() on the early return for maxPackSize == 0;
    - otherwise the result of Flush(), which also marks the encoder finished.

  p->nowPos64 is advanced by the number of bytes consumed in this call.

  The RC_BIT* / RC_NORM macros work on the locals `range`, `ttt` and
  `newBound`; p->rc.range is written back before any helper that uses the
  range coder is called.
*/
static SRes LzmaEnc_CodeOneBlock(CLzmaEnc *p, UInt32 maxPackSize, UInt32 maxUnpackSize)
2263
16.5k
{
2264
16.5k
  UInt32 nowPos32, startPos32;
2265
16.5k
  /* Deferred match-finder initialization requested by the Prepare functions. */
  if (p->needInit)
2266
8.23k
  {
2267
8.23k
    p->matchFinder.Init(p->matchFinderObj);
2268
8.23k
    p->needInit = 0;
2269
8.23k
  }
2270
2271
16.5k
  if (p->finished)
2272
0
    return p->result;
2273
16.5k
  RINOK(CheckErrors(p));
2274
2275
16.5k
  nowPos32 = (UInt32)p->nowPos64;
2276
16.5k
  startPos32 = nowPos32;
2277
2278
16.5k
  /* Very first byte of the stream: always coded as a plain literal. */
  if (p->nowPos64 == 0)
2279
8.23k
  {
2280
8.23k
    unsigned numPairs;
2281
8.23k
    Byte curByte;
2282
8.23k
    if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2283
0
      return Flush(p, nowPos32);
2284
8.23k
    ReadMatchDistances(p, &numPairs);
2285
8.23k
    RangeEnc_EncodeBit_0(&p->rc, &p->isMatch[kState_Start][0]);
2286
    // p->state = kLiteralNextStates[p->state];
2287
8.23k
    curByte = *(p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset);
2288
8.23k
    LitEnc_Encode(&p->rc, p->litProbs, curByte);
2289
8.23k
    p->additionalOffset--;
2290
8.23k
    nowPos32++;
2291
8.23k
  }
2292
2293
16.5k
  /* Main loop: runs only while input is available; the `if` guards the whole `for`. */
  if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) != 0)
2294
  
2295
8.25k
  for (;;)
2296
8.18M
  {
2297
8.18M
    UInt32 dist;
2298
8.18M
    unsigned len, posState;
2299
8.18M
    UInt32 range, ttt, newBound;
2300
8.18M
    CLzmaProb *probs;
2301
  
2302
8.18M
    /* Pick the next symbol: fast heuristic, a fresh optimal parse, or the next
       entry of the already computed p->opt[] sequence. The choice is left in
       `len` and p->backRes. */
    if (p->fastMode)
2303
3.13M
      len = GetOptimumFast(p);
2304
5.05M
    else
2305
5.05M
    {
2306
5.05M
      unsigned oci = p->optCur;
2307
5.05M
      if (p->optEnd == oci)
2308
3.34M
        len = GetOptimum(p, nowPos32);
2309
1.70M
      else
2310
1.70M
      {
2311
1.70M
        const COptimal *opt = &p->opt[oci];
2312
1.70M
        len = opt->len;
2313
1.70M
        p->backRes = opt->dist;
2314
1.70M
        p->optCur = oci + 1;
2315
1.70M
      }
2316
5.05M
    }
2317
2318
8.18M
    posState = (unsigned)nowPos32 & p->pbMask;
2319
8.18M
    range = p->rc.range;
2320
8.18M
    probs = &p->isMatch[p->state][posState];
2321
    
2322
8.18M
    RC_BIT_PRE(&p->rc, probs)
2323
    
2324
8.18M
    dist = p->backRes;
2325
2326
    #ifdef SHOW_STAT2
2327
    printf("\n pos = %6X, len = %3u  pos = %6u", nowPos32, len, dist);
2328
    #endif
2329
2330
8.18M
    /* Case 1: literal (isMatch bit = 0). */
    if (dist == MARK_LIT)
2331
6.71M
    {
2332
6.71M
      Byte curByte;
2333
6.71M
      const Byte *data;
2334
6.71M
      unsigned state;
2335
2336
6.71M
      RC_BIT_0(&p->rc, probs);
2337
6.71M
      p->rc.range = range;
2338
6.71M
      data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset;
2339
6.71M
      probs = LIT_PROBS(nowPos32, *(data - 1));
2340
6.71M
      curByte = *data;
2341
6.71M
      state = p->state;
2342
6.71M
      p->state = kLiteralNextStates[state];
2343
6.71M
      /* After a match the literal is coded against the byte at distance reps[0]. */
      if (IsLitState(state))
2344
6.35M
        LitEnc_Encode(&p->rc, probs, curByte);
2345
361k
      else
2346
361k
        LitEnc_EncodeMatched(&p->rc, probs, curByte, *(data - p->reps[0]));
2347
6.71M
    }
2348
1.47M
    else
2349
1.47M
    {
2350
1.47M
      RC_BIT_1(&p->rc, probs);
2351
1.47M
      probs = &p->isRep[p->state];
2352
1.47M
      RC_BIT_PRE(&p->rc, probs)
2353
      
2354
1.47M
      /* Case 2: repeated distance; `dist` is the index into p->reps[]. */
      if (dist < LZMA_NUM_REPS)
2355
561k
      {
2356
561k
        RC_BIT_1(&p->rc, probs);
2357
561k
        probs = &p->isRepG0[p->state];
2358
561k
        RC_BIT_PRE(&p->rc, probs)
2359
561k
        if (dist == 0)
2360
185k
        {
2361
185k
          RC_BIT_0(&p->rc, probs);
2362
185k
          probs = &p->isRep0Long[p->state][posState];
2363
185k
          RC_BIT_PRE(&p->rc, probs)
2364
185k
          /* rep0 with len == 1 is the "short rep": no length is coded for it. */
          if (len != 1)
2365
121k
          {
2366
121k
            RC_BIT_1_BASE(&p->rc, probs);
2367
121k
          }
2368
63.8k
          else
2369
63.8k
          {
2370
63.8k
            RC_BIT_0_BASE(&p->rc, probs);
2371
63.8k
            p->state = kShortRepNextStates[p->state];
2372
63.8k
          }
2373
185k
        }
2374
376k
        else
2375
376k
        {
2376
376k
          /* rep1..rep3: code the index, then move the chosen distance to reps[0]. */
          RC_BIT_1(&p->rc, probs);
2377
376k
          probs = &p->isRepG1[p->state];
2378
376k
          RC_BIT_PRE(&p->rc, probs)
2379
376k
          if (dist == 1)
2380
171k
          {
2381
171k
            RC_BIT_0_BASE(&p->rc, probs);
2382
171k
            dist = p->reps[1];
2383
171k
          }
2384
205k
          else
2385
205k
          {
2386
205k
            RC_BIT_1(&p->rc, probs);
2387
205k
            probs = &p->isRepG2[p->state];
2388
205k
            RC_BIT_PRE(&p->rc, probs)
2389
205k
            if (dist == 2)
2390
119k
            {
2391
119k
              RC_BIT_0_BASE(&p->rc, probs);
2392
119k
              dist = p->reps[2];
2393
119k
            }
2394
85.6k
            else
2395
85.6k
            {
2396
85.6k
              RC_BIT_1_BASE(&p->rc, probs);
2397
85.6k
              dist = p->reps[3];
2398
85.6k
              p->reps[3] = p->reps[2];
2399
85.6k
            }
2400
205k
            p->reps[2] = p->reps[1];
2401
205k
          }
2402
376k
          p->reps[1] = p->reps[0];
2403
376k
          p->reps[0] = dist;
2404
376k
        }
2405
2406
561k
        RC_NORM(&p->rc)
2407
2408
561k
        p->rc.range = range;
2409
2410
561k
        if (len != 1)
2411
497k
        {
2412
497k
          LenEnc_Encode(&p->repLenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2413
497k
          --p->repLenEncCounter;
2414
497k
          p->state = kRepNextStates[p->state];
2415
497k
        }
2416
561k
      }
2417
909k
      else
2418
909k
      {
2419
909k
        /* Case 3: normal match with an explicit distance. */
        unsigned posSlot;
2420
909k
        RC_BIT_0(&p->rc, probs);
2421
909k
        p->rc.range = range;
2422
909k
        p->state = kMatchNextStates[p->state];
2423
2424
909k
        LenEnc_Encode(&p->lenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2425
        // --p->lenEnc.counter;
2426
2427
909k
        /* backRes stores the distance shifted up by LZMA_NUM_REPS; after the
           subtraction `dist` is one less than the value kept in reps[0]. */
        dist -= LZMA_NUM_REPS;
2428
909k
        p->reps[3] = p->reps[2];
2429
909k
        p->reps[2] = p->reps[1];
2430
909k
        p->reps[1] = p->reps[0];
2431
909k
        p->reps[0] = dist + 1;
2432
        
2433
909k
        p->matchPriceCount++;
2434
909k
        GetPosSlot(dist, posSlot);
2435
        // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[GetLenToPosState(len)], posSlot);
2436
909k
        {
2437
909k
          /* Position slot: kNumPosSlotBits tree-coded bits, most significant first. */
          UInt32 sym = (UInt32)posSlot + (1 << kNumPosSlotBits);
2438
909k
          range = p->rc.range;
2439
909k
          probs = p->posSlotEncoder[GetLenToPosState(len)];
2440
909k
          do
2441
5.45M
          {
2442
5.45M
            CLzmaProb *prob = probs + (sym >> kNumPosSlotBits);
2443
5.45M
            UInt32 bit = (sym >> (kNumPosSlotBits - 1)) & 1;
2444
5.45M
            sym <<= 1;
2445
5.45M
            RC_BIT(&p->rc, prob, bit);
2446
5.45M
          }
2447
5.45M
          while (sym < (1 << kNumPosSlotBits * 2));
2448
909k
          p->rc.range = range;
2449
909k
        }
2450
        
2451
909k
        if (dist >= kStartPosModelIndex)
2452
597k
        {
2453
597k
          unsigned footerBits = ((posSlot >> 1) - 1);
2454
2455
597k
          if (dist < kNumFullDistances)
2456
453k
          {
2457
453k
            /* Mid-range distances: all footer bits go through the posEncoders reverse tree. */
            unsigned base = ((2 | (posSlot & 1)) << footerBits);
2458
453k
            RcTree_ReverseEncode(&p->rc, p->posEncoders + base, footerBits, (unsigned)(dist /* - base */));
2459
453k
          }
2460
143k
          else
2461
143k
          {
2462
143k
            /* Large distances: the upper footer bits are written as direct bits,
               then the low four bits go through the align reverse tree.
               `dist | 0xF` puts a marker below the direct bits, so the loop
               stops when pos2 becomes 0xF0000000. */
            UInt32 pos2 = (dist | 0xF) << (32 - footerBits);
2463
143k
            range = p->rc.range;
2464
            // RangeEnc_EncodeDirectBits(&p->rc, posReduced >> kNumAlignBits, footerBits - kNumAlignBits);
2465
            /*
2466
            do
2467
            {
2468
              range >>= 1;
2469
              p->rc.low += range & (0 - ((dist >> --footerBits) & 1));
2470
              RC_NORM(&p->rc)
2471
            }
2472
            while (footerBits > kNumAlignBits);
2473
            */
2474
143k
            do
2475
618k
            {
2476
618k
              range >>= 1;
2477
618k
              p->rc.low += range & (0 - (pos2 >> 31));
2478
618k
              pos2 += pos2;
2479
618k
              RC_NORM(&p->rc)
2480
618k
            }
2481
618k
            while (pos2 != 0xF0000000);
2482
2483
2484
            // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, posReduced & kAlignMask);
2485
2486
143k
            {
2487
143k
              unsigned m = 1;
2488
143k
              unsigned bit;
2489
143k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2490
143k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2491
143k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2492
143k
              bit = dist & 1;             RC_BIT(&p->rc, p->posAlignEncoder + m, bit);
2493
143k
              p->rc.range = range;
2494
              // p->alignPriceCount++;
2495
143k
            }
2496
143k
          }
2497
597k
        }
2498
909k
      }
2499
1.47M
    }
2500
2501
8.18M
    nowPos32 += (UInt32)len;
2502
8.18M
    p->additionalOffset -= len;
2503
    
2504
8.18M
    /* Price refresh and stop conditions are evaluated only when additionalOffset has dropped to 0. */
    if (p->additionalOffset == 0)
2505
6.39M
    {
2506
6.39M
      UInt32 processed;
2507
2508
6.39M
      if (!p->fastMode)
2509
3.31M
      {
2510
        /*
2511
        if (p->alignPriceCount >= 16) // kAlignTableSize
2512
          FillAlignPrices(p);
2513
        if (p->matchPriceCount >= 128)
2514
          FillDistancesPrices(p);
2515
        if (p->lenEnc.counter <= 0)
2516
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2517
        */
2518
3.31M
        /* Refresh the price tables after 64 normal matches (FillDistancesPrices resets the counter). */
        if (p->matchPriceCount >= 64)
2519
10.1k
        {
2520
10.1k
          FillAlignPrices(p);
2521
          // { int y; for (y = 0; y < 100; y++) {
2522
10.1k
          FillDistancesPrices(p);
2523
          // }}
2524
10.1k
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2525
10.1k
        }
2526
3.31M
        if (p->repLenEncCounter <= 0)
2527
3.28k
        {
2528
3.28k
          p->repLenEncCounter = REP_LEN_COUNT;
2529
3.28k
          LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
2530
3.28k
        }
2531
3.31M
      }
2532
    
2533
6.39M
      if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2534
8.19k
        break;
2535
6.39M
      processed = nowPos32 - startPos32;
2536
      
2537
6.39M
      if (maxPackSize)
2538
6.39M
      {
2539
6.39M
        /* Size-limited mode: leave the loop (and flush) before a limit can be exceeded. */
        if (processed + kNumOpts + 300 >= maxUnpackSize
2540
6.39M
            || RangeEnc_GetProcessed_sizet(&p->rc) + kPackReserve >= maxPackSize)
2541
67
          break;
2542
6.39M
      }
2543
0
      else if (processed >= (1 << 17))
2544
0
      {
2545
0
        /* Unlimited mode: return to the caller without flushing. */
        p->nowPos64 += nowPos32 - startPos32;
2546
0
        return CheckErrors(p);
2547
0
      }
2548
6.39M
    }
2549
8.18M
  }
2550
2551
16.5k
  p->nowPos64 += nowPos32 - startPos32;
2552
16.5k
  return Flush(p, nowPos32);
2553
16.5k
}
2554
2555
2556
2557
8.23k
#define kBigHashDicLimit ((UInt32)1 << 24)
2558
2559
/*
  Allocates the buffers the encoder needs for the current properties.

  keepWindowSize : minimum number of bytes that beforeSize + dictSize must cover;
                   beforeSize starts at kNumOpts and is raised if needed.
  alloc          : allocator for the range encoder buffer and the literal tables.
  allocBig       : allocator handed to the match finder.

  Returns SZ_OK, or SZ_ERROR_MEM when an allocation fails (in multithreaded
  mode, any error returned by MatchFinderMt_Create is passed through by RINOK).
*/
static SRes LzmaEnc_Alloc(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2560
8.23k
{
2561
8.23k
  UInt32 beforeSize = kNumOpts;
2562
8.23k
  if (!RangeEnc_Alloc(&p->rc, alloc))
2563
0
    return SZ_ERROR_MEM;
2564
2565
  #ifndef _7ZIP_ST
2566
  p->mtMode = (p->multiThread && !p->fastMode && (p->matchFinderBase.btMode != 0));
2567
  #endif
2568
2569
8.23k
  {
2570
8.23k
    /* The literal tables hold (0x300 << (lc + lp)) probabilities each; they are
       reallocated only when missing or when lc + lp has changed. */
    unsigned lclp = p->lc + p->lp;
2571
8.23k
    if (!p->litProbs || !p->saveState.litProbs || p->lclp != lclp)
2572
8.23k
    {
2573
8.23k
      LzmaEnc_FreeLits(p, alloc);
2574
8.23k
      p->litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, ((UInt32)0x300 << lclp) * sizeof(CLzmaProb));
2575
8.23k
      p->saveState.litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, ((UInt32)0x300 << lclp) * sizeof(CLzmaProb));
2576
8.23k
      if (!p->litProbs || !p->saveState.litProbs)
2577
0
      {
2578
0
        LzmaEnc_FreeLits(p, alloc);
2579
0
        return SZ_ERROR_MEM;
2580
0
      }
2581
8.23k
      p->lclp = lclp;
2582
8.23k
    }
2583
8.23k
  }
2584
2585
8.23k
  p->matchFinderBase.bigHash = (Byte)(p->dictSize > kBigHashDicLimit ? 1 : 0);
2586
2587
8.23k
  if (beforeSize + p->dictSize < keepWindowSize)
2588
0
    beforeSize = keepWindowSize - p->dictSize;
2589
2590
  #ifndef _7ZIP_ST
2591
  if (p->mtMode)
2592
  {
2593
    RINOK(MatchFinderMt_Create(&p->matchFinderMt, p->dictSize, beforeSize, p->numFastBytes,
2594
        LZMA_MATCH_LEN_MAX
2595
        + 1  /* 18.04 */
2596
        , allocBig));
2597
    p->matchFinderObj = &p->matchFinderMt;
2598
    p->matchFinderBase.bigHash = (Byte)(
2599
        (p->dictSize > kBigHashDicLimit && p->matchFinderBase.hashMask >= 0xFFFFFF) ? 1 : 0);
2600
    MatchFinderMt_CreateVTable(&p->matchFinderMt, &p->matchFinder);
2601
  }
2602
  else
2603
  #endif
2604
8.23k
  /* Single-threaded match finder; in multithreaded builds this block is the `else` branch above. */
  {
2605
8.23k
    if (!MatchFinder_Create(&p->matchFinderBase, p->dictSize, beforeSize, p->numFastBytes, LZMA_MATCH_LEN_MAX, allocBig))
2606
0
      return SZ_ERROR_MEM;
2607
8.23k
    p->matchFinderObj = &p->matchFinderBase;
2608
8.23k
    MatchFinder_CreateVTable(&p->matchFinderBase, &p->matchFinder);
2609
8.23k
  }
2610
  
2611
8.23k
  return SZ_OK;
2612
8.23k
}
2613
2614
/*
  Resets the coding state of the encoder: state machine, repeat distances,
  range coder, every probability table (to kProbInitValue), the length
  encoders, the optimal-parse buffer, and the pb/lp masks derived from
  the current properties.

  p->litProbs must already point to a table of (0x300 << (lp + lc)) entries.
*/
void LzmaEnc_Init(CLzmaEnc *p)
{
  unsigned n, k;

  p->state = 0;
  p->reps[3] = 1;
  p->reps[2] = 1;
  p->reps[1] = 1;
  p->reps[0] = 1;

  RangeEnc_Init(&p->rc);

  for (n = 0; n < (1 << kNumAlignBits); n++)
    p->posAlignEncoder[n] = kProbInitValue;

  /* per-state probabilities */
  for (n = 0; n < kNumStates; n++)
  {
    CLzmaProb *matchRow = p->isMatch[n];
    CLzmaProb *rep0LongRow = p->isRep0Long[n];
    for (k = 0; k < LZMA_NUM_PB_STATES_MAX; k++)
    {
      matchRow[k] = kProbInitValue;
      rep0LongRow[k] = kProbInitValue;
    }
    p->isRep[n] = kProbInitValue;
    p->isRepG0[n] = kProbInitValue;
    p->isRepG1[n] = kProbInitValue;
    p->isRepG2[n] = kProbInitValue;
  }

  /* position-slot trees, one per length-to-position state */
  for (n = 0; n < kNumLenToPosStates; n++)
  {
    CLzmaProb *slotProbs = p->posSlotEncoder[n];
    for (k = 0; k < (1 << kNumPosSlotBits); k++)
      slotProbs[k] = kProbInitValue;
  }

  for (n = 0; n < kNumFullDistances; n++)
    p->posEncoders[n] = kProbInitValue;

  /* literal coder probabilities */
  {
    const UInt32 litCount = (UInt32)0x300 << (p->lp + p->lc);
    CLzmaProb *lit = p->litProbs;
    UInt32 idx;
    for (idx = 0; idx < litCount; idx++)
      lit[idx] = kProbInitValue;
  }

  LenEnc_Init(&p->lenProbs);
  LenEnc_Init(&p->repLenProbs);

  p->optCur = 0;
  p->optEnd = 0;

  for (n = 0; n < kNumOpts; n++)
    p->opt[n].price = kInfinityPrice;

  p->additionalOffset = 0;

  p->pbMask = (1 << p->pb) - 1;
  p->lpMask = ((UInt32)0x100 << p->lp) - ((unsigned)0x100 >> p->lc);
}
2681
2682
2683
/*
  Rebuilds all price tables from the current probabilities.

  The distance and align prices are only computed when fastMode is off.
  Both length price encoders get tableSize = numFastBytes + 1 - LZMA_MATCH_LEN_MIN,
  and the rep-length refresh counter is reset to REP_LEN_COUNT.
*/
void LzmaEnc_InitPrices(CLzmaEnc *p)
{
  if (!p->fastMode)
  {
    FillDistancesPrices(p);
    FillAlignPrices(p);
  }

  p->repLenEnc.tableSize = p->numFastBytes + 1 - LZMA_MATCH_LEN_MIN;
  p->lenEnc.tableSize = p->repLenEnc.tableSize;

  p->repLenEncCounter = REP_LEN_COUNT;

  LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
  LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
}
2700
2701
/*
  Common tail of all Prepare functions.

  Derives distTableSize from the dictionary size (twice the smallest log2
  size in [kEndPosModelIndex / 2, kDicLogSizeMax] that covers dictSize),
  clears the finished/result flags, allocates buffers, initializes the
  coder state and price tables, and rewinds nowPos64 to 0.

  Returns SZ_OK or the error from LzmaEnc_Alloc().
*/
static SRes LzmaEnc_AllocAndInit(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  unsigned logSize = kEndPosModelIndex / 2;
  while (logSize < kDicLogSizeMax && p->dictSize > ((UInt32)1 << logSize))
    logSize++;
  p->distTableSize = logSize * 2;

  p->result = SZ_OK;
  p->finished = False;

  RINOK(LzmaEnc_Alloc(p, keepWindowSize, alloc, allocBig));

  LzmaEnc_Init(p);
  LzmaEnc_InitPrices(p);
  p->nowPos64 = 0;
  return SZ_OK;
}
2717
2718
/*
  Attaches the input and output streams to the encoder, requests a
  match-finder init on the next CodeOneBlock call, and allocates and
  initializes the encoder with keepWindowSize = 0.
*/
static SRes LzmaEnc_Prepare(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream,
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;

  enc->rc.outStream = outStream;
  enc->matchFinderBase.stream = inStream;
  enc->needInit = 1;

  return LzmaEnc_AllocAndInit(enc, 0, alloc, allocBig);
}
2727
2728
SRes LzmaEnc_PrepareForLzma2(CLzmaEncHandle pp,
2729
    ISeqInStream *inStream, UInt32 keepWindowSize,
2730
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2731
8.23k
{
2732
8.23k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2733
8.23k
  p->matchFinderBase.stream = inStream;
2734
8.23k
  p->needInit = 1;
2735
8.23k
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2736
8.23k
}
2737
2738
/*
  Switches the base match finder to direct-input mode, reading straight
  from the caller's buffer `src` of `srcLen` bytes.
*/
static void LzmaEnc_SetInputBuf(CLzmaEnc *p, const Byte *src, SizeT srcLen)
{
  p->matchFinderBase.bufferBase = (Byte *)src;
  p->matchFinderBase.directInputRem = srcLen;
  p->matchFinderBase.directInput = 1;
}
2744
2745
SRes LzmaEnc_MemPrepare(CLzmaEncHandle pp, const Byte *src, SizeT srcLen,
2746
    UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2747
0
{
2748
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2749
0
  LzmaEnc_SetInputBuf(p, src, srcLen);
2750
0
  p->needInit = 1;
2751
2752
0
  LzmaEnc_SetDataSize(pp, srcLen);
2753
0
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2754
0
}
2755
2756
/*
  Finishes an encoding session. In multithreaded builds it releases the
  stream held by the MT match finder when mtMode is on; in _7ZIP_ST
  builds it does nothing.
*/
void LzmaEnc_Finish(CLzmaEncHandle pp)
{
  #ifdef _7ZIP_ST
  UNUSED_VAR(pp);
  #else
  CLzmaEnc *p = (CLzmaEnc *)pp;
  if (p->mtMode)
    MatchFinderMt_ReleaseStream(&p->matchFinderMt);
  #endif
}
2766
2767
2768
/* Output stream that writes into a caller-supplied memory buffer (see SeqOutStreamBuf_Write). */
typedef struct
2769
{
2770
  ISeqOutStream vt;   /* stream interface; the object is recovered from it with CONTAINER_FROM_VTBL */
2771
  Byte *data;         /* current write position */
2772
  SizeT rem;          /* bytes still free at `data` */
2773
  BoolInt overflow;   /* set to True once a write asked for more than `rem` bytes */
2774
} CLzmaEnc_SeqOutStreamBuf;
2775
2776
static size_t SeqOutStreamBuf_Write(const ISeqOutStream *pp, const void *data, size_t size)
2777
16.5k
{
2778
16.5k
  CLzmaEnc_SeqOutStreamBuf *p = CONTAINER_FROM_VTBL(pp, CLzmaEnc_SeqOutStreamBuf, vt);
2779
16.5k
  if (p->rem < size)
2780
0
  {
2781
0
    size = p->rem;
2782
0
    p->overflow = True;
2783
0
  }
2784
16.5k
  memcpy(p->data, data, size);
2785
16.5k
  p->rem -= size;
2786
16.5k
  p->data += size;
2787
16.5k
  return size;
2788
16.5k
}
2789
2790
2791
/* Returns the value reported by the active match finder's GetNumAvailableBytes callback. */
UInt32 LzmaEnc_GetNumAvailableBytes(CLzmaEncHandle pp)
{
  const CLzmaEnc *enc = (CLzmaEnc *)pp;
  void *finder = enc->matchFinderObj;
  return enc->matchFinder.GetNumAvailableBytes(finder);
}
2796
2797
2798
/*
  Returns the match finder's current position pointer moved back by
  p->additionalOffset bytes.
*/
const Byte *LzmaEnc_GetCurBuf(CLzmaEncHandle pp)
{
  const CLzmaEnc *enc = (CLzmaEnc *)pp;
  const Byte *cur = enc->matchFinder.GetPointerToCurrentPos(enc->matchFinderObj);
  return cur - enc->additionalOffset;
}
2803
2804
2805
SRes LzmaEnc_CodeOneMemBlock(CLzmaEncHandle pp, BoolInt reInit,
2806
    Byte *dest, size_t *destLen, UInt32 desiredPackSize, UInt32 *unpackSize)
2807
16.5k
{
2808
16.5k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2809
16.5k
  UInt64 nowPos64;
2810
16.5k
  SRes res;
2811
16.5k
  CLzmaEnc_SeqOutStreamBuf outStream;
2812
2813
16.5k
  outStream.vt.Write = SeqOutStreamBuf_Write;
2814
16.5k
  outStream.data = dest;
2815
16.5k
  outStream.rem = *destLen;
2816
16.5k
  outStream.overflow = False;
2817
2818
16.5k
  p->writeEndMark = False;
2819
16.5k
  p->finished = False;
2820
16.5k
  p->result = SZ_OK;
2821
2822
16.5k
  if (reInit)
2823
10.3k
    LzmaEnc_Init(p);
2824
16.5k
  LzmaEnc_InitPrices(p);
2825
2826
16.5k
  nowPos64 = p->nowPos64;
2827
16.5k
  RangeEnc_Init(&p->rc);
2828
16.5k
  p->rc.outStream = &outStream.vt;
2829
2830
16.5k
  if (desiredPackSize == 0)
2831
0
    return SZ_ERROR_OUTPUT_EOF;
2832
2833
16.5k
  res = LzmaEnc_CodeOneBlock(p, desiredPackSize, *unpackSize);
2834
  
2835
16.5k
  *unpackSize = (UInt32)(p->nowPos64 - nowPos64);
2836
16.5k
  *destLen -= outStream.rem;
2837
16.5k
  if (outStream.overflow)
2838
0
    return SZ_ERROR_OUTPUT_EOF;
2839
2840
16.5k
  return res;
2841
16.5k
}
2842
2843
2844
/*
  Drives LzmaEnc_CodeOneBlock() in unlimited mode until the encoder
  reports it is finished or an error occurs, calling the optional
  progress callback after every block.

  A non-OK result from the progress callback aborts encoding with
  SZ_ERROR_PROGRESS. LzmaEnc_Finish() is always called before returning.
*/
static SRes LzmaEnc_Encode2(CLzmaEnc *p, ICompressProgress *progress)
{
  SRes res = SZ_OK;

  #ifndef _7ZIP_ST
  Byte allocaDummy[0x300];
  allocaDummy[0] = 0;
  allocaDummy[1] = allocaDummy[0];
  #endif

  do
  {
    res = LzmaEnc_CodeOneBlock(p, 0, 0);
    if (res != SZ_OK || p->finished)
      break;
    if (progress
        && ICompressProgress_Progress(progress, p->nowPos64, RangeEnc_GetProcessed(&p->rc)) != SZ_OK)
      res = SZ_ERROR_PROGRESS;
  }
  while (res == SZ_OK);

  LzmaEnc_Finish(p);

  return res;
}
2880
2881
2882
/*
  Stream-to-stream encoding: prepares the encoder for the given streams
  and runs the encode loop. Returns the first error encountered, or the
  result of LzmaEnc_Encode2().
*/
SRes LzmaEnc_Encode(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream, ICompressProgress *progress,
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  RINOK(LzmaEnc_Prepare(pp, outStream, inStream, alloc, allocBig));
  return LzmaEnc_Encode2(enc, progress);
}
2888
2889
2890
/*
  Writes the LZMA_PROPS_SIZE-byte properties header.

  props[0]    = (pb * 5 + lp) * 9 + lc
  props[1..4] = dictionary size, least significant byte first

  The stored dictionary size is rounded up:
    - sizes of at least (1 << 22) go up to a multiple of (1 << 20),
      unless that would overflow 32 bits;
    - smaller sizes go up to the next value of the form (2 << i) or (3 << i).

  size : in: capacity of `props`; out: LZMA_PROPS_SIZE.

  Returns SZ_ERROR_PARAM when *size is too small, SZ_OK otherwise.
*/
SRes LzmaEnc_WriteProperties(CLzmaEncHandle pp, Byte *props, SizeT *size)
{
  CLzmaEnc *p = (CLzmaEnc *)pp;
  unsigned i;
  UInt32 dictSize = p->dictSize;
  if (*size < LZMA_PROPS_SIZE)
    return SZ_ERROR_PARAM;
  *size = LZMA_PROPS_SIZE;
  props[0] = (Byte)((p->pb * 5 + p->lp) * 9 + p->lc);

  if (dictSize >= ((UInt32)1 << 22))
  {
    const UInt32 kDictMask = ((UInt32)1 << 20) - 1;
    if (dictSize < (UInt32)0xFFFFFFFF - kDictMask)
      dictSize = (dictSize + kDictMask) & ~kDictMask;
  }
  else for (i = 11; i <= 30; i++)
  {
    /* The assigned value uses the same unsigned expression as the comparison:
       a plain `2 << i` / `3 << i` is a signed int shift and overflows for i == 30. */
    if (dictSize <= ((UInt32)2 << i)) { dictSize = ((UInt32)2 << i); break; }
    if (dictSize <= ((UInt32)3 << i)) { dictSize = ((UInt32)3 << i); break; }
  }

  for (i = 0; i < 4; i++)
    props[1 + i] = (Byte)(dictSize >> (8 * i));
  return SZ_OK;
}
2916
2917
2918
/* Returns the encoder's writeEndMark setting. */
unsigned LzmaEnc_IsWriteEndMark(CLzmaEncHandle pp)
{
  const CLzmaEnc *enc = (const CLzmaEnc *)pp;
  return enc->writeEndMark;
}
2922
2923
2924
/*
  Memory-to-memory encoding with an already created encoder.

  dest, destLen : output buffer and its capacity; on return *destLen is
                  the number of bytes written.
  src, srcLen   : input data.
  writeEndMark  : stored in the encoder; when non-zero an end marker is written.

  Returns SZ_ERROR_OUTPUT_EOF when the output buffer overflowed,
  SZ_ERROR_FAIL when encoding succeeded but did not consume exactly
  srcLen bytes, otherwise the status of preparation or encoding.
*/
SRes LzmaEnc_MemEncode(CLzmaEncHandle pp, Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
    int writeEndMark, ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *p = (CLzmaEnc *)pp;
  CLzmaEnc_SeqOutStreamBuf sink;
  SRes status;

  sink.vt.Write = SeqOutStreamBuf_Write;
  sink.data = dest;
  sink.rem = *destLen;
  sink.overflow = False;

  p->writeEndMark = writeEndMark;
  p->rc.outStream = &sink.vt;

  status = LzmaEnc_MemPrepare(pp, src, srcLen, 0, alloc, allocBig);

  if (status == SZ_OK)
    status = LzmaEnc_Encode2(p, progress);
  if (status == SZ_OK && p->nowPos64 != srcLen)
    status = SZ_ERROR_FAIL;

  *destLen -= sink.rem;
  return sink.overflow ? SZ_ERROR_OUTPUT_EOF : status;
}
2954
2955
2956
SRes LzmaEncode(Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
2957
    const CLzmaEncProps *props, Byte *propsEncoded, SizeT *propsSize, int writeEndMark,
2958
    ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2959
0
{
2960
0
  CLzmaEnc *p = (CLzmaEnc *)LzmaEnc_Create(alloc);
2961
0
  SRes res;
2962
0
  if (!p)
2963
0
    return SZ_ERROR_MEM;
2964
2965
0
  res = LzmaEnc_SetProps(p, props);
2966
0
  if (res == SZ_OK)
2967
0
  {
2968
0
    res = LzmaEnc_WriteProperties(p, propsEncoded, propsSize);
2969
0
    if (res == SZ_OK)
2970
0
      res = LzmaEnc_MemEncode(p, dest, destLen, src, srcLen,
2971
0
          writeEndMark, progress, alloc, allocBig);
2972
0
  }
2973
2974
0
  LzmaEnc_Destroy(p, alloc, allocBig);
2975
0
  return res;
2976
0
}