Coverage Report

Created: 2023-03-26 06:59

/src/lzma-fuzz/sdk/C/LzmaEnc.c
Line
Count
Source (jump to first uncovered line)
1
/* LzmaEnc.c -- LZMA Encoder
2
2019-01-10: Igor Pavlov : Public domain */
3
4
#include "Precomp.h"
5
6
#include <string.h>
7
8
/* #define SHOW_STAT */
9
/* #define SHOW_STAT2 */
10
11
#if defined(SHOW_STAT) || defined(SHOW_STAT2)
12
#include <stdio.h>
13
#endif
14
15
#include "LzmaEnc.h"
16
17
#include "LzFind.h"
18
#ifndef _7ZIP_ST
19
#include "LzFindMt.h"
20
#endif
21
22
#ifdef SHOW_STAT
23
static unsigned g_STAT_OFFSET = 0;
24
#endif
25
26
14.5k
#define kLzmaMaxHistorySize ((UInt32)3 << 29)
27
/* #define kLzmaMaxHistorySize ((UInt32)7 << 29) */
28
29
37.9M
#define kNumTopBits 24
30
37.9M
#define kTopValue ((UInt32)1 << kNumTopBits)
31
32
9.41G
#define kNumBitModelTotalBits 11
33
9.37G
#define kBitModelTotal (1 << kNumBitModelTotalBits)
34
94.2M
#define kNumMoveBits 5
35
9.25G
#define kProbInitValue (kBitModelTotal >> 1)
36
37
109M
#define kNumMoveReducingBits 4
38
1.72M
#define kNumBitPriceShiftBits 4
39
#define kBitPrice (1 << kNumBitPriceShiftBits)
40
41
10.7k
#define REP_LEN_COUNT 64
42
43
void LzmaEncProps_Init(CLzmaEncProps *p)
44
14.5k
{
45
14.5k
  p->level = 5;
46
14.5k
  p->dictSize = p->mc = 0;
47
14.5k
  p->reduceSize = (UInt64)(Int64)-1;
48
14.5k
  p->lc = p->lp = p->pb = p->algo = p->fb = p->btMode = p->numHashBytes = p->numThreads = -1;
49
14.5k
  p->writeEndMark = 0;
50
14.5k
}
51
52
void LzmaEncProps_Normalize(CLzmaEncProps *p)
53
21.8k
{
54
21.8k
  int level = p->level;
55
21.8k
  if (level < 0) level = 5;
56
21.8k
  p->level = level;
57
  
58
21.8k
  if (p->dictSize == 0) p->dictSize = (level <= 5 ? (1 << (level * 2 + 14)) : (level <= 7 ? (1 << 25) : (1 << 26)));
59
21.8k
  if (p->dictSize > p->reduceSize)
60
0
  {
61
0
    unsigned i;
62
0
    UInt32 reduceSize = (UInt32)p->reduceSize;
63
0
    for (i = 11; i <= 30; i++)
64
0
    {
65
0
      if (reduceSize <= ((UInt32)2 << i)) { p->dictSize = ((UInt32)2 << i); break; }
66
0
      if (reduceSize <= ((UInt32)3 << i)) { p->dictSize = ((UInt32)3 << i); break; }
67
0
    }
68
0
  }
69
70
21.8k
  if (p->lc < 0) p->lc = 3;
71
21.8k
  if (p->lp < 0) p->lp = 0;
72
21.8k
  if (p->pb < 0) p->pb = 2;
73
74
21.8k
  if (p->algo < 0) p->algo = (level < 5 ? 0 : 1);
75
21.8k
  if (p->fb < 0) p->fb = (level < 7 ? 32 : 64);
76
21.8k
  if (p->btMode < 0) p->btMode = (p->algo == 0 ? 0 : 1);
77
21.8k
  if (p->numHashBytes < 0) p->numHashBytes = 4;
78
21.8k
  if (p->mc == 0) p->mc = (16 + (p->fb >> 1)) >> (p->btMode ? 0 : 1);
79
  
80
21.8k
  if (p->numThreads < 0)
81
14.5k
    p->numThreads =
82
      #ifndef _7ZIP_ST
83
      ((p->btMode && p->algo) ? 2 : 1);
84
      #else
85
14.5k
      1;
86
21.8k
      #endif
87
21.8k
}
88
89
UInt32 LzmaEncProps_GetDictSize(const CLzmaEncProps *props2)
90
0
{
91
0
  CLzmaEncProps props = *props2;
92
0
  LzmaEncProps_Normalize(&props);
93
0
  return props.dictSize;
94
0
}
95
96
#if (_MSC_VER >= 1400)
97
/* BSR code is fast for some new CPUs */
98
/* #define LZMA_LOG_BSR */
99
#endif
100
101
#ifdef LZMA_LOG_BSR
102
103
#define kDicLogSizeMaxCompress 32
104
105
#define BSR2_RET(pos, res) { unsigned long zz; _BitScanReverse(&zz, (pos)); res = (zz + zz) + ((pos >> (zz - 1)) & 1); }
106
107
static unsigned GetPosSlot1(UInt32 pos)
108
{
109
  unsigned res;
110
  BSR2_RET(pos, res);
111
  return res;
112
}
113
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
114
#define GetPosSlot(pos, res) { if (pos < 2) res = pos; else BSR2_RET(pos, res); }
115
116
#else
117
118
3.59M
#define kNumLogBits (9 + sizeof(size_t) / 2)
119
/* #define kNumLogBits (11 + sizeof(size_t) / 8 * 3) */
120
121
14.5k
#define kDicLogSizeMaxCompress ((kNumLogBits - 1) * 2 + 7)
122
123
static void LzmaEnc_FastPosInit(Byte *g_FastPos)
124
7.27k
{
125
7.27k
  unsigned slot;
126
7.27k
  g_FastPos[0] = 0;
127
7.27k
  g_FastPos[1] = 1;
128
7.27k
  g_FastPos += 2;
129
  
130
181k
  for (slot = 2; slot < kNumLogBits * 2; slot++)
131
174k
  {
132
174k
    size_t k = ((size_t)1 << ((slot >> 1) - 1));
133
174k
    size_t j;
134
59.7M
    for (j = 0; j < k; j++)
135
59.6M
      g_FastPos[j] = (Byte)slot;
136
174k
    g_FastPos += k;
137
174k
  }
138
7.27k
}
139
140
/* we can use ((limit - pos) >> 31) only if (pos < ((UInt32)1 << 31)) */
141
/*
142
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
143
  (0 - (((((UInt32)1 << (kNumLogBits + 6)) - 1) - pos) >> 31))); \
144
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
145
*/
146
147
/*
148
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
149
  (0 - (((((UInt32)1 << (kNumLogBits)) - 1) - (pos >> 6)) >> 31))); \
150
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
151
*/
152
153
3.39M
#define BSR2_RET(pos, res) { unsigned zz = (pos < (1 << (kNumLogBits + 6))) ? 6 : 6 + kNumLogBits - 1; \
154
3.39M
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
155
156
/*
157
#define BSR2_RET(pos, res) { res = (pos < (1 << (kNumLogBits + 6))) ? \
158
  p->g_FastPos[pos >> 6] + 12 : \
159
  p->g_FastPos[pos >> (6 + kNumLogBits - 1)] + (6 + (kNumLogBits - 1)) * 2; }
160
*/
161
162
3.42M
#define GetPosSlot1(pos) p->g_FastPos[pos]
163
3.24M
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
164
671k
#define GetPosSlot(pos, res) { if (pos < kNumFullDistances) res = p->g_FastPos[pos & (kNumFullDistances - 1)]; else BSR2_RET(pos, res); }
165
166
#endif
167
168
169
46.3M
#define LZMA_NUM_REPS 4
170
171
typedef UInt16 CState;
172
typedef UInt16 CExtra;
173
174
typedef struct
175
{
176
  UInt32 price;
177
  CState state;
178
  CExtra extra;
179
      // 0   : normal
180
      // 1   : LIT : MATCH
181
      // > 1 : MATCH (extra-1) : LIT : REP0 (len)
182
  UInt32 len;
183
  UInt32 dist;
184
  UInt32 reps[LZMA_NUM_REPS];
185
} COptimal;
186
187
188
// 18.06
189
22.8M
#define kNumOpts (1 << 11)
190
0
#define kPackReserve (kNumOpts * 8)
191
// #define kNumOpts (1 << 12)
192
// #define kPackReserve (1 + kNumOpts * 2)
193
194
30.6M
#define kNumLenToPosStates 4
195
16.8M
#define kNumPosSlotBits 6
196
#define kDicLogSizeMin 0
197
131k
#define kDicLogSizeMax 32
198
#define kDistTableSizeMax (kDicLogSizeMax * 2)
199
200
7.12M
#define kNumAlignBits 4
201
6.95M
#define kAlignTableSize (1 << kNumAlignBits)
202
6.83M
#define kAlignMask (kAlignTableSize - 1)
203
204
682k
#define kStartPosModelIndex 4
205
32.5M
#define kEndPosModelIndex 14
206
33.1M
#define kNumFullDistances (1 << (kEndPosModelIndex >> 1))
207
208
typedef
209
#ifdef _LZMA_PROB32
210
  UInt32
211
#else
212
  UInt16
213
#endif
214
  CLzmaProb;
215
216
5.25M
#define LZMA_PB_MAX 4
217
29.1k
#define LZMA_LC_MAX 8
218
29.1k
#define LZMA_LP_MAX 4
219
220
5.22M
#define LZMA_NUM_PB_STATES_MAX (1 << LZMA_PB_MAX)
221
222
13.0M
#define kLenNumLowBits 3
223
7.95M
#define kLenNumLowSymbols (1 << kLenNumLowBits)
224
11.0M
#define kLenNumHighBits 8
225
9.04M
#define kLenNumHighSymbols (1 << kLenNumHighBits)
226
5.30M
#define kLenNumSymbolsTotal (kLenNumLowSymbols * 2 + kLenNumHighSymbols)
227
228
102M
#define LZMA_MATCH_LEN_MIN 2
229
5.30M
#define LZMA_MATCH_LEN_MAX (LZMA_MATCH_LEN_MIN + kLenNumSymbolsTotal - 1)
230
231
94.6k
#define kNumStates 12
232
233
234
typedef struct
235
{
236
  CLzmaProb low[LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1)];
237
  CLzmaProb high[kLenNumHighSymbols];
238
} CLenEnc;
239
240
241
typedef struct
242
{
243
  unsigned tableSize;
244
  UInt32 prices[LZMA_NUM_PB_STATES_MAX][kLenNumSymbolsTotal];
245
  // UInt32 prices1[LZMA_NUM_PB_STATES_MAX][kLenNumLowSymbols * 2];
246
  // UInt32 prices2[kLenNumSymbolsTotal];
247
} CLenPriceEnc;
248
249
#define GET_PRICE_LEN(p, posState, len) \
250
95.5M
    ((p)->prices[posState][(size_t)(len) - LZMA_MATCH_LEN_MIN])
251
252
/*
253
#define GET_PRICE_LEN(p, posState, len) \
254
    ((p)->prices2[(size_t)(len) - 2] + ((p)->prices1[posState][((len) - 2) & (kLenNumLowSymbols * 2 - 1)] & (((len) - 2 - kLenNumLowSymbols * 2) >> 9)))
255
*/
256
257
typedef struct
258
{
259
  UInt32 range;
260
  unsigned cache;
261
  UInt64 low;
262
  UInt64 cacheSize;
263
  Byte *buf;
264
  Byte *bufLim;
265
  Byte *bufBase;
266
  ISeqOutStream *outStream;
267
  UInt64 processed;
268
  SRes res;
269
} CRangeEnc;
270
271
272
typedef struct
273
{
274
  CLzmaProb *litProbs;
275
276
  unsigned state;
277
  UInt32 reps[LZMA_NUM_REPS];
278
279
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
280
  CLzmaProb isRep[kNumStates];
281
  CLzmaProb isRepG0[kNumStates];
282
  CLzmaProb isRepG1[kNumStates];
283
  CLzmaProb isRepG2[kNumStates];
284
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
285
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
286
287
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
288
  CLzmaProb posEncoders[kNumFullDistances];
289
  
290
  CLenEnc lenProbs;
291
  CLenEnc repLenProbs;
292
293
} CSaveState;
294
295
296
typedef UInt32 CProbPrice;
297
298
299
typedef struct
300
{
301
  void *matchFinderObj;
302
  IMatchFinder matchFinder;
303
304
  unsigned optCur;
305
  unsigned optEnd;
306
307
  unsigned longestMatchLen;
308
  unsigned numPairs;
309
  UInt32 numAvail;
310
311
  unsigned state;
312
  unsigned numFastBytes;
313
  unsigned additionalOffset;
314
  UInt32 reps[LZMA_NUM_REPS];
315
  unsigned lpMask, pbMask;
316
  CLzmaProb *litProbs;
317
  CRangeEnc rc;
318
319
  UInt32 backRes;
320
321
  unsigned lc, lp, pb;
322
  unsigned lclp;
323
324
  BoolInt fastMode;
325
  BoolInt writeEndMark;
326
  BoolInt finished;
327
  BoolInt multiThread;
328
  BoolInt needInit;
329
  // BoolInt _maxMode;
330
331
  UInt64 nowPos64;
332
  
333
  unsigned matchPriceCount;
334
  // unsigned alignPriceCount;
335
  int repLenEncCounter;
336
337
  unsigned distTableSize;
338
339
  UInt32 dictSize;
340
  SRes result;
341
342
  #ifndef _7ZIP_ST
343
  BoolInt mtMode;
344
  // begin of CMatchFinderMt is used in LZ thread
345
  CMatchFinderMt matchFinderMt;
346
  // end of CMatchFinderMt is used in BT and HASH threads
347
  #endif
348
349
  CMatchFinder matchFinderBase;
350
351
  #ifndef _7ZIP_ST
352
  Byte pad[128];
353
  #endif
354
  
355
  // LZ thread
356
  CProbPrice ProbPrices[kBitModelTotal >> kNumMoveReducingBits];
357
358
  UInt32 matches[LZMA_MATCH_LEN_MAX * 2 + 2 + 1];
359
360
  UInt32 alignPrices[kAlignTableSize];
361
  UInt32 posSlotPrices[kNumLenToPosStates][kDistTableSizeMax];
362
  UInt32 distancesPrices[kNumLenToPosStates][kNumFullDistances];
363
364
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
365
  CLzmaProb isRep[kNumStates];
366
  CLzmaProb isRepG0[kNumStates];
367
  CLzmaProb isRepG1[kNumStates];
368
  CLzmaProb isRepG2[kNumStates];
369
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
370
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
371
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
372
  CLzmaProb posEncoders[kNumFullDistances];
373
  
374
  CLenEnc lenProbs;
375
  CLenEnc repLenProbs;
376
377
  #ifndef LZMA_LOG_BSR
378
  Byte g_FastPos[1 << kNumLogBits];
379
  #endif
380
381
  CLenPriceEnc lenEnc;
382
  CLenPriceEnc repLenEnc;
383
384
  COptimal opt[kNumOpts];
385
386
  CSaveState saveState;
387
388
  #ifndef _7ZIP_ST
389
  Byte pad2[128];
390
  #endif
391
} CLzmaEnc;
392
393
394
395
0
#define COPY_ARR(dest, src, arr) memcpy(dest->arr, src->arr, sizeof(src->arr));
396
397
void LzmaEnc_SaveState(CLzmaEncHandle pp)
398
0
{
399
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
400
0
  CSaveState *dest = &p->saveState;
401
  
402
0
  dest->state = p->state;
403
  
404
0
  dest->lenProbs = p->lenProbs;
405
0
  dest->repLenProbs = p->repLenProbs;
406
407
0
  COPY_ARR(dest, p, reps);
408
409
0
  COPY_ARR(dest, p, posAlignEncoder);
410
0
  COPY_ARR(dest, p, isRep);
411
0
  COPY_ARR(dest, p, isRepG0);
412
0
  COPY_ARR(dest, p, isRepG1);
413
0
  COPY_ARR(dest, p, isRepG2);
414
0
  COPY_ARR(dest, p, isMatch);
415
0
  COPY_ARR(dest, p, isRep0Long);
416
0
  COPY_ARR(dest, p, posSlotEncoder);
417
0
  COPY_ARR(dest, p, posEncoders);
418
419
0
  memcpy(dest->litProbs, p->litProbs, ((UInt32)0x300 << p->lclp) * sizeof(CLzmaProb));
420
0
}
421
422
423
void LzmaEnc_RestoreState(CLzmaEncHandle pp)
424
0
{
425
0
  CLzmaEnc *dest = (CLzmaEnc *)pp;
426
0
  const CSaveState *p = &dest->saveState;
427
428
0
  dest->state = p->state;
429
430
0
  dest->lenProbs = p->lenProbs;
431
0
  dest->repLenProbs = p->repLenProbs;
432
  
433
0
  COPY_ARR(dest, p, reps);
434
  
435
0
  COPY_ARR(dest, p, posAlignEncoder);
436
0
  COPY_ARR(dest, p, isRep);
437
0
  COPY_ARR(dest, p, isRepG0);
438
0
  COPY_ARR(dest, p, isRepG1);
439
0
  COPY_ARR(dest, p, isRepG2);
440
0
  COPY_ARR(dest, p, isMatch);
441
0
  COPY_ARR(dest, p, isRep0Long);
442
0
  COPY_ARR(dest, p, posSlotEncoder);
443
0
  COPY_ARR(dest, p, posEncoders);
444
445
0
  memcpy(dest->litProbs, p->litProbs, ((UInt32)0x300 << dest->lclp) * sizeof(CLzmaProb));
446
0
}
447
448
449
450
SRes LzmaEnc_SetProps(CLzmaEncHandle pp, const CLzmaEncProps *props2)
451
14.5k
{
452
14.5k
  CLzmaEnc *p = (CLzmaEnc *)pp;
453
14.5k
  CLzmaEncProps props = *props2;
454
14.5k
  LzmaEncProps_Normalize(&props);
455
456
14.5k
  if (props.lc > LZMA_LC_MAX
457
14.5k
      || props.lp > LZMA_LP_MAX
458
14.5k
      || props.pb > LZMA_PB_MAX
459
14.5k
      || props.dictSize > ((UInt64)1 << kDicLogSizeMaxCompress)
460
14.5k
      || props.dictSize > kLzmaMaxHistorySize)
461
0
    return SZ_ERROR_PARAM;
462
463
14.5k
  p->dictSize = props.dictSize;
464
14.5k
  {
465
14.5k
    unsigned fb = props.fb;
466
14.5k
    if (fb < 5)
467
0
      fb = 5;
468
14.5k
    if (fb > LZMA_MATCH_LEN_MAX)
469
0
      fb = LZMA_MATCH_LEN_MAX;
470
14.5k
    p->numFastBytes = fb;
471
14.5k
  }
472
14.5k
  p->lc = props.lc;
473
14.5k
  p->lp = props.lp;
474
14.5k
  p->pb = props.pb;
475
14.5k
  p->fastMode = (props.algo == 0);
476
  // p->_maxMode = True;
477
14.5k
  p->matchFinderBase.btMode = (Byte)(props.btMode ? 1 : 0);
478
14.5k
  {
479
14.5k
    unsigned numHashBytes = 4;
480
14.5k
    if (props.btMode)
481
13.1k
    {
482
13.1k
      if (props.numHashBytes < 2)
483
0
        numHashBytes = 2;
484
13.1k
      else if (props.numHashBytes < 4)
485
4.49k
        numHashBytes = props.numHashBytes;
486
13.1k
    }
487
14.5k
    p->matchFinderBase.numHashBytes = numHashBytes;
488
14.5k
  }
489
490
14.5k
  p->matchFinderBase.cutValue = props.mc;
491
492
14.5k
  p->writeEndMark = props.writeEndMark;
493
494
  #ifndef _7ZIP_ST
495
  /*
496
  if (newMultiThread != _multiThread)
497
  {
498
    ReleaseMatchFinder();
499
    _multiThread = newMultiThread;
500
  }
501
  */
502
  p->multiThread = (props.numThreads > 1);
503
  #endif
504
505
14.5k
  return SZ_OK;
506
14.5k
}
507
508
509
void LzmaEnc_SetDataSize(CLzmaEncHandle pp, UInt64 expectedDataSiize)
510
7.27k
{
511
7.27k
  CLzmaEnc *p = (CLzmaEnc *)pp;
512
7.27k
  p->matchFinderBase.expectedDataSize = expectedDataSiize;
513
7.27k
}
514
515
516
7.27k
#define kState_Start 0
517
1.02M
#define kState_LitAfterMatch 4
518
2.13M
#define kState_LitAfterRep   5
519
0
#define kState_MatchAfterLit 7
520
105k
#define kState_RepAfterLit   8
521
522
static const Byte kLiteralNextStates[kNumStates] = {0, 0, 0, 0, 1, 2, 3, 4,  5,  6,   4, 5};
523
static const Byte kMatchNextStates[kNumStates]   = {7, 7, 7, 7, 7, 7, 7, 10, 10, 10, 10, 10};
524
static const Byte kRepNextStates[kNumStates]     = {8, 8, 8, 8, 8, 8, 8, 11, 11, 11, 11, 11};
525
static const Byte kShortRepNextStates[kNumStates]= {9, 9, 9, 9, 9, 9, 9, 11, 11, 11, 11, 11};
526
527
7.63M
#define IsLitState(s) ((s) < 7)
528
16.1M
#define GetLenToPosState2(len) (((len) < kNumLenToPosStates - 1) ? (len) : kNumLenToPosStates - 1)
529
1.09M
#define GetLenToPosState(len) (((len) < kNumLenToPosStates + 1) ? (len) - 2 : kNumLenToPosStates - 1)
530
531
27.1M
#define kInfinityPrice (1 << 30)
532
533
static void RangeEnc_Construct(CRangeEnc *p)
534
7.27k
{
535
7.27k
  p->outStream = NULL;
536
7.27k
  p->bufBase = NULL;
537
7.27k
}
538
539
#define RangeEnc_GetProcessed(p)       ((p)->processed + ((p)->buf - (p)->bufBase) + (p)->cacheSize)
540
0
#define RangeEnc_GetProcessed_sizet(p) ((size_t)(p)->processed + ((p)->buf - (p)->bufBase) + (size_t)(p)->cacheSize)
541
542
7.27k
#define RC_BUF_SIZE (1 << 16)
543
544
static int RangeEnc_Alloc(CRangeEnc *p, ISzAllocPtr alloc)
545
7.27k
{
546
7.27k
  if (!p->bufBase)
547
7.27k
  {
548
7.27k
    p->bufBase = (Byte *)ISzAlloc_Alloc(alloc, RC_BUF_SIZE);
549
7.27k
    if (!p->bufBase)
550
0
      return 0;
551
7.27k
    p->bufLim = p->bufBase + RC_BUF_SIZE;
552
7.27k
  }
553
7.27k
  return 1;
554
7.27k
}
555
556
static void RangeEnc_Free(CRangeEnc *p, ISzAllocPtr alloc)
557
7.27k
{
558
7.27k
  ISzAlloc_Free(alloc, p->bufBase);
559
7.27k
  p->bufBase = 0;
560
7.27k
}
561
562
static void RangeEnc_Init(CRangeEnc *p)
563
7.27k
{
564
  /* Stream.Init(); */
565
7.27k
  p->range = 0xFFFFFFFF;
566
7.27k
  p->cache = 0;
567
7.27k
  p->low = 0;
568
7.27k
  p->cacheSize = 0;
569
570
7.27k
  p->buf = p->bufBase;
571
572
7.27k
  p->processed = 0;
573
7.27k
  p->res = SZ_OK;
574
7.27k
}
575
576
MY_NO_INLINE static void RangeEnc_FlushStream(CRangeEnc *p)
577
7.28k
{
578
7.28k
  size_t num;
579
7.28k
  if (p->res != SZ_OK)
580
0
    return;
581
7.28k
  num = p->buf - p->bufBase;
582
7.28k
  if (num != ISeqOutStream_Write(p->outStream, p->bufBase, num))
583
0
    p->res = SZ_ERROR_WRITE;
584
7.28k
  p->processed += num;
585
7.28k
  p->buf = p->bufBase;
586
7.28k
}
587
588
MY_NO_INLINE static void MY_FAST_CALL RangeEnc_ShiftLow(CRangeEnc *p)
589
3.52M
{
590
3.52M
  UInt32 low = (UInt32)p->low;
591
3.52M
  unsigned high = (unsigned)(p->low >> 32);
592
3.52M
  p->low = (UInt32)(low << 8);
593
3.52M
  if (low < (UInt32)0xFF000000 || high != 0)
594
3.49M
  {
595
3.49M
    {
596
3.49M
      Byte *buf = p->buf;
597
3.49M
      *buf++ = (Byte)(p->cache + high);
598
3.49M
      p->cache = (unsigned)(low >> 24);
599
3.49M
      p->buf = buf;
600
3.49M
      if (buf == p->bufLim)
601
2
        RangeEnc_FlushStream(p);
602
3.49M
      if (p->cacheSize == 0)
603
3.47M
        return;
604
3.49M
    }
605
19.3k
    high += 0xFF;
606
19.3k
    for (;;)
607
23.8k
    {
608
23.8k
      Byte *buf = p->buf;
609
23.8k
      *buf++ = (Byte)(high);
610
23.8k
      p->buf = buf;
611
23.8k
      if (buf == p->bufLim)
612
1
        RangeEnc_FlushStream(p);
613
23.8k
      if (--p->cacheSize == 0)
614
19.3k
        return;
615
23.8k
    }
616
19.3k
  }
617
23.8k
  p->cacheSize++;
618
23.8k
}
619
620
static void RangeEnc_FlushData(CRangeEnc *p)
621
7.27k
{
622
7.27k
  int i;
623
43.6k
  for (i = 0; i < 5; i++)
624
36.3k
    RangeEnc_ShiftLow(p);
625
7.27k
}
626
627
37.9M
#define RC_NORM(p) if (range < kTopValue) { range <<= 8; RangeEnc_ShiftLow(p); }
628
629
#define RC_BIT_PRE(p, prob) \
630
37.0M
  ttt = *(prob); \
631
37.0M
  newBound = (range >> kNumBitModelTotalBits) * ttt;
632
633
// #define _LZMA_ENC_USE_BRANCH
634
635
#ifdef _LZMA_ENC_USE_BRANCH
636
637
#define RC_BIT(p, prob, bit) { \
638
  RC_BIT_PRE(p, prob) \
639
  if (bit == 0) { range = newBound; ttt += (kBitModelTotal - ttt) >> kNumMoveBits; } \
640
  else { (p)->low += newBound; range -= newBound; ttt -= ttt >> kNumMoveBits; } \
641
  *(prob) = (CLzmaProb)ttt; \
642
  RC_NORM(p) \
643
  }
644
645
#else
646
647
28.6M
#define RC_BIT(p, prob, bit) { \
648
28.6M
  UInt32 mask; \
649
28.6M
  RC_BIT_PRE(p, prob) \
650
28.6M
  mask = 0 - (UInt32)bit; \
651
28.6M
  range &= mask; \
652
28.6M
  mask &= newBound; \
653
28.6M
  range -= mask; \
654
28.6M
  (p)->low += mask; \
655
28.6M
  mask = (UInt32)bit - 1; \
656
28.6M
  range += newBound & mask; \
657
28.6M
  mask &= (kBitModelTotal - ((1 << kNumMoveBits) - 1)); \
658
28.6M
  mask += ((1 << kNumMoveBits) - 1); \
659
28.6M
  ttt += (Int32)(mask - ttt) >> kNumMoveBits; \
660
28.6M
  *(prob) = (CLzmaProb)ttt; \
661
28.6M
  RC_NORM(p) \
662
28.6M
  }
663
664
#endif
665
666
667
668
669
#define RC_BIT_0_BASE(p, prob) \
670
4.96M
  range = newBound; *(prob) = (CLzmaProb)(ttt + ((kBitModelTotal - ttt) >> kNumMoveBits));
671
672
#define RC_BIT_1_BASE(p, prob) \
673
3.51M
  range -= newBound; (p)->low += newBound; *(prob) = (CLzmaProb)(ttt - (ttt >> kNumMoveBits)); \
674
675
#define RC_BIT_0(p, prob) \
676
4.49M
  RC_BIT_0_BASE(p, prob) \
677
4.49M
  RC_NORM(p)
678
679
#define RC_BIT_1(p, prob) \
680
3.23M
  RC_BIT_1_BASE(p, prob) \
681
3.23M
  RC_NORM(p)
682
683
static void RangeEnc_EncodeBit_0(CRangeEnc *p, CLzmaProb *prob)
684
7.27k
{
685
7.27k
  UInt32 range, ttt, newBound;
686
7.27k
  range = p->range;
687
7.27k
  RC_BIT_PRE(p, prob)
688
7.27k
  RC_BIT_0(p, prob)
689
7.27k
  p->range = range;
690
7.27k
}
691
692
static void LitEnc_Encode(CRangeEnc *p, CLzmaProb *probs, UInt32 sym)
693
1.87M
{
694
1.87M
  UInt32 range = p->range;
695
1.87M
  sym |= 0x100;
696
1.87M
  do
697
14.9M
  {
698
14.9M
    UInt32 ttt, newBound;
699
    // RangeEnc_EncodeBit(p, probs + (sym >> 8), (sym >> 7) & 1);
700
14.9M
    CLzmaProb *prob = probs + (sym >> 8);
701
14.9M
    UInt32 bit = (sym >> 7) & 1;
702
14.9M
    sym <<= 1;
703
14.9M
    RC_BIT(p, prob, bit);
704
14.9M
  }
705
14.9M
  while (sym < 0x10000);
706
1.87M
  p->range = range;
707
1.87M
}
708
709
static void LitEnc_EncodeMatched(CRangeEnc *p, CLzmaProb *probs, UInt32 sym, UInt32 matchByte)
710
579k
{
711
579k
  UInt32 range = p->range;
712
579k
  UInt32 offs = 0x100;
713
579k
  sym |= 0x100;
714
579k
  do
715
4.63M
  {
716
4.63M
    UInt32 ttt, newBound;
717
4.63M
    CLzmaProb *prob;
718
4.63M
    UInt32 bit;
719
4.63M
    matchByte <<= 1;
720
    // RangeEnc_EncodeBit(p, probs + (offs + (matchByte & offs) + (sym >> 8)), (sym >> 7) & 1);
721
4.63M
    prob = probs + (offs + (matchByte & offs) + (sym >> 8));
722
4.63M
    bit = (sym >> 7) & 1;
723
4.63M
    sym <<= 1;
724
4.63M
    offs &= ~(matchByte ^ sym);
725
4.63M
    RC_BIT(p, prob, bit);
726
4.63M
  }
727
4.63M
  while (sym < 0x10000);
728
579k
  p->range = range;
729
579k
}
730
731
732
733
static void LzmaEnc_InitPriceTables(CProbPrice *ProbPrices)
734
7.27k
{
735
7.27k
  UInt32 i;
736
938k
  for (i = 0; i < (kBitModelTotal >> kNumMoveReducingBits); i++)
737
931k
  {
738
931k
    const unsigned kCyclesBits = kNumBitPriceShiftBits;
739
931k
    UInt32 w = (i << kNumMoveReducingBits) + (1 << (kNumMoveReducingBits - 1));
740
931k
    unsigned bitCount = 0;
741
931k
    unsigned j;
742
4.65M
    for (j = 0; j < kCyclesBits; j++)
743
3.72M
    {
744
3.72M
      w = w * w;
745
3.72M
      bitCount <<= 1;
746
50.1M
      while (w >= ((UInt32)1 << 16))
747
46.4M
      {
748
46.4M
        w >>= 1;
749
46.4M
        bitCount++;
750
46.4M
      }
751
3.72M
    }
752
931k
    ProbPrices[i] = (CProbPrice)((kNumBitModelTotalBits << kCyclesBits) - 15 - bitCount);
753
    // printf("\n%3d: %5d", i, ProbPrices[i]);
754
931k
  }
755
7.27k
}
756
757
758
#define GET_PRICE(prob, bit) \
759
1.86M
  p->ProbPrices[((prob) ^ (unsigned)(((-(int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits];
760
761
#define GET_PRICEa(prob, bit) \
762
54.2M
     ProbPrices[((prob) ^ (unsigned)((-((int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits];
763
764
16.5M
#define GET_PRICE_0(prob) p->ProbPrices[(prob) >> kNumMoveReducingBits]
765
24.6M
#define GET_PRICE_1(prob) p->ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
766
767
4.51M
#define GET_PRICEa_0(prob) ProbPrices[(prob) >> kNumMoveReducingBits]
768
4.50M
#define GET_PRICEa_1(prob) ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
769
770
771
static UInt32 LitEnc_GetPrice(const CLzmaProb *probs, UInt32 sym, const CProbPrice *ProbPrices)
772
472k
{
773
472k
  UInt32 price = 0;
774
472k
  sym |= 0x100;
775
472k
  do
776
3.77M
  {
777
3.77M
    unsigned bit = sym & 1;
778
3.77M
    sym >>= 1;
779
3.77M
    price += GET_PRICEa(probs[sym], bit);
780
3.77M
  }
781
3.77M
  while (sym >= 2);
782
472k
  return price;
783
472k
}
784
785
786
static UInt32 LitEnc_Matched_GetPrice(const CLzmaProb *probs, UInt32 sym, UInt32 matchByte, const CProbPrice *ProbPrices)
787
4.05M
{
788
4.05M
  UInt32 price = 0;
789
4.05M
  UInt32 offs = 0x100;
790
4.05M
  sym |= 0x100;
791
4.05M
  do
792
32.4M
  {
793
32.4M
    matchByte <<= 1;
794
32.4M
    price += GET_PRICEa(probs[offs + (matchByte & offs) + (sym >> 8)], (sym >> 7) & 1);
795
32.4M
    sym <<= 1;
796
32.4M
    offs &= ~(matchByte ^ sym);
797
32.4M
  }
798
32.4M
  while (sym < 0x10000);
799
4.05M
  return price;
800
4.05M
}
801
802
803
static void RcTree_ReverseEncode(CRangeEnc *rc, CLzmaProb *probs, unsigned numBits, unsigned sym)
804
349k
{
805
349k
  UInt32 range = rc->range;
806
349k
  unsigned m = 1;
807
349k
  do
808
761k
  {
809
761k
    UInt32 ttt, newBound;
810
761k
    unsigned bit = sym & 1;
811
    // RangeEnc_EncodeBit(rc, probs + m, bit);
812
761k
    sym >>= 1;
813
761k
    RC_BIT(rc, probs + m, bit);
814
761k
    m = (m << 1) | bit;
815
761k
  }
816
761k
  while (--numBits);
817
349k
  rc->range = range;
818
349k
}
819
820
821
822
static void LenEnc_Init(CLenEnc *p)
823
14.5k
{
824
14.5k
  unsigned i;
825
3.74M
  for (i = 0; i < (LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1)); i++)
826
3.72M
    p->low[i] = kProbInitValue;
827
3.74M
  for (i = 0; i < kLenNumHighSymbols; i++)
828
3.72M
    p->high[i] = kProbInitValue;
829
14.5k
}
830
831
static void LenEnc_Encode(CLenEnc *p, CRangeEnc *rc, unsigned sym, unsigned posState)
832
1.30M
{
833
1.30M
  UInt32 range, ttt, newBound;
834
1.30M
  CLzmaProb *probs = p->low;
835
1.30M
  range = rc->range;
836
1.30M
  RC_BIT_PRE(rc, probs);
837
1.30M
  if (sym >= kLenNumLowSymbols)
838
208k
  {
839
208k
    RC_BIT_1(rc, probs);
840
208k
    probs += kLenNumLowSymbols;
841
208k
    RC_BIT_PRE(rc, probs);
842
208k
    if (sym >= kLenNumLowSymbols * 2)
843
115k
    {
844
115k
      RC_BIT_1(rc, probs);
845
115k
      rc->range = range;
846
      // RcTree_Encode(rc, p->high, kLenNumHighBits, sym - kLenNumLowSymbols * 2);
847
115k
      LitEnc_Encode(rc, p->high, sym - kLenNumLowSymbols * 2);
848
115k
      return;
849
115k
    }
850
93.2k
    sym -= kLenNumLowSymbols;
851
93.2k
  }
852
853
  // RcTree_Encode(rc, probs + (posState << kLenNumLowBits), kLenNumLowBits, sym);
854
1.19M
  {
855
1.19M
    unsigned m;
856
1.19M
    unsigned bit;
857
1.19M
    RC_BIT_0(rc, probs);
858
1.19M
    probs += (posState << (1 + kLenNumLowBits));
859
1.19M
    bit = (sym >> 2)    ; RC_BIT(rc, probs + 1, bit); m = (1 << 1) + bit;
860
1.19M
    bit = (sym >> 1) & 1; RC_BIT(rc, probs + m, bit); m = (m << 1) + bit;
861
1.19M
    bit =  sym       & 1; RC_BIT(rc, probs + m, bit);
862
1.19M
    rc->range = range;
863
1.19M
  }
864
1.19M
}
865
866
static void SetPrices_3(const CLzmaProb *probs, UInt32 startPrice, UInt32 *prices, const CProbPrice *ProbPrices)
867
404k
{
868
404k
  unsigned i;
869
2.02M
  for (i = 0; i < 8; i += 2)
870
1.61M
  {
871
1.61M
    UInt32 price = startPrice;
872
1.61M
    UInt32 prob;
873
1.61M
    price += GET_PRICEa(probs[1           ], (i >> 2));
874
1.61M
    price += GET_PRICEa(probs[2 + (i >> 2)], (i >> 1) & 1);
875
1.61M
    prob = probs[4 + (i >> 1)];
876
1.61M
    prices[i    ] = price + GET_PRICEa_0(prob);
877
1.61M
    prices[i + 1] = price + GET_PRICEa_1(prob);
878
1.61M
  }
879
404k
}
880
881
882
MY_NO_INLINE static void MY_FAST_CALL LenPriceEnc_UpdateTables(
883
    CLenPriceEnc *p,
884
    unsigned numPosStates,
885
    const CLenEnc *enc,
886
    const CProbPrice *ProbPrices)
887
24.1k
{
888
24.1k
  UInt32 b;
889
 
890
24.1k
  {
891
24.1k
    unsigned prob = enc->low[0];
892
24.1k
    UInt32 a, c;
893
24.1k
    unsigned posState;
894
24.1k
    b = GET_PRICEa_1(prob);
895
24.1k
    a = GET_PRICEa_0(prob);
896
24.1k
    c = b + GET_PRICEa_0(enc->low[kLenNumLowSymbols]);
897
226k
    for (posState = 0; posState < numPosStates; posState++)
898
202k
    {
899
202k
      UInt32 *prices = p->prices[posState];
900
202k
      const CLzmaProb *probs = enc->low + (posState << (1 + kLenNumLowBits));
901
202k
      SetPrices_3(probs, a, prices, ProbPrices);
902
202k
      SetPrices_3(probs + kLenNumLowSymbols, c, prices + kLenNumLowSymbols, ProbPrices);
903
202k
    }
904
24.1k
  }
905
906
  /*
907
  {
908
    unsigned i;
909
    UInt32 b;
910
    a = GET_PRICEa_0(enc->low[0]);
911
    for (i = 0; i < kLenNumLowSymbols; i++)
912
      p->prices2[i] = a;
913
    a = GET_PRICEa_1(enc->low[0]);
914
    b = a + GET_PRICEa_0(enc->low[kLenNumLowSymbols]);
915
    for (i = kLenNumLowSymbols; i < kLenNumLowSymbols * 2; i++)
916
      p->prices2[i] = b;
917
    a += GET_PRICEa_1(enc->low[kLenNumLowSymbols]);
918
  }
919
  */
920
 
921
  // p->counter = numSymbols;
922
  // p->counter = 64;
923
924
24.1k
  {
925
24.1k
    unsigned i = p->tableSize;
926
    
927
24.1k
    if (i > kLenNumLowSymbols * 2)
928
13.1k
    {
929
13.1k
      const CLzmaProb *probs = enc->high;
930
13.1k
      UInt32 *prices = p->prices[0] + kLenNumLowSymbols * 2;
931
13.1k
      i -= kLenNumLowSymbols * 2 - 1;
932
13.1k
      i >>= 1;
933
13.1k
      b += GET_PRICEa_1(enc->low[kLenNumLowSymbols]);
934
13.1k
      do
935
1.01M
      {
936
        /*
937
        p->prices2[i] = a +
938
        // RcTree_GetPrice(enc->high, kLenNumHighBits, i - kLenNumLowSymbols * 2, ProbPrices);
939
        LitEnc_GetPrice(probs, i - kLenNumLowSymbols * 2, ProbPrices);
940
        */
941
        // UInt32 price = a + RcTree_GetPrice(probs, kLenNumHighBits - 1, sym, ProbPrices);
942
1.01M
        unsigned sym = --i + (1 << (kLenNumHighBits - 1));
943
1.01M
        UInt32 price = b;
944
1.01M
        do
945
7.10M
        {
946
7.10M
          unsigned bit = sym & 1;
947
7.10M
          sym >>= 1;
948
7.10M
          price += GET_PRICEa(probs[sym], bit);
949
7.10M
        }
950
7.10M
        while (sym >= 2);
951
952
1.01M
        {
953
1.01M
          unsigned prob = probs[(size_t)i + (1 << (kLenNumHighBits - 1))];
954
1.01M
          prices[(size_t)i * 2    ] = price + GET_PRICEa_0(prob);
955
1.01M
          prices[(size_t)i * 2 + 1] = price + GET_PRICEa_1(prob);
956
1.01M
        }
957
1.01M
      }
958
1.01M
      while (i);
959
960
13.1k
      {
961
13.1k
        unsigned posState;
962
13.1k
        size_t num = (p->tableSize - kLenNumLowSymbols * 2) * sizeof(p->prices[0][0]);
963
137k
        for (posState = 1; posState < numPosStates; posState++)
964
123k
          memcpy(p->prices[posState] + kLenNumLowSymbols * 2, p->prices[0] + kLenNumLowSymbols * 2, num);
965
13.1k
      }
966
13.1k
    }
967
24.1k
  }
968
24.1k
}
969
970
/*
971
  #ifdef SHOW_STAT
972
  g_STAT_OFFSET += num;
973
  printf("\n MovePos %u", num);
974
  #endif
975
*/
976
  
977
461k
#define MOVE_POS(p, num) { \
978
461k
    p->additionalOffset += (num); \
979
461k
    p->matchFinder.Skip(p->matchFinderObj, (UInt32)(num)); }
980
981
982
static unsigned ReadMatchDistances(CLzmaEnc *p, unsigned *numPairsRes)
983
6.60M
{
984
6.60M
  unsigned numPairs;
985
  
986
6.60M
  p->additionalOffset++;
987
6.60M
  p->numAvail = p->matchFinder.GetNumAvailableBytes(p->matchFinderObj);
988
6.60M
  numPairs = p->matchFinder.GetMatches(p->matchFinderObj, p->matches);
989
6.60M
  *numPairsRes = numPairs;
990
  
991
  #ifdef SHOW_STAT
992
  printf("\n i = %u numPairs = %u    ", g_STAT_OFFSET, numPairs / 2);
993
  g_STAT_OFFSET++;
994
  {
995
    unsigned i;
996
    for (i = 0; i < numPairs; i += 2)
997
      printf("%2u %6u   | ", p->matches[i], p->matches[i + 1]);
998
  }
999
  #endif
1000
  
1001
6.60M
  if (numPairs == 0)
1002
1.79M
    return 0;
1003
4.80M
  {
1004
4.80M
    unsigned len = p->matches[(size_t)numPairs - 2];
1005
4.80M
    if (len != p->numFastBytes)
1006
4.58M
      return len;
1007
218k
    {
1008
218k
      UInt32 numAvail = p->numAvail;
1009
218k
      if (numAvail > LZMA_MATCH_LEN_MAX)
1010
207k
        numAvail = LZMA_MATCH_LEN_MAX;
1011
218k
      {
1012
218k
        const Byte *p1 = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1013
218k
        const Byte *p2 = p1 + len;
1014
218k
        ptrdiff_t dif = (ptrdiff_t)-1 - p->matches[(size_t)numPairs - 1];
1015
218k
        const Byte *lim = p1 + numAvail;
1016
4.09M
        for (; p2 != lim && *p2 == p2[dif]; p2++)
1017
3.87M
        {}
1018
218k
        return (unsigned)(p2 - p1);
1019
4.80M
      }
1020
4.80M
    }
1021
4.80M
  }
1022
4.80M
}
1023
1024
6.91M
#define MARK_LIT ((UInt32)(Int32)-1)
1025
1026
889k
#define MakeAs_Lit(p)       { (p)->dist = MARK_LIT; (p)->extra = 0; }
1027
228k
#define MakeAs_ShortRep(p)  { (p)->dist = 0; (p)->extra = 0; }
1028
955k
#define IsShortRep(p)       ((p)->dist == 0)
1029
1030
1031
#define GetPrice_ShortRep(p, state, posState) \
1032
279k
  ( GET_PRICE_0(p->isRepG0[state]) + GET_PRICE_0(p->isRep0Long[state][posState]))
1033
1034
3.28M
#define GetPrice_Rep_0(p, state, posState) ( \
1035
3.28M
    GET_PRICE_1(p->isMatch[state][posState]) \
1036
3.28M
  + GET_PRICE_1(p->isRep0Long[state][posState])) \
1037
3.28M
  + GET_PRICE_1(p->isRep[state]) \
1038
3.28M
  + GET_PRICE_0(p->isRepG0[state])
1039
  
1040
MY_FORCE_INLINE
1041
static UInt32 GetPrice_PureRep(const CLzmaEnc *p, unsigned repIndex, size_t state, size_t posState)
1042
4.69M
{
1043
4.69M
  UInt32 price;
1044
4.69M
  UInt32 prob = p->isRepG0[state];
1045
4.69M
  if (repIndex == 0)
1046
1.75M
  {
1047
1.75M
    price = GET_PRICE_0(prob);
1048
1.75M
    price += GET_PRICE_1(p->isRep0Long[state][posState]);
1049
1.75M
  }
1050
2.94M
  else
1051
2.94M
  {
1052
2.94M
    price = GET_PRICE_1(prob);
1053
2.94M
    prob = p->isRepG1[state];
1054
2.94M
    if (repIndex == 1)
1055
1.08M
      price += GET_PRICE_0(prob);
1056
1.86M
    else
1057
1.86M
    {
1058
1.86M
      price += GET_PRICE_1(prob);
1059
1.86M
      price += GET_PRICE(p->isRepG2[state], repIndex - 2);
1060
1.86M
    }
1061
2.94M
  }
1062
4.69M
  return price;
1063
4.69M
}
1064
1065
1066
static unsigned Backward(CLzmaEnc *p, unsigned cur)
1067
191k
{
1068
191k
  unsigned wr = cur + 1;
1069
191k
  p->optEnd = wr;
1070
1071
191k
  for (;;)
1072
1.26M
  {
1073
1.26M
    UInt32 dist = p->opt[cur].dist;
1074
1.26M
    unsigned len = (unsigned)p->opt[cur].len;
1075
1.26M
    unsigned extra = (unsigned)p->opt[cur].extra;
1076
1.26M
    cur -= len;
1077
1078
1.26M
    if (extra)
1079
72.3k
    {
1080
72.3k
      wr--;
1081
72.3k
      p->opt[wr].len = (UInt32)len;
1082
72.3k
      cur -= extra;
1083
72.3k
      len = extra;
1084
72.3k
      if (extra == 1)
1085
873
      {
1086
873
        p->opt[wr].dist = dist;
1087
873
        dist = MARK_LIT;
1088
873
      }
1089
71.4k
      else
1090
71.4k
      {
1091
71.4k
        p->opt[wr].dist = 0;
1092
71.4k
        len--;
1093
71.4k
        wr--;
1094
71.4k
        p->opt[wr].dist = MARK_LIT;
1095
71.4k
        p->opt[wr].len = 1;
1096
71.4k
      }
1097
72.3k
    }
1098
1099
1.26M
    if (cur == 0)
1100
191k
    {
1101
191k
      p->backRes = dist;
1102
191k
      p->optCur = wr;
1103
191k
      return len;
1104
191k
    }
1105
    
1106
1.07M
    wr--;
1107
1.07M
    p->opt[wr].dist = dist;
1108
1.07M
    p->opt[wr].len = (UInt32)len;
1109
1.07M
  }
1110
191k
}
1111
1112
1113
1114
#define LIT_PROBS(pos, prevByte) \
1115
6.85M
  (p->litProbs + (UInt32)3 * (((((pos) << 8) + (prevByte)) & p->lpMask) << p->lc))
1116
1117
1118
static unsigned GetOptimum(CLzmaEnc *p, UInt32 position)
1119
944k
{
1120
944k
  unsigned last, cur;
1121
944k
  UInt32 reps[LZMA_NUM_REPS];
1122
944k
  unsigned repLens[LZMA_NUM_REPS];
1123
944k
  UInt32 *matches;
1124
1125
944k
  {
1126
944k
    UInt32 numAvail;
1127
944k
    unsigned numPairs, mainLen, repMaxIndex, i, posState;
1128
944k
    UInt32 matchPrice, repMatchPrice;
1129
944k
    const Byte *data;
1130
944k
    Byte curByte, matchByte;
1131
    
1132
944k
    p->optCur = p->optEnd = 0;
1133
    
1134
944k
    if (p->additionalOffset == 0)
1135
913k
      mainLen = ReadMatchDistances(p, &numPairs);
1136
30.6k
    else
1137
30.6k
    {
1138
30.6k
      mainLen = p->longestMatchLen;
1139
30.6k
      numPairs = p->numPairs;
1140
30.6k
    }
1141
    
1142
944k
    numAvail = p->numAvail;
1143
944k
    if (numAvail < 2)
1144
2.39k
    {
1145
2.39k
      p->backRes = MARK_LIT;
1146
2.39k
      return 1;
1147
2.39k
    }
1148
942k
    if (numAvail > LZMA_MATCH_LEN_MAX)
1149
837k
      numAvail = LZMA_MATCH_LEN_MAX;
1150
    
1151
942k
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1152
942k
    repMaxIndex = 0;
1153
    
1154
4.71M
    for (i = 0; i < LZMA_NUM_REPS; i++)
1155
3.76M
    {
1156
3.76M
      unsigned len;
1157
3.76M
      const Byte *data2;
1158
3.76M
      reps[i] = p->reps[i];
1159
3.76M
      data2 = data - reps[i];
1160
3.76M
      if (data[0] != data2[0] || data[1] != data2[1])
1161
3.61M
      {
1162
3.61M
        repLens[i] = 0;
1163
3.61M
        continue;
1164
3.61M
      }
1165
3.35M
      for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1166
3.20M
      {}
1167
149k
      repLens[i] = len;
1168
149k
      if (len > repLens[repMaxIndex])
1169
80.1k
        repMaxIndex = i;
1170
149k
    }
1171
    
1172
942k
    if (repLens[repMaxIndex] >= p->numFastBytes)
1173
43.4k
    {
1174
43.4k
      unsigned len;
1175
43.4k
      p->backRes = (UInt32)repMaxIndex;
1176
43.4k
      len = repLens[repMaxIndex];
1177
43.4k
      MOVE_POS(p, len - 1)
1178
43.4k
      return len;
1179
43.4k
    }
1180
    
1181
898k
    matches = p->matches;
1182
    
1183
898k
    if (mainLen >= p->numFastBytes)
1184
61.0k
    {
1185
61.0k
      p->backRes = matches[(size_t)numPairs - 1] + LZMA_NUM_REPS;
1186
61.0k
      MOVE_POS(p, mainLen - 1)
1187
61.0k
      return mainLen;
1188
61.0k
    }
1189
    
1190
837k
    curByte = *data;
1191
837k
    matchByte = *(data - reps[0]);
1192
1193
837k
    last = repLens[repMaxIndex];
1194
837k
    if (last <= mainLen)
1195
834k
      last = mainLen;
1196
    
1197
837k
    if (last < 2 && curByte != matchByte)
1198
624k
    {
1199
624k
      p->backRes = MARK_LIT;
1200
624k
      return 1;
1201
624k
    }
1202
    
1203
213k
    p->opt[0].state = (CState)p->state;
1204
    
1205
213k
    posState = (position & p->pbMask);
1206
    
1207
213k
    {
1208
213k
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1209
213k
      p->opt[1].price = GET_PRICE_0(p->isMatch[p->state][posState]) +
1210
213k
        (!IsLitState(p->state) ?
1211
60.4k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1212
213k
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1213
213k
    }
1214
1215
213k
    MakeAs_Lit(&p->opt[1]);
1216
    
1217
213k
    matchPrice = GET_PRICE_1(p->isMatch[p->state][posState]);
1218
213k
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[p->state]);
1219
    
1220
    // 18.06
1221
213k
    if (matchByte == curByte && repLens[0] == 0)
1222
36.8k
    {
1223
36.8k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, p->state, posState);
1224
36.8k
      if (shortRepPrice < p->opt[1].price)
1225
35.0k
      {
1226
35.0k
        p->opt[1].price = shortRepPrice;
1227
35.0k
        MakeAs_ShortRep(&p->opt[1]);
1228
35.0k
      }
1229
36.8k
      if (last < 2)
1230
21.1k
      {
1231
21.1k
        p->backRes = p->opt[1].dist;
1232
21.1k
        return 1;
1233
21.1k
      }
1234
36.8k
    }
1235
   
1236
191k
    p->opt[1].len = 1;
1237
    
1238
191k
    p->opt[0].reps[0] = reps[0];
1239
191k
    p->opt[0].reps[1] = reps[1];
1240
191k
    p->opt[0].reps[2] = reps[2];
1241
191k
    p->opt[0].reps[3] = reps[3];
1242
    
1243
    // ---------- REP ----------
1244
    
1245
959k
    for (i = 0; i < LZMA_NUM_REPS; i++)
1246
767k
    {
1247
767k
      unsigned repLen = repLens[i];
1248
767k
      UInt32 price;
1249
767k
      if (repLen < 2)
1250
719k
        continue;
1251
48.8k
      price = repMatchPrice + GetPrice_PureRep(p, i, p->state, posState);
1252
48.8k
      do
1253
295k
      {
1254
295k
        UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, repLen);
1255
295k
        COptimal *opt = &p->opt[repLen];
1256
295k
        if (price2 < opt->price)
1257
193k
        {
1258
193k
          opt->price = price2;
1259
193k
          opt->len = (UInt32)repLen;
1260
193k
          opt->dist = (UInt32)i;
1261
193k
          opt->extra = 0;
1262
193k
        }
1263
295k
      }
1264
295k
      while (--repLen >= 2);
1265
48.8k
    }
1266
    
1267
    
1268
    // ---------- MATCH ----------
1269
191k
    {
1270
191k
      unsigned len = repLens[0] + 1;
1271
191k
      if (len <= mainLen)
1272
182k
      {
1273
182k
        unsigned offs = 0;
1274
182k
        UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[p->state]);
1275
1276
182k
        if (len < 2)
1277
180k
          len = 2;
1278
1.54k
        else
1279
4.65k
          while (len > matches[offs])
1280
3.11k
            offs += 2;
1281
    
1282
238k
        for (; ; len++)
1283
420k
        {
1284
420k
          COptimal *opt;
1285
420k
          UInt32 dist = matches[(size_t)offs + 1];
1286
420k
          UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1287
420k
          unsigned lenToPosState = GetLenToPosState(len);
1288
       
1289
420k
          if (dist < kNumFullDistances)
1290
234k
            price += p->distancesPrices[lenToPosState][dist & (kNumFullDistances - 1)];
1291
186k
          else
1292
186k
          {
1293
186k
            unsigned slot;
1294
186k
            GetPosSlot2(dist, slot);
1295
186k
            price += p->alignPrices[dist & kAlignMask];
1296
186k
            price += p->posSlotPrices[lenToPosState][slot];
1297
186k
          }
1298
          
1299
420k
          opt = &p->opt[len];
1300
          
1301
420k
          if (price < opt->price)
1302
360k
          {
1303
360k
            opt->price = price;
1304
360k
            opt->len = (UInt32)len;
1305
360k
            opt->dist = dist + LZMA_NUM_REPS;
1306
360k
            opt->extra = 0;
1307
360k
          }
1308
          
1309
420k
          if (len == matches[offs])
1310
237k
          {
1311
237k
            offs += 2;
1312
237k
            if (offs == numPairs)
1313
182k
              break;
1314
237k
          }
1315
420k
        }
1316
182k
      }
1317
191k
    }
1318
    
1319
1320
191k
    cur = 0;
1321
1322
    #ifdef SHOW_STAT2
1323
    /* if (position >= 0) */
1324
    {
1325
      unsigned i;
1326
      printf("\n pos = %4X", position);
1327
      for (i = cur; i <= last; i++)
1328
      printf("\nprice[%4X] = %u", position - cur + i, p->opt[i].price);
1329
    }
1330
    #endif
1331
191k
  }
1332
1333
1334
  
1335
  // ---------- Optimal Parsing ----------
1336
1337
0
  for (;;)
1338
4.11M
  {
1339
4.11M
    unsigned numAvail;
1340
4.11M
    UInt32 numAvailFull;
1341
4.11M
    unsigned newLen, numPairs, prev, state, posState, startLen;
1342
4.11M
    UInt32 litPrice, matchPrice, repMatchPrice;
1343
4.11M
    BoolInt nextIsLit;
1344
4.11M
    Byte curByte, matchByte;
1345
4.11M
    const Byte *data;
1346
4.11M
    COptimal *curOpt, *nextOpt;
1347
1348
4.11M
    if (++cur == last)
1349
160k
      break;
1350
    
1351
    // 18.06
1352
3.95M
    if (cur >= kNumOpts - 64)
1353
460
    {
1354
460
      unsigned j, best;
1355
460
      UInt32 price = p->opt[cur].price;
1356
460
      best = cur;
1357
8.86k
      for (j = cur + 1; j <= last; j++)
1358
8.40k
      {
1359
8.40k
        UInt32 price2 = p->opt[j].price;
1360
8.40k
        if (price >= price2)
1361
844
        {
1362
844
          price = price2;
1363
844
          best = j;
1364
844
        }
1365
8.40k
      }
1366
460
      {
1367
460
        unsigned delta = best - cur;
1368
460
        if (delta != 0)
1369
249
        {
1370
249
          MOVE_POS(p, delta);
1371
249
        }
1372
460
      }
1373
460
      cur = best;
1374
460
      break;
1375
460
    }
1376
1377
3.95M
    newLen = ReadMatchDistances(p, &numPairs);
1378
    
1379
3.95M
    if (newLen >= p->numFastBytes)
1380
30.6k
    {
1381
30.6k
      p->numPairs = numPairs;
1382
30.6k
      p->longestMatchLen = newLen;
1383
30.6k
      break;
1384
30.6k
    }
1385
    
1386
3.92M
    curOpt = &p->opt[cur];
1387
1388
3.92M
    position++;
1389
1390
    // we need that check here, if skip_items in p->opt are possible
1391
    /*
1392
    if (curOpt->price >= kInfinityPrice)
1393
      continue;
1394
    */
1395
1396
3.92M
    prev = cur - curOpt->len;
1397
1398
3.92M
    if (curOpt->len == 1)
1399
955k
    {
1400
955k
      state = (unsigned)p->opt[prev].state;
1401
955k
      if (IsShortRep(curOpt))
1402
196k
        state = kShortRepNextStates[state];
1403
759k
      else
1404
759k
        state = kLiteralNextStates[state];
1405
955k
    }
1406
2.97M
    else
1407
2.97M
    {
1408
2.97M
      const COptimal *prevOpt;
1409
2.97M
      UInt32 b0;
1410
2.97M
      UInt32 dist = curOpt->dist;
1411
1412
2.97M
      if (curOpt->extra)
1413
104k
      {
1414
104k
        prev -= (unsigned)curOpt->extra;
1415
104k
        state = kState_RepAfterLit;
1416
104k
        if (curOpt->extra == 1)
1417
1.22k
          state = (dist < LZMA_NUM_REPS ? kState_RepAfterLit : kState_MatchAfterLit);
1418
104k
      }
1419
2.86M
      else
1420
2.86M
      {
1421
2.86M
        state = (unsigned)p->opt[prev].state;
1422
2.86M
        if (dist < LZMA_NUM_REPS)
1423
1.64M
          state = kRepNextStates[state];
1424
1.21M
        else
1425
1.21M
          state = kMatchNextStates[state];
1426
2.86M
      }
1427
1428
2.97M
      prevOpt = &p->opt[prev];
1429
2.97M
      b0 = prevOpt->reps[0];
1430
1431
2.97M
      if (dist < LZMA_NUM_REPS)
1432
1.74M
      {
1433
1.74M
        if (dist == 0)
1434
445k
        {
1435
445k
          reps[0] = b0;
1436
445k
          reps[1] = prevOpt->reps[1];
1437
445k
          reps[2] = prevOpt->reps[2];
1438
445k
          reps[3] = prevOpt->reps[3];
1439
445k
        }
1440
1.29M
        else
1441
1.29M
        {
1442
1.29M
          reps[1] = b0;
1443
1.29M
          b0 = prevOpt->reps[1];
1444
1.29M
          if (dist == 1)
1445
726k
          {
1446
726k
            reps[0] = b0;
1447
726k
            reps[2] = prevOpt->reps[2];
1448
726k
            reps[3] = prevOpt->reps[3];
1449
726k
          }
1450
572k
          else
1451
572k
          {
1452
572k
            reps[2] = b0;
1453
572k
            reps[0] = prevOpt->reps[dist];
1454
572k
            reps[3] = prevOpt->reps[dist ^ 1];
1455
572k
          }
1456
1.29M
        }
1457
1.74M
      }
1458
1.22M
      else
1459
1.22M
      {
1460
1.22M
        reps[0] = (dist - LZMA_NUM_REPS + 1);
1461
1.22M
        reps[1] = b0;
1462
1.22M
        reps[2] = prevOpt->reps[1];
1463
1.22M
        reps[3] = prevOpt->reps[2];
1464
1.22M
      }
1465
2.97M
    }
1466
    
1467
3.92M
    curOpt->state = (CState)state;
1468
3.92M
    curOpt->reps[0] = reps[0];
1469
3.92M
    curOpt->reps[1] = reps[1];
1470
3.92M
    curOpt->reps[2] = reps[2];
1471
3.92M
    curOpt->reps[3] = reps[3];
1472
1473
3.92M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1474
3.92M
    curByte = *data;
1475
3.92M
    matchByte = *(data - reps[0]);
1476
1477
3.92M
    posState = (position & p->pbMask);
1478
1479
    /*
1480
    The order of Price checks:
1481
       <  LIT
1482
       <= SHORT_REP
1483
       <  LIT : REP_0
1484
       <  REP    [ : LIT : REP_0 ]
1485
       <  MATCH  [ : LIT : REP_0 ]
1486
    */
1487
1488
3.92M
    {
1489
3.92M
      UInt32 curPrice = curOpt->price;
1490
3.92M
      unsigned prob = p->isMatch[state][posState];
1491
3.92M
      matchPrice = curPrice + GET_PRICE_1(prob);
1492
3.92M
      litPrice = curPrice + GET_PRICE_0(prob);
1493
3.92M
    }
1494
1495
3.92M
    nextOpt = &p->opt[(size_t)cur + 1];
1496
3.92M
    nextIsLit = False;
1497
1498
    // here we can allow skip_items in p->opt, if we don't check (nextOpt->price < kInfinityPrice)
1499
    // 18.new.06
1500
3.92M
    if ((nextOpt->price < kInfinityPrice
1501
        // && !IsLitState(state)
1502
3.92M
        && matchByte == curByte)
1503
3.92M
        || litPrice > nextOpt->price
1504
3.92M
        )
1505
2.76M
      litPrice = 0;
1506
1.16M
    else
1507
1.16M
    {
1508
1.16M
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1509
1.16M
      litPrice += (!IsLitState(state) ?
1510
842k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1511
1.16M
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1512
      
1513
1.16M
      if (litPrice < nextOpt->price)
1514
676k
      {
1515
676k
        nextOpt->price = litPrice;
1516
676k
        nextOpt->len = 1;
1517
676k
        MakeAs_Lit(nextOpt);
1518
676k
        nextIsLit = True;
1519
676k
      }
1520
1.16M
    }
1521
1522
3.92M
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[state]);
1523
    
1524
3.92M
    numAvailFull = p->numAvail;
1525
3.92M
    {
1526
3.92M
      unsigned temp = kNumOpts - 1 - cur;
1527
3.92M
      if (numAvailFull > temp)
1528
3.14M
        numAvailFull = (UInt32)temp;
1529
3.92M
    }
1530
1531
    // 18.06
1532
    // ---------- SHORT_REP ----------
1533
3.92M
    if (IsLitState(state)) // 18.new
1534
759k
    if (matchByte == curByte)
1535
343k
    if (repMatchPrice < nextOpt->price) // 18.new
1536
    // if (numAvailFull < 2 || data[1] != *(data - reps[0] + 1))
1537
243k
    if (
1538
        // nextOpt->price >= kInfinityPrice ||
1539
243k
        nextOpt->len < 2   // we can check nextOpt->len, if skip items are not allowed in p->opt
1540
243k
        || (nextOpt->dist != 0
1541
            // && nextOpt->extra <= 1 // 17.old
1542
233k
            )
1543
243k
        )
1544
242k
    {
1545
242k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, state, posState);
1546
      // if (shortRepPrice <= nextOpt->price) // 17.old
1547
242k
      if (shortRepPrice < nextOpt->price)  // 18.new
1548
193k
      {
1549
193k
        nextOpt->price = shortRepPrice;
1550
193k
        nextOpt->len = 1;
1551
193k
        MakeAs_ShortRep(nextOpt);
1552
193k
        nextIsLit = False;
1553
193k
      }
1554
242k
    }
1555
    
1556
3.92M
    if (numAvailFull < 2)
1557
2.24k
      continue;
1558
3.92M
    numAvail = (numAvailFull <= p->numFastBytes ? numAvailFull : p->numFastBytes);
1559
1560
    // numAvail <= p->numFastBytes
1561
1562
    // ---------- LIT : REP_0 ----------
1563
1564
3.92M
    if (!nextIsLit
1565
3.92M
        && litPrice != 0 // 18.new
1566
3.92M
        && matchByte != curByte
1567
3.92M
        && numAvailFull > 2)
1568
484k
    {
1569
484k
      const Byte *data2 = data - reps[0];
1570
484k
      if (data[1] == data2[1] && data[2] == data2[2])
1571
129k
      {
1572
129k
        unsigned len;
1573
129k
        unsigned limit = p->numFastBytes + 1;
1574
129k
        if (limit > numAvailFull)
1575
5.41k
          limit = numAvailFull;
1576
314k
        for (len = 3; len < limit && data[len] == data2[len]; len++)
1577
185k
        {}
1578
        
1579
129k
        {
1580
129k
          unsigned state2 = kLiteralNextStates[state];
1581
129k
          unsigned posState2 = (position + 1) & p->pbMask;
1582
129k
          UInt32 price = litPrice + GetPrice_Rep_0(p, state2, posState2);
1583
129k
          {
1584
129k
            unsigned offset = cur + len;
1585
1586
129k
            if (last < offset)
1587
4.20k
              last = offset;
1588
          
1589
            // do
1590
129k
            {
1591
129k
              UInt32 price2;
1592
129k
              COptimal *opt;
1593
129k
              len--;
1594
              // price2 = price + GetPrice_Len_Rep_0(p, len, state2, posState2);
1595
129k
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len);
1596
1597
129k
              opt = &p->opt[offset];
1598
              // offset--;
1599
129k
              if (price2 < opt->price)
1600
8.28k
              {
1601
8.28k
                opt->price = price2;
1602
8.28k
                opt->len = (UInt32)len;
1603
8.28k
                opt->dist = 0;
1604
8.28k
                opt->extra = 1;
1605
8.28k
              }
1606
129k
            }
1607
            // while (len >= 3);
1608
129k
          }
1609
129k
        }
1610
129k
      }
1611
484k
    }
1612
    
1613
3.92M
    startLen = 2; /* speed optimization */
1614
1615
3.92M
    {
1616
      // ---------- REP ----------
1617
3.92M
      unsigned repIndex = 0; // 17.old
1618
      // unsigned repIndex = IsLitState(state) ? 0 : 1; // 18.notused
1619
19.6M
      for (; repIndex < LZMA_NUM_REPS; repIndex++)
1620
15.6M
      {
1621
15.6M
        unsigned len;
1622
15.6M
        UInt32 price;
1623
15.6M
        const Byte *data2 = data - reps[repIndex];
1624
15.6M
        if (data[0] != data2[0] || data[1] != data2[1])
1625
11.0M
          continue;
1626
        
1627
73.2M
        for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1628
68.6M
        {}
1629
        
1630
        // if (len < startLen) continue; // 18.new: speed optimization
1631
1632
4.64M
        {
1633
4.64M
          unsigned offset = cur + len;
1634
4.64M
          if (last < offset)
1635
201k
            last = offset;
1636
4.64M
        }
1637
4.64M
        {
1638
4.64M
          unsigned len2 = len;
1639
4.64M
          price = repMatchPrice + GetPrice_PureRep(p, repIndex, state, posState);
1640
4.64M
          do
1641
73.2M
          {
1642
73.2M
            UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, len2);
1643
73.2M
            COptimal *opt = &p->opt[cur + len2];
1644
73.2M
            if (price2 < opt->price)
1645
2.66M
            {
1646
2.66M
              opt->price = price2;
1647
2.66M
              opt->len = (UInt32)len2;
1648
2.66M
              opt->dist = (UInt32)repIndex;
1649
2.66M
              opt->extra = 0;
1650
2.66M
            }
1651
73.2M
          }
1652
73.2M
          while (--len2 >= 2);
1653
4.64M
        }
1654
        
1655
4.64M
        if (repIndex == 0) startLen = len + 1;  // 17.old
1656
        // startLen = len + 1; // 18.new
1657
1658
        /* if (_maxMode) */
1659
4.64M
        {
1660
          // ---------- REP : LIT : REP_0 ----------
1661
          // numFastBytes + 1 + numFastBytes
1662
1663
4.64M
          unsigned len2 = len + 1;
1664
4.64M
          unsigned limit = len2 + p->numFastBytes;
1665
4.64M
          if (limit > numAvailFull)
1666
402k
            limit = numAvailFull;
1667
          
1668
4.64M
          len2 += 2;
1669
4.64M
          if (len2 <= limit)
1670
4.57M
          if (data[len2 - 2] == data2[len2 - 2])
1671
2.50M
          if (data[len2 - 1] == data2[len2 - 1])
1672
2.13M
          {
1673
2.13M
            unsigned state2 = kRepNextStates[state];
1674
2.13M
            unsigned posState2 = (position + len) & p->pbMask;
1675
2.13M
            price += GET_PRICE_LEN(&p->repLenEnc, posState, len)
1676
2.13M
                + GET_PRICE_0(p->isMatch[state2][posState2])
1677
2.13M
                + LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1678
2.13M
                    data[len], data2[len], p->ProbPrices);
1679
            
1680
            // state2 = kLiteralNextStates[state2];
1681
2.13M
            state2 = kState_LitAfterRep;
1682
2.13M
            posState2 = (posState2 + 1) & p->pbMask;
1683
1684
1685
2.13M
            price += GetPrice_Rep_0(p, state2, posState2);
1686
1687
24.9M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1688
22.8M
          {}
1689
          
1690
2.13M
          len2 -= len;
1691
          // if (len2 >= 3)
1692
2.13M
          {
1693
2.13M
            {
1694
2.13M
              unsigned offset = cur + len + len2;
1695
1696
2.13M
              if (last < offset)
1697
383k
                last = offset;
1698
              // do
1699
2.13M
              {
1700
2.13M
                UInt32 price2;
1701
2.13M
                COptimal *opt;
1702
2.13M
                len2--;
1703
                // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1704
2.13M
                price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1705
1706
2.13M
                opt = &p->opt[offset];
1707
                // offset--;
1708
2.13M
                if (price2 < opt->price)
1709
500k
                {
1710
500k
                  opt->price = price2;
1711
500k
                  opt->len = (UInt32)len2;
1712
500k
                  opt->extra = (CExtra)(len + 1);
1713
500k
                  opt->dist = (UInt32)repIndex;
1714
500k
                }
1715
2.13M
              }
1716
              // while (len2 >= 3);
1717
2.13M
            }
1718
2.13M
          }
1719
2.13M
          }
1720
4.64M
        }
1721
4.64M
      }
1722
3.92M
    }
1723
1724
1725
    // ---------- MATCH ----------
1726
    /* for (unsigned len = 2; len <= newLen; len++) */
1727
3.92M
    if (newLen > numAvail)
1728
598
    {
1729
598
      newLen = numAvail;
1730
2.29k
      for (numPairs = 0; newLen > matches[numPairs]; numPairs += 2);
1731
598
      matches[numPairs] = (UInt32)newLen;
1732
598
      numPairs += 2;
1733
598
    }
1734
    
1735
    // startLen = 2; /* speed optimization */
1736
1737
3.92M
    if (newLen >= startLen)
1738
2.40M
    {
1739
2.40M
      UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[state]);
1740
2.40M
      UInt32 dist;
1741
2.40M
      unsigned offs, posSlot, len;
1742
      
1743
2.40M
      {
1744
2.40M
        unsigned offset = cur + newLen;
1745
2.40M
        if (last < offset)
1746
425k
          last = offset;
1747
2.40M
      }
1748
1749
2.40M
      offs = 0;
1750
2.94M
      while (startLen > matches[offs])
1751
536k
        offs += 2;
1752
2.40M
      dist = matches[(size_t)offs + 1];
1753
      
1754
      // if (dist >= kNumFullDistances)
1755
2.40M
      GetPosSlot2(dist, posSlot);
1756
      
1757
13.7M
      for (len = /*2*/ startLen; ; len++)
1758
16.1M
      {
1759
16.1M
        UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1760
16.1M
        {
1761
16.1M
          COptimal *opt;
1762
16.1M
          unsigned lenNorm = len - 2;
1763
16.1M
          lenNorm = GetLenToPosState2(lenNorm);
1764
16.1M
          if (dist < kNumFullDistances)
1765
9.50M
            price += p->distancesPrices[lenNorm][dist & (kNumFullDistances - 1)];
1766
6.64M
          else
1767
6.64M
            price += p->posSlotPrices[lenNorm][posSlot] + p->alignPrices[dist & kAlignMask];
1768
          
1769
16.1M
          opt = &p->opt[cur + len];
1770
16.1M
          if (price < opt->price)
1771
2.52M
          {
1772
2.52M
            opt->price = price;
1773
2.52M
            opt->len = (UInt32)len;
1774
2.52M
            opt->dist = dist + LZMA_NUM_REPS;
1775
2.52M
            opt->extra = 0;
1776
2.52M
          }
1777
16.1M
        }
1778
1779
16.1M
        if (len == matches[offs])
1780
3.06M
        {
1781
          // if (p->_maxMode) {
1782
          // MATCH : LIT : REP_0
1783
1784
3.06M
          const Byte *data2 = data - dist - 1;
1785
3.06M
          unsigned len2 = len + 1;
1786
3.06M
          unsigned limit = len2 + p->numFastBytes;
1787
3.06M
          if (limit > numAvailFull)
1788
159k
            limit = numAvailFull;
1789
          
1790
3.06M
          len2 += 2;
1791
3.06M
          if (len2 <= limit)
1792
3.04M
          if (data[len2 - 2] == data2[len2 - 2])
1793
1.44M
          if (data[len2 - 1] == data2[len2 - 1])
1794
1.02M
          {
1795
6.81M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1796
5.79M
          {}
1797
          
1798
1.02M
          len2 -= len;
1799
          
1800
          // if (len2 >= 3)
1801
1.02M
          {
1802
1.02M
            unsigned state2 = kMatchNextStates[state];
1803
1.02M
            unsigned posState2 = (position + len) & p->pbMask;
1804
1.02M
            unsigned offset;
1805
1.02M
            price += GET_PRICE_0(p->isMatch[state2][posState2]);
1806
1.02M
            price += LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1807
1.02M
                    data[len], data2[len], p->ProbPrices);
1808
1809
            // state2 = kLiteralNextStates[state2];
1810
1.02M
            state2 = kState_LitAfterMatch;
1811
1812
1.02M
            posState2 = (posState2 + 1) & p->pbMask;
1813
1.02M
            price += GetPrice_Rep_0(p, state2, posState2);
1814
1815
1.02M
            offset = cur + len + len2;
1816
1817
1.02M
            if (last < offset)
1818
182k
              last = offset;
1819
            // do
1820
1.02M
            {
1821
1.02M
              UInt32 price2;
1822
1.02M
              COptimal *opt;
1823
1.02M
              len2--;
1824
              // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1825
1.02M
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1826
1.02M
              opt = &p->opt[offset];
1827
              // offset--;
1828
1.02M
              if (price2 < opt->price)
1829
298k
              {
1830
298k
                opt->price = price2;
1831
298k
                opt->len = (UInt32)len2;
1832
298k
                opt->extra = (CExtra)(len + 1);
1833
298k
                opt->dist = dist + LZMA_NUM_REPS;
1834
298k
              }
1835
1.02M
            }
1836
            // while (len2 >= 3);
1837
1.02M
          }
1838
1839
1.02M
          }
1840
        
1841
3.06M
          offs += 2;
1842
3.06M
          if (offs == numPairs)
1843
2.40M
            break;
1844
657k
          dist = matches[(size_t)offs + 1];
1845
          // if (dist >= kNumFullDistances)
1846
657k
            GetPosSlot2(dist, posSlot);
1847
657k
        }
1848
16.1M
      }
1849
2.40M
    }
1850
3.92M
  }
1851
1852
191k
  do
1853
4.37M
    p->opt[last].price = kInfinityPrice;
1854
4.37M
  while (--last);
1855
1856
191k
  return Backward(p, cur);
1857
213k
}
1858
1859
1860
1861
178k
#define ChangePair(smallDist, bigDist) (((bigDist) >> 7) > (smallDist))
1862
1863
1864
1865
static unsigned GetOptimumFast(CLzmaEnc *p)
1866
1.58M
{
1867
1.58M
  UInt32 numAvail, mainDist;
1868
1.58M
  unsigned mainLen, numPairs, repIndex, repLen, i;
1869
1.58M
  const Byte *data;
1870
1871
1.58M
  if (p->additionalOffset == 0)
1872
1.49M
    mainLen = ReadMatchDistances(p, &numPairs);
1873
86.1k
  else
1874
86.1k
  {
1875
86.1k
    mainLen = p->longestMatchLen;
1876
86.1k
    numPairs = p->numPairs;
1877
86.1k
  }
1878
1879
1.58M
  numAvail = p->numAvail;
1880
1.58M
  p->backRes = MARK_LIT;
1881
1.58M
  if (numAvail < 2)
1882
1.45k
    return 1;
1883
  // if (mainLen < 2 && p->state == 0) return 1; // 18.06.notused
1884
1.57M
  if (numAvail > LZMA_MATCH_LEN_MAX)
1885
1.50M
    numAvail = LZMA_MATCH_LEN_MAX;
1886
1.57M
  data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1887
1.57M
  repLen = repIndex = 0;
1888
  
1889
7.73M
  for (i = 0; i < LZMA_NUM_REPS; i++)
1890
6.21M
  {
1891
6.21M
    unsigned len;
1892
6.21M
    const Byte *data2 = data - p->reps[i];
1893
6.21M
    if (data[0] != data2[0] || data[1] != data2[1])
1894
5.92M
      continue;
1895
4.67M
    for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1896
4.38M
    {}
1897
292k
    if (len >= p->numFastBytes)
1898
59.7k
    {
1899
59.7k
      p->backRes = (UInt32)i;
1900
59.7k
      MOVE_POS(p, len - 1)
1901
59.7k
      return len;
1902
59.7k
    }
1903
232k
    if (len > repLen)
1904
182k
    {
1905
182k
      repIndex = i;
1906
182k
      repLen = len;
1907
182k
    }
1908
232k
  }
1909
1910
1.51M
  if (mainLen >= p->numFastBytes)
1911
64.3k
  {
1912
64.3k
    p->backRes = p->matches[(size_t)numPairs - 1] + LZMA_NUM_REPS;
1913
64.3k
    MOVE_POS(p, mainLen - 1)
1914
64.3k
    return mainLen;
1915
64.3k
  }
1916
1917
1.45M
  mainDist = 0; /* for GCC */
1918
  
1919
1.45M
  if (mainLen >= 2)
1920
558k
  {
1921
558k
    mainDist = p->matches[(size_t)numPairs - 1];
1922
562k
    while (numPairs > 2)
1923
129k
    {
1924
129k
      UInt32 dist2;
1925
129k
      if (mainLen != p->matches[(size_t)numPairs - 4] + 1)
1926
84.8k
        break;
1927
44.6k
      dist2 = p->matches[(size_t)numPairs - 3];
1928
44.6k
      if (!ChangePair(dist2, mainDist))
1929
40.3k
        break;
1930
4.34k
      numPairs -= 2;
1931
4.34k
      mainLen--;
1932
4.34k
      mainDist = dist2;
1933
4.34k
    }
1934
558k
    if (mainLen == 2 && mainDist >= 0x80)
1935
214k
      mainLen = 1;
1936
558k
  }
1937
1938
1.45M
  if (repLen >= 2)
1939
139k
    if (    repLen + 1 >= mainLen
1940
139k
        || (repLen + 2 >= mainLen && mainDist >= (1 << 9))
1941
139k
        || (repLen + 3 >= mainLen && mainDist >= (1 << 15)))
1942
115k
  {
1943
115k
    p->backRes = (UInt32)repIndex;
1944
115k
    MOVE_POS(p, repLen - 1)
1945
115k
    return repLen;
1946
115k
  }
1947
  
1948
1.34M
  if (mainLen < 2 || numAvail <= 2)
1949
1.10M
    return 1;
1950
1951
230k
  {
1952
230k
    unsigned len1 = ReadMatchDistances(p, &p->numPairs);
1953
230k
    p->longestMatchLen = len1;
1954
  
1955
230k
    if (len1 >= 2)
1956
205k
    {
1957
205k
      UInt32 newDist = p->matches[(size_t)p->numPairs - 1];
1958
205k
      if (   (len1 >= mainLen && newDist < mainDist)
1959
205k
          || (len1 == mainLen + 1 && !ChangePair(mainDist, newDist))
1960
205k
          || (len1 >  mainLen + 1)
1961
205k
          || (len1 + 1 >= mainLen && mainLen >= 3 && ChangePair(newDist, mainDist)))
1962
75.3k
        return 1;
1963
205k
    }
1964
230k
  }
1965
  
1966
154k
  data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1967
  
1968
740k
  for (i = 0; i < LZMA_NUM_REPS; i++)
1969
596k
  {
1970
596k
    unsigned len, limit;
1971
596k
    const Byte *data2 = data - p->reps[i];
1972
596k
    if (data[0] != data2[0] || data[1] != data2[1])
1973
551k
      continue;
1974
45.4k
    limit = mainLen - 1;
1975
68.3k
    for (len = 2;; len++)
1976
113k
    {
1977
113k
      if (len >= limit)
1978
10.7k
        return 1;
1979
102k
      if (data[len] != data2[len])
1980
34.6k
        break;
1981
102k
    }
1982
45.4k
  }
1983
  
1984
143k
  p->backRes = mainDist + LZMA_NUM_REPS;
1985
143k
  if (mainLen != 2)
1986
117k
  {
1987
117k
    MOVE_POS(p, mainLen - 2)
1988
117k
  }
1989
143k
  return mainLen;
1990
154k
}
1991
1992
1993
1994
1995
static void WriteEndMarker(CLzmaEnc *p, unsigned posState)
1996
4.96k
{
1997
4.96k
  UInt32 range;
1998
4.96k
  range = p->rc.range;
1999
4.96k
  {
2000
4.96k
    UInt32 ttt, newBound;
2001
4.96k
    CLzmaProb *prob = &p->isMatch[p->state][posState];
2002
4.96k
    RC_BIT_PRE(&p->rc, prob)
2003
4.96k
    RC_BIT_1(&p->rc, prob)
2004
4.96k
    prob = &p->isRep[p->state];
2005
4.96k
    RC_BIT_PRE(&p->rc, prob)
2006
4.96k
    RC_BIT_0(&p->rc, prob)
2007
4.96k
  }
2008
4.96k
  p->state = kMatchNextStates[p->state];
2009
  
2010
4.96k
  p->rc.range = range;
2011
4.96k
  LenEnc_Encode(&p->lenProbs, &p->rc, 0, posState);
2012
4.96k
  range = p->rc.range;
2013
2014
4.96k
  {
2015
    // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[0], (1 << kNumPosSlotBits) - 1);
2016
4.96k
    CLzmaProb *probs = p->posSlotEncoder[0];
2017
4.96k
    unsigned m = 1;
2018
4.96k
    do
2019
29.8k
    {
2020
29.8k
      UInt32 ttt, newBound;
2021
29.8k
      RC_BIT_PRE(p, probs + m)
2022
29.8k
      RC_BIT_1(&p->rc, probs + m);
2023
29.8k
      m = (m << 1) + 1;
2024
29.8k
    }
2025
29.8k
    while (m < (1 << kNumPosSlotBits));
2026
4.96k
  }
2027
4.96k
  {
2028
    // RangeEnc_EncodeDirectBits(&p->rc, ((UInt32)1 << (30 - kNumAlignBits)) - 1, 30 - kNumAlignBits);    UInt32 range = p->range;
2029
4.96k
    unsigned numBits = 30 - kNumAlignBits;
2030
4.96k
    do
2031
129k
    {
2032
129k
      range >>= 1;
2033
129k
      p->rc.low += range;
2034
129k
      RC_NORM(&p->rc)
2035
129k
    }
2036
129k
    while (--numBits);
2037
4.96k
  }
2038
   
2039
4.96k
  {
2040
    // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, kAlignMask);
2041
4.96k
    CLzmaProb *probs = p->posAlignEncoder;
2042
4.96k
    unsigned m = 1;
2043
4.96k
    do
2044
19.8k
    {
2045
19.8k
      UInt32 ttt, newBound;
2046
19.8k
      RC_BIT_PRE(p, probs + m)
2047
19.8k
      RC_BIT_1(&p->rc, probs + m);
2048
19.8k
      m = (m << 1) + 1;
2049
19.8k
    }
2050
19.8k
    while (m < kAlignTableSize);
2051
4.96k
  }
2052
4.96k
  p->rc.range = range;
2053
4.96k
}
2054
2055
2056
static SRes CheckErrors(CLzmaEnc *p)
2057
14.5k
{
2058
14.5k
  if (p->result != SZ_OK)
2059
0
    return p->result;
2060
14.5k
  if (p->rc.res != SZ_OK)
2061
0
    p->result = SZ_ERROR_WRITE;
2062
14.5k
  if (p->matchFinderBase.result != SZ_OK)
2063
0
    p->result = SZ_ERROR_READ;
2064
14.5k
  if (p->result != SZ_OK)
2065
0
    p->finished = True;
2066
14.5k
  return p->result;
2067
14.5k
}
2068
2069
2070
MY_NO_INLINE static SRes Flush(CLzmaEnc *p, UInt32 nowPos)
2071
7.27k
{
2072
  /* ReleaseMFStream(); */
2073
7.27k
  p->finished = True;
2074
7.27k
  if (p->writeEndMark)
2075
4.96k
    WriteEndMarker(p, nowPos & p->pbMask);
2076
7.27k
  RangeEnc_FlushData(&p->rc);
2077
7.27k
  RangeEnc_FlushStream(&p->rc);
2078
7.27k
  return CheckErrors(p);
2079
7.27k
}
2080
2081
2082
MY_NO_INLINE static void FillAlignPrices(CLzmaEnc *p)
2083
11.0k
{
2084
11.0k
  unsigned i;
2085
11.0k
  const CProbPrice *ProbPrices = p->ProbPrices;
2086
11.0k
  const CLzmaProb *probs = p->posAlignEncoder;
2087
  // p->alignPriceCount = 0;
2088
99.4k
  for (i = 0; i < kAlignTableSize / 2; i++)
2089
88.3k
  {
2090
88.3k
    UInt32 price = 0;
2091
88.3k
    unsigned sym = i;
2092
88.3k
    unsigned m = 1;
2093
88.3k
    unsigned bit;
2094
88.3k
    UInt32 prob;
2095
88.3k
    bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[m], bit); m = (m << 1) + bit;
2096
88.3k
    bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[m], bit); m = (m << 1) + bit;
2097
88.3k
    bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[m], bit); m = (m << 1) + bit;
2098
88.3k
    prob = probs[m];
2099
88.3k
    p->alignPrices[i    ] = price + GET_PRICEa_0(prob);
2100
88.3k
    p->alignPrices[i + 8] = price + GET_PRICEa_1(prob);
2101
    // p->alignPrices[i] = RcTree_ReverseGetPrice(p->posAlignEncoder, kNumAlignBits, i, p->ProbPrices);
2102
88.3k
  }
2103
11.0k
}
2104
2105
2106
MY_NO_INLINE static void FillDistancesPrices(CLzmaEnc *p)
2107
11.0k
{
2108
  // int y; for (y = 0; y < 100; y++) {
2109
2110
11.0k
  UInt32 tempPrices[kNumFullDistances];
2111
11.0k
  unsigned i, lps;
2112
2113
11.0k
  const CProbPrice *ProbPrices = p->ProbPrices;
2114
11.0k
  p->matchPriceCount = 0;
2115
2116
696k
  for (i = kStartPosModelIndex / 2; i < kNumFullDistances / 2; i++)
2117
685k
  {
2118
685k
    unsigned posSlot = GetPosSlot1(i);
2119
685k
    unsigned footerBits = (posSlot >> 1) - 1;
2120
685k
    unsigned base = ((2 | (posSlot & 1)) << footerBits);
2121
685k
    const CLzmaProb *probs = p->posEncoders + (size_t)base * 2;
2122
    // tempPrices[i] = RcTree_ReverseGetPrice(p->posEncoders + base, footerBits, i - base, p->ProbPrices);
2123
685k
    UInt32 price = 0;
2124
685k
    unsigned m = 1;
2125
685k
    unsigned sym = i;
2126
685k
    unsigned offset = (unsigned)1 << footerBits;
2127
685k
    base += i;
2128
    
2129
685k
    if (footerBits)
2130
662k
    do
2131
2.16M
    {
2132
2.16M
      unsigned bit = sym & 1;
2133
2.16M
      sym >>= 1;
2134
2.16M
      price += GET_PRICEa(probs[m], bit);
2135
2.16M
      m = (m << 1) + bit;
2136
2.16M
    }
2137
2.16M
    while (--footerBits);
2138
2139
685k
    {
2140
685k
      unsigned prob = probs[m];
2141
685k
      tempPrices[base         ] = price + GET_PRICEa_0(prob);
2142
685k
      tempPrices[base + offset] = price + GET_PRICEa_1(prob);
2143
685k
    }
2144
685k
  }
2145
2146
55.2k
  for (lps = 0; lps < kNumLenToPosStates; lps++)
2147
44.1k
  {
2148
44.1k
    unsigned slot;
2149
44.1k
    unsigned distTableSize2 = (p->distTableSize + 1) >> 1;
2150
44.1k
    UInt32 *posSlotPrices = p->posSlotPrices[lps];
2151
44.1k
    const CLzmaProb *probs = p->posSlotEncoder[lps];
2152
    
2153
1.10M
    for (slot = 0; slot < distTableSize2; slot++)
2154
1.06M
    {
2155
      // posSlotPrices[slot] = RcTree_GetPrice(encoder, kNumPosSlotBits, slot, p->ProbPrices);
2156
1.06M
      UInt32 price;
2157
1.06M
      unsigned bit;
2158
1.06M
      unsigned sym = slot + (1 << (kNumPosSlotBits - 1));
2159
1.06M
      unsigned prob;
2160
1.06M
      bit = sym & 1; sym >>= 1; price  = GET_PRICEa(probs[sym], bit);
2161
1.06M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2162
1.06M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2163
1.06M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2164
1.06M
      bit = sym & 1; sym >>= 1; price += GET_PRICEa(probs[sym], bit);
2165
1.06M
      prob = probs[(size_t)slot + (1 << (kNumPosSlotBits - 1))];
2166
1.06M
      posSlotPrices[(size_t)slot * 2    ] = price + GET_PRICEa_0(prob);
2167
1.06M
      posSlotPrices[(size_t)slot * 2 + 1] = price + GET_PRICEa_1(prob);
2168
1.06M
    }
2169
    
2170
44.1k
    {
2171
44.1k
      UInt32 delta = ((UInt32)((kEndPosModelIndex / 2 - 1) - kNumAlignBits) << kNumBitPriceShiftBits);
2172
795k
      for (slot = kEndPosModelIndex / 2; slot < distTableSize2; slot++)
2173
751k
      {
2174
751k
        posSlotPrices[(size_t)slot * 2    ] += delta;
2175
751k
        posSlotPrices[(size_t)slot * 2 + 1] += delta;
2176
751k
        delta += ((UInt32)1 << kNumBitPriceShiftBits);
2177
751k
      }
2178
44.1k
    }
2179
2180
44.1k
    {
2181
44.1k
      UInt32 *dp = p->distancesPrices[lps];
2182
      
2183
44.1k
      dp[0] = posSlotPrices[0];
2184
44.1k
      dp[1] = posSlotPrices[1];
2185
44.1k
      dp[2] = posSlotPrices[2];
2186
44.1k
      dp[3] = posSlotPrices[3];
2187
2188
2.78M
      for (i = 4; i < kNumFullDistances; i += 2)
2189
2.74M
      {
2190
2.74M
        UInt32 slotPrice = posSlotPrices[GetPosSlot1(i)];
2191
2.74M
        dp[i    ] = slotPrice + tempPrices[i];
2192
2.74M
        dp[i + 1] = slotPrice + tempPrices[i + 1];
2193
2.74M
      }
2194
44.1k
    }
2195
44.1k
  }
2196
  // }
2197
11.0k
}
2198
2199
2200
2201
void LzmaEnc_Construct(CLzmaEnc *p)
2202
7.27k
{
2203
7.27k
  RangeEnc_Construct(&p->rc);
2204
7.27k
  MatchFinder_Construct(&p->matchFinderBase);
2205
  
2206
  #ifndef _7ZIP_ST
2207
  MatchFinderMt_Construct(&p->matchFinderMt);
2208
  p->matchFinderMt.MatchFinder = &p->matchFinderBase;
2209
  #endif
2210
2211
7.27k
  {
2212
7.27k
    CLzmaEncProps props;
2213
7.27k
    LzmaEncProps_Init(&props);
2214
7.27k
    LzmaEnc_SetProps(p, &props);
2215
7.27k
  }
2216
2217
7.27k
  #ifndef LZMA_LOG_BSR
2218
7.27k
  LzmaEnc_FastPosInit(p->g_FastPos);
2219
7.27k
  #endif
2220
2221
7.27k
  LzmaEnc_InitPriceTables(p->ProbPrices);
2222
7.27k
  p->litProbs = NULL;
2223
7.27k
  p->saveState.litProbs = NULL;
2224
2225
7.27k
}
2226
2227
CLzmaEncHandle LzmaEnc_Create(ISzAllocPtr alloc)
2228
7.27k
{
2229
7.27k
  void *p;
2230
7.27k
  p = ISzAlloc_Alloc(alloc, sizeof(CLzmaEnc));
2231
7.27k
  if (p)
2232
7.27k
    LzmaEnc_Construct((CLzmaEnc *)p);
2233
7.27k
  return p;
2234
7.27k
}
2235
2236
void LzmaEnc_FreeLits(CLzmaEnc *p, ISzAllocPtr alloc)
2237
14.5k
{
2238
14.5k
  ISzAlloc_Free(alloc, p->litProbs);
2239
14.5k
  ISzAlloc_Free(alloc, p->saveState.litProbs);
2240
14.5k
  p->litProbs = NULL;
2241
14.5k
  p->saveState.litProbs = NULL;
2242
14.5k
}
2243
2244
void LzmaEnc_Destruct(CLzmaEnc *p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2245
7.27k
{
2246
  #ifndef _7ZIP_ST
2247
  MatchFinderMt_Destruct(&p->matchFinderMt, allocBig);
2248
  #endif
2249
  
2250
7.27k
  MatchFinder_Free(&p->matchFinderBase, allocBig);
2251
7.27k
  LzmaEnc_FreeLits(p, alloc);
2252
7.27k
  RangeEnc_Free(&p->rc, alloc);
2253
7.27k
}
2254
2255
void LzmaEnc_Destroy(CLzmaEncHandle p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2256
7.27k
{
2257
7.27k
  LzmaEnc_Destruct((CLzmaEnc *)p, alloc, allocBig);
2258
7.27k
  ISzAlloc_Free(alloc, p);
2259
7.27k
}
2260
2261
2262
static SRes LzmaEnc_CodeOneBlock(CLzmaEnc *p, UInt32 maxPackSize, UInt32 maxUnpackSize)
2263
7.27k
{
2264
7.27k
  UInt32 nowPos32, startPos32;
2265
7.27k
  if (p->needInit)
2266
7.27k
  {
2267
7.27k
    p->matchFinder.Init(p->matchFinderObj);
2268
7.27k
    p->needInit = 0;
2269
7.27k
  }
2270
2271
7.27k
  if (p->finished)
2272
0
    return p->result;
2273
7.27k
  RINOK(CheckErrors(p));
2274
2275
7.27k
  nowPos32 = (UInt32)p->nowPos64;
2276
7.27k
  startPos32 = nowPos32;
2277
2278
7.27k
  if (p->nowPos64 == 0)
2279
7.27k
  {
2280
7.27k
    unsigned numPairs;
2281
7.27k
    Byte curByte;
2282
7.27k
    if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2283
0
      return Flush(p, nowPos32);
2284
7.27k
    ReadMatchDistances(p, &numPairs);
2285
7.27k
    RangeEnc_EncodeBit_0(&p->rc, &p->isMatch[kState_Start][0]);
2286
    // p->state = kLiteralNextStates[p->state];
2287
7.27k
    curByte = *(p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset);
2288
7.27k
    LitEnc_Encode(&p->rc, p->litProbs, curByte);
2289
7.27k
    p->additionalOffset--;
2290
7.27k
    nowPos32++;
2291
7.27k
  }
2292
2293
7.27k
  if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) != 0)
2294
  
2295
7.19k
  for (;;)
2296
3.74M
  {
2297
3.74M
    UInt32 dist;
2298
3.74M
    unsigned len, posState;
2299
3.74M
    UInt32 range, ttt, newBound;
2300
3.74M
    CLzmaProb *probs;
2301
  
2302
3.74M
    if (p->fastMode)
2303
1.58M
      len = GetOptimumFast(p);
2304
2.16M
    else
2305
2.16M
    {
2306
2.16M
      unsigned oci = p->optCur;
2307
2.16M
      if (p->optEnd == oci)
2308
944k
        len = GetOptimum(p, nowPos32);
2309
1.22M
      else
2310
1.22M
      {
2311
1.22M
        const COptimal *opt = &p->opt[oci];
2312
1.22M
        len = opt->len;
2313
1.22M
        p->backRes = opt->dist;
2314
1.22M
        p->optCur = oci + 1;
2315
1.22M
      }
2316
2.16M
    }
2317
2318
3.74M
    posState = (unsigned)nowPos32 & p->pbMask;
2319
3.74M
    range = p->rc.range;
2320
3.74M
    probs = &p->isMatch[p->state][posState];
2321
    
2322
3.74M
    RC_BIT_PRE(&p->rc, probs)
2323
    
2324
3.74M
    dist = p->backRes;
2325
2326
    #ifdef SHOW_STAT2
2327
    printf("\n pos = %6X, len = %3u  pos = %6u", nowPos32, len, dist);
2328
    #endif
2329
2330
3.74M
    if (dist == MARK_LIT)
2331
2.33M
    {
2332
2.33M
      Byte curByte;
2333
2.33M
      const Byte *data;
2334
2.33M
      unsigned state;
2335
2336
2.33M
      RC_BIT_0(&p->rc, probs);
2337
2.33M
      p->rc.range = range;
2338
2.33M
      data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset;
2339
2.33M
      probs = LIT_PROBS(nowPos32, *(data - 1));
2340
2.33M
      curByte = *data;
2341
2.33M
      state = p->state;
2342
2.33M
      p->state = kLiteralNextStates[state];
2343
2.33M
      if (IsLitState(state))
2344
1.75M
        LitEnc_Encode(&p->rc, probs, curByte);
2345
579k
      else
2346
579k
        LitEnc_EncodeMatched(&p->rc, probs, curByte, *(data - p->reps[0]));
2347
2.33M
    }
2348
1.41M
    else
2349
1.41M
    {
2350
1.41M
      RC_BIT_1(&p->rc, probs);
2351
1.41M
      probs = &p->isRep[p->state];
2352
1.41M
      RC_BIT_PRE(&p->rc, probs)
2353
      
2354
1.41M
      if (dist < LZMA_NUM_REPS)
2355
742k
      {
2356
742k
        RC_BIT_1(&p->rc, probs);
2357
742k
        probs = &p->isRepG0[p->state];
2358
742k
        RC_BIT_PRE(&p->rc, probs)
2359
742k
        if (dist == 0)
2360
291k
        {
2361
291k
          RC_BIT_0(&p->rc, probs);
2362
291k
          probs = &p->isRep0Long[p->state][posState];
2363
291k
          RC_BIT_PRE(&p->rc, probs)
2364
291k
          if (len != 1)
2365
179k
          {
2366
179k
            RC_BIT_1_BASE(&p->rc, probs);
2367
179k
          }
2368
112k
          else
2369
112k
          {
2370
112k
            RC_BIT_0_BASE(&p->rc, probs);
2371
112k
            p->state = kShortRepNextStates[p->state];
2372
112k
          }
2373
291k
        }
2374
451k
        else
2375
451k
        {
2376
451k
          RC_BIT_1(&p->rc, probs);
2377
451k
          probs = &p->isRepG1[p->state];
2378
451k
          RC_BIT_PRE(&p->rc, probs)
2379
451k
          if (dist == 1)
2380
207k
          {
2381
207k
            RC_BIT_0_BASE(&p->rc, probs);
2382
207k
            dist = p->reps[1];
2383
207k
          }
2384
243k
          else
2385
243k
          {
2386
243k
            RC_BIT_1(&p->rc, probs);
2387
243k
            probs = &p->isRepG2[p->state];
2388
243k
            RC_BIT_PRE(&p->rc, probs)
2389
243k
            if (dist == 2)
2390
142k
            {
2391
142k
              RC_BIT_0_BASE(&p->rc, probs);
2392
142k
              dist = p->reps[2];
2393
142k
            }
2394
100k
            else
2395
100k
            {
2396
100k
              RC_BIT_1_BASE(&p->rc, probs);
2397
100k
              dist = p->reps[3];
2398
100k
              p->reps[3] = p->reps[2];
2399
100k
            }
2400
243k
            p->reps[2] = p->reps[1];
2401
243k
          }
2402
451k
          p->reps[1] = p->reps[0];
2403
451k
          p->reps[0] = dist;
2404
451k
        }
2405
2406
742k
        RC_NORM(&p->rc)
2407
2408
742k
        p->rc.range = range;
2409
2410
742k
        if (len != 1)
2411
630k
        {
2412
630k
          LenEnc_Encode(&p->repLenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2413
630k
          --p->repLenEncCounter;
2414
630k
          p->state = kRepNextStates[p->state];
2415
630k
        }
2416
742k
      }
2417
671k
      else
2418
671k
      {
2419
671k
        unsigned posSlot;
2420
671k
        RC_BIT_0(&p->rc, probs);
2421
671k
        p->rc.range = range;
2422
671k
        p->state = kMatchNextStates[p->state];
2423
2424
671k
        LenEnc_Encode(&p->lenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2425
        // --p->lenEnc.counter;
2426
2427
671k
        dist -= LZMA_NUM_REPS;
2428
671k
        p->reps[3] = p->reps[2];
2429
671k
        p->reps[2] = p->reps[1];
2430
671k
        p->reps[1] = p->reps[0];
2431
671k
        p->reps[0] = dist + 1;
2432
        
2433
671k
        p->matchPriceCount++;
2434
671k
        GetPosSlot(dist, posSlot);
2435
        // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[GetLenToPosState(len)], posSlot);
2436
671k
        {
2437
671k
          UInt32 sym = (UInt32)posSlot + (1 << kNumPosSlotBits);
2438
671k
          range = p->rc.range;
2439
671k
          probs = p->posSlotEncoder[GetLenToPosState(len)];
2440
671k
          do
2441
4.03M
          {
2442
4.03M
            CLzmaProb *prob = probs + (sym >> kNumPosSlotBits);
2443
4.03M
            UInt32 bit = (sym >> (kNumPosSlotBits - 1)) & 1;
2444
4.03M
            sym <<= 1;
2445
4.03M
            RC_BIT(&p->rc, prob, bit);
2446
4.03M
          }
2447
4.03M
          while (sym < (1 << kNumPosSlotBits * 2));
2448
671k
          p->rc.range = range;
2449
671k
        }
2450
        
2451
671k
        if (dist >= kStartPosModelIndex)
2452
501k
        {
2453
501k
          unsigned footerBits = ((posSlot >> 1) - 1);
2454
2455
501k
          if (dist < kNumFullDistances)
2456
349k
          {
2457
349k
            unsigned base = ((2 | (posSlot & 1)) << footerBits);
2458
349k
            RcTree_ReverseEncode(&p->rc, p->posEncoders + base, footerBits, (unsigned)(dist /* - base */));
2459
349k
          }
2460
151k
          else
2461
151k
          {
2462
151k
            UInt32 pos2 = (dist | 0xF) << (32 - footerBits);
2463
151k
            range = p->rc.range;
2464
            // RangeEnc_EncodeDirectBits(&p->rc, posReduced >> kNumAlignBits, footerBits - kNumAlignBits);
2465
            /*
2466
            do
2467
            {
2468
              range >>= 1;
2469
              p->rc.low += range & (0 - ((dist >> --footerBits) & 1));
2470
              RC_NORM(&p->rc)
2471
            }
2472
            while (footerBits > kNumAlignBits);
2473
            */
2474
151k
            do
2475
700k
            {
2476
700k
              range >>= 1;
2477
700k
              p->rc.low += range & (0 - (pos2 >> 31));
2478
700k
              pos2 += pos2;
2479
700k
              RC_NORM(&p->rc)
2480
700k
            }
2481
700k
            while (pos2 != 0xF0000000);
2482
2483
2484
            // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, posReduced & kAlignMask);
2485
2486
151k
            {
2487
151k
              unsigned m = 1;
2488
151k
              unsigned bit;
2489
151k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2490
151k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2491
151k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2492
151k
              bit = dist & 1;             RC_BIT(&p->rc, p->posAlignEncoder + m, bit);
2493
151k
              p->rc.range = range;
2494
              // p->alignPriceCount++;
2495
151k
            }
2496
151k
          }
2497
501k
        }
2498
671k
      }
2499
1.41M
    }
2500
2501
3.74M
    nowPos32 += (UInt32)len;
2502
3.74M
    p->additionalOffset -= len;
2503
    
2504
3.74M
    if (p->additionalOffset == 0)
2505
2.40M
    {
2506
2.40M
      UInt32 processed;
2507
2508
2.40M
      if (!p->fastMode)
2509
913k
      {
2510
        /*
2511
        if (p->alignPriceCount >= 16) // kAlignTableSize
2512
          FillAlignPrices(p);
2513
        if (p->matchPriceCount >= 128)
2514
          FillDistancesPrices(p);
2515
        if (p->lenEnc.counter <= 0)
2516
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2517
        */
2518
913k
        if (p->matchPriceCount >= 64)
2519
6.13k
        {
2520
6.13k
          FillAlignPrices(p);
2521
          // { int y; for (y = 0; y < 100; y++) {
2522
6.13k
          FillDistancesPrices(p);
2523
          // }}
2524
6.13k
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2525
6.13k
        }
2526
913k
        if (p->repLenEncCounter <= 0)
2527
3.49k
        {
2528
3.49k
          p->repLenEncCounter = REP_LEN_COUNT;
2529
3.49k
          LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
2530
3.49k
        }
2531
913k
      }
2532
    
2533
2.40M
      if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2534
7.19k
        break;
2535
2.40M
      processed = nowPos32 - startPos32;
2536
      
2537
2.40M
      if (maxPackSize)
2538
0
      {
2539
0
        if (processed + kNumOpts + 300 >= maxUnpackSize
2540
0
            || RangeEnc_GetProcessed_sizet(&p->rc) + kPackReserve >= maxPackSize)
2541
0
          break;
2542
0
      }
2543
2.40M
      else if (processed >= (1 << 17))
2544
0
      {
2545
0
        p->nowPos64 += nowPos32 - startPos32;
2546
0
        return CheckErrors(p);
2547
0
      }
2548
2.40M
    }
2549
3.74M
  }
2550
2551
7.27k
  p->nowPos64 += nowPos32 - startPos32;
2552
7.27k
  return Flush(p, nowPos32);
2553
7.27k
}
2554
2555
2556
2557
7.27k
#define kBigHashDicLimit ((UInt32)1 << 24)
2558
2559
static SRes LzmaEnc_Alloc(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2560
7.27k
{
2561
7.27k
  UInt32 beforeSize = kNumOpts;
2562
7.27k
  if (!RangeEnc_Alloc(&p->rc, alloc))
2563
0
    return SZ_ERROR_MEM;
2564
2565
  #ifndef _7ZIP_ST
2566
  p->mtMode = (p->multiThread && !p->fastMode && (p->matchFinderBase.btMode != 0));
2567
  #endif
2568
2569
7.27k
  {
2570
7.27k
    unsigned lclp = p->lc + p->lp;
2571
7.27k
    if (!p->litProbs || !p->saveState.litProbs || p->lclp != lclp)
2572
7.27k
    {
2573
7.27k
      LzmaEnc_FreeLits(p, alloc);
2574
7.27k
      p->litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, ((UInt32)0x300 << lclp) * sizeof(CLzmaProb));
2575
7.27k
      p->saveState.litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, ((UInt32)0x300 << lclp) * sizeof(CLzmaProb));
2576
7.27k
      if (!p->litProbs || !p->saveState.litProbs)
2577
0
      {
2578
0
        LzmaEnc_FreeLits(p, alloc);
2579
0
        return SZ_ERROR_MEM;
2580
0
      }
2581
7.27k
      p->lclp = lclp;
2582
7.27k
    }
2583
7.27k
  }
2584
2585
7.27k
  p->matchFinderBase.bigHash = (Byte)(p->dictSize > kBigHashDicLimit ? 1 : 0);
2586
2587
7.27k
  if (beforeSize + p->dictSize < keepWindowSize)
2588
0
    beforeSize = keepWindowSize - p->dictSize;
2589
2590
  #ifndef _7ZIP_ST
2591
  if (p->mtMode)
2592
  {
2593
    RINOK(MatchFinderMt_Create(&p->matchFinderMt, p->dictSize, beforeSize, p->numFastBytes,
2594
        LZMA_MATCH_LEN_MAX
2595
        + 1  /* 18.04 */
2596
        , allocBig));
2597
    p->matchFinderObj = &p->matchFinderMt;
2598
    p->matchFinderBase.bigHash = (Byte)(
2599
        (p->dictSize > kBigHashDicLimit && p->matchFinderBase.hashMask >= 0xFFFFFF) ? 1 : 0);
2600
    MatchFinderMt_CreateVTable(&p->matchFinderMt, &p->matchFinder);
2601
  }
2602
  else
2603
  #endif
2604
7.27k
  {
2605
7.27k
    if (!MatchFinder_Create(&p->matchFinderBase, p->dictSize, beforeSize, p->numFastBytes, LZMA_MATCH_LEN_MAX, allocBig))
2606
0
      return SZ_ERROR_MEM;
2607
7.27k
    p->matchFinderObj = &p->matchFinderBase;
2608
7.27k
    MatchFinder_CreateVTable(&p->matchFinderBase, &p->matchFinder);
2609
7.27k
  }
2610
  
2611
7.27k
  return SZ_OK;
2612
7.27k
}
2613
2614
void LzmaEnc_Init(CLzmaEnc *p)
2615
7.27k
{
2616
7.27k
  unsigned i;
2617
7.27k
  p->state = 0;
2618
7.27k
  p->reps[0] =
2619
7.27k
  p->reps[1] =
2620
7.27k
  p->reps[2] =
2621
7.27k
  p->reps[3] = 1;
2622
2623
7.27k
  RangeEnc_Init(&p->rc);
2624
2625
123k
  for (i = 0; i < (1 << kNumAlignBits); i++)
2626
116k
    p->posAlignEncoder[i] = kProbInitValue;
2627
2628
94.6k
  for (i = 0; i < kNumStates; i++)
2629
87.3k
  {
2630
87.3k
    unsigned j;
2631
1.48M
    for (j = 0; j < LZMA_NUM_PB_STATES_MAX; j++)
2632
1.39M
    {
2633
1.39M
      p->isMatch[i][j] = kProbInitValue;
2634
1.39M
      p->isRep0Long[i][j] = kProbInitValue;
2635
1.39M
    }
2636
87.3k
    p->isRep[i] = kProbInitValue;
2637
87.3k
    p->isRepG0[i] = kProbInitValue;
2638
87.3k
    p->isRepG1[i] = kProbInitValue;
2639
87.3k
    p->isRepG2[i] = kProbInitValue;
2640
87.3k
  }
2641
2642
7.27k
  {
2643
36.3k
    for (i = 0; i < kNumLenToPosStates; i++)
2644
29.1k
    {
2645
29.1k
      CLzmaProb *probs = p->posSlotEncoder[i];
2646
29.1k
      unsigned j;
2647
1.89M
      for (j = 0; j < (1 << kNumPosSlotBits); j++)
2648
1.86M
        probs[j] = kProbInitValue;
2649
29.1k
    }
2650
7.27k
  }
2651
7.27k
  {
2652
938k
    for (i = 0; i < kNumFullDistances; i++)
2653
931k
      p->posEncoders[i] = kProbInitValue;
2654
7.27k
  }
2655
2656
7.27k
  {
2657
7.27k
    UInt32 num = (UInt32)0x300 << (p->lp + p->lc);
2658
7.27k
    UInt32 k;
2659
7.27k
    CLzmaProb *probs = p->litProbs;
2660
9.24G
    for (k = 0; k < num; k++)
2661
9.24G
      probs[k] = kProbInitValue;
2662
7.27k
  }
2663
2664
2665
7.27k
  LenEnc_Init(&p->lenProbs);
2666
7.27k
  LenEnc_Init(&p->repLenProbs);
2667
2668
7.27k
  p->optEnd = 0;
2669
7.27k
  p->optCur = 0;
2670
2671
7.27k
  {
2672
14.9M
    for (i = 0; i < kNumOpts; i++)
2673
14.9M
      p->opt[i].price = kInfinityPrice;
2674
7.27k
  }
2675
2676
7.27k
  p->additionalOffset = 0;
2677
2678
7.27k
  p->pbMask = (1 << p->pb) - 1;
2679
7.27k
  p->lpMask = ((UInt32)0x100 << p->lp) - ((unsigned)0x100 >> p->lc);
2680
7.27k
}
2681
2682
2683
void LzmaEnc_InitPrices(CLzmaEnc *p)
2684
7.27k
{
2685
7.27k
  if (!p->fastMode)
2686
4.91k
  {
2687
4.91k
    FillDistancesPrices(p);
2688
4.91k
    FillAlignPrices(p);
2689
4.91k
  }
2690
2691
7.27k
  p->lenEnc.tableSize =
2692
7.27k
  p->repLenEnc.tableSize =
2693
7.27k
      p->numFastBytes + 1 - LZMA_MATCH_LEN_MIN;
2694
2695
7.27k
  p->repLenEncCounter = REP_LEN_COUNT;
2696
2697
7.27k
  LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2698
7.27k
  LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
2699
7.27k
}
2700
2701
static SRes LzmaEnc_AllocAndInit(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2702
7.27k
{
2703
7.27k
  unsigned i;
2704
131k
  for (i = kEndPosModelIndex / 2; i < kDicLogSizeMax; i++)
2705
131k
    if (p->dictSize <= ((UInt32)1 << i))
2706
7.27k
      break;
2707
7.27k
  p->distTableSize = i * 2;
2708
2709
7.27k
  p->finished = False;
2710
7.27k
  p->result = SZ_OK;
2711
7.27k
  RINOK(LzmaEnc_Alloc(p, keepWindowSize, alloc, allocBig));
2712
7.27k
  LzmaEnc_Init(p);
2713
7.27k
  LzmaEnc_InitPrices(p);
2714
7.27k
  p->nowPos64 = 0;
2715
7.27k
  return SZ_OK;
2716
7.27k
}
2717
2718
static SRes LzmaEnc_Prepare(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream,
2719
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2720
7.27k
{
2721
7.27k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2722
7.27k
  p->matchFinderBase.stream = inStream;
2723
7.27k
  p->needInit = 1;
2724
7.27k
  p->rc.outStream = outStream;
2725
7.27k
  return LzmaEnc_AllocAndInit(p, 0, alloc, allocBig);
2726
7.27k
}
2727
2728
SRes LzmaEnc_PrepareForLzma2(CLzmaEncHandle pp,
2729
    ISeqInStream *inStream, UInt32 keepWindowSize,
2730
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2731
0
{
2732
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2733
0
  p->matchFinderBase.stream = inStream;
2734
0
  p->needInit = 1;
2735
0
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2736
0
}
2737
2738
static void LzmaEnc_SetInputBuf(CLzmaEnc *p, const Byte *src, SizeT srcLen)
2739
0
{
2740
0
  p->matchFinderBase.directInput = 1;
2741
0
  p->matchFinderBase.bufferBase = (Byte *)src;
2742
0
  p->matchFinderBase.directInputRem = srcLen;
2743
0
}
2744
2745
SRes LzmaEnc_MemPrepare(CLzmaEncHandle pp, const Byte *src, SizeT srcLen,
2746
    UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2747
0
{
2748
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2749
0
  LzmaEnc_SetInputBuf(p, src, srcLen);
2750
0
  p->needInit = 1;
2751
2752
0
  LzmaEnc_SetDataSize(pp, srcLen);
2753
0
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2754
0
}
2755
2756
void LzmaEnc_Finish(CLzmaEncHandle pp)
2757
7.27k
{
2758
  #ifndef _7ZIP_ST
2759
  CLzmaEnc *p = (CLzmaEnc *)pp;
2760
  if (p->mtMode)
2761
    MatchFinderMt_ReleaseStream(&p->matchFinderMt);
2762
  #else
2763
7.27k
  UNUSED_VAR(pp);
2764
7.27k
  #endif
2765
7.27k
}
2766
2767
2768
typedef struct
2769
{
2770
  ISeqOutStream vt;
2771
  Byte *data;
2772
  SizeT rem;
2773
  BoolInt overflow;
2774
} CLzmaEnc_SeqOutStreamBuf;
2775
2776
static size_t SeqOutStreamBuf_Write(const ISeqOutStream *pp, const void *data, size_t size)
2777
0
{
2778
0
  CLzmaEnc_SeqOutStreamBuf *p = CONTAINER_FROM_VTBL(pp, CLzmaEnc_SeqOutStreamBuf, vt);
2779
0
  if (p->rem < size)
2780
0
  {
2781
0
    size = p->rem;
2782
0
    p->overflow = True;
2783
0
  }
2784
0
  memcpy(p->data, data, size);
2785
0
  p->rem -= size;
2786
0
  p->data += size;
2787
0
  return size;
2788
0
}
2789
2790
2791
UInt32 LzmaEnc_GetNumAvailableBytes(CLzmaEncHandle pp)
2792
0
{
2793
0
  const CLzmaEnc *p = (CLzmaEnc *)pp;
2794
0
  return p->matchFinder.GetNumAvailableBytes(p->matchFinderObj);
2795
0
}
2796
2797
2798
const Byte *LzmaEnc_GetCurBuf(CLzmaEncHandle pp)
2799
0
{
2800
0
  const CLzmaEnc *p = (CLzmaEnc *)pp;
2801
0
  return p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset;
2802
0
}
2803
2804
2805
SRes LzmaEnc_CodeOneMemBlock(CLzmaEncHandle pp, BoolInt reInit,
2806
    Byte *dest, size_t *destLen, UInt32 desiredPackSize, UInt32 *unpackSize)
2807
0
{
2808
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2809
0
  UInt64 nowPos64;
2810
0
  SRes res;
2811
0
  CLzmaEnc_SeqOutStreamBuf outStream;
2812
2813
0
  outStream.vt.Write = SeqOutStreamBuf_Write;
2814
0
  outStream.data = dest;
2815
0
  outStream.rem = *destLen;
2816
0
  outStream.overflow = False;
2817
2818
0
  p->writeEndMark = False;
2819
0
  p->finished = False;
2820
0
  p->result = SZ_OK;
2821
2822
0
  if (reInit)
2823
0
    LzmaEnc_Init(p);
2824
0
  LzmaEnc_InitPrices(p);
2825
2826
0
  nowPos64 = p->nowPos64;
2827
0
  RangeEnc_Init(&p->rc);
2828
0
  p->rc.outStream = &outStream.vt;
2829
2830
0
  if (desiredPackSize == 0)
2831
0
    return SZ_ERROR_OUTPUT_EOF;
2832
2833
0
  res = LzmaEnc_CodeOneBlock(p, desiredPackSize, *unpackSize);
2834
  
2835
0
  *unpackSize = (UInt32)(p->nowPos64 - nowPos64);
2836
0
  *destLen -= outStream.rem;
2837
0
  if (outStream.overflow)
2838
0
    return SZ_ERROR_OUTPUT_EOF;
2839
2840
0
  return res;
2841
0
}
2842
2843
2844
static SRes LzmaEnc_Encode2(CLzmaEnc *p, ICompressProgress *progress)
2845
7.27k
{
2846
7.27k
  SRes res = SZ_OK;
2847
2848
  #ifndef _7ZIP_ST
2849
  Byte allocaDummy[0x300];
2850
  allocaDummy[0] = 0;
2851
  allocaDummy[1] = allocaDummy[0];
2852
  #endif
2853
2854
7.27k
  for (;;)
2855
7.27k
  {
2856
7.27k
    res = LzmaEnc_CodeOneBlock(p, 0, 0);
2857
7.27k
    if (res != SZ_OK || p->finished)
2858
7.27k
      break;
2859
0
    if (progress)
2860
0
    {
2861
0
      res = ICompressProgress_Progress(progress, p->nowPos64, RangeEnc_GetProcessed(&p->rc));
2862
0
      if (res != SZ_OK)
2863
0
      {
2864
0
        res = SZ_ERROR_PROGRESS;
2865
0
        break;
2866
0
      }
2867
0
    }
2868
0
  }
2869
  
2870
7.27k
  LzmaEnc_Finish(p);
2871
2872
  /*
2873
  if (res == SZ_OK && !Inline_MatchFinder_IsFinishedOK(&p->matchFinderBase))
2874
    res = SZ_ERROR_FAIL;
2875
  }
2876
  */
2877
2878
7.27k
  return res;
2879
7.27k
}
2880
2881
2882
SRes LzmaEnc_Encode(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream, ICompressProgress *progress,
2883
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2884
7.27k
{
2885
7.27k
  RINOK(LzmaEnc_Prepare(pp, outStream, inStream, alloc, allocBig));
2886
7.27k
  return LzmaEnc_Encode2((CLzmaEnc *)pp, progress);
2887
7.27k
}
2888
2889
2890
SRes LzmaEnc_WriteProperties(CLzmaEncHandle pp, Byte *props, SizeT *size)
2891
7.27k
{
2892
7.27k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2893
7.27k
  unsigned i;
2894
7.27k
  UInt32 dictSize = p->dictSize;
2895
7.27k
  if (*size < LZMA_PROPS_SIZE)
2896
0
    return SZ_ERROR_PARAM;
2897
7.27k
  *size = LZMA_PROPS_SIZE;
2898
7.27k
  props[0] = (Byte)((p->pb * 5 + p->lp) * 9 + p->lc);
2899
2900
7.27k
  if (dictSize >= ((UInt32)1 << 22))
2901
7.27k
  {
2902
7.27k
    UInt32 kDictMask = ((UInt32)1 << 20) - 1;
2903
7.27k
    if (dictSize < (UInt32)0xFFFFFFFF - kDictMask)
2904
7.27k
      dictSize = (dictSize + kDictMask) & ~kDictMask;
2905
7.27k
  }
2906
0
  else for (i = 11; i <= 30; i++)
2907
0
  {
2908
0
    if (dictSize <= ((UInt32)2 << i)) { dictSize = (2 << i); break; }
2909
0
    if (dictSize <= ((UInt32)3 << i)) { dictSize = (3 << i); break; }
2910
0
  }
2911
2912
36.3k
  for (i = 0; i < 4; i++)
2913
29.1k
    props[1 + i] = (Byte)(dictSize >> (8 * i));
2914
7.27k
  return SZ_OK;
2915
7.27k
}
2916
2917
2918
unsigned LzmaEnc_IsWriteEndMark(CLzmaEncHandle pp)
2919
0
{
2920
0
  return ((CLzmaEnc *)pp)->writeEndMark;
2921
0
}
2922
2923
2924
SRes LzmaEnc_MemEncode(CLzmaEncHandle pp, Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
2925
    int writeEndMark, ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2926
0
{
2927
0
  SRes res;
2928
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2929
2930
0
  CLzmaEnc_SeqOutStreamBuf outStream;
2931
2932
0
  outStream.vt.Write = SeqOutStreamBuf_Write;
2933
0
  outStream.data = dest;
2934
0
  outStream.rem = *destLen;
2935
0
  outStream.overflow = False;
2936
2937
0
  p->writeEndMark = writeEndMark;
2938
0
  p->rc.outStream = &outStream.vt;
2939
2940
0
  res = LzmaEnc_MemPrepare(pp, src, srcLen, 0, alloc, allocBig);
2941
  
2942
0
  if (res == SZ_OK)
2943
0
  {
2944
0
    res = LzmaEnc_Encode2(p, progress);
2945
0
    if (res == SZ_OK && p->nowPos64 != srcLen)
2946
0
      res = SZ_ERROR_FAIL;
2947
0
  }
2948
2949
0
  *destLen -= outStream.rem;
2950
0
  if (outStream.overflow)
2951
0
    return SZ_ERROR_OUTPUT_EOF;
2952
0
  return res;
2953
0
}
2954
2955
2956
SRes LzmaEncode(Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
2957
    const CLzmaEncProps *props, Byte *propsEncoded, SizeT *propsSize, int writeEndMark,
2958
    ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2959
0
{
2960
0
  CLzmaEnc *p = (CLzmaEnc *)LzmaEnc_Create(alloc);
2961
0
  SRes res;
2962
0
  if (!p)
2963
0
    return SZ_ERROR_MEM;
2964
2965
0
  res = LzmaEnc_SetProps(p, props);
2966
0
  if (res == SZ_OK)
2967
0
  {
2968
0
    res = LzmaEnc_WriteProperties(p, propsEncoded, propsSize);
2969
0
    if (res == SZ_OK)
2970
0
      res = LzmaEnc_MemEncode(p, dest, destLen, src, srcLen,
2971
0
          writeEndMark, progress, alloc, allocBig);
2972
0
  }
2973
2974
0
  LzmaEnc_Destroy(p, alloc, allocBig);
2975
0
  return res;
2976
0
}