Coverage Report

Created: 2023-03-26 06:59

/src/lzma-fuzz/sdk/C/LzmaEnc.c
Line
Count
Source (jump to first uncovered line)
1
/* LzmaEnc.c -- LZMA Encoder
2
2019-01-10: Igor Pavlov : Public domain */
3
4
#include "Precomp.h"
5
6
#include <string.h>
7
8
/* #define SHOW_STAT */
9
/* #define SHOW_STAT2 */
10
11
#if defined(SHOW_STAT) || defined(SHOW_STAT2)
12
#include <stdio.h>
13
#endif
14
15
#include "LzmaEnc.h"
16
17
#include "LzFind.h"
18
#ifndef _7ZIP_ST
19
#include "LzFindMt.h"
20
#endif
21
22
#ifdef SHOW_STAT
23
static unsigned g_STAT_OFFSET = 0;
24
#endif
25
26
16.2k
#define kLzmaMaxHistorySize ((UInt32)3 << 29)
27
/* #define kLzmaMaxHistorySize ((UInt32)7 << 29) */
28
29
74.8M
#define kNumTopBits 24
30
74.8M
#define kTopValue ((UInt32)1 << kNumTopBits)
31
32
413M
#define kNumBitModelTotalBits 11
33
338M
#define kBitModelTotal (1 << kNumBitModelTotalBits)
34
197M
#define kNumMoveBits 5
35
147M
#define kProbInitValue (kBitModelTotal >> 1)
36
37
150M
#define kNumMoveReducingBits 4
38
2.91M
#define kNumBitPriceShiftBits 4
39
#define kBitPrice (1 << kNumBitPriceShiftBits)
40
41
27.8k
#define REP_LEN_COUNT 64
42
43
/* Resets *p to the encoder defaults: level 5, reduceSize of all ones,
   no end marker, and "auto" placeholders (0 for dictSize / mc, -1 for every
   other tunable). LzmaEncProps_Normalize() replaces the placeholders with
   concrete values. */
void LzmaEncProps_Init(CLzmaEncProps *p)
{
  p->level = 5;

  /* 0 == "pick automatically" (see the == 0 tests in LzmaEncProps_Normalize). */
  p->mc = 0;
  p->dictSize = 0;

  p->reduceSize = (UInt64)(Int64)-1;

  /* -1 == "pick automatically" (see the < 0 tests in LzmaEncProps_Normalize). */
  p->numThreads = -1;
  p->numHashBytes = -1;
  p->btMode = -1;
  p->fb = -1;
  p->algo = -1;
  p->pb = -1;
  p->lp = -1;
  p->lc = -1;

  p->writeEndMark = 0;
}
51
52
/* Replaces every "auto" placeholder in *p (negative fields, zero dictSize / mc)
   with a concrete value derived from the compression level. A negative level
   is treated as level 5. When dictSize is larger than reduceSize it is lowered
   to the first value of the form 2 << i or 3 << i (i = 11..30) that is
   >= reduceSize. */
void LzmaEncProps_Normalize(CLzmaEncProps *p)
{
  int level = p->level;

  if (level < 0)
    level = 5;
  p->level = level;

  if (p->dictSize == 0)
  {
    if (level <= 5)
      p->dictSize = (1 << (level * 2 + 14));
    else if (level <= 7)
      p->dictSize = (1 << 25);
    else
      p->dictSize = (1 << 26);
  }

  if (p->dictSize > p->reduceSize)
  {
    const UInt32 wanted = (UInt32)p->reduceSize;
    unsigned shift;
    for (shift = 11; shift <= 30; shift++)
    {
      const UInt32 size2 = (UInt32)2 << shift;
      const UInt32 size3 = (UInt32)3 << shift;
      if (wanted <= size2)
      {
        p->dictSize = size2;
        break;
      }
      if (wanted <= size3)
      {
        p->dictSize = size3;
        break;
      }
    }
  }

  if (p->lc < 0)
    p->lc = 3;
  if (p->lp < 0)
    p->lp = 0;
  if (p->pb < 0)
    p->pb = 2;

  if (p->algo < 0)
    p->algo = (level < 5) ? 0 : 1;
  if (p->fb < 0)
    p->fb = (level < 7) ? 32 : 64;
  if (p->btMode < 0)
    p->btMode = (p->algo == 0) ? 0 : 1;
  if (p->numHashBytes < 0)
    p->numHashBytes = 4;
  if (p->mc == 0)
    p->mc = (16 + (p->fb >> 1)) >> (p->btMode ? 0 : 1);

  if (p->numThreads < 0)
  {
    #ifndef _7ZIP_ST
    p->numThreads = (p->btMode && p->algo) ? 2 : 1;
    #else
    p->numThreads = 1;
    #endif
  }
}
88
89
UInt32 LzmaEncProps_GetDictSize(const CLzmaEncProps *props2)
90
8.13k
{
91
8.13k
  CLzmaEncProps props = *props2;
92
8.13k
  LzmaEncProps_Normalize(&props);
93
8.13k
  return props.dictSize;
94
8.13k
}
95
96
#if (_MSC_VER >= 1400)
97
/* BSR code is fast for some new CPUs */
98
/* #define LZMA_LOG_BSR */
99
#endif
100
101
#ifdef LZMA_LOG_BSR
102
103
#define kDicLogSizeMaxCompress 32
104
105
#define BSR2_RET(pos, res) { unsigned long zz; _BitScanReverse(&zz, (pos)); res = (zz + zz) + ((pos >> (zz - 1)) & 1); }
106
107
/* Function form of BSR2_RET: evaluates the macro for pos and returns its result.
   Only compiled when LZMA_LOG_BSR is defined.
   NOTE(review): BSR2_RET shifts by (zz - 1), so this presumably expects
   pos >= 2 - confirm against callers. */
static unsigned GetPosSlot1(UInt32 pos)
{
  unsigned slot;

  BSR2_RET(pos, slot);
  return slot;
}
113
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
114
#define GetPosSlot(pos, res) { if (pos < 2) res = pos; else BSR2_RET(pos, res); }
115
116
#else
117
118
4.65M
#define kNumLogBits (9 + sizeof(size_t) / 2)
119
/* #define kNumLogBits (11 + sizeof(size_t) / 8 * 3) */
120
121
16.2k
#define kDicLogSizeMaxCompress ((kNumLogBits - 1) * 2 + 7)
122
123
/* Fills the g_FastPos lookup table.
   Entries 0 and 1 hold 0 and 1. After that, every slot value in
   [2, kNumLogBits * 2) is written 2^((slot >> 1) - 1) times in a row. */
static void LzmaEnc_FastPosInit(Byte *g_FastPos)
{
  Byte *cur = g_FastPos;
  unsigned slot;

  *cur++ = 0;
  *cur++ = 1;

  for (slot = 2; slot < kNumLogBits * 2; slot++)
  {
    const size_t runLen = ((size_t)1 << ((slot >> 1) - 1));
    Byte *runEnd = cur + runLen;

    while (cur != runEnd)
      *cur++ = (Byte)slot;
  }
}
139
140
/* we can use ((limit - pos) >> 31) only if (pos < ((UInt32)1 << 31)) */
141
/*
142
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
143
  (0 - (((((UInt32)1 << (kNumLogBits + 6)) - 1) - pos) >> 31))); \
144
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
145
*/
146
147
/*
148
#define BSR2_RET(pos, res) { unsigned zz = 6 + ((kNumLogBits - 1) & \
149
  (0 - (((((UInt32)1 << (kNumLogBits)) - 1) - (pos >> 6)) >> 31))); \
150
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
151
*/
152
153
4.43M
#define BSR2_RET(pos, res) { unsigned zz = (pos < (1 << (kNumLogBits + 6))) ? 6 : 6 + kNumLogBits - 1; \
154
4.43M
  res = p->g_FastPos[pos >> zz] + (zz * 2); }
155
156
/*
157
#define BSR2_RET(pos, res) { res = (pos < (1 << (kNumLogBits + 6))) ? \
158
  p->g_FastPos[pos >> 6] + 12 : \
159
  p->g_FastPos[pos >> (6 + kNumLogBits - 1)] + (6 + (kNumLogBits - 1)) * 2; }
160
*/
161
162
8.07M
#define GetPosSlot1(pos) p->g_FastPos[pos]
163
4.25M
#define GetPosSlot2(pos, res) { BSR2_RET(pos, res); }
164
911k
#define GetPosSlot(pos, res) { if (pos < kNumFullDistances) res = p->g_FastPos[pos & (kNumFullDistances - 1)]; else BSR2_RET(pos, res); }
165
166
#endif
167
168
169
72.8M
#define LZMA_NUM_REPS 4
170
171
typedef UInt16 CState;
172
typedef UInt16 CExtra;
173
174
typedef struct
175
{
176
  UInt32 price;
177
  CState state;
178
  CExtra extra;
179
      // 0   : normal
180
      // 1   : LIT : MATCH
181
      // > 1 : MATCH (extra-1) : LIT : REP0 (len)
182
  UInt32 len;
183
  UInt32 dist;
184
  UInt32 reps[LZMA_NUM_REPS];
185
} COptimal;
186
187
188
// 18.06
189
58.9M
#define kNumOpts (1 << 11)
190
5.92M
#define kPackReserve (kNumOpts * 8)
191
// #define kNumOpts (1 << 12)
192
// #define kPackReserve (1 + kNumOpts * 2)
193
194
28.5M
#define kNumLenToPosStates 4
195
27.0M
#define kNumPosSlotBits 6
196
#define kDicLogSizeMin 0
197
146k
#define kDicLogSizeMax 32
198
#define kDistTableSizeMax (kDicLogSizeMax * 2)
199
200
5.78M
#define kNumAlignBits 4
201
5.37M
#define kAlignTableSize (1 << kNumAlignBits)
202
5.13M
#define kAlignMask (kAlignTableSize - 1)
203
204
937k
#define kStartPosModelIndex 4
205
40.1M
#define kEndPosModelIndex 14
206
40.8M
#define kNumFullDistances (1 << (kEndPosModelIndex >> 1))
207
208
typedef
209
#ifdef _LZMA_PROB32
210
  UInt32
211
#else
212
  UInt16
213
#endif
214
  CLzmaProb;
215
216
13.1M
#define LZMA_PB_MAX 4
217
32.5k
#define LZMA_LC_MAX 8
218
32.5k
#define LZMA_LP_MAX 4
219
220
13.1M
#define LZMA_NUM_PB_STATES_MAX (1 << LZMA_PB_MAX)
221
222
27.1M
#define kLenNumLowBits 3
223
15.9M
#define kLenNumLowSymbols (1 << kLenNumLowBits)
224
26.3M
#define kLenNumHighBits 8
225
21.6M
#define kLenNumHighSymbols (1 << kLenNumHighBits)
226
12.2M
#define kLenNumSymbolsTotal (kLenNumLowSymbols * 2 + kLenNumHighSymbols)
227
228
110M
#define LZMA_MATCH_LEN_MIN 2
229
12.2M
#define LZMA_MATCH_LEN_MAX (LZMA_MATCH_LEN_MIN + kLenNumSymbolsTotal - 1)
230
231
237k
#define kNumStates 12
232
233
234
typedef struct
235
{
236
  CLzmaProb low[LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1)];
237
  CLzmaProb high[kLenNumHighSymbols];
238
} CLenEnc;
239
240
241
typedef struct
242
{
243
  unsigned tableSize;
244
  UInt32 prices[LZMA_NUM_PB_STATES_MAX][kLenNumSymbolsTotal];
245
  // UInt32 prices1[LZMA_NUM_PB_STATES_MAX][kLenNumLowSymbols * 2];
246
  // UInt32 prices2[kLenNumSymbolsTotal];
247
} CLenPriceEnc;
248
249
#define GET_PRICE_LEN(p, posState, len) \
250
96.7M
    ((p)->prices[posState][(size_t)(len) - LZMA_MATCH_LEN_MIN])
251
252
/*
253
#define GET_PRICE_LEN(p, posState, len) \
254
    ((p)->prices2[(size_t)(len) - 2] + ((p)->prices1[posState][((len) - 2) & (kLenNumLowSymbols * 2 - 1)] & (((len) - 2 - kLenNumLowSymbols * 2) >> 9)))
255
*/
256
257
typedef struct
258
{
259
  UInt32 range;
260
  unsigned cache;
261
  UInt64 low;
262
  UInt64 cacheSize;
263
  Byte *buf;
264
  Byte *bufLim;
265
  Byte *bufBase;
266
  ISeqOutStream *outStream;
267
  UInt64 processed;
268
  SRes res;
269
} CRangeEnc;
270
271
272
typedef struct
273
{
274
  CLzmaProb *litProbs;
275
276
  unsigned state;
277
  UInt32 reps[LZMA_NUM_REPS];
278
279
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
280
  CLzmaProb isRep[kNumStates];
281
  CLzmaProb isRepG0[kNumStates];
282
  CLzmaProb isRepG1[kNumStates];
283
  CLzmaProb isRepG2[kNumStates];
284
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
285
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
286
287
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
288
  CLzmaProb posEncoders[kNumFullDistances];
289
  
290
  CLenEnc lenProbs;
291
  CLenEnc repLenProbs;
292
293
} CSaveState;
294
295
296
typedef UInt32 CProbPrice;
297
298
299
typedef struct
300
{
301
  void *matchFinderObj;
302
  IMatchFinder matchFinder;
303
304
  unsigned optCur;
305
  unsigned optEnd;
306
307
  unsigned longestMatchLen;
308
  unsigned numPairs;
309
  UInt32 numAvail;
310
311
  unsigned state;
312
  unsigned numFastBytes;
313
  unsigned additionalOffset;
314
  UInt32 reps[LZMA_NUM_REPS];
315
  unsigned lpMask, pbMask;
316
  CLzmaProb *litProbs;
317
  CRangeEnc rc;
318
319
  UInt32 backRes;
320
321
  unsigned lc, lp, pb;
322
  unsigned lclp;
323
324
  BoolInt fastMode;
325
  BoolInt writeEndMark;
326
  BoolInt finished;
327
  BoolInt multiThread;
328
  BoolInt needInit;
329
  // BoolInt _maxMode;
330
331
  UInt64 nowPos64;
332
  
333
  unsigned matchPriceCount;
334
  // unsigned alignPriceCount;
335
  int repLenEncCounter;
336
337
  unsigned distTableSize;
338
339
  UInt32 dictSize;
340
  SRes result;
341
342
  #ifndef _7ZIP_ST
343
  BoolInt mtMode;
344
  // begin of CMatchFinderMt is used in LZ thread
345
  CMatchFinderMt matchFinderMt;
346
  // end of CMatchFinderMt is used in BT and HASH threads
347
  #endif
348
349
  CMatchFinder matchFinderBase;
350
351
  #ifndef _7ZIP_ST
352
  Byte pad[128];
353
  #endif
354
  
355
  // LZ thread
356
  CProbPrice ProbPrices[kBitModelTotal >> kNumMoveReducingBits];
357
358
  UInt32 matches[LZMA_MATCH_LEN_MAX * 2 + 2 + 1];
359
360
  UInt32 alignPrices[kAlignTableSize];
361
  UInt32 posSlotPrices[kNumLenToPosStates][kDistTableSizeMax];
362
  UInt32 distancesPrices[kNumLenToPosStates][kNumFullDistances];
363
364
  CLzmaProb posAlignEncoder[1 << kNumAlignBits];
365
  CLzmaProb isRep[kNumStates];
366
  CLzmaProb isRepG0[kNumStates];
367
  CLzmaProb isRepG1[kNumStates];
368
  CLzmaProb isRepG2[kNumStates];
369
  CLzmaProb isMatch[kNumStates][LZMA_NUM_PB_STATES_MAX];
370
  CLzmaProb isRep0Long[kNumStates][LZMA_NUM_PB_STATES_MAX];
371
  CLzmaProb posSlotEncoder[kNumLenToPosStates][1 << kNumPosSlotBits];
372
  CLzmaProb posEncoders[kNumFullDistances];
373
  
374
  CLenEnc lenProbs;
375
  CLenEnc repLenProbs;
376
377
  #ifndef LZMA_LOG_BSR
378
  Byte g_FastPos[1 << kNumLogBits];
379
  #endif
380
381
  CLenPriceEnc lenEnc;
382
  CLenPriceEnc repLenEnc;
383
384
  COptimal opt[kNumOpts];
385
386
  CSaveState saveState;
387
388
  #ifndef _7ZIP_ST
389
  Byte pad2[128];
390
  #endif
391
} CLzmaEnc;
392
393
394
395
183k
/* Copies the whole member array `arr` of *src into the same-named member of
   *dest. dest and src are pointer expressions; the size is taken from the
   source member, so `arr` must be a real array, not a pointer.
   Expands to a single expression with no trailing ';', so it can be used
   anywhere a function call can (e.g. as the body of an if/else). */
#define COPY_ARR(dest, src, arr) memcpy((dest)->arr, (src)->arr, sizeof((src)->arr))
396
397
/* Copies the adaptive coder state of the encoder (state, reps, all
   probability tables and the literal probabilities) into its embedded
   saveState snapshot. saveState.litProbs must already point to storage for
   (0x300 << lclp) probabilities; that allocation is not done here. */
void LzmaEnc_SaveState(CLzmaEncHandle pp)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  CSaveState *snap = &enc->saveState;

  snap->state = enc->state;
  COPY_ARR(snap, enc, reps);

  snap->lenProbs = enc->lenProbs;
  snap->repLenProbs = enc->repLenProbs;

  COPY_ARR(snap, enc, posAlignEncoder);
  COPY_ARR(snap, enc, isRep);
  COPY_ARR(snap, enc, isRepG0);
  COPY_ARR(snap, enc, isRepG1);
  COPY_ARR(snap, enc, isRepG2);
  COPY_ARR(snap, enc, isMatch);
  COPY_ARR(snap, enc, isRep0Long);
  COPY_ARR(snap, enc, posSlotEncoder);
  COPY_ARR(snap, enc, posEncoders);

  memcpy(snap->litProbs, enc->litProbs, ((UInt32)0x300 << enc->lclp) * sizeof(CLzmaProb));
}
421
422
423
/* Inverse of LzmaEnc_SaveState(): copies state, reps, all probability tables
   and the (0x300 << lclp) literal probabilities from the embedded saveState
   snapshot back into the live encoder. */
void LzmaEnc_RestoreState(CLzmaEncHandle pp)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  const CSaveState *snap = &enc->saveState;

  enc->state = snap->state;
  COPY_ARR(enc, snap, reps);

  enc->lenProbs = snap->lenProbs;
  enc->repLenProbs = snap->repLenProbs;

  COPY_ARR(enc, snap, posAlignEncoder);
  COPY_ARR(enc, snap, isRep);
  COPY_ARR(enc, snap, isRepG0);
  COPY_ARR(enc, snap, isRepG1);
  COPY_ARR(enc, snap, isRepG2);
  COPY_ARR(enc, snap, isMatch);
  COPY_ARR(enc, snap, isRep0Long);
  COPY_ARR(enc, snap, posSlotEncoder);
  COPY_ARR(enc, snap, posEncoders);

  memcpy(enc->litProbs, snap->litProbs, ((UInt32)0x300 << enc->lclp) * sizeof(CLzmaProb));
}
447
448
449
450
/* Validates *props2 (after normalizing a private copy) and stores the
   resulting settings in the encoder.
   Returns SZ_ERROR_PARAM when lc / lp / pb exceed their maxima or dictSize
   exceeds either 2^kDicLogSizeMaxCompress or kLzmaMaxHistorySize; nothing is
   stored in that case. Returns SZ_OK otherwise. */
SRes LzmaEnc_SetProps(CLzmaEncHandle pp, const CLzmaEncProps *props2)
{
  CLzmaEnc *p = (CLzmaEnc *)pp;
  CLzmaEncProps props = *props2;
  unsigned fb;
  unsigned numHashBytes;

  LzmaEncProps_Normalize(&props);

  if (props.lc > LZMA_LC_MAX)
    return SZ_ERROR_PARAM;
  if (props.lp > LZMA_LP_MAX)
    return SZ_ERROR_PARAM;
  if (props.pb > LZMA_PB_MAX)
    return SZ_ERROR_PARAM;
  if (props.dictSize > ((UInt64)1 << kDicLogSizeMaxCompress))
    return SZ_ERROR_PARAM;
  if (props.dictSize > kLzmaMaxHistorySize)
    return SZ_ERROR_PARAM;

  p->dictSize = props.dictSize;

  /* fb is clamped to [5, LZMA_MATCH_LEN_MAX]. */
  fb = props.fb;
  if (fb < 5)
    fb = 5;
  if (fb > LZMA_MATCH_LEN_MAX)
    fb = LZMA_MATCH_LEN_MAX;
  p->numFastBytes = fb;

  p->lc = props.lc;
  p->lp = props.lp;
  p->pb = props.pb;
  p->fastMode = (props.algo == 0);
  // p->_maxMode = True;
  p->matchFinderBase.btMode = (Byte)(props.btMode ? 1 : 0);

  /* Only btMode honours a smaller hash size (2 or 3); everything else uses 4. */
  numHashBytes = 4;
  if (props.btMode)
  {
    if (props.numHashBytes < 2)
      numHashBytes = 2;
    else if (props.numHashBytes < 4)
      numHashBytes = props.numHashBytes;
  }
  p->matchFinderBase.numHashBytes = numHashBytes;

  p->matchFinderBase.cutValue = props.mc;

  p->writeEndMark = props.writeEndMark;

  #ifndef _7ZIP_ST
  p->multiThread = (props.numThreads > 1);
  #endif

  return SZ_OK;
}
507
508
509
/* Stores the expected input size in the encoder's base match finder
   (matchFinderBase.expectedDataSize). */
void LzmaEnc_SetDataSize(CLzmaEncHandle pp, UInt64 expectedDataSiize)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;

  enc->matchFinderBase.expectedDataSize = expectedDataSiize;
}
514
515
516
8.13k
#define kState_Start 0
517
948k
#define kState_LitAfterMatch 4
518
1.80M
#define kState_LitAfterRep   5
519
0
#define kState_MatchAfterLit 7
520
71.6k
#define kState_RepAfterLit   8
521
522
static const Byte kLiteralNextStates[kNumStates] = {0, 0, 0, 0, 1, 2, 3, 4,  5,  6,   4, 5};
523
static const Byte kMatchNextStates[kNumStates]   = {7, 7, 7, 7, 7, 7, 7, 10, 10, 10, 10, 10};
524
static const Byte kRepNextStates[kNumStates]     = {8, 8, 8, 8, 8, 8, 8, 11, 11, 11, 11, 11};
525
static const Byte kShortRepNextStates[kNumStates]= {9, 9, 9, 9, 9, 9, 9, 11, 11, 11, 11, 11};
526
527
12.9M
#define IsLitState(s) ((s) < 7)
528
15.4M
#define GetLenToPosState2(len) (((len) < kNumLenToPosStates - 1) ? (len) : kNumLenToPosStates - 1)
529
1.56M
#define GetLenToPosState(len) (((len) < kNumLenToPosStates + 1) ? (len) - 2 : kNumLenToPosStates - 1)
530
531
52.6M
#define kInfinityPrice (1 << 30)
532
533
/* Puts *p into the "no buffer, no stream" state. Must run before
   RangeEnc_Alloc(), which allocates only when bufBase is NULL. */
static void RangeEnc_Construct(CRangeEnc *p)
{
  p->bufBase = NULL;
  p->outStream = NULL;
}
538
539
#define RangeEnc_GetProcessed(p)       ((p)->processed + ((p)->buf - (p)->bufBase) + (p)->cacheSize)
540
5.92M
#define RangeEnc_GetProcessed_sizet(p) ((size_t)(p)->processed + ((p)->buf - (p)->bufBase) + (size_t)(p)->cacheSize)
541
542
8.13k
#define RC_BUF_SIZE (1 << 16)
543
544
/* Makes sure the RC_BUF_SIZE-byte output buffer exists.
   Returns 1 when the buffer is available (already present or freshly
   allocated through alloc), 0 when the allocation failed. */
static int RangeEnc_Alloc(CRangeEnc *p, ISzAllocPtr alloc)
{
  if (p->bufBase)
    return 1;

  p->bufBase = (Byte *)ISzAlloc_Alloc(alloc, RC_BUF_SIZE);
  if (!p->bufBase)
    return 0;

  p->bufLim = p->bufBase + RC_BUF_SIZE;
  return 1;
}
555
556
/* Releases the output buffer through alloc and clears bufBase so that a later
   RangeEnc_Alloc() allocates again. */
static void RangeEnc_Free(CRangeEnc *p, ISzAllocPtr alloc)
{
  ISzAlloc_Free(alloc, p->bufBase);
  p->bufBase = NULL;
}
561
562
/* Resets the range coder for a new stream: full range, empty low / cache,
   write position back at the start of the buffer, zero bytes processed and
   no error recorded. The buffer and outStream pointers are left untouched. */
static void RangeEnc_Init(CRangeEnc *p)
{
  /* Stream.Init(); */
  p->low = 0;
  p->range = 0xFFFFFFFF;
  p->cache = 0;
  p->cacheSize = 0;

  p->buf = p->bufBase;

  p->res = SZ_OK;
  p->processed = 0;
}
575
576
/* Hands the bytes accumulated in [bufBase, buf) to outStream and rewinds buf
   to the start of the buffer.

   A short write records SZ_ERROR_WRITE in p->res. Once p->res is not SZ_OK no
   further writes are attempted and the buffered bytes are dropped.

   The buffer is rewound (and `processed` advanced) unconditionally, including
   in the error state. RangeEnc_ShiftLow() calls this only when buf == bufLim
   and keeps storing bytes afterwards, so returning without rewinding would
   make the very next byte land past the end of the buffer. */
MY_NO_INLINE static void RangeEnc_FlushStream(CRangeEnc *p)
{
  const size_t num = (size_t)(p->buf - p->bufBase);

  if (p->res == SZ_OK)
  {
    if (num != ISeqOutStream_Write(p->outStream, p->bufBase, num))
      p->res = SZ_ERROR_WRITE;
  }

  p->processed += num;
  p->buf = p->bufBase;
}
587
588
/* Shifts the top byte out of p->low.

   If the low 32 bits are >= 0xFF000000 and no carry is set (bits 32+ of low
   are zero), the byte cannot be emitted yet and is only counted in cacheSize.
   Otherwise the cached byte plus carry is written, followed by cacheSize
   deferred bytes of value (carry + 0xFF), and the new top byte becomes the
   cache. The buffer is flushed whenever the write position reaches bufLim. */
MY_NO_INLINE static void MY_FAST_CALL RangeEnc_ShiftLow(CRangeEnc *p)
{
  const UInt32 low = (UInt32)p->low;
  unsigned high = (unsigned)(p->low >> 32);
  Byte *out;

  p->low = (UInt32)(low << 8);

  if (low >= (UInt32)0xFF000000 && high == 0)
  {
    /* Byte is still undecided: defer it. */
    p->cacheSize++;
    return;
  }

  out = p->buf;
  *out++ = (Byte)(p->cache + high);
  p->cache = (unsigned)(low >> 24);
  p->buf = out;
  if (out == p->bufLim)
    RangeEnc_FlushStream(p);

  if (p->cacheSize == 0)
    return;

  /* Resolve the deferred bytes: 0xFF without carry, 0x00 with carry. */
  high += 0xFF;
  do
  {
    out = p->buf;
    *out++ = (Byte)(high);
    p->buf = out;
    if (out == p->bufLim)
      RangeEnc_FlushStream(p);
  }
  while (--p->cacheSize != 0);
}
619
620
/* Calls RangeEnc_ShiftLow() five times to push the remaining bytes of the
   low value into the output buffer. */
static void RangeEnc_FlushData(CRangeEnc *p)
{
  unsigned remaining = 5;

  do
    RangeEnc_ShiftLow(p);
  while (--remaining != 0);
}
626
627
74.8M
#define RC_NORM(p) if (range < kTopValue) { range <<= 8; RangeEnc_ShiftLow(p); }
628
629
#define RC_BIT_PRE(p, prob) \
630
74.0M
  ttt = *(prob); \
631
74.0M
  newBound = (range >> kNumBitModelTotalBits) * ttt;
632
633
// #define _LZMA_ENC_USE_BRANCH
634
635
#ifdef _LZMA_ENC_USE_BRANCH
636
637
#define RC_BIT(p, prob, bit) { \
638
  RC_BIT_PRE(p, prob) \
639
  if (bit == 0) { range = newBound; ttt += (kBitModelTotal - ttt) >> kNumMoveBits; } \
640
  else { (p)->low += newBound; range -= newBound; ttt -= ttt >> kNumMoveBits; } \
641
  *(prob) = (CLzmaProb)ttt; \
642
  RC_NORM(p) \
643
  }
644
645
#else
646
647
61.6M
#define RC_BIT(p, prob, bit) { \
648
61.6M
  UInt32 mask; \
649
61.6M
  RC_BIT_PRE(p, prob) \
650
61.6M
  mask = 0 - (UInt32)bit; \
651
61.6M
  range &= mask; \
652
61.6M
  mask &= newBound; \
653
61.6M
  range -= mask; \
654
61.6M
  (p)->low += mask; \
655
61.6M
  mask = (UInt32)bit - 1; \
656
61.6M
  range += newBound & mask; \
657
61.6M
  mask &= (kBitModelTotal - ((1 << kNumMoveBits) - 1)); \
658
61.6M
  mask += ((1 << kNumMoveBits) - 1); \
659
61.6M
  ttt += (Int32)(mask - ttt) >> kNumMoveBits; \
660
61.6M
  *(prob) = (CLzmaProb)ttt; \
661
61.6M
  RC_NORM(p) \
662
61.6M
  }
663
664
#endif
665
666
667
668
669
#define RC_BIT_0_BASE(p, prob) \
670
9.08M
  range = newBound; *(prob) = (CLzmaProb)(ttt + ((kBitModelTotal - ttt) >> kNumMoveBits));
671
672
#define RC_BIT_1_BASE(p, prob) \
673
3.36M
  range -= newBound; (p)->low += newBound; *(prob) = (CLzmaProb)(ttt - (ttt >> kNumMoveBits)); \
674
675
#define RC_BIT_0(p, prob) \
676
8.69M
  RC_BIT_0_BASE(p, prob) \
677
8.69M
  RC_NORM(p)
678
679
#define RC_BIT_1(p, prob) \
680
3.11M
  RC_BIT_1_BASE(p, prob) \
681
3.11M
  RC_NORM(p)
682
683
/* Encodes a single 0 bit with the adaptive probability *prob, updating both
   the probability and the range coder state.
   The locals must be named range / ttt / newBound: the RC_BIT_* macros refer
   to them by name. */
static void RangeEnc_EncodeBit_0(CRangeEnc *p, CLzmaProb *prob)
{
  UInt32 range = p->range;
  UInt32 ttt;
  UInt32 newBound;

  RC_BIT_PRE(p, prob)
  RC_BIT_0(p, prob)

  p->range = range;
}
691
692
/* Encodes sym MSB-first through the bit tree rooted at probs[1].
   sym is OR-ed with 0x100 as a marker bit. Each step uses (sym >> 8) as the
   tree node and bit 7 as the bit to encode, then shifts sym left; the loop
   stops once sym reaches 0x10000, i.e. after 8 bits when sym < 0x100.
   The locals range / ttt / newBound are referenced by name from RC_BIT. */
static void LitEnc_Encode(CRangeEnc *p, CLzmaProb *probs, UInt32 sym)
{
  UInt32 range = p->range;

  sym |= 0x100;
  do
  {
    UInt32 ttt, newBound;
    // RangeEnc_EncodeBit(p, probs + (sym >> 8), (sym >> 7) & 1);
    CLzmaProb *node = probs + (sym >> 8);
    UInt32 curBit = (sym >> 7) & 1;

    sym <<= 1;
    RC_BIT(p, node, curBit);
  }
  while (sym < 0x10000);

  p->range = range;
}
708
709
/* Encodes sym MSB-first like LitEnc_Encode(), but picks the probability from
   a sub-table that depends on the corresponding bit of matchByte.
   offs starts at 0x100 and is cleared by `offs &= ~(matchByte ^ sym)` as soon
   as a bit of sym differs from the matching bit of matchByte; from then on
   the matchByte term no longer contributes to the index.
   The locals range / ttt / newBound are referenced by name from RC_BIT. */
static void LitEnc_EncodeMatched(CRangeEnc *p, CLzmaProb *probs, UInt32 sym, UInt32 matchByte)
{
  UInt32 range = p->range;
  UInt32 offs = 0x100;

  sym |= 0x100;
  do
  {
    UInt32 ttt, newBound;
    CLzmaProb *node;
    UInt32 curBit;

    matchByte <<= 1;
    // RangeEnc_EncodeBit(p, probs + (offs + (matchByte & offs) + (sym >> 8)), (sym >> 7) & 1);
    node = probs + (offs + (matchByte & offs) + (sym >> 8));
    curBit = (sym >> 7) & 1;
    sym <<= 1;
    offs &= ~(matchByte ^ sym);
    RC_BIT(p, node, curBit);
  }
  while (sym < 0x10000);

  p->range = range;
}
730
731
732
733
/* Fills ProbPrices[0 .. (kBitModelTotal >> kNumMoveReducingBits) - 1].
   For each index the midpoint w of its probability bucket is squared
   kNumBitPriceShiftBits times, renormalising below 2^16 after every squaring
   and counting the shifts; the entry is
   (kNumBitModelTotalBits << kNumBitPriceShiftBits) - 15 - shiftCount.
   NOTE(review): this looks like -log2(probability) in units of 1 / kBitPrice
   bit - confirm. */
static void LzmaEnc_InitPriceTables(CProbPrice *ProbPrices)
{
  const unsigned kCyclesBits = kNumBitPriceShiftBits;
  UInt32 i;

  for (i = 0; i < (kBitModelTotal >> kNumMoveReducingBits); i++)
  {
    UInt32 w = (i << kNumMoveReducingBits) + (1 << (kNumMoveReducingBits - 1));
    unsigned bitCount = 0;
    unsigned round;

    for (round = 0; round < kCyclesBits; round++)
    {
      w = w * w;
      bitCount <<= 1;
      for (; w >= ((UInt32)1 << 16); w >>= 1)
        bitCount++;
    }

    ProbPrices[i] = (CProbPrice)((kNumBitModelTotalBits << kCyclesBits) - 15 - bitCount);
    // printf("\n%3d: %5d", i, ProbPrices[i]);
  }
}
756
757
758
#define GET_PRICE(prob, bit) \
759
2.07M
  p->ProbPrices[((prob) ^ (unsigned)(((-(int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits];
760
761
#define GET_PRICEa(prob, bit) \
762
80.2M
     ProbPrices[((prob) ^ (unsigned)((-((int)(bit))) & (kBitModelTotal - 1))) >> kNumMoveReducingBits];
763
764
17.4M
#define GET_PRICE_0(prob) p->ProbPrices[(prob) >> kNumMoveReducingBits]
765
26.1M
#define GET_PRICE_1(prob) p->ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
766
767
10.6M
#define GET_PRICEa_0(prob) ProbPrices[(prob) >> kNumMoveReducingBits]
768
10.6M
#define GET_PRICEa_1(prob) ProbPrices[((prob) ^ (kBitModelTotal - 1)) >> kNumMoveReducingBits]
769
770
771
/* Returns the summed price of coding sym through the bit tree probs[].
   The bits are visited LSB-first: sym (with marker bit 0x100) is shifted
   right until it drops below 2, pricing each removed bit against the
   probability at the remaining prefix.
   The parameter must be named ProbPrices: GET_PRICEa refers to it by name. */
static UInt32 LitEnc_GetPrice(const CLzmaProb *probs, UInt32 sym, const CProbPrice *ProbPrices)
{
  UInt32 total = 0;

  sym |= 0x100;
  do
  {
    const unsigned curBit = sym & 1;

    sym >>= 1;
    total += GET_PRICEa(probs[sym], curBit);
  }
  while (sym >= 2);

  return total;
}
784
785
786
/* Returns the summed price of coding sym with the matched-literal model,
   using the same probability indexing as LitEnc_EncodeMatched():
   probs[offs + (matchByte & offs) + (sym >> 8)], MSB-first, with offs
   cleared once sym and matchByte diverge.
   The parameter must be named ProbPrices: GET_PRICEa refers to it by name. */
static UInt32 LitEnc_Matched_GetPrice(const CLzmaProb *probs, UInt32 sym, UInt32 matchByte, const CProbPrice *ProbPrices)
{
  UInt32 total = 0;
  UInt32 offs = 0x100;

  sym |= 0x100;
  do
  {
    matchByte <<= 1;
    total += GET_PRICEa(probs[offs + (matchByte & offs) + (sym >> 8)], (sym >> 7) & 1);
    sym <<= 1;
    offs &= ~(matchByte ^ sym);
  }
  while (sym < 0x10000);

  return total;
}
801
802
803
/* Encodes the numBits low bits of sym LSB-first through the bit tree
   probs[], starting at node 1 and descending with node = (node << 1) | bit.
   numBits must be at least 1: the loop body always runs once before the
   counter is tested.
   The locals range / ttt / newBound are referenced by name from RC_BIT. */
static void RcTree_ReverseEncode(CRangeEnc *rc, CLzmaProb *probs, unsigned numBits, unsigned sym)
{
  UInt32 range = rc->range;
  unsigned node = 1;

  do
  {
    UInt32 ttt, newBound;
    unsigned curBit = sym & 1;
    // RangeEnc_EncodeBit(rc, probs + m, bit);

    sym >>= 1;
    RC_BIT(rc, probs + node, curBit);
    node = (node << 1) | curBit;
  }
  while (--numBits != 0);

  rc->range = range;
}
819
820
821
822
/* Sets every probability in p->low[] and p->high[] to kProbInitValue. */
static void LenEnc_Init(CLenEnc *p)
{
  const unsigned numLow = (LZMA_NUM_PB_STATES_MAX << (kLenNumLowBits + 1));
  const unsigned numHigh = kLenNumHighSymbols;
  unsigned idx;

  for (idx = 0; idx < numLow; idx++)
    p->low[idx] = kProbInitValue;

  for (idx = 0; idx < numHigh; idx++)
    p->high[idx] = kProbInitValue;
}
830
831
/* Encodes the length symbol sym for the given posState.
     sym <  kLenNumLowSymbols      : bit 0, then a 3-bit tree at
                                     low + (posState << (1 + kLenNumLowBits))
     sym <  kLenNumLowSymbols * 2  : bits 1,0, then the 3-bit tree located
                                     kLenNumLowSymbols entries further on
     otherwise                     : bits 1,1, then (sym - 2 * kLenNumLowSymbols)
                                     through p->high via LitEnc_Encode()
   The locals range / ttt / newBound are referenced by name from the RC_*
   macros. */
static void LenEnc_Encode(CLenEnc *p, CRangeEnc *rc, unsigned sym, unsigned posState)
{
  UInt32 range, ttt, newBound;
  CLzmaProb *probs = p->low;
  unsigned node;
  unsigned curBit;

  range = rc->range;
  RC_BIT_PRE(rc, probs);

  if (sym >= kLenNumLowSymbols)
  {
    RC_BIT_1(rc, probs);
    probs += kLenNumLowSymbols;
    RC_BIT_PRE(rc, probs);

    if (sym >= kLenNumLowSymbols * 2)
    {
      RC_BIT_1(rc, probs);
      /* LitEnc_Encode reads rc->range, so write the local copy back first. */
      rc->range = range;
      // RcTree_Encode(rc, p->high, kLenNumHighBits, sym - kLenNumLowSymbols * 2);
      LitEnc_Encode(rc, p->high, sym - kLenNumLowSymbols * 2);
      return;
    }

    sym -= kLenNumLowSymbols;
  }

  // RcTree_Encode(rc, probs + (posState << kLenNumLowBits), kLenNumLowBits, sym);
  RC_BIT_0(rc, probs);
  probs += (posState << (1 + kLenNumLowBits));

  /* Three tree levels, most significant bit first. */
  curBit = (sym >> 2);
  RC_BIT(rc, probs + 1, curBit);
  node = (1 << 1) + curBit;

  curBit = (sym >> 1) & 1;
  RC_BIT(rc, probs + node, curBit);
  node = (node << 1) + curBit;

  curBit = sym & 1;
  RC_BIT(rc, probs + node, curBit);

  rc->range = range;
}
865
866
/* Writes the prices of all eight symbols of one 3-bit tree into prices[0..7].
   Each price is startPrice plus the prices of the three tree decisions
   (probs[1], probs[2 + b2], probs[4 + b2b1]). Symbols are handled in pairs
   that share the first two decisions.
   The parameter must be named ProbPrices: the GET_PRICEa* macros refer to it
   by name. */
static void SetPrices_3(const CLzmaProb *probs, UInt32 startPrice, UInt32 *prices, const CProbPrice *ProbPrices)
{
  unsigned pair;

  for (pair = 0; pair < 4; pair++)
  {
    const unsigned topBit = pair >> 1;
    const unsigned midBit = pair & 1;
    UInt32 shared = startPrice;
    UInt32 leaf;

    shared += GET_PRICEa(probs[1], topBit);
    shared += GET_PRICEa(probs[2 + topBit], midBit);

    leaf = probs[4 + pair];
    prices[pair * 2] = shared + GET_PRICEa_0(leaf);
    prices[pair * 2 + 1] = shared + GET_PRICEa_1(leaf);
  }
}
880
881
882
/* Recomputes the length price table p->prices from the probabilities in enc.
   - For every posState < numPosStates the 16 prices of the two 3-bit trees
     are computed with SetPrices_3().
   - If p->tableSize > kLenNumLowSymbols * 2, the prices for the high[] tree
     are computed once into p->prices[0] (two symbols per iteration, from the
     top index downwards) and then copied to the other posState rows, since
     high[] does not depend on posState.
   The parameter must be named ProbPrices: the GET_PRICEa* macros refer to it
   by name. */
MY_NO_INLINE static void MY_FAST_CALL LenPriceEnc_UpdateTables(
    CLenPriceEnc *p,
    unsigned numPosStates,
    const CLenEnc *enc,
    const CProbPrice *ProbPrices)
{
  UInt32 priceLow;    /* choice bit 0                 */
  UInt32 priceMid;    /* choice bit 1, choice2 bit 0  */
  UInt32 priceHigh;   /* choice bit 1 (+ choice2 bit 1 once the high part starts) */
  unsigned posState;
  unsigned i;

  {
    const unsigned choice = enc->low[0];
    priceHigh = GET_PRICEa_1(choice);
    priceLow = GET_PRICEa_0(choice);
  }
  priceMid = priceHigh + GET_PRICEa_0(enc->low[kLenNumLowSymbols]);

  for (posState = 0; posState < numPosStates; posState++)
  {
    UInt32 *row = p->prices[posState];
    const CLzmaProb *tree = enc->low + (posState << (1 + kLenNumLowBits));

    SetPrices_3(tree, priceLow, row, ProbPrices);
    SetPrices_3(tree + kLenNumLowSymbols, priceMid, row + kLenNumLowSymbols, ProbPrices);
  }

  // p->counter = numSymbols;
  // p->counter = 64;

  i = p->tableSize;
  if (i <= kLenNumLowSymbols * 2)
    return;

  {
    const CLzmaProb *probs = enc->high;
    UInt32 *prices = p->prices[0] + kLenNumLowSymbols * 2;
    size_t num;

    /* Number of symbol pairs to price, rounded up. */
    i -= kLenNumLowSymbols * 2 - 1;
    i >>= 1;

    priceHigh += GET_PRICEa_1(enc->low[kLenNumLowSymbols]);

    do
    {
      // UInt32 price = a + RcTree_GetPrice(probs, kLenNumHighBits - 1, sym, ProbPrices);
      unsigned sym = --i + (1 << (kLenNumHighBits - 1));
      UInt32 price = priceHigh;
      unsigned leaf;

      /* Price of the upper kLenNumHighBits - 1 tree levels shared by the pair. */
      do
      {
        unsigned bit = sym & 1;
        sym >>= 1;
        price += GET_PRICEa(probs[sym], bit);
      }
      while (sym >= 2);

      leaf = probs[(size_t)i + (1 << (kLenNumHighBits - 1))];
      prices[(size_t)i * 2] = price + GET_PRICEa_0(leaf);
      prices[(size_t)i * 2 + 1] = price + GET_PRICEa_1(leaf);
    }
    while (i);

    num = (p->tableSize - kLenNumLowSymbols * 2) * sizeof(p->prices[0][0]);
    for (posState = 1; posState < numPosStates; posState++)
      memcpy(p->prices[posState] + kLenNumLowSymbols * 2, p->prices[0] + kLenNumLowSymbols * 2, num);
  }
}
969
970
/*
971
  #ifdef SHOW_STAT
972
  g_STAT_OFFSET += num;
973
  printf("\n MovePos %u", num);
974
  #endif
975
*/
976
  
977
390k
#define MOVE_POS(p, num) { \
978
390k
    p->additionalOffset += (num); \
979
390k
    p->matchFinder.Skip(p->matchFinderObj, (UInt32)(num)); }
980
981
982
/* Asks the match finder for the matches at the current position.
   Side effects: increments p->additionalOffset, refreshes p->numAvail and
   fills p->matches with (length, distance) pairs; *numPairsRes receives the
   number of UInt32 values written.
   Returns 0 when there is no match, otherwise the length of the last pair.
   When that length equals numFastBytes, the match is extended byte by byte
   (up to min(numAvail, LZMA_MATCH_LEN_MAX)) and the extended length is
   returned. */
static unsigned ReadMatchDistances(CLzmaEnc *p, unsigned *numPairsRes)
{
  unsigned numPairs;
  unsigned len;

  p->additionalOffset++;
  p->numAvail = p->matchFinder.GetNumAvailableBytes(p->matchFinderObj);
  numPairs = p->matchFinder.GetMatches(p->matchFinderObj, p->matches);
  *numPairsRes = numPairs;

  #ifdef SHOW_STAT
  printf("\n i = %u numPairs = %u    ", g_STAT_OFFSET, numPairs / 2);
  g_STAT_OFFSET++;
  {
    unsigned i;
    for (i = 0; i < numPairs; i += 2)
      printf("%2u %6u   | ", p->matches[i], p->matches[i + 1]);
  }
  #endif

  if (numPairs == 0)
    return 0;

  len = p->matches[(size_t)numPairs - 2];
  if (len != p->numFastBytes)
    return len;

  {
    UInt32 numAvail = p->numAvail;
    const Byte *start;
    const Byte *cur;
    const Byte *lim;
    ptrdiff_t dif;

    if (numAvail > LZMA_MATCH_LEN_MAX)
      numAvail = LZMA_MATCH_LEN_MAX;

    /* One byte before the match finder's current pointer. */
    start = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
    cur = start + len;
    /* Negative offset from a byte to its counterpart in the match source. */
    dif = (ptrdiff_t)-1 - p->matches[(size_t)numPairs - 1];
    lim = start + numAvail;

    while (cur != lim && *cur == cur[dif])
      cur++;

    return (unsigned)(cur - start);
  }
}
1023
1024
14.6M
/* Value stored in a `dist` field (and in backRes) to mark a literal step. */
#define MARK_LIT ((UInt32)(Int32)-1)

/* Tag the node *p as a literal / as a short rep. Both clear `extra`. */
#define MakeAs_Lit(p) \
  { (p)->dist = MARK_LIT; (p)->extra = 0; }
#define MakeAs_ShortRep(p) \
  { (p)->dist = 0; (p)->extra = 0; }

/* True when the node's dist is 0 (callers test this only for len == 1 nodes). */
#define IsShortRep(p) (0 == (p)->dist)
1029
1030
1031
/* Price of the isRepG0 = 0 and isRep0Long = 0 bits for (state, posState). */
#define GetPrice_ShortRep(p, state, posState) ( \
    GET_PRICE_0(p->isRepG0[state]) \
  + GET_PRICE_0(p->isRep0Long[state][posState]))
1033
1034
2.87M
/*
  Sum of four bit prices for (state, posState):
  isMatch = 1, isRep0Long = 1, isRep = 1, isRepG0 = 0.

  The whole sum is enclosed in one pair of parentheses so the macro
  behaves as a single operand in any expression (multiplication,
  comparison, ...), not only in the additive contexts it is used in now.
*/
#define GetPrice_Rep_0(p, state, posState) ( \
    GET_PRICE_1(p->isMatch[state][posState]) \
  + GET_PRICE_1(p->isRep0Long[state][posState]) \
  + GET_PRICE_1(p->isRep[state]) \
  + GET_PRICE_0(p->isRepG0[state]))
1039
  
1040
MY_FORCE_INLINE
1041
static UInt32 GetPrice_PureRep(const CLzmaEnc *p, unsigned repIndex, size_t state, size_t posState)
1042
5.07M
{
1043
5.07M
  UInt32 price;
1044
5.07M
  UInt32 prob = p->isRepG0[state];
1045
5.07M
  if (repIndex == 0)
1046
1.82M
  {
1047
1.82M
    price = GET_PRICE_0(prob);
1048
1.82M
    price += GET_PRICE_1(p->isRep0Long[state][posState]);
1049
1.82M
  }
1050
3.24M
  else
1051
3.24M
  {
1052
3.24M
    price = GET_PRICE_1(prob);
1053
3.24M
    prob = p->isRepG1[state];
1054
3.24M
    if (repIndex == 1)
1055
1.17M
      price += GET_PRICE_0(prob);
1056
2.07M
    else
1057
2.07M
    {
1058
2.07M
      price += GET_PRICE_1(prob);
1059
2.07M
      price += GET_PRICE(p->isRepG2[state], repIndex - 2);
1060
2.07M
    }
1061
3.24M
  }
1062
5.07M
  return price;
1063
5.07M
}
1064
1065
1066
/*
  Walks the chosen path in p->opt[] backwards from node `cur` to node 0 and
  rewrites it, in forward order, into the slots just below cur + 1.

  A node with a non-zero `extra` stands for several steps and is expanded:
    extra == 1 : literal, then the node's own (dist, len)
    extra  > 1 : (dist, extra - 1), literal, then rep0 of length len

  On return p->optEnd is cur + 1, p->optCur is the index of the first
  stored slot, p->backRes is the dist of the very first step, and the
  return value is that first step's length.
*/
static unsigned Backward(CLzmaEnc *p, unsigned cur)
{
  unsigned out = cur + 1;
  p->optEnd = out;

  for (;;)
  {
    /* read the whole node first: the slot may be overwritten below */
    const COptimal *node = &p->opt[cur];
    UInt32 stepDist = node->dist;
    unsigned stepLen = (unsigned)node->len;
    const unsigned stepExtra = (unsigned)node->extra;
    COptimal *slot;

    cur -= stepLen;

    if (stepExtra != 0)
    {
      slot = &p->opt[--out];
      slot->len = (UInt32)stepLen;
      cur -= stepExtra;
      stepLen = stepExtra;
      if (stepExtra == 1)
      {
        slot->dist = stepDist;
        stepDist = MARK_LIT;
      }
      else
      {
        slot->dist = 0;
        stepLen--;
        slot = &p->opt[--out];
        slot->dist = MARK_LIT;
        slot->len = 1;
      }
    }

    if (cur == 0)
    {
      p->backRes = stepDist;
      p->optCur = out;
      return stepLen;
    }

    slot = &p->opt[--out];
    slot->dist = stepDist;
    slot->len = (UInt32)stepLen;
  }
}
1111
1112
1113
1114
/*
  Pointer into p->litProbs for the given position and previous byte.
  The context index is (((pos << 8) + prevByte) & lpMask) << lc, and each
  index unit covers 3 entries. Uses the enclosing function's `p` implicitly.
*/
#define LIT_PROBS(pos, prevByte) \
  (p->litProbs + (UInt32)3 * ( \
      ((((pos) << 8) + (prevByte)) & p->lpMask) << p->lc))
1116
1117
1118
/*
  Optimal-parsing selection of the next step(s) to encode at `position`.

  Returns the length of the first step. p->backRes describes that step:
  MARK_LIT for a literal, 0..LZMA_NUM_REPS-1 for a rep match (0 with
  length 1 is a short rep), or distance + LZMA_NUM_REPS for a normal match.

  Fast paths return immediately (too little input, a rep or normal match of
  at least numFastBytes, or nothing better than a literal). Otherwise the
  function fills p->opt[] with the cheapest known way to reach each offset,
  extends that table position by position, and finally calls Backward() to
  turn the cheapest path into a forward list (p->optCur .. p->optEnd).
*/
static unsigned GetOptimum(CLzmaEnc *p, UInt32 position)
1119
2.73M
{
1120
2.73M
  unsigned last, cur;
1121
2.73M
  UInt32 reps[LZMA_NUM_REPS];
1122
2.73M
  unsigned repLens[LZMA_NUM_REPS];
1123
2.73M
  UInt32 *matches;
1124
1125
2.73M
  {
1126
2.73M
    UInt32 numAvail;
1127
2.73M
    unsigned numPairs, mainLen, repMaxIndex, i, posState;
1128
2.73M
    UInt32 matchPrice, repMatchPrice;
1129
2.73M
    const Byte *data;
1130
2.73M
    Byte curByte, matchByte;
1131
    
1132
2.73M
    p->optCur = p->optEnd = 0;
1133
    
1134
2.73M
    // additionalOffset != 0: matches for this position were already read
    // (and stored in longestMatchLen / numPairs), so reuse them.
    if (p->additionalOffset == 0)
1135
2.70M
      mainLen = ReadMatchDistances(p, &numPairs);
1136
36.0k
    else
1137
36.0k
    {
1138
36.0k
      mainLen = p->longestMatchLen;
1139
36.0k
      numPairs = p->numPairs;
1140
36.0k
    }
1141
    
1142
2.73M
    numAvail = p->numAvail;
1143
2.73M
    // fewer than 2 bytes available: emit a literal
    if (numAvail < 2)
1144
2.03k
    {
1145
2.03k
      p->backRes = MARK_LIT;
1146
2.03k
      return 1;
1147
2.03k
    }
1148
2.73M
    if (numAvail > LZMA_MATCH_LEN_MAX)
1149
2.60M
      numAvail = LZMA_MATCH_LEN_MAX;
1150
    
1151
2.73M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1152
2.73M
    repMaxIndex = 0;
1153
    
1154
13.6M
    // measure the match length at each rep distance; repMaxIndex = longest
    for (i = 0; i < LZMA_NUM_REPS; i++)
1155
10.9M
    {
1156
10.9M
      unsigned len;
1157
10.9M
      const Byte *data2;
1158
10.9M
      reps[i] = p->reps[i];
1159
10.9M
      data2 = data - reps[i];
1160
10.9M
      if (data[0] != data2[0] || data[1] != data2[1])
1161
10.7M
      {
1162
10.7M
        repLens[i] = 0;
1163
10.7M
        continue;
1164
10.7M
      }
1165
3.91M
      for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1166
3.75M
      {}
1167
158k
      repLens[i] = len;
1168
158k
      if (len > repLens[repMaxIndex])
1169
80.7k
        repMaxIndex = i;
1170
158k
    }
1171
    
1172
2.73M
    // a rep match of at least numFastBytes is taken immediately
    if (repLens[repMaxIndex] >= p->numFastBytes)
1173
46.3k
    {
1174
46.3k
      unsigned len;
1175
46.3k
      p->backRes = (UInt32)repMaxIndex;
1176
46.3k
      len = repLens[repMaxIndex];
1177
46.3k
      MOVE_POS(p, len - 1)
1178
46.3k
      return len;
1179
46.3k
    }
1180
    
1181
2.69M
    matches = p->matches;
1182
    
1183
2.69M
    // likewise for a normal match of at least numFastBytes
    if (mainLen >= p->numFastBytes)
1184
55.5k
    {
1185
55.5k
      p->backRes = matches[(size_t)numPairs - 1] + LZMA_NUM_REPS;
1186
55.5k
      MOVE_POS(p, mainLen - 1)
1187
55.5k
      return mainLen;
1188
55.5k
    }
1189
    
1190
2.63M
    curByte = *data;
1191
2.63M
    matchByte = *(data - reps[0]);
1192
1193
2.63M
    last = repLens[repMaxIndex];
1194
2.63M
    if (last <= mainLen)
1195
2.63M
      last = mainLen;
1196
    
1197
2.63M
    // no match of length >= 2 and no short-rep candidate: literal
    if (last < 2 && curByte != matchByte)
1198
2.22M
    {
1199
2.22M
      p->backRes = MARK_LIT;
1200
2.22M
      return 1;
1201
2.22M
    }
1202
    
1203
405k
    p->opt[0].state = (CState)p->state;
1204
    
1205
405k
    posState = (position & p->pbMask);
1206
    
1207
405k
    // opt[1] starts as "one literal"
    {
1208
405k
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1209
405k
      p->opt[1].price = GET_PRICE_0(p->isMatch[p->state][posState]) +
1210
405k
        (!IsLitState(p->state) ?
1211
68.0k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1212
405k
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1213
405k
    }
1214
1215
405k
    MakeAs_Lit(&p->opt[1]);
1216
    
1217
405k
    matchPrice = GET_PRICE_1(p->isMatch[p->state][posState]);
1218
405k
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[p->state]);
1219
    
1220
    // 18.06
1221
405k
    // ... and becomes a short rep when that is cheaper
    if (matchByte == curByte && repLens[0] == 0)
1222
39.6k
    {
1223
39.6k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, p->state, posState);
1224
39.6k
      if (shortRepPrice < p->opt[1].price)
1225
34.6k
      {
1226
34.6k
        p->opt[1].price = shortRepPrice;
1227
34.6k
        MakeAs_ShortRep(&p->opt[1]);
1228
34.6k
      }
1229
39.6k
      if (last < 2)
1230
28.3k
      {
1231
28.3k
        p->backRes = p->opt[1].dist;
1232
28.3k
        return 1;
1233
28.3k
      }
1234
39.6k
    }
1235
   
1236
376k
    p->opt[1].len = 1;
1237
    
1238
376k
    p->opt[0].reps[0] = reps[0];
1239
376k
    p->opt[0].reps[1] = reps[1];
1240
376k
    p->opt[0].reps[2] = reps[2];
1241
376k
    p->opt[0].reps[3] = reps[3];
1242
    
1243
    // ---------- REP ----------
1244
    
1245
1.88M
    // seed opt[2 .. repLen] with every rep match that beats the stored price
    for (i = 0; i < LZMA_NUM_REPS; i++)
1246
1.50M
    {
1247
1.50M
      unsigned repLen = repLens[i];
1248
1.50M
      UInt32 price;
1249
1.50M
      if (repLen < 2)
1250
1.44M
        continue;
1251
62.0k
      price = repMatchPrice + GetPrice_PureRep(p, i, p->state, posState);
1252
62.0k
      do
1253
343k
      {
1254
343k
        UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, repLen);
1255
343k
        COptimal *opt = &p->opt[repLen];
1256
343k
        if (price2 < opt->price)
1257
227k
        {
1258
227k
          opt->price = price2;
1259
227k
          opt->len = (UInt32)repLen;
1260
227k
          opt->dist = (UInt32)i;
1261
227k
          opt->extra = 0;
1262
227k
        }
1263
343k
      }
1264
343k
      while (--repLen >= 2);
1265
62.0k
    }
1266
    
1267
    
1268
    // ---------- MATCH ----------
1269
376k
    // seed opt[len] with normal matches for lengths above repLens[0]
    {
1270
376k
      unsigned len = repLens[0] + 1;
1271
376k
      if (len <= mainLen)
1272
366k
      {
1273
366k
        unsigned offs = 0;
1274
366k
        UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[p->state]);
1275
1276
366k
        if (len < 2)
1277
365k
          len = 2;
1278
1.47k
        else
1279
3.89k
          while (len > matches[offs])
1280
2.42k
            offs += 2;
1281
    
1282
366k
        for (; ; len++)
1283
650k
        {
1284
650k
          COptimal *opt;
1285
650k
          UInt32 dist = matches[(size_t)offs + 1];
1286
650k
          UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1287
650k
          unsigned lenToPosState = GetLenToPosState(len);
1288
       
1289
650k
          if (dist < kNumFullDistances)
1290
264k
            price += p->distancesPrices[lenToPosState][dist & (kNumFullDistances - 1)];
1291
386k
          else
1292
386k
          {
1293
386k
            unsigned slot;
1294
386k
            GetPosSlot2(dist, slot);
1295
386k
            price += p->alignPrices[dist & kAlignMask];
1296
386k
            price += p->posSlotPrices[lenToPosState][slot];
1297
386k
          }
1298
          
1299
650k
          opt = &p->opt[len];
1300
          
1301
650k
          if (price < opt->price)
1302
594k
          {
1303
594k
            opt->price = price;
1304
594k
            opt->len = (UInt32)len;
1305
594k
            opt->dist = dist + LZMA_NUM_REPS;
1306
594k
            opt->extra = 0;
1307
594k
          }
1308
          
1309
650k
          if (len == matches[offs])
1310
435k
          {
1311
435k
            offs += 2;
1312
435k
            if (offs == numPairs)
1313
366k
              break;
1314
435k
          }
1315
650k
        }
1316
366k
      }
1317
376k
    }
1318
    
1319
1320
376k
    cur = 0;
1321
1322
    #ifdef SHOW_STAT2
1323
    /* if (position >= 0) */
1324
    {
1325
      unsigned i;
1326
      printf("\n pos = %4X", position);
1327
      for (i = cur; i <= last; i++)
1328
      printf("\nprice[%4X] = %u", position - cur + i, p->opt[i].price);
1329
    }
1330
    #endif
1331
376k
  }
1332
1333
1334
  
1335
  // ---------- Optimal Parsing ----------
1336
1337
0
  for (;;)
1338
5.16M
  {
1339
5.16M
    unsigned numAvail;
1340
5.16M
    UInt32 numAvailFull;
1341
5.16M
    unsigned newLen, numPairs, prev, state, posState, startLen;
1342
5.16M
    UInt32 litPrice, matchPrice, repMatchPrice;
1343
5.16M
    BoolInt nextIsLit;
1344
5.16M
    Byte curByte, matchByte;
1345
5.16M
    const Byte *data;
1346
5.16M
    COptimal *curOpt, *nextOpt;
1347
1348
5.16M
    // reached the farthest offset any candidate extends to: path is complete
    if (++cur == last)
1349
340k
      break;
1350
    
1351
    // 18.06
1352
4.82M
    // within 64 slots of kNumOpts: stop at the cheapest node in
    // cur..last (ties go to the later one) and skip the input up to it
    if (cur >= kNumOpts - 64)
1353
424
    {
1354
424
      unsigned j, best;
1355
424
      UInt32 price = p->opt[cur].price;
1356
424
      best = cur;
1357
7.36k
      for (j = cur + 1; j <= last; j++)
1358
6.93k
      {
1359
6.93k
        UInt32 price2 = p->opt[j].price;
1360
6.93k
        if (price >= price2)
1361
661
        {
1362
661
          price = price2;
1363
661
          best = j;
1364
661
        }
1365
6.93k
      }
1366
424
      {
1367
424
        unsigned delta = best - cur;
1368
424
        if (delta != 0)
1369
250
        {
1370
250
          MOVE_POS(p, delta);
1371
250
        }
1372
424
      }
1373
424
      cur = best;
1374
424
      break;
1375
424
    }
1376
1377
4.82M
    newLen = ReadMatchDistances(p, &numPairs);
1378
    
1379
4.82M
    // a match of at least numFastBytes ends the search; it is stored so
    // that the next call can use it without reading the match finder again
    if (newLen >= p->numFastBytes)
1380
36.0k
    {
1381
36.0k
      p->numPairs = numPairs;
1382
36.0k
      p->longestMatchLen = newLen;
1383
36.0k
      break;
1384
36.0k
    }
1385
    
1386
4.78M
    curOpt = &p->opt[cur];
1387
1388
4.78M
    position++;
1389
1390
    // we need that check here, if skip_items in p->opt are possible
1391
    /*
1392
    if (curOpt->price >= kInfinityPrice)
1393
      continue;
1394
    */
1395
1396
4.78M
    // rebuild the coder state and rep distances that hold at node cur
    // from the node its cheapest step starts at
    prev = cur - curOpt->len;
1397
1398
4.78M
    if (curOpt->len == 1)
1399
1.16M
    {
1400
1.16M
      state = (unsigned)p->opt[prev].state;
1401
1.16M
      if (IsShortRep(curOpt))
1402
117k
        state = kShortRepNextStates[state];
1403
1.04M
      else
1404
1.04M
        state = kLiteralNextStates[state];
1405
1.16M
    }
1406
3.62M
    else
1407
3.62M
    {
1408
3.62M
      const COptimal *prevOpt;
1409
3.62M
      UInt32 b0;
1410
3.62M
      UInt32 dist = curOpt->dist;
1411
1412
3.62M
      if (curOpt->extra)
1413
70.6k
      {
1414
70.6k
        prev -= (unsigned)curOpt->extra;
1415
70.6k
        state = kState_RepAfterLit;
1416
70.6k
        if (curOpt->extra == 1)
1417
1.05k
          state = (dist < LZMA_NUM_REPS ? kState_RepAfterLit : kState_MatchAfterLit);
1418
70.6k
      }
1419
3.55M
      else
1420
3.55M
      {
1421
3.55M
        state = (unsigned)p->opt[prev].state;
1422
3.55M
        if (dist < LZMA_NUM_REPS)
1423
1.75M
          state = kRepNextStates[state];
1424
1.80M
        else
1425
1.80M
          state = kMatchNextStates[state];
1426
3.55M
      }
1427
1428
3.62M
      prevOpt = &p->opt[prev];
1429
3.62M
      b0 = prevOpt->reps[0];
1430
1431
3.62M
      if (dist < LZMA_NUM_REPS)
1432
1.81M
      {
1433
1.81M
        if (dist == 0)
1434
440k
        {
1435
440k
          reps[0] = b0;
1436
440k
          reps[1] = prevOpt->reps[1];
1437
440k
          reps[2] = prevOpt->reps[2];
1438
440k
          reps[3] = prevOpt->reps[3];
1439
440k
        }
1440
1.37M
        else
1441
1.37M
        {
1442
1.37M
          reps[1] = b0;
1443
1.37M
          b0 = prevOpt->reps[1];
1444
1.37M
          if (dist == 1)
1445
844k
          {
1446
844k
            reps[0] = b0;
1447
844k
            reps[2] = prevOpt->reps[2];
1448
844k
            reps[3] = prevOpt->reps[3];
1449
844k
          }
1450
529k
          else
1451
529k
          {
1452
529k
            reps[2] = b0;
1453
529k
            reps[0] = prevOpt->reps[dist];
1454
529k
            reps[3] = prevOpt->reps[dist ^ 1];
1455
529k
          }
1456
1.37M
        }
1457
1.81M
      }
1458
1.81M
      else
1459
1.81M
      {
1460
1.81M
        reps[0] = (dist - LZMA_NUM_REPS + 1);
1461
1.81M
        reps[1] = b0;
1462
1.81M
        reps[2] = prevOpt->reps[1];
1463
1.81M
        reps[3] = prevOpt->reps[2];
1464
1.81M
      }
1465
3.62M
    }
1466
    
1467
4.78M
    curOpt->state = (CState)state;
1468
4.78M
    curOpt->reps[0] = reps[0];
1469
4.78M
    curOpt->reps[1] = reps[1];
1470
4.78M
    curOpt->reps[2] = reps[2];
1471
4.78M
    curOpt->reps[3] = reps[3];
1472
1473
4.78M
    data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
1474
4.78M
    curByte = *data;
1475
4.78M
    matchByte = *(data - reps[0]);
1476
1477
4.78M
    posState = (position & p->pbMask);
1478
1479
    /*
1480
    The order of Price checks:
1481
       <  LIT
1482
       <= SHORT_REP
1483
       <  LIT : REP_0
1484
       <  REP    [ : LIT : REP_0 ]
1485
       <  MATCH  [ : LIT : REP_0 ]
1486
    */
1487
1488
4.78M
    {
1489
4.78M
      UInt32 curPrice = curOpt->price;
1490
4.78M
      unsigned prob = p->isMatch[state][posState];
1491
4.78M
      matchPrice = curPrice + GET_PRICE_1(prob);
1492
4.78M
      litPrice = curPrice + GET_PRICE_0(prob);
1493
4.78M
    }
1494
1495
4.78M
    nextOpt = &p->opt[(size_t)cur + 1];
1496
4.78M
    nextIsLit = False;
1497
1498
    // here we can allow skip_items in p->opt, if we don't check (nextOpt->price < kInfinityPrice)
1499
    // 18.new.06
1500
4.78M
    // litPrice == 0 is used below as "literal was not evaluated" marker
    if ((nextOpt->price < kInfinityPrice
1501
        // && !IsLitState(state)
1502
4.78M
        && matchByte == curByte)
1503
4.78M
        || litPrice > nextOpt->price
1504
4.78M
        )
1505
3.21M
      litPrice = 0;
1506
1.57M
    else
1507
1.57M
    {
1508
1.57M
      const CLzmaProb *probs = LIT_PROBS(position, *(data - 1));
1509
1.57M
      litPrice += (!IsLitState(state) ?
1510
879k
          LitEnc_Matched_GetPrice(probs, curByte, matchByte, p->ProbPrices) :
1511
1.57M
          LitEnc_GetPrice(probs, curByte, p->ProbPrices));
1512
      
1513
1.57M
      if (litPrice < nextOpt->price)
1514
952k
      {
1515
952k
        nextOpt->price = litPrice;
1516
952k
        nextOpt->len = 1;
1517
952k
        MakeAs_Lit(nextOpt);
1518
952k
        nextIsLit = True;
1519
952k
      }
1520
1.57M
    }
1521
1522
4.78M
    repMatchPrice = matchPrice + GET_PRICE_1(p->isRep[state]);
1523
    
1524
4.78M
    // numAvailFull: available bytes, capped so that cur + len stays below kNumOpts
    numAvailFull = p->numAvail;
1525
4.78M
    {
1526
4.78M
      unsigned temp = kNumOpts - 1 - cur;
1527
4.78M
      if (numAvailFull > temp)
1528
3.89M
        numAvailFull = (UInt32)temp;
1529
4.78M
    }
1530
1531
    // 18.06
1532
    // ---------- SHORT_REP ----------
1533
4.78M
    if (IsLitState(state)) // 18.new
1534
1.04M
    if (matchByte == curByte)
1535
244k
    if (repMatchPrice < nextOpt->price) // 18.new
1536
    // if (numAvailFull < 2 || data[1] != *(data - reps[0] + 1))
1537
139k
    if (
1538
        // nextOpt->price >= kInfinityPrice ||
1539
139k
        nextOpt->len < 2   // we can check nextOpt->len, if skip items are not allowed in p->opt
1540
139k
        || (nextOpt->dist != 0
1541
            // && nextOpt->extra <= 1 // 17.old
1542
129k
            )
1543
139k
        )
1544
138k
    {
1545
138k
      UInt32 shortRepPrice = repMatchPrice + GetPrice_ShortRep(p, state, posState);
1546
      // if (shortRepPrice <= nextOpt->price) // 17.old
1547
138k
      if (shortRepPrice < nextOpt->price)  // 18.new
1548
115k
      {
1549
115k
        nextOpt->price = shortRepPrice;
1550
115k
        nextOpt->len = 1;
1551
115k
        MakeAs_ShortRep(nextOpt);
1552
115k
        nextIsLit = False;
1553
115k
      }
1554
138k
    }
1555
    
1556
4.78M
    if (numAvailFull < 2)
1557
3.04k
      continue;
1558
4.78M
    numAvail = (numAvailFull <= p->numFastBytes ? numAvailFull : p->numFastBytes);
1559
1560
    // numAvail <= p->numFastBytes
1561
1562
    // ---------- LIT : REP_0 ----------
1563
1564
4.78M
    if (!nextIsLit
1565
4.78M
        && litPrice != 0 // 18.new
1566
4.78M
        && matchByte != curByte
1567
4.78M
        && numAvailFull > 2)
1568
616k
    {
1569
616k
      const Byte *data2 = data - reps[0];
1570
616k
      if (data[1] == data2[1] && data[2] == data2[2])
1571
118k
      {
1572
118k
        unsigned len;
1573
118k
        unsigned limit = p->numFastBytes + 1;
1574
118k
        if (limit > numAvailFull)
1575
5.35k
          limit = numAvailFull;
1576
322k
        for (len = 3; len < limit && data[len] == data2[len]; len++)
1577
203k
        {}
1578
        
1579
118k
        {
1580
118k
          unsigned state2 = kLiteralNextStates[state];
1581
118k
          unsigned posState2 = (position + 1) & p->pbMask;
1582
118k
          UInt32 price = litPrice + GetPrice_Rep_0(p, state2, posState2);
1583
118k
          {
1584
118k
            unsigned offset = cur + len;
1585
1586
118k
            if (last < offset)
1587
5.95k
              last = offset;
1588
          
1589
            // do
1590
118k
            {
1591
118k
              UInt32 price2;
1592
118k
              COptimal *opt;
1593
118k
              len--;
1594
              // price2 = price + GetPrice_Len_Rep_0(p, len, state2, posState2);
1595
118k
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len);
1596
1597
118k
              opt = &p->opt[offset];
1598
              // offset--;
1599
118k
              if (price2 < opt->price)
1600
9.66k
              {
1601
9.66k
                opt->price = price2;
1602
9.66k
                opt->len = (UInt32)len;
1603
9.66k
                opt->dist = 0;
1604
9.66k
                opt->extra = 1;
1605
9.66k
              }
1606
118k
            }
1607
            // while (len >= 3);
1608
118k
          }
1609
118k
        }
1610
118k
      }
1611
616k
    }
1612
    
1613
4.78M
    startLen = 2; /* speed optimization */
1614
1615
4.78M
    {
1616
      // ---------- REP ----------
1617
4.78M
      unsigned repIndex = 0; // 17.old
1618
      // unsigned repIndex = IsLitState(state) ? 0 : 1; // 18.notused
1619
23.9M
      for (; repIndex < LZMA_NUM_REPS; repIndex++)
1620
19.1M
      {
1621
19.1M
        unsigned len;
1622
19.1M
        UInt32 price;
1623
19.1M
        const Byte *data2 = data - reps[repIndex];
1624
19.1M
        if (data[0] != data2[0] || data[1] != data2[1])
1625
14.1M
          continue;
1626
        
1627
75.5M
        for (len = 2; len < numAvail && data[len] == data2[len]; len++)
1628
70.5M
        {}
1629
        
1630
        // if (len < startLen) continue; // 18.new: speed optimization
1631
1632
5.01M
        {
1633
5.01M
          unsigned offset = cur + len;
1634
5.01M
          if (last < offset)
1635
201k
            last = offset;
1636
5.01M
        }
1637
5.01M
        {
1638
5.01M
          unsigned len2 = len;
1639
5.01M
          price = repMatchPrice + GetPrice_PureRep(p, repIndex, state, posState);
1640
5.01M
          do
1641
75.5M
          {
1642
75.5M
            UInt32 price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState, len2);
1643
75.5M
            COptimal *opt = &p->opt[cur + len2];
1644
75.5M
            if (price2 < opt->price)
1645
3.22M
            {
1646
3.22M
              opt->price = price2;
1647
3.22M
              opt->len = (UInt32)len2;
1648
3.22M
              opt->dist = (UInt32)repIndex;
1649
3.22M
              opt->extra = 0;
1650
3.22M
            }
1651
75.5M
          }
1652
75.5M
          while (--len2 >= 2);
1653
5.01M
        }
1654
        
1655
5.01M
        if (repIndex == 0) startLen = len + 1;  // 17.old
1656
        // startLen = len + 1; // 18.new
1657
1658
        /* if (_maxMode) */
1659
5.01M
        {
1660
          // ---------- REP : LIT : REP_0 ----------
1661
          // numFastBytes + 1 + numFastBytes
1662
1663
5.01M
          unsigned len2 = len + 1;
1664
5.01M
          unsigned limit = len2 + p->numFastBytes;
1665
5.01M
          if (limit > numAvailFull)
1666
369k
            limit = numAvailFull;
1667
          
1668
5.01M
          len2 += 2;
1669
5.01M
          if (len2 <= limit)
1670
4.92M
          if (data[len2 - 2] == data2[len2 - 2])
1671
2.73M
          if (data[len2 - 1] == data2[len2 - 1])
1672
1.80M
          {
1673
1.80M
            unsigned state2 = kRepNextStates[state];
1674
1.80M
            unsigned posState2 = (position + len) & p->pbMask;
1675
1.80M
            price += GET_PRICE_LEN(&p->repLenEnc, posState, len)
1676
1.80M
                + GET_PRICE_0(p->isMatch[state2][posState2])
1677
1.80M
                + LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1678
1.80M
                    data[len], data2[len], p->ProbPrices);
1679
            
1680
            // state2 = kLiteralNextStates[state2];
1681
1.80M
            state2 = kState_LitAfterRep;
1682
1.80M
            posState2 = (posState2 + 1) & p->pbMask;
1683
1684
1685
1.80M
            price += GetPrice_Rep_0(p, state2, posState2);
1686
1687
24.5M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1688
22.7M
          {}
1689
          
1690
1.80M
          len2 -= len;
1691
          // if (len2 >= 3)
1692
1.80M
          {
1693
1.80M
            {
1694
1.80M
              unsigned offset = cur + len + len2;
1695
1696
1.80M
              if (last < offset)
1697
547k
                last = offset;
1698
              // do
1699
1.80M
              {
1700
1.80M
                UInt32 price2;
1701
1.80M
                COptimal *opt;
1702
1.80M
                len2--;
1703
                // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1704
1.80M
                price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1705
1706
1.80M
                opt = &p->opt[offset];
1707
                // offset--;
1708
1.80M
                if (price2 < opt->price)
1709
680k
                {
1710
680k
                  opt->price = price2;
1711
680k
                  opt->len = (UInt32)len2;
1712
680k
                  opt->extra = (CExtra)(len + 1);
1713
680k
                  opt->dist = (UInt32)repIndex;
1714
680k
                }
1715
1.80M
              }
1716
              // while (len2 >= 3);
1717
1.80M
            }
1718
1.80M
          }
1719
1.80M
          }
1720
5.01M
        }
1721
5.01M
      }
1722
4.78M
    }
1723
1724
1725
    // ---------- MATCH ----------
1726
    /* for (unsigned len = 2; len <= newLen; len++) */
1727
4.78M
    // clamp the match list to numAvail: the first pair whose length
    // reaches numAvail is shortened to it and later pairs are dropped
    if (newLen > numAvail)
1728
437
    {
1729
437
      newLen = numAvail;
1730
1.59k
      for (numPairs = 0; newLen > matches[numPairs]; numPairs += 2);
1731
437
      matches[numPairs] = (UInt32)newLen;
1732
437
      numPairs += 2;
1733
437
    }
1734
    
1735
    // startLen = 2; /* speed optimization */
1736
1737
4.78M
    if (newLen >= startLen)
1738
2.94M
    {
1739
2.94M
      UInt32 normalMatchPrice = matchPrice + GET_PRICE_0(p->isRep[state]);
1740
2.94M
      UInt32 dist;
1741
2.94M
      unsigned offs, posSlot, len;
1742
      
1743
2.94M
      {
1744
2.94M
        unsigned offset = cur + newLen;
1745
2.94M
        if (last < offset)
1746
840k
          last = offset;
1747
2.94M
      }
1748
1749
2.94M
      offs = 0;
1750
3.30M
      while (startLen > matches[offs])
1751
365k
        offs += 2;
1752
2.94M
      dist = matches[(size_t)offs + 1];
1753
      
1754
      // if (dist >= kNumFullDistances)
1755
2.94M
      GetPosSlot2(dist, posSlot);
1756
      
1757
12.5M
      for (len = /*2*/ startLen; ; len++)
1758
15.4M
      {
1759
15.4M
        UInt32 price = normalMatchPrice + GET_PRICE_LEN(&p->lenEnc, posState, len);
1760
15.4M
        {
1761
15.4M
          COptimal *opt;
1762
15.4M
          unsigned lenNorm = len - 2;
1763
15.4M
          lenNorm = GetLenToPosState2(lenNorm);
1764
15.4M
          if (dist < kNumFullDistances)
1765
10.7M
            price += p->distancesPrices[lenNorm][dist & (kNumFullDistances - 1)];
1766
4.74M
          else
1767
4.74M
            price += p->posSlotPrices[lenNorm][posSlot] + p->alignPrices[dist & kAlignMask];
1768
          
1769
15.4M
          opt = &p->opt[cur + len];
1770
15.4M
          if (price < opt->price)
1771
3.40M
          {
1772
3.40M
            opt->price = price;
1773
3.40M
            opt->len = (UInt32)len;
1774
3.40M
            opt->dist = dist + LZMA_NUM_REPS;
1775
3.40M
            opt->extra = 0;
1776
3.40M
          }
1777
15.4M
        }
1778
1779
15.4M
        if (len == matches[offs])
1780
3.86M
        {
1781
          // if (p->_maxMode) {
1782
          // MATCH : LIT : REP_0
1783
1784
3.86M
          const Byte *data2 = data - dist - 1;
1785
3.86M
          unsigned len2 = len + 1;
1786
3.86M
          unsigned limit = len2 + p->numFastBytes;
1787
3.86M
          if (limit > numAvailFull)
1788
123k
            limit = numAvailFull;
1789
          
1790
3.86M
          len2 += 2;
1791
3.86M
          if (len2 <= limit)
1792
3.85M
          if (data[len2 - 2] == data2[len2 - 2])
1793
1.54M
          if (data[len2 - 1] == data2[len2 - 1])
1794
948k
          {
1795
4.72M
          for (; len2 < limit && data[len2] == data2[len2]; len2++)
1796
3.77M
          {}
1797
          
1798
948k
          len2 -= len;
1799
          
1800
          // if (len2 >= 3)
1801
948k
          {
1802
948k
            unsigned state2 = kMatchNextStates[state];
1803
948k
            unsigned posState2 = (position + len) & p->pbMask;
1804
948k
            unsigned offset;
1805
948k
            price += GET_PRICE_0(p->isMatch[state2][posState2]);
1806
948k
            price += LitEnc_Matched_GetPrice(LIT_PROBS(position + len, data[(size_t)len - 1]),
1807
948k
                    data[len], data2[len], p->ProbPrices);
1808
1809
            // state2 = kLiteralNextStates[state2];
1810
948k
            state2 = kState_LitAfterMatch;
1811
1812
948k
            posState2 = (posState2 + 1) & p->pbMask;
1813
948k
            price += GetPrice_Rep_0(p, state2, posState2);
1814
1815
948k
            offset = cur + len + len2;
1816
1817
948k
            if (last < offset)
1818
143k
              last = offset;
1819
            // do
1820
948k
            {
1821
948k
              UInt32 price2;
1822
948k
              COptimal *opt;
1823
948k
              len2--;
1824
              // price2 = price + GetPrice_Len_Rep_0(p, len2, state2, posState2);
1825
948k
              price2 = price + GET_PRICE_LEN(&p->repLenEnc, posState2, len2);
1826
948k
              opt = &p->opt[offset];
1827
              // offset--;
1828
948k
              if (price2 < opt->price)
1829
416k
              {
1830
416k
                opt->price = price2;
1831
416k
                opt->len = (UInt32)len2;
1832
416k
                opt->extra = (CExtra)(len + 1);
1833
416k
                opt->dist = dist + LZMA_NUM_REPS;
1834
416k
              }
1835
948k
            }
1836
            // while (len2 >= 3);
1837
948k
          }
1838
1839
948k
          }
1840
        
1841
3.86M
          offs += 2;
1842
3.86M
          if (offs == numPairs)
1843
2.94M
            break;
1844
927k
          dist = matches[(size_t)offs + 1];
1845
          // if (dist >= kNumFullDistances)
1846
927k
            GetPosSlot2(dist, posSlot);
1847
927k
        }
1848
15.4M
      }
1849
2.94M
    }
1850
4.78M
  }
1851
1852
376k
  // reset the price of slots last..1 to kInfinityPrice; Backward() below
  // reads only the dist / len / extra fields
  do
1853
5.54M
    p->opt[last].price = kInfinityPrice;
1854
5.54M
  while (--last);
1855
1856
376k
  return Backward(p, cur);
1857
405k
}
1858
1859
1860
1861
172k
/* True when bigDist, shifted right by 7 bits, is still greater than smallDist. */
#define ChangePair(smallDist, bigDist) ((smallDist) < ((bigDist) >> 7))
1862
1863
1864
1865
/*
  Greedy selection of the next step, with a one-position lookahead.

  Returns the length of the step to encode. p->backRes describes it:
  MARK_LIT for a literal, 0..LZMA_NUM_REPS-1 for a rep match, or
  distance + LZMA_NUM_REPS for a normal match.

  When the lookahead reads the matches of the next position, they are left
  in p->longestMatchLen / p->numPairs so the next call can reuse them.
*/
static unsigned GetOptimumFast(CLzmaEnc *p)
{
  UInt32 avail, bestDist;
  unsigned bestLen, pairs, bestRep, bestRepLen, r;
  const Byte *cur;

  if (p->additionalOffset != 0)
  {
    /* matches for this position were already read */
    bestLen = p->longestMatchLen;
    pairs = p->numPairs;
  }
  else
    bestLen = ReadMatchDistances(p, &pairs);

  avail = p->numAvail;
  p->backRes = MARK_LIT;
  if (avail < 2)
    return 1;
  // if (mainLen < 2 && p->state == 0) return 1; // 18.06.notused
  if (avail > LZMA_MATCH_LEN_MAX)
    avail = LZMA_MATCH_LEN_MAX;
  cur = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;
  bestRep = 0;
  bestRepLen = 0;

  /* longest rep match; one of at least numFastBytes is taken at once */
  for (r = 0; r < LZMA_NUM_REPS; r++)
  {
    unsigned n;
    const Byte *ref = cur - p->reps[r];
    if (cur[0] != ref[0] || cur[1] != ref[1])
      continue;
    n = 2;
    while (n < avail && cur[n] == ref[n])
      n++;
    if (n >= p->numFastBytes)
    {
      p->backRes = (UInt32)r;
      MOVE_POS(p, n - 1)
      return n;
    }
    if (n > bestRepLen)
    {
      bestRep = r;
      bestRepLen = n;
    }
  }

  if (bestLen >= p->numFastBytes)
  {
    p->backRes = p->matches[(size_t)pairs - 1] + LZMA_NUM_REPS;
    MOVE_POS(p, bestLen - 1)
    return bestLen;
  }

  bestDist = 0; /* for GCC */

  if (bestLen >= 2)
  {
    bestDist = p->matches[(size_t)pairs - 1];
    /* give up one byte of length when that buys a much smaller distance */
    while (pairs > 2 && bestLen == p->matches[(size_t)pairs - 4] + 1)
    {
      const UInt32 shorterDist = p->matches[(size_t)pairs - 3];
      if (!ChangePair(shorterDist, bestDist))
        break;
      pairs -= 2;
      bestLen--;
      bestDist = shorterDist;
    }
    if (bestLen == 2 && bestDist >= 0x80)
      bestLen = 1;
  }

  /* prefer the rep match unless the normal match is sufficiently longer */
  if (bestRepLen >= 2
      && (   bestRepLen + 1 >= bestLen
          || (bestRepLen + 2 >= bestLen && bestDist >= (1 << 9))
          || (bestRepLen + 3 >= bestLen && bestDist >= (1 << 15))))
  {
    p->backRes = (UInt32)bestRep;
    MOVE_POS(p, bestRepLen - 1)
    return bestRepLen;
  }

  if (bestLen < 2 || avail <= 2)
    return 1;

  /* lookahead: emit a literal now if the next position has a better match */
  {
    const unsigned nextLen = ReadMatchDistances(p, &p->numPairs);
    p->longestMatchLen = nextLen;

    if (nextLen >= 2)
    {
      const UInt32 nextDist = p->matches[(size_t)p->numPairs - 1];
      if (nextLen >= bestLen && nextDist < bestDist)
        return 1;
      if (nextLen == bestLen + 1 && !ChangePair(bestDist, nextDist))
        return 1;
      if (nextLen > bestLen + 1)
        return 1;
      if (nextLen + 1 >= bestLen && bestLen >= 3 && ChangePair(nextDist, bestDist))
        return 1;
    }
  }

  cur = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - 1;

  /* also emit a literal if a rep match at the next position covers bestLen - 1 bytes */
  for (r = 0; r < LZMA_NUM_REPS; r++)
  {
    unsigned n, stop;
    const Byte *ref = cur - p->reps[r];
    if (cur[0] != ref[0] || cur[1] != ref[1])
      continue;
    stop = bestLen - 1;
    n = 2;
    while (n < stop && cur[n] == ref[n])
      n++;
    if (n >= stop)
      return 1;
  }

  p->backRes = bestDist + LZMA_NUM_REPS;
  if (bestLen != 2)
  {
    MOVE_POS(p, bestLen - 2)
  }
  return bestLen;
}
1991
1992
1993
1994
1995
/*
  WriteEndMarker: emits the end-of-stream marker through the range coder.

  Sequence written (see the statements below):
    1) isMatch bit = 1 and isRep bit = 0 for the current state / posState,
       then p->state is advanced through kMatchNextStates;
    2) length symbol 0 via LenEnc_Encode on p->lenProbs;
    3) an all-ones walk through p->posSlotEncoder[0];
    4) (30 - kNumAlignBits) direct bits, all ones;
    5) an all-ones walk through p->posAlignEncoder.
  The commented-out calls next to steps 3-5 show the generic helpers that the
  hand-expanded loops stand in for.

  The coder's range is kept in the local `range` while the RC_* macros run and
  is written back to p->rc.range before LenEnc_Encode and at the end.
  NOTE(review): the RC_* macros are defined outside this chunk; they appear to
  work on the locals `range`, `ttt` and `newBound` - confirm.
*/
static void WriteEndMarker(CLzmaEnc *p, unsigned posState)
1996
0
{
1997
0
  UInt32 range;
1998
0
  range = p->rc.range;
1999
0
  {
2000
0
    UInt32 ttt, newBound;
2001
0
    CLzmaProb *prob = &p->isMatch[p->state][posState];
2002
0
    RC_BIT_PRE(&p->rc, prob)
2003
0
    RC_BIT_1(&p->rc, prob)
2004
0
    prob = &p->isRep[p->state];
2005
0
    RC_BIT_PRE(&p->rc, prob)
2006
0
    RC_BIT_0(&p->rc, prob)
2007
0
  }
2008
0
  p->state = kMatchNextStates[p->state];
2009
  
2010
0
  /* LenEnc_Encode works on p->rc directly, so sync the cached range around it */
  p->rc.range = range;
2011
0
  LenEnc_Encode(&p->lenProbs, &p->rc, 0, posState);
2012
0
  range = p->rc.range;
2013
2014
0
  {
2015
    // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[0], (1 << kNumPosSlotBits) - 1);
2016
0
    CLzmaProb *probs = p->posSlotEncoder[0];
2017
0
    unsigned m = 1;
2018
0
    do
2019
0
    {
2020
0
      UInt32 ttt, newBound;
2021
0
      /* NOTE(review): RC_BIT_PRE gets `p` here but `&p->rc` elsewhere in this
         function - presumably the macro ignores its first argument; confirm. */
      RC_BIT_PRE(p, probs + m)
2022
0
      RC_BIT_1(&p->rc, probs + m);
2023
0
      m = (m << 1) + 1;
2024
0
    }
2025
0
    while (m < (1 << kNumPosSlotBits));
2026
0
  }
2027
0
  {
2028
    // RangeEnc_EncodeDirectBits(&p->rc, ((UInt32)1 << (30 - kNumAlignBits)) - 1, 30 - kNumAlignBits);    UInt32 range = p->range;
2029
0
    unsigned numBits = 30 - kNumAlignBits;
2030
0
    do
2031
0
    {
2032
0
      /* direct bit with value 1: halve the range and add it to low */
      range >>= 1;
2033
0
      p->rc.low += range;
2034
0
      RC_NORM(&p->rc)
2035
0
    }
2036
0
    while (--numBits);
2037
0
  }
2038
   
2039
0
  {
2040
    // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, kAlignMask);
2041
0
    CLzmaProb *probs = p->posAlignEncoder;
2042
0
    unsigned m = 1;
2043
0
    do
2044
0
    {
2045
0
      UInt32 ttt, newBound;
2046
0
      RC_BIT_PRE(p, probs + m)
2047
0
      RC_BIT_1(&p->rc, probs + m);
2048
0
      m = (m << 1) + 1;
2049
0
    }
2050
0
    while (m < kAlignTableSize);
2051
0
  }
2052
0
  p->rc.range = range;
2053
0
}
2054
2055
2056
/*
  Folds the range-coder and match-finder status into p->result and returns it.

  An error already stored in p->result is returned untouched. Otherwise a
  range-coder failure (p->rc.res) is reported as SZ_ERROR_WRITE and a
  match-finder failure (p->matchFinderBase.result) as SZ_ERROR_READ; when both
  failed, the read error wins. Any error also marks the encoder as finished.
*/
static SRes CheckErrors(CLzmaEnc *p)
{
  if (p->result == SZ_OK)
  {
    const int writeFailed = (p->rc.res != SZ_OK);
    const int readFailed = (p->matchFinderBase.result != SZ_OK);

    if (readFailed)
      p->result = SZ_ERROR_READ;
    else if (writeFailed)
      p->result = SZ_ERROR_WRITE;

    if (p->result != SZ_OK)
      p->finished = True;
  }
  return p->result;
}
2068
2069
2070
/*
  Terminates the current encoding pass.

  Marks the encoder as finished, writes the end marker when p->writeEndMark is
  set (posState is derived from nowPos and p->pbMask), flushes the range coder
  data and its output stream, and returns the status computed by CheckErrors.
*/
MY_NO_INLINE static SRes Flush(CLzmaEnc *p, UInt32 nowPos)
{
  SRes status;

  p->finished = True;

  if (p->writeEndMark)
  {
    WriteEndMarker(p, nowPos & p->pbMask);
  }

  RangeEnc_FlushData(&p->rc);
  RangeEnc_FlushStream(&p->rc);

  status = CheckErrors(p);
  return status;
}
2080
2081
2082
/*
  Recomputes p->alignPrices[] from the p->posAlignEncoder probabilities.

  For each i in the lower half of the table, the three low bits of i are walked
  through the probability tree (low bit first). The last node then yields two
  entries at once: alignPrices[i] for a final 0 bit and alignPrices[i + 8] for
  a final 1 bit.
*/
MY_NO_INLINE static void FillAlignPrices(CLzmaEnc *p)
{
  /* presumably referenced by name from the GET_PRICEa* macros (it is not used
     directly in this function) - keep the identifier */
  const CProbPrice *ProbPrices = p->ProbPrices;
  const CLzmaProb *probs = p->posAlignEncoder;
  unsigned i;

  for (i = 0; i < kAlignTableSize / 2; i++)
  {
    UInt32 price = 0;
    UInt32 prob;
    unsigned sym = i;
    unsigned m = 1;
    unsigned step;

    for (step = 0; step < 3; step++)
    {
      unsigned bit = sym & 1;
      sym >>= 1;
      price += GET_PRICEa(probs[m], bit);
      m = (m << 1) + bit;
    }

    prob = probs[m];
    p->alignPrices[i    ] = price + GET_PRICEa_0(prob);
    p->alignPrices[i + 8] = price + GET_PRICEa_1(prob);
  }
}
2104
2105
2106
/*
  Rebuilds the distance price tables and resets p->matchPriceCount.

  Pass 1 fills a local table (tempPrices) with the price of the reverse-coded
  footer bits for distances below kNumFullDistances, using p->posEncoders.
  Each iteration produces two entries: one for a final 0 bit and one for a
  final 1 bit.

  Pass 2 runs once per length-to-position state:
    - fills p->posSlotPrices[lps] from p->posSlotEncoder[lps], two slots per
      tree leaf;
    - adds a per-slot constant (growing by one bit price per slot pair) to the
      slots from kEndPosModelIndex upward;
    - combines slot prices with tempPrices into p->distancesPrices[lps].
*/
MY_NO_INLINE static void FillDistancesPrices(CLzmaEnc *p)
{
  UInt32 tempPrices[kNumFullDistances];
  /* presumably referenced by name from the GET_PRICEa* macros - keep the identifier */
  const CProbPrice *ProbPrices = p->ProbPrices;
  unsigned i, lps;

  p->matchPriceCount = 0;

  for (i = kStartPosModelIndex / 2; i < kNumFullDistances / 2; i++)
  {
    const unsigned posSlot = GetPosSlot1(i);
    unsigned bitsLeft = (posSlot >> 1) - 1;
    const unsigned offset = (unsigned)1 << bitsLeft;
    const unsigned base = ((2 | (posSlot & 1)) << bitsLeft);
    const CLzmaProb *probs = p->posEncoders + (size_t)base * 2;
    const unsigned idx = base + i;
    UInt32 price = 0;
    unsigned m = 1;
    unsigned sym = i;

    for (; bitsLeft != 0; bitsLeft--)
    {
      unsigned bit = sym & 1;
      sym >>= 1;
      price += GET_PRICEa(probs[m], bit);
      m = (m << 1) + bit;
    }

    {
      unsigned prob = probs[m];
      tempPrices[idx         ] = price + GET_PRICEa_0(prob);
      tempPrices[idx + offset] = price + GET_PRICEa_1(prob);
    }
  }

  for (lps = 0; lps < kNumLenToPosStates; lps++)
  {
    const unsigned halfSlots = (p->distTableSize + 1) >> 1;
    UInt32 *slotPrices = p->posSlotPrices[lps];
    const CLzmaProb *probs = p->posSlotEncoder[lps];
    UInt32 *dp = p->distancesPrices[lps];
    unsigned slot;

    for (slot = 0; slot < halfSlots; slot++)
    {
      UInt32 price = 0;
      unsigned sym = slot + (1 << (kNumPosSlotBits - 1));
      unsigned prob;
      unsigned level;

      /* walk from the node above the leaf pair up to the root */
      for (level = 0; level < 5; level++)
      {
        unsigned bit = sym & 1;
        sym >>= 1;
        price += GET_PRICEa(probs[sym], bit);
      }

      prob = probs[(size_t)slot + (1 << (kNumPosSlotBits - 1))];
      slotPrices[(size_t)slot * 2    ] = price + GET_PRICEa_0(prob);
      slotPrices[(size_t)slot * 2 + 1] = price + GET_PRICEa_1(prob);
    }

    {
      UInt32 delta = ((UInt32)((kEndPosModelIndex / 2 - 1) - kNumAlignBits) << kNumBitPriceShiftBits);
      slot = kEndPosModelIndex / 2;
      while (slot < halfSlots)
      {
        slotPrices[(size_t)slot * 2    ] += delta;
        slotPrices[(size_t)slot * 2 + 1] += delta;
        delta += ((UInt32)1 << kNumBitPriceShiftBits);
        slot++;
      }
    }

    /* the first four distances are taken from the slot prices unchanged */
    for (i = 0; i < 4; i++)
      dp[i] = slotPrices[i];

    for (i = 4; i < kNumFullDistances; i += 2)
    {
      const UInt32 slotPrice = slotPrices[GetPosSlot1(i)];
      dp[i    ] = slotPrice + tempPrices[i];
      dp[i + 1] = slotPrice + tempPrices[i + 1];
    }
  }
}
2198
2199
2200
2201
/*
  Puts a raw CLzmaEnc into its initial state: constructs the range coder and
  match finder(s), applies the default properties produced by
  LzmaEncProps_Init, builds the lookup tables and clears the literal
  probability pointers (nothing is allocated here).
*/
void LzmaEnc_Construct(CLzmaEnc *p)
{
  CLzmaEncProps defaults;

  RangeEnc_Construct(&p->rc);
  MatchFinder_Construct(&p->matchFinderBase);

  #ifndef _7ZIP_ST
  MatchFinderMt_Construct(&p->matchFinderMt);
  p->matchFinderMt.MatchFinder = &p->matchFinderBase;
  #endif

  LzmaEncProps_Init(&defaults);
  LzmaEnc_SetProps(p, &defaults);

  p->litProbs = NULL;
  p->saveState.litProbs = NULL;

  #ifndef LZMA_LOG_BSR
  LzmaEnc_FastPosInit(p->g_FastPos);
  #endif

  LzmaEnc_InitPriceTables(p->ProbPrices);
}
2226
2227
/*
  Allocates a CLzmaEnc with `alloc` and constructs it.
  Returns the new handle, or NULL when the allocation fails.
*/
CLzmaEncHandle LzmaEnc_Create(ISzAllocPtr alloc)
{
  CLzmaEnc *enc = (CLzmaEnc *)ISzAlloc_Alloc(alloc, sizeof(CLzmaEnc));
  if (!enc)
    return NULL;
  LzmaEnc_Construct(enc);
  return enc;
}
2235
2236
/*
  Releases both literal probability arrays (the live one and the one in
  saveState) through `alloc` and resets the pointers to NULL.
*/
void LzmaEnc_FreeLits(CLzmaEnc *p, ISzAllocPtr alloc)
{
  ISzAlloc_Free(alloc, p->litProbs);
  p->litProbs = NULL;

  ISzAlloc_Free(alloc, p->saveState.litProbs);
  p->saveState.litProbs = NULL;
}
2243
2244
/*
  Frees everything owned by the encoder without freeing the CLzmaEnc itself.
  Match-finder memory is released with `allocBig`; the literal probability
  arrays and the range coder are released with `alloc`.
*/
void LzmaEnc_Destruct(CLzmaEnc *p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  #ifndef _7ZIP_ST
  MatchFinderMt_Destruct(&p->matchFinderMt, allocBig);
  #endif

  /* big allocations first */
  MatchFinder_Free(&p->matchFinderBase, allocBig);

  /* then the small ones */
  LzmaEnc_FreeLits(p, alloc);
  RangeEnc_Free(&p->rc, alloc);
}
2254
2255
/*
  Counterpart of LzmaEnc_Create: destructs the encoder behind the handle and
  then frees the CLzmaEnc object itself with `alloc`.
*/
void LzmaEnc_Destroy(CLzmaEncHandle p, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)p;

  LzmaEnc_Destruct(enc, alloc, allocBig);
  ISzAlloc_Free(alloc, p);
}
2260
2261
2262
/*
  LzmaEnc_CodeOneBlock: encodes input until a stop condition is met.

  Parameters:
    maxPackSize   - when non-zero, the loop stops once
                    processed + kNumOpts + 300 >= maxUnpackSize or the range
                    coder's processed size + kPackReserve >= maxPackSize.
                    When zero, the function returns after at least (1 << 17)
                    input bytes have been processed in this call.
    maxUnpackSize - only consulted when maxPackSize != 0.

  Returns:
    p->result immediately if the encoder is already finished; the CheckErrors
    status on the early "(1 << 17) bytes processed" return (stream NOT flushed);
    otherwise the Flush status (Flush marks the encoder as finished).

  p->nowPos64 is advanced by the number of bytes consumed in this call.

  NOTE(review): the RC_BIT_* and RC_NORM macros are defined outside this chunk;
  they appear to operate on the locals `range`, `ttt` and `newBound`, which is
  why the coder range is copied in and out of p->rc.range around them - confirm.
*/
static SRes LzmaEnc_CodeOneBlock(CLzmaEnc *p, UInt32 maxPackSize, UInt32 maxUnpackSize)
2263
16.3k
{
2264
16.3k
  UInt32 nowPos32, startPos32;
2265
16.3k
  /* lazy one-time initialisation of the match finder */
  if (p->needInit)
2266
8.13k
  {
2267
8.13k
    p->matchFinder.Init(p->matchFinderObj);
2268
8.13k
    p->needInit = 0;
2269
8.13k
  }
2270
2271
16.3k
  if (p->finished)
2272
0
    return p->result;
2273
16.3k
  RINOK(CheckErrors(p));
2274
2275
16.3k
  nowPos32 = (UInt32)p->nowPos64;
2276
16.3k
  startPos32 = nowPos32;
2277
2278
16.3k
  /* very first byte of the stream: always emitted as a plain literal */
  if (p->nowPos64 == 0)
2279
8.13k
  {
2280
8.13k
    unsigned numPairs;
2281
8.13k
    Byte curByte;
2282
8.13k
    if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2283
0
      return Flush(p, nowPos32);
2284
8.13k
    ReadMatchDistances(p, &numPairs);
2285
8.13k
    RangeEnc_EncodeBit_0(&p->rc, &p->isMatch[kState_Start][0]);
2286
    // p->state = kLiteralNextStates[p->state];
2287
8.13k
    curByte = *(p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset);
2288
8.13k
    LitEnc_Encode(&p->rc, p->litProbs, curByte);
2289
8.13k
    p->additionalOffset--;
2290
8.13k
    nowPos32++;
2291
8.13k
  }
2292
2293
16.3k
  if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) != 0)
2294
  
2295
8.15k
  /* main loop: one literal / rep / match per iteration */
  for (;;)
2296
7.72M
  {
2297
7.72M
    UInt32 dist;
2298
7.72M
    unsigned len, posState;
2299
7.72M
    UInt32 range, ttt, newBound;
2300
7.72M
    CLzmaProb *probs;
2301
  
2302
7.72M
    /* pick the next symbol: fast parser, optimal parser, or the next entry
       of the already computed p->opt[] sequence; the choice is returned as
       `len` plus p->backRes */
    if (p->fastMode)
2303
3.32M
      len = GetOptimumFast(p);
2304
4.40M
    else
2305
4.40M
    {
2306
4.40M
      unsigned oci = p->optCur;
2307
4.40M
      if (p->optEnd == oci)
2308
2.73M
        len = GetOptimum(p, nowPos32);
2309
1.66M
      else
2310
1.66M
      {
2311
1.66M
        const COptimal *opt = &p->opt[oci];
2312
1.66M
        len = opt->len;
2313
1.66M
        p->backRes = opt->dist;
2314
1.66M
        p->optCur = oci + 1;
2315
1.66M
      }
2316
4.40M
    }
2317
2318
7.72M
    posState = (unsigned)nowPos32 & p->pbMask;
2319
7.72M
    range = p->rc.range;
2320
7.72M
    probs = &p->isMatch[p->state][posState];
2321
    
2322
7.72M
    RC_BIT_PRE(&p->rc, probs)
2323
    
2324
7.72M
    dist = p->backRes;
2325
2326
    #ifdef SHOW_STAT2
2327
    printf("\n pos = %6X, len = %3u  pos = %6u", nowPos32, len, dist);
2328
    #endif
2329
2330
7.72M
    /* --- literal --- */
    if (dist == MARK_LIT)
2331
6.16M
    {
2332
6.16M
      Byte curByte;
2333
6.16M
      const Byte *data;
2334
6.16M
      unsigned state;
2335
2336
6.16M
      RC_BIT_0(&p->rc, probs);
2337
6.16M
      p->rc.range = range;
2338
6.16M
      data = p->matchFinder.GetPointerToCurrentPos(p->matchFinderObj) - p->additionalOffset;
2339
6.16M
      probs = LIT_PROBS(nowPos32, *(data - 1));
2340
6.16M
      curByte = *data;
2341
6.16M
      state = p->state;
2342
6.16M
      p->state = kLiteralNextStates[state];
2343
6.16M
      /* the previous (pre-update) state selects plain vs matched literal coding */
      if (IsLitState(state))
2344
5.73M
        LitEnc_Encode(&p->rc, probs, curByte);
2345
434k
      else
2346
434k
        LitEnc_EncodeMatched(&p->rc, probs, curByte, *(data - p->reps[0]));
2347
6.16M
    }
2348
1.55M
    else
2349
1.55M
    {
2350
1.55M
      RC_BIT_1(&p->rc, probs);
2351
1.55M
      probs = &p->isRep[p->state];
2352
1.55M
      RC_BIT_PRE(&p->rc, probs)
2353
      
2354
1.55M
      /* --- repeated match: dist is an index into p->reps[] --- */
      if (dist < LZMA_NUM_REPS)
2355
644k
      {
2356
644k
        RC_BIT_1(&p->rc, probs);
2357
644k
        probs = &p->isRepG0[p->state];
2358
644k
        RC_BIT_PRE(&p->rc, probs)
2359
644k
        if (dist == 0)
2360
211k
        {
2361
211k
          RC_BIT_0(&p->rc, probs);
2362
211k
          probs = &p->isRep0Long[p->state][posState];
2363
211k
          RC_BIT_PRE(&p->rc, probs)
2364
211k
          if (len != 1)
2365
140k
          {
2366
140k
            RC_BIT_1_BASE(&p->rc, probs);
2367
140k
          }
2368
71.0k
          else
2369
71.0k
          {
2370
71.0k
            /* rep0 with len == 1 (short rep): no length is encoded below */
            RC_BIT_0_BASE(&p->rc, probs);
2371
71.0k
            p->state = kShortRepNextStates[p->state];
2372
71.0k
          }
2373
211k
        }
2374
433k
        else
2375
433k
        {
2376
433k
          /* rep1..rep3: encode which one, then move it to the front of p->reps[] */
          RC_BIT_1(&p->rc, probs);
2377
433k
          probs = &p->isRepG1[p->state];
2378
433k
          RC_BIT_PRE(&p->rc, probs)
2379
433k
          if (dist == 1)
2380
191k
          {
2381
191k
            RC_BIT_0_BASE(&p->rc, probs);
2382
191k
            dist = p->reps[1];
2383
191k
          }
2384
242k
          else
2385
242k
          {
2386
242k
            RC_BIT_1(&p->rc, probs);
2387
242k
            probs = &p->isRepG2[p->state];
2388
242k
            RC_BIT_PRE(&p->rc, probs)
2389
242k
            if (dist == 2)
2390
136k
            {
2391
136k
              RC_BIT_0_BASE(&p->rc, probs);
2392
136k
              dist = p->reps[2];
2393
136k
            }
2394
105k
            else
2395
105k
            {
2396
105k
              RC_BIT_1_BASE(&p->rc, probs);
2397
105k
              dist = p->reps[3];
2398
105k
              p->reps[3] = p->reps[2];
2399
105k
            }
2400
242k
            p->reps[2] = p->reps[1];
2401
242k
          }
2402
433k
          p->reps[1] = p->reps[0];
2403
433k
          p->reps[0] = dist;
2404
433k
        }
2405
2406
644k
        /* the *_BASE variants above leave normalisation to this single RC_NORM */
        RC_NORM(&p->rc)
2407
2408
644k
        p->rc.range = range;
2409
2410
644k
        if (len != 1)
2411
573k
        {
2412
573k
          LenEnc_Encode(&p->repLenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2413
573k
          --p->repLenEncCounter;
2414
573k
          p->state = kRepNextStates[p->state];
2415
573k
        }
2416
644k
      }
2417
911k
      else
2418
911k
      {
2419
911k
        /* --- new match: length, then distance (slot + footer bits) --- */
        unsigned posSlot;
2420
911k
        RC_BIT_0(&p->rc, probs);
2421
911k
        p->rc.range = range;
2422
911k
        p->state = kMatchNextStates[p->state];
2423
2424
911k
        LenEnc_Encode(&p->lenProbs, &p->rc, len - LZMA_MATCH_LEN_MIN, posState);
2425
        // --p->lenEnc.counter;
2426
2427
911k
        /* backRes carries distance + LZMA_NUM_REPS; reps[] stores distance + 1 */
        dist -= LZMA_NUM_REPS;
2428
911k
        p->reps[3] = p->reps[2];
2429
911k
        p->reps[2] = p->reps[1];
2430
911k
        p->reps[1] = p->reps[0];
2431
911k
        p->reps[0] = dist + 1;
2432
        
2433
911k
        p->matchPriceCount++;
2434
911k
        GetPosSlot(dist, posSlot);
2435
        // RcTree_Encode_PosSlot(&p->rc, p->posSlotEncoder[GetLenToPosState(len)], posSlot);
2436
911k
        {
2437
911k
          UInt32 sym = (UInt32)posSlot + (1 << kNumPosSlotBits);
2438
911k
          range = p->rc.range;
2439
911k
          probs = p->posSlotEncoder[GetLenToPosState(len)];
2440
911k
          do
2441
5.47M
          {
2442
5.47M
            CLzmaProb *prob = probs + (sym >> kNumPosSlotBits);
2443
5.47M
            UInt32 bit = (sym >> (kNumPosSlotBits - 1)) & 1;
2444
5.47M
            sym <<= 1;
2445
5.47M
            RC_BIT(&p->rc, prob, bit);
2446
5.47M
          }
2447
5.47M
          while (sym < (1 << kNumPosSlotBits * 2));
2448
911k
          p->rc.range = range;
2449
911k
        }
2450
        
2451
911k
        if (dist >= kStartPosModelIndex)
2452
646k
        {
2453
646k
          unsigned footerBits = ((posSlot >> 1) - 1);
2454
2455
646k
          if (dist < kNumFullDistances)
2456
462k
          {
2457
462k
            unsigned base = ((2 | (posSlot & 1)) << footerBits);
2458
462k
            RcTree_ReverseEncode(&p->rc, p->posEncoders + base, footerBits, (unsigned)(dist /* - base */));
2459
462k
          }
2460
184k
          else
2461
184k
          {
2462
184k
            /* presumably: the footer bits are moved to the top of pos2 with a
               0xF sentinel below them, so the loop ends (pos2 == 0xF0000000)
               once every bit above the low four has been emitted - confirm */
            UInt32 pos2 = (dist | 0xF) << (32 - footerBits);
2463
184k
            range = p->rc.range;
2464
            // RangeEnc_EncodeDirectBits(&p->rc, posReduced >> kNumAlignBits, footerBits - kNumAlignBits);
2465
            /*
2466
            do
2467
            {
2468
              range >>= 1;
2469
              p->rc.low += range & (0 - ((dist >> --footerBits) & 1));
2470
              RC_NORM(&p->rc)
2471
            }
2472
            while (footerBits > kNumAlignBits);
2473
            */
2474
184k
            do
2475
767k
            {
2476
767k
              range >>= 1;
2477
767k
              p->rc.low += range & (0 - (pos2 >> 31));
2478
767k
              pos2 += pos2;
2479
767k
              RC_NORM(&p->rc)
2480
767k
            }
2481
767k
            while (pos2 != 0xF0000000);
2482
2483
2484
            // RcTree_ReverseEncode(&p->rc, p->posAlignEncoder, kNumAlignBits, posReduced & kAlignMask);
2485
2486
184k
            /* low four bits of dist, low bit first, through p->posAlignEncoder */
            {
2487
184k
              unsigned m = 1;
2488
184k
              unsigned bit;
2489
184k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2490
184k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2491
184k
              bit = dist & 1; dist >>= 1; RC_BIT(&p->rc, p->posAlignEncoder + m, bit); m = (m << 1) + bit;
2492
184k
              bit = dist & 1;             RC_BIT(&p->rc, p->posAlignEncoder + m, bit);
2493
184k
              p->rc.range = range;
2494
              // p->alignPriceCount++;
2495
184k
            }
2496
184k
          }
2497
646k
        }
2498
911k
      }
2499
1.55M
    }
2500
2501
7.72M
    nowPos32 += (UInt32)len;
2502
7.72M
    p->additionalOffset -= len;
2503
    
2504
7.72M
    /* price refresh and stop checks run only when additionalOffset is back at 0 */
    if (p->additionalOffset == 0)
2505
5.93M
    {
2506
5.93M
      UInt32 processed;
2507
2508
5.93M
      if (!p->fastMode)
2509
2.70M
      {
2510
        /*
2511
        if (p->alignPriceCount >= 16) // kAlignTableSize
2512
          FillAlignPrices(p);
2513
        if (p->matchPriceCount >= 128)
2514
          FillDistancesPrices(p);
2515
        if (p->lenEnc.counter <= 0)
2516
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2517
        */
2518
2.70M
        /* refresh the price tables after 64 new matches (FillDistancesPrices resets the counter) */
        if (p->matchPriceCount >= 64)
2519
9.54k
        {
2520
9.54k
          FillAlignPrices(p);
2521
          // { int y; for (y = 0; y < 100; y++) {
2522
9.54k
          FillDistancesPrices(p);
2523
          // }}
2524
9.54k
          LenPriceEnc_UpdateTables(&p->lenEnc, 1 << p->pb, &p->lenProbs, p->ProbPrices);
2525
9.54k
        }
2526
2.70M
        if (p->repLenEncCounter <= 0)
2527
3.34k
        {
2528
3.34k
          p->repLenEncCounter = REP_LEN_COUNT;
2529
3.34k
          LenPriceEnc_UpdateTables(&p->repLenEnc, 1 << p->pb, &p->repLenProbs, p->ProbPrices);
2530
3.34k
        }
2531
2.70M
      }
2532
    
2533
5.93M
      /* input exhausted: leave the loop and flush */
      if (p->matchFinder.GetNumAvailableBytes(p->matchFinderObj) == 0)
2534
8.09k
        break;
2535
5.92M
      processed = nowPos32 - startPos32;
2536
      
2537
5.92M
      if (maxPackSize)
2538
5.92M
      {
2539
5.92M
        /* size-limited mode: stop (and flush) before either limit can be exceeded */
        if (processed + kNumOpts + 300 >= maxUnpackSize
2540
5.92M
            || RangeEnc_GetProcessed_sizet(&p->rc) + kPackReserve >= maxPackSize)
2541
67
          break;
2542
5.92M
      }
2543
0
      else if (processed >= (1 << 17))
2544
0
      {
2545
0
        /* unlimited mode: return to the caller without flushing */
        p->nowPos64 += nowPos32 - startPos32;
2546
0
        return CheckErrors(p);
2547
0
      }
2548
5.92M
    }
2549
7.72M
  }
2550
2551
16.3k
  p->nowPos64 += nowPos32 - startPos32;
2552
16.3k
  return Flush(p, nowPos32);
2553
16.3k
}
2554
2555
2556
2557
8.13k
/* Dictionary-size threshold (1 << 24 bytes): LzmaEnc_Alloc sets
   matchFinderBase.bigHash when p->dictSize is larger than this. */
#define kBigHashDicLimit ((UInt32)1 << 24)
2558
2559
/*
  Allocates (or re-uses) every buffer the encoder needs for the current
  properties.

  - the range coder buffer (via `alloc`);
  - both literal probability arrays, 0x300 << (lc + lp) entries each; they are
    re-allocated only when missing or when lc + lp changed since the last call;
  - the match finder (via `allocBig`), single- or multi-threaded, whose vtable
    is installed in p->matchFinder.

  keepWindowSize enlarges the "keep before" area of the match finder when
  kNumOpts + dictSize is smaller than it.

  Returns SZ_OK, SZ_ERROR_MEM on allocation failure, or (multi-threaded build)
  the error returned by MatchFinderMt_Create.
*/
static SRes LzmaEnc_Alloc(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  UInt32 beforeSize = kNumOpts;
  const unsigned lclp = p->lc + p->lp;

  if (!RangeEnc_Alloc(&p->rc, alloc))
    return SZ_ERROR_MEM;

  #ifndef _7ZIP_ST
  p->mtMode = (p->multiThread && !p->fastMode && (p->matchFinderBase.btMode != 0));
  #endif

  if (!p->litProbs || !p->saveState.litProbs || p->lclp != lclp)
  {
    const size_t litBytes = ((UInt32)0x300 << lclp) * sizeof(CLzmaProb);

    LzmaEnc_FreeLits(p, alloc);
    p->litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, litBytes);
    p->saveState.litProbs = (CLzmaProb *)ISzAlloc_Alloc(alloc, litBytes);

    if (!p->litProbs || !p->saveState.litProbs)
    {
      /* one of the two may have succeeded - release it */
      LzmaEnc_FreeLits(p, alloc);
      return SZ_ERROR_MEM;
    }
    p->lclp = lclp;
  }

  p->matchFinderBase.bigHash = (Byte)(p->dictSize > kBigHashDicLimit ? 1 : 0);

  if (beforeSize + p->dictSize < keepWindowSize)
    beforeSize = keepWindowSize - p->dictSize;

  #ifndef _7ZIP_ST
  if (p->mtMode)
  {
    RINOK(MatchFinderMt_Create(&p->matchFinderMt, p->dictSize, beforeSize, p->numFastBytes,
        LZMA_MATCH_LEN_MAX
        + 1  /* 18.04 */
        , allocBig));
    p->matchFinderObj = &p->matchFinderMt;
    p->matchFinderBase.bigHash = (Byte)(
        (p->dictSize > kBigHashDicLimit && p->matchFinderBase.hashMask >= 0xFFFFFF) ? 1 : 0);
    MatchFinderMt_CreateVTable(&p->matchFinderMt, &p->matchFinder);
    return SZ_OK;
  }
  #endif

  if (!MatchFinder_Create(&p->matchFinderBase, p->dictSize, beforeSize, p->numFastBytes, LZMA_MATCH_LEN_MAX, allocBig))
    return SZ_ERROR_MEM;
  p->matchFinderObj = &p->matchFinderBase;
  MatchFinder_CreateVTable(&p->matchFinderBase, &p->matchFinder);

  return SZ_OK;
}
2613
2614
/*
  Resets the coding state of the encoder: state machine, rep distances, range
  coder, every probability model (set to kProbInitValue), the length encoders,
  the optimal-parser buffer and the position masks derived from pb / lp / lc.

  p->litProbs must already be allocated for the current lc + lp.
*/
void LzmaEnc_Init(CLzmaEnc *p)
{
  unsigned i, j;

  p->state = 0;
  for (i = 0; i < 4; i++)
    p->reps[i] = 1;

  RangeEnc_Init(&p->rc);

  for (i = 0; i < (1 << kNumAlignBits); i++)
    p->posAlignEncoder[i] = kProbInitValue;

  /* per-state models */
  for (i = 0; i < kNumStates; i++)
  {
    for (j = 0; j < LZMA_NUM_PB_STATES_MAX; j++)
    {
      p->isMatch[i][j] = kProbInitValue;
      p->isRep0Long[i][j] = kProbInitValue;
    }
    p->isRep[i] = kProbInitValue;
    p->isRepG0[i] = kProbInitValue;
    p->isRepG1[i] = kProbInitValue;
    p->isRepG2[i] = kProbInitValue;
  }

  /* distance models */
  for (i = 0; i < kNumLenToPosStates; i++)
  {
    CLzmaProb *slotProbs = p->posSlotEncoder[i];
    for (j = 0; j < (1 << kNumPosSlotBits); j++)
      slotProbs[j] = kProbInitValue;
  }

  for (i = 0; i < kNumFullDistances; i++)
    p->posEncoders[i] = kProbInitValue;

  /* literal models */
  {
    const UInt32 litCount = (UInt32)0x300 << (p->lp + p->lc);
    CLzmaProb *lit = p->litProbs;
    UInt32 k = 0;
    while (k < litCount)
    {
      lit[k] = kProbInitValue;
      k++;
    }
  }

  LenEnc_Init(&p->lenProbs);
  LenEnc_Init(&p->repLenProbs);

  p->optEnd = 0;
  p->optCur = 0;

  for (i = 0; i < kNumOpts; i++)
    p->opt[i].price = kInfinityPrice;

  p->additionalOffset = 0;

  p->pbMask = (1 << p->pb) - 1;
  p->lpMask = ((UInt32)0x100 << p->lp) - ((unsigned)0x100 >> p->lc);
}
2681
2682
2683
/*
  Rebuilds the price tables from the current probability models.

  The distance and align price tables are only filled when the encoder is not
  in fast mode. The length price tables (match and rep) are always rebuilt,
  with a table size of numFastBytes + 1 - LZMA_MATCH_LEN_MIN, and the rep
  length refresh counter is re-armed with REP_LEN_COUNT.
*/
void LzmaEnc_InitPrices(CLzmaEnc *p)
{
  const unsigned numPosStates = 1 << p->pb;

  if (p->fastMode == 0)
  {
    FillDistancesPrices(p);
    FillAlignPrices(p);
  }

  p->repLenEnc.tableSize = p->numFastBytes + 1 - LZMA_MATCH_LEN_MIN;
  p->lenEnc.tableSize = p->repLenEnc.tableSize;

  p->repLenEncCounter = REP_LEN_COUNT;

  LenPriceEnc_UpdateTables(&p->lenEnc, numPosStates, &p->lenProbs, p->ProbPrices);
  LenPriceEnc_UpdateTables(&p->repLenEnc, numPosStates, &p->repLenProbs, p->ProbPrices);
}
2700
2701
/*
  Common tail of the LzmaEnc_*Prepare* functions.

  Derives p->distTableSize from the dictionary size (twice the smallest
  exponent i, starting at kEndPosModelIndex / 2 and capped at kDicLogSizeMax,
  with dictSize <= 2^i), clears the finished / result flags, allocates the
  buffers, resets the models and price tables, and rewinds the position to 0.

  Returns SZ_OK or the error from LzmaEnc_Alloc.
*/
static SRes LzmaEnc_AllocAndInit(CLzmaEnc *p, UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  unsigned logSize = kEndPosModelIndex / 2;

  while (logSize < kDicLogSizeMax && p->dictSize > ((UInt32)1 << logSize))
    logSize++;
  p->distTableSize = logSize * 2;

  p->finished = False;
  p->result = SZ_OK;

  RINOK(LzmaEnc_Alloc(p, keepWindowSize, alloc, allocBig));

  LzmaEnc_Init(p);
  LzmaEnc_InitPrices(p);
  p->nowPos64 = 0;

  return SZ_OK;
}
2717
2718
/*
  Prepares the encoder for stream-to-stream encoding: attaches the input
  stream to the match finder and the output stream to the range coder,
  requests match-finder initialisation, then allocates and initialises the
  encoder with no extra window to keep.
*/
static SRes LzmaEnc_Prepare(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream,
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;

  enc->rc.outStream = outStream;
  enc->matchFinderBase.stream = inStream;
  enc->needInit = 1;

  return LzmaEnc_AllocAndInit(enc, 0, alloc, allocBig);
}
2727
2728
SRes LzmaEnc_PrepareForLzma2(CLzmaEncHandle pp,
2729
    ISeqInStream *inStream, UInt32 keepWindowSize,
2730
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
2731
8.13k
{
2732
8.13k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2733
8.13k
  p->matchFinderBase.stream = inStream;
2734
8.13k
  p->needInit = 1;
2735
8.13k
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2736
8.13k
}
2737
2738
/*
  Switches the match finder to direct-input mode: it reads from the caller's
  buffer `src` of `srcLen` bytes instead of from a stream.
*/
static void LzmaEnc_SetInputBuf(CLzmaEnc *p, const Byte *src, SizeT srcLen)
{
  p->matchFinderBase.bufferBase = (Byte *)src;
  p->matchFinderBase.directInputRem = srcLen;
  p->matchFinderBase.directInput = 1;
}
2744
2745
SRes LzmaEnc_MemPrepare(CLzmaEncHandle pp, const Byte *src, SizeT srcLen,
2746
    UInt32 keepWindowSize, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2747
0
{
2748
0
  CLzmaEnc *p = (CLzmaEnc *)pp;
2749
0
  LzmaEnc_SetInputBuf(p, src, srcLen);
2750
0
  p->needInit = 1;
2751
2752
0
  LzmaEnc_SetDataSize(pp, srcLen);
2753
0
  return LzmaEnc_AllocAndInit(p, keepWindowSize, alloc, allocBig);
2754
0
}
2755
2756
/*
  Ends an encoding session. In multi-threaded builds the match-finder stream
  is released when mtMode is active; single-threaded builds do nothing.
*/
void LzmaEnc_Finish(CLzmaEncHandle pp)
{
  #ifdef _7ZIP_ST
  UNUSED_VAR(pp);
  #else
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  if (enc->mtMode)
    MatchFinderMt_ReleaseStream(&enc->matchFinderMt);
  #endif
}
2766
2767
2768
/* Output stream that writes into a caller-supplied memory buffer
   (used together with SeqOutStreamBuf_Write). */
typedef struct
2769
{
2770
  /* stream interface; SeqOutStreamBuf_Write recovers this struct from it */
  ISeqOutStream vt;
2771
  /* next write position in the destination buffer */
  Byte *data;
2772
  /* number of bytes still free after `data` */
  SizeT rem;
2773
  /* set to True once a write had to be truncated */
  BoolInt overflow;
2774
} CLzmaEnc_SeqOutStreamBuf;
2775
2776
static size_t SeqOutStreamBuf_Write(const ISeqOutStream *pp, const void *data, size_t size)
2777
16.3k
{
2778
16.3k
  CLzmaEnc_SeqOutStreamBuf *p = CONTAINER_FROM_VTBL(pp, CLzmaEnc_SeqOutStreamBuf, vt);
2779
16.3k
  if (p->rem < size)
2780
0
  {
2781
0
    size = p->rem;
2782
0
    p->overflow = True;
2783
0
  }
2784
16.3k
  memcpy(p->data, data, size);
2785
16.3k
  p->rem -= size;
2786
16.3k
  p->data += size;
2787
16.3k
  return size;
2788
16.3k
}
2789
2790
2791
/* Returns what the active match finder reports as the number of available input bytes. */
UInt32 LzmaEnc_GetNumAvailableBytes(CLzmaEncHandle pp)
{
  const CLzmaEnc *enc = (CLzmaEnc *)pp;
  UInt32 avail = enc->matchFinder.GetNumAvailableBytes(enc->matchFinderObj);
  return avail;
}
2796
2797
2798
/*
  Returns the match finder's current position pointer moved back by
  p->additionalOffset.
*/
const Byte *LzmaEnc_GetCurBuf(CLzmaEncHandle pp)
{
  const CLzmaEnc *enc = (CLzmaEnc *)pp;
  const Byte *cur = enc->matchFinder.GetPointerToCurrentPos(enc->matchFinderObj);
  return cur - enc->additionalOffset;
}
2803
2804
2805
SRes LzmaEnc_CodeOneMemBlock(CLzmaEncHandle pp, BoolInt reInit,
2806
    Byte *dest, size_t *destLen, UInt32 desiredPackSize, UInt32 *unpackSize)
2807
16.3k
{
2808
16.3k
  CLzmaEnc *p = (CLzmaEnc *)pp;
2809
16.3k
  UInt64 nowPos64;
2810
16.3k
  SRes res;
2811
16.3k
  CLzmaEnc_SeqOutStreamBuf outStream;
2812
2813
16.3k
  outStream.vt.Write = SeqOutStreamBuf_Write;
2814
16.3k
  outStream.data = dest;
2815
16.3k
  outStream.rem = *destLen;
2816
16.3k
  outStream.overflow = False;
2817
2818
16.3k
  p->writeEndMark = False;
2819
16.3k
  p->finished = False;
2820
16.3k
  p->result = SZ_OK;
2821
2822
16.3k
  if (reInit)
2823
10.1k
    LzmaEnc_Init(p);
2824
16.3k
  LzmaEnc_InitPrices(p);
2825
2826
16.3k
  nowPos64 = p->nowPos64;
2827
16.3k
  RangeEnc_Init(&p->rc);
2828
16.3k
  p->rc.outStream = &outStream.vt;
2829
2830
16.3k
  if (desiredPackSize == 0)
2831
0
    return SZ_ERROR_OUTPUT_EOF;
2832
2833
16.3k
  res = LzmaEnc_CodeOneBlock(p, desiredPackSize, *unpackSize);
2834
  
2835
16.3k
  *unpackSize = (UInt32)(p->nowPos64 - nowPos64);
2836
16.3k
  *destLen -= outStream.rem;
2837
16.3k
  if (outStream.overflow)
2838
0
    return SZ_ERROR_OUTPUT_EOF;
2839
2840
16.3k
  return res;
2841
16.3k
}
2842
2843
2844
/*
  Drives LzmaEnc_CodeOneBlock until the encoder reports that it is finished or
  an error occurs, calling the optional progress callback between blocks with
  the current input position and the range coder's processed size.

  A non-OK result from the progress callback stops encoding with
  SZ_ERROR_PROGRESS. LzmaEnc_Finish is always called before returning.
*/
static SRes LzmaEnc_Encode2(CLzmaEnc *p, ICompressProgress *progress)
{
  SRes res = SZ_OK;

  #ifndef _7ZIP_ST
  Byte allocaDummy[0x300];
  allocaDummy[0] = 0;
  allocaDummy[1] = allocaDummy[0];
  #endif

  while (res == SZ_OK)
  {
    res = LzmaEnc_CodeOneBlock(p, 0, 0);
    if (res != SZ_OK || p->finished)
      break;

    if (progress
        && ICompressProgress_Progress(progress, p->nowPos64, RangeEnc_GetProcessed(&p->rc)) != SZ_OK)
    {
      res = SZ_ERROR_PROGRESS;
      break;
    }
  }

  LzmaEnc_Finish(p);

  return res;
}
2880
2881
2882
/*
  Stream-to-stream encoding entry point: prepares the encoder for the given
  streams and allocators, then runs the block loop. Returns the preparation
  error if preparation fails, otherwise the result of LzmaEnc_Encode2.
*/
SRes LzmaEnc_Encode(CLzmaEncHandle pp, ISeqOutStream *outStream, ISeqInStream *inStream, ICompressProgress *progress,
    ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;

  RINOK(LzmaEnc_Prepare(pp, outStream, inStream, alloc, allocBig));

  return LzmaEnc_Encode2(enc, progress);
}
2888
2889
2890
/*
  Writes the LZMA_PROPS_SIZE-byte properties header into `props`.

  Parameters:
    props - destination buffer.
    size  - capacity of `props` on entry; set to LZMA_PROPS_SIZE on success.

  Layout written:
    props[0]    = (pb * 5 + lp) * 9 + lc
    props[1..4] = dictionary size, little-endian, rounded up:
                  - dictSize >= 2^22: to the next multiple of 2^20 (skipped
                    when the addition would overflow);
                  - otherwise: to the next value of the form 2^n or 3 * 2^(n-1).

  Returns SZ_ERROR_PARAM when *size is too small, SZ_OK otherwise.
*/
SRes LzmaEnc_WriteProperties(CLzmaEncHandle pp, Byte *props, SizeT *size)
{
  CLzmaEnc *p = (CLzmaEnc *)pp;
  unsigned i;
  UInt32 dictSize = p->dictSize;
  if (*size < LZMA_PROPS_SIZE)
    return SZ_ERROR_PARAM;
  *size = LZMA_PROPS_SIZE;
  props[0] = (Byte)((p->pb * 5 + p->lp) * 9 + p->lc);

  if (dictSize >= ((UInt32)1 << 22))
  {
    const UInt32 kDictMask = ((UInt32)1 << 20) - 1;
    if (dictSize < (UInt32)0xFFFFFFFF - kDictMask)
      dictSize = (dictSize + kDictMask) & ~kDictMask;
  }
  else for (i = 11; i <= 30; i++)
  {
    /* shift in UInt32, like the comparisons: a plain int shift overflows
       for the largest values of i */
    if (dictSize <= ((UInt32)2 << i)) { dictSize = ((UInt32)2 << i); break; }
    if (dictSize <= ((UInt32)3 << i)) { dictSize = ((UInt32)3 << i); break; }
  }

  for (i = 0; i < 4; i++)
    props[1 + i] = (Byte)(dictSize >> (8 * i));
  return SZ_OK;
}
2916
2917
2918
/* Returns the encoder's writeEndMark setting. */
unsigned LzmaEnc_IsWriteEndMark(CLzmaEncHandle pp)
{
  const CLzmaEnc *enc = (const CLzmaEnc *)pp;
  return enc->writeEndMark;
}
2922
2923
2924
/*
  Memory-to-memory encoding with an already created encoder.

  Parameters:
    dest / destLen - output buffer; *destLen is the capacity on entry and the
                     number of bytes written on return.
    src / srcLen   - input buffer.
    writeEndMark   - stored in the encoder before encoding.
    progress       - optional progress callback (may be NULL).

  Returns SZ_ERROR_OUTPUT_EOF when the output did not fit, SZ_ERROR_FAIL when
  encoding succeeded but did not consume exactly srcLen bytes, otherwise the
  status from preparation / encoding.
*/
SRes LzmaEnc_MemEncode(CLzmaEncHandle pp, Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
    int writeEndMark, ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
{
  CLzmaEnc *enc = (CLzmaEnc *)pp;
  CLzmaEnc_SeqOutStreamBuf sink;
  SRes res;

  sink.vt.Write = SeqOutStreamBuf_Write;
  sink.data = dest;
  sink.rem = *destLen;
  sink.overflow = False;

  enc->writeEndMark = writeEndMark;
  enc->rc.outStream = &sink.vt;

  res = LzmaEnc_MemPrepare(pp, src, srcLen, 0, alloc, allocBig);

  if (res == SZ_OK)
    res = LzmaEnc_Encode2(enc, progress);
  else
  {
    /* preparation failed: report below, after *destLen is updated */
    *destLen -= sink.rem;
    return sink.overflow ? SZ_ERROR_OUTPUT_EOF : res;
  }

  if (res == SZ_OK && enc->nowPos64 != srcLen)
    res = SZ_ERROR_FAIL;

  *destLen -= sink.rem;
  if (sink.overflow)
    return SZ_ERROR_OUTPUT_EOF;
  return res;
}
2954
2955
2956
SRes LzmaEncode(Byte *dest, SizeT *destLen, const Byte *src, SizeT srcLen,
2957
    const CLzmaEncProps *props, Byte *propsEncoded, SizeT *propsSize, int writeEndMark,
2958
    ICompressProgress *progress, ISzAllocPtr alloc, ISzAllocPtr allocBig)
2959
0
{
2960
0
  CLzmaEnc *p = (CLzmaEnc *)LzmaEnc_Create(alloc);
2961
0
  SRes res;
2962
0
  if (!p)
2963
0
    return SZ_ERROR_MEM;
2964
2965
0
  res = LzmaEnc_SetProps(p, props);
2966
0
  if (res == SZ_OK)
2967
0
  {
2968
0
    res = LzmaEnc_WriteProperties(p, propsEncoded, propsSize);
2969
0
    if (res == SZ_OK)
2970
0
      res = LzmaEnc_MemEncode(p, dest, destLen, src, srcLen,
2971
0
          writeEndMark, progress, alloc, allocBig);
2972
0
  }
2973
2974
0
  LzmaEnc_Destroy(p, alloc, allocBig);
2975
0
  return res;
2976
0
}