Coverage Report

Created: 2025-05-21 06:19

/src/bzip2/compress.c
Line
Count
Source (jump to first uncovered line)
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
/* Put the bit-stream writer of `s` into its empty state: the 32-bit
   accumulator (bsBuff) is cleared and the count of pending bits
   (bsLive) is set to zero. */
void BZ2_bsInitWrite ( EState* s )
{
   s->bsBuff = 0;
   s->bsLive = 0;
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
4.03k
{
48
11.5k
   while (s->bsLive > 0) {
49
7.52k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
7.52k
      s->numZ++;
51
7.52k
      s->bsBuff <<= 8;
52
7.52k
      s->bsLive -= 8;
53
7.52k
   }
54
4.03k
}
55
56
57
/*---------------------------------------------------*/
58
175M
/* Drain whole bytes from the bit accumulator into the output area.
   Expects a variable `s` in scope that provides bsBuff, bsLive, numZ
   and zbits.  While at least 8 bits are pending, the top byte of
   bsBuff is stored at zbits[numZ] and the accumulator is shifted up,
   so fewer than 8 bits remain pending afterwards.
   The argument `nz` is accepted for the callers' sake but is not used.
   The body is wrapped in do { ... } while (0) so that the macro
   behaves as a single statement (e.g. inside an unbraced if/else). */
#define bsNEEDW(nz)                           \
do {                                          \
   while (s->bsLive >= 8) {                   \
      s->zbits[s->numZ]                       \
         = (UChar)(s->bsBuff >> 24);          \
      s->numZ++;                              \
      s->bsBuff <<= 8;                        \
      s->bsLive -= 8;                         \
   }                                          \
} while (0)
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
175M
{
75
175M
   bsNEEDW ( n );
76
175M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
175M
   s->bsLive += n;
78
175M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
8.37k
{
85
8.37k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
8.37k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
8.37k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
8.37k
   bsW ( s, 8,  u        & 0xffL );
89
8.37k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
66.3k
{
96
66.3k
   bsW( s, 8, (UInt32)c );
97
66.3k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
4.33k
{
108
4.33k
   Int32 i;
109
4.33k
   s->nInUse = 0;
110
1.11M
   for (i = 0; i < 256; i++)
111
1.11M
      if (s->inUse[i]) {
112
517k
         s->unseqToSeq[i] = s->nInUse;
113
517k
         s->nInUse++;
114
517k
      }
115
4.33k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
4.33k
{
122
4.33k
   UChar   yy[256];
123
4.33k
   Int32   i, j;
124
4.33k
   Int32   zPend;
125
4.33k
   Int32   wr;
126
4.33k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
4.33k
   UInt32* ptr   = s->ptr;
151
4.33k
   UChar* block  = s->block;
152
4.33k
   UInt16* mtfv  = s->mtfv;
153
154
4.33k
   makeMaps_e ( s );
155
4.33k
   EOB = s->nInUse+1;
156
157
530k
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
4.33k
   wr = 0;
160
4.33k
   zPend = 0;
161
521k
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
446M
   for (i = 0; i < s->nblock; i++) {
164
446M
      UChar ll_i;
165
446M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
446M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
446M
      ll_i = s->unseqToSeq[block[j]];
168
446M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
446M
      if (yy[0] == ll_i) { 
171
307M
         zPend++;
172
307M
      } else {
173
174
138M
         if (zPend > 0) {
175
19.4M
            zPend--;
176
22.8M
            while (True) {
177
22.8M
               if (zPend & 1) {
178
2.45M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
2.45M
                  s->mtfFreq[BZ_RUNB]++; 
180
20.4M
               } else {
181
20.4M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
20.4M
                  s->mtfFreq[BZ_RUNA]++; 
183
20.4M
               }
184
22.8M
               if (zPend < 2) break;
185
3.39M
               zPend = (zPend - 2) / 2;
186
3.39M
            };
187
19.4M
            zPend = 0;
188
19.4M
         }
189
138M
         {
190
138M
            register UChar  rtmp;
191
138M
            register UChar* ryy_j;
192
138M
            register UChar  rll_i;
193
138M
            rtmp  = yy[1];
194
138M
            yy[1] = yy[0];
195
138M
            ryy_j = &(yy[1]);
196
138M
            rll_i = ll_i;
197
15.9G
            while ( rll_i != rtmp ) {
198
15.8G
               register UChar rtmp2;
199
15.8G
               ryy_j++;
200
15.8G
               rtmp2  = rtmp;
201
15.8G
               rtmp   = *ryy_j;
202
15.8G
               *ryy_j = rtmp2;
203
15.8G
            };
204
138M
            yy[0] = rtmp;
205
138M
            j = ryy_j - &(yy[0]);
206
138M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
138M
         }
208
209
138M
      }
210
446M
   }
211
212
4.33k
   if (zPend > 0) {
213
1.67k
      zPend--;
214
4.87k
      while (True) {
215
4.87k
         if (zPend & 1) {
216
1.94k
            mtfv[wr] = BZ_RUNB; wr++; 
217
1.94k
            s->mtfFreq[BZ_RUNB]++; 
218
2.92k
         } else {
219
2.92k
            mtfv[wr] = BZ_RUNA; wr++; 
220
2.92k
            s->mtfFreq[BZ_RUNA]++; 
221
2.92k
         }
222
4.87k
         if (zPend < 2) break;
223
3.19k
         zPend = (zPend - 2) / 2;
224
3.19k
      };
225
1.67k
      zPend = 0;
226
1.67k
   }
227
228
4.33k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
4.33k
   s->nMTF = wr;
231
4.33k
}
232
233
234
/*---------------------------------------------------*/
235
526k
#define BZ_LESSER_ICOST  0
236
5.43M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
4.33k
{
241
4.33k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
4.33k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
4.33k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
4.33k
   UInt16 cost[BZ_N_GROUPS];
257
4.33k
   Int32  fave[BZ_N_GROUPS];
258
259
4.33k
   UInt16* mtfv = s->mtfv;
260
261
4.33k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
4.33k
                "%d+2 syms in use\n", 
264
4.33k
                s->nblock, s->nMTF, s->nInUse );
265
266
4.33k
   alphaSize = s->nInUse+2;
267
30.3k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
3.18M
      for (v = 0; v < alphaSize; v++)
269
3.15M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
4.33k
   AssertH ( s->nMTF > 0, 3001 );
273
4.33k
   if (s->nMTF < 200)  nGroups = 2; else
274
2.65k
   if (s->nMTF < 600)  nGroups = 3; else
275
2.07k
   if (s->nMTF < 1200) nGroups = 4; else
276
1.79k
   if (s->nMTF < 2400) nGroups = 5; else
277
1.57k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
4.33k
   { 
281
4.33k
      Int32 nPart, remF, tFreq, aFreq;
282
283
4.33k
      nPart = nGroups;
284
4.33k
      remF  = s->nMTF;
285
4.33k
      gs = 0;
286
21.1k
      while (nPart > 0) {
287
16.7k
         tFreq = remF / nPart;
288
16.7k
         ge = gs-1;
289
16.7k
         aFreq = 0;
290
546k
         while (aFreq < tFreq && ge < alphaSize-1) {
291
529k
            ge++;
292
529k
            aFreq += s->mtfFreq[ge];
293
529k
         }
294
295
16.7k
         if (ge > gs 
296
16.7k
             && nPart != nGroups && nPart != 1 
297
16.7k
             && ((nGroups-nPart) % 2 == 1)) {
298
3.61k
            aFreq -= s->mtfFreq[ge];
299
3.61k
            ge--;
300
3.61k
         }
301
302
16.7k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
16.7k
                      "has %d syms (%4.1f%%)\n",
305
16.7k
                      nPart, gs, ge, aFreq, 
306
16.7k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
2.82M
         for (v = 0; v < alphaSize; v++)
309
2.80M
            if (v >= gs && v <= ge) 
310
526k
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
2.28M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
16.7k
         nPart--;
314
16.7k
         gs = ge+1;
315
16.7k
         remF -= aFreq;
316
16.7k
      }
317
4.33k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
21.6k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
121k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
84.4k
      for (t = 0; t < nGroups; t++)
327
11.2M
         for (v = 0; v < alphaSize; v++)
328
11.2M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
17.3k
      if (nGroups == 6) {
335
1.54M
         for (v = 0; v < alphaSize; v++) {
336
1.54M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
1.54M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
1.54M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
1.54M
   }
340
6.29k
      }
341
342
17.3k
      nSelectors = 0;
343
17.3k
      totc = 0;
344
17.3k
      gs = 0;
345
12.9M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
12.9M
         if (gs >= s->nMTF) break;
349
12.9M
         ge = gs + BZ_G_SIZE - 1; 
350
12.9M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
90.3M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
12.9M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
12.8M
            register UInt32 cost01, cost23, cost45;
361
12.8M
            register UInt16 icv;
362
12.8M
            cost01 = cost23 = cost45 = 0;
363
364
12.8M
#           define BZ_ITER(nn)                \
365
640M
               icv = mtfv[gs+(nn)];           \
366
640M
               cost01 += s->len_pack[icv][0]; \
367
640M
               cost23 += s->len_pack[icv][1]; \
368
640M
               cost45 += s->len_pack[icv][2]; \
369
12.8M
370
12.8M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
12.8M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
12.8M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
12.8M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
12.8M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
12.8M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
12.8M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
12.8M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
12.8M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
12.8M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
12.8M
#           undef BZ_ITER
382
383
12.8M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
12.8M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
12.8M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
12.8M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
3.84M
            for (i = gs; i <= ge; i++) { 
390
3.76M
               UInt16 icv = mtfv[i];
391
18.9M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
3.76M
            }
393
84.7k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
12.9M
         bc = 999999999; bt = -1;
400
90.1M
         for (t = 0; t < nGroups; t++)
401
77.2M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
12.9M
         totc += bc;
403
12.9M
         fave[bt]++;
404
12.9M
         s->selector[nSelectors] = bt;
405
12.9M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
12.9M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
640M
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
12.8M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
12.8M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
12.8M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
12.8M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
12.8M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
12.8M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
12.8M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
12.8M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
12.8M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
12.8M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
12.8M
#           undef BZ_ITUR
427
428
12.8M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
3.84M
            for (i = gs; i <= ge; i++)
431
3.76M
               s->rfreq[bt][ mtfv[i] ]++;
432
84.7k
         }
433
434
12.9M
         gs = ge+1;
435
12.9M
      }
436
17.3k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
84.4k
      for (t = 0; t < nGroups; t++)
450
67.0k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
67.0k
                                 alphaSize, 17 /*20*/ );
452
17.3k
   }
453
454
455
4.33k
   AssertH( nGroups < 8, 3002 );
456
4.33k
   AssertH( nSelectors < 32768 &&
457
4.33k
            nSelectors <= BZ_MAX_SELECTORS,
458
4.33k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
4.33k
   {
463
4.33k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
21.1k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
3.23M
      for (i = 0; i < nSelectors; i++) {
466
3.22M
         ll_i = s->selector[i];
467
3.22M
         j = 0;
468
3.22M
         tmp = pos[j];
469
8.91M
         while ( ll_i != tmp ) {
470
5.68M
            j++;
471
5.68M
            tmp2 = tmp;
472
5.68M
            tmp = pos[j];
473
5.68M
            pos[j] = tmp2;
474
5.68M
         };
475
3.22M
         pos[0] = tmp;
476
3.22M
         s->selectorMtf[i] = j;
477
3.22M
      }
478
4.33k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
21.1k
   for (t = 0; t < nGroups; t++) {
482
16.7k
      minLen = 32;
483
16.7k
      maxLen = 0;
484
2.82M
      for (i = 0; i < alphaSize; i++) {
485
2.80M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
2.80M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
2.80M
      }
488
16.7k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
16.7k
      AssertH ( !(minLen < 1),  3005 );
490
16.7k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
16.7k
                          minLen, maxLen, alphaSize );
492
16.7k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
4.33k
   { 
496
4.33k
      Bool inUse16[16];
497
73.7k
      for (i = 0; i < 16; i++) {
498
69.4k
          inUse16[i] = False;
499
1.17M
          for (j = 0; j < 16; j++)
500
1.11M
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
69.4k
      }
502
     
503
4.33k
      nBytes = s->numZ;
504
73.7k
      for (i = 0; i < 16; i++)
505
69.4k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
73.7k
      for (i = 0; i < 16; i++)
508
69.4k
         if (inUse16[i])
509
824k
            for (j = 0; j < 16; j++) {
510
776k
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
776k
            }
512
513
4.33k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
4.33k
   }
516
517
   /*--- Now the selectors. ---*/
518
4.33k
   nBytes = s->numZ;
519
4.33k
   bsW ( s, 3, nGroups );
520
4.33k
   bsW ( s, 15, nSelectors );
521
3.23M
   for (i = 0; i < nSelectors; i++) { 
522
8.91M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
3.22M
      bsW(s,1,0);
524
3.22M
   }
525
4.33k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
4.33k
   nBytes = s->numZ;
530
531
21.1k
   for (t = 0; t < nGroups; t++) {
532
16.7k
      Int32 curr = s->len[t][0];
533
16.7k
      bsW ( s, 5, curr );
534
2.82M
      for (i = 0; i < alphaSize; i++) {
535
3.41M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
3.35M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
2.80M
         bsW ( s, 1, 0 );
538
2.80M
      }
539
16.7k
   }
540
541
4.33k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
4.33k
   nBytes = s->numZ;
546
4.33k
   selCtr = 0;
547
4.33k
   gs = 0;
548
3.23M
   while (True) {
549
3.23M
      if (gs >= s->nMTF) break;
550
3.22M
      ge = gs + BZ_G_SIZE - 1; 
551
3.22M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
3.22M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
3.22M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
3.20M
            UInt16 mtfv_i;
557
3.20M
            UChar* s_len_sel_selCtr 
558
3.20M
               = &(s->len[s->selector[selCtr]][0]);
559
3.20M
            Int32* s_code_sel_selCtr
560
3.20M
               = &(s->code[s->selector[selCtr]][0]);
561
562
3.20M
#           define BZ_ITAH(nn)                      \
563
160M
               mtfv_i = mtfv[gs+(nn)];              \
564
160M
               bsW ( s,                             \
565
160M
                     s_len_sel_selCtr[mtfv_i],      \
566
160M
                     s_code_sel_selCtr[mtfv_i] )
567
568
3.20M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
3.20M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
3.20M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
3.20M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
3.20M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
3.20M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
3.20M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
3.20M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
3.20M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
3.20M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
3.20M
#           undef BZ_ITAH
580
581
3.20M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
962k
         for (i = gs; i <= ge; i++) {
584
941k
            bsW ( s, 
585
941k
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
941k
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
941k
         }
588
21.1k
      }
589
590
591
3.22M
      gs = ge+1;
592
3.22M
      selCtr++;
593
3.22M
   }
594
4.33k
   AssertH( selCtr == nSelectors, 3007 );
595
596
4.33k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
4.33k
}
599
600
601
/*---------------------------------------------------*/
602
/* Compress the block currently held in `s` and append it to the
   output area.

   If the block is non-empty, its CRC is finalised and folded into
   the combined CRC, the block is sorted, and then the block header
   marker, block CRC, randomisation bit (always 0), origPtr and the
   coded symbols are written.  The stream header is written before
   the first block (s->blockNo == 1); when `is_last_block` is true
   the stream trailer marker and the combined CRC are appended and
   the bit stream is flushed.

   For every block after the first, s->numZ is reset to 0 before
   anything is written. */
void BZ2_compressBlock ( EState* s, Bool is_last_block )
{
   /* Six-byte markers that introduce a block and the stream trailer. */
   static const UChar blockMarker[6]
      = { 0x31, 0x41, 0x59, 0x26, 0x53, 0x59 };
   static const UChar trailerMarker[6]
      = { 0x17, 0x72, 0x45, 0x38, 0x50, 0x90 };
   Int32 k;

   if (s->nblock > 0) {

      BZ_FINALISE_CRC ( s->blockCRC );
      /* Rotate the combined CRC left by one bit, then mix in this
         block's CRC. */
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
      s->combinedCRC ^= s->blockCRC;
      if (s->blockNo > 1) s->numZ = 0;

      if (s->verbosity >= 2) {
         VPrintf4( "    block %d: crc = 0x%08x, "
                   "combined CRC = 0x%08x, size = %d\n",
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
      }

      BZ2_blockSort ( s );
   }

   /* The compressed output starts right after the block data in arr2. */
   s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);

   /*-- If this is the first block, create the stream header. --*/
   if (s->blockNo == 1) {
      BZ2_bsInitWrite ( s );
      bsPutUChar ( s, BZ_HDR_B );
      bsPutUChar ( s, BZ_HDR_Z );
      bsPutUChar ( s, BZ_HDR_h );
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
   }

   if (s->nblock > 0) {

      for (k = 0; k < 6; k++) bsPutUChar ( s, blockMarker[k] );

      /*-- Now the block's CRC, so it is in a known place. --*/
      bsPutUInt32 ( s, s->blockCRC );

      /*--
         Now a single bit indicating (non-)randomisation.
         As of version 0.9.5, we use a better sorting algorithm
         which makes randomisation unnecessary.  So always set
         the randomised bit to 'no'.  Of course, the decoder
         still needs to be able to handle randomised blocks
         so as to maintain backwards compatibility with
         older versions of bzip2.
      --*/
      bsW ( s, 1, 0 );

      bsW ( s, 24, s->origPtr );
      generateMTFValues ( s );
      sendMTFValues ( s );
   }


   /*-- If this is the last block, add the stream trailer. --*/
   if (is_last_block) {

      for (k = 0; k < 6; k++) bsPutUChar ( s, trailerMarker[k] );
      bsPutUInt32 ( s, s->combinedCRC );
      if (s->verbosity >= 2) {
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
      }
      bsFinishWrite ( s );
   }
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/