Coverage Report

Created: 2026-01-17 06:26

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/bzip2/compress.c
Line
Count
Source
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
void BZ2_bsInitWrite ( EState* s )
38
3.06k
{
39
3.06k
   s->bsLive = 0;
40
3.06k
   s->bsBuff = 0;
41
3.06k
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
3.06k
{
48
8.77k
   while (s->bsLive > 0) {
49
5.70k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
5.70k
      s->numZ++;
51
5.70k
      s->bsBuff <<= 8;
52
5.70k
      s->bsLive -= 8;
53
5.70k
   }
54
3.06k
}
55
56
57
/*---------------------------------------------------*/
58
92.6M
#define bsNEEDW(nz)                           \
59
92.6M
{                                             \
60
161M
   while (s->bsLive >= 8) {                   \
61
68.9M
      s->zbits[s->numZ]                       \
62
68.9M
         = (UChar)(s->bsBuff >> 24);          \
63
68.9M
      s->numZ++;                              \
64
68.9M
      s->bsBuff <<= 8;                        \
65
68.9M
      s->bsLive -= 8;                         \
66
68.9M
   }                                          \
67
92.6M
}
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
92.6M
{
75
92.6M
   bsNEEDW ( n );
76
92.6M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
92.6M
   s->bsLive += n;
78
92.6M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
6.27k
{
85
6.27k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
6.27k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
6.27k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
6.27k
   bsW ( s, 8,  u        & 0xffL );
89
6.27k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
49.8k
{
96
49.8k
   bsW( s, 8, (UInt32)c );
97
49.8k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
3.20k
{
108
3.20k
   Int32 i;
109
3.20k
   s->nInUse = 0;
110
824k
   for (i = 0; i < 256; i++)
111
821k
      if (s->inUse[i]) {
112
359k
         s->unseqToSeq[i] = s->nInUse;
113
359k
         s->nInUse++;
114
359k
      }
115
3.20k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
3.20k
{
122
3.20k
   UChar   yy[256];
123
3.20k
   Int32   i, j;
124
3.20k
   Int32   zPend;
125
3.20k
   Int32   wr;
126
3.20k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
3.20k
   UInt32* ptr   = s->ptr;
151
3.20k
   UChar* block  = s->block;
152
3.20k
   UInt16* mtfv  = s->mtfv;
153
154
3.20k
   makeMaps_e ( s );
155
3.20k
   EOB = s->nInUse+1;
156
157
369k
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
3.20k
   wr = 0;
160
3.20k
   zPend = 0;
161
362k
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
240M
   for (i = 0; i < s->nblock; i++) {
164
240M
      UChar ll_i;
165
240M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
240M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
240M
      ll_i = s->unseqToSeq[block[j]];
168
240M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
240M
      if (yy[0] == ll_i) { 
171
173M
         zPend++;
172
173M
      } else {
173
174
67.6M
         if (zPend > 0) {
175
14.9M
            zPend--;
176
17.5M
            while (True) {
177
17.5M
               if (zPend & 1) {
178
2.17M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
2.17M
                  s->mtfFreq[BZ_RUNB]++; 
180
15.3M
               } else {
181
15.3M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
15.3M
                  s->mtfFreq[BZ_RUNA]++; 
183
15.3M
               }
184
17.5M
               if (zPend < 2) break;
185
2.56M
               zPend = (zPend - 2) / 2;
186
2.56M
            };
187
14.9M
            zPend = 0;
188
14.9M
         }
189
67.6M
         {
190
67.6M
            register UChar  rtmp;
191
67.6M
            register UChar* ryy_j;
192
67.6M
            register UChar  rll_i;
193
67.6M
            rtmp  = yy[1];
194
67.6M
            yy[1] = yy[0];
195
67.6M
            ryy_j = &(yy[1]);
196
67.6M
            rll_i = ll_i;
197
7.01G
            while ( rll_i != rtmp ) {
198
6.94G
               register UChar rtmp2;
199
6.94G
               ryy_j++;
200
6.94G
               rtmp2  = rtmp;
201
6.94G
               rtmp   = *ryy_j;
202
6.94G
               *ryy_j = rtmp2;
203
6.94G
            };
204
67.6M
            yy[0] = rtmp;
205
67.6M
            j = ryy_j - &(yy[0]);
206
67.6M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
67.6M
         }
208
209
67.6M
      }
210
240M
   }
211
212
3.20k
   if (zPend > 0) {
213
1.60k
      zPend--;
214
7.55k
      while (True) {
215
7.55k
         if (zPend & 1) {
216
3.44k
            mtfv[wr] = BZ_RUNB; wr++; 
217
3.44k
            s->mtfFreq[BZ_RUNB]++; 
218
4.10k
         } else {
219
4.10k
            mtfv[wr] = BZ_RUNA; wr++; 
220
4.10k
            s->mtfFreq[BZ_RUNA]++; 
221
4.10k
         }
222
7.55k
         if (zPend < 2) break;
223
5.95k
         zPend = (zPend - 2) / 2;
224
5.95k
      };
225
1.60k
      zPend = 0;
226
1.60k
   }
227
228
3.20k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
3.20k
   s->nMTF = wr;
231
3.20k
}
232
233
234
/*---------------------------------------------------*/
235
366k
#define BZ_LESSER_ICOST  0
236
3.79M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
3.20k
{
241
3.20k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
3.20k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
3.20k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
3.20k
   UInt16 cost[BZ_N_GROUPS];
257
3.20k
   Int32  fave[BZ_N_GROUPS];
258
259
3.20k
   UInt16* mtfv = s->mtfv;
260
261
3.20k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
3.20k
                "%d+2 syms in use\n", 
264
3.20k
                s->nblock, s->nMTF, s->nInUse );
265
266
3.20k
   alphaSize = s->nInUse+2;
267
22.4k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
2.21M
      for (v = 0; v < alphaSize; v++)
269
2.19M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
3.20k
   AssertH ( s->nMTF > 0, 3001 );
273
3.20k
   if (s->nMTF < 200)  nGroups = 2; else
274
1.90k
   if (s->nMTF < 600)  nGroups = 3; else
275
1.45k
   if (s->nMTF < 1200) nGroups = 4; else
276
1.24k
   if (s->nMTF < 2400) nGroups = 5; else
277
1.11k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
3.20k
   { 
281
3.20k
      Int32 nPart, remF, tFreq, aFreq;
282
283
3.20k
      nPart = nGroups;
284
3.20k
      remF  = s->nMTF;
285
3.20k
      gs = 0;
286
15.3k
      while (nPart > 0) {
287
12.1k
         tFreq = remF / nPart;
288
12.1k
         ge = gs-1;
289
12.1k
         aFreq = 0;
290
380k
         while (aFreq < tFreq && ge < alphaSize-1) {
291
368k
            ge++;
292
368k
            aFreq += s->mtfFreq[ge];
293
368k
         }
294
295
12.1k
         if (ge > gs 
296
9.74k
             && nPart != nGroups && nPart != 1 
297
4.71k
             && ((nGroups-nPart) % 2 == 1)) {
298
2.43k
            aFreq -= s->mtfFreq[ge];
299
2.43k
            ge--;
300
2.43k
         }
301
302
12.1k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
12.1k
                      "has %d syms (%4.1f%%)\n",
305
12.1k
                      nPart, gs, ge, aFreq, 
306
12.1k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
1.97M
         for (v = 0; v < alphaSize; v++)
309
1.96M
            if (v >= gs && v <= ge) 
310
366k
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
1.60M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
12.1k
         nPart--;
314
12.1k
         gs = ge+1;
315
12.1k
         remF -= aFreq;
316
12.1k
      }
317
3.20k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
16.0k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
89.8k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
61.4k
      for (t = 0; t < nGroups; t++)
327
7.91M
         for (v = 0; v < alphaSize; v++)
328
7.86M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
12.8k
      if (nGroups == 6) {
335
1.09M
         for (v = 0; v < alphaSize; v++) {
336
1.09M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
1.09M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
1.09M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
1.09M
   }
340
4.45k
      }
341
342
12.8k
      nSelectors = 0;
343
12.8k
      totc = 0;
344
12.8k
      gs = 0;
345
6.83M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
6.83M
         if (gs >= s->nMTF) break;
349
6.82M
         ge = gs + BZ_G_SIZE - 1; 
350
6.82M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
47.7M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
6.82M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
6.76M
            register UInt32 cost01, cost23, cost45;
361
6.76M
            register UInt16 icv;
362
6.76M
            cost01 = cost23 = cost45 = 0;
363
364
6.76M
#           define BZ_ITER(nn)                \
365
338M
               icv = mtfv[gs+(nn)];           \
366
338M
               cost01 += s->len_pack[icv][0]; \
367
338M
               cost23 += s->len_pack[icv][1]; \
368
338M
               cost45 += s->len_pack[icv][2]; \
369
6.76M
370
6.76M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
6.76M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
6.76M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
6.76M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
6.76M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
6.76M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
6.76M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
6.76M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
6.76M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
6.76M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
6.76M
#           undef BZ_ITER
382
383
6.76M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
6.76M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
6.76M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
6.76M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
2.61M
            for (i = gs; i <= ge; i++) { 
390
2.55M
               UInt16 icv = mtfv[i];
391
12.5M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
2.55M
            }
393
57.8k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
6.82M
         bc = 999999999; bt = -1;
400
47.6M
         for (t = 0; t < nGroups; t++)
401
40.8M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
6.82M
         totc += bc;
403
6.82M
         fave[bt]++;
404
6.82M
         s->selector[nSelectors] = bt;
405
6.82M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
6.82M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
338M
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
6.76M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
6.76M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
6.76M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
6.76M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
6.76M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
6.76M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
6.76M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
6.76M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
6.76M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
6.76M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
6.76M
#           undef BZ_ITUR
427
428
6.76M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
2.61M
            for (i = gs; i <= ge; i++)
431
2.55M
               s->rfreq[bt][ mtfv[i] ]++;
432
57.8k
         }
433
434
6.82M
         gs = ge+1;
435
6.82M
      }
436
12.8k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
61.4k
      for (t = 0; t < nGroups; t++)
450
48.5k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
48.5k
                                 alphaSize, 17 /*20*/ );
452
12.8k
   }
453
454
455
3.20k
   AssertH( nGroups < 8, 3002 );
456
3.20k
   AssertH( nSelectors < 32768 &&
457
3.20k
            nSelectors <= BZ_MAX_SELECTORS,
458
3.20k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
3.20k
   {
463
3.20k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
15.3k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
1.70M
      for (i = 0; i < nSelectors; i++) {
466
1.70M
         ll_i = s->selector[i];
467
1.70M
         j = 0;
468
1.70M
         tmp = pos[j];
469
4.01M
         while ( ll_i != tmp ) {
470
2.30M
            j++;
471
2.30M
            tmp2 = tmp;
472
2.30M
            tmp = pos[j];
473
2.30M
            pos[j] = tmp2;
474
2.30M
         };
475
1.70M
         pos[0] = tmp;
476
1.70M
         s->selectorMtf[i] = j;
477
1.70M
      }
478
3.20k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
15.3k
   for (t = 0; t < nGroups; t++) {
482
12.1k
      minLen = 32;
483
12.1k
      maxLen = 0;
484
1.97M
      for (i = 0; i < alphaSize; i++) {
485
1.96M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
1.96M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
1.96M
      }
488
12.1k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
12.1k
      AssertH ( !(minLen < 1),  3005 );
490
12.1k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
12.1k
                          minLen, maxLen, alphaSize );
492
12.1k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
3.20k
   { 
496
3.20k
      Bool inUse16[16];
497
54.5k
      for (i = 0; i < 16; i++) {
498
51.3k
          inUse16[i] = False;
499
872k
          for (j = 0; j < 16; j++)
500
821k
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
51.3k
      }
502
     
503
3.20k
      nBytes = s->numZ;
504
54.5k
      for (i = 0; i < 16; i++)
505
51.3k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
54.5k
      for (i = 0; i < 16; i++)
508
51.3k
         if (inUse16[i])
509
578k
            for (j = 0; j < 16; j++) {
510
544k
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
544k
            }
512
513
3.20k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
3.20k
   }
516
517
   /*--- Now the selectors. ---*/
518
3.20k
   nBytes = s->numZ;
519
3.20k
   bsW ( s, 3, nGroups );
520
3.20k
   bsW ( s, 15, nSelectors );
521
1.70M
   for (i = 0; i < nSelectors; i++) { 
522
4.01M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
1.70M
      bsW(s,1,0);
524
1.70M
   }
525
3.20k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
3.20k
   nBytes = s->numZ;
530
531
15.3k
   for (t = 0; t < nGroups; t++) {
532
12.1k
      Int32 curr = s->len[t][0];
533
12.1k
      bsW ( s, 5, curr );
534
1.97M
      for (i = 0; i < alphaSize; i++) {
535
2.36M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
2.33M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
1.96M
         bsW ( s, 1, 0 );
538
1.96M
      }
539
12.1k
   }
540
541
3.20k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
3.20k
   nBytes = s->numZ;
546
3.20k
   selCtr = 0;
547
3.20k
   gs = 0;
548
1.70M
   while (True) {
549
1.70M
      if (gs >= s->nMTF) break;
550
1.70M
      ge = gs + BZ_G_SIZE - 1; 
551
1.70M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
1.70M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
1.70M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
1.69M
            UInt16 mtfv_i;
557
1.69M
            UChar* s_len_sel_selCtr 
558
1.69M
               = &(s->len[s->selector[selCtr]][0]);
559
1.69M
            Int32* s_code_sel_selCtr
560
1.69M
               = &(s->code[s->selector[selCtr]][0]);
561
562
1.69M
#           define BZ_ITAH(nn)                      \
563
84.5M
               mtfv_i = mtfv[gs+(nn)];              \
564
84.5M
               bsW ( s,                             \
565
84.5M
                     s_len_sel_selCtr[mtfv_i],      \
566
84.5M
                     s_code_sel_selCtr[mtfv_i] )
567
568
1.69M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
1.69M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
1.69M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
1.69M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
1.69M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
1.69M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
1.69M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
1.69M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
1.69M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
1.69M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
1.69M
#           undef BZ_ITAH
580
581
1.69M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
652k
         for (i = gs; i <= ge; i++) {
584
638k
            bsW ( s, 
585
638k
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
638k
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
638k
         }
588
14.4k
      }
589
590
591
1.70M
      gs = ge+1;
592
1.70M
      selCtr++;
593
1.70M
   }
594
3.20k
   AssertH( selCtr == nSelectors, 3007 );
595
596
3.20k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
3.20k
}
599
600
601
/*---------------------------------------------------*/
602
void BZ2_compressBlock ( EState* s, Bool is_last_block )
603
3.20k
{
604
3.20k
   if (s->nblock > 0) {
605
606
3.20k
      BZ_FINALISE_CRC ( s->blockCRC );
607
3.20k
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
608
3.20k
      s->combinedCRC ^= s->blockCRC;
609
3.20k
      if (s->blockNo > 1) s->numZ = 0;
610
611
3.20k
      if (s->verbosity >= 2)
612
0
         VPrintf4( "    block %d: crc = 0x%08x, "
613
3.20k
                   "combined CRC = 0x%08x, size = %d\n",
614
3.20k
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
615
616
3.20k
      BZ2_blockSort ( s );
617
3.20k
   }
618
619
3.20k
   s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
620
621
   /*-- If this is the first block, create the stream header. --*/
622
3.20k
   if (s->blockNo == 1) {
623
3.06k
      BZ2_bsInitWrite ( s );
624
3.06k
      bsPutUChar ( s, BZ_HDR_B );
625
3.06k
      bsPutUChar ( s, BZ_HDR_Z );
626
3.06k
      bsPutUChar ( s, BZ_HDR_h );
627
3.06k
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
628
3.06k
   }
629
630
3.20k
   if (s->nblock > 0) {
631
632
3.20k
      bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
633
3.20k
      bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
634
3.20k
      bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
635
636
      /*-- Now the block's CRC, so it is in a known place. --*/
637
3.20k
      bsPutUInt32 ( s, s->blockCRC );
638
639
      /*-- 
640
         Now a single bit indicating (non-)randomisation. 
641
         As of version 0.9.5, we use a better sorting algorithm
642
         which makes randomisation unnecessary.  So always set
643
         the randomised bit to 'no'.  Of course, the decoder
644
         still needs to be able to handle randomised blocks
645
         so as to maintain backwards compatibility with
646
         older versions of bzip2.
647
      --*/
648
3.20k
      bsW(s,1,0);
649
650
3.20k
      bsW ( s, 24, s->origPtr );
651
3.20k
      generateMTFValues ( s );
652
3.20k
      sendMTFValues ( s );
653
3.20k
   }
654
655
656
   /*-- If this is the last block, add the stream trailer. --*/
657
3.20k
   if (is_last_block) {
658
659
3.06k
      bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
660
3.06k
      bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
661
3.06k
      bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
662
3.06k
      bsPutUInt32 ( s, s->combinedCRC );
663
3.06k
      if (s->verbosity >= 2)
664
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
665
3.06k
      bsFinishWrite ( s );
666
3.06k
   }
667
3.20k
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/