Coverage Report

Created: 2026-02-09 06:46

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/bzip2/compress.c
Line
Count
Source
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
void BZ2_bsInitWrite ( EState* s )
38
3.29k
{
39
3.29k
   s->bsLive = 0;
40
3.29k
   s->bsBuff = 0;
41
3.29k
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
3.29k
{
48
9.46k
   while (s->bsLive > 0) {
49
6.17k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
6.17k
      s->numZ++;
51
6.17k
      s->bsBuff <<= 8;
52
6.17k
      s->bsLive -= 8;
53
6.17k
   }
54
3.29k
}
55
56
57
/*---------------------------------------------------*/
58
92.4M
#define bsNEEDW(nz)                           \
59
92.4M
{                                             \
60
161M
   while (s->bsLive >= 8) {                   \
61
68.9M
      s->zbits[s->numZ]                       \
62
68.9M
         = (UChar)(s->bsBuff >> 24);          \
63
68.9M
      s->numZ++;                              \
64
68.9M
      s->bsBuff <<= 8;                        \
65
68.9M
      s->bsLive -= 8;                         \
66
68.9M
   }                                          \
67
92.4M
}
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
92.4M
{
75
92.4M
   bsNEEDW ( n );
76
92.4M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
92.4M
   s->bsLive += n;
78
92.4M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
6.71k
{
85
6.71k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
6.71k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
6.71k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
6.71k
   bsW ( s, 8,  u        & 0xffL );
89
6.71k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
53.4k
{
96
53.4k
   bsW( s, 8, (UInt32)c );
97
53.4k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
3.42k
{
108
3.42k
   Int32 i;
109
3.42k
   s->nInUse = 0;
110
880k
   for (i = 0; i < 256; i++)
111
877k
      if (s->inUse[i]) {
112
381k
         s->unseqToSeq[i] = s->nInUse;
113
381k
         s->nInUse++;
114
381k
      }
115
3.42k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
3.42k
{
122
3.42k
   UChar   yy[256];
123
3.42k
   Int32   i, j;
124
3.42k
   Int32   zPend;
125
3.42k
   Int32   wr;
126
3.42k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
3.42k
   UInt32* ptr   = s->ptr;
151
3.42k
   UChar* block  = s->block;
152
3.42k
   UInt16* mtfv  = s->mtfv;
153
154
3.42k
   makeMaps_e ( s );
155
3.42k
   EOB = s->nInUse+1;
156
157
391k
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
3.42k
   wr = 0;
160
3.42k
   zPend = 0;
161
384k
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
241M
   for (i = 0; i < s->nblock; i++) {
164
241M
      UChar ll_i;
165
241M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
241M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
241M
      ll_i = s->unseqToSeq[block[j]];
168
241M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
241M
      if (yy[0] == ll_i) { 
171
173M
         zPend++;
172
173M
      } else {
173
174
68.3M
         if (zPend > 0) {
175
14.4M
            zPend--;
176
16.3M
            while (True) {
177
16.3M
               if (zPend & 1) {
178
1.73M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
1.73M
                  s->mtfFreq[BZ_RUNB]++; 
180
14.6M
               } else {
181
14.6M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
14.6M
                  s->mtfFreq[BZ_RUNA]++; 
183
14.6M
               }
184
16.3M
               if (zPend < 2) break;
185
1.92M
               zPend = (zPend - 2) / 2;
186
1.92M
            };
187
14.4M
            zPend = 0;
188
14.4M
         }
189
68.3M
         {
190
68.3M
            register UChar  rtmp;
191
68.3M
            register UChar* ryy_j;
192
68.3M
            register UChar  rll_i;
193
68.3M
            rtmp  = yy[1];
194
68.3M
            yy[1] = yy[0];
195
68.3M
            ryy_j = &(yy[1]);
196
68.3M
            rll_i = ll_i;
197
7.09G
            while ( rll_i != rtmp ) {
198
7.02G
               register UChar rtmp2;
199
7.02G
               ryy_j++;
200
7.02G
               rtmp2  = rtmp;
201
7.02G
               rtmp   = *ryy_j;
202
7.02G
               *ryy_j = rtmp2;
203
7.02G
            };
204
68.3M
            yy[0] = rtmp;
205
68.3M
            j = ryy_j - &(yy[0]);
206
68.3M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
68.3M
         }
208
209
68.3M
      }
210
241M
   }
211
212
3.42k
   if (zPend > 0) {
213
1.68k
      zPend--;
214
8.16k
      while (True) {
215
8.16k
         if (zPend & 1) {
216
3.79k
            mtfv[wr] = BZ_RUNB; wr++; 
217
3.79k
            s->mtfFreq[BZ_RUNB]++; 
218
4.37k
         } else {
219
4.37k
            mtfv[wr] = BZ_RUNA; wr++; 
220
4.37k
            s->mtfFreq[BZ_RUNA]++; 
221
4.37k
         }
222
8.16k
         if (zPend < 2) break;
223
6.48k
         zPend = (zPend - 2) / 2;
224
6.48k
      };
225
1.68k
      zPend = 0;
226
1.68k
   }
227
228
3.42k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
3.42k
   s->nMTF = wr;
231
3.42k
}
232
233
234
/*---------------------------------------------------*/
235
388k
#define BZ_LESSER_ICOST  0
236
4.03M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
3.42k
{
241
3.42k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
3.42k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
3.42k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
3.42k
   UInt16 cost[BZ_N_GROUPS];
257
3.42k
   Int32  fave[BZ_N_GROUPS];
258
259
3.42k
   UInt16* mtfv = s->mtfv;
260
261
3.42k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
3.42k
                "%d+2 syms in use\n", 
264
3.42k
                s->nblock, s->nMTF, s->nInUse );
265
266
3.42k
   alphaSize = s->nInUse+2;
267
23.9k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
2.34M
      for (v = 0; v < alphaSize; v++)
269
2.32M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
3.42k
   AssertH ( s->nMTF > 0, 3001 );
273
3.42k
   if (s->nMTF < 200)  nGroups = 2; else
274
2.04k
   if (s->nMTF < 600)  nGroups = 3; else
275
1.55k
   if (s->nMTF < 1200) nGroups = 4; else
276
1.34k
   if (s->nMTF < 2400) nGroups = 5; else
277
1.19k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
3.42k
   { 
281
3.42k
      Int32 nPart, remF, tFreq, aFreq;
282
283
3.42k
      nPart = nGroups;
284
3.42k
      remF  = s->nMTF;
285
3.42k
      gs = 0;
286
16.4k
      while (nPart > 0) {
287
12.9k
         tFreq = remF / nPart;
288
12.9k
         ge = gs-1;
289
12.9k
         aFreq = 0;
290
403k
         while (aFreq < tFreq && ge < alphaSize-1) {
291
390k
            ge++;
292
390k
            aFreq += s->mtfFreq[ge];
293
390k
         }
294
295
12.9k
         if (ge > gs 
296
10.4k
             && nPart != nGroups && nPart != 1 
297
5.01k
             && ((nGroups-nPart) % 2 == 1)) {
298
2.59k
            aFreq -= s->mtfFreq[ge];
299
2.59k
            ge--;
300
2.59k
         }
301
302
12.9k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
12.9k
                      "has %d syms (%4.1f%%)\n",
305
12.9k
                      nPart, gs, ge, aFreq, 
306
12.9k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
2.10M
         for (v = 0; v < alphaSize; v++)
309
2.09M
            if (v >= gs && v <= ge) 
310
388k
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
1.70M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
12.9k
         nPart--;
314
12.9k
         gs = ge+1;
315
12.9k
         remF -= aFreq;
316
12.9k
      }
317
3.42k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
17.1k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
95.9k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
65.6k
      for (t = 0; t < nGroups; t++)
327
8.42M
         for (v = 0; v < alphaSize; v++)
328
8.36M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
13.7k
      if (nGroups == 6) {
335
1.17M
         for (v = 0; v < alphaSize; v++) {
336
1.16M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
1.16M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
1.16M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
1.16M
   }
340
4.76k
      }
341
342
13.7k
      nSelectors = 0;
343
13.7k
      totc = 0;
344
13.7k
      gs = 0;
345
6.80M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
6.80M
         if (gs >= s->nMTF) break;
349
6.78M
         ge = gs + BZ_G_SIZE - 1; 
350
6.78M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
47.5M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
6.78M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
6.72M
            register UInt32 cost01, cost23, cost45;
361
6.72M
            register UInt16 icv;
362
6.72M
            cost01 = cost23 = cost45 = 0;
363
364
6.72M
#           define BZ_ITER(nn)                \
365
336M
               icv = mtfv[gs+(nn)];           \
366
336M
               cost01 += s->len_pack[icv][0]; \
367
336M
               cost23 += s->len_pack[icv][1]; \
368
336M
               cost45 += s->len_pack[icv][2]; \
369
6.72M
370
6.72M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
6.72M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
6.72M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
6.72M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
6.72M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
6.72M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
6.72M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
6.72M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
6.72M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
6.72M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
6.72M
#           undef BZ_ITER
382
383
6.72M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
6.72M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
6.72M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
6.72M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
2.83M
            for (i = gs; i <= ge; i++) { 
390
2.77M
               UInt16 icv = mtfv[i];
391
13.7M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
2.77M
            }
393
62.6k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
6.78M
         bc = 999999999; bt = -1;
400
47.3M
         for (t = 0; t < nGroups; t++)
401
40.6M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
6.78M
         totc += bc;
403
6.78M
         fave[bt]++;
404
6.78M
         s->selector[nSelectors] = bt;
405
6.78M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
6.78M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
336M
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
6.72M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
6.72M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
6.72M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
6.72M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
6.72M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
6.72M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
6.72M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
6.72M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
6.72M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
6.72M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
6.72M
#           undef BZ_ITUR
427
428
6.72M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
2.83M
            for (i = gs; i <= ge; i++)
431
2.77M
               s->rfreq[bt][ mtfv[i] ]++;
432
62.6k
         }
433
434
6.78M
         gs = ge+1;
435
6.78M
      }
436
13.7k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
65.6k
      for (t = 0; t < nGroups; t++)
450
51.9k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
51.9k
                                 alphaSize, 17 /*20*/ );
452
13.7k
   }
453
454
455
3.42k
   AssertH( nGroups < 8, 3002 );
456
3.42k
   AssertH( nSelectors < 32768 &&
457
3.42k
            nSelectors <= BZ_MAX_SELECTORS,
458
3.42k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
3.42k
   {
463
3.42k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
16.4k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
1.70M
      for (i = 0; i < nSelectors; i++) {
466
1.69M
         ll_i = s->selector[i];
467
1.69M
         j = 0;
468
1.69M
         tmp = pos[j];
469
3.99M
         while ( ll_i != tmp ) {
470
2.30M
            j++;
471
2.30M
            tmp2 = tmp;
472
2.30M
            tmp = pos[j];
473
2.30M
            pos[j] = tmp2;
474
2.30M
         };
475
1.69M
         pos[0] = tmp;
476
1.69M
         s->selectorMtf[i] = j;
477
1.69M
      }
478
3.42k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
16.4k
   for (t = 0; t < nGroups; t++) {
482
12.9k
      minLen = 32;
483
12.9k
      maxLen = 0;
484
2.10M
      for (i = 0; i < alphaSize; i++) {
485
2.09M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
2.09M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
2.09M
      }
488
12.9k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
12.9k
      AssertH ( !(minLen < 1),  3005 );
490
12.9k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
12.9k
                          minLen, maxLen, alphaSize );
492
12.9k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
3.42k
   { 
496
3.42k
      Bool inUse16[16];
497
58.2k
      for (i = 0; i < 16; i++) {
498
54.8k
          inUse16[i] = False;
499
932k
          for (j = 0; j < 16; j++)
500
877k
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
54.8k
      }
502
     
503
3.42k
      nBytes = s->numZ;
504
58.2k
      for (i = 0; i < 16; i++)
505
54.8k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
58.2k
      for (i = 0; i < 16; i++)
508
54.8k
         if (inUse16[i])
509
617k
            for (j = 0; j < 16; j++) {
510
581k
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
581k
            }
512
513
3.42k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
3.42k
   }
516
517
   /*--- Now the selectors. ---*/
518
3.42k
   nBytes = s->numZ;
519
3.42k
   bsW ( s, 3, nGroups );
520
3.42k
   bsW ( s, 15, nSelectors );
521
1.70M
   for (i = 0; i < nSelectors; i++) { 
522
3.99M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
1.69M
      bsW(s,1,0);
524
1.69M
   }
525
3.42k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
3.42k
   nBytes = s->numZ;
530
531
16.4k
   for (t = 0; t < nGroups; t++) {
532
12.9k
      Int32 curr = s->len[t][0];
533
12.9k
      bsW ( s, 5, curr );
534
2.10M
      for (i = 0; i < alphaSize; i++) {
535
2.52M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
2.48M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
2.09M
         bsW ( s, 1, 0 );
538
2.09M
      }
539
12.9k
   }
540
541
3.42k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
3.42k
   nBytes = s->numZ;
546
3.42k
   selCtr = 0;
547
3.42k
   gs = 0;
548
1.70M
   while (True) {
549
1.70M
      if (gs >= s->nMTF) break;
550
1.69M
      ge = gs + BZ_G_SIZE - 1; 
551
1.69M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
1.69M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
1.69M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
1.68M
            UInt16 mtfv_i;
557
1.68M
            UChar* s_len_sel_selCtr 
558
1.68M
               = &(s->len[s->selector[selCtr]][0]);
559
1.68M
            Int32* s_code_sel_selCtr
560
1.68M
               = &(s->code[s->selector[selCtr]][0]);
561
562
1.68M
#           define BZ_ITAH(nn)                      \
563
84.0M
               mtfv_i = mtfv[gs+(nn)];              \
564
84.0M
               bsW ( s,                             \
565
84.0M
                     s_len_sel_selCtr[mtfv_i],      \
566
84.0M
                     s_code_sel_selCtr[mtfv_i] )
567
568
1.68M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
1.68M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
1.68M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
1.68M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
1.68M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
1.68M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
1.68M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
1.68M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
1.68M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
1.68M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
1.68M
#           undef BZ_ITAH
580
581
1.68M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
709k
         for (i = gs; i <= ge; i++) {
584
693k
            bsW ( s, 
585
693k
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
693k
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
693k
         }
588
15.6k
      }
589
590
591
1.69M
      gs = ge+1;
592
1.69M
      selCtr++;
593
1.69M
   }
594
3.42k
   AssertH( selCtr == nSelectors, 3007 );
595
596
3.42k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
3.42k
}
599
600
601
/*---------------------------------------------------*/
602
void BZ2_compressBlock ( EState* s, Bool is_last_block )
603
3.42k
{
604
3.42k
   if (s->nblock > 0) {
605
606
3.42k
      BZ_FINALISE_CRC ( s->blockCRC );
607
3.42k
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
608
3.42k
      s->combinedCRC ^= s->blockCRC;
609
3.42k
      if (s->blockNo > 1) s->numZ = 0;
610
611
3.42k
      if (s->verbosity >= 2)
612
0
         VPrintf4( "    block %d: crc = 0x%08x, "
613
3.42k
                   "combined CRC = 0x%08x, size = %d\n",
614
3.42k
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
615
616
3.42k
      BZ2_blockSort ( s );
617
3.42k
   }
618
619
3.42k
   s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
620
621
   /*-- If this is the first block, create the stream header. --*/
622
3.42k
   if (s->blockNo == 1) {
623
3.29k
      BZ2_bsInitWrite ( s );
624
3.29k
      bsPutUChar ( s, BZ_HDR_B );
625
3.29k
      bsPutUChar ( s, BZ_HDR_Z );
626
3.29k
      bsPutUChar ( s, BZ_HDR_h );
627
3.29k
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
628
3.29k
   }
629
630
3.42k
   if (s->nblock > 0) {
631
632
3.42k
      bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
633
3.42k
      bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
634
3.42k
      bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
635
636
      /*-- Now the block's CRC, so it is in a known place. --*/
637
3.42k
      bsPutUInt32 ( s, s->blockCRC );
638
639
      /*-- 
640
         Now a single bit indicating (non-)randomisation. 
641
         As of version 0.9.5, we use a better sorting algorithm
642
         which makes randomisation unnecessary.  So always set
643
         the randomised bit to 'no'.  Of course, the decoder
644
         still needs to be able to handle randomised blocks
645
         so as to maintain backwards compatibility with
646
         older versions of bzip2.
647
      --*/
648
3.42k
      bsW(s,1,0);
649
650
3.42k
      bsW ( s, 24, s->origPtr );
651
3.42k
      generateMTFValues ( s );
652
3.42k
      sendMTFValues ( s );
653
3.42k
   }
654
655
656
   /*-- If this is the last block, add the stream trailer. --*/
657
3.42k
   if (is_last_block) {
658
659
3.29k
      bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
660
3.29k
      bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
661
3.29k
      bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
662
3.29k
      bsPutUInt32 ( s, s->combinedCRC );
663
3.29k
      if (s->verbosity >= 2)
664
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
665
3.29k
      bsFinishWrite ( s );
666
3.29k
   }
667
3.42k
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/