Coverage Report

Created: 2026-02-14 06:33

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/bzip2/compress.c
Line
Count
Source
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
/* Reset the output bit buffer of s: clears the accumulator word
   and marks zero bits as pending. */
void BZ2_bsInitWrite ( EState* s )
{
   s->bsBuff = 0;
   s->bsLive = 0;
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
2.96k
{
48
8.52k
   while (s->bsLive > 0) {
49
5.55k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
5.55k
      s->numZ++;
51
5.55k
      s->bsBuff <<= 8;
52
5.55k
      s->bsLive -= 8;
53
5.55k
   }
54
2.96k
}
55
56
57
/*---------------------------------------------------*/
58
86.5M
/* Drain complete bytes from the bit accumulator: while at least 8
   bits are pending in s->bsBuff, copy the top byte to
   s->zbits[s->numZ] and shift it out.  Expects a variable named `s`
   in scope at the point of use.  The argument nz is accepted for
   interface compatibility but is not used by the expansion.
   Wrapped in do { } while (0) so that `bsNEEDW(n);` behaves as one
   statement, including inside an unbraced if/else. */
#define bsNEEDW(nz)                           \
do {                                          \
   while (s->bsLive >= 8) {                   \
      s->zbits[s->numZ]                       \
         = (UChar)(s->bsBuff >> 24);          \
      s->numZ++;                              \
      s->bsBuff <<= 8;                        \
      s->bsLive -= 8;                         \
   }                                          \
} while (0)
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
86.5M
{
75
86.5M
   bsNEEDW ( n );
76
86.5M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
86.5M
   s->bsLive += n;
78
86.5M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
6.06k
{
85
6.06k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
6.06k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
6.06k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
6.06k
   bsW ( s, 8,  u        & 0xffL );
89
6.06k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
48.2k
{
96
48.2k
   bsW( s, 8, (UInt32)c );
97
48.2k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
3.09k
{
108
3.09k
   Int32 i;
109
3.09k
   s->nInUse = 0;
110
796k
   for (i = 0; i < 256; i++)
111
793k
      if (s->inUse[i]) {
112
348k
         s->unseqToSeq[i] = s->nInUse;
113
348k
         s->nInUse++;
114
348k
      }
115
3.09k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
3.09k
{
122
3.09k
   UChar   yy[256];
123
3.09k
   Int32   i, j;
124
3.09k
   Int32   zPend;
125
3.09k
   Int32   wr;
126
3.09k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
3.09k
   UInt32* ptr   = s->ptr;
151
3.09k
   UChar* block  = s->block;
152
3.09k
   UInt16* mtfv  = s->mtfv;
153
154
3.09k
   makeMaps_e ( s );
155
3.09k
   EOB = s->nInUse+1;
156
157
358k
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
3.09k
   wr = 0;
160
3.09k
   zPend = 0;
161
352k
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
224M
   for (i = 0; i < s->nblock; i++) {
164
224M
      UChar ll_i;
165
224M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
224M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
224M
      ll_i = s->unseqToSeq[block[j]];
168
224M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
224M
      if (yy[0] == ll_i) { 
171
160M
         zPend++;
172
160M
      } else {
173
174
64.4M
         if (zPend > 0) {
175
12.9M
            zPend--;
176
14.8M
            while (True) {
177
14.8M
               if (zPend & 1) {
178
1.64M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
1.64M
                  s->mtfFreq[BZ_RUNB]++; 
180
13.2M
               } else {
181
13.2M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
13.2M
                  s->mtfFreq[BZ_RUNA]++; 
183
13.2M
               }
184
14.8M
               if (zPend < 2) break;
185
1.90M
               zPend = (zPend - 2) / 2;
186
1.90M
            };
187
12.9M
            zPend = 0;
188
12.9M
         }
189
64.4M
         {
190
64.4M
            register UChar  rtmp;
191
64.4M
            register UChar* ryy_j;
192
64.4M
            register UChar  rll_i;
193
64.4M
            rtmp  = yy[1];
194
64.4M
            yy[1] = yy[0];
195
64.4M
            ryy_j = &(yy[1]);
196
64.4M
            rll_i = ll_i;
197
6.44G
            while ( rll_i != rtmp ) {
198
6.37G
               register UChar rtmp2;
199
6.37G
               ryy_j++;
200
6.37G
               rtmp2  = rtmp;
201
6.37G
               rtmp   = *ryy_j;
202
6.37G
               *ryy_j = rtmp2;
203
6.37G
            };
204
64.4M
            yy[0] = rtmp;
205
64.4M
            j = ryy_j - &(yy[0]);
206
64.4M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
64.4M
         }
208
209
64.4M
      }
210
224M
   }
211
212
3.09k
   if (zPend > 0) {
213
1.55k
      zPend--;
214
7.71k
      while (True) {
215
7.71k
         if (zPend & 1) {
216
3.62k
            mtfv[wr] = BZ_RUNB; wr++; 
217
3.62k
            s->mtfFreq[BZ_RUNB]++; 
218
4.09k
         } else {
219
4.09k
            mtfv[wr] = BZ_RUNA; wr++; 
220
4.09k
            s->mtfFreq[BZ_RUNA]++; 
221
4.09k
         }
222
7.71k
         if (zPend < 2) break;
223
6.16k
         zPend = (zPend - 2) / 2;
224
6.16k
      };
225
1.55k
      zPend = 0;
226
1.55k
   }
227
228
3.09k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
3.09k
   s->nMTF = wr;
231
3.09k
}
232
233
234
/*---------------------------------------------------*/
235
355k
#define BZ_LESSER_ICOST  0
236
3.69M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
3.09k
{
241
3.09k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
3.09k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
3.09k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
3.09k
   UInt16 cost[BZ_N_GROUPS];
257
3.09k
   Int32  fave[BZ_N_GROUPS];
258
259
3.09k
   UInt16* mtfv = s->mtfv;
260
261
3.09k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
3.09k
                "%d+2 syms in use\n", 
264
3.09k
                s->nblock, s->nMTF, s->nInUse );
265
266
3.09k
   alphaSize = s->nInUse+2;
267
21.6k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
2.14M
      for (v = 0; v < alphaSize; v++)
269
2.13M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
3.09k
   AssertH ( s->nMTF > 0, 3001 );
273
3.09k
   if (s->nMTF < 200)  nGroups = 2; else
274
1.86k
   if (s->nMTF < 600)  nGroups = 3; else
275
1.42k
   if (s->nMTF < 1200) nGroups = 4; else
276
1.23k
   if (s->nMTF < 2400) nGroups = 5; else
277
1.10k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
3.09k
   { 
281
3.09k
      Int32 nPart, remF, tFreq, aFreq;
282
283
3.09k
      nPart = nGroups;
284
3.09k
      remF  = s->nMTF;
285
3.09k
      gs = 0;
286
14.9k
      while (nPart > 0) {
287
11.8k
         tFreq = remF / nPart;
288
11.8k
         ge = gs-1;
289
11.8k
         aFreq = 0;
290
369k
         while (aFreq < tFreq && ge < alphaSize-1) {
291
357k
            ge++;
292
357k
            aFreq += s->mtfFreq[ge];
293
357k
         }
294
295
11.8k
         if (ge > gs 
296
9.51k
             && nPart != nGroups && nPart != 1 
297
4.62k
             && ((nGroups-nPart) % 2 == 1)) {
298
2.37k
            aFreq -= s->mtfFreq[ge];
299
2.37k
            ge--;
300
2.37k
         }
301
302
11.8k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
11.8k
                      "has %d syms (%4.1f%%)\n",
305
11.8k
                      nPart, gs, ge, aFreq, 
306
11.8k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
1.93M
         for (v = 0; v < alphaSize; v++)
309
1.92M
            if (v >= gs && v <= ge) 
310
355k
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
1.56M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
11.8k
         nPart--;
314
11.8k
         gs = ge+1;
315
11.8k
         remF -= aFreq;
316
11.8k
      }
317
3.09k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
15.4k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
86.7k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
59.7k
      for (t = 0; t < nGroups; t++)
327
7.74M
         for (v = 0; v < alphaSize; v++)
328
7.69M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
12.3k
      if (nGroups == 6) {
335
1.08M
         for (v = 0; v < alphaSize; v++) {
336
1.08M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
1.08M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
1.08M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
1.08M
   }
340
4.43k
      }
341
342
12.3k
      nSelectors = 0;
343
12.3k
      totc = 0;
344
12.3k
      gs = 0;
345
6.36M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
6.36M
         if (gs >= s->nMTF) break;
349
6.35M
         ge = gs + BZ_G_SIZE - 1; 
350
6.35M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
44.4M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
6.35M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
6.30M
            register UInt32 cost01, cost23, cost45;
361
6.30M
            register UInt16 icv;
362
6.30M
            cost01 = cost23 = cost45 = 0;
363
364
6.30M
#           define BZ_ITER(nn)                \
365
315M
               icv = mtfv[gs+(nn)];           \
366
315M
               cost01 += s->len_pack[icv][0]; \
367
315M
               cost23 += s->len_pack[icv][1]; \
368
315M
               cost45 += s->len_pack[icv][2]; \
369
6.30M
370
6.30M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
6.30M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
6.30M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
6.30M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
6.30M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
6.30M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
6.30M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
6.30M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
6.30M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
6.30M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
6.30M
#           undef BZ_ITER
382
383
6.30M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
6.30M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
6.30M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
6.30M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
2.47M
            for (i = gs; i <= ge; i++) { 
390
2.41M
               UInt16 icv = mtfv[i];
391
11.8M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
2.41M
            }
393
54.6k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
6.35M
         bc = 999999999; bt = -1;
400
44.3M
         for (t = 0; t < nGroups; t++)
401
38.0M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
6.35M
         totc += bc;
403
6.35M
         fave[bt]++;
404
6.35M
         s->selector[nSelectors] = bt;
405
6.35M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
6.35M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
315M
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
6.30M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
6.30M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
6.30M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
6.30M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
6.30M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
6.30M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
6.30M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
6.30M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
6.30M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
6.30M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
6.30M
#           undef BZ_ITUR
427
428
6.30M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
2.47M
            for (i = gs; i <= ge; i++)
431
2.41M
               s->rfreq[bt][ mtfv[i] ]++;
432
54.6k
         }
433
434
6.35M
         gs = ge+1;
435
6.35M
      }
436
12.3k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
59.7k
      for (t = 0; t < nGroups; t++)
450
47.3k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
47.3k
                                 alphaSize, 17 /*20*/ );
452
12.3k
   }
453
454
455
3.09k
   AssertH( nGroups < 8, 3002 );
456
3.09k
   AssertH( nSelectors < 32768 &&
457
3.09k
            nSelectors <= BZ_MAX_SELECTORS,
458
3.09k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
3.09k
   {
463
3.09k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
14.9k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
1.59M
      for (i = 0; i < nSelectors; i++) {
466
1.58M
         ll_i = s->selector[i];
467
1.58M
         j = 0;
468
1.58M
         tmp = pos[j];
469
3.78M
         while ( ll_i != tmp ) {
470
2.19M
            j++;
471
2.19M
            tmp2 = tmp;
472
2.19M
            tmp = pos[j];
473
2.19M
            pos[j] = tmp2;
474
2.19M
         };
475
1.58M
         pos[0] = tmp;
476
1.58M
         s->selectorMtf[i] = j;
477
1.58M
      }
478
3.09k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
14.9k
   for (t = 0; t < nGroups; t++) {
482
11.8k
      minLen = 32;
483
11.8k
      maxLen = 0;
484
1.93M
      for (i = 0; i < alphaSize; i++) {
485
1.92M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
1.92M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
1.92M
      }
488
11.8k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
11.8k
      AssertH ( !(minLen < 1),  3005 );
490
11.8k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
11.8k
                          minLen, maxLen, alphaSize );
492
11.8k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
3.09k
   { 
496
3.09k
      Bool inUse16[16];
497
52.6k
      for (i = 0; i < 16; i++) {
498
49.5k
          inUse16[i] = False;
499
842k
          for (j = 0; j < 16; j++)
500
793k
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
49.5k
      }
502
     
503
3.09k
      nBytes = s->numZ;
504
52.6k
      for (i = 0; i < 16; i++)
505
49.5k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
52.6k
      for (i = 0; i < 16; i++)
508
49.5k
         if (inUse16[i])
509
558k
            for (j = 0; j < 16; j++) {
510
525k
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
525k
            }
512
513
3.09k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
3.09k
   }
516
517
   /*--- Now the selectors. ---*/
518
3.09k
   nBytes = s->numZ;
519
3.09k
   bsW ( s, 3, nGroups );
520
3.09k
   bsW ( s, 15, nSelectors );
521
1.59M
   for (i = 0; i < nSelectors; i++) { 
522
3.78M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
1.58M
      bsW(s,1,0);
524
1.58M
   }
525
3.09k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
3.09k
   nBytes = s->numZ;
530
531
14.9k
   for (t = 0; t < nGroups; t++) {
532
11.8k
      Int32 curr = s->len[t][0];
533
11.8k
      bsW ( s, 5, curr );
534
1.93M
      for (i = 0; i < alphaSize; i++) {
535
2.32M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
2.28M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
1.92M
         bsW ( s, 1, 0 );
538
1.92M
      }
539
11.8k
   }
540
541
3.09k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
3.09k
   nBytes = s->numZ;
546
3.09k
   selCtr = 0;
547
3.09k
   gs = 0;
548
1.59M
   while (True) {
549
1.59M
      if (gs >= s->nMTF) break;
550
1.58M
      ge = gs + BZ_G_SIZE - 1; 
551
1.58M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
1.58M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
1.58M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
1.57M
            UInt16 mtfv_i;
557
1.57M
            UChar* s_len_sel_selCtr 
558
1.57M
               = &(s->len[s->selector[selCtr]][0]);
559
1.57M
            Int32* s_code_sel_selCtr
560
1.57M
               = &(s->code[s->selector[selCtr]][0]);
561
562
1.57M
#           define BZ_ITAH(nn)                      \
563
78.7M
               mtfv_i = mtfv[gs+(nn)];              \
564
78.7M
               bsW ( s,                             \
565
78.7M
                     s_len_sel_selCtr[mtfv_i],      \
566
78.7M
                     s_code_sel_selCtr[mtfv_i] )
567
568
1.57M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
1.57M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
1.57M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
1.57M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
1.57M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
1.57M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
1.57M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
1.57M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
1.57M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
1.57M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
1.57M
#           undef BZ_ITAH
580
581
1.57M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
617k
         for (i = gs; i <= ge; i++) {
584
603k
            bsW ( s, 
585
603k
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
603k
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
603k
         }
588
13.6k
      }
589
590
591
1.58M
      gs = ge+1;
592
1.58M
      selCtr++;
593
1.58M
   }
594
3.09k
   AssertH( selCtr == nSelectors, 3007 );
595
596
3.09k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
3.09k
}
599
600
601
/*---------------------------------------------------*/
602
/* Compress the block currently held in s and append it to the
   output bit stream.  When s->nblock > 0 the block CRC is
   finalised and folded into the combined CRC, the block is sorted,
   and the block header, MTF values and coded data are written.
   The stream header is written when s->blockNo == 1; the stream
   trailer and a final flush are written when is_last_block is
   set. */
void BZ2_compressBlock ( EState* s, Bool is_last_block )
{
   static const UChar blockMagic[6]
      = { 0x31, 0x41, 0x59, 0x26, 0x53, 0x59 };
   static const UChar trailerMagic[6]
      = { 0x17, 0x72, 0x45, 0x38, 0x50, 0x90 };
   Int32 k;

   if (s->nblock > 0) {

      BZ_FINALISE_CRC ( s->blockCRC );
      /* rotate the running CRC left by one bit, then mix in this block */
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
      s->combinedCRC ^= s->blockCRC;
      if (s->blockNo > 1) s->numZ = 0;

      if (s->verbosity >= 2) {
         VPrintf4( "    block %d: crc = 0x%08x, "
                   "combined CRC = 0x%08x, size = %d\n",
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
      }

      BZ2_blockSort ( s );
   }

   /* compressed output is built directly after the block bytes in arr2 */
   s->zbits = ((UChar*)s->arr2) + s->nblock;

   /*-- If this is the first block, create the stream header. --*/
   if (s->blockNo == 1) {
      BZ2_bsInitWrite ( s );
      bsPutUChar ( s, BZ_HDR_B );
      bsPutUChar ( s, BZ_HDR_Z );
      bsPutUChar ( s, BZ_HDR_h );
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
   }

   if (s->nblock > 0) {

      for (k = 0; k < 6; k++) bsPutUChar ( s, blockMagic[k] );

      /*-- Now the block's CRC, so it is in a known place. --*/
      bsPutUInt32 ( s, s->blockCRC );

      /*-- 
         Now a single bit indicating (non-)randomisation. 
         As of version 0.9.5, we use a better sorting algorithm
         which makes randomisation unnecessary.  So always set
         the randomised bit to 'no'.  Of course, the decoder
         still needs to be able to handle randomised blocks
         so as to maintain backwards compatibility with
         older versions of bzip2.
      --*/
      bsW(s,1,0);

      bsW ( s, 24, s->origPtr );
      generateMTFValues ( s );
      sendMTFValues ( s );
   }


   /*-- If this is the last block, add the stream trailer. --*/
   if (is_last_block) {

      for (k = 0; k < 6; k++) bsPutUChar ( s, trailerMagic[k] );
      bsPutUInt32 ( s, s->combinedCRC );
      if (s->verbosity >= 2) {
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
      }
      bsFinishWrite ( s );
   }
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/