Coverage Report

Created: 2026-05-16 06:13

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/bzip2/compress.c
Line
Count
Source
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
void BZ2_bsInitWrite ( EState* s )
38
3.95k
{
39
3.95k
   s->bsLive = 0;
40
3.95k
   s->bsBuff = 0;
41
3.95k
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
3.95k
{
48
11.3k
   while (s->bsLive > 0) {
49
7.36k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
7.36k
      s->numZ++;
51
7.36k
      s->bsBuff <<= 8;
52
7.36k
      s->bsLive -= 8;
53
7.36k
   }
54
3.95k
}
55
56
57
/*---------------------------------------------------*/
58
205M
#define bsNEEDW(nz)                           \
59
205M
{                                             \
60
374M
   while (s->bsLive >= 8) {                   \
61
168M
      s->zbits[s->numZ]                       \
62
168M
         = (UChar)(s->bsBuff >> 24);          \
63
168M
      s->numZ++;                              \
64
168M
      s->bsBuff <<= 8;                        \
65
168M
      s->bsLive -= 8;                         \
66
168M
   }                                          \
67
205M
}
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
205M
{
75
205M
   bsNEEDW ( n );
76
205M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
205M
   s->bsLive += n;
78
205M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
9.60k
{
85
9.60k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
9.60k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
9.60k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
9.60k
   bsW ( s, 8,  u        & 0xffL );
89
9.60k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
73.4k
{
96
73.4k
   bsW( s, 8, (UInt32)c );
97
73.4k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
5.65k
{
108
5.65k
   Int32 i;
109
5.65k
   s->nInUse = 0;
110
1.45M
   for (i = 0; i < 256; i++)
111
1.44M
      if (s->inUse[i]) {
112
686k
         s->unseqToSeq[i] = s->nInUse;
113
686k
         s->nInUse++;
114
686k
      }
115
5.65k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
5.65k
{
122
5.65k
   UChar   yy[256];
123
5.65k
   Int32   i, j;
124
5.65k
   Int32   zPend;
125
5.65k
   Int32   wr;
126
5.65k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
5.65k
   UInt32* ptr   = s->ptr;
151
5.65k
   UChar* block  = s->block;
152
5.65k
   UInt16* mtfv  = s->mtfv;
153
154
5.65k
   makeMaps_e ( s );
155
5.65k
   EOB = s->nInUse+1;
156
157
703k
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
5.65k
   wr = 0;
160
5.65k
   zPend = 0;
161
691k
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
362M
   for (i = 0; i < s->nblock; i++) {
164
362M
      UChar ll_i;
165
362M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
362M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
362M
      ll_i = s->unseqToSeq[block[j]];
168
362M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
362M
      if (yy[0] == ll_i) { 
171
192M
         zPend++;
172
192M
      } else {
173
174
169M
         if (zPend > 0) {
175
15.5M
            zPend--;
176
19.2M
            while (True) {
177
19.2M
               if (zPend & 1) {
178
2.83M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
2.83M
                  s->mtfFreq[BZ_RUNB]++; 
180
16.4M
               } else {
181
16.4M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
16.4M
                  s->mtfFreq[BZ_RUNA]++; 
183
16.4M
               }
184
19.2M
               if (zPend < 2) break;
185
3.69M
               zPend = (zPend - 2) / 2;
186
3.69M
            };
187
15.5M
            zPend = 0;
188
15.5M
         }
189
169M
         {
190
169M
            register UChar  rtmp;
191
169M
            register UChar* ryy_j;
192
169M
            register UChar  rll_i;
193
169M
            rtmp  = yy[1];
194
169M
            yy[1] = yy[0];
195
169M
            ryy_j = &(yy[1]);
196
169M
            rll_i = ll_i;
197
18.0G
            while ( rll_i != rtmp ) {
198
17.8G
               register UChar rtmp2;
199
17.8G
               ryy_j++;
200
17.8G
               rtmp2  = rtmp;
201
17.8G
               rtmp   = *ryy_j;
202
17.8G
               *ryy_j = rtmp2;
203
17.8G
            };
204
169M
            yy[0] = rtmp;
205
169M
            j = ryy_j - &(yy[0]);
206
169M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
169M
         }
208
209
169M
      }
210
362M
   }
211
212
5.65k
   if (zPend > 0) {
213
2.25k
      zPend--;
214
8.99k
      while (True) {
215
8.99k
         if (zPend & 1) {
216
3.73k
            mtfv[wr] = BZ_RUNB; wr++; 
217
3.73k
            s->mtfFreq[BZ_RUNB]++; 
218
5.26k
         } else {
219
5.26k
            mtfv[wr] = BZ_RUNA; wr++; 
220
5.26k
            s->mtfFreq[BZ_RUNA]++; 
221
5.26k
         }
222
8.99k
         if (zPend < 2) break;
223
6.74k
         zPend = (zPend - 2) / 2;
224
6.74k
      };
225
2.25k
      zPend = 0;
226
2.25k
   }
227
228
5.65k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
5.65k
   s->nMTF = wr;
231
5.65k
}
232
233
234
/*---------------------------------------------------*/
235
697k
#define BZ_LESSER_ICOST  0
236
7.30M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
5.65k
{
241
5.65k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
5.65k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
5.65k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
5.65k
   UInt16 cost[BZ_N_GROUPS];
257
5.65k
   Int32  fave[BZ_N_GROUPS];
258
259
5.65k
   UInt16* mtfv = s->mtfv;
260
261
5.65k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
5.65k
                "%d+2 syms in use\n", 
264
5.65k
                s->nblock, s->nMTF, s->nInUse );
265
266
5.65k
   alphaSize = s->nInUse+2;
267
39.5k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
4.21M
      for (v = 0; v < alphaSize; v++)
269
4.18M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
5.65k
   AssertH ( s->nMTF > 0, 3001 );
273
5.65k
   if (s->nMTF < 200)  nGroups = 2; else
274
3.71k
   if (s->nMTF < 600)  nGroups = 3; else
275
2.91k
   if (s->nMTF < 1200) nGroups = 4; else
276
2.61k
   if (s->nMTF < 2400) nGroups = 5; else
277
2.34k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
5.65k
   { 
281
5.65k
      Int32 nPart, remF, tFreq, aFreq;
282
283
5.65k
      nPart = nGroups;
284
5.65k
      remF  = s->nMTF;
285
5.65k
      gs = 0;
286
28.5k
      while (nPart > 0) {
287
22.8k
         tFreq = remF / nPart;
288
22.8k
         ge = gs-1;
289
22.8k
         aFreq = 0;
290
725k
         while (aFreq < tFreq && ge < alphaSize-1) {
291
702k
            ge++;
292
702k
            aFreq += s->mtfFreq[ge];
293
702k
         }
294
295
22.8k
         if (ge > gs 
296
18.6k
             && nPart != nGroups && nPart != 1 
297
9.58k
             && ((nGroups-nPart) % 2 == 1)) {
298
5.00k
            aFreq -= s->mtfFreq[ge];
299
5.00k
            ge--;
300
5.00k
         }
301
302
22.8k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
22.8k
                      "has %d syms (%4.1f%%)\n",
305
22.8k
                      nPart, gs, ge, aFreq, 
306
22.8k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
3.84M
         for (v = 0; v < alphaSize; v++)
309
3.82M
            if (v >= gs && v <= ge) 
310
697k
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
3.12M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
22.8k
         nPart--;
314
22.8k
         gs = ge+1;
315
22.8k
         remF -= aFreq;
316
22.8k
      }
317
5.65k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
28.2k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
158k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
114k
      for (t = 0; t < nGroups; t++)
327
15.3M
         for (v = 0; v < alphaSize; v++)
328
15.2M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
22.6k
      if (nGroups == 6) {
335
2.21M
         for (v = 0; v < alphaSize; v++) {
336
2.20M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
2.20M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
2.20M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
2.20M
   }
340
9.38k
      }
341
342
22.6k
      nSelectors = 0;
343
22.6k
      totc = 0;
344
22.6k
      gs = 0;
345
15.1M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
15.1M
         if (gs >= s->nMTF) break;
349
15.0M
         ge = gs + BZ_G_SIZE - 1; 
350
15.0M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
105M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
15.0M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
14.9M
            register UInt32 cost01, cost23, cost45;
361
14.9M
            register UInt16 icv;
362
14.9M
            cost01 = cost23 = cost45 = 0;
363
364
14.9M
#           define BZ_ITER(nn)                \
365
749M
               icv = mtfv[gs+(nn)];           \
366
749M
               cost01 += s->len_pack[icv][0]; \
367
749M
               cost23 += s->len_pack[icv][1]; \
368
749M
               cost45 += s->len_pack[icv][2]; \
369
14.9M
370
14.9M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
14.9M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
14.9M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
14.9M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
14.9M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
14.9M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
14.9M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
14.9M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
14.9M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
14.9M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
14.9M
#           undef BZ_ITER
382
383
14.9M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
14.9M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
14.9M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
14.9M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
4.67M
            for (i = gs; i <= ge; i++) { 
390
4.57M
               UInt16 icv = mtfv[i];
391
23.0M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
4.57M
            }
393
103k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
15.0M
         bc = 999999999; bt = -1;
400
105M
         for (t = 0; t < nGroups; t++)
401
90.3M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
15.0M
         totc += bc;
403
15.0M
         fave[bt]++;
404
15.0M
         s->selector[nSelectors] = bt;
405
15.0M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
15.0M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
749M
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
14.9M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
14.9M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
14.9M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
14.9M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
14.9M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
14.9M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
14.9M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
14.9M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
14.9M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
14.9M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
14.9M
#           undef BZ_ITUR
427
428
14.9M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
4.67M
            for (i = gs; i <= ge; i++)
431
4.57M
               s->rfreq[bt][ mtfv[i] ]++;
432
103k
         }
433
434
15.0M
         gs = ge+1;
435
15.0M
      }
436
22.6k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
114k
      for (t = 0; t < nGroups; t++)
450
91.5k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
91.5k
                                 alphaSize, 17 /*20*/ );
452
22.6k
   }
453
454
455
5.65k
   AssertH( nGroups < 8, 3002 );
456
5.65k
   AssertH( nSelectors < 32768 &&
457
5.65k
            nSelectors <= BZ_MAX_SELECTORS,
458
5.65k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
5.65k
   {
463
5.65k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
28.5k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
3.78M
      for (i = 0; i < nSelectors; i++) {
466
3.77M
         ll_i = s->selector[i];
467
3.77M
         j = 0;
468
3.77M
         tmp = pos[j];
469
10.4M
         while ( ll_i != tmp ) {
470
6.69M
            j++;
471
6.69M
            tmp2 = tmp;
472
6.69M
            tmp = pos[j];
473
6.69M
            pos[j] = tmp2;
474
6.69M
         };
475
3.77M
         pos[0] = tmp;
476
3.77M
         s->selectorMtf[i] = j;
477
3.77M
      }
478
5.65k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
28.5k
   for (t = 0; t < nGroups; t++) {
482
22.8k
      minLen = 32;
483
22.8k
      maxLen = 0;
484
3.84M
      for (i = 0; i < alphaSize; i++) {
485
3.82M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
3.82M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
3.82M
      }
488
22.8k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
22.8k
      AssertH ( !(minLen < 1),  3005 );
490
22.8k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
22.8k
                          minLen, maxLen, alphaSize );
492
22.8k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
5.65k
   { 
496
5.65k
      Bool inUse16[16];
497
96.1k
      for (i = 0; i < 16; i++) {
498
90.4k
          inUse16[i] = False;
499
1.53M
          for (j = 0; j < 16; j++)
500
1.44M
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
90.4k
      }
502
     
503
5.65k
      nBytes = s->numZ;
504
96.1k
      for (i = 0; i < 16; i++)
505
90.4k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
96.1k
      for (i = 0; i < 16; i++)
508
90.4k
         if (inUse16[i])
509
1.06M
            for (j = 0; j < 16; j++) {
510
1.00M
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
1.00M
            }
512
513
5.65k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
5.65k
   }
516
517
   /*--- Now the selectors. ---*/
518
5.65k
   nBytes = s->numZ;
519
5.65k
   bsW ( s, 3, nGroups );
520
5.65k
   bsW ( s, 15, nSelectors );
521
3.78M
   for (i = 0; i < nSelectors; i++) { 
522
10.4M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
3.77M
      bsW(s,1,0);
524
3.77M
   }
525
5.65k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
5.65k
   nBytes = s->numZ;
530
531
28.5k
   for (t = 0; t < nGroups; t++) {
532
22.8k
      Int32 curr = s->len[t][0];
533
22.8k
      bsW ( s, 5, curr );
534
3.84M
      for (i = 0; i < alphaSize; i++) {
535
4.60M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
4.52M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
3.82M
         bsW ( s, 1, 0 );
538
3.82M
      }
539
22.8k
   }
540
541
5.65k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
5.65k
   nBytes = s->numZ;
546
5.65k
   selCtr = 0;
547
5.65k
   gs = 0;
548
3.78M
   while (True) {
549
3.78M
      if (gs >= s->nMTF) break;
550
3.77M
      ge = gs + BZ_G_SIZE - 1; 
551
3.77M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
3.77M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
3.77M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
3.74M
            UInt16 mtfv_i;
557
3.74M
            UChar* s_len_sel_selCtr 
558
3.74M
               = &(s->len[s->selector[selCtr]][0]);
559
3.74M
            Int32* s_code_sel_selCtr
560
3.74M
               = &(s->code[s->selector[selCtr]][0]);
561
562
3.74M
#           define BZ_ITAH(nn)                      \
563
187M
               mtfv_i = mtfv[gs+(nn)];              \
564
187M
               bsW ( s,                             \
565
187M
                     s_len_sel_selCtr[mtfv_i],      \
566
187M
                     s_code_sel_selCtr[mtfv_i] )
567
568
3.74M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
3.74M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
3.74M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
3.74M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
3.74M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
3.74M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
3.74M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
3.74M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
3.74M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
3.74M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
3.74M
#           undef BZ_ITAH
580
581
3.74M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
1.16M
         for (i = gs; i <= ge; i++) {
584
1.14M
            bsW ( s, 
585
1.14M
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
1.14M
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
1.14M
         }
588
25.8k
      }
589
590
591
3.77M
      gs = ge+1;
592
3.77M
      selCtr++;
593
3.77M
   }
594
5.65k
   AssertH( selCtr == nSelectors, 3007 );
595
596
5.65k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
5.65k
}
599
600
601
/*---------------------------------------------------*/
602
void BZ2_compressBlock ( EState* s, Bool is_last_block )
603
5.65k
{
604
5.65k
   if (s->nblock > 0) {
605
606
5.65k
      BZ_FINALISE_CRC ( s->blockCRC );
607
5.65k
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
608
5.65k
      s->combinedCRC ^= s->blockCRC;
609
5.65k
      if (s->blockNo > 1) s->numZ = 0;
610
611
5.65k
      if (s->verbosity >= 2)
612
0
         VPrintf4( "    block %d: crc = 0x%08x, "
613
5.65k
                   "combined CRC = 0x%08x, size = %d\n",
614
5.65k
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
615
616
5.65k
      BZ2_blockSort ( s );
617
5.65k
   }
618
619
5.65k
   s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
620
621
   /*-- If this is the first block, create the stream header. --*/
622
5.65k
   if (s->blockNo == 1) {
623
3.95k
      BZ2_bsInitWrite ( s );
624
3.95k
      bsPutUChar ( s, BZ_HDR_B );
625
3.95k
      bsPutUChar ( s, BZ_HDR_Z );
626
3.95k
      bsPutUChar ( s, BZ_HDR_h );
627
3.95k
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
628
3.95k
   }
629
630
5.65k
   if (s->nblock > 0) {
631
632
5.65k
      bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
633
5.65k
      bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
634
5.65k
      bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
635
636
      /*-- Now the block's CRC, so it is in a known place. --*/
637
5.65k
      bsPutUInt32 ( s, s->blockCRC );
638
639
      /*-- 
640
         Now a single bit indicating (non-)randomisation. 
641
         As of version 0.9.5, we use a better sorting algorithm
642
         which makes randomisation unnecessary.  So always set
643
         the randomised bit to 'no'.  Of course, the decoder
644
         still needs to be able to handle randomised blocks
645
         so as to maintain backwards compatibility with
646
         older versions of bzip2.
647
      --*/
648
5.65k
      bsW(s,1,0);
649
650
5.65k
      bsW ( s, 24, s->origPtr );
651
5.65k
      generateMTFValues ( s );
652
5.65k
      sendMTFValues ( s );
653
5.65k
   }
654
655
656
   /*-- If this is the last block, add the stream trailer. --*/
657
5.65k
   if (is_last_block) {
658
659
3.95k
      bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
660
3.95k
      bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
661
3.95k
      bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
662
3.95k
      bsPutUInt32 ( s, s->combinedCRC );
663
3.95k
      if (s->verbosity >= 2)
664
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
665
3.95k
      bsFinishWrite ( s );
666
3.95k
   }
667
5.65k
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/