Coverage Report

Created: 2026-02-26 07:00

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/bzip2/compress.c
Line
Count
Source
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
void BZ2_bsInitWrite ( EState* s )
38
3.60k
{
39
3.60k
   s->bsLive = 0;
40
3.60k
   s->bsBuff = 0;
41
3.60k
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
3.60k
{
48
10.3k
   while (s->bsLive > 0) {
49
6.74k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
6.74k
      s->numZ++;
51
6.74k
      s->bsBuff <<= 8;
52
6.74k
      s->bsLive -= 8;
53
6.74k
   }
54
3.60k
}
55
56
57
/*---------------------------------------------------*/
58
175M
#define bsNEEDW(nz)                           \
59
175M
{                                             \
60
316M
   while (s->bsLive >= 8) {                   \
61
141M
      s->zbits[s->numZ]                       \
62
141M
         = (UChar)(s->bsBuff >> 24);          \
63
141M
      s->numZ++;                              \
64
141M
      s->bsBuff <<= 8;                        \
65
141M
      s->bsLive -= 8;                         \
66
141M
   }                                          \
67
175M
}
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
175M
{
75
175M
   bsNEEDW ( n );
76
175M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
175M
   s->bsLive += n;
78
175M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
7.52k
{
85
7.52k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
7.52k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
7.52k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
7.52k
   bsW ( s, 8,  u        & 0xffL );
89
7.52k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
59.5k
{
96
59.5k
   bsW( s, 8, (UInt32)c );
97
59.5k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
3.91k
{
108
3.91k
   Int32 i;
109
3.91k
   s->nInUse = 0;
110
1.00M
   for (i = 0; i < 256; i++)
111
1.00M
      if (s->inUse[i]) {
112
467k
         s->unseqToSeq[i] = s->nInUse;
113
467k
         s->nInUse++;
114
467k
      }
115
3.91k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
3.91k
{
122
3.91k
   UChar   yy[256];
123
3.91k
   Int32   i, j;
124
3.91k
   Int32   zPend;
125
3.91k
   Int32   wr;
126
3.91k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
3.91k
   UInt32* ptr   = s->ptr;
151
3.91k
   UChar* block  = s->block;
152
3.91k
   UInt16* mtfv  = s->mtfv;
153
154
3.91k
   makeMaps_e ( s );
155
3.91k
   EOB = s->nInUse+1;
156
157
479k
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
3.91k
   wr = 0;
160
3.91k
   zPend = 0;
161
471k
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
440M
   for (i = 0; i < s->nblock; i++) {
164
440M
      UChar ll_i;
165
440M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
440M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
440M
      ll_i = s->unseqToSeq[block[j]];
168
440M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
440M
      if (yy[0] == ll_i) { 
171
301M
         zPend++;
172
301M
      } else {
173
174
139M
         if (zPend > 0) {
175
19.5M
            zPend--;
176
22.7M
            while (True) {
177
22.7M
               if (zPend & 1) {
178
2.29M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
2.29M
                  s->mtfFreq[BZ_RUNB]++; 
180
20.4M
               } else {
181
20.4M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
20.4M
                  s->mtfFreq[BZ_RUNA]++; 
183
20.4M
               }
184
22.7M
               if (zPend < 2) break;
185
3.26M
               zPend = (zPend - 2) / 2;
186
3.26M
            };
187
19.5M
            zPend = 0;
188
19.5M
         }
189
139M
         {
190
139M
            register UChar  rtmp;
191
139M
            register UChar* ryy_j;
192
139M
            register UChar  rll_i;
193
139M
            rtmp  = yy[1];
194
139M
            yy[1] = yy[0];
195
139M
            ryy_j = &(yy[1]);
196
139M
            rll_i = ll_i;
197
15.4G
            while ( rll_i != rtmp ) {
198
15.2G
               register UChar rtmp2;
199
15.2G
               ryy_j++;
200
15.2G
               rtmp2  = rtmp;
201
15.2G
               rtmp   = *ryy_j;
202
15.2G
               *ryy_j = rtmp2;
203
15.2G
            };
204
139M
            yy[0] = rtmp;
205
139M
            j = ryy_j - &(yy[0]);
206
139M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
139M
         }
208
209
139M
      }
210
440M
   }
211
212
3.91k
   if (zPend > 0) {
213
1.53k
      zPend--;
214
4.70k
      while (True) {
215
4.70k
         if (zPend & 1) {
216
1.89k
            mtfv[wr] = BZ_RUNB; wr++; 
217
1.89k
            s->mtfFreq[BZ_RUNB]++; 
218
2.81k
         } else {
219
2.81k
            mtfv[wr] = BZ_RUNA; wr++; 
220
2.81k
            s->mtfFreq[BZ_RUNA]++; 
221
2.81k
         }
222
4.70k
         if (zPend < 2) break;
223
3.16k
         zPend = (zPend - 2) / 2;
224
3.16k
      };
225
1.53k
      zPend = 0;
226
1.53k
   }
227
228
3.91k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
3.91k
   s->nMTF = wr;
231
3.91k
}
232
233
234
/*---------------------------------------------------*/
235
475k
#define BZ_LESSER_ICOST  0
236
4.93M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
3.91k
{
241
3.91k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
3.91k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
3.91k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
3.91k
   UInt16 cost[BZ_N_GROUPS];
257
3.91k
   Int32  fave[BZ_N_GROUPS];
258
259
3.91k
   UInt16* mtfv = s->mtfv;
260
261
3.91k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
3.91k
                "%d+2 syms in use\n", 
264
3.91k
                s->nblock, s->nMTF, s->nInUse );
265
266
3.91k
   alphaSize = s->nInUse+2;
267
27.4k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
2.87M
      for (v = 0; v < alphaSize; v++)
269
2.85M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
3.91k
   AssertH ( s->nMTF > 0, 3001 );
273
3.91k
   if (s->nMTF < 200)  nGroups = 2; else
274
2.43k
   if (s->nMTF < 600)  nGroups = 3; else
275
1.91k
   if (s->nMTF < 1200) nGroups = 4; else
276
1.69k
   if (s->nMTF < 2400) nGroups = 5; else
277
1.48k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
3.91k
   { 
281
3.91k
      Int32 nPart, remF, tFreq, aFreq;
282
283
3.91k
      nPart = nGroups;
284
3.91k
      remF  = s->nMTF;
285
3.91k
      gs = 0;
286
19.2k
      while (nPart > 0) {
287
15.3k
         tFreq = remF / nPart;
288
15.3k
         ge = gs-1;
289
15.3k
         aFreq = 0;
290
494k
         while (aFreq < tFreq && ge < alphaSize-1) {
291
478k
            ge++;
292
478k
            aFreq += s->mtfFreq[ge];
293
478k
         }
294
295
15.3k
         if (ge > gs 
296
12.3k
             && nPart != nGroups && nPart != 1 
297
6.37k
             && ((nGroups-nPart) % 2 == 1)) {
298
3.35k
            aFreq -= s->mtfFreq[ge];
299
3.35k
            ge--;
300
3.35k
         }
301
302
15.3k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
15.3k
                      "has %d syms (%4.1f%%)\n",
305
15.3k
                      nPart, gs, ge, aFreq, 
306
15.3k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
2.57M
         for (v = 0; v < alphaSize; v++)
309
2.55M
            if (v >= gs && v <= ge) 
310
475k
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
2.07M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
15.3k
         nPart--;
314
15.3k
         gs = ge+1;
315
15.3k
         remF -= aFreq;
316
15.3k
      }
317
3.91k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
19.5k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
109k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
77.1k
      for (t = 0; t < nGroups; t++)
327
10.2M
         for (v = 0; v < alphaSize; v++)
328
10.2M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
15.6k
      if (nGroups == 6) {
335
1.42M
         for (v = 0; v < alphaSize; v++) {
336
1.41M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
1.41M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
1.41M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
1.41M
   }
340
5.93k
      }
341
342
15.6k
      nSelectors = 0;
343
15.6k
      totc = 0;
344
15.6k
      gs = 0;
345
12.9M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
12.9M
         if (gs >= s->nMTF) break;
349
12.9M
         ge = gs + BZ_G_SIZE - 1; 
350
12.9M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
90.8M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
12.9M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
12.9M
            register UInt32 cost01, cost23, cost45;
361
12.9M
            register UInt16 icv;
362
12.9M
            cost01 = cost23 = cost45 = 0;
363
364
12.9M
#           define BZ_ITER(nn)                \
365
645M
               icv = mtfv[gs+(nn)];           \
366
645M
               cost01 += s->len_pack[icv][0]; \
367
645M
               cost23 += s->len_pack[icv][1]; \
368
645M
               cost45 += s->len_pack[icv][2]; \
369
12.9M
370
12.9M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
12.9M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
12.9M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
12.9M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
12.9M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
12.9M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
12.9M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
12.9M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
12.9M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
12.9M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
12.9M
#           undef BZ_ITER
382
383
12.9M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
12.9M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
12.9M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
12.9M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
3.43M
            for (i = gs; i <= ge; i++) { 
390
3.36M
               UInt16 icv = mtfv[i];
391
17.0M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
3.36M
            }
393
75.5k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
12.9M
         bc = 999999999; bt = -1;
400
90.7M
         for (t = 0; t < nGroups; t++)
401
77.7M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
12.9M
         totc += bc;
403
12.9M
         fave[bt]++;
404
12.9M
         s->selector[nSelectors] = bt;
405
12.9M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
12.9M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
645M
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
12.9M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
12.9M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
12.9M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
12.9M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
12.9M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
12.9M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
12.9M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
12.9M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
12.9M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
12.9M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
12.9M
#           undef BZ_ITUR
427
428
12.9M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
3.43M
            for (i = gs; i <= ge; i++)
431
3.36M
               s->rfreq[bt][ mtfv[i] ]++;
432
75.5k
         }
433
434
12.9M
         gs = ge+1;
435
12.9M
      }
436
15.6k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
77.1k
      for (t = 0; t < nGroups; t++)
450
61.4k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
61.4k
                                 alphaSize, 17 /*20*/ );
452
15.6k
   }
453
454
455
3.91k
   AssertH( nGroups < 8, 3002 );
456
3.91k
   AssertH( nSelectors < 32768 &&
457
3.91k
            nSelectors <= BZ_MAX_SELECTORS,
458
3.91k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
3.91k
   {
463
3.91k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
19.2k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
3.24M
      for (i = 0; i < nSelectors; i++) {
466
3.24M
         ll_i = s->selector[i];
467
3.24M
         j = 0;
468
3.24M
         tmp = pos[j];
469
8.81M
         while ( ll_i != tmp ) {
470
5.56M
            j++;
471
5.56M
            tmp2 = tmp;
472
5.56M
            tmp = pos[j];
473
5.56M
            pos[j] = tmp2;
474
5.56M
         };
475
3.24M
         pos[0] = tmp;
476
3.24M
         s->selectorMtf[i] = j;
477
3.24M
      }
478
3.91k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
19.2k
   for (t = 0; t < nGroups; t++) {
482
15.3k
      minLen = 32;
483
15.3k
      maxLen = 0;
484
2.57M
      for (i = 0; i < alphaSize; i++) {
485
2.55M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
2.55M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
2.55M
      }
488
15.3k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
15.3k
      AssertH ( !(minLen < 1),  3005 );
490
15.3k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
15.3k
                          minLen, maxLen, alphaSize );
492
15.3k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
3.91k
   { 
496
3.91k
      Bool inUse16[16];
497
66.5k
      for (i = 0; i < 16; i++) {
498
62.6k
          inUse16[i] = False;
499
1.06M
          for (j = 0; j < 16; j++)
500
1.00M
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
62.6k
      }
502
     
503
3.91k
      nBytes = s->numZ;
504
66.5k
      for (i = 0; i < 16; i++)
505
62.6k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
66.5k
      for (i = 0; i < 16; i++)
508
62.6k
         if (inUse16[i])
509
744k
            for (j = 0; j < 16; j++) {
510
701k
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
701k
            }
512
513
3.91k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
3.91k
   }
516
517
   /*--- Now the selectors. ---*/
518
3.91k
   nBytes = s->numZ;
519
3.91k
   bsW ( s, 3, nGroups );
520
3.91k
   bsW ( s, 15, nSelectors );
521
3.24M
   for (i = 0; i < nSelectors; i++) { 
522
8.81M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
3.24M
      bsW(s,1,0);
524
3.24M
   }
525
3.91k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
3.91k
   nBytes = s->numZ;
530
531
19.2k
   for (t = 0; t < nGroups; t++) {
532
15.3k
      Int32 curr = s->len[t][0];
533
15.3k
      bsW ( s, 5, curr );
534
2.57M
      for (i = 0; i < alphaSize; i++) {
535
3.10M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
3.05M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
2.55M
         bsW ( s, 1, 0 );
538
2.55M
      }
539
15.3k
   }
540
541
3.91k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
3.91k
   nBytes = s->numZ;
546
3.91k
   selCtr = 0;
547
3.91k
   gs = 0;
548
3.24M
   while (True) {
549
3.24M
      if (gs >= s->nMTF) break;
550
3.24M
      ge = gs + BZ_G_SIZE - 1; 
551
3.24M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
3.24M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
3.24M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
3.22M
            UInt16 mtfv_i;
557
3.22M
            UChar* s_len_sel_selCtr 
558
3.22M
               = &(s->len[s->selector[selCtr]][0]);
559
3.22M
            Int32* s_code_sel_selCtr
560
3.22M
               = &(s->code[s->selector[selCtr]][0]);
561
562
3.22M
#           define BZ_ITAH(nn)                      \
563
161M
               mtfv_i = mtfv[gs+(nn)];              \
564
161M
               bsW ( s,                             \
565
161M
                     s_len_sel_selCtr[mtfv_i],      \
566
161M
                     s_code_sel_selCtr[mtfv_i] )
567
568
3.22M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
3.22M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
3.22M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
3.22M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
3.22M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
3.22M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
3.22M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
3.22M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
3.22M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
3.22M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
3.22M
#           undef BZ_ITAH
580
581
3.22M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
859k
         for (i = gs; i <= ge; i++) {
584
840k
            bsW ( s, 
585
840k
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
840k
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
840k
         }
588
18.8k
      }
589
590
591
3.24M
      gs = ge+1;
592
3.24M
      selCtr++;
593
3.24M
   }
594
3.91k
   AssertH( selCtr == nSelectors, 3007 );
595
596
3.91k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
3.91k
}
599
600
601
/*---------------------------------------------------*/
602
void BZ2_compressBlock ( EState* s, Bool is_last_block )
603
3.91k
{
604
3.91k
   if (s->nblock > 0) {
605
606
3.91k
      BZ_FINALISE_CRC ( s->blockCRC );
607
3.91k
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
608
3.91k
      s->combinedCRC ^= s->blockCRC;
609
3.91k
      if (s->blockNo > 1) s->numZ = 0;
610
611
3.91k
      if (s->verbosity >= 2)
612
0
         VPrintf4( "    block %d: crc = 0x%08x, "
613
3.91k
                   "combined CRC = 0x%08x, size = %d\n",
614
3.91k
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
615
616
3.91k
      BZ2_blockSort ( s );
617
3.91k
   }
618
619
3.91k
   s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
620
621
   /*-- If this is the first block, create the stream header. --*/
622
3.91k
   if (s->blockNo == 1) {
623
3.60k
      BZ2_bsInitWrite ( s );
624
3.60k
      bsPutUChar ( s, BZ_HDR_B );
625
3.60k
      bsPutUChar ( s, BZ_HDR_Z );
626
3.60k
      bsPutUChar ( s, BZ_HDR_h );
627
3.60k
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
628
3.60k
   }
629
630
3.91k
   if (s->nblock > 0) {
631
632
3.91k
      bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
633
3.91k
      bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
634
3.91k
      bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
635
636
      /*-- Now the block's CRC, so it is in a known place. --*/
637
3.91k
      bsPutUInt32 ( s, s->blockCRC );
638
639
      /*-- 
640
         Now a single bit indicating (non-)randomisation. 
641
         As of version 0.9.5, we use a better sorting algorithm
642
         which makes randomisation unnecessary.  So always set
643
         the randomised bit to 'no'.  Of course, the decoder
644
         still needs to be able to handle randomised blocks
645
         so as to maintain backwards compatibility with
646
         older versions of bzip2.
647
      --*/
648
3.91k
      bsW(s,1,0);
649
650
3.91k
      bsW ( s, 24, s->origPtr );
651
3.91k
      generateMTFValues ( s );
652
3.91k
      sendMTFValues ( s );
653
3.91k
   }
654
655
656
   /*-- If this is the last block, add the stream trailer. --*/
657
3.91k
   if (is_last_block) {
658
659
3.60k
      bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
660
3.60k
      bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
661
3.60k
      bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
662
3.60k
      bsPutUInt32 ( s, s->combinedCRC );
663
3.60k
      if (s->verbosity >= 2)
664
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
665
3.60k
      bsFinishWrite ( s );
666
3.60k
   }
667
3.91k
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/