Coverage Report

Created: 2026-02-14 06:34

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/bzip2/compress.c
Line
Count
Source
1
2
/*-------------------------------------------------------------*/
3
/*--- Compression machinery (not incl block sorting)        ---*/
4
/*---                                            compress.c ---*/
5
/*-------------------------------------------------------------*/
6
7
/* ------------------------------------------------------------------
8
   This file is part of bzip2/libbzip2, a program and library for
9
   lossless, block-sorting data compression.
10
11
   bzip2/libbzip2 version 1.0.8 of 13 July 2019
12
   Copyright (C) 1996-2019 Julian Seward <jseward@acm.org>
13
14
   Please read the WARNING, DISCLAIMER and PATENTS sections in the 
15
   README file.
16
17
   This program is released under the terms of the license contained
18
   in the file LICENSE.
19
   ------------------------------------------------------------------ */
20
21
22
/* CHANGES
23
    0.9.0    -- original version.
24
    0.9.0a/b -- no changes in this file.
25
    0.9.0c   -- changed setting of nGroups in sendMTFValues() 
26
                so as to do a bit better on small files
27
*/
28
29
#include "bzlib_private.h"
30
31
32
/*---------------------------------------------------*/
33
/*--- Bit stream I/O                              ---*/
34
/*---------------------------------------------------*/
35
36
/*---------------------------------------------------*/
37
void BZ2_bsInitWrite ( EState* s )
38
10.2k
{
39
10.2k
   s->bsLive = 0;
40
10.2k
   s->bsBuff = 0;
41
10.2k
}
42
43
44
/*---------------------------------------------------*/
45
static
46
void bsFinishWrite ( EState* s )
47
10.2k
{
48
29.4k
   while (s->bsLive > 0) {
49
19.2k
      s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
50
19.2k
      s->numZ++;
51
19.2k
      s->bsBuff <<= 8;
52
19.2k
      s->bsLive -= 8;
53
19.2k
   }
54
10.2k
}
55
56
57
/*---------------------------------------------------*/
58
434M
#define bsNEEDW(nz)                           \
59
434M
{                                             \
60
780M
   while (s->bsLive >= 8) {                   \
61
345M
      s->zbits[s->numZ]                       \
62
345M
         = (UChar)(s->bsBuff >> 24);          \
63
345M
      s->numZ++;                              \
64
345M
      s->bsBuff <<= 8;                        \
65
345M
      s->bsLive -= 8;                         \
66
345M
   }                                          \
67
434M
}
68
69
70
/*---------------------------------------------------*/
71
static
72
__inline__
73
void bsW ( EState* s, Int32 n, UInt32 v )
74
434M
{
75
434M
   bsNEEDW ( n );
76
434M
   s->bsBuff |= (v << (32 - s->bsLive - n));
77
434M
   s->bsLive += n;
78
434M
}
79
80
81
/*---------------------------------------------------*/
82
static
83
void bsPutUInt32 ( EState* s, UInt32 u )
84
22.5k
{
85
22.5k
   bsW ( s, 8, (u >> 24) & 0xffL );
86
22.5k
   bsW ( s, 8, (u >> 16) & 0xffL );
87
22.5k
   bsW ( s, 8, (u >>  8) & 0xffL );
88
22.5k
   bsW ( s, 8,  u        & 0xffL );
89
22.5k
}
90
91
92
/*---------------------------------------------------*/
93
static
94
void bsPutUChar ( EState* s, UChar c )
95
176k
{
96
176k
   bsW( s, 8, (UInt32)c );
97
176k
}
98
99
100
/*---------------------------------------------------*/
101
/*--- The back end proper                         ---*/
102
/*---------------------------------------------------*/
103
104
/*---------------------------------------------------*/
105
static
106
void makeMaps_e ( EState* s )
107
12.2k
{
108
12.2k
   Int32 i;
109
12.2k
   s->nInUse = 0;
110
3.14M
   for (i = 0; i < 256; i++)
111
3.13M
      if (s->inUse[i]) {
112
1.43M
         s->unseqToSeq[i] = s->nInUse;
113
1.43M
         s->nInUse++;
114
1.43M
      }
115
12.2k
}
116
117
118
/*---------------------------------------------------*/
119
static
120
void generateMTFValues ( EState* s )
121
12.2k
{
122
12.2k
   UChar   yy[256];
123
12.2k
   Int32   i, j;
124
12.2k
   Int32   zPend;
125
12.2k
   Int32   wr;
126
12.2k
   Int32   EOB;
127
128
   /* 
129
      After sorting (eg, here),
130
         s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
131
         and
132
         ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] 
133
         holds the original block data.
134
135
      The first thing to do is generate the MTF values,
136
      and put them in
137
         ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
138
      Because there are strictly fewer or equal MTF values
139
      than block values, ptr values in this area are overwritten
140
      with MTF values only when they are no longer needed.
141
142
      The final compressed bitstream is generated into the
143
      area starting at
144
         (UChar*) (&((UChar*)s->arr2)[s->nblock])
145
146
      These storage aliases are set up in bzCompressInit(),
147
      except for the last one, which is arranged in 
148
      compressBlock().
149
   */
150
12.2k
   UInt32* ptr   = s->ptr;
151
12.2k
   UChar* block  = s->block;
152
12.2k
   UInt16* mtfv  = s->mtfv;
153
154
12.2k
   makeMaps_e ( s );
155
12.2k
   EOB = s->nInUse+1;
156
157
1.47M
   for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
158
159
12.2k
   wr = 0;
160
12.2k
   zPend = 0;
161
1.44M
   for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
162
163
989M
   for (i = 0; i < s->nblock; i++) {
164
989M
      UChar ll_i;
165
989M
      AssertD ( wr <= i, "generateMTFValues(1)" );
166
989M
      j = ptr[i]-1; if (j < 0) j += s->nblock;
167
989M
      ll_i = s->unseqToSeq[block[j]];
168
989M
      AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
169
170
989M
      if (yy[0] == ll_i) { 
171
645M
         zPend++;
172
645M
      } else {
173
174
344M
         if (zPend > 0) {
175
46.2M
            zPend--;
176
55.0M
            while (True) {
177
55.0M
               if (zPend & 1) {
178
6.71M
                  mtfv[wr] = BZ_RUNB; wr++; 
179
6.71M
                  s->mtfFreq[BZ_RUNB]++; 
180
48.3M
               } else {
181
48.3M
                  mtfv[wr] = BZ_RUNA; wr++; 
182
48.3M
                  s->mtfFreq[BZ_RUNA]++; 
183
48.3M
               }
184
55.0M
               if (zPend < 2) break;
185
8.74M
               zPend = (zPend - 2) / 2;
186
8.74M
            };
187
46.2M
            zPend = 0;
188
46.2M
         }
189
344M
         {
190
344M
            register UChar  rtmp;
191
344M
            register UChar* ryy_j;
192
344M
            register UChar  rll_i;
193
344M
            rtmp  = yy[1];
194
344M
            yy[1] = yy[0];
195
344M
            ryy_j = &(yy[1]);
196
344M
            rll_i = ll_i;
197
37.1G
            while ( rll_i != rtmp ) {
198
36.8G
               register UChar rtmp2;
199
36.8G
               ryy_j++;
200
36.8G
               rtmp2  = rtmp;
201
36.8G
               rtmp   = *ryy_j;
202
36.8G
               *ryy_j = rtmp2;
203
36.8G
            };
204
344M
            yy[0] = rtmp;
205
344M
            j = ryy_j - &(yy[0]);
206
344M
            mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
207
344M
         }
208
209
344M
      }
210
989M
   }
211
212
12.2k
   if (zPend > 0) {
213
5.23k
      zPend--;
214
21.1k
      while (True) {
215
21.1k
         if (zPend & 1) {
216
9.07k
            mtfv[wr] = BZ_RUNB; wr++; 
217
9.07k
            s->mtfFreq[BZ_RUNB]++; 
218
12.1k
         } else {
219
12.1k
            mtfv[wr] = BZ_RUNA; wr++; 
220
12.1k
            s->mtfFreq[BZ_RUNA]++; 
221
12.1k
         }
222
21.1k
         if (zPend < 2) break;
223
15.9k
         zPend = (zPend - 2) / 2;
224
15.9k
      };
225
5.23k
      zPend = 0;
226
5.23k
   }
227
228
12.2k
   mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
229
230
12.2k
   s->nMTF = wr;
231
12.2k
}
232
233
234
/*---------------------------------------------------*/
235
1.46M
#define BZ_LESSER_ICOST  0
236
15.2M
#define BZ_GREATER_ICOST 15
237
238
static
239
void sendMTFValues ( EState* s )
240
12.2k
{
241
12.2k
   Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
242
12.2k
   Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
243
12.2k
   Int32 nGroups, nBytes;
244
245
   /*--
246
   UChar  len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
247
   is a global since the decoder also needs it.
248
249
   Int32  code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
250
   Int32  rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
251
   are also globals only used in this proc.
252
   Made global to keep stack frame size small.
253
   --*/
254
255
256
12.2k
   UInt16 cost[BZ_N_GROUPS];
257
12.2k
   Int32  fave[BZ_N_GROUPS];
258
259
12.2k
   UInt16* mtfv = s->mtfv;
260
261
12.2k
   if (s->verbosity >= 3)
262
0
      VPrintf3( "      %d in block, %d after MTF & 1-2 coding, "
263
12.2k
                "%d+2 syms in use\n", 
264
12.2k
                s->nblock, s->nMTF, s->nInUse );
265
266
12.2k
   alphaSize = s->nInUse+2;
267
85.7k
   for (t = 0; t < BZ_N_GROUPS; t++)
268
8.84M
      for (v = 0; v < alphaSize; v++)
269
8.76M
         s->len[t][v] = BZ_GREATER_ICOST;
270
271
   /*--- Decide how many coding tables to use ---*/
272
12.2k
   AssertH ( s->nMTF > 0, 3001 );
273
12.2k
   if (s->nMTF < 200)  nGroups = 2; else
274
7.71k
   if (s->nMTF < 600)  nGroups = 3; else
275
6.01k
   if (s->nMTF < 1200) nGroups = 4; else
276
5.32k
   if (s->nMTF < 2400) nGroups = 5; else
277
4.73k
                       nGroups = 6;
278
279
   /*--- Generate an initial set of coding tables ---*/
280
12.2k
   { 
281
12.2k
      Int32 nPart, remF, tFreq, aFreq;
282
283
12.2k
      nPart = nGroups;
284
12.2k
      remF  = s->nMTF;
285
12.2k
      gs = 0;
286
60.5k
      while (nPart > 0) {
287
48.2k
         tFreq = remF / nPart;
288
48.2k
         ge = gs-1;
289
48.2k
         aFreq = 0;
290
1.52M
         while (aFreq < tFreq && ge < alphaSize-1) {
291
1.47M
            ge++;
292
1.47M
            aFreq += s->mtfFreq[ge];
293
1.47M
         }
294
295
48.2k
         if (ge > gs 
296
38.9k
             && nPart != nGroups && nPart != 1 
297
19.7k
             && ((nGroups-nPart) % 2 == 1)) {
298
10.2k
            aFreq -= s->mtfFreq[ge];
299
10.2k
            ge--;
300
10.2k
         }
301
302
48.2k
         if (s->verbosity >= 3)
303
0
            VPrintf5( "      initial group %d, [%d .. %d], "
304
48.2k
                      "has %d syms (%4.1f%%)\n",
305
48.2k
                      nPart, gs, ge, aFreq, 
306
48.2k
                      (100.0 * (float)aFreq) / (float)(s->nMTF) );
307
 
308
7.97M
         for (v = 0; v < alphaSize; v++)
309
7.92M
            if (v >= gs && v <= ge) 
310
1.46M
               s->len[nPart-1][v] = BZ_LESSER_ICOST; else
311
6.46M
               s->len[nPart-1][v] = BZ_GREATER_ICOST;
312
 
313
48.2k
         nPart--;
314
48.2k
         gs = ge+1;
315
48.2k
         remF -= aFreq;
316
48.2k
      }
317
12.2k
   }
318
319
   /*--- 
320
      Iterate up to BZ_N_ITERS times to improve the tables.
321
   ---*/
322
61.2k
   for (iter = 0; iter < BZ_N_ITERS; iter++) {
323
324
342k
      for (t = 0; t < BZ_N_GROUPS; t++) fave[t] = 0;
325
326
242k
      for (t = 0; t < nGroups; t++)
327
31.8M
         for (v = 0; v < alphaSize; v++)
328
31.6M
            s->rfreq[t][v] = 0;
329
330
      /*---
331
        Set up an auxiliary length table which is used to fast-track
332
  the common case (nGroups == 6). 
333
      ---*/
334
48.9k
      if (nGroups == 6) {
335
4.49M
         for (v = 0; v < alphaSize; v++) {
336
4.47M
            s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
337
4.47M
            s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
338
4.47M
            s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
339
4.47M
   }
340
18.9k
      }
341
342
48.9k
      nSelectors = 0;
343
48.9k
      totc = 0;
344
48.9k
      gs = 0;
345
32.0M
      while (True) {
346
347
         /*--- Set group start & end marks. --*/
348
32.0M
         if (gs >= s->nMTF) break;
349
31.9M
         ge = gs + BZ_G_SIZE - 1; 
350
31.9M
         if (ge >= s->nMTF) ge = s->nMTF-1;
351
352
         /*-- 
353
            Calculate the cost of this group as coded
354
            by each of the coding tables.
355
         --*/
356
223M
         for (t = 0; t < BZ_N_GROUPS; t++) cost[t] = 0;
357
358
31.9M
         if (nGroups == 6 && 50 == ge-gs+1) {
359
            /*--- fast track the common case ---*/
360
31.7M
            register UInt32 cost01, cost23, cost45;
361
31.7M
            register UInt16 icv;
362
31.7M
            cost01 = cost23 = cost45 = 0;
363
364
31.7M
#           define BZ_ITER(nn)                \
365
1.58G
               icv = mtfv[gs+(nn)];           \
366
1.58G
               cost01 += s->len_pack[icv][0]; \
367
1.58G
               cost23 += s->len_pack[icv][1]; \
368
1.58G
               cost45 += s->len_pack[icv][2]; \
369
31.7M
370
31.7M
            BZ_ITER(0);  BZ_ITER(1);  BZ_ITER(2);  BZ_ITER(3);  BZ_ITER(4);
371
31.7M
            BZ_ITER(5);  BZ_ITER(6);  BZ_ITER(7);  BZ_ITER(8);  BZ_ITER(9);
372
31.7M
            BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
373
31.7M
            BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
374
31.7M
            BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
375
31.7M
            BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
376
31.7M
            BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
377
31.7M
            BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
378
31.7M
            BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
379
31.7M
            BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
380
381
31.7M
#           undef BZ_ITER
382
383
31.7M
            cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
384
31.7M
            cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
385
31.7M
            cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
386
387
31.7M
         } else {
388
      /*--- slow version which correctly handles all situations ---*/
389
10.2M
            for (i = gs; i <= ge; i++) { 
390
10.0M
               UInt16 icv = mtfv[i];
391
50.3M
               for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
392
10.0M
            }
393
226k
         }
394
 
395
         /*-- 
396
            Find the coding table which is best for this group,
397
            and record its identity in the selector table.
398
         --*/
399
31.9M
         bc = 999999999; bt = -1;
400
223M
         for (t = 0; t < nGroups; t++)
401
191M
            if (cost[t] < bc) { bc = cost[t]; bt = t; };
402
31.9M
         totc += bc;
403
31.9M
         fave[bt]++;
404
31.9M
         s->selector[nSelectors] = bt;
405
31.9M
         nSelectors++;
406
407
         /*-- 
408
            Increment the symbol frequencies for the selected table.
409
          --*/
410
31.9M
         if (nGroups == 6 && 50 == ge-gs+1) {
411
            /*--- fast track the common case ---*/
412
413
1.58G
#           define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
414
415
31.7M
            BZ_ITUR(0);  BZ_ITUR(1);  BZ_ITUR(2);  BZ_ITUR(3);  BZ_ITUR(4);
416
31.7M
            BZ_ITUR(5);  BZ_ITUR(6);  BZ_ITUR(7);  BZ_ITUR(8);  BZ_ITUR(9);
417
31.7M
            BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
418
31.7M
            BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
419
31.7M
            BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
420
31.7M
            BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
421
31.7M
            BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
422
31.7M
            BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
423
31.7M
            BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
424
31.7M
            BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
425
426
31.7M
#           undef BZ_ITUR
427
428
31.7M
         } else {
429
      /*--- slow version which correctly handles all situations ---*/
430
10.2M
            for (i = gs; i <= ge; i++)
431
10.0M
               s->rfreq[bt][ mtfv[i] ]++;
432
226k
         }
433
434
31.9M
         gs = ge+1;
435
31.9M
      }
436
48.9k
      if (s->verbosity >= 3) {
437
0
         VPrintf2 ( "      pass %d: size is %d, grp uses are ", 
438
0
                   iter+1, totc/8 );
439
0
         for (t = 0; t < nGroups; t++)
440
0
            VPrintf1 ( "%d ", fave[t] );
441
0
         VPrintf0 ( "\n" );
442
0
      }
443
444
      /*--
445
        Recompute the tables based on the accumulated frequencies.
446
      --*/
447
      /* maxLen was changed from 20 to 17 in bzip2-1.0.3.  See 
448
         comment in huffman.c for details. */
449
242k
      for (t = 0; t < nGroups; t++)
450
193k
         BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), 
451
193k
                                 alphaSize, 17 /*20*/ );
452
48.9k
   }
453
454
455
12.2k
   AssertH( nGroups < 8, 3002 );
456
12.2k
   AssertH( nSelectors < 32768 &&
457
12.2k
            nSelectors <= BZ_MAX_SELECTORS,
458
12.2k
            3003 );
459
460
461
   /*--- Compute MTF values for the selectors. ---*/
462
12.2k
   {
463
12.2k
      UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
464
60.5k
      for (i = 0; i < nGroups; i++) pos[i] = i;
465
8.00M
      for (i = 0; i < nSelectors; i++) {
466
7.99M
         ll_i = s->selector[i];
467
7.99M
         j = 0;
468
7.99M
         tmp = pos[j];
469
21.3M
         while ( ll_i != tmp ) {
470
13.3M
            j++;
471
13.3M
            tmp2 = tmp;
472
13.3M
            tmp = pos[j];
473
13.3M
            pos[j] = tmp2;
474
13.3M
         };
475
7.99M
         pos[0] = tmp;
476
7.99M
         s->selectorMtf[i] = j;
477
7.99M
      }
478
12.2k
   };
479
480
   /*--- Assign actual codes for the tables. --*/
481
60.5k
   for (t = 0; t < nGroups; t++) {
482
48.2k
      minLen = 32;
483
48.2k
      maxLen = 0;
484
7.97M
      for (i = 0; i < alphaSize; i++) {
485
7.92M
         if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
486
7.92M
         if (s->len[t][i] < minLen) minLen = s->len[t][i];
487
7.92M
      }
488
48.2k
      AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
489
48.2k
      AssertH ( !(minLen < 1),  3005 );
490
48.2k
      BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), 
491
48.2k
                          minLen, maxLen, alphaSize );
492
48.2k
   }
493
494
   /*--- Transmit the mapping table. ---*/
495
12.2k
   { 
496
12.2k
      Bool inUse16[16];
497
208k
      for (i = 0; i < 16; i++) {
498
195k
          inUse16[i] = False;
499
3.33M
          for (j = 0; j < 16; j++)
500
3.13M
             if (s->inUse[i * 16 + j]) inUse16[i] = True;
501
195k
      }
502
     
503
12.2k
      nBytes = s->numZ;
504
208k
      for (i = 0; i < 16; i++)
505
195k
         if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
506
507
208k
      for (i = 0; i < 16; i++)
508
195k
         if (inUse16[i])
509
2.28M
            for (j = 0; j < 16; j++) {
510
2.14M
               if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
511
2.14M
            }
512
513
12.2k
      if (s->verbosity >= 3) 
514
0
         VPrintf1( "      bytes: mapping %d, ", s->numZ-nBytes );
515
12.2k
   }
516
517
   /*--- Now the selectors. ---*/
518
12.2k
   nBytes = s->numZ;
519
12.2k
   bsW ( s, 3, nGroups );
520
12.2k
   bsW ( s, 15, nSelectors );
521
8.00M
   for (i = 0; i < nSelectors; i++) { 
522
21.3M
      for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
523
7.99M
      bsW(s,1,0);
524
7.99M
   }
525
12.2k
   if (s->verbosity >= 3)
526
0
      VPrintf1( "selectors %d, ", s->numZ-nBytes );
527
528
   /*--- Now the coding tables. ---*/
529
12.2k
   nBytes = s->numZ;
530
531
60.5k
   for (t = 0; t < nGroups; t++) {
532
48.2k
      Int32 curr = s->len[t][0];
533
48.2k
      bsW ( s, 5, curr );
534
7.97M
      for (i = 0; i < alphaSize; i++) {
535
9.59M
         while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
536
9.43M
         while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
537
7.92M
         bsW ( s, 1, 0 );
538
7.92M
      }
539
48.2k
   }
540
541
12.2k
   if (s->verbosity >= 3)
542
0
      VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
543
544
   /*--- And finally, the block data proper ---*/
545
12.2k
   nBytes = s->numZ;
546
12.2k
   selCtr = 0;
547
12.2k
   gs = 0;
548
8.00M
   while (True) {
549
8.00M
      if (gs >= s->nMTF) break;
550
7.99M
      ge = gs + BZ_G_SIZE - 1; 
551
7.99M
      if (ge >= s->nMTF) ge = s->nMTF-1;
552
7.99M
      AssertH ( s->selector[selCtr] < nGroups, 3006 );
553
554
7.99M
      if (nGroups == 6 && 50 == ge-gs+1) {
555
            /*--- fast track the common case ---*/
556
7.93M
            UInt16 mtfv_i;
557
7.93M
            UChar* s_len_sel_selCtr 
558
7.93M
               = &(s->len[s->selector[selCtr]][0]);
559
7.93M
            Int32* s_code_sel_selCtr
560
7.93M
               = &(s->code[s->selector[selCtr]][0]);
561
562
7.93M
#           define BZ_ITAH(nn)                      \
563
396M
               mtfv_i = mtfv[gs+(nn)];              \
564
396M
               bsW ( s,                             \
565
396M
                     s_len_sel_selCtr[mtfv_i],      \
566
396M
                     s_code_sel_selCtr[mtfv_i] )
567
568
7.93M
            BZ_ITAH(0);  BZ_ITAH(1);  BZ_ITAH(2);  BZ_ITAH(3);  BZ_ITAH(4);
569
7.93M
            BZ_ITAH(5);  BZ_ITAH(6);  BZ_ITAH(7);  BZ_ITAH(8);  BZ_ITAH(9);
570
7.93M
            BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
571
7.93M
            BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
572
7.93M
            BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
573
7.93M
            BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
574
7.93M
            BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
575
7.93M
            BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
576
7.93M
            BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
577
7.93M
            BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
578
579
7.93M
#           undef BZ_ITAH
580
581
7.93M
      } else {
582
   /*--- slow version which correctly handles all situations ---*/
583
2.56M
         for (i = gs; i <= ge; i++) {
584
2.50M
            bsW ( s, 
585
2.50M
                  s->len  [s->selector[selCtr]] [mtfv[i]],
586
2.50M
                  s->code [s->selector[selCtr]] [mtfv[i]] );
587
2.50M
         }
588
56.6k
      }
589
590
591
7.99M
      gs = ge+1;
592
7.99M
      selCtr++;
593
7.99M
   }
594
12.2k
   AssertH( selCtr == nSelectors, 3007 );
595
596
12.2k
   if (s->verbosity >= 3)
597
0
      VPrintf1( "codes %d\n", s->numZ-nBytes );
598
12.2k
}
599
600
601
/*---------------------------------------------------*/
602
void BZ2_compressBlock ( EState* s, Bool is_last_block )
603
12.2k
{
604
12.2k
   if (s->nblock > 0) {
605
606
12.2k
      BZ_FINALISE_CRC ( s->blockCRC );
607
12.2k
      s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
608
12.2k
      s->combinedCRC ^= s->blockCRC;
609
12.2k
      if (s->blockNo > 1) s->numZ = 0;
610
611
12.2k
      if (s->verbosity >= 2)
612
0
         VPrintf4( "    block %d: crc = 0x%08x, "
613
12.2k
                   "combined CRC = 0x%08x, size = %d\n",
614
12.2k
                   s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
615
616
12.2k
      BZ2_blockSort ( s );
617
12.2k
   }
618
619
12.2k
   s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
620
621
   /*-- If this is the first block, create the stream header. --*/
622
12.2k
   if (s->blockNo == 1) {
623
10.2k
      BZ2_bsInitWrite ( s );
624
10.2k
      bsPutUChar ( s, BZ_HDR_B );
625
10.2k
      bsPutUChar ( s, BZ_HDR_Z );
626
10.2k
      bsPutUChar ( s, BZ_HDR_h );
627
10.2k
      bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
628
10.2k
   }
629
630
12.2k
   if (s->nblock > 0) {
631
632
12.2k
      bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
633
12.2k
      bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
634
12.2k
      bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
635
636
      /*-- Now the block's CRC, so it is in a known place. --*/
637
12.2k
      bsPutUInt32 ( s, s->blockCRC );
638
639
      /*-- 
640
         Now a single bit indicating (non-)randomisation. 
641
         As of version 0.9.5, we use a better sorting algorithm
642
         which makes randomisation unnecessary.  So always set
643
         the randomised bit to 'no'.  Of course, the decoder
644
         still needs to be able to handle randomised blocks
645
         so as to maintain backwards compatibility with
646
         older versions of bzip2.
647
      --*/
648
12.2k
      bsW(s,1,0);
649
650
12.2k
      bsW ( s, 24, s->origPtr );
651
12.2k
      generateMTFValues ( s );
652
12.2k
      sendMTFValues ( s );
653
12.2k
   }
654
655
656
   /*-- If this is the last block, add the stream trailer. --*/
657
12.2k
   if (is_last_block) {
658
659
10.2k
      bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
660
10.2k
      bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
661
10.2k
      bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
662
10.2k
      bsPutUInt32 ( s, s->combinedCRC );
663
10.2k
      if (s->verbosity >= 2)
664
         VPrintf1( "    final combined CRC = 0x%08x\n   ", s->combinedCRC );
665
10.2k
      bsFinishWrite ( s );
666
10.2k
   }
667
12.2k
}
668
669
670
/*-------------------------------------------------------------*/
671
/*--- end                                        compress.c ---*/
672
/*-------------------------------------------------------------*/