Coverage Report

Created: 2024-07-27 06:27

/src/libtiff/libtiff/tif_lzw.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright (c) 1988-1997 Sam Leffler
3
 * Copyright (c) 1991-1997 Silicon Graphics, Inc.
4
 * Copyright (c) 2022 Even Rouault
5
 *
6
 * Permission to use, copy, modify, distribute, and sell this software and
7
 * its documentation for any purpose is hereby granted without fee, provided
8
 * that (i) the above copyright notices and this permission notice appear in
9
 * all copies of the software and related documentation, and (ii) the names of
10
 * Sam Leffler and Silicon Graphics may not be used in any advertising or
11
 * publicity relating to the software without the specific, prior written
12
 * permission of Sam Leffler and Silicon Graphics.
13
 *
14
 * THE SOFTWARE IS PROVIDED "AS-IS" AND WITHOUT WARRANTY OF ANY KIND,
15
 * EXPRESS, IMPLIED OR OTHERWISE, INCLUDING WITHOUT LIMITATION, ANY
16
 * WARRANTY OF MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
17
 *
18
 * IN NO EVENT SHALL SAM LEFFLER OR SILICON GRAPHICS BE LIABLE FOR
19
 * ANY SPECIAL, INCIDENTAL, INDIRECT OR CONSEQUENTIAL DAMAGES OF ANY KIND,
20
 * OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
21
 * WHETHER OR NOT ADVISED OF THE POSSIBILITY OF DAMAGE, AND ON ANY THEORY OF
22
 * LIABILITY, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
23
 * OF THIS SOFTWARE.
24
 */
25
26
#include "tiffiop.h"
27
#ifdef LZW_SUPPORT
28
/*
29
 * TIFF Library.
30
 * Rev 5.0 Lempel-Ziv & Welch Compression Support
31
 *
32
 * This code is derived from the compress program whose code is
33
 * derived from software contributed to Berkeley by James A. Woods,
34
 * derived from original work by Spencer Thomas and Joseph Orost.
35
 *
36
 * The original Berkeley copyright notice appears below in its entirety.
37
 */
38
#include "tif_predict.h"
39
40
#include <stdbool.h>
41
#include <stdio.h>
42
#include <stdlib.h>
43
44
/* Select the plausible largest natural integer type for the architecture */
45
0
#define SIZEOF_WORDTYPE SIZEOF_SIZE_T
46
typedef size_t WordType;
47
48
/*
49
 * NB: The 5.0 spec describes a different algorithm than Aldus
50
 *     implements.  Specifically, Aldus does code length transitions
51
 *     one code earlier than should be done (for real LZW).
52
 *     Earlier versions of this library implemented the correct
53
 *     LZW algorithm, but emitted codes in a bit order opposite
54
 *     to the TIFF spec.  Thus, to maintain compatibility w/ Aldus
55
 *     we interpret MSB-LSB ordered codes to be images written w/
56
 *     old versions of this library, but otherwise adhere to the
57
 *     Aldus "off by one" algorithm.
58
 *
59
 * Future revisions to the TIFF spec are expected to "clarify this issue".
60
 */
61
#define LZW_COMPAT /* include backwards compatibility code */
62
63
0
#define MAXCODE(n) ((1L << (n)) - 1)
64
/*
65
 * The TIFF spec specifies that encoded bit
66
 * strings range from 9 to 12 bits.
67
 */
68
0
#define BITS_MIN 9  /* start with 9 bits */
69
0
#define BITS_MAX 12 /* max of 12 bit strings */
70
/* predefined codes */
71
0
#define CODE_CLEAR 256 /* code to clear string table */
72
0
#define CODE_EOI 257   /* end-of-information code */
73
0
#define CODE_FIRST 258 /* first free code entry */
74
0
#define CODE_MAX MAXCODE(BITS_MAX)
75
0
#define HSIZE 9001L /* 91% occupancy */
76
0
#define HSHIFT (13 - 8)
77
#ifdef LZW_COMPAT
78
/* NB: +1024 is for compatibility with old files */
79
0
#define CSIZE (MAXCODE(BITS_MAX) + 1024L)
80
#else
81
#define CSIZE (MAXCODE(BITS_MAX) + 1L)
82
#endif
83
84
/*
85
 * State block for each open TIFF file using LZW
86
 * compression/decompression.  Note that the predictor
87
 * state block must be first in this data structure.
88
 */
89
typedef struct
90
{
91
    TIFFPredictorState predict; /* predictor super class */
92
93
    unsigned short nbits;    /* # of bits/code */
94
    unsigned short maxcode;  /* maximum code for lzw_nbits */
95
    unsigned short free_ent; /* next free entry in hash table */
96
    WordType nextdata;       /* next bits of i/o */
97
    long nextbits;           /* # of valid bits in lzw_nextdata */
98
99
    int rw_mode; /* preserve rw_mode from init */
100
} LZWBaseState;
101
102
0
#define lzw_nbits base.nbits
103
0
#define lzw_maxcode base.maxcode
104
0
#define lzw_free_ent base.free_ent
105
0
#define lzw_nextdata base.nextdata
106
0
#define lzw_nextbits base.nextbits
107
108
/*
109
 * Encoding-specific state.
110
 */
111
typedef uint16_t hcode_t; /* codes fit in 16 bits */
112
typedef struct
113
{
114
    long hash;
115
    hcode_t code;
116
} hash_t;
117
118
/*
119
 * Decoding-specific state.
120
 */
121
typedef struct code_ent
122
{
123
    struct code_ent *next;
124
    unsigned short length; /* string len, including this token */
125
    /* firstchar should be placed immediately before value in this structure */
126
    unsigned char firstchar; /* first token of string */
127
    unsigned char value;     /* data value */
128
    bool repeated;
129
} code_t;
130
131
typedef int (*decodeFunc)(TIFF *, uint8_t *, tmsize_t, uint16_t);
132
133
typedef struct
134
{
135
    LZWBaseState base;
136
137
    /* Decoding specific data */
138
    long dec_nbitsmask;     /* lzw_nbits 1 bits, right adjusted */
139
    tmsize_t dec_restart;   /* restart count */
140
    uint64_t dec_bitsleft;  /* available bits in raw data */
141
    tmsize_t old_tif_rawcc; /* value of tif_rawcc at the end of the previous
142
                               TIFLZWDecode() call */
143
    decodeFunc dec_decode;  /* regular or backwards compatible */
144
    code_t *dec_codep;      /* current recognized code */
145
    code_t *dec_oldcodep;   /* previously recognized code */
146
    code_t *dec_free_entp;  /* next free entry */
147
    code_t *dec_maxcodep;   /* max available entry */
148
    code_t *dec_codetab;    /* kept separate for small machines */
149
    int read_error; /* whether a read error has occurred, and which should cause
150
                       further reads in the same strip/tile to be aborted */
151
152
    /* Encoding specific data */
153
    int enc_oldcode;         /* last code encountered */
154
    tmsize_t enc_checkpoint; /* point at which to clear table */
155
0
#define CHECK_GAP 10000      /* enc_ratio check interval */
156
    tmsize_t enc_ratio;      /* current compression ratio */
157
    tmsize_t enc_incount;    /* (input) data bytes encoded */
158
    tmsize_t enc_outcount;   /* encoded (output) bytes */
159
    uint8_t *enc_rawlimit;   /* bound on tif_rawdata buffer */
160
    hash_t *enc_hashtab;     /* kept separate for small machines */
161
} LZWCodecState;
162
163
0
#define LZWState(tif) ((LZWBaseState *)(tif)->tif_data)
164
0
#define LZWDecoderState(tif) ((LZWCodecState *)LZWState(tif))
165
0
#define LZWEncoderState(tif) ((LZWCodecState *)LZWState(tif))
166
167
static int LZWDecode(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s);
168
#ifdef LZW_COMPAT
169
static int LZWDecodeCompat(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s);
170
#endif
171
static void cl_hash(LZWCodecState *);
172
173
/*
174
 * LZW Decoder.
175
 */
176
177
static int LZWFixupTags(TIFF *tif)
178
0
{
179
0
    (void)tif;
180
0
    return (1);
181
0
}
182
183
static int LZWSetupDecode(TIFF *tif)
184
0
{
185
0
    static const char module[] = "LZWSetupDecode";
186
0
    LZWCodecState *sp = LZWDecoderState(tif);
187
0
    int code;
188
189
0
    if (sp == NULL)
190
0
    {
191
        /*
192
         * Allocate state block so tag methods have storage to record
193
         * values.
194
         */
195
0
        tif->tif_data = (uint8_t *)_TIFFmallocExt(tif, sizeof(LZWCodecState));
196
0
        if (tif->tif_data == NULL)
197
0
        {
198
0
            TIFFErrorExtR(tif, module, "No space for LZW state block");
199
0
            return (0);
200
0
        }
201
202
0
        sp = LZWDecoderState(tif);
203
0
        sp->dec_codetab = NULL;
204
0
        sp->dec_decode = NULL;
205
206
        /*
207
         * Setup predictor setup.
208
         */
209
0
        (void)TIFFPredictorInit(tif);
210
0
    }
211
212
0
    if (sp->dec_codetab == NULL)
213
0
    {
214
0
        sp->dec_codetab = (code_t *)_TIFFmallocExt(tif, CSIZE * sizeof(code_t));
215
0
        if (sp->dec_codetab == NULL)
216
0
        {
217
0
            TIFFErrorExtR(tif, module, "No space for LZW code table");
218
0
            return (0);
219
0
        }
220
        /*
221
         * Pre-load the table.
222
         */
223
0
        code = 255;
224
0
        do
225
0
        {
226
0
            sp->dec_codetab[code].firstchar = (unsigned char)code;
227
0
            sp->dec_codetab[code].value = (unsigned char)code;
228
0
            sp->dec_codetab[code].repeated = true;
229
0
            sp->dec_codetab[code].length = 1;
230
0
            sp->dec_codetab[code].next = NULL;
231
0
        } while (code--);
232
        /*
233
         * Zero-out the unused entries  */
234
        /* Silence false positive */
235
        /* coverity[overrun-buffer-arg] */
236
0
        memset(&sp->dec_codetab[CODE_CLEAR], 0,
237
0
               (CODE_FIRST - CODE_CLEAR) * sizeof(code_t));
238
0
    }
239
0
    return (1);
240
0
}
241
242
/*
243
 * Setup state for decoding a strip.
244
 */
245
static int LZWPreDecode(TIFF *tif, uint16_t s)
246
0
{
247
0
    static const char module[] = "LZWPreDecode";
248
0
    LZWCodecState *sp = LZWDecoderState(tif);
249
250
0
    (void)s;
251
0
    assert(sp != NULL);
252
0
    if (sp->dec_codetab == NULL)
253
0
    {
254
0
        tif->tif_setupdecode(tif);
255
0
        if (sp->dec_codetab == NULL)
256
0
            return (0);
257
0
    }
258
259
    /*
260
     * Check for old bit-reversed codes.
261
     */
262
0
    if (tif->tif_rawcc >= 2 && tif->tif_rawdata[0] == 0 &&
263
0
        (tif->tif_rawdata[1] & 0x1))
264
0
    {
265
0
#ifdef LZW_COMPAT
266
0
        if (!sp->dec_decode)
267
0
        {
268
0
            TIFFWarningExtR(tif, module, "Old-style LZW codes, convert file");
269
            /*
270
             * Override default decoding methods with
271
             * ones that deal with the old coding.
272
             * Otherwise the predictor versions set
273
             * above will call the compatibility routines
274
             * through the dec_decode method.
275
             */
276
0
            tif->tif_decoderow = LZWDecodeCompat;
277
0
            tif->tif_decodestrip = LZWDecodeCompat;
278
0
            tif->tif_decodetile = LZWDecodeCompat;
279
            /*
280
             * If doing horizontal differencing, must
281
             * re-setup the predictor logic since we
282
             * switched the basic decoder methods...
283
             */
284
0
            (*tif->tif_setupdecode)(tif);
285
0
            sp->dec_decode = LZWDecodeCompat;
286
0
        }
287
0
        sp->lzw_maxcode = MAXCODE(BITS_MIN);
288
#else  /* !LZW_COMPAT */
289
        if (!sp->dec_decode)
290
        {
291
            TIFFErrorExtR(tif, module, "Old-style LZW codes not supported");
292
            sp->dec_decode = LZWDecode;
293
        }
294
        return (0);
295
#endif /* !LZW_COMPAT */
296
0
    }
297
0
    else
298
0
    {
299
0
        sp->lzw_maxcode = MAXCODE(BITS_MIN) - 1;
300
0
        sp->dec_decode = LZWDecode;
301
0
    }
302
0
    sp->lzw_nbits = BITS_MIN;
303
0
    sp->lzw_nextbits = 0;
304
0
    sp->lzw_nextdata = 0;
305
306
0
    sp->dec_restart = 0;
307
0
    sp->dec_nbitsmask = MAXCODE(BITS_MIN);
308
0
    sp->dec_bitsleft = 0;
309
0
    sp->old_tif_rawcc = 0;
310
0
    sp->dec_free_entp = sp->dec_codetab - 1; // + CODE_FIRST;
311
    /*
312
     * Zero entries that are not yet filled in.  We do
313
     * this to guard against bogus input data that causes
314
     * us to index into undefined entries.  If you can
315
     * come up with a way to safely bounds-check input codes
316
     * while decoding then you can remove this operation.
317
     */
318
0
    sp->dec_oldcodep = &sp->dec_codetab[0];
319
0
    sp->dec_maxcodep = &sp->dec_codetab[sp->dec_nbitsmask - 1];
320
0
    sp->read_error = 0;
321
0
    return (1);
322
0
}
323
324
/*
325
 * Decode a "hunk of data".
326
 */
327
328
/* Get the next 32 or 64-bit from the input data */
329
#ifdef WORDS_BIGENDIAN
330
#define GetNextData(nextdata, bp) memcpy(&nextdata, bp, sizeof(nextdata))
331
#elif SIZEOF_WORDTYPE == 8
332
#if defined(_M_X64)
333
#define GetNextData(nextdata, bp) nextdata = _byteswap_uint64(*(uint64_t *)(bp))
334
#elif defined(__GNUC__)
335
#define GetNextData(nextdata, bp)                                              \
336
0
    memcpy(&nextdata, bp, sizeof(nextdata));                                   \
337
0
    nextdata = __builtin_bswap64(nextdata)
338
#else
339
#define GetNextData(nextdata, bp)                                              \
340
    nextdata = (((uint64_t)bp[0]) << 56) | (((uint64_t)bp[1]) << 48) |         \
341
               (((uint64_t)bp[2]) << 40) | (((uint64_t)bp[3]) << 32) |         \
342
               (((uint64_t)bp[4]) << 24) | (((uint64_t)bp[5]) << 16) |         \
343
               (((uint64_t)bp[6]) << 8) | (((uint64_t)bp[7]))
344
#endif
345
#elif SIZEOF_WORDTYPE == 4
346
#if defined(_M_X86)
347
#define GetNextData(nextdata, bp)                                              \
348
    nextdata = _byteswap_ulong(*(unsigned long *)(bp))
349
#elif defined(__GNUC__)
350
#define GetNextData(nextdata, bp)                                              \
351
    memcpy(&nextdata, bp, sizeof(nextdata));                                   \
352
    nextdata = __builtin_bswap32(nextdata)
353
#else
354
#define GetNextData(nextdata, bp)                                              \
355
    nextdata = (((uint32_t)bp[0]) << 24) | (((uint32_t)bp[1]) << 16) |         \
356
               (((uint32_t)bp[2]) << 8) | (((uint32_t)bp[3]))
357
#endif
358
#else
359
#error "Unhandled SIZEOF_WORDTYPE"
360
#endif
361
362
#define GetNextCodeLZW()                                                       \
363
0
    do                                                                         \
364
0
    {                                                                          \
365
0
        nextbits -= nbits;                                                     \
366
0
        if (nextbits < 0)                                                      \
367
0
        {                                                                      \
368
0
            if (dec_bitsleft >= 8 * SIZEOF_WORDTYPE)                           \
369
0
            {                                                                  \
370
0
                unsigned codetmp = (unsigned)(nextdata << (-nextbits));        \
371
0
                GetNextData(nextdata, bp);                                     \
372
0
                bp += SIZEOF_WORDTYPE;                                         \
373
0
                nextbits += 8 * SIZEOF_WORDTYPE;                               \
374
0
                dec_bitsleft -= 8 * SIZEOF_WORDTYPE;                           \
375
0
                code = (WordType)((codetmp | (nextdata >> nextbits)) &         \
376
0
                                  nbitsmask);                                  \
377
0
                break;                                                         \
378
0
            }                                                                  \
379
0
            else                                                               \
380
0
            {                                                                  \
381
0
                if (dec_bitsleft < 8)                                          \
382
0
                {                                                              \
383
0
                    goto no_eoi;                                               \
384
0
                }                                                              \
385
0
                nextdata = (nextdata << 8) | *(bp)++;                          \
386
0
                nextbits += 8;                                                 \
387
0
                dec_bitsleft -= 8;                                             \
388
0
                if (nextbits < 0)                                              \
389
0
                {                                                              \
390
0
                    if (dec_bitsleft < 8)                                      \
391
0
                    {                                                          \
392
0
                        goto no_eoi;                                           \
393
0
                    }                                                          \
394
0
                    nextdata = (nextdata << 8) | *(bp)++;                      \
395
0
                    nextbits += 8;                                             \
396
0
                    dec_bitsleft -= 8;                                         \
397
0
                }                                                              \
398
0
            }                                                                  \
399
0
        }                                                                      \
400
0
        code = (WordType)((nextdata >> nextbits) & nbitsmask);                 \
401
0
    } while (0)
402
403
static int LZWDecode(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s)
404
0
{
405
0
    static const char module[] = "LZWDecode";
406
0
    LZWCodecState *sp = LZWDecoderState(tif);
407
0
    uint8_t *op = (uint8_t *)op0;
408
0
    tmsize_t occ = occ0;
409
0
    uint8_t *bp;
410
0
    long nbits, nextbits, nbitsmask;
411
0
    WordType nextdata;
412
0
    code_t *free_entp, *maxcodep, *oldcodep;
413
414
0
    (void)s;
415
0
    assert(sp != NULL);
416
0
    assert(sp->dec_codetab != NULL);
417
418
0
    if (sp->read_error)
419
0
    {
420
0
        memset(op, 0, (size_t)occ);
421
0
        TIFFErrorExtR(tif, module,
422
0
                      "LZWDecode: Scanline %" PRIu32 " cannot be read due to "
423
0
                      "previous error",
424
0
                      tif->tif_row);
425
0
        return 0;
426
0
    }
427
428
    /*
429
     * Restart interrupted output operation.
430
     */
431
0
    if (sp->dec_restart)
432
0
    {
433
0
        tmsize_t residue;
434
435
0
        code_t *codep = sp->dec_codep;
436
0
        residue = codep->length - sp->dec_restart;
437
0
        if (residue > occ)
438
0
        {
439
            /*
440
             * Residue from previous decode is sufficient
441
             * to satisfy decode request.  Skip to the
442
             * start of the decoded string, place decoded
443
             * values in the output buffer, and return.
444
             */
445
0
            sp->dec_restart += occ;
446
0
            do
447
0
            {
448
0
                codep = codep->next;
449
0
            } while (--residue > occ && codep);
450
0
            if (codep)
451
0
            {
452
0
                uint8_t *tp = op + occ;
453
0
                do
454
0
                {
455
0
                    *--tp = codep->value;
456
0
                    codep = codep->next;
457
0
                } while (--occ && codep);
458
0
            }
459
0
            return (1);
460
0
        }
461
        /*
462
         * Residue satisfies only part of the decode request.
463
         */
464
0
        op += residue;
465
0
        occ -= residue;
466
0
        uint8_t *tp = op;
467
0
        do
468
0
        {
469
0
            *--tp = codep->value;
470
0
            codep = codep->next;
471
0
        } while (--residue && codep);
472
0
        sp->dec_restart = 0;
473
0
    }
474
475
0
    bp = (uint8_t *)tif->tif_rawcp;
476
0
    sp->dec_bitsleft += (((uint64_t)tif->tif_rawcc - sp->old_tif_rawcc) << 3);
477
0
    uint64_t dec_bitsleft = sp->dec_bitsleft;
478
0
    nbits = sp->lzw_nbits;
479
0
    nextdata = sp->lzw_nextdata;
480
0
    nextbits = sp->lzw_nextbits;
481
0
    nbitsmask = sp->dec_nbitsmask;
482
0
    oldcodep = sp->dec_oldcodep;
483
0
    free_entp = sp->dec_free_entp;
484
0
    maxcodep = sp->dec_maxcodep;
485
0
    code_t *const dec_codetab = sp->dec_codetab;
486
0
    code_t *codep;
487
488
0
    if (occ == 0)
489
0
    {
490
0
        goto after_loop;
491
0
    }
492
493
0
begin:
494
0
{
495
0
    WordType code;
496
0
    GetNextCodeLZW();
497
0
    codep = dec_codetab + code;
498
0
    if (code >= CODE_FIRST)
499
0
        goto code_above_or_equal_to_258;
500
0
    if (code < 256)
501
0
        goto code_below_256;
502
0
    if (code == CODE_EOI)
503
0
        goto after_loop;
504
0
    goto code_clear;
505
506
0
code_below_256:
507
0
{
508
0
    if (codep > free_entp)
509
0
        goto error_code;
510
0
    free_entp->next = oldcodep;
511
0
    free_entp->firstchar = oldcodep->firstchar;
512
0
    free_entp->length = oldcodep->length + 1;
513
0
    free_entp->value = (uint8_t)code;
514
0
    free_entp->repeated =
515
0
        (bool)(oldcodep->repeated & (oldcodep->value == code));
516
0
    if (++free_entp > maxcodep)
517
0
    {
518
0
        if (++nbits > BITS_MAX) /* should not happen for a conformant encoder */
519
0
            nbits = BITS_MAX;
520
0
        nbitsmask = MAXCODE(nbits);
521
0
        maxcodep = dec_codetab + nbitsmask - 1;
522
0
        if (free_entp >= &dec_codetab[CSIZE])
523
0
        {
524
            /* At that point, the next valid states are either EOI or a */
525
            /* CODE_CLEAR. If a regular code is read, at the next */
526
            /* attempt at registering a new entry, we will error out */
527
            /* due to setting free_entp before any valid code */
528
0
            free_entp = dec_codetab - 1;
529
0
        }
530
0
    }
531
0
    oldcodep = codep;
532
0
    *op++ = (uint8_t)code;
533
0
    occ--;
534
0
    if (occ == 0)
535
0
        goto after_loop;
536
0
    goto begin;
537
0
}
538
539
0
code_above_or_equal_to_258:
540
0
{
541
    /*
542
     * Add the new entry to the code table.
543
     */
544
545
0
    if (codep >= free_entp)
546
0
    {
547
0
        if (codep != free_entp)
548
0
            goto error_code;
549
0
        free_entp->value = oldcodep->firstchar;
550
0
    }
551
0
    else
552
0
    {
553
0
        free_entp->value = codep->firstchar;
554
0
    }
555
0
    free_entp->repeated =
556
0
        (bool)(oldcodep->repeated & (oldcodep->value == free_entp->value));
557
0
    free_entp->next = oldcodep;
558
559
0
    free_entp->firstchar = oldcodep->firstchar;
560
0
    free_entp->length = oldcodep->length + 1;
561
0
    if (++free_entp > maxcodep)
562
0
    {
563
0
        if (++nbits > BITS_MAX) /* should not happen for a conformant encoder */
564
0
            nbits = BITS_MAX;
565
0
        nbitsmask = MAXCODE(nbits);
566
0
        maxcodep = dec_codetab + nbitsmask - 1;
567
0
        if (free_entp >= &dec_codetab[CSIZE])
568
0
        {
569
            /* At that point, the next valid states are either EOI or a */
570
            /* CODE_CLEAR. If a regular code is read, at the next */
571
            /* attempt at registering a new entry, we will error out */
572
            /* due to setting free_entp before any valid code */
573
0
            free_entp = dec_codetab - 1;
574
0
        }
575
0
    }
576
0
    oldcodep = codep;
577
578
    /*
579
     * Code maps to a string, copy string
580
     * value to output (written in reverse).
581
     */
582
    /* tiny bit faster on x86_64 to store in unsigned short than int */
583
0
    unsigned short len = codep->length;
584
585
0
    if (len < 3) /* equivalent to len == 2 given all other conditions */
586
0
    {
587
0
        if (occ <= 2)
588
0
        {
589
0
            if (occ == 2)
590
0
            {
591
0
                memcpy(op, &(codep->firstchar), 2);
592
0
                op += 2;
593
0
                occ -= 2;
594
0
                goto after_loop;
595
0
            }
596
0
            goto too_short_buffer;
597
0
        }
598
599
0
        memcpy(op, &(codep->firstchar), 2);
600
0
        op += 2;
601
0
        occ -= 2;
602
0
        goto begin; /* we can save the comparison occ > 0 */
603
0
    }
604
605
0
    if (len == 3)
606
0
    {
607
0
        if (occ <= 3)
608
0
        {
609
0
            if (occ == 3)
610
0
            {
611
0
                op[0] = codep->firstchar;
612
0
                op[1] = codep->next->value;
613
0
                op[2] = codep->value;
614
0
                op += 3;
615
0
                occ -= 3;
616
0
                goto after_loop;
617
0
            }
618
0
            goto too_short_buffer;
619
0
        }
620
621
0
        op[0] = codep->firstchar;
622
0
        op[1] = codep->next->value;
623
0
        op[2] = codep->value;
624
0
        op += 3;
625
0
        occ -= 3;
626
0
        goto begin; /* we can save the comparison occ > 0 */
627
0
    }
628
629
0
    if (len > occ)
630
0
    {
631
0
        goto too_short_buffer;
632
0
    }
633
634
0
    if (codep->repeated)
635
0
    {
636
0
        memset(op, codep->value, len);
637
0
        op += len;
638
0
        occ -= len;
639
0
        if (occ == 0)
640
0
            goto after_loop;
641
0
        goto begin;
642
0
    }
643
644
0
    uint8_t *tp = op + len;
645
646
0
    assert(len >= 4);
647
648
0
    *--tp = codep->value;
649
0
    codep = codep->next;
650
0
    *--tp = codep->value;
651
0
    codep = codep->next;
652
0
    *--tp = codep->value;
653
0
    codep = codep->next;
654
0
    *--tp = codep->value;
655
0
    if (tp > op)
656
0
    {
657
0
        do
658
0
        {
659
0
            codep = codep->next;
660
0
            *--tp = codep->value;
661
0
        } while (tp > op);
662
0
    }
663
664
0
    assert(occ >= len);
665
0
    op += len;
666
0
    occ -= len;
667
0
    if (occ == 0)
668
0
        goto after_loop;
669
0
    goto begin;
670
0
}
671
672
0
code_clear:
673
0
{
674
0
    free_entp = dec_codetab + CODE_FIRST;
675
0
    nbits = BITS_MIN;
676
0
    nbitsmask = MAXCODE(BITS_MIN);
677
0
    maxcodep = dec_codetab + nbitsmask - 1;
678
0
    do
679
0
    {
680
0
        GetNextCodeLZW();
681
0
    } while (code == CODE_CLEAR); /* consecutive CODE_CLEAR codes */
682
0
    if (code == CODE_EOI)
683
0
        goto after_loop;
684
0
    if (code > CODE_EOI)
685
0
    {
686
0
        goto error_code;
687
0
    }
688
0
    *op++ = (uint8_t)code;
689
0
    occ--;
690
0
    oldcodep = dec_codetab + code;
691
0
    if (occ == 0)
692
0
        goto after_loop;
693
0
    goto begin;
694
0
}
695
0
}
696
697
0
too_short_buffer:
698
0
{
699
    /*
700
     * String is too long for decode buffer,
701
     * locate portion that will fit, copy to
702
     * the decode buffer, and setup restart
703
     * logic for the next decoding call.
704
     */
705
0
    sp->dec_codep = codep;
706
0
    do
707
0
    {
708
0
        codep = codep->next;
709
0
    } while (codep->length > occ);
710
711
0
    sp->dec_restart = occ;
712
0
    uint8_t *tp = op + occ;
713
0
    do
714
0
    {
715
0
        *--tp = codep->value;
716
0
        codep = codep->next;
717
0
    } while (--occ);
718
0
}
719
720
0
after_loop:
721
0
    tif->tif_rawcc -= (tmsize_t)((uint8_t *)bp - tif->tif_rawcp);
722
0
    tif->tif_rawcp = (uint8_t *)bp;
723
0
    sp->old_tif_rawcc = tif->tif_rawcc;
724
0
    sp->dec_bitsleft = dec_bitsleft;
725
0
    sp->lzw_nbits = (unsigned short)nbits;
726
0
    sp->lzw_nextdata = nextdata;
727
0
    sp->lzw_nextbits = nextbits;
728
0
    sp->dec_nbitsmask = nbitsmask;
729
0
    sp->dec_oldcodep = oldcodep;
730
0
    sp->dec_free_entp = free_entp;
731
0
    sp->dec_maxcodep = maxcodep;
732
733
0
    if (occ > 0)
734
0
    {
735
0
        memset(op, 0, (size_t)occ);
736
0
        TIFFErrorExtR(tif, module,
737
0
                      "Not enough data at scanline %" PRIu32 " (short %" PRIu64
738
0
                      " bytes)",
739
0
                      tif->tif_row, (uint64_t)occ);
740
0
        return (0);
741
0
    }
742
0
    return (1);
743
744
0
no_eoi:
745
0
    memset(op, 0, (size_t)occ);
746
0
    sp->read_error = 1;
747
0
    TIFFErrorExtR(tif, module,
748
0
                  "LZWDecode: Strip %" PRIu32 " not terminated with EOI code",
749
0
                  tif->tif_curstrip);
750
0
    return 0;
751
0
error_code:
752
0
    memset(op, 0, (size_t)occ);
753
0
    sp->read_error = 1;
754
0
    TIFFErrorExtR(tif, tif->tif_name, "Using code not yet in table");
755
0
    return 0;
756
0
}
757
758
#ifdef LZW_COMPAT
759
760
/*
761
 * This check shouldn't be necessary because each
762
 * strip is suppose to be terminated with CODE_EOI.
763
 */
764
#define NextCode(_tif, _sp, _bp, _code, _get, dec_bitsleft)                    \
765
0
    {                                                                          \
766
0
        if (dec_bitsleft < (uint64_t)nbits)                                    \
767
0
        {                                                                      \
768
0
            TIFFWarningExtR(_tif, module,                                      \
769
0
                            "LZWDecode: Strip %" PRIu32                        \
770
0
                            " not terminated with EOI code",                   \
771
0
                            _tif->tif_curstrip);                               \
772
0
            _code = CODE_EOI;                                                  \
773
0
        }                                                                      \
774
0
        else                                                                   \
775
0
        {                                                                      \
776
0
            _get(_sp, _bp, _code);                                             \
777
0
            dec_bitsleft -= nbits;                                             \
778
0
        }                                                                      \
779
0
    }
780
781
/*
782
 * Decode a "hunk of data" for old images.
783
 */
784
#define GetNextCodeCompat(sp, bp, code)                                        \
785
0
    {                                                                          \
786
0
        nextdata |= (unsigned long)*(bp)++ << nextbits;                        \
787
0
        nextbits += 8;                                                         \
788
0
        if (nextbits < nbits)                                                  \
789
0
        {                                                                      \
790
0
            nextdata |= (unsigned long)*(bp)++ << nextbits;                    \
791
0
            nextbits += 8;                                                     \
792
0
        }                                                                      \
793
0
        code = (hcode_t)(nextdata & nbitsmask);                                \
794
0
        nextdata >>= nbits;                                                    \
795
0
        nextbits -= nbits;                                                     \
796
0
    }
797
798
static int LZWDecodeCompat(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s)
799
0
{
800
0
    static const char module[] = "LZWDecodeCompat";
801
0
    LZWCodecState *sp = LZWDecoderState(tif);
802
0
    uint8_t *op = (uint8_t *)op0;
803
0
    tmsize_t occ = occ0;
804
0
    uint8_t *tp;
805
0
    uint8_t *bp;
806
0
    int code, nbits;
807
0
    int len;
808
0
    long nextbits, nbitsmask;
809
0
    WordType nextdata;
810
0
    code_t *codep, *free_entp, *maxcodep, *oldcodep;
811
812
0
    (void)s;
813
0
    assert(sp != NULL);
814
815
    /*
816
     * Restart interrupted output operation.
817
     */
818
0
    if (sp->dec_restart)
819
0
    {
820
0
        tmsize_t residue;
821
822
0
        codep = sp->dec_codep;
823
0
        residue = codep->length - sp->dec_restart;
824
0
        if (residue > occ)
825
0
        {
826
            /*
827
             * Residue from previous decode is sufficient
828
             * to satisfy decode request.  Skip to the
829
             * start of the decoded string, place decoded
830
             * values in the output buffer, and return.
831
             */
832
0
            sp->dec_restart += occ;
833
0
            do
834
0
            {
835
0
                codep = codep->next;
836
0
            } while (--residue > occ);
837
0
            tp = op + occ;
838
0
            do
839
0
            {
840
0
                *--tp = codep->value;
841
0
                codep = codep->next;
842
0
            } while (--occ);
843
0
            return (1);
844
0
        }
845
        /*
846
         * Residue satisfies only part of the decode request.
847
         */
848
0
        op += residue;
849
0
        occ -= residue;
850
0
        tp = op;
851
0
        do
852
0
        {
853
0
            *--tp = codep->value;
854
0
            codep = codep->next;
855
0
        } while (--residue);
856
0
        sp->dec_restart = 0;
857
0
    }
858
859
0
    bp = (uint8_t *)tif->tif_rawcp;
860
861
0
    sp->dec_bitsleft += (((uint64_t)tif->tif_rawcc - sp->old_tif_rawcc) << 3);
862
0
    uint64_t dec_bitsleft = sp->dec_bitsleft;
863
864
0
    nbits = sp->lzw_nbits;
865
0
    nextdata = sp->lzw_nextdata;
866
0
    nextbits = sp->lzw_nextbits;
867
0
    nbitsmask = sp->dec_nbitsmask;
868
0
    oldcodep = sp->dec_oldcodep;
869
0
    free_entp = sp->dec_free_entp;
870
0
    maxcodep = sp->dec_maxcodep;
871
872
0
    while (occ > 0)
873
0
    {
874
0
        NextCode(tif, sp, bp, code, GetNextCodeCompat, dec_bitsleft);
875
0
        if (code == CODE_EOI)
876
0
            break;
877
0
        if (code == CODE_CLEAR)
878
0
        {
879
0
            do
880
0
            {
881
0
                free_entp = sp->dec_codetab + CODE_FIRST;
882
0
                _TIFFmemset(free_entp, 0,
883
0
                            (CSIZE - CODE_FIRST) * sizeof(code_t));
884
0
                nbits = BITS_MIN;
885
0
                nbitsmask = MAXCODE(BITS_MIN);
886
0
                maxcodep = sp->dec_codetab + nbitsmask;
887
0
                NextCode(tif, sp, bp, code, GetNextCodeCompat, dec_bitsleft);
888
0
            } while (code == CODE_CLEAR); /* consecutive CODE_CLEAR codes */
889
0
            if (code == CODE_EOI)
890
0
                break;
891
0
            if (code > CODE_CLEAR)
892
0
            {
893
0
                TIFFErrorExtR(
894
0
                    tif, tif->tif_name,
895
0
                    "LZWDecode: Corrupted LZW table at scanline %" PRIu32,
896
0
                    tif->tif_row);
897
0
                return (0);
898
0
            }
899
0
            *op++ = (uint8_t)code;
900
0
            occ--;
901
0
            oldcodep = sp->dec_codetab + code;
902
0
            continue;
903
0
        }
904
0
        codep = sp->dec_codetab + code;
905
906
        /*
907
         * Add the new entry to the code table.
908
         */
909
0
        if (free_entp < &sp->dec_codetab[0] ||
910
0
            free_entp >= &sp->dec_codetab[CSIZE])
911
0
        {
912
0
            TIFFErrorExtR(tif, module,
913
0
                          "Corrupted LZW table at scanline %" PRIu32,
914
0
                          tif->tif_row);
915
0
            return (0);
916
0
        }
917
918
0
        free_entp->next = oldcodep;
919
0
        if (free_entp->next < &sp->dec_codetab[0] ||
920
0
            free_entp->next >= &sp->dec_codetab[CSIZE])
921
0
        {
922
0
            TIFFErrorExtR(tif, module,
923
0
                          "Corrupted LZW table at scanline %" PRIu32,
924
0
                          tif->tif_row);
925
0
            return (0);
926
0
        }
927
0
        free_entp->firstchar = free_entp->next->firstchar;
928
0
        free_entp->length = free_entp->next->length + 1;
929
0
        free_entp->value =
930
0
            (codep < free_entp) ? codep->firstchar : free_entp->firstchar;
931
0
        if (++free_entp > maxcodep)
932
0
        {
933
0
            if (++nbits > BITS_MAX) /* should not happen */
934
0
                nbits = BITS_MAX;
935
0
            nbitsmask = MAXCODE(nbits);
936
0
            maxcodep = sp->dec_codetab + nbitsmask;
937
0
        }
938
0
        oldcodep = codep;
939
0
        if (code >= 256)
940
0
        {
941
            /*
942
             * Code maps to a string, copy string
943
             * value to output (written in reverse).
944
             */
945
0
            if (codep->length == 0)
946
0
            {
947
0
                TIFFErrorExtR(
948
0
                    tif, module,
949
0
                    "Wrong length of decoded "
950
0
                    "string: data probably corrupted at scanline %" PRIu32,
951
0
                    tif->tif_row);
952
0
                return (0);
953
0
            }
954
0
            if (codep->length > occ)
955
0
            {
956
                /*
957
                 * String is too long for decode buffer,
958
                 * locate portion that will fit, copy to
959
                 * the decode buffer, and setup restart
960
                 * logic for the next decoding call.
961
                 */
962
0
                sp->dec_codep = codep;
963
0
                do
964
0
                {
965
0
                    codep = codep->next;
966
0
                } while (codep->length > occ);
967
0
                sp->dec_restart = occ;
968
0
                tp = op + occ;
969
0
                do
970
0
                {
971
0
                    *--tp = codep->value;
972
0
                    codep = codep->next;
973
0
                } while (--occ);
974
0
                break;
975
0
            }
976
0
            len = codep->length;
977
0
            tp = op + len;
978
0
            do
979
0
            {
980
0
                *--tp = codep->value;
981
0
                codep = codep->next;
982
0
            } while (codep && tp > op);
983
0
            assert(occ >= len);
984
0
            op += len;
985
0
            occ -= len;
986
0
        }
987
0
        else
988
0
        {
989
0
            *op++ = (uint8_t)code;
990
0
            occ--;
991
0
        }
992
0
    }
993
994
0
    tif->tif_rawcc -= (tmsize_t)((uint8_t *)bp - tif->tif_rawcp);
995
0
    tif->tif_rawcp = (uint8_t *)bp;
996
997
0
    sp->old_tif_rawcc = tif->tif_rawcc;
998
0
    sp->dec_bitsleft = dec_bitsleft;
999
1000
0
    sp->lzw_nbits = (unsigned short)nbits;
1001
0
    sp->lzw_nextdata = nextdata;
1002
0
    sp->lzw_nextbits = nextbits;
1003
0
    sp->dec_nbitsmask = nbitsmask;
1004
0
    sp->dec_oldcodep = oldcodep;
1005
0
    sp->dec_free_entp = free_entp;
1006
0
    sp->dec_maxcodep = maxcodep;
1007
1008
0
    if (occ > 0)
1009
0
    {
1010
0
        TIFFErrorExtR(tif, module,
1011
0
                      "Not enough data at scanline %" PRIu32 " (short %" PRIu64
1012
0
                      " bytes)",
1013
0
                      tif->tif_row, (uint64_t)occ);
1014
0
        return (0);
1015
0
    }
1016
0
    return (1);
1017
0
}
1018
#endif /* LZW_COMPAT */
1019
1020
/*
1021
 * LZW Encoding.
1022
 */
1023
1024
static int LZWSetupEncode(TIFF *tif)
1025
0
{
1026
0
    static const char module[] = "LZWSetupEncode";
1027
0
    LZWCodecState *sp = LZWEncoderState(tif);
1028
1029
0
    assert(sp != NULL);
1030
0
    sp->enc_hashtab = (hash_t *)_TIFFmallocExt(tif, HSIZE * sizeof(hash_t));
1031
0
    if (sp->enc_hashtab == NULL)
1032
0
    {
1033
0
        TIFFErrorExtR(tif, module, "No space for LZW hash table");
1034
0
        return (0);
1035
0
    }
1036
0
    return (1);
1037
0
}
1038
1039
/*
1040
 * Reset encoding state at the start of a strip.
1041
 */
1042
static int LZWPreEncode(TIFF *tif, uint16_t s)
1043
0
{
1044
0
    LZWCodecState *sp = LZWEncoderState(tif);
1045
1046
0
    (void)s;
1047
0
    assert(sp != NULL);
1048
1049
0
    if (sp->enc_hashtab == NULL)
1050
0
    {
1051
0
        tif->tif_setupencode(tif);
1052
0
    }
1053
1054
0
    sp->lzw_nbits = BITS_MIN;
1055
0
    sp->lzw_maxcode = MAXCODE(BITS_MIN);
1056
0
    sp->lzw_free_ent = CODE_FIRST;
1057
0
    sp->lzw_nextbits = 0;
1058
0
    sp->lzw_nextdata = 0;
1059
0
    sp->enc_checkpoint = CHECK_GAP;
1060
0
    sp->enc_ratio = 0;
1061
0
    sp->enc_incount = 0;
1062
0
    sp->enc_outcount = 0;
1063
    /*
1064
     * The 4 here insures there is space for 2 max-sized
1065
     * codes in LZWEncode and LZWPostDecode.
1066
     */
1067
0
    sp->enc_rawlimit = tif->tif_rawdata + tif->tif_rawdatasize - 1 - 4;
1068
0
    cl_hash(sp);                   /* clear hash table */
1069
0
    sp->enc_oldcode = (hcode_t)-1; /* generates CODE_CLEAR in LZWEncode */
1070
0
    return (1);
1071
0
}
1072
1073
#define CALCRATIO(sp, rat)                                                     \
1074
0
    {                                                                          \
1075
0
        if (incount > 0x007fffff)                                              \
1076
0
        { /* NB: shift will overflow */                                        \
1077
0
            rat = outcount >> 8;                                               \
1078
0
            rat = (rat == 0 ? 0x7fffffff : incount / rat);                     \
1079
0
        }                                                                      \
1080
0
        else                                                                   \
1081
0
            rat = (incount << 8) / outcount;                                   \
1082
0
    }
1083
1084
/* Explicit 0xff masking to make icc -check=conversions happy */
1085
#define PutNextCode(op, c)                                                     \
1086
0
    {                                                                          \
1087
0
        nextdata = (nextdata << nbits) | c;                                    \
1088
0
        nextbits += nbits;                                                     \
1089
0
        *op++ = (unsigned char)((nextdata >> (nextbits - 8)) & 0xff);          \
1090
0
        nextbits -= 8;                                                         \
1091
0
        if (nextbits >= 8)                                                     \
1092
0
        {                                                                      \
1093
0
            *op++ = (unsigned char)((nextdata >> (nextbits - 8)) & 0xff);      \
1094
0
            nextbits -= 8;                                                     \
1095
0
        }                                                                      \
1096
0
        outcount += nbits;                                                     \
1097
0
    }
1098
1099
/*
1100
 * Encode a chunk of pixels.
1101
 *
1102
 * Uses an open addressing double hashing (no chaining) on the
1103
 * prefix code/next character combination.  We do a variant of
1104
 * Knuth's algorithm D (vol. 3, sec. 6.4) along with G. Knott's
1105
 * relatively-prime secondary probe.  Here, the modular division
1106
 * first probe is gives way to a faster exclusive-or manipulation.
1107
 * Also do block compression with an adaptive reset, whereby the
1108
 * code table is cleared when the compression ratio decreases,
1109
 * but after the table fills.  The variable-length output codes
1110
 * are re-sized at this point, and a CODE_CLEAR is generated
1111
 * for the decoder.
1112
 */
1113
static int LZWEncode(TIFF *tif, uint8_t *bp, tmsize_t cc, uint16_t s)
1114
0
{
1115
0
    register LZWCodecState *sp = LZWEncoderState(tif);
1116
0
    register long fcode;
1117
0
    register hash_t *hp;
1118
0
    register int h, c;
1119
0
    hcode_t ent;
1120
0
    long disp;
1121
0
    tmsize_t incount, outcount, checkpoint;
1122
0
    WordType nextdata;
1123
0
    long nextbits;
1124
0
    int free_ent, maxcode, nbits;
1125
0
    uint8_t *op;
1126
0
    uint8_t *limit;
1127
1128
0
    (void)s;
1129
0
    if (sp == NULL)
1130
0
        return (0);
1131
1132
0
    assert(sp->enc_hashtab != NULL);
1133
1134
    /*
1135
     * Load local state.
1136
     */
1137
0
    incount = sp->enc_incount;
1138
0
    outcount = sp->enc_outcount;
1139
0
    checkpoint = sp->enc_checkpoint;
1140
0
    nextdata = sp->lzw_nextdata;
1141
0
    nextbits = sp->lzw_nextbits;
1142
0
    free_ent = sp->lzw_free_ent;
1143
0
    maxcode = sp->lzw_maxcode;
1144
0
    nbits = sp->lzw_nbits;
1145
0
    op = tif->tif_rawcp;
1146
0
    limit = sp->enc_rawlimit;
1147
0
    ent = (hcode_t)sp->enc_oldcode;
1148
1149
0
    if (ent == (hcode_t)-1 && cc > 0)
1150
0
    {
1151
        /*
1152
         * NB: This is safe because it can only happen
1153
         *     at the start of a strip where we know there
1154
         *     is space in the data buffer.
1155
         */
1156
0
        PutNextCode(op, CODE_CLEAR);
1157
0
        ent = *bp++;
1158
0
        cc--;
1159
0
        incount++;
1160
0
    }
1161
0
    while (cc > 0)
1162
0
    {
1163
0
        c = *bp++;
1164
0
        cc--;
1165
0
        incount++;
1166
0
        fcode = ((long)c << BITS_MAX) + ent;
1167
0
        h = (c << HSHIFT) ^ ent; /* xor hashing */
1168
#ifdef _WINDOWS
1169
        /*
1170
         * Check hash index for an overflow.
1171
         */
1172
        if (h >= HSIZE)
1173
            h -= HSIZE;
1174
#endif
1175
0
        hp = &sp->enc_hashtab[h];
1176
0
        if (hp->hash == fcode)
1177
0
        {
1178
0
            ent = hp->code;
1179
0
            continue;
1180
0
        }
1181
0
        if (hp->hash >= 0)
1182
0
        {
1183
            /*
1184
             * Primary hash failed, check secondary hash.
1185
             */
1186
0
            disp = HSIZE - h;
1187
0
            if (h == 0)
1188
0
                disp = 1;
1189
0
            do
1190
0
            {
1191
                /*
1192
                 * Avoid pointer arithmetic because of
1193
                 * wraparound problems with segments.
1194
                 */
1195
0
                if ((h -= disp) < 0)
1196
0
                    h += HSIZE;
1197
0
                hp = &sp->enc_hashtab[h];
1198
0
                if (hp->hash == fcode)
1199
0
                {
1200
0
                    ent = hp->code;
1201
0
                    goto hit;
1202
0
                }
1203
0
            } while (hp->hash >= 0);
1204
0
        }
1205
        /*
1206
         * New entry, emit code and add to table.
1207
         */
1208
        /*
1209
         * Verify there is space in the buffer for the code
1210
         * and any potential Clear code that might be emitted
1211
         * below.  The value of limit is setup so that there
1212
         * are at least 4 bytes free--room for 2 codes.
1213
         */
1214
0
        if (op > limit)
1215
0
        {
1216
0
            tif->tif_rawcc = (tmsize_t)(op - tif->tif_rawdata);
1217
0
            if (!TIFFFlushData1(tif))
1218
0
                return 0;
1219
0
            op = tif->tif_rawdata;
1220
0
        }
1221
0
        PutNextCode(op, ent);
1222
0
        ent = (hcode_t)c;
1223
0
        hp->code = (hcode_t)(free_ent++);
1224
0
        hp->hash = fcode;
1225
0
        if (free_ent == CODE_MAX - 1)
1226
0
        {
1227
            /* table is full, emit clear code and reset */
1228
0
            cl_hash(sp);
1229
0
            sp->enc_ratio = 0;
1230
0
            incount = 0;
1231
0
            outcount = 0;
1232
0
            free_ent = CODE_FIRST;
1233
0
            PutNextCode(op, CODE_CLEAR);
1234
0
            nbits = BITS_MIN;
1235
0
            maxcode = MAXCODE(BITS_MIN);
1236
0
        }
1237
0
        else
1238
0
        {
1239
            /*
1240
             * If the next entry is going to be too big for
1241
             * the code size, then increase it, if possible.
1242
             */
1243
0
            if (free_ent > maxcode)
1244
0
            {
1245
0
                nbits++;
1246
0
                assert(nbits <= BITS_MAX);
1247
0
                maxcode = (int)MAXCODE(nbits);
1248
0
            }
1249
0
            else if (incount >= checkpoint)
1250
0
            {
1251
0
                tmsize_t rat;
1252
                /*
1253
                 * Check compression ratio and, if things seem
1254
                 * to be slipping, clear the hash table and
1255
                 * reset state.  The compression ratio is a
1256
                 * 24+8-bit fractional number.
1257
                 */
1258
0
                checkpoint = incount + CHECK_GAP;
1259
0
                CALCRATIO(sp, rat);
1260
0
                if (rat <= sp->enc_ratio)
1261
0
                {
1262
0
                    cl_hash(sp);
1263
0
                    sp->enc_ratio = 0;
1264
0
                    incount = 0;
1265
0
                    outcount = 0;
1266
0
                    free_ent = CODE_FIRST;
1267
0
                    PutNextCode(op, CODE_CLEAR);
1268
0
                    nbits = BITS_MIN;
1269
0
                    maxcode = MAXCODE(BITS_MIN);
1270
0
                }
1271
0
                else
1272
0
                    sp->enc_ratio = rat;
1273
0
            }
1274
0
        }
1275
0
    hit:;
1276
0
    }
1277
1278
    /*
1279
     * Restore global state.
1280
     */
1281
0
    sp->enc_incount = incount;
1282
0
    sp->enc_outcount = outcount;
1283
0
    sp->enc_checkpoint = checkpoint;
1284
0
    sp->enc_oldcode = ent;
1285
0
    sp->lzw_nextdata = nextdata;
1286
0
    sp->lzw_nextbits = nextbits;
1287
0
    sp->lzw_free_ent = (unsigned short)free_ent;
1288
0
    sp->lzw_maxcode = (unsigned short)maxcode;
1289
0
    sp->lzw_nbits = (unsigned short)nbits;
1290
0
    tif->tif_rawcp = op;
1291
0
    return (1);
1292
0
}
1293
1294
/*
1295
 * Finish off an encoded strip by flushing the last
1296
 * string and tacking on an End Of Information code.
1297
 */
1298
static int LZWPostEncode(TIFF *tif)
1299
0
{
1300
0
    register LZWCodecState *sp = LZWEncoderState(tif);
1301
0
    uint8_t *op = tif->tif_rawcp;
1302
0
    long nextbits = sp->lzw_nextbits;
1303
0
    WordType nextdata = sp->lzw_nextdata;
1304
0
    tmsize_t outcount = sp->enc_outcount;
1305
0
    int nbits = sp->lzw_nbits;
1306
1307
0
    if (op > sp->enc_rawlimit)
1308
0
    {
1309
0
        tif->tif_rawcc = (tmsize_t)(op - tif->tif_rawdata);
1310
0
        if (!TIFFFlushData1(tif))
1311
0
            return 0;
1312
0
        op = tif->tif_rawdata;
1313
0
    }
1314
0
    if (sp->enc_oldcode != (hcode_t)-1)
1315
0
    {
1316
0
        int free_ent = sp->lzw_free_ent;
1317
1318
0
        PutNextCode(op, sp->enc_oldcode);
1319
0
        sp->enc_oldcode = (hcode_t)-1;
1320
0
        free_ent++;
1321
1322
0
        if (free_ent == CODE_MAX - 1)
1323
0
        {
1324
            /* table is full, emit clear code and reset */
1325
0
            outcount = 0;
1326
0
            PutNextCode(op, CODE_CLEAR);
1327
0
            nbits = BITS_MIN;
1328
0
        }
1329
0
        else
1330
0
        {
1331
            /*
1332
             * If the next entry is going to be too big for
1333
             * the code size, then increase it, if possible.
1334
             */
1335
0
            if (free_ent > sp->lzw_maxcode)
1336
0
            {
1337
0
                nbits++;
1338
0
                assert(nbits <= BITS_MAX);
1339
0
            }
1340
0
        }
1341
0
    }
1342
0
    PutNextCode(op, CODE_EOI);
1343
    /* Explicit 0xff masking to make icc -check=conversions happy */
1344
0
    if (nextbits > 0)
1345
0
        *op++ = (unsigned char)((nextdata << (8 - nextbits)) & 0xff);
1346
0
    tif->tif_rawcc = (tmsize_t)(op - tif->tif_rawdata);
1347
0
    (void)outcount;
1348
0
    return (1);
1349
0
}
1350
1351
/*
1352
 * Reset encoding hash table.
1353
 */
1354
static void cl_hash(LZWCodecState *sp)
1355
0
{
1356
0
    register hash_t *hp = &sp->enc_hashtab[HSIZE - 1];
1357
0
    register long i = HSIZE - 8;
1358
1359
0
    do
1360
0
    {
1361
0
        i -= 8;
1362
0
        hp[-7].hash = -1;
1363
0
        hp[-6].hash = -1;
1364
0
        hp[-5].hash = -1;
1365
0
        hp[-4].hash = -1;
1366
0
        hp[-3].hash = -1;
1367
0
        hp[-2].hash = -1;
1368
0
        hp[-1].hash = -1;
1369
0
        hp[0].hash = -1;
1370
0
        hp -= 8;
1371
0
    } while (i >= 0);
1372
0
    for (i += 8; i > 0; i--, hp--)
1373
0
        hp->hash = -1;
1374
0
}
1375
1376
static void LZWCleanup(TIFF *tif)
1377
0
{
1378
0
    (void)TIFFPredictorCleanup(tif);
1379
1380
0
    assert(tif->tif_data != 0);
1381
1382
0
    if (LZWDecoderState(tif)->dec_codetab)
1383
0
        _TIFFfreeExt(tif, LZWDecoderState(tif)->dec_codetab);
1384
1385
0
    if (LZWEncoderState(tif)->enc_hashtab)
1386
0
        _TIFFfreeExt(tif, LZWEncoderState(tif)->enc_hashtab);
1387
1388
0
    _TIFFfreeExt(tif, tif->tif_data);
1389
0
    tif->tif_data = NULL;
1390
1391
0
    _TIFFSetDefaultCompressionState(tif);
1392
0
}
1393
1394
int TIFFInitLZW(TIFF *tif, int scheme)
1395
0
{
1396
0
    static const char module[] = "TIFFInitLZW";
1397
0
    (void)scheme;
1398
0
    assert(scheme == COMPRESSION_LZW);
1399
    /*
1400
     * Allocate state block so tag methods have storage to record values.
1401
     */
1402
0
    tif->tif_data = (uint8_t *)_TIFFmallocExt(tif, sizeof(LZWCodecState));
1403
0
    if (tif->tif_data == NULL)
1404
0
        goto bad;
1405
0
    LZWDecoderState(tif)->dec_codetab = NULL;
1406
0
    LZWDecoderState(tif)->dec_decode = NULL;
1407
0
    LZWEncoderState(tif)->enc_hashtab = NULL;
1408
0
    LZWState(tif)->rw_mode = tif->tif_mode;
1409
1410
    /*
1411
     * Install codec methods.
1412
     */
1413
0
    tif->tif_fixuptags = LZWFixupTags;
1414
0
    tif->tif_setupdecode = LZWSetupDecode;
1415
0
    tif->tif_predecode = LZWPreDecode;
1416
0
    tif->tif_decoderow = LZWDecode;
1417
0
    tif->tif_decodestrip = LZWDecode;
1418
0
    tif->tif_decodetile = LZWDecode;
1419
0
    tif->tif_setupencode = LZWSetupEncode;
1420
0
    tif->tif_preencode = LZWPreEncode;
1421
0
    tif->tif_postencode = LZWPostEncode;
1422
0
    tif->tif_encoderow = LZWEncode;
1423
0
    tif->tif_encodestrip = LZWEncode;
1424
0
    tif->tif_encodetile = LZWEncode;
1425
0
    tif->tif_cleanup = LZWCleanup;
1426
    /*
1427
     * Setup predictor setup.
1428
     */
1429
0
    (void)TIFFPredictorInit(tif);
1430
0
    return (1);
1431
0
bad:
1432
0
    TIFFErrorExtR(tif, module, "No space for LZW state block");
1433
0
    return (0);
1434
0
}
1435
1436
/*
1437
 * Copyright (c) 1985, 1986 The Regents of the University of California.
1438
 * All rights reserved.
1439
 *
1440
 * This code is derived from software contributed to Berkeley by
1441
 * James A. Woods, derived from original work by Spencer Thomas
1442
 * and Joseph Orost.
1443
 *
1444
 * Redistribution and use in source and binary forms are permitted
1445
 * provided that the above copyright notice and this paragraph are
1446
 * duplicated in all such forms and that any documentation,
1447
 * advertising materials, and other materials related to such
1448
 * distribution and use acknowledge that the software was developed
1449
 * by the University of California, Berkeley.  The name of the
1450
 * University may not be used to endorse or promote products derived
1451
 * from this software without specific prior written permission.
1452
 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
1453
 * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
1454
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
1455
 */
1456
#endif /* LZW_SUPPORT */