Coverage Report

Created: 2023-12-08 06:53

/src/freeimage-svn/FreeImage/trunk/Source/LibTIFF4/tif_lzw.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright (c) 1988-1997 Sam Leffler
3
 * Copyright (c) 1991-1997 Silicon Graphics, Inc.
4
 * Copyright (c) 2022 Even Rouault
5
 *
6
 * Permission to use, copy, modify, distribute, and sell this software and
7
 * its documentation for any purpose is hereby granted without fee, provided
8
 * that (i) the above copyright notices and this permission notice appear in
9
 * all copies of the software and related documentation, and (ii) the names of
10
 * Sam Leffler and Silicon Graphics may not be used in any advertising or
11
 * publicity relating to the software without the specific, prior written
12
 * permission of Sam Leffler and Silicon Graphics.
13
 *
14
 * THE SOFTWARE IS PROVIDED "AS-IS" AND WITHOUT WARRANTY OF ANY KIND,
15
 * EXPRESS, IMPLIED OR OTHERWISE, INCLUDING WITHOUT LIMITATION, ANY
16
 * WARRANTY OF MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
17
 *
18
 * IN NO EVENT SHALL SAM LEFFLER OR SILICON GRAPHICS BE LIABLE FOR
19
 * ANY SPECIAL, INCIDENTAL, INDIRECT OR CONSEQUENTIAL DAMAGES OF ANY KIND,
20
 * OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
21
 * WHETHER OR NOT ADVISED OF THE POSSIBILITY OF DAMAGE, AND ON ANY THEORY OF
22
 * LIABILITY, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
23
 * OF THIS SOFTWARE.
24
 */
25
26
#include "tiffiop.h"
27
#ifdef LZW_SUPPORT
28
/*
29
 * TIFF Library.
30
 * Rev 5.0 Lempel-Ziv & Welch Compression Support
31
 *
32
 * This code is derived from the compress program whose code is
33
 * derived from software contributed to Berkeley by James A. Woods,
34
 * derived from original work by Spencer Thomas and Joseph Orost.
35
 *
36
 * The original Berkeley copyright notice appears below in its entirety.
37
 */
38
#include "tif_predict.h"
39
40
#include <stdbool.h>
41
#include <stdio.h>
42
#include <stdlib.h>
43
44
/* Select the plausible largest natural integer type for the architecture */
45
0
#define SIZEOF_WORDTYPE SIZEOF_SIZE_T
46
typedef size_t WordType;
47
48
/*
49
 * NB: The 5.0 spec describes a different algorithm than Aldus
50
 *     implements.  Specifically, Aldus does code length transitions
51
 *     one code earlier than should be done (for real LZW).
52
 *     Earlier versions of this library implemented the correct
53
 *     LZW algorithm, but emitted codes in a bit order opposite
54
 *     to the TIFF spec.  Thus, to maintain compatibility w/ Aldus
55
 *     we interpret MSB-LSB ordered codes to be images written w/
56
 *     old versions of this library, but otherwise adhere to the
57
 *     Aldus "off by one" algorithm.
58
 *
59
 * Future revisions to the TIFF spec are expected to "clarify this issue".
60
 */
61
#define LZW_COMPAT /* include backwards compatibility code */
62
63
0
#define MAXCODE(n) ((1L << (n)) - 1)
64
/*
65
 * The TIFF spec specifies that encoded bit
66
 * strings range from 9 to 12 bits.
67
 */
68
0
#define BITS_MIN 9  /* start with 9 bits */
69
0
#define BITS_MAX 12 /* max of 12 bit strings */
70
/* predefined codes */
71
0
#define CODE_CLEAR 256 /* code to clear string table */
72
0
#define CODE_EOI 257   /* end-of-information code */
73
0
#define CODE_FIRST 258 /* first free code entry */
74
0
#define CODE_MAX MAXCODE(BITS_MAX)
75
0
#define HSIZE 9001L /* 91% occupancy */
76
0
#define HSHIFT (13 - 8)
77
#ifdef LZW_COMPAT
78
/* NB: +1024 is for compatibility with old files */
79
0
#define CSIZE (MAXCODE(BITS_MAX) + 1024L)
80
#else
81
#define CSIZE (MAXCODE(BITS_MAX) + 1L)
82
#endif
83
84
/*
85
 * State block for each open TIFF file using LZW
86
 * compression/decompression.  Note that the predictor
87
 * state block must be first in this data structure.
88
 */
89
typedef struct
90
{
91
    TIFFPredictorState predict; /* predictor super class */
92
93
    unsigned short nbits;    /* # of bits/code */
94
    unsigned short maxcode;  /* maximum code for lzw_nbits */
95
    unsigned short free_ent; /* next free entry in hash table */
96
    WordType nextdata;       /* next bits of i/o */
97
    long nextbits;           /* # of valid bits in lzw_nextdata */
98
99
    int rw_mode; /* preserve rw_mode from init */
100
} LZWBaseState;
101
102
0
#define lzw_nbits base.nbits
103
0
#define lzw_maxcode base.maxcode
104
0
#define lzw_free_ent base.free_ent
105
0
#define lzw_nextdata base.nextdata
106
0
#define lzw_nextbits base.nextbits
107
108
/*
109
 * Encoding-specific state.
110
 */
111
typedef uint16_t hcode_t; /* codes fit in 16 bits */
112
typedef struct
113
{
114
    long hash;
115
    hcode_t code;
116
} hash_t;
117
118
/*
119
 * Decoding-specific state.
120
 */
121
typedef struct code_ent
122
{
123
    struct code_ent *next;
124
    unsigned short length; /* string len, including this token */
125
    /* firstchar should be placed immediately before value in this structure */
126
    unsigned char firstchar; /* first token of string */
127
    unsigned char value;     /* data value */
128
    bool repeated;
129
} code_t;
130
131
typedef int (*decodeFunc)(TIFF *, uint8_t *, tmsize_t, uint16_t);
132
133
typedef struct
134
{
135
    LZWBaseState base;
136
137
    /* Decoding specific data */
138
    long dec_nbitsmask;     /* lzw_nbits 1 bits, right adjusted */
139
    tmsize_t dec_restart;   /* restart count */
140
    uint64_t dec_bitsleft;  /* available bits in raw data */
141
    tmsize_t old_tif_rawcc; /* value of tif_rawcc at the end of the previous
142
                               TIFLZWDecode() call */
143
    decodeFunc dec_decode;  /* regular or backwards compatible */
144
    code_t *dec_codep;      /* current recognized code */
145
    code_t *dec_oldcodep;   /* previously recognized code */
146
    code_t *dec_free_entp;  /* next free entry */
147
    code_t *dec_maxcodep;   /* max available entry */
148
    code_t *dec_codetab;    /* kept separate for small machines */
149
    int read_error; /* whether a read error has occurred, and which should cause
150
                       further reads in the same strip/tile to be aborted */
151
152
    /* Encoding specific data */
153
    int enc_oldcode;         /* last code encountered */
154
    tmsize_t enc_checkpoint; /* point at which to clear table */
155
0
#define CHECK_GAP 10000      /* enc_ratio check interval */
156
    tmsize_t enc_ratio;      /* current compression ratio */
157
    tmsize_t enc_incount;    /* (input) data bytes encoded */
158
    tmsize_t enc_outcount;   /* encoded (output) bytes */
159
    uint8_t *enc_rawlimit;   /* bound on tif_rawdata buffer */
160
    hash_t *enc_hashtab;     /* kept separate for small machines */
161
} LZWCodecState;
162
163
0
#define LZWState(tif) ((LZWBaseState *)(tif)->tif_data)
164
0
#define DecoderState(tif) ((LZWCodecState *)LZWState(tif))
165
0
#define EncoderState(tif) ((LZWCodecState *)LZWState(tif))
166
167
static int LZWDecode(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s);
168
#ifdef LZW_COMPAT
169
static int LZWDecodeCompat(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s);
170
#endif
171
static void cl_hash(LZWCodecState *);
172
173
/*
174
 * LZW Decoder.
175
 */
176
177
static int LZWFixupTags(TIFF *tif)
178
0
{
179
0
    (void)tif;
180
0
    return (1);
181
0
}
182
183
static int LZWSetupDecode(TIFF *tif)
184
0
{
185
0
    static const char module[] = "LZWSetupDecode";
186
0
    LZWCodecState *sp = DecoderState(tif);
187
0
    int code;
188
189
0
    if (sp == NULL)
190
0
    {
191
        /*
192
         * Allocate state block so tag methods have storage to record
193
         * values.
194
         */
195
0
        tif->tif_data = (uint8_t *)_TIFFmallocExt(tif, sizeof(LZWCodecState));
196
0
        if (tif->tif_data == NULL)
197
0
        {
198
0
            TIFFErrorExtR(tif, module, "No space for LZW state block");
199
0
            return (0);
200
0
        }
201
202
0
        sp = DecoderState(tif);
203
0
        sp->dec_codetab = NULL;
204
0
        sp->dec_decode = NULL;
205
206
        /*
207
         * Setup predictor setup.
208
         */
209
0
        (void)TIFFPredictorInit(tif);
210
0
    }
211
212
0
    if (sp->dec_codetab == NULL)
213
0
    {
214
0
        sp->dec_codetab = (code_t *)_TIFFmallocExt(tif, CSIZE * sizeof(code_t));
215
0
        if (sp->dec_codetab == NULL)
216
0
        {
217
0
            TIFFErrorExtR(tif, module, "No space for LZW code table");
218
0
            return (0);
219
0
        }
220
        /*
221
         * Pre-load the table.
222
         */
223
0
        code = 255;
224
0
        do
225
0
        {
226
0
            sp->dec_codetab[code].firstchar = (unsigned char)code;
227
0
            sp->dec_codetab[code].value = (unsigned char)code;
228
0
            sp->dec_codetab[code].repeated = true;
229
0
            sp->dec_codetab[code].length = 1;
230
0
            sp->dec_codetab[code].next = NULL;
231
0
        } while (code--);
232
        /*
233
         * Zero-out the unused entries  */
234
        /* Silence false positive */
235
        /* coverity[overrun-buffer-arg] */
236
0
        memset(&sp->dec_codetab[CODE_CLEAR], 0,
237
0
               (CODE_FIRST - CODE_CLEAR) * sizeof(code_t));
238
0
    }
239
0
    return (1);
240
0
}
241
242
/*
243
 * Setup state for decoding a strip.
244
 */
245
static int LZWPreDecode(TIFF *tif, uint16_t s)
246
0
{
247
0
    static const char module[] = "LZWPreDecode";
248
0
    LZWCodecState *sp = DecoderState(tif);
249
250
0
    (void)s;
251
0
    assert(sp != NULL);
252
0
    if (sp->dec_codetab == NULL)
253
0
    {
254
0
        tif->tif_setupdecode(tif);
255
0
        if (sp->dec_codetab == NULL)
256
0
            return (0);
257
0
    }
258
259
    /*
260
     * Check for old bit-reversed codes.
261
     */
262
0
    if (tif->tif_rawcc >= 2 && tif->tif_rawdata[0] == 0 &&
263
0
        (tif->tif_rawdata[1] & 0x1))
264
0
    {
265
0
#ifdef LZW_COMPAT
266
0
        if (!sp->dec_decode)
267
0
        {
268
0
            TIFFWarningExtR(tif, module, "Old-style LZW codes, convert file");
269
            /*
270
             * Override default decoding methods with
271
             * ones that deal with the old coding.
272
             * Otherwise the predictor versions set
273
             * above will call the compatibility routines
274
             * through the dec_decode method.
275
             */
276
0
            tif->tif_decoderow = LZWDecodeCompat;
277
0
            tif->tif_decodestrip = LZWDecodeCompat;
278
0
            tif->tif_decodetile = LZWDecodeCompat;
279
            /*
280
             * If doing horizontal differencing, must
281
             * re-setup the predictor logic since we
282
             * switched the basic decoder methods...
283
             */
284
0
            (*tif->tif_setupdecode)(tif);
285
0
            sp->dec_decode = LZWDecodeCompat;
286
0
        }
287
0
        sp->lzw_maxcode = MAXCODE(BITS_MIN);
288
#else  /* !LZW_COMPAT */
289
        if (!sp->dec_decode)
290
        {
291
            TIFFErrorExtR(tif, module, "Old-style LZW codes not supported");
292
            sp->dec_decode = LZWDecode;
293
        }
294
        return (0);
295
#endif /* !LZW_COMPAT */
296
0
    }
297
0
    else
298
0
    {
299
0
        sp->lzw_maxcode = MAXCODE(BITS_MIN) - 1;
300
0
        sp->dec_decode = LZWDecode;
301
0
    }
302
0
    sp->lzw_nbits = BITS_MIN;
303
0
    sp->lzw_nextbits = 0;
304
0
    sp->lzw_nextdata = 0;
305
306
0
    sp->dec_restart = 0;
307
0
    sp->dec_nbitsmask = MAXCODE(BITS_MIN);
308
0
    sp->dec_bitsleft = 0;
309
0
    sp->old_tif_rawcc = 0;
310
0
    sp->dec_free_entp = sp->dec_codetab - 1; // + CODE_FIRST;
311
    /*
312
     * Zero entries that are not yet filled in.  We do
313
     * this to guard against bogus input data that causes
314
     * us to index into undefined entries.  If you can
315
     * come up with a way to safely bounds-check input codes
316
     * while decoding then you can remove this operation.
317
     */
318
0
    sp->dec_oldcodep = &sp->dec_codetab[0];
319
0
    sp->dec_maxcodep = &sp->dec_codetab[sp->dec_nbitsmask - 1];
320
0
    sp->read_error = 0;
321
0
    return (1);
322
0
}
323
324
/*
325
 * Decode a "hunk of data".
326
 */
327
328
/* Get the next 32 or 64-bit from the input data */
329
#ifdef WORDS_BIGENDIAN
330
#define GetNextData(nextdata, bp) memcpy(&nextdata, bp, sizeof(nextdata))
331
#elif SIZEOF_WORDTYPE == 8
332
#if defined(__GNUC__) && defined(__x86_64__)
333
#define GetNextData(nextdata, bp)                                              \
334
0
    nextdata = __builtin_bswap64(*(uint64_t *)(bp))
335
#elif defined(_M_X64)
336
#define GetNextData(nextdata, bp) nextdata = _byteswap_uint64(*(uint64_t *)(bp))
337
#elif defined(__GNUC__)
338
#define GetNextData(nextdata, bp)                                              \
339
    memcpy(&nextdata, bp, sizeof(nextdata));                                   \
340
    nextdata = __builtin_bswap64(nextdata)
341
#else
342
#define GetNextData(nextdata, bp)                                              \
343
    nextdata = (((uint64_t)bp[0]) << 56) | (((uint64_t)bp[1]) << 48) |         \
344
               (((uint64_t)bp[2]) << 40) | (((uint64_t)bp[3]) << 32) |         \
345
               (((uint64_t)bp[4]) << 24) | (((uint64_t)bp[5]) << 16) |         \
346
               (((uint64_t)bp[6]) << 8) | (((uint64_t)bp[7]))
347
#endif
348
#elif SIZEOF_WORDTYPE == 4
349
#if defined(__GNUC__) && defined(__i386__)
350
#define GetNextData(nextdata, bp)                                              \
351
    nextdata = __builtin_bswap32(*(uint32_t *)(bp))
352
#elif defined(_M_X86)
353
#define GetNextData(nextdata, bp)                                              \
354
    nextdata = _byteswap_ulong(*(unsigned long *)(bp))
355
#elif defined(__GNUC__)
356
#define GetNextData(nextdata, bp)                                              \
357
    memcpy(&nextdata, bp, sizeof(nextdata));                                   \
358
    nextdata = __builtin_bswap32(nextdata)
359
#else
360
#define GetNextData(nextdata, bp)                                              \
361
    nextdata = (((uint32_t)bp[0]) << 24) | (((uint32_t)bp[1]) << 16) |         \
362
               (((uint32_t)bp[2]) << 8) | (((uint32_t)bp[3]))
363
#endif
364
#else
365
#error "Unhandled SIZEOF_WORDTYPE"
366
#endif
367
368
#define GetNextCodeLZW()                                                       \
369
0
    do                                                                         \
370
0
    {                                                                          \
371
0
        nextbits -= nbits;                                                     \
372
0
        if (nextbits < 0)                                                      \
373
0
        {                                                                      \
374
0
            if (dec_bitsleft >= 8 * SIZEOF_WORDTYPE)                           \
375
0
            {                                                                  \
376
0
                unsigned codetmp = (unsigned)(nextdata << (-nextbits));        \
377
0
                GetNextData(nextdata, bp);                                     \
378
0
                bp += SIZEOF_WORDTYPE;                                         \
379
0
                nextbits += 8 * SIZEOF_WORDTYPE;                               \
380
0
                dec_bitsleft -= 8 * SIZEOF_WORDTYPE;                           \
381
0
                code = (WordType)((codetmp | (nextdata >> nextbits)) &         \
382
0
                                  nbitsmask);                                  \
383
0
                break;                                                         \
384
0
            }                                                                  \
385
0
            else                                                               \
386
0
            {                                                                  \
387
0
                if (dec_bitsleft < 8)                                          \
388
0
                {                                                              \
389
0
                    goto no_eoi;                                               \
390
0
                }                                                              \
391
0
                nextdata = (nextdata << 8) | *(bp)++;                          \
392
0
                nextbits += 8;                                                 \
393
0
                dec_bitsleft -= 8;                                             \
394
0
                if (nextbits < 0)                                              \
395
0
                {                                                              \
396
0
                    if (dec_bitsleft < 8)                                      \
397
0
                    {                                                          \
398
0
                        goto no_eoi;                                           \
399
0
                    }                                                          \
400
0
                    nextdata = (nextdata << 8) | *(bp)++;                      \
401
0
                    nextbits += 8;                                             \
402
0
                    dec_bitsleft -= 8;                                         \
403
0
                }                                                              \
404
0
            }                                                                  \
405
0
        }                                                                      \
406
0
        code = (WordType)((nextdata >> nextbits) & nbitsmask);                 \
407
0
    } while (0)
408
409
static int LZWDecode(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s)
410
0
{
411
0
    static const char module[] = "LZWDecode";
412
0
    LZWCodecState *sp = DecoderState(tif);
413
0
    uint8_t *op = (uint8_t *)op0;
414
0
    tmsize_t occ = occ0;
415
0
    uint8_t *bp;
416
0
    long nbits, nextbits, nbitsmask;
417
0
    WordType nextdata;
418
0
    code_t *free_entp, *maxcodep, *oldcodep;
419
420
0
    (void)s;
421
0
    assert(sp != NULL);
422
0
    assert(sp->dec_codetab != NULL);
423
424
0
    if (sp->read_error)
425
0
    {
426
0
        TIFFErrorExtR(tif, module,
427
0
                      "LZWDecode: Scanline %" PRIu32 " cannot be read due to "
428
0
                      "previous error",
429
0
                      tif->tif_row);
430
0
        return 0;
431
0
    }
432
433
    /*
434
     * Restart interrupted output operation.
435
     */
436
0
    if (sp->dec_restart)
437
0
    {
438
0
        tmsize_t residue;
439
440
0
        code_t *codep = sp->dec_codep;
441
0
        residue = codep->length - sp->dec_restart;
442
0
        if (residue > occ)
443
0
        {
444
            /*
445
             * Residue from previous decode is sufficient
446
             * to satisfy decode request.  Skip to the
447
             * start of the decoded string, place decoded
448
             * values in the output buffer, and return.
449
             */
450
0
            sp->dec_restart += occ;
451
0
            do
452
0
            {
453
0
                codep = codep->next;
454
0
            } while (--residue > occ && codep);
455
0
            if (codep)
456
0
            {
457
0
                uint8_t *tp = op + occ;
458
0
                do
459
0
                {
460
0
                    *--tp = codep->value;
461
0
                    codep = codep->next;
462
0
                } while (--occ && codep);
463
0
            }
464
0
            return (1);
465
0
        }
466
        /*
467
         * Residue satisfies only part of the decode request.
468
         */
469
0
        op += residue;
470
0
        occ -= residue;
471
0
        uint8_t *tp = op;
472
0
        do
473
0
        {
474
0
            *--tp = codep->value;
475
0
            codep = codep->next;
476
0
        } while (--residue && codep);
477
0
        sp->dec_restart = 0;
478
0
    }
479
480
0
    bp = (uint8_t *)tif->tif_rawcp;
481
0
    sp->dec_bitsleft += (((uint64_t)tif->tif_rawcc - sp->old_tif_rawcc) << 3);
482
0
    uint64_t dec_bitsleft = sp->dec_bitsleft;
483
0
    nbits = sp->lzw_nbits;
484
0
    nextdata = sp->lzw_nextdata;
485
0
    nextbits = sp->lzw_nextbits;
486
0
    nbitsmask = sp->dec_nbitsmask;
487
0
    oldcodep = sp->dec_oldcodep;
488
0
    free_entp = sp->dec_free_entp;
489
0
    maxcodep = sp->dec_maxcodep;
490
0
    code_t *const dec_codetab = sp->dec_codetab;
491
0
    code_t *codep;
492
493
0
    if (occ == 0)
494
0
    {
495
0
        goto after_loop;
496
0
    }
497
498
0
begin:
499
0
{
500
0
    WordType code;
501
0
    GetNextCodeLZW();
502
0
    codep = dec_codetab + code;
503
0
    if (code >= CODE_FIRST)
504
0
        goto code_above_or_equal_to_258;
505
0
    if (code < 256)
506
0
        goto code_below_256;
507
0
    if (code == CODE_EOI)
508
0
        goto after_loop;
509
0
    goto code_clear;
510
511
0
code_below_256:
512
0
{
513
0
    if (codep > free_entp)
514
0
        goto error_code;
515
0
    free_entp->next = oldcodep;
516
0
    free_entp->firstchar = oldcodep->firstchar;
517
0
    free_entp->length = oldcodep->length + 1;
518
0
    free_entp->value = (uint8_t)code;
519
0
    free_entp->repeated =
520
0
        (bool)(oldcodep->repeated & (oldcodep->value == code));
521
0
    if (++free_entp > maxcodep)
522
0
    {
523
0
        if (++nbits > BITS_MAX) /* should not happen for a conformant encoder */
524
0
            nbits = BITS_MAX;
525
0
        nbitsmask = MAXCODE(nbits);
526
0
        maxcodep = dec_codetab + nbitsmask - 1;
527
0
        if (free_entp >= &dec_codetab[CSIZE])
528
0
        {
529
            /* At that point, the next valid states are either EOI or a */
530
            /* CODE_CLEAR. If a regular code is read, at the next */
531
            /* attempt at registering a new entry, we will error out */
532
            /* due to setting free_entp before any valid code */
533
0
            free_entp = dec_codetab - 1;
534
0
        }
535
0
    }
536
0
    oldcodep = codep;
537
0
    *op++ = (uint8_t)code;
538
0
    occ--;
539
0
    if (occ == 0)
540
0
        goto after_loop;
541
0
    goto begin;
542
0
}
543
544
0
code_above_or_equal_to_258:
545
0
{
546
    /*
547
     * Add the new entry to the code table.
548
     */
549
550
0
    if (codep >= free_entp)
551
0
    {
552
0
        if (codep != free_entp)
553
0
            goto error_code;
554
0
        free_entp->value = oldcodep->firstchar;
555
0
    }
556
0
    else
557
0
    {
558
0
        free_entp->value = codep->firstchar;
559
0
    }
560
0
    free_entp->repeated =
561
0
        (bool)(oldcodep->repeated & (oldcodep->value == free_entp->value));
562
0
    free_entp->next = oldcodep;
563
564
0
    free_entp->firstchar = oldcodep->firstchar;
565
0
    free_entp->length = oldcodep->length + 1;
566
0
    if (++free_entp > maxcodep)
567
0
    {
568
0
        if (++nbits > BITS_MAX) /* should not happen for a conformant encoder */
569
0
            nbits = BITS_MAX;
570
0
        nbitsmask = MAXCODE(nbits);
571
0
        maxcodep = dec_codetab + nbitsmask - 1;
572
0
        if (free_entp >= &dec_codetab[CSIZE])
573
0
        {
574
            /* At that point, the next valid states are either EOI or a */
575
            /* CODE_CLEAR. If a regular code is read, at the next */
576
            /* attempt at registering a new entry, we will error out */
577
            /* due to setting free_entp before any valid code */
578
0
            free_entp = dec_codetab - 1;
579
0
        }
580
0
    }
581
0
    oldcodep = codep;
582
583
    /*
584
     * Code maps to a string, copy string
585
     * value to output (written in reverse).
586
     */
587
    /* tiny bit faster on x86_64 to store in unsigned short than int */
588
0
    unsigned short len = codep->length;
589
590
0
    if (len < 3) /* equivalent to len == 2 given all other conditions */
591
0
    {
592
0
        if (occ <= 2)
593
0
        {
594
0
            if (occ == 2)
595
0
            {
596
0
                memcpy(op, &(codep->firstchar), 2);
597
0
                op += 2;
598
0
                occ -= 2;
599
0
                goto after_loop;
600
0
            }
601
0
            goto too_short_buffer;
602
0
        }
603
604
0
        memcpy(op, &(codep->firstchar), 2);
605
0
        op += 2;
606
0
        occ -= 2;
607
0
        goto begin; /* we can save the comparison occ > 0 */
608
0
    }
609
610
0
    if (len == 3)
611
0
    {
612
0
        if (occ <= 3)
613
0
        {
614
0
            if (occ == 3)
615
0
            {
616
0
                op[0] = codep->firstchar;
617
0
                op[1] = codep->next->value;
618
0
                op[2] = codep->value;
619
0
                op += 3;
620
0
                occ -= 3;
621
0
                goto after_loop;
622
0
            }
623
0
            goto too_short_buffer;
624
0
        }
625
626
0
        op[0] = codep->firstchar;
627
0
        op[1] = codep->next->value;
628
0
        op[2] = codep->value;
629
0
        op += 3;
630
0
        occ -= 3;
631
0
        goto begin; /* we can save the comparison occ > 0 */
632
0
    }
633
634
0
    if (len > occ)
635
0
    {
636
0
        goto too_short_buffer;
637
0
    }
638
639
0
    if (codep->repeated)
640
0
    {
641
0
        memset(op, codep->value, len);
642
0
        op += len;
643
0
        occ -= len;
644
0
        if (occ == 0)
645
0
            goto after_loop;
646
0
        goto begin;
647
0
    }
648
649
0
    uint8_t *tp = op + len;
650
651
0
    assert(len >= 4);
652
653
0
    *--tp = codep->value;
654
0
    codep = codep->next;
655
0
    *--tp = codep->value;
656
0
    codep = codep->next;
657
0
    *--tp = codep->value;
658
0
    codep = codep->next;
659
0
    *--tp = codep->value;
660
0
    if (tp > op)
661
0
    {
662
0
        do
663
0
        {
664
0
            codep = codep->next;
665
0
            *--tp = codep->value;
666
0
        } while (tp > op);
667
0
    }
668
669
0
    assert(occ >= len);
670
0
    op += len;
671
0
    occ -= len;
672
0
    if (occ == 0)
673
0
        goto after_loop;
674
0
    goto begin;
675
0
}
676
677
0
code_clear:
678
0
{
679
0
    free_entp = dec_codetab + CODE_FIRST;
680
0
    nbits = BITS_MIN;
681
0
    nbitsmask = MAXCODE(BITS_MIN);
682
0
    maxcodep = dec_codetab + nbitsmask - 1;
683
0
    do
684
0
    {
685
0
        GetNextCodeLZW();
686
0
    } while (code == CODE_CLEAR); /* consecutive CODE_CLEAR codes */
687
0
    if (code == CODE_EOI)
688
0
        goto after_loop;
689
0
    if (code > CODE_EOI)
690
0
    {
691
0
        goto error_code;
692
0
    }
693
0
    *op++ = (uint8_t)code;
694
0
    occ--;
695
0
    oldcodep = dec_codetab + code;
696
0
    if (occ == 0)
697
0
        goto after_loop;
698
0
    goto begin;
699
0
}
700
0
}
701
702
0
too_short_buffer:
703
0
{
704
    /*
705
     * String is too long for decode buffer,
706
     * locate portion that will fit, copy to
707
     * the decode buffer, and setup restart
708
     * logic for the next decoding call.
709
     */
710
0
    sp->dec_codep = codep;
711
0
    do
712
0
    {
713
0
        codep = codep->next;
714
0
    } while (codep->length > occ);
715
716
0
    sp->dec_restart = occ;
717
0
    uint8_t *tp = op + occ;
718
0
    do
719
0
    {
720
0
        *--tp = codep->value;
721
0
        codep = codep->next;
722
0
    } while (--occ);
723
0
}
724
725
0
after_loop:
726
0
    tif->tif_rawcc -= (tmsize_t)((uint8_t *)bp - tif->tif_rawcp);
727
0
    tif->tif_rawcp = (uint8_t *)bp;
728
0
    sp->old_tif_rawcc = tif->tif_rawcc;
729
0
    sp->dec_bitsleft = dec_bitsleft;
730
0
    sp->lzw_nbits = (unsigned short)nbits;
731
0
    sp->lzw_nextdata = nextdata;
732
0
    sp->lzw_nextbits = nextbits;
733
0
    sp->dec_nbitsmask = nbitsmask;
734
0
    sp->dec_oldcodep = oldcodep;
735
0
    sp->dec_free_entp = free_entp;
736
0
    sp->dec_maxcodep = maxcodep;
737
738
0
    if (occ > 0)
739
0
    {
740
0
        TIFFErrorExtR(tif, module,
741
0
                      "Not enough data at scanline %" PRIu32 " (short %" PRIu64
742
0
                      " bytes)",
743
0
                      tif->tif_row, (uint64_t)occ);
744
0
        return (0);
745
0
    }
746
0
    return (1);
747
748
0
no_eoi:
749
0
    sp->read_error = 1;
750
0
    TIFFErrorExtR(tif, module,
751
0
                  "LZWDecode: Strip %" PRIu32 " not terminated with EOI code",
752
0
                  tif->tif_curstrip);
753
0
    return 0;
754
0
error_code:
755
0
    sp->read_error = 1;
756
0
    TIFFErrorExtR(tif, tif->tif_name, "Using code not yet in table");
757
0
    return 0;
758
0
}
759
760
#ifdef LZW_COMPAT
761
762
/*
763
 * This check shouldn't be necessary because each
764
 * strip is suppose to be terminated with CODE_EOI.
765
 */
766
#define NextCode(_tif, _sp, _bp, _code, _get, dec_bitsleft)                    \
767
0
    {                                                                          \
768
0
        if (dec_bitsleft < (uint64_t)nbits)                                    \
769
0
        {                                                                      \
770
0
            TIFFWarningExtR(_tif, module,                                      \
771
0
                            "LZWDecode: Strip %" PRIu32                        \
772
0
                            " not terminated with EOI code",                   \
773
0
                            _tif->tif_curstrip);                               \
774
0
            _code = CODE_EOI;                                                  \
775
0
        }                                                                      \
776
0
        else                                                                   \
777
0
        {                                                                      \
778
0
            _get(_sp, _bp, _code);                                             \
779
0
            dec_bitsleft -= nbits;                                             \
780
0
        }                                                                      \
781
0
    }
782
783
/*
784
 * Decode a "hunk of data" for old images.
785
 */
786
#define GetNextCodeCompat(sp, bp, code)                                        \
787
0
    {                                                                          \
788
0
        nextdata |= (unsigned long)*(bp)++ << nextbits;                        \
789
0
        nextbits += 8;                                                         \
790
0
        if (nextbits < nbits)                                                  \
791
0
        {                                                                      \
792
0
            nextdata |= (unsigned long)*(bp)++ << nextbits;                    \
793
0
            nextbits += 8;                                                     \
794
0
        }                                                                      \
795
0
        code = (hcode_t)(nextdata & nbitsmask);                                \
796
0
        nextdata >>= nbits;                                                    \
797
0
        nextbits -= nbits;                                                     \
798
0
    }
799
800
static int LZWDecodeCompat(TIFF *tif, uint8_t *op0, tmsize_t occ0, uint16_t s)
801
0
{
802
0
    static const char module[] = "LZWDecodeCompat";
803
0
    LZWCodecState *sp = DecoderState(tif);
804
0
    uint8_t *op = (uint8_t *)op0;
805
0
    tmsize_t occ = occ0;
806
0
    uint8_t *tp;
807
0
    uint8_t *bp;
808
0
    int code, nbits;
809
0
    int len;
810
0
    long nextbits, nbitsmask;
811
0
    WordType nextdata;
812
0
    code_t *codep, *free_entp, *maxcodep, *oldcodep;
813
814
0
    (void)s;
815
0
    assert(sp != NULL);
816
817
    /*
818
     * Restart interrupted output operation.
819
     */
820
0
    if (sp->dec_restart)
821
0
    {
822
0
        tmsize_t residue;
823
824
0
        codep = sp->dec_codep;
825
0
        residue = codep->length - sp->dec_restart;
826
0
        if (residue > occ)
827
0
        {
828
            /*
829
             * Residue from previous decode is sufficient
830
             * to satisfy decode request.  Skip to the
831
             * start of the decoded string, place decoded
832
             * values in the output buffer, and return.
833
             */
834
0
            sp->dec_restart += occ;
835
0
            do
836
0
            {
837
0
                codep = codep->next;
838
0
            } while (--residue > occ);
839
0
            tp = op + occ;
840
0
            do
841
0
            {
842
0
                *--tp = codep->value;
843
0
                codep = codep->next;
844
0
            } while (--occ);
845
0
            return (1);
846
0
        }
847
        /*
848
         * Residue satisfies only part of the decode request.
849
         */
850
0
        op += residue;
851
0
        occ -= residue;
852
0
        tp = op;
853
0
        do
854
0
        {
855
0
            *--tp = codep->value;
856
0
            codep = codep->next;
857
0
        } while (--residue);
858
0
        sp->dec_restart = 0;
859
0
    }
860
861
0
    bp = (uint8_t *)tif->tif_rawcp;
862
863
0
    sp->dec_bitsleft += (((uint64_t)tif->tif_rawcc - sp->old_tif_rawcc) << 3);
864
0
    uint64_t dec_bitsleft = sp->dec_bitsleft;
865
866
0
    nbits = sp->lzw_nbits;
867
0
    nextdata = sp->lzw_nextdata;
868
0
    nextbits = sp->lzw_nextbits;
869
0
    nbitsmask = sp->dec_nbitsmask;
870
0
    oldcodep = sp->dec_oldcodep;
871
0
    free_entp = sp->dec_free_entp;
872
0
    maxcodep = sp->dec_maxcodep;
873
874
0
    while (occ > 0)
875
0
    {
876
0
        NextCode(tif, sp, bp, code, GetNextCodeCompat, dec_bitsleft);
877
0
        if (code == CODE_EOI)
878
0
            break;
879
0
        if (code == CODE_CLEAR)
880
0
        {
881
0
            do
882
0
            {
883
0
                free_entp = sp->dec_codetab + CODE_FIRST;
884
0
                _TIFFmemset(free_entp, 0,
885
0
                            (CSIZE - CODE_FIRST) * sizeof(code_t));
886
0
                nbits = BITS_MIN;
887
0
                nbitsmask = MAXCODE(BITS_MIN);
888
0
                maxcodep = sp->dec_codetab + nbitsmask;
889
0
                NextCode(tif, sp, bp, code, GetNextCodeCompat, dec_bitsleft);
890
0
            } while (code == CODE_CLEAR); /* consecutive CODE_CLEAR codes */
891
0
            if (code == CODE_EOI)
892
0
                break;
893
0
            if (code > CODE_CLEAR)
894
0
            {
895
0
                TIFFErrorExtR(
896
0
                    tif, tif->tif_name,
897
0
                    "LZWDecode: Corrupted LZW table at scanline %" PRIu32,
898
0
                    tif->tif_row);
899
0
                return (0);
900
0
            }
901
0
            *op++ = (uint8_t)code;
902
0
            occ--;
903
0
            oldcodep = sp->dec_codetab + code;
904
0
            continue;
905
0
        }
906
0
        codep = sp->dec_codetab + code;
907
908
        /*
909
         * Add the new entry to the code table.
910
         */
911
0
        if (free_entp < &sp->dec_codetab[0] ||
912
0
            free_entp >= &sp->dec_codetab[CSIZE])
913
0
        {
914
0
            TIFFErrorExtR(tif, module,
915
0
                          "Corrupted LZW table at scanline %" PRIu32,
916
0
                          tif->tif_row);
917
0
            return (0);
918
0
        }
919
920
0
        free_entp->next = oldcodep;
921
0
        if (free_entp->next < &sp->dec_codetab[0] ||
922
0
            free_entp->next >= &sp->dec_codetab[CSIZE])
923
0
        {
924
0
            TIFFErrorExtR(tif, module,
925
0
                          "Corrupted LZW table at scanline %" PRIu32,
926
0
                          tif->tif_row);
927
0
            return (0);
928
0
        }
929
0
        free_entp->firstchar = free_entp->next->firstchar;
930
0
        free_entp->length = free_entp->next->length + 1;
931
0
        free_entp->value =
932
0
            (codep < free_entp) ? codep->firstchar : free_entp->firstchar;
933
0
        if (++free_entp > maxcodep)
934
0
        {
935
0
            if (++nbits > BITS_MAX) /* should not happen */
936
0
                nbits = BITS_MAX;
937
0
            nbitsmask = MAXCODE(nbits);
938
0
            maxcodep = sp->dec_codetab + nbitsmask;
939
0
        }
940
0
        oldcodep = codep;
941
0
        if (code >= 256)
942
0
        {
943
            /*
944
             * Code maps to a string, copy string
945
             * value to output (written in reverse).
946
             */
947
0
            if (codep->length == 0)
948
0
            {
949
0
                TIFFErrorExtR(
950
0
                    tif, module,
951
0
                    "Wrong length of decoded "
952
0
                    "string: data probably corrupted at scanline %" PRIu32,
953
0
                    tif->tif_row);
954
0
                return (0);
955
0
            }
956
0
            if (codep->length > occ)
957
0
            {
958
                /*
959
                 * String is too long for decode buffer,
960
                 * locate portion that will fit, copy to
961
                 * the decode buffer, and setup restart
962
                 * logic for the next decoding call.
963
                 */
964
0
                sp->dec_codep = codep;
965
0
                do
966
0
                {
967
0
                    codep = codep->next;
968
0
                } while (codep->length > occ);
969
0
                sp->dec_restart = occ;
970
0
                tp = op + occ;
971
0
                do
972
0
                {
973
0
                    *--tp = codep->value;
974
0
                    codep = codep->next;
975
0
                } while (--occ);
976
0
                break;
977
0
            }
978
0
            len = codep->length;
979
0
            tp = op + len;
980
0
            do
981
0
            {
982
0
                *--tp = codep->value;
983
0
                codep = codep->next;
984
0
            } while (codep && tp > op);
985
0
            assert(occ >= len);
986
0
            op += len;
987
0
            occ -= len;
988
0
        }
989
0
        else
990
0
        {
991
0
            *op++ = (uint8_t)code;
992
0
            occ--;
993
0
        }
994
0
    }
995
996
0
    tif->tif_rawcc -= (tmsize_t)((uint8_t *)bp - tif->tif_rawcp);
997
0
    tif->tif_rawcp = (uint8_t *)bp;
998
999
0
    sp->old_tif_rawcc = tif->tif_rawcc;
1000
0
    sp->dec_bitsleft = dec_bitsleft;
1001
1002
0
    sp->lzw_nbits = (unsigned short)nbits;
1003
0
    sp->lzw_nextdata = nextdata;
1004
0
    sp->lzw_nextbits = nextbits;
1005
0
    sp->dec_nbitsmask = nbitsmask;
1006
0
    sp->dec_oldcodep = oldcodep;
1007
0
    sp->dec_free_entp = free_entp;
1008
0
    sp->dec_maxcodep = maxcodep;
1009
1010
0
    if (occ > 0)
1011
0
    {
1012
0
        TIFFErrorExtR(tif, module,
1013
0
                      "Not enough data at scanline %" PRIu32 " (short %" PRIu64
1014
0
                      " bytes)",
1015
0
                      tif->tif_row, (uint64_t)occ);
1016
0
        return (0);
1017
0
    }
1018
0
    return (1);
1019
0
}
1020
#endif /* LZW_COMPAT */
1021
1022
/*
1023
 * LZW Encoding.
1024
 */
1025
1026
static int LZWSetupEncode(TIFF *tif)
1027
0
{
1028
0
    static const char module[] = "LZWSetupEncode";
1029
0
    LZWCodecState *sp = EncoderState(tif);
1030
1031
0
    assert(sp != NULL);
1032
0
    sp->enc_hashtab = (hash_t *)_TIFFmallocExt(tif, HSIZE * sizeof(hash_t));
1033
0
    if (sp->enc_hashtab == NULL)
1034
0
    {
1035
0
        TIFFErrorExtR(tif, module, "No space for LZW hash table");
1036
0
        return (0);
1037
0
    }
1038
0
    return (1);
1039
0
}
1040
1041
/*
1042
 * Reset encoding state at the start of a strip.
1043
 */
1044
static int LZWPreEncode(TIFF *tif, uint16_t s)
1045
0
{
1046
0
    LZWCodecState *sp = EncoderState(tif);
1047
1048
0
    (void)s;
1049
0
    assert(sp != NULL);
1050
1051
0
    if (sp->enc_hashtab == NULL)
1052
0
    {
1053
0
        tif->tif_setupencode(tif);
1054
0
    }
1055
1056
0
    sp->lzw_nbits = BITS_MIN;
1057
0
    sp->lzw_maxcode = MAXCODE(BITS_MIN);
1058
0
    sp->lzw_free_ent = CODE_FIRST;
1059
0
    sp->lzw_nextbits = 0;
1060
0
    sp->lzw_nextdata = 0;
1061
0
    sp->enc_checkpoint = CHECK_GAP;
1062
0
    sp->enc_ratio = 0;
1063
0
    sp->enc_incount = 0;
1064
0
    sp->enc_outcount = 0;
1065
    /*
1066
     * The 4 here insures there is space for 2 max-sized
1067
     * codes in LZWEncode and LZWPostDecode.
1068
     */
1069
0
    sp->enc_rawlimit = tif->tif_rawdata + tif->tif_rawdatasize - 1 - 4;
1070
0
    cl_hash(sp);                   /* clear hash table */
1071
0
    sp->enc_oldcode = (hcode_t)-1; /* generates CODE_CLEAR in LZWEncode */
1072
0
    return (1);
1073
0
}
1074
1075
#define CALCRATIO(sp, rat)                                                     \
1076
0
    {                                                                          \
1077
0
        if (incount > 0x007fffff)                                              \
1078
0
        { /* NB: shift will overflow */                                        \
1079
0
            rat = outcount >> 8;                                               \
1080
0
            rat = (rat == 0 ? 0x7fffffff : incount / rat);                     \
1081
0
        }                                                                      \
1082
0
        else                                                                   \
1083
0
            rat = (incount << 8) / outcount;                                   \
1084
0
    }
1085
1086
/* Explicit 0xff masking to make icc -check=conversions happy */
1087
#define PutNextCode(op, c)                                                     \
1088
0
    {                                                                          \
1089
0
        nextdata = (nextdata << nbits) | c;                                    \
1090
0
        nextbits += nbits;                                                     \
1091
0
        *op++ = (unsigned char)((nextdata >> (nextbits - 8)) & 0xff);          \
1092
0
        nextbits -= 8;                                                         \
1093
0
        if (nextbits >= 8)                                                     \
1094
0
        {                                                                      \
1095
0
            *op++ = (unsigned char)((nextdata >> (nextbits - 8)) & 0xff);      \
1096
0
            nextbits -= 8;                                                     \
1097
0
        }                                                                      \
1098
0
        outcount += nbits;                                                     \
1099
0
    }
1100
1101
/*
1102
 * Encode a chunk of pixels.
1103
 *
1104
 * Uses an open addressing double hashing (no chaining) on the
1105
 * prefix code/next character combination.  We do a variant of
1106
 * Knuth's algorithm D (vol. 3, sec. 6.4) along with G. Knott's
1107
 * relatively-prime secondary probe.  Here, the modular division
1108
 * first probe is gives way to a faster exclusive-or manipulation.
1109
 * Also do block compression with an adaptive reset, whereby the
1110
 * code table is cleared when the compression ratio decreases,
1111
 * but after the table fills.  The variable-length output codes
1112
 * are re-sized at this point, and a CODE_CLEAR is generated
1113
 * for the decoder.
1114
 */
1115
static int LZWEncode(TIFF *tif, uint8_t *bp, tmsize_t cc, uint16_t s)
1116
0
{
1117
0
    register LZWCodecState *sp = EncoderState(tif);
1118
0
    register long fcode;
1119
0
    register hash_t *hp;
1120
0
    register int h, c;
1121
0
    hcode_t ent;
1122
0
    long disp;
1123
0
    tmsize_t incount, outcount, checkpoint;
1124
0
    WordType nextdata;
1125
0
    long nextbits;
1126
0
    int free_ent, maxcode, nbits;
1127
0
    uint8_t *op;
1128
0
    uint8_t *limit;
1129
1130
0
    (void)s;
1131
0
    if (sp == NULL)
1132
0
        return (0);
1133
1134
0
    assert(sp->enc_hashtab != NULL);
1135
1136
    /*
1137
     * Load local state.
1138
     */
1139
0
    incount = sp->enc_incount;
1140
0
    outcount = sp->enc_outcount;
1141
0
    checkpoint = sp->enc_checkpoint;
1142
0
    nextdata = sp->lzw_nextdata;
1143
0
    nextbits = sp->lzw_nextbits;
1144
0
    free_ent = sp->lzw_free_ent;
1145
0
    maxcode = sp->lzw_maxcode;
1146
0
    nbits = sp->lzw_nbits;
1147
0
    op = tif->tif_rawcp;
1148
0
    limit = sp->enc_rawlimit;
1149
0
    ent = (hcode_t)sp->enc_oldcode;
1150
1151
0
    if (ent == (hcode_t)-1 && cc > 0)
1152
0
    {
1153
        /*
1154
         * NB: This is safe because it can only happen
1155
         *     at the start of a strip where we know there
1156
         *     is space in the data buffer.
1157
         */
1158
0
        PutNextCode(op, CODE_CLEAR);
1159
0
        ent = *bp++;
1160
0
        cc--;
1161
0
        incount++;
1162
0
    }
1163
0
    while (cc > 0)
1164
0
    {
1165
0
        c = *bp++;
1166
0
        cc--;
1167
0
        incount++;
1168
0
        fcode = ((long)c << BITS_MAX) + ent;
1169
0
        h = (c << HSHIFT) ^ ent; /* xor hashing */
1170
#ifdef _WINDOWS
1171
        /*
1172
         * Check hash index for an overflow.
1173
         */
1174
        if (h >= HSIZE)
1175
            h -= HSIZE;
1176
#endif
1177
0
        hp = &sp->enc_hashtab[h];
1178
0
        if (hp->hash == fcode)
1179
0
        {
1180
0
            ent = hp->code;
1181
0
            continue;
1182
0
        }
1183
0
        if (hp->hash >= 0)
1184
0
        {
1185
            /*
1186
             * Primary hash failed, check secondary hash.
1187
             */
1188
0
            disp = HSIZE - h;
1189
0
            if (h == 0)
1190
0
                disp = 1;
1191
0
            do
1192
0
            {
1193
                /*
1194
                 * Avoid pointer arithmetic because of
1195
                 * wraparound problems with segments.
1196
                 */
1197
0
                if ((h -= disp) < 0)
1198
0
                    h += HSIZE;
1199
0
                hp = &sp->enc_hashtab[h];
1200
0
                if (hp->hash == fcode)
1201
0
                {
1202
0
                    ent = hp->code;
1203
0
                    goto hit;
1204
0
                }
1205
0
            } while (hp->hash >= 0);
1206
0
        }
1207
        /*
1208
         * New entry, emit code and add to table.
1209
         */
1210
        /*
1211
         * Verify there is space in the buffer for the code
1212
         * and any potential Clear code that might be emitted
1213
         * below.  The value of limit is setup so that there
1214
         * are at least 4 bytes free--room for 2 codes.
1215
         */
1216
0
        if (op > limit)
1217
0
        {
1218
0
            tif->tif_rawcc = (tmsize_t)(op - tif->tif_rawdata);
1219
0
            if (!TIFFFlushData1(tif))
1220
0
                return 0;
1221
0
            op = tif->tif_rawdata;
1222
0
        }
1223
0
        PutNextCode(op, ent);
1224
0
        ent = (hcode_t)c;
1225
0
        hp->code = (hcode_t)(free_ent++);
1226
0
        hp->hash = fcode;
1227
0
        if (free_ent == CODE_MAX - 1)
1228
0
        {
1229
            /* table is full, emit clear code and reset */
1230
0
            cl_hash(sp);
1231
0
            sp->enc_ratio = 0;
1232
0
            incount = 0;
1233
0
            outcount = 0;
1234
0
            free_ent = CODE_FIRST;
1235
0
            PutNextCode(op, CODE_CLEAR);
1236
0
            nbits = BITS_MIN;
1237
0
            maxcode = MAXCODE(BITS_MIN);
1238
0
        }
1239
0
        else
1240
0
        {
1241
            /*
1242
             * If the next entry is going to be too big for
1243
             * the code size, then increase it, if possible.
1244
             */
1245
0
            if (free_ent > maxcode)
1246
0
            {
1247
0
                nbits++;
1248
0
                assert(nbits <= BITS_MAX);
1249
0
                maxcode = (int)MAXCODE(nbits);
1250
0
            }
1251
0
            else if (incount >= checkpoint)
1252
0
            {
1253
0
                tmsize_t rat;
1254
                /*
1255
                 * Check compression ratio and, if things seem
1256
                 * to be slipping, clear the hash table and
1257
                 * reset state.  The compression ratio is a
1258
                 * 24+8-bit fractional number.
1259
                 */
1260
0
                checkpoint = incount + CHECK_GAP;
1261
0
                CALCRATIO(sp, rat);
1262
0
                if (rat <= sp->enc_ratio)
1263
0
                {
1264
0
                    cl_hash(sp);
1265
0
                    sp->enc_ratio = 0;
1266
0
                    incount = 0;
1267
0
                    outcount = 0;
1268
0
                    free_ent = CODE_FIRST;
1269
0
                    PutNextCode(op, CODE_CLEAR);
1270
0
                    nbits = BITS_MIN;
1271
0
                    maxcode = MAXCODE(BITS_MIN);
1272
0
                }
1273
0
                else
1274
0
                    sp->enc_ratio = rat;
1275
0
            }
1276
0
        }
1277
0
    hit:;
1278
0
    }
1279
1280
    /*
1281
     * Restore global state.
1282
     */
1283
0
    sp->enc_incount = incount;
1284
0
    sp->enc_outcount = outcount;
1285
0
    sp->enc_checkpoint = checkpoint;
1286
0
    sp->enc_oldcode = ent;
1287
0
    sp->lzw_nextdata = nextdata;
1288
0
    sp->lzw_nextbits = nextbits;
1289
0
    sp->lzw_free_ent = (unsigned short)free_ent;
1290
0
    sp->lzw_maxcode = (unsigned short)maxcode;
1291
0
    sp->lzw_nbits = (unsigned short)nbits;
1292
0
    tif->tif_rawcp = op;
1293
0
    return (1);
1294
0
}
1295
1296
/*
1297
 * Finish off an encoded strip by flushing the last
1298
 * string and tacking on an End Of Information code.
1299
 */
1300
static int LZWPostEncode(TIFF *tif)
1301
0
{
1302
0
    register LZWCodecState *sp = EncoderState(tif);
1303
0
    uint8_t *op = tif->tif_rawcp;
1304
0
    long nextbits = sp->lzw_nextbits;
1305
0
    WordType nextdata = sp->lzw_nextdata;
1306
0
    tmsize_t outcount = sp->enc_outcount;
1307
0
    int nbits = sp->lzw_nbits;
1308
1309
0
    if (op > sp->enc_rawlimit)
1310
0
    {
1311
0
        tif->tif_rawcc = (tmsize_t)(op - tif->tif_rawdata);
1312
0
        if (!TIFFFlushData1(tif))
1313
0
            return 0;
1314
0
        op = tif->tif_rawdata;
1315
0
    }
1316
0
    if (sp->enc_oldcode != (hcode_t)-1)
1317
0
    {
1318
0
        int free_ent = sp->lzw_free_ent;
1319
1320
0
        PutNextCode(op, sp->enc_oldcode);
1321
0
        sp->enc_oldcode = (hcode_t)-1;
1322
0
        free_ent++;
1323
1324
0
        if (free_ent == CODE_MAX - 1)
1325
0
        {
1326
            /* table is full, emit clear code and reset */
1327
0
            outcount = 0;
1328
0
            PutNextCode(op, CODE_CLEAR);
1329
0
            nbits = BITS_MIN;
1330
0
        }
1331
0
        else
1332
0
        {
1333
            /*
1334
             * If the next entry is going to be too big for
1335
             * the code size, then increase it, if possible.
1336
             */
1337
0
            if (free_ent > sp->lzw_maxcode)
1338
0
            {
1339
0
                nbits++;
1340
0
                assert(nbits <= BITS_MAX);
1341
0
            }
1342
0
        }
1343
0
    }
1344
0
    PutNextCode(op, CODE_EOI);
1345
    /* Explicit 0xff masking to make icc -check=conversions happy */
1346
0
    if (nextbits > 0)
1347
0
        *op++ = (unsigned char)((nextdata << (8 - nextbits)) & 0xff);
1348
0
    tif->tif_rawcc = (tmsize_t)(op - tif->tif_rawdata);
1349
0
    (void)outcount;
1350
0
    return (1);
1351
0
}
1352
1353
/*
1354
 * Reset encoding hash table.
1355
 */
1356
static void cl_hash(LZWCodecState *sp)
1357
0
{
1358
0
    register hash_t *hp = &sp->enc_hashtab[HSIZE - 1];
1359
0
    register long i = HSIZE - 8;
1360
1361
0
    do
1362
0
    {
1363
0
        i -= 8;
1364
0
        hp[-7].hash = -1;
1365
0
        hp[-6].hash = -1;
1366
0
        hp[-5].hash = -1;
1367
0
        hp[-4].hash = -1;
1368
0
        hp[-3].hash = -1;
1369
0
        hp[-2].hash = -1;
1370
0
        hp[-1].hash = -1;
1371
0
        hp[0].hash = -1;
1372
0
        hp -= 8;
1373
0
    } while (i >= 0);
1374
0
    for (i += 8; i > 0; i--, hp--)
1375
0
        hp->hash = -1;
1376
0
}
1377
1378
static void LZWCleanup(TIFF *tif)
1379
0
{
1380
0
    (void)TIFFPredictorCleanup(tif);
1381
1382
0
    assert(tif->tif_data != 0);
1383
1384
0
    if (DecoderState(tif)->dec_codetab)
1385
0
        _TIFFfreeExt(tif, DecoderState(tif)->dec_codetab);
1386
1387
0
    if (EncoderState(tif)->enc_hashtab)
1388
0
        _TIFFfreeExt(tif, EncoderState(tif)->enc_hashtab);
1389
1390
0
    _TIFFfreeExt(tif, tif->tif_data);
1391
0
    tif->tif_data = NULL;
1392
1393
0
    _TIFFSetDefaultCompressionState(tif);
1394
0
}
1395
1396
int TIFFInitLZW(TIFF *tif, int scheme)
1397
0
{
1398
0
    static const char module[] = "TIFFInitLZW";
1399
0
    (void)scheme;
1400
0
    assert(scheme == COMPRESSION_LZW);
1401
    /*
1402
     * Allocate state block so tag methods have storage to record values.
1403
     */
1404
0
    tif->tif_data = (uint8_t *)_TIFFmallocExt(tif, sizeof(LZWCodecState));
1405
0
    if (tif->tif_data == NULL)
1406
0
        goto bad;
1407
0
    DecoderState(tif)->dec_codetab = NULL;
1408
0
    DecoderState(tif)->dec_decode = NULL;
1409
0
    EncoderState(tif)->enc_hashtab = NULL;
1410
0
    LZWState(tif)->rw_mode = tif->tif_mode;
1411
1412
    /*
1413
     * Install codec methods.
1414
     */
1415
0
    tif->tif_fixuptags = LZWFixupTags;
1416
0
    tif->tif_setupdecode = LZWSetupDecode;
1417
0
    tif->tif_predecode = LZWPreDecode;
1418
0
    tif->tif_decoderow = LZWDecode;
1419
0
    tif->tif_decodestrip = LZWDecode;
1420
0
    tif->tif_decodetile = LZWDecode;
1421
0
    tif->tif_setupencode = LZWSetupEncode;
1422
0
    tif->tif_preencode = LZWPreEncode;
1423
0
    tif->tif_postencode = LZWPostEncode;
1424
0
    tif->tif_encoderow = LZWEncode;
1425
0
    tif->tif_encodestrip = LZWEncode;
1426
0
    tif->tif_encodetile = LZWEncode;
1427
0
    tif->tif_cleanup = LZWCleanup;
1428
    /*
1429
     * Setup predictor setup.
1430
     */
1431
0
    (void)TIFFPredictorInit(tif);
1432
0
    return (1);
1433
0
bad:
1434
0
    TIFFErrorExtR(tif, module, "No space for LZW state block");
1435
0
    return (0);
1436
0
}
1437
1438
/*
1439
 * Copyright (c) 1985, 1986 The Regents of the University of California.
1440
 * All rights reserved.
1441
 *
1442
 * This code is derived from software contributed to Berkeley by
1443
 * James A. Woods, derived from original work by Spencer Thomas
1444
 * and Joseph Orost.
1445
 *
1446
 * Redistribution and use in source and binary forms are permitted
1447
 * provided that the above copyright notice and this paragraph are
1448
 * duplicated in all such forms and that any documentation,
1449
 * advertising materials, and other materials related to such
1450
 * distribution and use acknowledge that the software was developed
1451
 * by the University of California, Berkeley.  The name of the
1452
 * University may not be used to endorse or promote products derived
1453
 * from this software without specific prior written permission.
1454
 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
1455
 * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
1456
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
1457
 */
1458
#endif /* LZW_SUPPORT */