Coverage Report

Created: 2025-12-31 07:53

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libjxl/lib/jxl/icc_codec.cc
Line
Count
Source
1
// Copyright (c) the JPEG XL Project Authors. All rights reserved.
2
//
3
// Use of this source code is governed by a BSD-style
4
// license that can be found in the LICENSE file.
5
6
#include "lib/jxl/icc_codec.h"
7
8
#include <jxl/memory_manager.h>
9
10
#include <algorithm>
11
#include <cstddef>
12
#include <cstdint>
13
14
#include "lib/jxl/base/common.h"
15
#include "lib/jxl/base/status.h"
16
#include "lib/jxl/dec_ans.h"
17
#include "lib/jxl/dec_bit_reader.h"
18
#include "lib/jxl/fields.h"
19
#include "lib/jxl/icc_codec_common.h"
20
#include "lib/jxl/padded_bytes.h"
21
22
namespace jxl {
23
namespace {
24
25
// Shuffles or interleaves bytes, for example with width 2, turns "ABCDabcd"
26
// into "AaBbCcDd". Transposes a matrix of ceil(size / width) columns and
27
// width rows. There are size elements, size may be < width * height, if so the
28
// last elements of the rightmost column are missing, the missing spots are
29
// transposed along with the filled spots, and the result has the missing
30
// elements at the end of the bottom row. The input is the input matrix in
31
// scanline order but with missing elements skipped (which may occur in multiple
32
// locations), the output is the result matrix in scanline order (with
33
// no need to skip missing elements as they are past the end of the data).
34
Status Shuffle(JxlMemoryManager* memory_manager, uint8_t* data, size_t size,
35
1.89k
               size_t width) {
36
1.89k
  size_t height = (size + width - 1) / width;  // amount of rows of output
37
1.89k
  PaddedBytes result(memory_manager);
38
1.89k
  JXL_ASSIGN_OR_RETURN(result,
39
1.89k
                       PaddedBytes::WithInitialSpace(memory_manager, size));
40
  // i = output index, j input index
41
1.89k
  size_t s = 0;
42
1.89k
  size_t j = 0;
43
20.0k
  for (size_t i = 0; i < size; i++) {
44
18.1k
    result[i] = data[j];
45
18.1k
    j += height;
46
18.1k
    if (j >= size) j = ++s;
47
18.1k
  }
48
49
20.0k
  for (size_t i = 0; i < size; i++) {
50
18.1k
    data[i] = result[i];
51
18.1k
  }
52
1.89k
  return true;
53
1.89k
}
54
55
// Number of leading bytes that must be decoded before the two preamble
// VarInts can be read safely. DecodeVarInt may advance the position by up to
// 11 bytes per call, hence 2 * 11.
// TODO(eustas): should be 20, or even 18, once DecodeVarInt is improved;
//               currently DecodeVarInt does not signal the errors, and marks
//               11 bytes as used even if only 10 are used (and 9 is enough for
//               63-bit values).
constexpr size_t kPreambleSize{22};  // enough for reading 2 VarInts
60
61
24.7k
// Reads a little-endian base-128 VarInt from `input` starting at `*pos`.
// Each byte contributes its low 7 bits; a set high bit means another byte
// follows. At most 10 bytes are examined and reads never go past `inputSize`.
//
// On return `*pos` has been advanced to one past the last byte index the
// loop stopped at. This means that a truncated or overlong (10 continuation
// bytes) VarInt advances `*pos` one byte further than was actually read, and
// no error is reported; callers must bounds-check `*pos` themselves.
uint64_t DecodeVarInt(const uint8_t* input, size_t inputSize, size_t* pos) {
  constexpr size_t kMaxVarIntBytes = 10;
  const size_t start = *pos;
  uint64_t value = 0;
  size_t index = 0;
  while (index < kMaxVarIntBytes && start + index < inputSize) {
    const uint8_t byte = input[start + index];
    value |= static_cast<uint64_t>(byte & 0x7F) << (7 * index);
    // A clear continuation bit marks the final byte.
    if ((byte & 0x80) == 0) break;
    ++index;
  }
  // TODO(user): Return a decoding error if index == kMaxVarIntBytes.
  *pos = start + index + 1;
  return value;
}
74
75
}  // namespace
76
77
// Mimics the beginning of UnpredictICC for quick validity check.
78
// At least kPreambleSize bytes of data should be valid at invocation time.
79
4.19k
Status CheckPreamble(const PaddedBytes& data, size_t enc_size) {
80
4.19k
  const uint8_t* enc = data.data();
81
4.19k
  size_t size = data.size();
82
4.19k
  size_t pos = 0;
83
4.19k
  uint64_t osize = DecodeVarInt(enc, size, &pos);
84
4.19k
  JXL_RETURN_IF_ERROR(CheckIs32Bit(osize));
85
4.16k
  if (pos >= size) return JXL_FAILURE("Out of bounds");
86
4.16k
  uint64_t csize = DecodeVarInt(enc, size, &pos);
87
4.16k
  JXL_RETURN_IF_ERROR(CheckIs32Bit(csize));
88
4.15k
  JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, csize, size));
89
  // We expect that UnpredictICC inflates input, not the other way round.
90
4.11k
  if (osize + 65536 < enc_size) return JXL_FAILURE("Malformed ICC");
91
92
  // NB(eustas): 64 MiB ICC should be enough for everything!?
93
4.04k
  const size_t output_limit = 1 << 28;
94
4.04k
  if (output_limit && osize > output_limit) {
95
12
    return JXL_FAILURE("Decoded ICC is too large");
96
12
  }
97
4.03k
  return true;
98
4.04k
}
99
100
// Decodes the result of PredictICC back to a valid ICC profile.
//
// enc/size: the encoded stream. As read below, it consists of two VarInts
//           (output size, command-stream size), followed by the command
//           stream, followed by the data stream.
// result:   receives the decoded profile; must be empty on entry.
//
// Two cursors are advanced independently: `cpos` walks the command stream and
// `pos` walks the data stream. Decoding succeeds only if both streams are
// consumed exactly and the output has exactly the declared size.
Status UnpredictICC(const uint8_t* enc, size_t size, PaddedBytes* result) {
  if (!result->empty()) return JXL_FAILURE("result must be empty initially");
  JxlMemoryManager* memory_manager = result->memory_manager();
  size_t pos = 0;
  // TODO(lode): technically speaking we need to check that the entire varint
  // decoding never goes out of bounds, not just the first byte. This requires
  // a DecodeVarInt function that returns an error code. It is safe to use
  // DecodeVarInt with out of bounds values, it silently returns, but the
  // specification requires an error. Idem for all DecodeVarInt below.
  if (pos >= size) return JXL_FAILURE("Out of bounds");
  uint64_t osize = DecodeVarInt(enc, size, &pos);  // Output size
  JXL_RETURN_IF_ERROR(CheckIs32Bit(osize));
  if (pos >= size) return JXL_FAILURE("Out of bounds");
  uint64_t csize = DecodeVarInt(enc, size, &pos);  // Commands size
  // Every command is translated to at least one byte.
  JXL_RETURN_IF_ERROR(CheckIs32Bit(csize));
  size_t cpos = pos;  // pos in commands stream
  JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, csize, size));
  size_t commands_end = cpos + csize;
  pos = commands_end;  // pos in data stream

  // Header
  // Each header byte is stored as a difference from a predicted value; the
  // prediction for byte i is refreshed from the bytes decoded so far.
  PaddedBytes header{memory_manager};
  JXL_RETURN_IF_ERROR(header.append(ICCInitialHeaderPrediction(osize)));
  // The loop runs one extra iteration (i == kICCHeaderSize) so that the
  // "output complete" check is also performed after the last header byte.
  for (size_t i = 0; i <= kICCHeaderSize; i++) {
    if (result->size() == osize) {
      // The profile may end inside or right after the header; in that case
      // both streams must already be exhausted.
      if (cpos != commands_end) return JXL_FAILURE("Not all commands used");
      if (pos != size) return JXL_FAILURE("Not all data used");
      return true;  // Valid end
    }
    if (i == kICCHeaderSize) break;  // Done
    ICCPredictHeader(result->data(), result->size(), header.data(), i);
    if (pos >= size) return JXL_FAILURE("Out of bounds");
    JXL_RETURN_IF_ERROR(result->push_back(enc[pos++] + header[i]));
  }
  if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");

  // Tag list
  // The tag count is stored plus one; a stored value of 0 means there is no
  // tag list at all.
  uint64_t numtags = DecodeVarInt(enc, size, &cpos);

  if (numtags != 0) {
    numtags--;
    JXL_RETURN_IF_ERROR(CheckIs32Bit(numtags));
    JXL_RETURN_IF_ERROR(AppendUint32(numtags, result));
    // Default start for the first tag: header size plus 12 bytes per tag
    // (presumably the offset just past the tag table; confirm against the
    // ICC tag-table layout).
    uint64_t prevtagstart = kICCHeaderSize + numtags * 12;
    uint64_t prevtagsize = 0;
    for (;;) {
      if (result->size() > osize) return JXL_FAILURE("Invalid result size");
      if (cpos > commands_end) return JXL_FAILURE("Out of bounds");
      if (cpos == commands_end) break;  // Valid end
      // Low 6 bits select the tag; the remaining bits are the
      // kFlagBitOffset / kFlagBitSize flags tested below.
      uint8_t command = enc[cpos++];
      uint8_t tagcode = command & 63;
      Tag tag;
      if (tagcode == 0) {
        // Tag code 0 terminates the tag list.
        break;
      } else if (tagcode == kCommandTagUnknown) {
        // Unknown tag: its 4-byte keyword is taken from the data stream.
        JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, 4, size));
        tag = DecodeKeyword(enc, size, pos);
        pos += 4;
      } else if (tagcode == kCommandTagTRC) {
        // First of a group of three entries; the other two are appended
        // further below.
        tag = kRtrcTag;
      } else if (tagcode == kCommandTagXYZ) {
        // First of a group of three entries; the other two are appended
        // further below.
        tag = kRxyzTag;
      } else {
        // Remaining codes index the table of predefined tag keywords.
        if (tagcode - kCommandTagStringFirst >= kNumTagStrings) {
          return JXL_FAILURE("Unknown tagcode");
        }
        tag = *kTagStrings[tagcode - kCommandTagStringFirst];
      }
      JXL_RETURN_IF_ERROR(AppendKeyword(tag, result));

      uint64_t tagstart;
      // Size defaults to the previous tag's size, or to 20 for the tags
      // listed here.
      uint64_t tagsize = prevtagsize;
      if (tag == kRxyzTag || tag == kGxyzTag || tag == kBxyzTag ||
          tag == kKxyzTag || tag == kWtptTag || tag == kBkptTag ||
          tag == kLumiTag) {
        tagsize = 20;
      }

      if (command & kFlagBitOffset) {
        // Explicit start offset stored in the command stream.
        if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");
        tagstart = DecodeVarInt(enc, size, &cpos);
      } else {
        // Implicit start: directly after the previous tag's data.
        JXL_RETURN_IF_ERROR(CheckIs32Bit(prevtagstart));
        tagstart = prevtagstart + prevtagsize;
      }
      JXL_RETURN_IF_ERROR(CheckIs32Bit(tagstart));
      JXL_RETURN_IF_ERROR(AppendUint32(tagstart, result));
      if (command & kFlagBitSize) {
        // Explicit size stored in the command stream.
        if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");
        tagsize = DecodeVarInt(enc, size, &cpos);
      }
      JXL_RETURN_IF_ERROR(CheckIs32Bit(tagsize));
      JXL_RETURN_IF_ERROR(AppendUint32(tagsize, result));
      prevtagstart = tagstart;
      prevtagsize = tagsize;

      if (tagcode == kCommandTagTRC) {
        // The G and B entries share the start and size of the R entry.
        JXL_RETURN_IF_ERROR(AppendKeyword(kGtrcTag, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagstart, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagsize, result));
        JXL_RETURN_IF_ERROR(AppendKeyword(kBtrcTag, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagstart, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagsize, result));
      }

      if (tagcode == kCommandTagXYZ) {
        // The G and B entries follow the R entry back to back:
        // tagstart + tagsize and tagstart + 2 * tagsize.
        JXL_RETURN_IF_ERROR(CheckIs32Bit(tagstart + tagsize * 2));
        JXL_RETURN_IF_ERROR(AppendKeyword(kGxyzTag, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagstart + tagsize, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagsize, result));
        JXL_RETURN_IF_ERROR(AppendKeyword(kBxyzTag, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagstart + tagsize * 2, result));
        JXL_RETURN_IF_ERROR(AppendUint32(tagsize, result));
      }
    }
  }

  // Main Content
  // One command per iteration until the command stream is exhausted.
  for (;;) {
    if (result->size() > osize) return JXL_FAILURE("Invalid result size");
    if (cpos > commands_end) return JXL_FAILURE("Out of bounds");
    if (cpos == commands_end) break;  // Valid end
    uint8_t command = enc[cpos++];
    if (command == kCommandInsert) {
      // Copy `num` bytes verbatim from the data stream.
      if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");
      uint64_t num = DecodeVarInt(enc, size, &cpos);
      JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, num, size));
      for (size_t i = 0; i < num; i++) {
        JXL_RETURN_IF_ERROR(result->push_back(enc[pos++]));
      }
    } else if (command == kCommandShuffle2 || command == kCommandShuffle4) {
      // Take `num` bytes from the data stream, run Shuffle on them with
      // width 2 or 4, then append the result.
      if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");
      uint64_t num = DecodeVarInt(enc, size, &cpos);
      JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, num, size));
      PaddedBytes shuffled(memory_manager);
      JXL_ASSIGN_OR_RETURN(shuffled,
                           PaddedBytes::WithInitialSpace(memory_manager, num));
      for (size_t i = 0; i < num; i++) {
        shuffled[i] = enc[pos + i];
      }
      if (command == kCommandShuffle2) {
        JXL_RETURN_IF_ERROR(Shuffle(memory_manager, shuffled.data(), num, 2));
      } else if (command == kCommandShuffle4) {
        JXL_RETURN_IF_ERROR(Shuffle(memory_manager, shuffled.data(), num, 4));
      }
      for (size_t i = 0; i < num; i++) {
        JXL_RETURN_IF_ERROR(result->push_back(shuffled[i]));
        pos++;
      }
    } else if (command == kCommandPredict) {
      // Needs at least the flags byte plus one more command byte.
      JXL_RETURN_IF_ERROR(CheckOutOfBounds(cpos, 2, commands_end));
      uint8_t flags = enc[cpos++];

      // Flag bits 0-1: width - 1 (a width of 3 is rejected).
      size_t width = (flags & 3) + 1;
      if (width == 3) return JXL_FAILURE("Invalid width");

      // Flag bits 2-3: predictor order (3 is rejected).
      int order = (flags & 12) >> 2;
      if (order == 3) return JXL_FAILURE("Invalid order");

      // Flag bit 4: an explicit stride follows; otherwise stride == width.
      uint64_t stride = width;
      if (flags & 16) {
        if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");
        stride = DecodeVarInt(enc, size, &cpos);
        if (stride < width) {
          return JXL_FAILURE("Invalid stride");
        }
      }
      // If stride * 4 >= result->size(), return failure. The check
      // "size == 0 || ((size - 1) >> 2) < stride" corresponds to
      // "stride * 4 >= size", but does not suffer from integer overflow.
      // This check is more strict than necessary but follows the specification
      // and the encoder should ensure this is followed.
      if (result->empty() || ((result->size() - 1u) >> 2u) < stride) {
        return JXL_FAILURE("Invalid stride");
      }

      if (cpos >= commands_end) return JXL_FAILURE("Out of bounds");
      uint64_t num = DecodeVarInt(enc, size, &cpos);  // in bytes
      JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, num, size));

      // Residuals are taken from the data stream and, for multi-byte
      // widths, passed through Shuffle first.
      PaddedBytes shuffled(memory_manager);
      JXL_ASSIGN_OR_RETURN(shuffled,
                           PaddedBytes::WithInitialSpace(memory_manager, num));

      for (size_t i = 0; i < num; i++) {
        shuffled[i] = enc[pos + i];
      }
      if (width > 1) {
        JXL_RETURN_IF_ERROR(
            Shuffle(memory_manager, shuffled.data(), num, width));
      }

      // Each output byte is the prediction plus the residual; predictions
      // are computed from the output produced so far, so the bytes must be
      // appended one at a time.
      size_t start = result->size();
      for (size_t i = 0; i < num; i++) {
        uint8_t predicted = LinearPredictICCValue(result->data(), start, i,
                                                  stride, width, order);
        JXL_RETURN_IF_ERROR(result->push_back(predicted + shuffled[i]));
      }
      pos += num;
    } else if (command == kCommandXYZ) {
      // Emits the kXyz_Tag keyword, four zero bytes, then 12 bytes copied
      // from the data stream.
      JXL_RETURN_IF_ERROR(AppendKeyword(kXyz_Tag, result));
      for (int i = 0; i < 4; i++) {
        JXL_RETURN_IF_ERROR(result->push_back(0));
      }
      JXL_RETURN_IF_ERROR(CheckOutOfBounds(pos, 12, size));
      for (size_t i = 0; i < 12; i++) {
        JXL_RETURN_IF_ERROR(result->push_back(enc[pos++]));
      }
    } else if (command >= kCommandTypeStartFirst &&
               command < kCommandTypeStartFirst + kNumTypeStrings) {
      // Emits a predefined type keyword followed by four zero bytes.
      JXL_RETURN_IF_ERROR(AppendKeyword(
          *kTypeStrings[command - kCommandTypeStartFirst], result));
      for (size_t i = 0; i < 4; i++) {
        JXL_RETURN_IF_ERROR(result->push_back(0));
      }
    } else {
      return JXL_FAILURE("Unknown command");
    }
  }

  // Both the data stream and the declared output size must match exactly.
  if (pos != size) return JXL_FAILURE("Not all data used");
  if (result->size() != osize) return JXL_FAILURE("Invalid result size");

  return true;
}
327
328
38.7k
// Starts (or resumes) reading an entropy-coded ICC stream from `reader`.
//
// On the first call (bits_to_skip_ == 0) this reads the encoded size and the
// histograms, creates the ANS reader, decodes the first bytes of the stream
// and, when the stream is longer than kPreambleSize, validates its preamble.
// The number of bits consumed is stored in bits_to_skip_; a later call with a
// non-zero bits_to_skip_ only skips that many bits.
Status ICCReader::Init(BitReader* reader) {
  // Same value as the literal used for the output-size cap: 1 << 28.
  constexpr int kMaxEncodedSize = 268435456;
  constexpr size_t kInitialChunk = 0x400;

  JXL_RETURN_IF_ERROR(CheckEOI(reader));
  JxlMemoryManager* memory_manager = decompressed_.memory_manager();
  used_bits_base_ = reader->TotalBitsConsumed();

  if (bits_to_skip_ != 0) {
    // Already initialized earlier: just move past the consumed bits.
    reader->SkipBits(bits_to_skip_);
    return true;
  }

  enc_size_ = U64Coder::Read(reader);
  if (enc_size_ > kMaxEncodedSize) {
    // Avoid too large memory allocation for invalid file.
    return JXL_FAILURE("Too large encoded profile");
  }
  JXL_RETURN_IF_ERROR(DecodeHistograms(memory_manager, reader, kNumICCContexts,
                                       &code_, &context_map_));
  JXL_ASSIGN_OR_RETURN(ans_reader_, ANSSymbolReader::Create(&code_, reader));
  i_ = 0;
  JXL_RETURN_IF_ERROR(
      decompressed_.resize(std::min<size_t>(i_ + kInitialChunk, enc_size_)));

  // The first two bytes have fewer than two predecessors; missing context
  // bytes are replaced by 0.
  while (i_ < std::min<size_t>(2, enc_size_)) {
    decompressed_[i_] = ans_reader_.ReadHybridUint(
        ICCANSContext(i_, i_ > 0 ? decompressed_[i_ - 1] : 0,
                      i_ > 1 ? decompressed_[i_ - 2] : 0),
        reader, context_map_);
    i_++;
  }

  if (enc_size_ > kPreambleSize) {
    // Decode enough bytes for the two preamble VarInts, then sanity-check
    // them before any further work is done.
    while (i_ < kPreambleSize) {
      decompressed_[i_] = ans_reader_.ReadHybridUint(
          ICCANSContext(i_, decompressed_[i_ - 1], decompressed_[i_ - 2]),
          reader, context_map_);
      i_++;
    }
    JXL_RETURN_IF_ERROR(CheckEOI(reader));
    JXL_RETURN_IF_ERROR(CheckPreamble(decompressed_, enc_size_));
  }

  bits_to_skip_ = reader->TotalBitsConsumed() - used_bits_base_;
  return true;
}
365
366
13.5k
// Decodes the remaining bytes of the encoded ICC stream and, once all
// enc_size_ bytes are available, reconstructs the profile into `icc`.
//
// The ANS reader state, i_ and bits_to_skip_ are checkpointed on entry and
// every ANSSymbolReader::kMaxCheckpointInterval bytes. If the bit reader is
// found to have run past its input, the last checkpoint is restored and the
// "not enough bytes" status is returned.
Status ICCReader::Process(BitReader* reader, PaddedBytes* icc) {
  auto snapshot = jxl::make_unique<ANSSymbolReader::Checkpoint>();
  size_t snapshot_i = 0;

  // Records the current decoder state as the point to resume from.
  const auto take_snapshot = [&]() {
    ans_reader_.Save(snapshot.get());
    bits_to_skip_ = reader->TotalBitsConsumed() - used_bits_base_;
    snapshot_i = i_;
  };

  // Returns OK if all reads so far were within bounds; otherwise rolls back
  // to the last snapshot and returns the failure status.
  const auto verify_or_rollback = [&]() -> Status {
    Status eoi_status = CheckEOI(reader);
    if (eoi_status) return true;
    // not enough bytes.
    ans_reader_.Restore(*snapshot);
    i_ = snapshot_i;
    return eoi_status;
  };

  take_snapshot();

  while (i_ < enc_size_) {
    const bool at_checkpoint =
        i_ > 0 && i_ % ANSSymbolReader::kMaxCheckpointInterval == 0;
    if (at_checkpoint) {
      JXL_RETURN_IF_ERROR(verify_or_rollback());
      take_snapshot();
      // Every 0x10000 bytes, reject streams that produced more than 256
      // output bytes per input byte consumed (i_ is known to be > 0 here).
      if ((i_ & 0xFFFF) == 0) {
        float used_bytes =
            (reader->TotalBitsConsumed() - used_bits_base_) / 8.0f;
        if (i_ > used_bytes * 256) return JXL_FAILURE("Corrupted stream");
      }
      // Grow the buffer ahead of the write position, capped at enc_size_.
      JXL_RETURN_IF_ERROR(
          decompressed_.resize(std::min<size_t>(i_ + 0x400, enc_size_)));
    }
    // The context below reads the two previously decoded bytes.
    JXL_ENSURE(i_ >= 2);
    decompressed_[i_] = ans_reader_.ReadHybridUint(
        ICCANSContext(i_, decompressed_[i_ - 1], decompressed_[i_ - 2]), reader,
        context_map_);
    i_++;
  }

  JXL_RETURN_IF_ERROR(verify_or_rollback());
  bits_to_skip_ = reader->TotalBitsConsumed() - used_bits_base_;
  if (!ans_reader_.CheckANSFinalState()) {
    return JXL_FAILURE("Corrupted ICC profile");
  }

  icc->clear();
  return UnpredictICC(decompressed_.data(), decompressed_.size(), icc);
}
411
412
87.8k
// Reports whether `reader` has stayed within its input so far. Returns OK if
// so, and a "not enough bytes" status otherwise.
Status ICCReader::CheckEOI(BitReader* reader) {
  if (!reader->AllReadsWithinBounds()) {
    return JXL_NOT_ENOUGH_BYTES("Not enough bytes for reading ICC profile");
  }
  return true;
}
416
417
}  // namespace jxl