Coverage Report

Created: 2025-12-31 06:23

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/brunsli/c/dec/brunsli_decode.cc
Line
Count
Source
1
// Copyright (c) Google LLC 2019
2
//
3
// Use of this source code is governed by an MIT-style
4
// license that can be found in the LICENSE file or at
5
// https://opensource.org/licenses/MIT.
6
7
#include <brunsli/brunsli_decode.h>
8
9
#include <algorithm>
10
#include <cstdlib>
11
#include <cstring>
12
#include <iterator>
13
#include <string>
14
#include <vector>
15
16
#include <brotli/decode.h>
17
#include "../common/constants.h"
18
#include "../common/context.h"
19
#include <brunsli/jpeg_data.h>
20
#include "../common/lehmer_code.h"
21
#include "../common/platform.h"
22
#include "../common/predict.h"
23
#include "../common/quant_matrix.h"
24
#include <brunsli/status.h>
25
#include <brunsli/types.h>
26
#include "./ans_decode.h"
27
#include "./arith_decode.h"
28
#include "./bit_reader.h"
29
#include "./brunsli_input.h"
30
#include "./context_map_decode.h"
31
#include "./histogram_decode.h"
32
#include "./huffman_table.h"
33
#include <brunsli/jpeg_data_writer.h>
34
#include "./state.h"
35
#include "./state_internal.h"
36
37
namespace brunsli {
38
39
using ::brunsli::internal::dec::AcDcState;
40
using ::brunsli::internal::dec::BlockI32;
41
using ::brunsli::internal::dec::Buffer;
42
using ::brunsli::internal::dec::ComponentMeta;
43
using ::brunsli::internal::dec::FallbackState;
44
using ::brunsli::internal::dec::HeaderState;
45
using ::brunsli::internal::dec::HistogramDataState;
46
using ::brunsli::internal::dec::InternalState;
47
using ::brunsli::internal::dec::JpegInternalsState;
48
using ::brunsli::internal::dec::MetadataDecompressionStage;
49
using ::brunsli::internal::dec::MetadataState;
50
using ::brunsli::internal::dec::PrepareMeta;
51
using ::brunsli::internal::dec::QuantDataState;
52
using ::brunsli::internal::dec::SectionHeaderState;
53
using ::brunsli::internal::dec::SectionState;
54
using ::brunsli::internal::dec::SerializationStatus;
55
using ::brunsli::internal::dec::Stage;
56
using ::brunsli::internal::dec::State;
57
using ::brunsli::internal::dec::UpdateSubsamplingDerivatives;
58
using ::brunsli::internal::dec::VarintState;
59
60
static const int kNumDirectCodes = 8;
61
static const int kCoeffAlphabetSize = kNumDirectCodes + 10;
62
63
static const uint32_t kKnownSectionTags =
64
    (1u << kBrunsliSignatureTag) | (1u << kBrunsliHeaderTag) |
65
    (1u << kBrunsliMetaDataTag) | (1u << kBrunsliJPEGInternalsTag) |
66
    (1u << kBrunsliQuantDataTag) | (1u << kBrunsliHistogramDataTag) |
67
    (1u << kBrunsliDCDataTag) | (1u << kBrunsliACDataTag) |
68
    (1u << kBrunsliOriginalJpgTag);
69
70
static const uint32_t kKnownHeaderVarintTags =
71
    (1u << kBrunsliHeaderWidthTag) | (1u << kBrunsliHeaderHeightTag) |
72
    (1u << kBrunsliHeaderVersionCompTag) | (1u << kBrunsliHeaderSubsamplingTag);
73
74
0
bool IsBrunsli(const uint8_t* data, const size_t len) {
75
0
  static const uint8_t kSignature[6] = {
76
0
      /* marker */ 0x0A,
77
0
      /* length */ 0x04, 0x42, 0xD2, 0xD5, 0x4E};
78
0
  static const size_t kSignatureLen = sizeof(kSignature);
79
0
  if (len < kSignatureLen) return false;
80
0
  return (memcmp(kSignature, data, kSignatureLen) == 0);
81
0
}
82
83
// Returns ceil(a/b).
84
32.5k
inline int DivCeil(int a, int b) { return (a + b - 1) / b; }
85
86
// Decodes a number in the range [0..255], by reading 1 - 11 bits.
87
7.36k
inline uint32_t DecodeVarLenUint8(BrunsliBitReader* br) {
88
7.36k
  if (BrunsliBitReaderRead(br, 1)) {
89
1.29k
    uint32_t nbits = BrunsliBitReaderRead(br, 3);
90
1.29k
    if (nbits == 0) {
91
614
      return 1u;
92
681
    } else {
93
681
      return BrunsliBitReaderRead(br, nbits) + (1u << nbits);
94
681
    }
95
1.29k
  }
96
6.06k
  return 0;
97
7.36k
}
98
99
66.1k
bool DecodeVarint(VarintState* s, BrunsliBitReader* br, size_t max_bits) {
100
66.1k
  if (s->stage == VarintState::INIT) {
101
66.1k
    s->value = 0;
102
66.1k
    s->i = 0;
103
66.1k
    s->stage = VarintState::READ_CONTINUATION;
104
66.1k
  }
105
106
224k
  while (true) {
107
224k
    switch (s->stage) {
108
145k
      case VarintState::READ_CONTINUATION: {
109
145k
        if (s->i >= max_bits) {
110
609
          s->stage = VarintState::INIT;
111
609
          return true;
112
609
        }
113
144k
        if (s->i + 1 != max_bits) {
114
144k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
115
144k
          if (!BrunsliBitReaderRead(br, 1)) {
116
65.2k
            s->stage = VarintState::INIT;
117
65.2k
            return true;
118
65.2k
          }
119
144k
        }
120
79.3k
        s->stage = VarintState::READ_DATA;
121
79.3k
        continue;
122
144k
      }
123
79.3k
      case VarintState::READ_DATA: {
124
79.3k
        if (!BrunsliBitReaderCanRead(br, 1)) return false;
125
79.2k
        size_t next_bit = BrunsliBitReaderRead(br, 1);
126
79.2k
        s->value |= next_bit << s->i;
127
79.2k
        ++s->i;
128
79.2k
        s->stage = VarintState::READ_CONTINUATION;
129
79.2k
        continue;
130
79.3k
      }
131
0
      default: {
132
0
        BRUNSLI_CHECK(false);
133
0
        return false;
134
79.3k
      }
135
224k
    }
136
224k
  }
137
66.1k
}
138
139
template <size_t kChunkSize>
140
bool DecodeLimitedVarint(VarintState* s, BrunsliBitReader* br,
141
93.9k
                         size_t max_symbols) {
142
93.9k
  if (s->stage == VarintState::INIT) {
143
93.9k
    s->value = 0;
144
93.9k
    s->i = 0;
145
93.9k
    s->stage = VarintState::READ_CONTINUATION;
146
93.9k
  }
147
134k
  while (true) {
148
134k
    switch (s->stage) {
149
114k
      case VarintState::READ_CONTINUATION: {
150
114k
        if (s->i < max_symbols) {
151
111k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
111k
          if (BrunsliBitReaderRead(br, 1)) {
153
20.1k
            s->stage = VarintState::READ_DATA;
154
20.1k
            continue;
155
20.1k
          }
156
111k
        }
157
93.7k
        s->stage = VarintState::INIT;
158
93.7k
        return true;
159
114k
      }
160
20.1k
      case VarintState::READ_DATA: {
161
20.1k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
20.0k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
20.0k
        s->value |= next_bits << (s->i * kChunkSize);
164
20.0k
        ++s->i;
165
20.0k
        s->stage = VarintState::READ_CONTINUATION;
166
20.0k
        continue;
167
20.1k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
20.1k
      }
172
134k
    }
173
134k
  }
174
93.9k
}
bool brunsli::DecodeLimitedVarint<2ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
83.8k
                         size_t max_symbols) {
142
83.8k
  if (s->stage == VarintState::INIT) {
143
83.8k
    s->value = 0;
144
83.8k
    s->i = 0;
145
83.8k
    s->stage = VarintState::READ_CONTINUATION;
146
83.8k
  }
147
122k
  while (true) {
148
122k
    switch (s->stage) {
149
103k
      case VarintState::READ_CONTINUATION: {
150
103k
        if (s->i < max_symbols) {
151
101k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
101k
          if (BrunsliBitReaderRead(br, 1)) {
153
19.3k
            s->stage = VarintState::READ_DATA;
154
19.3k
            continue;
155
19.3k
          }
156
101k
        }
157
83.8k
        s->stage = VarintState::INIT;
158
83.8k
        return true;
159
103k
      }
160
19.3k
      case VarintState::READ_DATA: {
161
19.3k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
19.3k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
19.3k
        s->value |= next_bits << (s->i * kChunkSize);
164
19.3k
        ++s->i;
165
19.3k
        s->stage = VarintState::READ_CONTINUATION;
166
19.3k
        continue;
167
19.3k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
19.3k
      }
172
122k
    }
173
122k
  }
174
83.8k
}
bool brunsli::DecodeLimitedVarint<8ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
10.0k
                         size_t max_symbols) {
142
10.0k
  if (s->stage == VarintState::INIT) {
143
10.0k
    s->value = 0;
144
10.0k
    s->i = 0;
145
10.0k
    s->stage = VarintState::READ_CONTINUATION;
146
10.0k
  }
147
11.4k
  while (true) {
148
11.4k
    switch (s->stage) {
149
10.7k
      case VarintState::READ_CONTINUATION: {
150
10.7k
        if (s->i < max_symbols) {
151
10.7k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
10.6k
          if (BrunsliBitReaderRead(br, 1)) {
153
732
            s->stage = VarintState::READ_DATA;
154
732
            continue;
155
732
          }
156
10.6k
        }
157
9.97k
        s->stage = VarintState::INIT;
158
9.97k
        return true;
159
10.7k
      }
160
732
      case VarintState::READ_DATA: {
161
732
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
704
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
704
        s->value |= next_bits << (s->i * kChunkSize);
164
704
        ++s->i;
165
704
        s->stage = VarintState::READ_CONTINUATION;
166
704
        continue;
167
732
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
732
      }
172
11.4k
    }
173
11.4k
  }
174
10.0k
}
175
176
11.2k
std::vector<uint8_t> GenerateApp0Marker(uint8_t app0_status) {
177
11.2k
  std::vector<uint8_t> app0_marker(AppData_0xe0, AppData_0xe0 + 17);
178
11.2k
  app0_marker[9] = app0_status & 1u ? 2 : 1;
179
11.2k
  app0_status >>= 1u;
180
11.2k
  app0_marker[10] = app0_status & 0x3u;
181
11.2k
  app0_status >>= 2u;
182
11.2k
  uint16_t x_dens = kApp0Densities[app0_status];
183
11.2k
  app0_marker[11] = app0_marker[13] = x_dens >> 8u;
184
11.2k
  app0_marker[12] = app0_marker[14] = x_dens & 0xFFu;
185
11.2k
  return app0_marker;
186
11.2k
}
187
188
2.31k
std::vector<uint8_t> GenerateAppMarker(uint8_t marker, uint8_t code) {
189
2.31k
  std::vector<uint8_t> s;
190
2.31k
  if (marker == 0x80) {
191
1.77k
    s = std::vector<uint8_t>(AppData_0xe2, AppData_0xe2 + 3161);
192
1.77k
    s[84] = code;
193
1.77k
  } else if (marker == 0x81) {
194
311
    s = std::vector<uint8_t>(AppData_0xec, AppData_0xec + 18);
195
311
    s[15] = code;
196
311
  } else {
197
232
    BRUNSLI_DCHECK(marker == 0x82);
198
232
    s = std::vector<uint8_t>(AppData_0xee, AppData_0xee + 15);
199
232
    s[10] = code;
200
232
  }
201
2.31k
  return s;
202
2.31k
}
203
204
bool ProcessMetaData(const uint8_t* data, size_t len, MetadataState* state,
205
221k
                     JPEGData* jpg) {
206
221k
  size_t pos = 0;
207
540k
  while (pos < len) {
208
319k
    switch (state->stage) {
209
35.5k
      case MetadataState::READ_MARKER: {
210
35.5k
        state->marker = static_cast<uint8_t>(data[pos++]);
211
35.5k
        if (state->marker == 0xD9) {
212
163
          jpg->tail_data = std::vector<uint8_t>();
213
163
          state->stage = MetadataState::READ_TAIL;
214
163
          continue;
215
35.4k
        } else if (state->marker < 0x40) {
216
11.2k
          state->short_marker_count++;
217
11.2k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
218
6
            return false;
219
6
          }
220
11.2k
          jpg->app_data.push_back(GenerateApp0Marker(state->marker));
221
11.2k
          continue;
222
24.1k
        } else if (state->marker >= 0x80 && state->marker <= 0x82) {
223
2.33k
          state->short_marker_count++;
224
2.33k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
225
1
            return false;
226
1
          }
227
2.33k
          state->stage = MetadataState::READ_CODE;
228
2.33k
          continue;
229
2.33k
        }
230
        // Otherwise - mutlibyte sequence.
231
21.8k
        if ((state->marker != 0xFE) && ((state->marker >> 4u) != 0x0E)) {
232
158
          return false;
233
158
        }
234
21.6k
        state->stage = MetadataState::READ_LENGTH_HI;
235
21.6k
        continue;
236
21.8k
      }
237
238
37.2k
      case MetadataState::READ_TAIL: {
239
37.2k
        Append(&jpg->tail_data, data + pos, data + len);
240
37.2k
        pos = len;
241
37.2k
        continue;
242
21.8k
      }
243
244
2.31k
      case MetadataState::READ_CODE: {
245
2.31k
        const uint8_t code = data[pos++];
246
2.31k
        jpg->app_data.push_back(GenerateAppMarker(state->marker, code));
247
2.31k
        state->stage = MetadataState::READ_MARKER;
248
2.31k
        continue;
249
21.8k
      }
250
251
21.6k
      case MetadataState::READ_LENGTH_HI: {
252
21.6k
        state->length_hi = data[pos++];
253
21.6k
        state->stage = MetadataState::READ_LENGTH_LO;
254
21.6k
        continue;
255
21.8k
      }
256
257
21.6k
      case MetadataState::READ_LENGTH_LO: {
258
21.6k
        const uint8_t lo = data[pos++];
259
21.6k
        size_t marker_len = (state->length_hi << 8u) + lo;
260
21.6k
        if (marker_len < 2) return false;
261
21.6k
        state->remaining_multibyte_length = marker_len - 2;
262
21.6k
        uint8_t head[3] = {state->marker, state->length_hi, lo};
263
21.6k
        auto* dest = (state->marker == 0xFE) ? &jpg->com_data : &jpg->app_data;
264
21.6k
        size_t delta = (state->marker == 0xFE) ? 0 : state->short_marker_count;
265
21.6k
        if (dest->size() - delta >= kBrunsliMultibyteMarkerLimit) {
266
1
          return false;
267
1
        }
268
21.6k
        dest->emplace_back(head, head + 3);
269
21.6k
        state->multibyte_sink = &dest->back();
270
        // Turn state machine to default state in case there is no payload in
271
        // multibyte sequence. This is important when such a sequence concludes
272
        // the input.
273
21.6k
        state->stage = (state->remaining_multibyte_length > 0)
274
21.6k
                           ? MetadataState::READ_MULTIBYTE
275
21.6k
                           : MetadataState::READ_MARKER;
276
21.6k
        continue;
277
21.6k
      }
278
279
200k
      case MetadataState::READ_MULTIBYTE: {
280
200k
        size_t chunk_size =
281
200k
            std::min(state->remaining_multibyte_length, len - pos);
282
200k
        Append(state->multibyte_sink, data + pos, chunk_size);
283
200k
        state->remaining_multibyte_length -= chunk_size;
284
200k
        pos += chunk_size;
285
200k
        if (state->remaining_multibyte_length == 0) {
286
21.1k
          state->stage = MetadataState::READ_MARKER;
287
21.1k
        }
288
200k
        continue;
289
21.6k
      }
290
291
0
      default: return false;
292
319k
    }
293
319k
  }
294
220k
  return true;
295
221k
}
296
297
11.5k
static BrunsliStatus DecodeHuffmanCode(State* state, JPEGData* jpg) {
298
11.5k
  InternalState& s = *state->internal;
299
11.5k
  JpegInternalsState& js = s.internals;
300
11.5k
  BrunsliBitReader* br = &js.br;
301
302
229k
  while (true) {
303
229k
    switch (js.stage) {
304
26.4k
      case JpegInternalsState::READ_HUFFMAN_LAST: {
305
26.4k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
306
26.4k
        js.is_known_last_huffman_code = BrunsliBitReaderRead(br, 1);
307
26.4k
        jpg->huffman_code.emplace_back();
308
26.4k
        js.stage = JpegInternalsState::READ_HUFFMAN_SIMPLE;
309
26.4k
        continue;
310
26.4k
      }
311
26.4k
      case JpegInternalsState::READ_HUFFMAN_SIMPLE: {
312
26.4k
        if (!BrunsliBitReaderCanRead(br, 5 + !js.is_known_last_huffman_code)) {
313
189
          return BRUNSLI_NOT_ENOUGH_DATA;
314
189
        }
315
26.2k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
316
317
26.2k
        huff->slot_id = BrunsliBitReaderRead(br, 2);
318
26.2k
        js.is_dc_table = (BrunsliBitReaderRead(br, 1) == 0);
319
26.2k
        huff->slot_id += js.is_dc_table ? 0 : 0x10;
320
26.2k
        huff->is_last =
321
26.2k
            js.is_known_last_huffman_code || BrunsliBitReaderRead(br, 1);
322
26.2k
        huff->counts[0] = 0;
323
26.2k
        int found_match = BrunsliBitReaderRead(br, 1);
324
26.2k
        if (found_match) {
325
16.2k
          if (js.is_dc_table) {
326
8.71k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
327
8.71k
            memcpy(&huff->counts[1], kStockDCHuffmanCodeCounts[huff_table_idx],
328
8.71k
                   sizeof(kStockDCHuffmanCodeCounts[0]));
329
8.71k
            memcpy(&huff->values[0], kStockDCHuffmanCodeValues[huff_table_idx],
330
8.71k
                   sizeof(kStockDCHuffmanCodeValues[0]));
331
8.71k
          } else {
332
7.56k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
333
7.56k
            memcpy(&huff->counts[1], kStockACHuffmanCodeCounts[huff_table_idx],
334
7.56k
                   sizeof(kStockACHuffmanCodeCounts[0]));
335
7.56k
            memcpy(&huff->values[0], kStockACHuffmanCodeValues[huff_table_idx],
336
7.56k
                   sizeof(kStockACHuffmanCodeValues[0]));
337
7.56k
          }
338
16.2k
          js.stage = JpegInternalsState::HUFFMAN_UPDATE;
339
16.2k
        } else {
340
          // One less bit is used than requested, but it is guaranteed to be
341
          // consumed in complex Huffman code case.
342
9.96k
          js.p.Init(js.is_dc_table
343
9.96k
                        ? std::vector<uint8_t>(kDefaultDCValues,
344
7.00k
                                               std::end(kDefaultDCValues))
345
9.96k
                        : std::vector<uint8_t>(kDefaultACValues,
346
2.96k
                                               std::end(kDefaultACValues)));
347
9.96k
          js.stage = JpegInternalsState::READ_HUFFMAN_MAX_LEN;
348
9.96k
        }
349
26.2k
        continue;
350
26.4k
      }
351
9.96k
      case JpegInternalsState::READ_HUFFMAN_MAX_LEN: {
352
9.96k
        if (!BrunsliBitReaderCanRead(br, 4)) return BRUNSLI_NOT_ENOUGH_DATA;
353
9.92k
        js.max_len = BrunsliBitReaderRead(br, 4) + 1;
354
9.92k
        js.total_count = 0;
355
9.92k
        js.max_count =
356
9.92k
            js.is_dc_table ? kJpegDCAlphabetSize : kJpegHuffmanAlphabetSize;
357
9.92k
        js.space = (1u << kJpegHuffmanMaxBitLength) -
358
9.92k
                   (1u << (kJpegHuffmanMaxBitLength - js.max_len));
359
9.92k
        js.i = 1;
360
9.92k
        js.stage = JpegInternalsState::READ_HUFFMAN_COUNT;
361
9.92k
        continue;
362
9.96k
      }
363
46.4k
      case JpegInternalsState::READ_HUFFMAN_COUNT: {
364
46.4k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
365
46.4k
        if (js.i <= js.max_len) {
366
36.6k
          size_t shift = kJpegHuffmanMaxBitLength - js.i;
367
36.6k
          size_t count_limit =
368
36.6k
              std::min(js.max_count - js.total_count, js.space >> shift);
369
36.6k
          if (count_limit > 0) {
370
35.0k
            int nbits =
371
35.0k
                Log2FloorNonZero(static_cast<uint32_t>(count_limit)) + 1;
372
35.0k
            if (!BrunsliBitReaderCanRead(br, nbits)) {
373
52
              return BRUNSLI_NOT_ENOUGH_DATA;
374
52
            }
375
34.9k
            size_t count = BrunsliBitReaderRead(br, nbits);
376
34.9k
            if (count > count_limit) {
377
8
              return BRUNSLI_INVALID_BRN;
378
8
            }
379
34.9k
            huff->counts[js.i] = static_cast<int>(count);
380
34.9k
            js.total_count += count;
381
34.9k
            js.space -= count * (static_cast<size_t>(1) << shift);
382
34.9k
          }
383
36.5k
          ++js.i;
384
36.5k
          continue;
385
36.6k
        }
386
9.86k
        ++huff->counts[js.max_len];
387
9.86k
        js.i = 0;
388
9.86k
        js.stage = JpegInternalsState::READ_HUFFMAN_PERMUTATION;
389
9.86k
        continue;
390
46.4k
      }
391
93.6k
      case JpegInternalsState::READ_HUFFMAN_PERMUTATION: {
392
93.6k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
393
93.6k
        if (js.i < js.total_count) {
394
83.8k
          const int nbits = js.p.num_bits();
395
83.8k
          if (!DecodeLimitedVarint<2>(&js.varint, br, (nbits + 1) >> 1u)) {
396
63
            return BRUNSLI_NOT_ENOUGH_DATA;
397
63
          }
398
83.8k
          uint8_t value;
399
83.8k
          if (!js.p.Remove(js.varint.value, &value)) {
400
13
            return BRUNSLI_INVALID_BRN;
401
13
          }
402
83.8k
          huff->values[js.i] = value;
403
83.8k
          ++js.i;
404
83.8k
          continue;
405
83.8k
        }
406
9.79k
        huff->values[js.total_count] = kJpegHuffmanAlphabetSize;
407
9.79k
        js.stage = JpegInternalsState::HUFFMAN_UPDATE;
408
9.79k
        continue;
409
93.6k
      }
410
26.0k
      case JpegInternalsState::HUFFMAN_UPDATE: {
411
        // This stage does not perform reading -> transient.
412
26.0k
        if (jpg->huffman_code.back().is_last) {
413
13.2k
          js.terminal_huffman_code_count++;
414
13.2k
        }
415
26.0k
        if (js.is_known_last_huffman_code) {
416
11.1k
          js.p.Clear();
417
11.1k
          return BRUNSLI_OK;
418
11.1k
        }
419
14.8k
        if (jpg->huffman_code.size() >= kMaxDHTMarkers) {
420
          // Too many Huffman codes for a valid bit-stream. Normally, a jpeg
421
          // file can have any arbitrary number of DHT, DQT, etc. But i prefer
422
          // we force a reasonable lower bound instead of open door to likely
423
          // forged BRN input.
424
1
          return BRUNSLI_INVALID_BRN;
425
1
        }
426
14.8k
        js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
427
14.8k
        continue;
428
14.8k
      }
429
0
      default:
430
0
        return BRUNSLI_DECOMPRESSION_ERROR;
431
229k
    }
432
229k
  }
433
0
  return BRUNSLI_OK;
434
11.5k
}
435
436
5.13k
BrunsliStatus DecodeScanInfo(State* state, JPEGData* jpg) {
437
5.13k
  InternalState& s = *state->internal;
438
5.13k
  JpegInternalsState& js = s.internals;
439
5.13k
  BrunsliBitReader* br = &js.br;
440
441
23.1k
  const auto maybe_add_zero_run = [&js, jpg] () {
442
23.1k
    if (js.last_num > 0) {
443
16.1k
      JPEGScanInfo::ExtraZeroRunInfo info;
444
16.1k
      info.block_idx = js.last_block_idx;
445
16.1k
      info.num_extra_zero_runs = js.last_num;
446
16.1k
      jpg->scan_info[js.i].extra_zero_runs.push_back(info);
447
16.1k
      js.last_num = 0;
448
16.1k
    }
449
23.1k
  };
450
451
183k
  while (true) {
452
183k
    switch (js.stage) {
453
9.20k
      case JpegInternalsState::READ_SCAN_COMMON: {
454
9.20k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
455
9.20k
        if (!BrunsliBitReaderCanRead(br, 22)) return BRUNSLI_NOT_ENOUGH_DATA;
456
9.04k
        si->Ss = BrunsliBitReaderRead(br, 6);
457
9.04k
        si->Se = BrunsliBitReaderRead(br, 6);
458
9.04k
        si->Ah = BrunsliBitReaderRead(br, 4);
459
9.04k
        si->Al = BrunsliBitReaderRead(br, 4);
460
9.04k
        si->num_components = BrunsliBitReaderRead(br, 2) + 1;
461
9.04k
        js.j = 0;
462
9.04k
        js.stage = JpegInternalsState::READ_SCAN_COMPONENT;
463
9.04k
        continue;
464
9.20k
      }
465
29.5k
      case JpegInternalsState::READ_SCAN_COMPONENT: {
466
29.5k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
467
29.5k
        if (js.j < si->num_components) {
468
20.5k
          if (!BrunsliBitReaderCanRead(br, 6)) return BRUNSLI_NOT_ENOUGH_DATA;
469
20.5k
          si->components[js.j].comp_idx = BrunsliBitReaderRead(br, 2);
470
20.5k
          si->components[js.j].dc_tbl_idx = BrunsliBitReaderRead(br, 2);
471
20.5k
          si->components[js.j].ac_tbl_idx = BrunsliBitReaderRead(br, 2);
472
20.5k
          js.j++;
473
20.5k
        } else {
474
9.00k
          js.last_block_idx = -1;
475
9.00k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
476
9.00k
        }
477
29.5k
        continue;
478
29.5k
      }
479
41.1k
      case JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION: {
480
41.1k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
481
41.0k
        if (BrunsliBitReaderRead(br, 1)) {
482
32.1k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_DATA;
483
32.1k
        } else {
484
8.93k
          js.last_block_idx = 0;
485
8.93k
          js.last_num = 0;
486
8.93k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
487
8.93k
        }
488
41.0k
        continue;
489
41.1k
      }
490
32.1k
      case JpegInternalsState::READ_SCAN_RESET_POINT_DATA: {
491
32.1k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
492
32.1k
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
493
32.1k
        int block_idx =
494
32.1k
            js.last_block_idx + static_cast<int>(js.varint.value) + 1;
495
32.1k
        si->reset_points.emplace_back(block_idx);
496
32.1k
        js.last_block_idx = block_idx;
497
        // TODO(eustas): limit to exact number of blocks.
498
32.1k
        if (js.last_block_idx > (1 << 30)) {
499
          // At most 8K x 8K x num_channels blocks are expected. That is,
500
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
501
          // image.
502
1
          return BRUNSLI_INVALID_BRN;
503
1
        }
504
32.1k
        js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
505
32.1k
        continue;
506
32.1k
      }
507
40.1k
      case JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION: {
508
40.1k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
509
40.1k
        if (BrunsliBitReaderRead(br, 1)) {
510
31.2k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_DATA;
511
31.2k
        } else {
512
8.88k
          maybe_add_zero_run();
513
8.88k
          ++js.i;
514
8.88k
          if (js.i < js.num_scans) {
515
4.07k
            js.stage = JpegInternalsState::READ_SCAN_COMMON;
516
4.07k
            continue;
517
4.07k
          }
518
4.81k
          return BRUNSLI_OK;
519
8.88k
        }
520
31.2k
        continue;
521
40.1k
      }
522
31.2k
      case JpegInternalsState::READ_SCAN_ZERO_RUN_DATA: {
523
31.2k
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
524
31.1k
        int block_idx = js.last_block_idx + static_cast<int>(js.varint.value);
525
31.1k
        if (block_idx > js.last_block_idx) maybe_add_zero_run();
526
31.1k
        ++js.last_num;
527
31.1k
        js.last_block_idx = block_idx;
528
        // TODO(eustas): limit to exact number of blocks.
529
31.1k
        if (js.last_block_idx > (1 << 30)) {
530
          // At most 8K x 8K x num_channels blocks are expected. That is,
531
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
532
          // image.
533
3
          return BRUNSLI_INVALID_BRN;
534
3
        }
535
31.1k
        js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
536
31.1k
        continue;
537
31.1k
      }
538
0
      default: return BRUNSLI_DECOMPRESSION_ERROR;
539
183k
    }
540
183k
  }
541
5.13k
}
542
543
static bool BRUNSLI_NOINLINE DecodeCoeffOrder(uint32_t* order, BitSource* br,
544
5.81k
                                              WordSource* in) {
545
5.81k
  uint32_t lehmer[kDCTBlockSize] = {0};
546
5.81k
  static const int kSpan = 16;
547
29.0k
  for (int i = 0; i < kDCTBlockSize; i += kSpan) {
548
23.2k
    if (!br->ReadBits(1, in)) continue;  // span is all-zero
549
2.57k
    const int start = (i > 0) ? i : 1;
550
2.57k
    const int end = i + kSpan;
551
41.8k
    for (int j = start; j < end; ++j) {
552
39.3k
      uint32_t v = 0;
553
50.2k
      while (v <= kDCTBlockSize) {
554
50.2k
        const uint32_t bits = br->ReadBits(3, in);
555
50.2k
        v += bits;
556
50.2k
        if (bits < 7) break;
557
50.2k
      }
558
39.3k
      if (v > kDCTBlockSize) return false;
559
39.3k
      lehmer[j] = v;
560
39.3k
    }
561
2.57k
  }
562
5.80k
  int end = kDCTBlockSize - 1;
563
340k
  while (end >= 1 && lehmer[end] == 0) {
564
334k
    --end;
565
334k
  }
566
5.80k
  if (lehmer[end] == 1) return false;
567
29.7k
  for (int i = 1; i <= end; ++i) {
568
24.2k
    if (lehmer[i] == 0) return false;
569
24.0k
    --lehmer[i];
570
24.0k
  }
571
5.57k
  if (!DecodeLehmerCode(lehmer, kDCTBlockSize, order)) return false;
572
361k
  for (int k = 0; k < kDCTBlockSize; ++k) {
573
355k
    order[k] = kJPEGNaturalOrder[order[k]];
574
355k
  }
575
5.55k
  return true;
576
5.57k
}
577
578
/** Reads 0..6 words from |in| and returns the value in the range 0..63. */
579
static size_t DecodeNumNonzeros(Prob* p, BinaryArithmeticDecoder* ac,
580
1.78M
                                WordSource* in) {
581
  // To simplity BST navigation, we use 1-based indexing.
582
1.78M
  Prob* bst = p - 1;
583
1.78M
  size_t ctx = 1;
584
585
12.4M
  for (size_t b = 0; b < kNumNonZeroBits; ++b) {
586
10.6M
    const int bit = ac->ReadBit(bst[ctx].get_proba(), in);
587
10.6M
    bst[ctx].Add(bit);
588
10.6M
    ctx = 2 * ctx + bit;
589
10.6M
  }
590
591
  // Leaf index in the level corresponds to the resuling value.
592
1.78M
  size_t val = ctx - (1u << kNumNonZeroBits);
593
1.78M
  BRUNSLI_DCHECK(val <= kNumNonZeroTreeSize);
594
1.78M
  return val;
595
1.78M
}
596
597
11.3k
void EnsureSubdecodersInitialized(State* state, WordSource* in) {
598
11.3k
  InternalState& s = *state->internal;
599
11.3k
  if (!s.subdecoders_initialized) {
600
11.3k
    s.ans_decoder.Init(in);
601
11.3k
    s.bit_reader.Init(in);
602
11.3k
    s.arith_decoder.Init(in);
603
11.3k
    s.subdecoders_initialized = true;
604
11.3k
  }
605
11.3k
}
606
607
10.9k
bool FinalizeSubdecoders(State* state) {
608
10.9k
  InternalState& s = *state->internal;
609
10.9k
  if (!s.ans_decoder.CheckCRC()) return false;
610
10.1k
  if (!s.bit_reader.Finish()) return false;
611
10.1k
  s.subdecoders_initialized = false;
612
10.1k
  return true;
613
10.1k
}
614
615
6.07k
BrunsliStatus DecodeDC(State* state, WordSource* in) {
616
6.07k
  const std::vector<ComponentMeta>& meta = state->meta;
617
6.07k
  const size_t num_components = meta.size();
618
6.07k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
619
6.07k
  InternalState& s = *state->internal;
620
6.07k
  AcDcState& ac_dc_state = s.ac_dc;
621
622
6.07k
  std::vector<ComponentStateDC>& comps = ac_dc_state.dc;
623
6.07k
  if (comps.empty()) {
624
6.07k
    comps.resize(num_components);
625
12.7k
    for (size_t c = 0; c < num_components; ++c) {
626
6.69k
      comps[c].SetWidth(meta[c].width_in_blocks);
627
6.69k
    }
628
6.07k
  }
629
630
6.07k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
631
5.94k
  EnsureSubdecodersInitialized(state, in);
632
5.94k
  ANSDecoder ans = s.ans_decoder;
633
5.94k
  BitSource br = s.bit_reader;
634
5.94k
  BinaryArithmeticDecoder ac = s.arith_decoder;
635
636
  // We decode DC components in the following interleaved manner:
637
  //   v_samp[0] rows from component 0
638
  //   v_samp[1] rows from component 1
639
  //   v_samp[2] rows from component 2
640
  //   v_samp[3] rows from component 3 (if present)
641
  //
642
  // E.g. in a YUV420 image, we decode 2 rows of DC components from Y and then
643
  // 1 row of DC components from U and 1 row of DC components from V.
644
133k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
645
259k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
646
131k
      ComponentStateDC* c = &comps[i];
647
131k
      const ComponentMeta& m = meta[i];
648
131k
      const uint8_t* context_map = state->context_map + i * kNumAvrgContexts;
649
131k
      const int ac_stride = static_cast<int>(m.ac_stride);
650
131k
      const size_t b_stride = m.b_stride;
651
131k
      const int width = m.width_in_blocks;
652
131k
      int y = mcu_y * m.v_samp + ac_dc_state.next_iy;
653
131k
      int* const prev_sgn = &c->prev_sign[1];
654
131k
      int* const prev_abs = &c->prev_abs_coeff[2];
655
502k
      for (int iy = ac_dc_state.next_iy; iy < m.v_samp; ++iy, ++y) {
656
370k
        coeff_t* coeffs =
657
370k
            m.ac_coeffs + y * ac_stride + ac_dc_state.next_x * kDCTBlockSize;
658
370k
        uint8_t* block_state =
659
370k
            m.block_state + y * b_stride + ac_dc_state.next_x;
660
58.2M
        for (int x = ac_dc_state.next_x; x < width; ++x) {
661
57.8M
          if (BRUNSLI_PREDICT_FALSE(!in->CanRead(6))) {
662
88
            ac_dc_state.next_mcu_y = mcu_y;
663
88
            ac_dc_state.next_component = i;
664
88
            ac_dc_state.next_iy = iy;
665
88
            ac_dc_state.next_x = x;
666
88
            s.ans_decoder = ans;
667
88
            s.bit_reader = br;
668
88
            s.arith_decoder = ac;
669
88
            return BRUNSLI_NOT_ENOUGH_DATA;
670
88
          }
671
57.8M
          const int is_empty_ctx =
672
57.8M
              IsEmptyBlockContext(&c->prev_is_nonempty[1], x);
673
57.8M
          Prob* BRUNSLI_RESTRICT is_empty_p =
674
57.8M
              &c->is_empty_block_prob[is_empty_ctx];
675
57.8M
          const bool is_empty_block = !ac.ReadBit(is_empty_p->get_proba(), in);
676
57.8M
          is_empty_p->Add(!is_empty_block);
677
57.8M
          c->prev_is_nonempty[x + 1] = !is_empty_block;
678
57.8M
          *block_state = is_empty_block;
679
57.8M
          int abs_val = 0;
680
57.8M
          int sign = 0;
681
57.8M
          if (!is_empty_block) {
682
18.4M
            Prob* BRUNSLI_RESTRICT p_is_zero = &c->is_zero_prob;
683
18.4M
            int is_zero = ac.ReadBit(p_is_zero->get_proba(), in);
684
18.4M
            p_is_zero->Add(is_zero);
685
18.4M
            if (!is_zero) {
686
4.35M
              const int avg_ctx = WeightedAverageContextDC(prev_abs, x);
687
4.35M
              const int sign_ctx = prev_sgn[x] * 3 + prev_sgn[x - 1];
688
4.35M
              Prob* BRUNSLI_RESTRICT sign_p = &c->sign_prob[sign_ctx];
689
4.35M
              sign = ac.ReadBit(sign_p->get_proba(), in);
690
4.35M
              sign_p->Add(sign);
691
4.35M
              const int entropy_ix = context_map[avg_ctx];
692
4.35M
              int code = ans.ReadSymbol(state->entropy_codes[entropy_ix], in);
693
4.35M
              if (code < kNumDirectCodes) {
694
670k
                abs_val = code + 1;
695
3.68M
              } else {
696
3.68M
                int nbits = code - kNumDirectCodes;
697
3.68M
                Prob* BRUNSLI_RESTRICT p_first_extra_bit =
698
3.68M
                    &c->first_extra_bit_prob[nbits];
699
3.68M
                int first_extra_bit =
700
3.68M
                    ac.ReadBit(p_first_extra_bit->get_proba(), in);
701
3.68M
                p_first_extra_bit->Add(first_extra_bit);
702
3.68M
                int extra_bits_val = first_extra_bit << nbits;
703
3.68M
                if (nbits > 0) {
704
3.55M
                  extra_bits_val |= static_cast<int>(br.ReadBits(nbits, in));
705
3.55M
                }
706
3.68M
                abs_val = kNumDirectCodes - 1 + (2 << nbits) + extra_bits_val;
707
3.68M
              }
708
4.35M
            }
709
18.4M
          }
710
57.8M
          prev_abs[x] = abs_val;
711
57.8M
          prev_sgn[x] = abs_val ? sign + 1 : 0;
712
57.8M
          coeffs[0] = ((1 - 2 * sign) * abs_val +
713
57.8M
                       PredictWithAdaptiveMedian(coeffs, x, y, ac_stride));
714
57.8M
          block_state++;
715
57.8M
          coeffs += kDCTBlockSize;
716
57.8M
        }
717
370k
        ac_dc_state.next_x = 0;
718
370k
      }
719
131k
      ac_dc_state.next_iy = 0;
720
131k
    }
721
127k
    ac_dc_state.next_component = 0;
722
127k
  }
723
724
  // Prepare for AC decoding.
725
5.86k
  ac_dc_state.next_mcu_y = 0;
726
5.86k
  ac_dc_state.next_component = 0;
727
5.86k
  ac_dc_state.next_iy = 0;
728
5.86k
  ac_dc_state.next_x = 0;
729
730
5.86k
  comps.clear();
731
5.86k
  comps.shrink_to_fit();
732
733
5.86k
  s.ans_decoder = ans;
734
5.86k
  s.bit_reader = br;
735
5.86k
  s.arith_decoder = ac;
736
5.86k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
737
738
5.55k
  return BRUNSLI_OK;
739
5.86k
}
740
741
static void BRUNSLI_NOINLINE DecodeEmptyAcBlock(
742
9.47M
    int* BRUNSLI_RESTRICT prev_sgn, int* BRUNSLI_RESTRICT prev_abs) {
743
606M
  for (int k = 1; k < kDCTBlockSize; ++k) {
744
596M
    prev_sgn[k] = 0;
745
596M
    prev_abs[k] = 0;
746
596M
  }
747
9.47M
}
748
749
/** All the necessary things for decoding AC block. */
750
struct AcBlockCookie {
751
  int x;
752
  int y;
753
  uint8_t* BRUNSLI_RESTRICT prev_num_nonzeros;
754
  int* BRUNSLI_RESTRICT prev_sgn;
755
  int* BRUNSLI_RESTRICT prev_abs;
756
  Prob* BRUNSLI_RESTRICT num_nonzero_prob;
757
758
  BinaryArithmeticDecoder* BRUNSLI_RESTRICT ac;
759
  WordSource* BRUNSLI_RESTRICT in;
760
  ANSDecoder* BRUNSLI_RESTRICT ans;
761
  BitSource* BRUNSLI_RESTRICT br;
762
763
  coeff_t* BRUNSLI_RESTRICT coeffs;
764
  const coeff_t* BRUNSLI_RESTRICT prev_row_coeffs;
765
  const coeff_t* BRUNSLI_RESTRICT prev_col_coeffs;
766
  Prob* BRUNSLI_RESTRICT is_zero_prob;
767
  const uint32_t* BRUNSLI_RESTRICT order;
768
  const uint8_t* BRUNSLI_RESTRICT context_modes;
769
  const int* BRUNSLI_RESTRICT mult_col;
770
  const int* BRUNSLI_RESTRICT mult_row;
771
  int prev_row_delta;
772
  Prob* BRUNSLI_RESTRICT sign_prob;
773
  size_t context_bits;
774
  const uint8_t* BRUNSLI_RESTRICT context_map;
775
  const ANSDecodingData* BRUNSLI_RESTRICT entropy_codes;
776
  Prob* BRUNSLI_RESTRICT first_extra_bit_prob;
777
};
778
779
1.78M
static size_t BRUNSLI_NOINLINE DecodeAcBlock(const AcBlockCookie& cookie) {
780
1.78M
  AcBlockCookie c = cookie;
781
782
1.78M
  BinaryArithmeticDecoder ac = *c.ac;
783
1.78M
  WordSource* in = c.in;
784
1.78M
  ANSDecoder ans = *c.ans;
785
1.78M
  BitSource br = *c.br;
786
787
1.78M
  size_t num_nonzeros = 0;
788
789
1.78M
  const uint8_t nonzero_ctx = NumNonzerosContext(c.prev_num_nonzeros, c.x, c.y);
790
1.78M
  size_t last_nz = DecodeNumNonzeros(
791
1.78M
      c.num_nonzero_prob + kNumNonZeroTreeSize * nonzero_ctx, &ac, in);
792
86.0M
  for (size_t k = last_nz + 1; k < kDCTBlockSize; ++k) {
793
84.2M
    c.prev_sgn[k] = 0;
794
84.2M
    c.prev_abs[k] = 0;
795
84.2M
  }
796
29.8M
  for (size_t k = last_nz; k > 0; --k) {
797
28.0M
    int is_zero = 0;
798
28.0M
    if (k < last_nz) {
799
27.2M
      size_t bucket = kNonzeroBuckets[num_nonzeros - 1];
800
27.2M
      size_t is_zero_ctx = bucket * kDCTBlockSize + k;
801
27.2M
      Prob& p = c.is_zero_prob[is_zero_ctx];
802
27.2M
      is_zero = ac.ReadBit(p.get_proba(), in);
803
27.2M
      p.Add(is_zero);
804
27.2M
    }
805
28.0M
    int abs_val = 0;
806
28.0M
    int sign = 1;
807
28.0M
    const int k_nat = c.order[k];
808
28.0M
    if (!is_zero) {
809
7.45M
      size_t context_type = c.context_modes[k_nat];
810
7.45M
      size_t avg_ctx = 0;
811
7.45M
      size_t sign_ctx = kMaxAverageContext;
812
7.45M
      if ((context_type & 1) && (c.y > 0)) {
813
1.48M
        size_t offset = k_nat & 7;
814
1.48M
        ACPredictContextRow(c.prev_row_coeffs + offset, c.coeffs + offset,
815
1.48M
                            c.mult_col + offset * 8, &avg_ctx, &sign_ctx);
816
5.97M
      } else if ((context_type & 2) && (c.x > 0)) {
817
1.70M
        size_t offset = k_nat & ~7;
818
1.70M
        ACPredictContextCol(c.prev_col_coeffs + offset, c.coeffs + offset,
819
1.70M
                            c.mult_row + offset, &avg_ctx, &sign_ctx);
820
4.26M
      } else if (!context_type) {
821
4.16M
        avg_ctx = WeightedAverageContext(c.prev_abs + k, c.prev_row_delta);
822
4.16M
        sign_ctx =
823
4.16M
            c.prev_sgn[k] * 3 + c.prev_sgn[static_cast<int>(k) - kDCTBlockSize];
824
4.16M
      }
825
7.45M
      sign_ctx = sign_ctx * kDCTBlockSize + k;
826
7.45M
      Prob& sign_p = c.sign_prob[sign_ctx];
827
7.45M
      sign = ac.ReadBit(sign_p.get_proba(), in);
828
7.45M
      sign_p.Add(sign);
829
7.45M
      c.prev_sgn[k] = sign + 1;
830
7.45M
      sign = 1 - 2 * sign;
831
7.45M
      const size_t z_dens_ctx =
832
7.45M
          ZeroDensityContext(num_nonzeros, k, c.context_bits);
833
7.45M
      size_t histo_ix = z_dens_ctx * kNumAvrgContexts + avg_ctx;
834
7.45M
      size_t entropy_ix = c.context_map[histo_ix];
835
7.45M
      int code = ans.ReadSymbol(c.entropy_codes[entropy_ix], in);
836
7.45M
      if (code < kNumDirectCodes) {
837
3.68M
        abs_val = code + 1;
838
3.76M
      } else {
839
3.76M
        int nbits = code - kNumDirectCodes;
840
3.76M
        Prob& p = c.first_extra_bit_prob[k * 10 + nbits];
841
3.76M
        int first_extra_bit = ac.ReadBit(p.get_proba(), in);
842
3.76M
        p.Add(first_extra_bit);
843
3.76M
        int extra_bits_val = first_extra_bit << nbits;
844
3.76M
        if (nbits > 0) {
845
2.99M
          extra_bits_val |= br.ReadBits(nbits, in);
846
2.99M
        }
847
3.76M
        abs_val = kNumDirectCodes - 1 + (2u << nbits) + extra_bits_val;
848
3.76M
      }
849
7.45M
      ++num_nonzeros;
850
20.6M
    } else {
851
20.6M
      c.prev_sgn[k] = 0;
852
20.6M
    }
853
28.0M
    int coeff = sign * abs_val;
854
28.0M
    c.coeffs[k_nat] = coeff;
855
28.0M
    c.prev_abs[k] = abs_val;
856
28.0M
  }
857
858
1.78M
  *c.ans = ans;
859
1.78M
  *c.br = br;
860
1.78M
  *c.ac = ac;
861
862
1.78M
  return num_nonzeros;
863
1.78M
}
864
865
5.47k
BrunsliStatus DecodeAC(State* state, WordSource* in) {
866
5.47k
  const std::vector<ComponentMeta>& meta = state->meta;
867
5.47k
  const size_t num_components = meta.size();
868
5.47k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
869
5.47k
  InternalState& s = *state->internal;
870
5.47k
  AcDcState& ac_dc_state = s.ac_dc;
871
872
5.47k
  std::vector<ComponentState>& comps = ac_dc_state.ac;
873
5.47k
  if (comps.empty()) {
874
5.47k
    comps.resize(num_components);
875
11.5k
    for (size_t c = 0; c < num_components; ++c) {
876
6.02k
      comps[c].SetWidth(meta[c].width_in_blocks);
877
6.02k
      ComputeACPredictMultipliers(&meta[c].quant[0], comps[c].mult_row,
878
6.02k
                                  comps[c].mult_col);
879
6.02k
    }
880
5.47k
  }
881
882
5.47k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
883
5.37k
  EnsureSubdecodersInitialized(state, in);
884
885
5.37k
  if (!ac_dc_state.ac_coeffs_order_decoded) {
886
10.9k
    while (ac_dc_state.next_component < num_components) {
887
5.81k
      if (!in->CanRead(121)) return BRUNSLI_NOT_ENOUGH_DATA;
888
5.81k
      if (!DecodeCoeffOrder(comps[ac_dc_state.next_component].order,
889
5.81k
                            &s.bit_reader, in)) {
890
254
        return BRUNSLI_INVALID_BRN;
891
254
      }
892
5.55k
      ac_dc_state.next_component++;
893
5.55k
    }
894
5.11k
    ac_dc_state.next_component = 0;
895
5.11k
    ac_dc_state.ac_coeffs_order_decoded = true;
896
5.11k
  }
897
898
5.11k
  AcBlockCookie c;
899
5.11k
  c.ac = &s.arith_decoder;
900
5.11k
  c.in = in;
901
5.11k
  c.ans = &s.ans_decoder;
902
5.11k
  c.br = &s.bit_reader;
903
5.11k
  c.entropy_codes = state->entropy_codes;
904
5.11k
  c.context_modes =
905
5.11k
      kContextAlgorithm + (state->use_legacy_context_model ? 64 : 0);
906
907
103k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
908
196k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
909
98.3k
      ComponentState& cst = comps[i];
910
98.3k
      c.prev_num_nonzeros = cst.prev_num_nonzeros.data();
911
98.3k
      c.num_nonzero_prob = cst.num_nonzero_prob;
912
98.3k
      c.is_zero_prob = cst.is_zero_prob.data();
913
98.3k
      c.order = cst.order;
914
98.3k
      c.mult_col = cst.mult_col;
915
98.3k
      c.mult_row = cst.mult_row;
916
98.3k
      c.sign_prob = cst.sign_prob.data();
917
98.3k
      c.first_extra_bit_prob = cst.first_extra_bit_prob.data();
918
98.3k
      const ComponentMeta& m = meta[i];
919
98.3k
      c.context_map = state->context_map + m.context_offset * kNumAvrgContexts;
920
98.3k
      c.context_bits = m.context_bits;
921
98.3k
      const int width = m.width_in_blocks;
922
98.3k
      const size_t ac_stride = m.ac_stride;
923
98.3k
      const size_t b_stride = m.b_stride;
924
98.3k
      const int next_iy = ac_dc_state.next_iy;
925
98.3k
      c.y = mcu_y * m.v_samp + next_iy;
926
98.3k
      c.prev_row_delta = (1 - 2 * (c.y & 1u)) * (width + 3) * kDCTBlockSize;
927
406k
      for (int iy = next_iy; iy < m.v_samp; ++iy, ++c.y) {
928
308k
        const int next_x = ac_dc_state.next_x;
929
308k
        const size_t block_offset = next_x * kDCTBlockSize;
930
308k
        c.coeffs = m.ac_coeffs + c.y * ac_stride + block_offset;
931
308k
        c.prev_row_coeffs = c.coeffs - ac_stride;
932
308k
        c.prev_col_coeffs = c.coeffs - kDCTBlockSize;
933
308k
        const uint8_t* block_state = m.block_state + c.y * b_stride + next_x;
934
308k
        c.prev_sgn = &cst.prev_sign[kDCTBlockSize] + block_offset;
935
308k
        c.prev_abs = &cst.prev_abs_coeff[((c.y & 1u) * (width + 3) + 2) *
936
308k
                                         kDCTBlockSize] +
937
308k
                     block_offset;
938
11.5M
        for (c.x = next_x; c.x < width; ++c.x) {
939
11.2M
          bool is_empty = *(block_state++);
940
11.2M
          if (!is_empty) {
941
1.78M
            if (BRUNSLI_PREDICT_FALSE(!in->CanRead(297))) {
942
67
              ac_dc_state.next_mcu_y = mcu_y;
943
67
              ac_dc_state.next_component = i;
944
67
              ac_dc_state.next_iy = iy;
945
67
              ac_dc_state.next_x = c.x;
946
67
              return BRUNSLI_NOT_ENOUGH_DATA;
947
67
            }
948
1.78M
            size_t num_nonzeros = DecodeAcBlock(c);
949
1.78M
            BRUNSLI_DCHECK(num_nonzeros <= kNumNonZeroTreeSize);
950
1.78M
            c.prev_num_nonzeros[c.x] = static_cast<uint8_t>(num_nonzeros);
951
9.47M
          } else {
952
9.47M
            DecodeEmptyAcBlock(c.prev_sgn, c.prev_abs);
953
9.47M
            c.prev_num_nonzeros[c.x] = 0;
954
9.47M
          }
955
11.2M
          c.coeffs += kDCTBlockSize;
956
11.2M
          c.prev_sgn += kDCTBlockSize;
957
11.2M
          c.prev_abs += kDCTBlockSize;
958
11.2M
          c.prev_row_coeffs += kDCTBlockSize;
959
11.2M
          c.prev_col_coeffs += kDCTBlockSize;
960
11.2M
        }
961
308k
        c.prev_row_delta *= -1;
962
308k
        ac_dc_state.next_x = 0;
963
308k
      }
964
98.2k
      ac_dc_state.next_iy = 0;
965
98.2k
    }
966
97.9k
    ac_dc_state.next_component = 0;
967
97.9k
  }
968
5.04k
  ac_dc_state.next_mcu_y = 0;
969
970
5.04k
  comps.clear();
971
5.04k
  comps.shrink_to_fit();
972
973
5.04k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
974
975
4.56k
  return BRUNSLI_OK;
976
5.04k
}
977
978
230k
static bool CheckCanRead(State* state, size_t required) {
979
  // TODO(eustas): dcheck len > pos
980
230k
  size_t available = state->len - state->pos;
981
230k
  return required <= available;
982
230k
}
983
984
128k
static bool CheckCanReadByte(State* state) {
985
  // TODO(eustas): dcheck len > pos
986
128k
  return state->pos != state->len;
987
128k
}
988
989
128k
static uint8_t ReadByte(State* state) {
990
  // TODO(eustas): dcheck len > pos
991
128k
  return state->data[state->pos++];
992
128k
}
993
994
212k
static uint8_t PeekByte(State* state, size_t offset) {
995
  // TODO(eustas): dcheck overflow.
996
212k
  return state->data[state->pos + offset];
997
212k
}
998
999
482k
static void SkipBytes(State* state, size_t len) {
1000
  // TODO(eustas): dcheck overflow.
1001
482k
  state->pos += len;
1002
482k
}
1003
1004
351k
static size_t GetBytesAvailable(State* state) {
1005
  // TODO(eustas): dcheck len > pos
1006
351k
  return state->len - state->pos;
1007
351k
}
1008
1009
4.82k
static size_t SkipAvailableBytes(State* state, size_t len) {
1010
4.82k
  size_t available = GetBytesAvailable(state);
1011
4.82k
  size_t skip_bytes = std::min(available, len);
1012
4.82k
  state->pos += skip_bytes;
1013
4.82k
  return skip_bytes;
1014
4.82k
}
1015
1016
177k
static BrunsliStatus DecodeBase128(State* state, size_t* val) {
1017
177k
  *val = 0;
1018
177k
  uint64_t b = 0x80;
1019
177k
  size_t i = 0;
1020
390k
  while ((i < 9) && (b & 0x80u)) {
1021
213k
    if (!CheckCanRead(state, i + 1)) return BRUNSLI_NOT_ENOUGH_DATA;
1022
212k
    b = PeekByte(state, i);
1023
212k
    *val |= (b & 0x7Fu) << (i * 7);
1024
212k
    ++i;
1025
212k
  }
1026
177k
  SkipBytes(state, i);
1027
177k
  return ((b & 0x80u) == 0) ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1028
177k
}
1029
1030
17.5k
static Stage Fail(State* state, BrunsliStatus result) {
1031
17.5k
  InternalState& s = *state->internal;
1032
17.5k
  s.result = result;
1033
  // Preserve current stage for continuation / error reporting.
1034
17.5k
  s.last_stage = state->stage;
1035
17.5k
  return Stage::ERROR;
1036
17.5k
}
1037
1038
128k
static BrunsliStatus ReadTag(State* state, SectionState* section) {
1039
128k
  if (!CheckCanReadByte(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1040
127k
  const uint8_t marker = ReadByte(state);
1041
1042
127k
  const size_t tag = marker >> 3u;
1043
127k
  if (tag == 0 || tag > 15) return BRUNSLI_INVALID_BRN;
1044
127k
  section->tag = tag;
1045
1046
127k
  const size_t wiring_type = marker & 0x7u;
1047
127k
  if (wiring_type != kBrunsliWiringTypeVarint &&
1048
65.8k
      wiring_type != kBrunsliWiringTypeLengthDelimited) {
1049
18
    return BRUNSLI_INVALID_BRN;
1050
18
  }
1051
127k
  section->is_section = (wiring_type == kBrunsliWiringTypeLengthDelimited);
1052
1053
127k
  const uint32_t tag_bit = 1u << tag;
1054
127k
  if (section->tags_met & tag_bit) {
1055
14
    BRUNSLI_LOG_ERROR() << "Duplicate marker " << std::hex
1056
14
                        << static_cast<int>(marker) << BRUNSLI_ENDL();
1057
14
    return BRUNSLI_INVALID_BRN;
1058
14
  }
1059
127k
  section->tags_met |= tag_bit;
1060
1061
127k
  return BRUNSLI_OK;
1062
127k
}
1063
1064
60.9k
static BrunsliStatus EnterSection(State* state, SectionState* section) {
1065
60.9k
  size_t section_size;
1066
60.9k
  BrunsliStatus status = DecodeBase128(state, &section_size);
1067
60.9k
  if (status != BRUNSLI_OK) return status;
1068
60.8k
  section->is_active = true;
1069
60.8k
  section->remaining = section_size;
1070
60.8k
  section->milestone = state->pos;
1071
60.8k
  section->projected_end = state->pos + section->remaining;
1072
60.8k
  return BRUNSLI_OK;
1073
60.9k
}
1074
1075
16.7k
static void LeaveSection(SectionState* section) {
1076
16.7k
  section->is_active = false;
1077
16.7k
}
1078
1079
372k
static bool IsOutOfSectionBounds(State* state) {
1080
372k
  return state->pos > state->internal->section.projected_end;
1081
372k
}
1082
1083
367k
static size_t RemainingSectionLength(State* state) {
1084
  // TODO(eustas): remove this check?
1085
367k
  if (IsOutOfSectionBounds(state)) return 0;
1086
366k
  return state->internal->section.projected_end - state->pos;
1087
367k
}
1088
1089
151k
static bool IsAtSectionBoundary(State* state) {
1090
151k
  return state->pos == state->internal->section.projected_end;
1091
151k
}
1092
1093
17.4k
Stage VerifySignature(State* state) {
1094
17.4k
  InternalState& s = *state->internal;
1095
1096
17.4k
  if (!CheckCanRead(state, kBrunsliSignatureSize)) {
1097
5
    return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1098
5
  }
1099
17.4k
  const bool is_signature_ok =
1100
17.4k
      (memcmp(state->data + state->pos, kBrunsliSignature,
1101
17.4k
              kBrunsliSignatureSize) != 0);
1102
17.4k
  state->pos += kBrunsliSignatureSize;
1103
17.4k
  s.section.tags_met |= 1u << kBrunsliSignatureTag;
1104
17.4k
  if (is_signature_ok) return Fail(state, BRUNSLI_INVALID_BRN);
1105
17.3k
  return Stage::HEADER;
1106
17.4k
}
1107
1108
// Parses the brunsli header starting at data[*pos] and fills in *jpg.
1109
// Sets *pos to the position after the header.
1110
// Returns BRUNSLI_OK, unless the data is not valid brunsli byte stream
1111
// or is truncated.
1112
17.3k
Stage DecodeHeader(State* state, JPEGData* jpg) {
1113
17.3k
  InternalState& s = *state->internal;
1114
17.3k
  HeaderState& hs = s.header;
1115
1116
223k
  while (hs.stage != HeaderState::DONE) {
1117
207k
    switch (hs.stage) {
1118
17.3k
      case HeaderState::READ_TAG: {
1119
17.3k
        BrunsliStatus status = ReadTag(state, &s.section);
1120
17.3k
        if (status != BRUNSLI_OK) return Fail(state, status);
1121
17.3k
        if (s.section.tag != kBrunsliHeaderTag || !s.section.is_section) {
1122
6
          return Fail(state, BRUNSLI_INVALID_BRN);
1123
6
        }
1124
17.3k
        hs.stage = HeaderState::ENTER_SECTION;
1125
17.3k
        break;
1126
17.3k
      }
1127
1128
17.3k
      case HeaderState::ENTER_SECTION: {
1129
17.3k
        BrunsliStatus status = EnterSection(state, &s.section);
1130
17.3k
        if (status != BRUNSLI_OK) return Fail(state, status);
1131
17.2k
        hs.stage = HeaderState::ITEM_READ_TAG;
1132
17.2k
        break;
1133
17.3k
      }
1134
1135
83.9k
      case HeaderState::ITEM_READ_TAG: {
1136
83.9k
        if (IsAtSectionBoundary(state)) {
1137
16.9k
          hs.stage = HeaderState::FINALE;
1138
16.9k
          break;
1139
16.9k
        }
1140
66.9k
        BrunsliStatus status = ReadTag(state, &hs.section);
1141
66.9k
        if (status != BRUNSLI_OK) return Fail(state, status);
1142
66.8k
        const uint32_t tag_bit = 1u << hs.section.tag;
1143
66.8k
        if (hs.section.is_section) {
1144
4.84k
          if (kKnownHeaderVarintTags & tag_bit) {
1145
4.72k
            Fail(state, BRUNSLI_INVALID_BRN);
1146
4.72k
          }
1147
4.84k
          hs.stage = HeaderState::ITEM_ENTER_SECTION;
1148
4.84k
          break;
1149
4.84k
        }
1150
61.9k
        hs.stage = HeaderState::ITEM_READ_VALUE;
1151
61.9k
        break;
1152
66.8k
      }
1153
1154
4.84k
      case HeaderState::ITEM_ENTER_SECTION: {
1155
4.84k
        BrunsliStatus status = DecodeBase128(state, &hs.remaining_skip_length);
1156
4.84k
        if (status != BRUNSLI_OK) return Fail(state, status);
1157
4.82k
        hs.stage = HeaderState::ITEM_SKIP_CONTENTS;
1158
4.82k
        break;
1159
4.84k
      }
1160
1161
4.82k
      case HeaderState::ITEM_SKIP_CONTENTS: {
1162
4.82k
        size_t bytes_skipped =
1163
4.82k
            SkipAvailableBytes(state, hs.remaining_skip_length);
1164
4.82k
        hs.remaining_skip_length -= bytes_skipped;
1165
4.82k
        if (hs.remaining_skip_length > 0) {
1166
120
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1167
120
        }
1168
4.70k
        hs.stage = HeaderState::ITEM_READ_TAG;
1169
4.70k
        break;
1170
4.82k
      }
1171
1172
61.9k
      case HeaderState::ITEM_READ_VALUE: {
1173
61.9k
        size_t value;
1174
61.9k
        BrunsliStatus status = DecodeBase128(state, &value);
1175
61.9k
        if (status != BRUNSLI_OK) return Fail(state, status);
1176
61.9k
        hs.varint_values[hs.section.tag] = value;
1177
61.9k
        hs.stage = HeaderState::ITEM_READ_TAG;
1178
61.9k
        break;
1179
61.9k
      }
1180
1181
16.9k
      case HeaderState::FINALE: {
1182
16.9k
        const bool has_version =
1183
16.9k
            hs.section.tags_met & (1u << kBrunsliHeaderVersionCompTag);
1184
16.9k
        if (!has_version) return Fail(state, BRUNSLI_INVALID_BRN);
1185
16.9k
        const size_t version_and_comp_count =
1186
16.9k
            hs.varint_values[kBrunsliHeaderVersionCompTag];
1187
1188
16.9k
        const size_t version = version_and_comp_count >> 2u;
1189
16.9k
        jpg->version = static_cast<int>(version);
1190
1191
16.9k
        if (version == 1) {  // fallback mode
1192
          // TODO(eustas): do we need this?
1193
376
          jpg->width = 0;
1194
376
          jpg->height = 0;
1195
376
          hs.stage = HeaderState::DONE;
1196
376
          break;
1197
376
        }
1198
1199
        // Wrong mode = fallback + something.
1200
16.5k
        if ((version & 1u) != 0) {
1201
16
          return Fail(state, BRUNSLI_INVALID_BRN);
1202
16
        }
1203
        // Unknown mode - only 3 bits are defined.
1204
16.5k
        if ((version & ~0x7u) != 0) {
1205
46
          return Fail(state, BRUNSLI_INVALID_BRN);
1206
46
        }
1207
1208
        // Otherwise regular brunsli.
1209
16.5k
        state->use_legacy_context_model = !(version & 2);
1210
1211
        // Do not allow "original_jpg" for regular Brunsli files.
1212
16.5k
        s.section.tags_met |= 1u << kBrunsliOriginalJpgTag;
1213
1214
16.5k
        const bool has_width =
1215
16.5k
            hs.section.tags_met & (1u << kBrunsliHeaderWidthTag);
1216
16.5k
        if (!has_width) return Fail(state, BRUNSLI_INVALID_BRN);
1217
16.5k
        const size_t width = hs.varint_values[kBrunsliHeaderWidthTag];
1218
16.5k
        const bool has_height =
1219
16.5k
            hs.section.tags_met & (1u << kBrunsliHeaderHeightTag);
1220
16.5k
        if (!has_height) return Fail(state, BRUNSLI_INVALID_BRN);
1221
16.5k
        const size_t height = hs.varint_values[kBrunsliHeaderHeightTag];
1222
1223
16.5k
        if (width == 0 || height == 0) return Fail(state, BRUNSLI_INVALID_BRN);
1224
16.5k
        if (width > kMaxDimPixels || height > kMaxDimPixels) {
1225
186
          return Fail(state, BRUNSLI_INVALID_BRN);
1226
186
        }
1227
16.3k
        jpg->width = static_cast<int>(width);
1228
16.3k
        jpg->height = static_cast<int>(height);
1229
1230
16.3k
        const size_t num_components = (version_and_comp_count & 3u) + 1u;
1231
16.3k
        jpg->components.resize(num_components);
1232
1233
16.3k
        const bool has_subsampling =
1234
16.3k
            hs.section.tags_met & (1u << kBrunsliHeaderSubsamplingTag);
1235
16.3k
        if (!has_subsampling) return Fail(state, BRUNSLI_INVALID_BRN);
1236
16.2k
        size_t subsampling_code =
1237
16.2k
            hs.varint_values[kBrunsliHeaderSubsamplingTag];
1238
1239
44.0k
        for (size_t i = 0; i < jpg->components.size(); ++i) {
1240
27.7k
          JPEGComponent* c = &jpg->components[i];
1241
27.7k
          c->v_samp_factor = (subsampling_code & 0xFu) + 1;
1242
27.7k
          subsampling_code >>= 4u;
1243
27.7k
          c->h_samp_factor = (subsampling_code & 0xFu) + 1;
1244
27.7k
          subsampling_code >>= 4u;
1245
27.7k
          if (c->v_samp_factor > kBrunsliMaxSampling) {
1246
1
            return Fail(state, BRUNSLI_INVALID_BRN);
1247
1
          }
1248
27.7k
          if (c->h_samp_factor > kBrunsliMaxSampling) {
1249
1
            return Fail(state, BRUNSLI_INVALID_BRN);
1250
1
          }
1251
27.7k
        }
1252
16.2k
        if (!UpdateSubsamplingDerivatives(jpg)) {
1253
1
          return Fail(state, BRUNSLI_INVALID_BRN);
1254
1
        }
1255
1256
16.2k
        PrepareMeta(jpg, state);
1257
1258
16.2k
        hs.stage = HeaderState::DONE;
1259
16.2k
        break;
1260
16.2k
      }
1261
1262
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
1263
207k
    }
1264
207k
  }
1265
1266
16.6k
  LeaveSection(&s.section);
1267
16.6k
  return (jpg->version == kFallbackVersion) ? Stage::FALLBACK : Stage::SECTION;
1268
17.3k
}
1269
1270
4.21k
static BrunsliStatus DecodeMetaDataSection(State* state, JPEGData* jpg) {
1271
4.21k
  InternalState& s = *state->internal;
1272
4.21k
  MetadataState& ms = s.metadata;
1273
1274
4.21k
  if (ms.decompression_stage == MetadataDecompressionStage::DONE) {
1275
0
    return BRUNSLI_INVALID_BRN;
1276
0
  }
1277
1278
4.21k
  if (ms.decompression_stage == MetadataDecompressionStage::INITIAL) {
1279
4.21k
    if (IsAtSectionBoundary(state)) {
1280
4
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1281
4
      return BRUNSLI_OK;
1282
4
    }
1283
4.21k
    if (RemainingSectionLength(state) == 1) {
1284
47
      if (!CheckCanReadByte(state)) {
1285
1
        return BRUNSLI_NOT_ENOUGH_DATA;
1286
1
      }
1287
46
      uint8_t data[1];
1288
46
      data[0] = ReadByte(state);
1289
46
      bool ok = ProcessMetaData(data, 1, &ms, jpg) && ms.CanFinish();
1290
46
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1291
46
      return ok ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1292
47
    }
1293
4.16k
    ms.decompression_stage =
1294
4.16k
        MetadataDecompressionStage::READ_LENGTH;
1295
4.16k
  }
1296
1297
4.16k
  if (ms.decompression_stage == MetadataDecompressionStage::READ_LENGTH) {
1298
4.16k
    BrunsliStatus status = DecodeBase128(state, &ms.metadata_size);
1299
4.16k
    if (status != BRUNSLI_OK) return status;
1300
    // TODO(eustas): ms.metadata_size should be limited to avoid "zip-bombs".
1301
4.07k
    if (IsOutOfSectionBounds(state)) return BRUNSLI_INVALID_BRN;
1302
4.07k
    if (RemainingSectionLength(state) == 0) return BRUNSLI_INVALID_BRN;
1303
4.07k
    ms.brotli = BrotliDecoderCreateInstance(nullptr, nullptr, nullptr);
1304
4.07k
    if (ms.brotli == nullptr) return BRUNSLI_DECOMPRESSION_ERROR;
1305
4.07k
    ms.decompression_stage = MetadataDecompressionStage::DECOMPRESSING;
1306
4.07k
  }
1307
1308
4.07k
  if (ms.decompression_stage == MetadataDecompressionStage::DECOMPRESSING) {
1309
    // Free Brotli decoder and return result
1310
4.07k
    const auto finish_decompression = [&ms] (BrunsliStatus result) {
1311
2.49k
      BRUNSLI_DCHECK(ms.brotli != nullptr);
1312
2.49k
      BrotliDecoderDestroyInstance(ms.brotli);
1313
2.49k
      ms.brotli = nullptr;
1314
2.49k
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1315
2.49k
      return result;
1316
2.49k
    };
1317
1318
223k
    while (true) {
1319
223k
      size_t available_bytes =
1320
223k
          std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1321
223k
      size_t available_in = available_bytes;
1322
223k
      const uint8_t* next_in = state->data + state->pos;
1323
223k
      size_t available_out = 0;
1324
223k
      BrotliDecoderResult result = BrotliDecoderDecompressStream(
1325
223k
          ms.brotli, &available_in, &next_in, &available_out, nullptr, nullptr);
1326
223k
      if (result == BROTLI_DECODER_RESULT_ERROR) {
1327
1.05k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1328
1.05k
      }
1329
222k
      size_t chunk_size = 0;
1330
222k
      const uint8_t* chunk_data =
1331
222k
          BrotliDecoderTakeOutput(ms.brotli, &chunk_size);
1332
222k
      ms.decompressed_size += chunk_size;
1333
222k
      if (ms.decompressed_size > ms.metadata_size) {
1334
1.08k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1335
1.08k
      }
1336
221k
      size_t consumed_bytes = available_bytes - available_in;
1337
221k
      SkipBytes(state, consumed_bytes);
1338
221k
      bool chunk_ok = ProcessMetaData(chunk_data, chunk_size, &ms, jpg);
1339
221k
      if (!chunk_ok) return finish_decompression(BRUNSLI_INVALID_BRN);
1340
220k
      if (result == BROTLI_DECODER_RESULT_SUCCESS) {
1341
184
        if (RemainingSectionLength(state) != 0) {
1342
116
          return finish_decompression(BRUNSLI_INVALID_BRN);
1343
116
        }
1344
68
        if (ms.decompressed_size != ms.metadata_size) {
1345
64
          return finish_decompression(BRUNSLI_INVALID_BRN);
1346
64
        }
1347
4
        if (!ms.CanFinish()) return finish_decompression(BRUNSLI_INVALID_BRN);
1348
3
        return finish_decompression(BRUNSLI_OK);
1349
4
      }
1350
220k
      if (result == BROTLI_DECODER_RESULT_NEEDS_MORE_OUTPUT) continue;
1351
1.58k
      BRUNSLI_DCHECK(result == BROTLI_DECODER_RESULT_NEEDS_MORE_INPUT);
1352
1.58k
      if (RemainingSectionLength(state) == 0) {
1353
11
        return finish_decompression(BRUNSLI_INVALID_BRN);
1354
11
      }
1355
1.57k
      return BRUNSLI_NOT_ENOUGH_DATA;
1356
1.58k
    }
1357
4.07k
  }
1358
1359
  // Unreachable.
1360
0
  BRUNSLI_DCHECK(false);
1361
0
  return BRUNSLI_DECOMPRESSION_ERROR;
1362
4.07k
}
1363
1364
/**
1365
 * Wraps result, depending on the state of input.
1366
 *
1367
 * If parser needs more data, but section data is depleted,
1368
 * then input is corrupted.
1369
 */
1370
27.5k
static BrunsliStatus CheckBoundary(State* state, BrunsliStatus result) {
1371
27.5k
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
1372
3.42k
    bool last = (RemainingSectionLength(state) <= GetBytesAvailable(state));
1373
3.42k
    return last ? BRUNSLI_INVALID_BRN : BRUNSLI_NOT_ENOUGH_DATA;
1374
24.0k
  } else {
1375
24.0k
    return result;
1376
24.0k
  }
1377
27.5k
}
1378
1379
27.3k
static void PrepareBitReader(BrunsliBitReader* br, State* state) {
1380
27.3k
  size_t chunk_len =
1381
27.3k
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1382
27.3k
  BrunsliBitReaderResume(br, state->data + state->pos, chunk_len);
1383
27.3k
  BRUNSLI_DCHECK(BrunsliBitReaderIsHealthy(br));
1384
27.3k
}
1385
1386
/**
1387
 * Marks data used by bit-reader as consumed.
1388
 */
1389
static BrunsliStatus SuspendBitReader(BrunsliBitReader* br, State* state,
1390
27.3k
                                      BrunsliStatus result) {
1391
27.3k
  size_t chunk_len =
1392
27.3k
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1393
27.3k
  size_t unused_bytes = BrunsliBitReaderSuspend(br);
1394
27.3k
  size_t consumed_bytes = chunk_len - unused_bytes;
1395
27.3k
  SkipBytes(state, consumed_bytes);
1396
27.3k
  result = CheckBoundary(state, result);
1397
  // Once BitReader becomes unhealthy, further decoding should be impossible.
1398
27.3k
  BRUNSLI_DCHECK(
1399
27.3k
      BrunsliBitReaderIsHealthy(br) ||
1400
27.3k
      ((result != BRUNSLI_OK) && (result != BRUNSLI_NOT_ENOUGH_DATA)));
1401
27.3k
  return result;
1402
27.3k
}
1403
1404
11.8k
static BrunsliStatus DecodeJPEGInternalsSection(State* state, JPEGData* jpg) {
1405
11.8k
  InternalState& s = *state->internal;
1406
11.8k
  JpegInternalsState& js = s.internals;
1407
11.8k
  BrunsliBitReader* br = &js.br;
1408
1409
11.8k
  if (js.stage == JpegInternalsState::INIT) {
1410
11.8k
    BrunsliBitReaderInit(br);
1411
11.8k
    js.stage = JpegInternalsState::READ_MARKERS;
1412
11.8k
  }
1413
11.8k
  PrepareBitReader(br, state);
1414
1415
11.8k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1416
11.8k
    return SuspendBitReader(br, state, result);
1417
11.8k
  };
1418
1419
11.8k
  if (js.stage == JpegInternalsState::READ_MARKERS) {
1420
5.13M
    while (true) {
1421
5.13M
      if (!BrunsliBitReaderCanRead(br, 6)) {
1422
199
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1423
199
      }
1424
5.13M
      uint8_t marker = 0xc0 + BrunsliBitReaderRead(br, 6);
1425
5.13M
      jpg->marker_order.push_back(marker);
1426
5.13M
      if (marker == 0xc4) ++js.dht_count;
1427
5.13M
      if (marker == 0xdd) js.have_dri = true;
1428
5.13M
      if (marker == 0xda) ++js.num_scans;
1429
5.13M
      if (marker == 0xd9) break;
1430
5.13M
    }
1431
11.6k
    js.stage = JpegInternalsState::READ_DRI;
1432
11.6k
  }
1433
1434
11.6k
  if (js.stage == JpegInternalsState::READ_DRI) {
1435
11.6k
    if (js.have_dri) {
1436
1.57k
      if (!BrunsliBitReaderCanRead(br, 16)) {
1437
136
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1438
136
      }
1439
1.43k
      jpg->restart_interval = BrunsliBitReaderRead(br, 16);
1440
1.43k
    }
1441
11.5k
    js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
1442
11.5k
  }
1443
1444
11.5k
  if (js.stage & JpegInternalsState::DECODE_HUFFMAN_MASK) {
1445
11.5k
    BrunsliStatus status = DecodeHuffmanCode(state, jpg);
1446
11.5k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1447
11.1k
    js.stage = JpegInternalsState::PREPARE_READ_SCANS;
1448
11.1k
  }
1449
1450
11.1k
  if (js.stage == JpegInternalsState::PREPARE_READ_SCANS) {
1451
11.1k
    if (js.dht_count != js.terminal_huffman_code_count) {
1452
162
      BRUNSLI_LOG_ERROR() << "Invalid number of DHT markers" << BRUNSLI_ENDL();
1453
162
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1454
162
    }
1455
11.0k
    if (js.num_scans > 0) {
1456
5.13k
      jpg->scan_info.resize(js.num_scans);
1457
5.13k
      js.i = 0;
1458
5.13k
      js.stage = JpegInternalsState::READ_SCAN_COMMON;
1459
5.88k
    } else {
1460
5.88k
      js.stage = JpegInternalsState::READ_NUM_QUANT;
1461
5.88k
    }
1462
11.0k
  }
1463
1464
11.0k
  if (js.stage & JpegInternalsState::DECODE_SCAN_MASK) {
1465
5.13k
    BrunsliStatus status = DecodeScanInfo(state, jpg);
1466
5.13k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1467
4.81k
    js.stage = JpegInternalsState::READ_NUM_QUANT;
1468
4.81k
  }
1469
1470
10.6k
  if (js.stage == JpegInternalsState::READ_NUM_QUANT) {
1471
10.6k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1472
174
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1473
174
    }
1474
10.5k
    int num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1475
10.5k
    jpg->quant.resize(num_quant_tables);
1476
10.5k
    js.i = 0;
1477
10.5k
    js.stage = JpegInternalsState::READ_QUANT;
1478
10.5k
  }
1479
1480
20.9k
  while (js.stage == JpegInternalsState::READ_QUANT) {
1481
20.9k
    if (js.i >= jpg->quant.size()) {
1482
10.2k
      js.stage = JpegInternalsState::READ_COMP_ID_SCHEME;
1483
10.2k
      break;
1484
10.2k
    }
1485
    // 6 or 7 bits are used, but we know that at least one more bit is
1486
    // guaranteed to be used by varint out of the loop.
1487
10.7k
    if (!BrunsliBitReaderCanRead(br, 7)) {
1488
164
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1489
164
    }
1490
10.5k
    JPEGQuantTable* q = &jpg->quant[js.i];
1491
10.5k
    q->index = BrunsliBitReaderRead(br, 2);
1492
10.5k
    q->is_last = (js.i == jpg->quant.size() - 1) || BrunsliBitReaderRead(br, 1);
1493
10.5k
    q->precision = BrunsliBitReaderRead(br, 4);
1494
10.5k
    if (q->precision > 1) {
1495
130
      BRUNSLI_LOG_ERROR() << "Invalid quantization table precision: "
1496
130
                          << q->precision << BRUNSLI_ENDL();
1497
130
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1498
130
    }
1499
    // note that q->values[] are initialized to invalid 0 values.
1500
10.4k
    ++js.i;
1501
10.4k
  }
1502
1503
10.2k
  if (js.stage == JpegInternalsState::READ_COMP_ID_SCHEME) {
1504
10.2k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1505
138
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1506
138
    }
1507
10.0k
    int comp_ids = BrunsliBitReaderRead(br, 2);
1508
10.0k
    static const size_t kMinRequiredComponents[4] = {
1509
10.0k
        3 /* Ids123*/, 1 /* IdsGray */, 3 /* IdsRGB */, 0 /* IdsCustom */
1510
10.0k
    };
1511
10.0k
    if (jpg->components.size() < kMinRequiredComponents[comp_ids]) {
1512
1
      BRUNSLI_LOG_ERROR() << "Insufficient number of components for ColorId #"
1513
1
                          << comp_ids << BRUNSLI_ENDL();
1514
1
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1515
1
    }
1516
10.0k
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1517
10.0k
    if (comp_ids == kComponentIds123) {
1518
526
      jpg->components[0].id = 1;
1519
526
      jpg->components[1].id = 2;
1520
526
      jpg->components[2].id = 3;
1521
9.56k
    } else if (comp_ids == kComponentIdsGray) {
1522
9.16k
      jpg->components[0].id = 1;
1523
9.16k
    } else if (comp_ids == kComponentIdsRGB) {
1524
23
      jpg->components[0].id = 'R';
1525
23
      jpg->components[1].id = 'G';
1526
23
      jpg->components[2].id = 'B';
1527
382
    } else {
1528
382
      BRUNSLI_DCHECK(comp_ids == kComponentIdsCustom);
1529
382
      js.i = 0;
1530
382
      js.stage = JpegInternalsState::READ_COMP_ID;
1531
382
    }
1532
10.0k
  }
1533
1534
10.0k
  if (js.stage == JpegInternalsState::READ_COMP_ID) {
1535
749
    while (js.i < jpg->components.size()) {
1536
397
      if (!BrunsliBitReaderCanRead(br, 8)) {
1537
30
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1538
30
      }
1539
367
      jpg->components[js.i].id = BrunsliBitReaderRead(br, 8);
1540
367
      ++js.i;
1541
367
    }
1542
352
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1543
352
  }
1544
1545
10.0k
  if (js.stage == JpegInternalsState::READ_NUM_PADDING_BITS) {
1546
    // TODO(eustas): sanitize: should not be bigger than
1547
    //               7 x (num_scans + num_blocks / dri)
1548
    // security: limit is 32b for n_size
1549
10.0k
    if (!DecodeLimitedVarint<8>(&js.varint, br, 4)) {
1550
92
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1551
92
    }
1552
9.97k
    js.num_padding_bits = js.varint.value;
1553
9.97k
    jpg->has_zero_padding_bit = (js.num_padding_bits > 0);
1554
9.97k
    if (js.num_padding_bits > PaddingBitsLimit(*jpg)) {
1555
42
      BRUNSLI_LOG_ERROR() << "Suspicious number of padding bits "
1556
42
                          << js.num_padding_bits << BRUNSLI_ENDL();
1557
42
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1558
42
    }
1559
9.92k
    js.i = 0;
1560
9.92k
    js.stage = JpegInternalsState::READ_PADDING_BITS;
1561
9.92k
  }
1562
1563
9.92k
  if (js.stage == JpegInternalsState::READ_PADDING_BITS) {
1564
68.1k
    while (js.i < js.num_padding_bits) {
1565
58.2k
      if (!BrunsliBitReaderCanRead(br, 1)) {
1566
22
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1567
22
      }
1568
58.2k
      jpg->padding_bits.emplace_back(BrunsliBitReaderRead(br, 1));
1569
58.2k
      ++js.i;
1570
58.2k
    }
1571
9.90k
    suspend_bit_reader(BRUNSLI_OK);
1572
9.90k
    BrunsliBitReaderFinish(br);
1573
9.90k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1574
9.89k
    js.i = 0;
1575
9.89k
    js.stage = JpegInternalsState::ITERATE_MARKERS;
1576
9.89k
  } else {
1577
    // no-op
1578
0
    suspend_bit_reader(BRUNSLI_OK);
1579
0
  }
1580
1581
4.69M
  while (true) {
1582
4.69M
    switch (js.stage) {
1583
4.59M
      case JpegInternalsState::ITERATE_MARKERS: {
1584
4.59M
        if (js.i >= jpg->marker_order.size()) {
1585
9.55k
          js.stage = JpegInternalsState::DONE;
1586
4.58M
        } else if (jpg->marker_order[js.i] == 0xFF) {
1587
45.6k
          js.stage = JpegInternalsState::READ_INTERMARKER_LENGTH;
1588
4.53M
        } else {
1589
4.53M
          ++js.i;
1590
4.53M
        }
1591
4.59M
        continue;
1592
0
      }
1593
1594
45.6k
      case JpegInternalsState::READ_INTERMARKER_LENGTH: {
1595
45.6k
        BrunsliStatus status = DecodeBase128(state, &js.intermarker_length);
1596
45.6k
        if (status != BRUNSLI_OK) return CheckBoundary(state, status);
1597
45.5k
        if (js.intermarker_length > RemainingSectionLength(state)) {
1598
79
          return BRUNSLI_INVALID_BRN;
1599
79
        }
1600
45.4k
        jpg->inter_marker_data.emplace_back();
1601
45.4k
        js.stage = JpegInternalsState::READ_INTERMARKER_DATA;
1602
45.4k
        continue;
1603
45.5k
      }
1604
1605
45.4k
      case JpegInternalsState::READ_INTERMARKER_DATA: {
1606
45.4k
        auto& dest = jpg->inter_marker_data.back();
1607
45.4k
        size_t piece_limit = js.intermarker_length - dest.size();
1608
45.4k
        size_t piece_size = std::min(piece_limit, GetBytesAvailable(state));
1609
45.4k
        Append(&dest, state->data + state->pos, piece_size);
1610
45.4k
        SkipBytes(state, piece_size);
1611
45.4k
        if (dest.size() < js.intermarker_length) {
1612
110
          BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
1613
110
          BRUNSLI_DCHECK(RemainingSectionLength(state) > 0);
1614
110
          return BRUNSLI_NOT_ENOUGH_DATA;
1615
110
        }
1616
45.3k
        ++js.i;
1617
45.3k
        js.stage = JpegInternalsState::ITERATE_MARKERS;
1618
45.3k
        continue;
1619
45.4k
      }
1620
1621
9.55k
      default: { /* no-op */ }
1622
4.69M
    }
1623
9.55k
    break;  // no matching stage has been found; exit the loop.
1624
4.69M
  }
1625
1626
9.55k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1627
1628
9.37k
  return BRUNSLI_OK;
1629
9.55k
}
1630
1631
7.85k
static BrunsliStatus DecodeQuantDataSection(State* state, JPEGData* jpg) {
1632
7.85k
  InternalState& s = *state->internal;
1633
7.85k
  QuantDataState& qs = s.quant;
1634
7.85k
  BrunsliBitReader* br = &qs.br;
1635
1636
7.85k
  if (qs.stage == QuantDataState::INIT) {
1637
7.85k
    BrunsliBitReaderInit(br);
1638
7.85k
    qs.stage = QuantDataState::READ_NUM_QUANT;
1639
7.85k
  }
1640
7.85k
  PrepareBitReader(br, state);
1641
1642
7.85k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1643
7.85k
    return SuspendBitReader(br, state, result);
1644
7.85k
  };
1645
1646
7.85k
  if (qs.stage == QuantDataState::READ_NUM_QUANT) {
1647
7.85k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1648
147
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1649
147
    }
1650
7.70k
    size_t num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1651
7.70k
    if (jpg->quant.size() != num_quant_tables) {
1652
141
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1653
141
    }
1654
7.56k
    qs.predictor.resize(kDCTBlockSize);
1655
7.56k
    qs.i = 0;
1656
7.56k
    qs.stage = QuantDataState::READ_STOCK;
1657
7.56k
  }
1658
1659
69.0k
  while (true) {
1660
69.0k
    switch (qs.stage) {
1661
14.2k
      case QuantDataState::READ_STOCK: {
1662
14.2k
        if (qs.i >= jpg->quant.size()) {
1663
6.48k
          std::vector<uint8_t>().swap(qs.predictor);
1664
6.48k
          qs.i = 0;
1665
6.48k
          qs.stage = QuantDataState::READ_QUANT_IDX;
1666
6.48k
          continue;
1667
6.48k
        }
1668
        // Depending on еру 1-st bit, it is guaranteed that we will need to read
1669
        // at least 3 or 6 more bits.
1670
7.74k
        if (!BrunsliBitReaderCanRead(br, 4)) {
1671
140
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1672
140
        }
1673
7.60k
        qs.data_precision = 0;
1674
7.60k
        bool is_short = !BrunsliBitReaderRead(br, 1);
1675
7.60k
        if (is_short) {
1676
6.54k
          const size_t short_code = BrunsliBitReaderRead(br, 3);
1677
6.54k
          int32_t* table = jpg->quant[qs.i].values.data();
1678
6.54k
          size_t selector = (qs.i > 0) ? 1 : 0;
1679
425k
          for (size_t k = 0; k < kDCTBlockSize; ++k) {
1680
419k
            table[k] = kStockQuantizationTables[selector][short_code][k];
1681
419k
          }
1682
6.54k
          qs.stage = QuantDataState::UPDATE;
1683
6.54k
        } else {
1684
1.05k
          qs.stage = QuantDataState::READ_Q_FACTOR;
1685
1.05k
        }
1686
7.60k
        continue;
1687
7.74k
      }
1688
1689
1.05k
      case QuantDataState::READ_Q_FACTOR: {
1690
1.05k
        if (!BrunsliBitReaderCanRead(br, 6)) {
1691
156
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1692
156
        }
1693
897
        const uint32_t q_factor = BrunsliBitReaderRead(br, 6);
1694
897
        FillQuantMatrix(qs.i > 0, q_factor, qs.predictor.data());
1695
897
        qs.j = 0;
1696
897
        qs.delta = 0;
1697
897
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1698
897
        continue;
1699
1.05k
      }
1700
1701
17.8k
      case QuantDataState::READ_DIFF_IS_ZERO: {
1702
17.8k
        if (qs.j >= kDCTBlockSize) {
1703
222
          qs.stage = QuantDataState::UPDATE;
1704
222
          continue;
1705
222
        }
1706
17.5k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1707
189
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1708
189
        }
1709
17.3k
        if (BrunsliBitReaderRead(br, 1)) {
1710
2.87k
          qs.stage = QuantDataState::READ_DIFF_SIGN;
1711
14.5k
        } else {
1712
14.5k
          qs.stage = QuantDataState::APPLY_DIFF;
1713
14.5k
        }
1714
17.3k
        continue;
1715
17.5k
      }
1716
1717
2.87k
      case QuantDataState::READ_DIFF_SIGN: {
1718
2.87k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1719
158
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1720
158
        }
1721
2.71k
        qs.sign = BrunsliBitReaderRead(br, 1) ? -1 : 1;
1722
2.71k
        qs.stage = QuantDataState::READ_DIFF;
1723
2.71k
        continue;
1724
2.87k
      }
1725
1726
2.71k
      case QuantDataState::READ_DIFF: {
1727
2.71k
        if (!DecodeVarint(&qs.vs, br, 16)) {
1728
137
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1729
137
        }
1730
2.58k
        int diff = static_cast<int>(qs.vs.value) + 1;
1731
2.58k
        qs.delta += qs.sign * diff;
1732
2.58k
        qs.stage = QuantDataState::APPLY_DIFF;
1733
2.58k
        continue;
1734
2.71k
      }
1735
1736
17.1k
      case QuantDataState::APPLY_DIFF: {
1737
17.1k
        const int k = kJPEGNaturalOrder[qs.j];
1738
17.1k
        const int quant_value = qs.predictor[k] + qs.delta;
1739
17.1k
        jpg->quant[qs.i].values[k] = quant_value;
1740
17.1k
        if (quant_value <= 0) {
1741
98
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1742
98
        }
1743
17.0k
        if (quant_value >= 256) {
1744
10.4k
          qs.data_precision = 1;
1745
10.4k
        }
1746
17.0k
        if (quant_value >= 65536) {
1747
93
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1748
93
        }
1749
16.9k
        ++qs.j;
1750
16.9k
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1751
16.9k
        continue;
1752
17.0k
      }
1753
1754
6.77k
      case QuantDataState::UPDATE: {
1755
6.77k
        if (jpg->quant[qs.i].precision < qs.data_precision) {
1756
108
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1757
108
        }
1758
        // jpg->quant[qs.i].precision > qs.data_precision means that original
1759
        // JPEG1 was inefficiently encoded.
1760
6.66k
        ++qs.i;
1761
6.66k
        qs.stage = QuantDataState::READ_STOCK;
1762
6.66k
        continue;
1763
6.77k
      }
1764
1765
6.48k
      default: { /* no-op */ }
1766
69.0k
    }
1767
6.48k
    break;  // no matching stage has been found; exit the loop.
1768
69.0k
  }
1769
1770
19.7k
  while (qs.stage == QuantDataState::READ_QUANT_IDX) {
1771
13.5k
    if (qs.i >= jpg->components.size()) {
1772
6.22k
      qs.stage = QuantDataState::FINISH;
1773
6.22k
      continue;
1774
6.22k
    }
1775
7.28k
    JPEGComponent* c = &jpg->components[qs.i];
1776
7.28k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1777
155
       return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1778
155
    }
1779
7.12k
    c->quant_idx = BrunsliBitReaderRead(br, 2);
1780
7.12k
    if (c->quant_idx >= jpg->quant.size()) {
1781
104
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1782
104
    }
1783
7.02k
    ++qs.i;
1784
7.02k
  }
1785
1786
6.22k
  BRUNSLI_DCHECK(qs.stage == QuantDataState::FINISH);
1787
6.22k
  suspend_bit_reader(BRUNSLI_OK);
1788
6.22k
  BrunsliBitReaderFinish(br);
1789
6.22k
  if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1790
6.22k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1791
6.09k
  return BRUNSLI_OK;
1792
6.22k
}
1793
1794
7.61k
static BrunsliStatus DecodeHistogramDataSection(State* state, JPEGData* jpg) {
1795
7.61k
  InternalState& s = *state->internal;
1796
7.61k
  HistogramDataState& hs = s.histogram;
1797
7.61k
  BrunsliBitReader* br = &hs.br;
1798
1799
7.61k
  if (hs.stage == HistogramDataState::INIT) {
1800
7.61k
    BrunsliBitReaderInit(br);
1801
7.61k
    BRUNSLI_DCHECK(!jpg->components.empty());
1802
7.61k
    s.num_contexts = jpg->components.size();
1803
7.61k
    hs.stage = HistogramDataState::READ_SCHEME;
1804
    /* Optimization: hint arena about maximal used alphabet size: 272.
1805
     * 648 = 272 + 376, where 376 is a "universal" overhead for max-15-bit
1806
     * root-8-bit 2-level Huffman tables. */
1807
7.61k
    hs.arena.reserve(648);
1808
7.61k
  }
1809
7.61k
  PrepareBitReader(br, state);
1810
7.61k
  if (RemainingSectionLength(state) <= GetBytesAvailable(state)) {
1811
    // If end of section is reachable, then we could parse the remainings in
1812
    // non-streaming mode.
1813
6.79k
    BrunsliBitReaderSetOptimistic(br);
1814
6.79k
  }
1815
7.61k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1816
7.61k
    return SuspendBitReader(br, state, result);
1817
7.61k
  };
1818
1819
7.61k
  if (hs.stage == HistogramDataState::READ_SCHEME) {
1820
7.61k
    const size_t num_components = jpg->components.size();
1821
7.61k
    BRUNSLI_DCHECK(num_components <= 4);
1822
7.61k
    if (!BrunsliBitReaderCanRead(br, 3 * num_components)) {
1823
141
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1824
141
    }
1825
15.9k
    for (size_t i = 0; i < num_components; ++i) {
1826
8.57k
      size_t scheme = BrunsliBitReaderRead(br, 3);
1827
8.57k
      if (scheme >= kNumSchemes) return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1828
8.48k
      ComponentMeta& m = state->meta[i];
1829
8.48k
      m.context_bits = scheme;
1830
8.48k
      m.context_offset = s.num_contexts;
1831
8.48k
      s.num_contexts += kNumNonzeroContextSkip[scheme];
1832
8.48k
    }
1833
7.37k
    if (!BrunsliBitReaderIsHealthy(br)) {
1834
11
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1835
11
    }
1836
7.36k
    hs.stage = HistogramDataState::READ_NUM_HISTOGRAMS;
1837
7.36k
  }
1838
1839
7.36k
  if (hs.stage == HistogramDataState::READ_NUM_HISTOGRAMS) {
1840
7.36k
    if (!BrunsliBitReaderCanRead(br, 11)) {
1841
5
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1842
5
    }
1843
7.36k
    s.num_histograms = DecodeVarLenUint8(br) + 1;
1844
7.36k
    if (!BrunsliBitReaderIsHealthy(br)) {
1845
17
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1846
17
    }
1847
7.34k
    if (s.shallow_histograms) {
1848
0
      hs.stage = HistogramDataState::SKIP_CONTENT;
1849
7.34k
    } else {
1850
7.34k
      s.context_map_.resize(s.num_contexts * kNumAvrgContexts);
1851
7.34k
      state->context_map = s.context_map_.data();
1852
7.34k
      s.entropy_codes_.resize(s.num_histograms);
1853
7.34k
      state->entropy_codes = s.entropy_codes_.data();
1854
7.34k
      if (s.num_histograms > 1) {
1855
1.27k
        hs.stage = HistogramDataState::READ_CONTEXT_MAP_CODE;
1856
6.06k
      } else {
1857
6.06k
        hs.i = 0;
1858
6.06k
        hs.counts.resize(kCoeffAlphabetSize);
1859
6.06k
        hs.stage = HistogramDataState::READ_HISTOGRAMS;
1860
6.06k
      }
1861
7.34k
    }
1862
7.34k
  }
1863
1864
7.34k
  if (hs.stage == HistogramDataState::SKIP_CONTENT) {
1865
0
    suspend_bit_reader(BRUNSLI_OK);
1866
0
    if (!BrunsliBitReaderIsHealthy(br)) {
1867
0
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1868
0
    }
1869
0
    SkipAvailableBytes(state, RemainingSectionLength(state));
1870
0
    if (!IsAtSectionBoundary(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1871
0
    hs.stage = HistogramDataState::DONE;
1872
0
  }
1873
1874
7.34k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP_CODE) {
1875
1.27k
    if (!BrunsliBitReaderCanRead(br, 207 + s.num_histograms * 8)) {
1876
96
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1877
96
    }
1878
1.18k
    hs.max_run_length_prefix = 0;
1879
1.18k
    bool use_rle_for_zeros = !!BrunsliBitReaderRead(br, 1);
1880
1.18k
    if (use_rle_for_zeros) {
1881
367
      hs.max_run_length_prefix = BrunsliBitReaderRead(br, 4) + 1;
1882
367
    }
1883
1.18k
    size_t alphabet_size = s.num_histograms + hs.max_run_length_prefix;
1884
1.18k
    hs.entropy.reset(new HuffmanDecodingData);
1885
1.18k
    if (!hs.entropy->ReadFromBitStream(alphabet_size, br, &hs.arena)) {
1886
330
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1887
330
    }
1888
852
    hs.i = 0;
1889
852
    hs.stage = HistogramDataState::READ_CONTEXT_MAP;
1890
852
  }
1891
1892
6.92k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP) {
1893
852
    BrunsliStatus status = DecodeContextMap(
1894
852
        *hs.entropy, hs.max_run_length_prefix, &hs.i, &s.context_map_, br);
1895
852
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1896
519
    hs.i = 0;
1897
519
    hs.counts.resize(kCoeffAlphabetSize);
1898
519
    hs.stage = HistogramDataState::READ_HISTOGRAMS;
1899
519
  }
1900
1901
6.58k
  if (hs.stage == HistogramDataState::READ_HISTOGRAMS) {
1902
17.8k
    while (hs.i < s.num_histograms) {
1903
11.7k
      if (!BrunsliBitReaderCanRead(br, 9 + kCoeffAlphabetSize * 11)) {
1904
178
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1905
178
      }
1906
11.5k
      if (!ReadHistogram(BRUNSLI_ANS_LOG_TAB_SIZE, &hs.counts, br)) {
1907
246
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1908
246
      }
1909
11.2k
      if (!s.entropy_codes_[hs.i].Init(hs.counts)) {
1910
0
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1911
0
      }
1912
11.2k
      ++hs.i;
1913
11.2k
    }
1914
6.16k
    hs.entropy.reset();
1915
6.16k
    std::vector<uint32_t>().swap(hs.counts);
1916
6.16k
    suspend_bit_reader(BRUNSLI_OK);
1917
6.16k
    BrunsliBitReaderFinish(br);
1918
6.16k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1919
6.14k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1920
6.09k
    hs.stage = HistogramDataState::DONE;
1921
6.09k
  }
1922
1923
6.09k
  hs.arena.reset();
1924
6.09k
  BRUNSLI_DCHECK(hs.stage == HistogramDataState::DONE);
1925
6.09k
  return BRUNSLI_OK;
1926
6.58k
}
1927
1928
6.07k
static BrunsliStatus DecodeDCDataSection(State* state) {
1929
6.07k
  size_t available = GetBytesAvailable(state) & ~1;
1930
6.07k
  size_t limit = RemainingSectionLength(state);
1931
6.07k
  BRUNSLI_DCHECK((limit & 1) == 0);
1932
6.07k
  size_t chunk_len = std::min(available, limit);
1933
  // If end of section is reachable, then we could parse the remainings in
1934
  // non-streaming mode.
1935
6.07k
  bool is_last_chunk = (chunk_len == limit);
1936
6.07k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1937
1938
6.07k
  BrunsliStatus status = DecodeDC(state, &in);
1939
1940
6.07k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1941
6.07k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1942
5.79k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1943
5.79k
  SkipBytes(state, in.pos_);
1944
5.79k
  if (is_last_chunk) {
1945
5.49k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1946
5.49k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1947
5.49k
  }
1948
5.78k
  return status;
1949
5.79k
}
1950
1951
5.47k
static BrunsliStatus DecodeACDataSection(State* state) {
1952
5.47k
  size_t available = GetBytesAvailable(state) & ~1;
1953
5.47k
  size_t limit = RemainingSectionLength(state);
1954
5.47k
  BRUNSLI_DCHECK((limit & 1) == 0);
1955
5.47k
  size_t chunk_len = std::min(available, limit);
1956
  // If end of section is reachable, then we could parse the remainings in
1957
  // non-streaming mode.
1958
5.47k
  bool is_last_chunk = (chunk_len == limit);
1959
5.47k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1960
1961
5.47k
  BrunsliStatus status = DecodeAC(state, &in);
1962
1963
5.47k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1964
5.47k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1965
4.85k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1966
4.85k
  SkipBytes(state, in.pos_);
1967
4.85k
  if (is_last_chunk) {
1968
4.64k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1969
4.64k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1970
4.64k
  }
1971
4.79k
  return status;
1972
4.85k
}
1973
1974
376
static Stage DecodeOriginalJpg(State* state, JPEGData* jpg) {
1975
376
  InternalState& s = *state->internal;
1976
376
  FallbackState& fs = s.fallback;
1977
1978
1.09k
  while (fs.stage != FallbackState::DONE) {
1979
1.04k
    switch (fs.stage) {
1980
376
      case FallbackState::READ_TAG: {
1981
376
        BrunsliStatus status = ReadTag(state, &s.section);
1982
376
        if (status != BRUNSLI_OK) return Fail(state, status);
1983
359
        if (s.section.tag != kBrunsliOriginalJpgTag || !s.section.is_section) {
1984
6
          return Fail(state, BRUNSLI_INVALID_BRN);
1985
6
        }
1986
353
        fs.stage = FallbackState::ENTER_SECTION;
1987
353
        break;
1988
359
      }
1989
1990
353
      case FallbackState::ENTER_SECTION: {
1991
353
        BrunsliStatus status = EnterSection(state, &s.section);
1992
353
        if (status != BRUNSLI_OK) return Fail(state, status);
1993
318
        jpg->original_jpg_size = s.section.remaining;
1994
        // Edge case - empty payload.
1995
318
        if (jpg->original_jpg_size == 0) {
1996
4
          jpg->original_jpg = nullptr;
1997
4
          fs.stage = FallbackState::DONE;
1998
4
          break;
1999
4
        }
2000
314
        fs.stage = FallbackState::READ_CONTENTS;
2001
314
        break;
2002
318
      }
2003
2004
314
      case FallbackState::READ_CONTENTS: {
2005
314
        size_t chunk_size = GetBytesAvailable(state);
2006
314
        if (chunk_size == 0) {
2007
          // TODO(eustas): dcheck s.section.remaining != 0
2008
79
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2009
79
        }
2010
        // Check if it is possible to avoid copy.
2011
235
        const uint8_t* src = state->data + state->pos;
2012
235
        if (fs.storage.empty()) {
2013
235
          if (chunk_size >= jpg->original_jpg_size) {
2014
46
            jpg->original_jpg = src;
2015
46
            SkipBytes(state, jpg->original_jpg_size);
2016
46
            fs.stage = FallbackState::DONE;
2017
46
            break;
2018
46
          }
2019
235
        }
2020
        // Otherwise, copy input.
2021
189
        size_t remaining = jpg->original_jpg_size - fs.storage.size();
2022
189
        size_t to_copy = std::min(chunk_size, remaining);
2023
189
        fs.storage.insert(fs.storage.cend(), src, src + to_copy);
2024
189
        SkipBytes(state, to_copy);
2025
189
        if (fs.storage.size() == jpg->original_jpg_size) {
2026
0
          jpg->original_jpg = fs.storage.data();
2027
0
          fs.stage = FallbackState::DONE;
2028
0
          break;
2029
0
        }
2030
        // TODO(eustas): dcheck GetBytesAvailable(state) == 0
2031
189
        return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2032
189
      }
2033
2034
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2035
1.04k
    }
2036
1.04k
  }
2037
2038
50
  LeaveSection(&s.section);
2039
50
  return Stage::DONE;
2040
376
}
2041
2042
43.4k
static Stage ParseSection(State* state) {
2043
43.4k
  InternalState& s = *state->internal;
2044
43.4k
  SectionHeaderState& sh = s.section_header;
2045
2046
43.4k
  Stage result = Stage::ERROR;
2047
2048
130k
  while (sh.stage != SectionHeaderState::DONE) {
2049
86.7k
    switch (sh.stage) {
2050
43.4k
      case SectionHeaderState::READ_TAG: {
2051
43.4k
        BrunsliStatus status = ReadTag(state, &s.section);
2052
43.4k
        if (status == BRUNSLI_NOT_ENOUGH_DATA) {
2053
91
          if (HasSection(state, kBrunsliACDataTag)) return Stage::DONE;
2054
91
        }
2055
43.4k
        if (status != BRUNSLI_OK) return Fail(state, status);
2056
43.3k
        if (s.section.is_section) {
2057
43.3k
          sh.stage = SectionHeaderState::ENTER_SECTION;
2058
43.3k
          continue;
2059
43.3k
        }
2060
28
        const uint32_t tag_bit = 1u << s.section.tag;
2061
28
        const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2062
28
        if (is_known_section_tag) return Fail(state, BRUNSLI_INVALID_BRN);
2063
27
        sh.stage = SectionHeaderState::READ_VALUE;
2064
27
        continue;
2065
28
      }
2066
2067
27
      case SectionHeaderState::READ_VALUE: {
2068
        // No known varint tags on top level.
2069
27
        size_t sink;
2070
27
        BrunsliStatus status = DecodeBase128(state, &sink);
2071
27
        if (status != BRUNSLI_OK) return Fail(state, status);
2072
21
        result = Stage::SECTION;
2073
21
        sh.stage = SectionHeaderState::DONE;
2074
21
        continue;
2075
27
      }
2076
2077
43.3k
      case SectionHeaderState::ENTER_SECTION: {
2078
43.3k
        BrunsliStatus status = EnterSection(state, &s.section);
2079
43.3k
        if (status != BRUNSLI_OK) return Fail(state, status);
2080
43.2k
        result = Stage::SECTION_BODY;
2081
43.2k
        sh.stage = SectionHeaderState::DONE;
2082
43.2k
        continue;
2083
43.3k
      }
2084
2085
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2086
86.7k
    }
2087
86.7k
  }
2088
2089
43.3k
  sh.stage = SectionHeaderState::READ_TAG;
2090
43.3k
  BRUNSLI_DCHECK(result != Stage::ERROR);
2091
43.3k
  return result;
2092
43.4k
}
2093
2094
43.2k
static Stage ProcessSection(State* state, JPEGData* jpg) {
2095
43.2k
  InternalState& s = *state->internal;
2096
2097
43.2k
  const int32_t tag_bit = 1u << s.section.tag;
2098
43.2k
  const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2099
2100
43.2k
  const bool skip_section =
2101
43.2k
      !is_known_section_tag || (state->skip_tags & tag_bit);
2102
2103
43.2k
  if (skip_section) {
2104
    // Skip section content.
2105
168
    size_t to_skip =
2106
168
        std::min(GetBytesAvailable(state), RemainingSectionLength(state));
2107
168
    state->pos += to_skip;
2108
168
    if (RemainingSectionLength(state) != 0) {
2109
124
      BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
2110
124
      return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2111
124
    }
2112
44
    return Stage::SECTION;
2113
168
  }
2114
2115
43.1k
  switch (s.section.tag) {
2116
4.21k
    case kBrunsliMetaDataTag: {
2117
4.21k
      BrunsliStatus status = DecodeMetaDataSection(state, jpg);
2118
4.21k
      if (status != BRUNSLI_OK) return Fail(state, status);
2119
35
      break;
2120
4.21k
    }
2121
2122
11.8k
    case kBrunsliJPEGInternalsTag: {
2123
11.8k
      BrunsliStatus status = DecodeJPEGInternalsSection(state, jpg);
2124
11.8k
      if (status != BRUNSLI_OK) return Fail(state, status);
2125
9.37k
      break;
2126
11.8k
    }
2127
2128
9.37k
    case kBrunsliQuantDataTag: {
2129
7.85k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2130
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2131
2
      }
2132
7.85k
      BrunsliStatus status = DecodeQuantDataSection(state, jpg);
2133
7.85k
      if (status != BRUNSLI_OK) return Fail(state, status);
2134
6.09k
      break;
2135
7.85k
    }
2136
2137
7.61k
    case kBrunsliHistogramDataTag: {
2138
7.61k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2139
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2140
1
      }
2141
7.61k
      BrunsliStatus status = DecodeHistogramDataSection(state, jpg);
2142
7.61k
      if (status != BRUNSLI_OK) return Fail(state, status);
2143
6.09k
      break;
2144
7.61k
    }
2145
2146
6.09k
    case kBrunsliDCDataTag: {
2147
6.08k
      if (!HasSection(state, kBrunsliHistogramDataTag)) {
2148
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2149
1
      }
2150
6.07k
      if (!HasSection(state, kBrunsliQuantDataTag)) {
2151
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2152
1
      }
2153
      // This section reads input word by word.
2154
6.07k
      if ((RemainingSectionLength(state) & 1) != 0) {
2155
6
        return Fail(state, BRUNSLI_INVALID_BRN);
2156
6
      }
2157
6.07k
      internal::dec::WarmupMeta(jpg, state);
2158
6.07k
      BrunsliStatus status = DecodeDCDataSection(state);
2159
6.07k
      if (status != BRUNSLI_OK) return Fail(state, status);
2160
5.54k
      break;
2161
6.07k
    }
2162
2163
5.54k
    case kBrunsliACDataTag: {
2164
5.47k
      if (!HasSection(state, kBrunsliDCDataTag)) {
2165
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2166
1
      }
2167
      // This section reads input word by word.
2168
5.47k
      if ((RemainingSectionLength(state) & 1) != 0) {
2169
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2170
1
      }
2171
5.47k
      internal::dec::WarmupMeta(jpg, state);
2172
5.47k
      BrunsliStatus status = DecodeACDataSection(state);
2173
5.47k
      if (status != BRUNSLI_OK) return Fail(state, status);
2174
4.55k
      break;
2175
5.47k
    }
2176
2177
4.55k
    default:
2178
      /* Unreachable */
2179
0
      return Fail(state, BRUNSLI_INVALID_BRN);
2180
43.1k
  }
2181
2182
31.6k
  if (!IsAtSectionBoundary(state)) {
2183
61
    return Fail(state, BRUNSLI_INVALID_BRN);
2184
61
  }
2185
2186
  // Nothing is expected after the AC data.
2187
31.6k
  if (s.section.tag == kBrunsliACDataTag) {
2188
4.55k
    return Stage::DONE;
2189
4.55k
  }
2190
2191
27.0k
  return Stage::SECTION;
2192
31.6k
}
2193
2194
namespace internal {
2195
namespace dec {
2196
2197
16.2k
bool UpdateSubsamplingDerivatives(JPEGData* jpg) {
2198
44.0k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2199
27.7k
    JPEGComponent* c = &jpg->components[i];
2200
27.7k
    jpg->max_h_samp_factor = std::max(jpg->max_h_samp_factor, c->h_samp_factor);
2201
27.7k
    jpg->max_v_samp_factor = std::max(jpg->max_v_samp_factor, c->v_samp_factor);
2202
27.7k
  }
2203
16.2k
  jpg->MCU_rows = DivCeil(jpg->height, jpg->max_v_samp_factor * 8);
2204
16.2k
  jpg->MCU_cols = DivCeil(jpg->width, jpg->max_h_samp_factor * 8);
2205
44.0k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2206
27.7k
    JPEGComponent* c = &jpg->components[i];
2207
27.7k
    c->width_in_blocks = jpg->MCU_cols * c->h_samp_factor;
2208
27.7k
    c->height_in_blocks = jpg->MCU_rows * c->v_samp_factor;
2209
    // 8205 == max[ceil((65535 / (i * 8)) * i) for i in range(1, 16 + 1)]
2210
27.7k
    BRUNSLI_DCHECK(c->width_in_blocks <= 8205);
2211
27.7k
    BRUNSLI_DCHECK(c->height_in_blocks <= 8205);
2212
27.7k
    uint32_t num_blocks = c->width_in_blocks * c->height_in_blocks;
2213
27.7k
    if (num_blocks > kBrunsliMaxNumBlocks) {
2214
1
      return false;
2215
1
    }
2216
27.7k
    c->num_blocks = num_blocks;
2217
27.7k
  }
2218
16.2k
  return true;
2219
16.2k
}
2220
2221
16.2k
void PrepareMeta(const JPEGData* jpg, State* state) {
2222
16.2k
  InternalState& s = *state->internal;
2223
2224
16.2k
  size_t num_components = jpg->components.size();
2225
16.2k
  s.block_state_.resize(num_components);
2226
16.2k
  std::vector<ComponentMeta>& meta = state->meta;
2227
16.2k
  meta.resize(num_components);
2228
44.0k
  for (size_t i = 0; i < num_components; ++i) {
2229
27.7k
    const JPEGComponent& c = jpg->components[i];
2230
27.7k
    ComponentMeta& m = meta[i];
2231
27.7k
    m.h_samp = c.h_samp_factor;
2232
27.7k
    m.v_samp = c.v_samp_factor;
2233
27.7k
    m.width_in_blocks = jpg->MCU_cols * m.h_samp;
2234
27.7k
    m.height_in_blocks = jpg->MCU_rows * m.v_samp;
2235
27.7k
  }
2236
16.2k
}
2237
2238
11.5k
void WarmupMeta(JPEGData* jpg, State* state) {
2239
11.5k
  InternalState& s = *state->internal;
2240
11.5k
  std::vector<ComponentMeta>& meta = state->meta;
2241
11.5k
  const size_t num_components = meta.size();
2242
2243
11.5k
  if (!state->is_storage_allocated) {
2244
6.07k
    state->is_storage_allocated = true;
2245
12.7k
    for (size_t i = 0; i < num_components; ++i) {
2246
6.69k
      size_t num_blocks = meta[i].width_in_blocks * meta[i].height_in_blocks;
2247
6.69k
      jpg->components[i].coeffs.resize(num_blocks * kDCTBlockSize);
2248
6.69k
      s.block_state_[i].resize(num_blocks);
2249
6.69k
      meta[i].block_state = s.block_state_[i].data();
2250
6.69k
    }
2251
6.07k
  }
2252
2253
11.5k
  if (!s.is_meta_warm) {
2254
6.07k
    s.is_meta_warm = true;
2255
12.7k
    for (size_t c = 0; c < num_components; ++c) {
2256
6.69k
      ComponentMeta& m = meta[c];
2257
6.69k
      const JPEGQuantTable& q = jpg->quant[jpg->components[c].quant_idx];
2258
6.69k
      m.ac_coeffs = jpg->components[c].coeffs.data();
2259
6.69k
      m.ac_stride = m.width_in_blocks * kDCTBlockSize;
2260
6.69k
      m.b_stride = m.width_in_blocks;
2261
6.69k
      memcpy(m.quant.data(), q.values.data(),
2262
6.69k
             kDCTBlockSize * sizeof(m.quant[0]));
2263
6.69k
    }
2264
6.07k
  }
2265
11.5k
}
2266
2267
17.4k
BrunsliStatus DoProcessJpeg(State* state, JPEGData* jpg) {
2268
139k
  while (true) {
2269
139k
    switch (state->stage) {
2270
17.4k
      case Stage::SIGNATURE:
2271
17.4k
        state->stage = VerifySignature(state);
2272
17.4k
        break;
2273
2274
17.3k
      case Stage::HEADER:
2275
17.3k
        state->stage = DecodeHeader(state, jpg);
2276
17.3k
        break;
2277
2278
376
      case Stage::FALLBACK:
2279
376
        state->stage = DecodeOriginalJpg(state, jpg);
2280
376
        break;
2281
2282
43.4k
      case Stage::SECTION:
2283
43.4k
        state->stage = ParseSection(state);
2284
43.4k
        break;
2285
2286
43.2k
      case Stage::SECTION_BODY:
2287
43.2k
        state->stage = ProcessSection(state, jpg);
2288
43.2k
        break;
2289
2290
4.60k
      case Stage::DONE:
2291
        // It is expected that there is no garbage after the valid brunsli
2292
        // stream.
2293
4.60k
        if (state->pos != state->len) {
2294
39
          state->stage = Fail(state, BRUNSLI_INVALID_BRN);
2295
39
          break;
2296
39
        }
2297
4.56k
        return BRUNSLI_OK;
2298
2299
12.8k
      case Stage::ERROR:
2300
12.8k
        return state->internal->result;
2301
2302
0
      default:
2303
        /* Unreachable */
2304
0
        state->stage = Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2305
0
        break;
2306
139k
    }
2307
139k
  }
2308
17.4k
}
2309
2310
/** Adds new input to buffer. */
2311
17.4k
void ChargeBuffer(State* state) {
2312
17.4k
  InternalState& s = *state->internal;
2313
17.4k
  Buffer& b = s.buffer;
2314
2315
17.4k
  b.borrowed_len = 0;
2316
17.4k
  b.external_data = state->data;
2317
17.4k
  b.external_pos = state->pos;
2318
17.4k
  b.external_len = state->len;
2319
17.4k
}
2320
2321
constexpr size_t kBufferMaxReadAhead = 600;
2322
2323
/** Sets input source either to buffered, or to external data. */
2324
17.4k
void LoadInput(State* state) {
2325
17.4k
  InternalState& s = *state->internal;
2326
17.4k
  Buffer& b = s.buffer;
2327
2328
  // No data buffered. Just pass external data as is.
2329
17.4k
  if (b.data_len == 0) {
2330
17.4k
    state->data = b.external_data;
2331
17.4k
    state->pos = b.external_pos;
2332
17.4k
    state->len = b.external_len;
2333
17.4k
    return;
2334
17.4k
  }
2335
2336
0
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2337
2338
  // Otherwise use buffered data.
2339
0
  size_t available = b.external_len - b.external_pos;
2340
  // Always try to borrow as much as parser could require. This way, when
2341
  // buffer is unable to provide enough input, we could switch to unbuffered
2342
  // input.
2343
0
  b.borrowed_len = std::min(kBufferMaxReadAhead, available);
2344
0
  memcpy(b.data.data() + b.data_len, b.external_data + b.external_pos,
2345
0
         b.borrowed_len);
2346
0
  state->data = b.data.data();
2347
0
  state->pos = 0;
2348
0
  state->len = b.data_len + b.borrowed_len;
2349
0
}
2350
2351
/**
2352
 * Cancel borrowed bytes, if any.
2353
 *
2354
 * Returns false, if it is impossible to continue parsing.
2355
 */
2356
17.4k
bool UnloadInput(State* state, BrunsliStatus result) {
2357
17.4k
  InternalState& s = *state->internal;
2358
17.4k
  Buffer& b = s.buffer;
2359
2360
  // Non-buffered input; put tail to buffer.
2361
17.4k
  if (state->data == b.external_data) {
2362
17.4k
    b.external_pos = state->pos;
2363
17.4k
    BRUNSLI_DCHECK(b.external_pos <= b.external_len);
2364
17.4k
    if (result != BRUNSLI_NOT_ENOUGH_DATA) return true;
2365
6.33k
    BRUNSLI_DCHECK(b.data_len == 0);
2366
6.33k
    size_t available = b.external_len - b.external_pos;
2367
6.33k
    BRUNSLI_DCHECK(available < kBufferMaxReadAhead);
2368
6.33k
    if (b.data.empty()) b.data.resize(2 * kBufferMaxReadAhead);
2369
6.33k
    b.data_len = available;
2370
6.33k
    memcpy(b.data.data(), b.external_data + b.external_pos, b.data_len);
2371
6.33k
    b.external_pos += available;
2372
6.33k
    return false;
2373
17.4k
  }
2374
2375
  // Buffer depleted; switch to non-buffered input.
2376
0
  if (state->pos >= b.data_len) {
2377
0
    size_t used_borrowed_bytes = state->pos - b.data_len;
2378
0
    b.data_len = 0;
2379
0
    b.external_pos += used_borrowed_bytes;
2380
0
    return true;
2381
0
  }
2382
2383
  // Buffer not depleted; either problem discovered was already buffered data,
2384
  // or extra input was too-short.
2385
0
  b.data_len -= state->pos;
2386
0
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
2387
    // We couldn't have taken more bytes.
2388
0
    BRUNSLI_DCHECK(b.external_pos + b.borrowed_len == b.external_len);
2389
    // Remaining piece is not too large.
2390
0
    BRUNSLI_DCHECK(b.data_len + b.borrowed_len < kBufferMaxReadAhead);
2391
0
    b.data_len += b.borrowed_len;
2392
0
    b.external_pos += b.borrowed_len;
2393
0
  }
2394
0
  BRUNSLI_DCHECK(!b.data.empty());
2395
0
  if (state->pos > 0 && b.data_len > 0) {
2396
0
    memmove(b.data.data(), b.data.data() + state->pos, b.data_len);
2397
0
  }
2398
0
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2399
2400
0
  return (result != BRUNSLI_NOT_ENOUGH_DATA);
2401
0
}
2402
2403
/** Sets back user-provided input. */
2404
17.4k
void UnchargeBuffer(State* state) {
2405
17.4k
  InternalState& s = *state->internal;
2406
17.4k
  Buffer& b = s.buffer;
2407
2408
17.4k
  state->data = b.external_data;
2409
17.4k
  state->pos = b.external_pos;
2410
17.4k
  state->len = b.external_len;
2411
17.4k
}
2412
2413
17.4k
BrunsliStatus ProcessJpeg(State* state, JPEGData* jpg) {
2414
17.4k
  InternalState& s = *state->internal;
2415
2416
17.4k
  if (state->pos > state->len) return BRUNSLI_INVALID_PARAM;
2417
17.4k
  ChargeBuffer(state);
2418
2419
17.4k
  BrunsliStatus result = BRUNSLI_NOT_ENOUGH_DATA;
2420
28.4k
  while (result == BRUNSLI_NOT_ENOUGH_DATA) {
2421
17.4k
    if (state->stage == Stage::ERROR) {
2422
      // General error -> no recovery.
2423
0
      if (s.result != BRUNSLI_NOT_ENOUGH_DATA) return s.result;
2424
      // Continue parsing.
2425
0
      s.result = BRUNSLI_OK;
2426
0
      state->stage = s.last_stage;
2427
0
      s.last_stage = Stage::ERROR;
2428
0
    }
2429
2430
17.4k
    LoadInput(state);
2431
17.4k
    if (s.section.is_active) {
2432
0
      s.section.milestone = state->pos;
2433
0
      s.section.projected_end = s.section.milestone + s.section.remaining;
2434
0
    }
2435
2436
17.4k
    s.section.tags_met |= state->tags_met;
2437
17.4k
    result = DoProcessJpeg(state, jpg);
2438
2439
17.4k
    if (s.section.is_active) {
2440
      // TODO(eustas): dcheck state->pos > s.section.milestone
2441
17.0k
      size_t processed_len = state->pos - s.section.milestone;
2442
      // TODO(eustas): dcheck processed_len < s.section.remaining
2443
17.0k
      s.section.remaining -= processed_len;
2444
17.0k
    }
2445
2446
17.4k
    if (!UnloadInput(state, result)) break;
2447
17.4k
  }
2448
17.4k
  UnchargeBuffer(state);
2449
17.4k
  return result;
2450
17.4k
}
2451
2452
}  // namespace dec
2453
}  // namespace internal
2454
2455
BrunsliStatus BrunsliDecodeJpeg(const uint8_t* data, const size_t len,
2456
17.4k
                                JPEGData* jpg) {
2457
17.4k
  if (!data) return BRUNSLI_INVALID_PARAM;
2458
2459
17.4k
  State state;
2460
17.4k
  state.data = data;
2461
17.4k
  state.len = len;
2462
2463
17.4k
  return internal::dec::ProcessJpeg(&state, jpg);
2464
17.4k
}
2465
2466
size_t BrunsliEstimateDecoderPeakMemoryUsage(const uint8_t* data,
2467
0
                                             const size_t len) {
2468
0
  if (!data) return BRUNSLI_INVALID_PARAM;
2469
2470
0
  State state;
2471
0
  state.data = data;
2472
0
  state.len = len;
2473
0
  state.skip_tags = ~(1u << kBrunsliHistogramDataTag);
2474
0
  InternalState& s = *state.internal;
2475
0
  s.shallow_histograms = true;
2476
2477
0
  JPEGData jpg;
2478
0
  BrunsliStatus status = internal::dec::ProcessJpeg(&state, &jpg);
2479
2480
0
  if (status != BRUNSLI_OK) return 0;
2481
2482
0
  size_t out_size = 2 * len;
2483
0
  size_t total_num_blocks = 0;
2484
0
  size_t component_state_size = 0;
2485
0
  for (size_t i = 0; i < jpg.components.size(); ++i) {
2486
0
    const JPEGComponent& c = jpg.components[i];
2487
0
    total_num_blocks += c.num_blocks;
2488
0
    component_state_size += ComponentState::SizeInBytes(c.width_in_blocks);
2489
0
  }
2490
0
  size_t jpeg_data_size = total_num_blocks * kDCTBlockSize * sizeof(coeff_t);
2491
0
  size_t context_map_size = s.num_contexts * kNumAvrgContexts * sizeof(int32_t);
2492
0
  size_t histogram_size = s.num_histograms * sizeof(ANSDecodingData);
2493
0
  size_t decode_peak = context_map_size + histogram_size + component_state_size;
2494
0
  size_t jpeg_writer_size = (1u << 17u) + (1u << 16u) * sizeof(int32_t);
2495
0
  return (out_size + jpeg_data_size + std::max(decode_peak, jpeg_writer_size));
2496
0
}
2497
2498
0
BrunsliDecoder::BrunsliDecoder() {
2499
0
  jpg_.reset(new JPEGData);
2500
0
  state_.reset(new State);
2501
0
}
2502
2503
0
BrunsliDecoder::~BrunsliDecoder() {}
2504
2505
BrunsliDecoder::Status BrunsliDecoder::Decode(size_t* available_in,
2506
                                              const uint8_t** next_in,
2507
                                              size_t* available_out,
2508
0
                                              uint8_t** next_out) {
2509
0
  JPEGData* jpg = jpg_.get();
2510
0
  BRUNSLI_DCHECK(jpg);
2511
0
  State* state = state_.get();
2512
0
  BRUNSLI_DCHECK(state);
2513
2514
0
  state->data = *next_in;
2515
0
  state->pos = 0;
2516
0
  state->len = *available_in;
2517
0
  BrunsliStatus parse_status = internal::dec::ProcessJpeg(state, jpg);
2518
0
  size_t consumed_bytes = state->pos;
2519
0
  *available_in -= consumed_bytes;
2520
0
  *next_in += consumed_bytes;
2521
2522
0
  if ((parse_status != BRUNSLI_OK) &&
2523
0
      (parse_status != BRUNSLI_NOT_ENOUGH_DATA)) {
2524
0
    return BrunsliDecoder::ERROR;
2525
0
  }
2526
2527
  // All the input given input should be consumed.
2528
0
  BRUNSLI_DCHECK(*available_in == 0);
2529
2530
0
  SerializationStatus serialization_status =
2531
0
      SerializeJpeg(state, *jpg, available_out, next_out);
2532
0
  if (serialization_status == SerializationStatus::ERROR) {
2533
0
    return BrunsliDecoder::ERROR;
2534
0
  }
2535
2536
0
  switch (serialization_status) {
2537
0
    case SerializationStatus::DONE:
2538
      // Should be impossible to finish serialization without finishing parsing.
2539
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_OK);
2540
0
      return BrunsliDecoder::DONE;
2541
2542
0
    case SerializationStatus::NEEDS_MORE_INPUT:
2543
      // If serializer says that data is incomplete, parser should say the same.
2544
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_NOT_ENOUGH_DATA);
2545
0
      return BrunsliDecoder::NEEDS_MORE_INPUT;
2546
2547
0
    case SerializationStatus::NEEDS_MORE_OUTPUT:
2548
      // TODO(eustas): make sure that serializer could produce more bytes
2549
      //               without providing more bytes to parser
2550
0
      BRUNSLI_DCHECK(*available_out == 0);
2551
0
      return BrunsliDecoder::NEEDS_MORE_OUTPUT;
2552
2553
0
    case SerializationStatus::ERROR:
2554
0
      return BrunsliDecoder::ERROR;
2555
2556
0
    default:
2557
      /* Unreachable */
2558
0
      BRUNSLI_DCHECK(false);
2559
0
      return BrunsliDecoder::ERROR;
2560
0
  }
2561
0
}
2562
2563
}  // namespace brunsli