Coverage Report

Created: 2026-05-12 06:13

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/brunsli/c/dec/brunsli_decode.cc
Line
Count
Source
1
// Copyright (c) Google LLC 2019
2
//
3
// Use of this source code is governed by an MIT-style
4
// license that can be found in the LICENSE file or at
5
// https://opensource.org/licenses/MIT.
6
7
#include <brunsli/brunsli_decode.h>
8
9
#include <algorithm>
10
#include <cstdlib>
11
#include <cstring>
12
#include <iterator>
13
#include <string>
14
#include <vector>
15
16
#include <brotli/decode.h>
17
#include "../common/constants.h"
18
#include "../common/context.h"
19
#include <brunsli/jpeg_data.h>
20
#include "../common/lehmer_code.h"
21
#include "../common/platform.h"
22
#include "../common/predict.h"
23
#include "../common/quant_matrix.h"
24
#include <brunsli/status.h>
25
#include <brunsli/types.h>
26
#include "./ans_decode.h"
27
#include "./arith_decode.h"
28
#include "./bit_reader.h"
29
#include "./brunsli_input.h"
30
#include "./context_map_decode.h"
31
#include "./histogram_decode.h"
32
#include "./huffman_table.h"
33
#include <brunsli/jpeg_data_writer.h>
34
#include "./state.h"
35
#include "./state_internal.h"
36
37
namespace brunsli {
38
39
using ::brunsli::internal::dec::AcDcState;
40
using ::brunsli::internal::dec::BlockI32;
41
using ::brunsli::internal::dec::Buffer;
42
using ::brunsli::internal::dec::ComponentMeta;
43
using ::brunsli::internal::dec::FallbackState;
44
using ::brunsli::internal::dec::HeaderState;
45
using ::brunsli::internal::dec::HistogramDataState;
46
using ::brunsli::internal::dec::InternalState;
47
using ::brunsli::internal::dec::JpegInternalsState;
48
using ::brunsli::internal::dec::MetadataDecompressionStage;
49
using ::brunsli::internal::dec::MetadataState;
50
using ::brunsli::internal::dec::PrepareMeta;
51
using ::brunsli::internal::dec::QuantDataState;
52
using ::brunsli::internal::dec::SectionHeaderState;
53
using ::brunsli::internal::dec::SectionState;
54
using ::brunsli::internal::dec::SerializationStatus;
55
using ::brunsli::internal::dec::Stage;
56
using ::brunsli::internal::dec::State;
57
using ::brunsli::internal::dec::UpdateSubsamplingDerivatives;
58
using ::brunsli::internal::dec::VarintState;
59
60
static const int kNumDirectCodes = 8;
61
static const int kCoeffAlphabetSize = kNumDirectCodes + 10;
62
63
static const uint32_t kKnownSectionTags =
64
    (1u << kBrunsliSignatureTag) | (1u << kBrunsliHeaderTag) |
65
    (1u << kBrunsliMetaDataTag) | (1u << kBrunsliJPEGInternalsTag) |
66
    (1u << kBrunsliQuantDataTag) | (1u << kBrunsliHistogramDataTag) |
67
    (1u << kBrunsliDCDataTag) | (1u << kBrunsliACDataTag) |
68
    (1u << kBrunsliOriginalJpgTag);
69
70
static const uint32_t kKnownHeaderVarintTags =
71
    (1u << kBrunsliHeaderWidthTag) | (1u << kBrunsliHeaderHeightTag) |
72
    (1u << kBrunsliHeaderVersionCompTag) | (1u << kBrunsliHeaderSubsamplingTag);
73
74
0
bool IsBrunsli(const uint8_t* data, const size_t len) {
75
0
  static const uint8_t kSignature[6] = {
76
0
      /* marker */ 0x0A,
77
0
      /* length */ 0x04, 0x42, 0xD2, 0xD5, 0x4E};
78
0
  static const size_t kSignatureLen = sizeof(kSignature);
79
0
  if (len < kSignatureLen) return false;
80
0
  return (memcmp(kSignature, data, kSignatureLen) == 0);
81
0
}
82
83
// Returns ceil(a/b).
84
51.6k
inline int DivCeil(int a, int b) { return (a + b - 1) / b; }
85
86
// Decodes a number in the range [0..255], by reading 1 - 11 bits.
87
12.3k
inline uint32_t DecodeVarLenUint8(BrunsliBitReader* br) {
88
12.3k
  if (BrunsliBitReaderRead(br, 1)) {
89
2.13k
    uint32_t nbits = BrunsliBitReaderRead(br, 3);
90
2.13k
    if (nbits == 0) {
91
1.08k
      return 1u;
92
1.08k
    } else {
93
1.04k
      return BrunsliBitReaderRead(br, nbits) + (1u << nbits);
94
1.04k
    }
95
2.13k
  }
96
10.2k
  return 0;
97
12.3k
}
98
99
161k
bool DecodeVarint(VarintState* s, BrunsliBitReader* br, size_t max_bits) {
100
161k
  if (s->stage == VarintState::INIT) {
101
133k
    s->value = 0;
102
133k
    s->i = 0;
103
133k
    s->stage = VarintState::READ_CONTINUATION;
104
133k
  }
105
106
441k
  while (true) {
107
441k
    switch (s->stage) {
108
287k
      case VarintState::READ_CONTINUATION: {
109
287k
        if (s->i >= max_bits) {
110
936
          s->stage = VarintState::INIT;
111
936
          return true;
112
936
        }
113
286k
        if (s->i + 1 != max_bits) {
114
285k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
115
271k
          if (!BrunsliBitReaderRead(br, 1)) {
116
132k
            s->stage = VarintState::INIT;
117
132k
            return true;
118
132k
          }
119
271k
        }
120
140k
        s->stage = VarintState::READ_DATA;
121
140k
        continue;
122
286k
      }
123
153k
      case VarintState::READ_DATA: {
124
153k
        if (!BrunsliBitReaderCanRead(br, 1)) return false;
125
140k
        size_t next_bit = BrunsliBitReaderRead(br, 1);
126
140k
        s->value |= next_bit << s->i;
127
140k
        ++s->i;
128
140k
        s->stage = VarintState::READ_CONTINUATION;
129
140k
        continue;
130
153k
      }
131
0
      default: {
132
0
        BRUNSLI_CHECK(false);
133
0
        return false;
134
153k
      }
135
441k
    }
136
441k
  }
137
161k
}
138
139
template <size_t kChunkSize>
140
bool DecodeLimitedVarint(VarintState* s, BrunsliBitReader* br,
141
138k
                         size_t max_symbols) {
142
138k
  if (s->stage == VarintState::INIT) {
143
126k
    s->value = 0;
144
126k
    s->i = 0;
145
126k
    s->stage = VarintState::READ_CONTINUATION;
146
126k
  }
147
203k
  while (true) {
148
203k
    switch (s->stage) {
149
166k
      case VarintState::READ_CONTINUATION: {
150
166k
        if (s->i < max_symbols) {
151
163k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
155k
          if (BrunsliBitReaderRead(br, 1)) {
153
32.9k
            s->stage = VarintState::READ_DATA;
154
32.9k
            continue;
155
32.9k
          }
156
155k
        }
157
126k
        s->stage = VarintState::INIT;
158
126k
        return true;
159
166k
      }
160
37.0k
      case VarintState::READ_DATA: {
161
37.0k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
32.8k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
32.8k
        s->value |= next_bits << (s->i * kChunkSize);
164
32.8k
        ++s->i;
165
32.8k
        s->stage = VarintState::READ_CONTINUATION;
166
32.8k
        continue;
167
37.0k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
37.0k
      }
172
203k
    }
173
203k
  }
174
138k
}
bool brunsli::DecodeLimitedVarint<2ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
121k
                         size_t max_symbols) {
142
121k
  if (s->stage == VarintState::INIT) {
143
109k
    s->value = 0;
144
109k
    s->i = 0;
145
109k
    s->stage = VarintState::READ_CONTINUATION;
146
109k
  }
147
184k
  while (true) {
148
184k
    switch (s->stage) {
149
149k
      case VarintState::READ_CONTINUATION: {
150
149k
        if (s->i < max_symbols) {
151
145k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
138k
          if (BrunsliBitReaderRead(br, 1)) {
153
31.7k
            s->stage = VarintState::READ_DATA;
154
31.7k
            continue;
155
31.7k
          }
156
138k
        }
157
109k
        s->stage = VarintState::INIT;
158
109k
        return true;
159
149k
      }
160
35.2k
      case VarintState::READ_DATA: {
161
35.2k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
31.6k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
31.6k
        s->value |= next_bits << (s->i * kChunkSize);
164
31.6k
        ++s->i;
165
31.6k
        s->stage = VarintState::READ_CONTINUATION;
166
31.6k
        continue;
167
35.2k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
35.2k
      }
172
184k
    }
173
184k
  }
174
121k
}
bool brunsli::DecodeLimitedVarint<8ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
17.0k
                         size_t max_symbols) {
142
17.0k
  if (s->stage == VarintState::INIT) {
143
16.4k
    s->value = 0;
144
16.4k
    s->i = 0;
145
16.4k
    s->stage = VarintState::READ_CONTINUATION;
146
16.4k
  }
147
19.3k
  while (true) {
148
19.3k
    switch (s->stage) {
149
17.6k
      case VarintState::READ_CONTINUATION: {
150
17.6k
        if (s->i < max_symbols) {
151
17.5k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
17.5k
          if (BrunsliBitReaderRead(br, 1)) {
153
1.20k
            s->stage = VarintState::READ_DATA;
154
1.20k
            continue;
155
1.20k
          }
156
17.5k
        }
157
16.3k
        s->stage = VarintState::INIT;
158
16.3k
        return true;
159
17.6k
      }
160
1.72k
      case VarintState::READ_DATA: {
161
1.72k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
1.13k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
1.13k
        s->value |= next_bits << (s->i * kChunkSize);
164
1.13k
        ++s->i;
165
1.13k
        s->stage = VarintState::READ_CONTINUATION;
166
1.13k
        continue;
167
1.72k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
1.72k
      }
172
19.3k
    }
173
19.3k
  }
174
17.0k
}
175
176
31.8k
std::vector<uint8_t> GenerateApp0Marker(uint8_t app0_status) {
177
31.8k
  std::vector<uint8_t> app0_marker(AppData_0xe0, AppData_0xe0 + 17);
178
31.8k
  app0_marker[9] = app0_status & 1u ? 2 : 1;
179
31.8k
  app0_status >>= 1u;
180
31.8k
  app0_marker[10] = app0_status & 0x3u;
181
31.8k
  app0_status >>= 2u;
182
31.8k
  uint16_t x_dens = kApp0Densities[app0_status];
183
31.8k
  app0_marker[11] = app0_marker[13] = x_dens >> 8u;
184
31.8k
  app0_marker[12] = app0_marker[14] = x_dens & 0xFFu;
185
31.8k
  return app0_marker;
186
31.8k
}
187
188
29.0k
std::vector<uint8_t> GenerateAppMarker(uint8_t marker, uint8_t code) {
189
29.0k
  std::vector<uint8_t> s;
190
29.0k
  if (marker == 0x80) {
191
18.4k
    s = std::vector<uint8_t>(AppData_0xe2, AppData_0xe2 + 3161);
192
18.4k
    s[84] = code;
193
18.4k
  } else if (marker == 0x81) {
194
4.63k
    s = std::vector<uint8_t>(AppData_0xec, AppData_0xec + 18);
195
4.63k
    s[15] = code;
196
5.91k
  } else {
197
5.91k
    BRUNSLI_DCHECK(marker == 0x82);
198
5.91k
    s = std::vector<uint8_t>(AppData_0xee, AppData_0xee + 15);
199
5.91k
    s[10] = code;
200
5.91k
  }
201
29.0k
  return s;
202
29.0k
}
203
204
bool ProcessMetaData(const uint8_t* data, size_t len, MetadataState* state,
205
364k
                     JPEGData* jpg) {
206
364k
  size_t pos = 0;
207
828k
  while (pos < len) {
208
464k
    switch (state->stage) {
209
100k
      case MetadataState::READ_MARKER: {
210
100k
        state->marker = static_cast<uint8_t>(data[pos++]);
211
100k
        if (state->marker == 0xD9) {
212
290
          jpg->tail_data = std::vector<uint8_t>();
213
290
          state->stage = MetadataState::READ_TAIL;
214
290
          continue;
215
99.8k
        } else if (state->marker < 0x40) {
216
31.8k
          state->short_marker_count++;
217
31.8k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
218
13
            return false;
219
13
          }
220
31.8k
          jpg->app_data.push_back(GenerateApp0Marker(state->marker));
221
31.8k
          continue;
222
68.0k
        } else if (state->marker >= 0x80 && state->marker <= 0x82) {
223
29.0k
          state->short_marker_count++;
224
29.0k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
225
12
            return false;
226
12
          }
227
29.0k
          state->stage = MetadataState::READ_CODE;
228
29.0k
          continue;
229
29.0k
        }
230
        // Otherwise - mutlibyte sequence.
231
38.9k
        if ((state->marker != 0xFE) && ((state->marker >> 4u) != 0x0E)) {
232
215
          return false;
233
215
        }
234
38.7k
        state->stage = MetadataState::READ_LENGTH_HI;
235
38.7k
        continue;
236
38.9k
      }
237
238
54.1k
      case MetadataState::READ_TAIL: {
239
54.1k
        Append(&jpg->tail_data, data + pos, data + len);
240
54.1k
        pos = len;
241
54.1k
        continue;
242
38.9k
      }
243
244
29.0k
      case MetadataState::READ_CODE: {
245
29.0k
        const uint8_t code = data[pos++];
246
29.0k
        jpg->app_data.push_back(GenerateAppMarker(state->marker, code));
247
29.0k
        state->stage = MetadataState::READ_MARKER;
248
29.0k
        continue;
249
38.9k
      }
250
251
38.7k
      case MetadataState::READ_LENGTH_HI: {
252
38.7k
        state->length_hi = data[pos++];
253
38.7k
        state->stage = MetadataState::READ_LENGTH_LO;
254
38.7k
        continue;
255
38.9k
      }
256
257
38.7k
      case MetadataState::READ_LENGTH_LO: {
258
38.7k
        const uint8_t lo = data[pos++];
259
38.7k
        size_t marker_len = (state->length_hi << 8u) + lo;
260
38.7k
        if (marker_len < 2) return false;
261
38.7k
        state->remaining_multibyte_length = marker_len - 2;
262
38.7k
        uint8_t head[3] = {state->marker, state->length_hi, lo};
263
38.7k
        auto* dest = (state->marker == 0xFE) ? &jpg->com_data : &jpg->app_data;
264
38.7k
        size_t delta = (state->marker == 0xFE) ? 0 : state->short_marker_count;
265
38.7k
        if (dest->size() - delta >= kBrunsliMultibyteMarkerLimit) {
266
3
          return false;
267
3
        }
268
38.7k
        dest->emplace_back(head, head + 3);
269
38.7k
        state->multibyte_sink = &dest->back();
270
        // Turn state machine to default state in case there is no payload in
271
        // multibyte sequence. This is important when such a sequence concludes
272
        // the input.
273
38.7k
        state->stage = (state->remaining_multibyte_length > 0)
274
38.7k
                           ? MetadataState::READ_MULTIBYTE
275
38.7k
                           : MetadataState::READ_MARKER;
276
38.7k
        continue;
277
38.7k
      }
278
279
203k
      case MetadataState::READ_MULTIBYTE: {
280
203k
        size_t chunk_size =
281
203k
            std::min(state->remaining_multibyte_length, len - pos);
282
203k
        Append(state->multibyte_sink, data + pos, chunk_size);
283
203k
        state->remaining_multibyte_length -= chunk_size;
284
203k
        pos += chunk_size;
285
203k
        if (state->remaining_multibyte_length == 0) {
286
37.1k
          state->stage = MetadataState::READ_MARKER;
287
37.1k
        }
288
203k
        continue;
289
38.7k
      }
290
291
0
      default: return false;
292
464k
    }
293
464k
  }
294
363k
  return true;
295
364k
}
296
297
62.2k
static BrunsliStatus DecodeHuffmanCode(State* state, JPEGData* jpg) {
298
62.2k
  InternalState& s = *state->internal;
299
62.2k
  JpegInternalsState& js = s.internals;
300
62.2k
  BrunsliBitReader* br = &js.br;
301
302
377k
  while (true) {
303
377k
    switch (js.stage) {
304
42.5k
      case JpegInternalsState::READ_HUFFMAN_LAST: {
305
42.5k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
306
41.0k
        js.is_known_last_huffman_code = BrunsliBitReaderRead(br, 1);
307
41.0k
        jpg->huffman_code.emplace_back();
308
41.0k
        js.stage = JpegInternalsState::READ_HUFFMAN_SIMPLE;
309
41.0k
        continue;
310
42.5k
      }
311
60.0k
      case JpegInternalsState::READ_HUFFMAN_SIMPLE: {
312
60.0k
        if (!BrunsliBitReaderCanRead(br, 5 + !js.is_known_last_huffman_code)) {
313
19.2k
          return BRUNSLI_NOT_ENOUGH_DATA;
314
19.2k
        }
315
40.8k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
316
317
40.8k
        huff->slot_id = BrunsliBitReaderRead(br, 2);
318
40.8k
        js.is_dc_table = (BrunsliBitReaderRead(br, 1) == 0);
319
40.8k
        huff->slot_id += js.is_dc_table ? 0 : 0x10;
320
40.8k
        huff->is_last =
321
40.8k
            js.is_known_last_huffman_code || BrunsliBitReaderRead(br, 1);
322
40.8k
        huff->counts[0] = 0;
323
40.8k
        int found_match = BrunsliBitReaderRead(br, 1);
324
40.8k
        if (found_match) {
325
25.4k
          if (js.is_dc_table) {
326
12.9k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
327
12.9k
            memcpy(&huff->counts[1], kStockDCHuffmanCodeCounts[huff_table_idx],
328
12.9k
                   sizeof(kStockDCHuffmanCodeCounts[0]));
329
12.9k
            memcpy(&huff->values[0], kStockDCHuffmanCodeValues[huff_table_idx],
330
12.9k
                   sizeof(kStockDCHuffmanCodeValues[0]));
331
12.9k
          } else {
332
12.5k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
333
12.5k
            memcpy(&huff->counts[1], kStockACHuffmanCodeCounts[huff_table_idx],
334
12.5k
                   sizeof(kStockACHuffmanCodeCounts[0]));
335
12.5k
            memcpy(&huff->values[0], kStockACHuffmanCodeValues[huff_table_idx],
336
12.5k
                   sizeof(kStockACHuffmanCodeValues[0]));
337
12.5k
          }
338
25.4k
          js.stage = JpegInternalsState::HUFFMAN_UPDATE;
339
25.4k
        } else {
340
          // One less bit is used than requested, but it is guaranteed to be
341
          // consumed in complex Huffman code case.
342
15.4k
          js.p.Init(js.is_dc_table
343
15.4k
                        ? std::vector<uint8_t>(kDefaultDCValues,
344
10.4k
                                               std::end(kDefaultDCValues))
345
15.4k
                        : std::vector<uint8_t>(kDefaultACValues,
346
5.00k
                                               std::end(kDefaultACValues)));
347
15.4k
          js.stage = JpegInternalsState::READ_HUFFMAN_MAX_LEN;
348
15.4k
        }
349
40.8k
        continue;
350
60.0k
      }
351
18.1k
      case JpegInternalsState::READ_HUFFMAN_MAX_LEN: {
352
18.1k
        if (!BrunsliBitReaderCanRead(br, 4)) return BRUNSLI_NOT_ENOUGH_DATA;
353
15.3k
        js.max_len = BrunsliBitReaderRead(br, 4) + 1;
354
15.3k
        js.total_count = 0;
355
15.3k
        js.max_count =
356
15.3k
            js.is_dc_table ? kJpegDCAlphabetSize : kJpegHuffmanAlphabetSize;
357
15.3k
        js.space = (1u << kJpegHuffmanMaxBitLength) -
358
15.3k
                   (1u << (kJpegHuffmanMaxBitLength - js.max_len));
359
15.3k
        js.i = 1;
360
15.3k
        js.stage = JpegInternalsState::READ_HUFFMAN_COUNT;
361
15.3k
        continue;
362
18.1k
      }
363
79.6k
      case JpegInternalsState::READ_HUFFMAN_COUNT: {
364
79.6k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
365
79.6k
        if (js.i <= js.max_len) {
366
64.3k
          size_t shift = kJpegHuffmanMaxBitLength - js.i;
367
64.3k
          size_t count_limit =
368
64.3k
              std::min(js.max_count - js.total_count, js.space >> shift);
369
64.3k
          if (count_limit > 0) {
370
61.5k
            int nbits =
371
61.5k
                Log2FloorNonZero(static_cast<uint32_t>(count_limit)) + 1;
372
61.5k
            if (!BrunsliBitReaderCanRead(br, nbits)) {
373
9.39k
              return BRUNSLI_NOT_ENOUGH_DATA;
374
9.39k
            }
375
52.1k
            size_t count = BrunsliBitReaderRead(br, nbits);
376
52.1k
            if (count > count_limit) {
377
17
              return BRUNSLI_INVALID_BRN;
378
17
            }
379
52.1k
            huff->counts[js.i] = static_cast<int>(count);
380
52.1k
            js.total_count += count;
381
52.1k
            js.space -= count * (static_cast<size_t>(1) << shift);
382
52.1k
          }
383
54.9k
          ++js.i;
384
54.9k
          continue;
385
64.3k
        }
386
15.2k
        ++huff->counts[js.max_len];
387
15.2k
        js.i = 0;
388
15.2k
        js.stage = JpegInternalsState::READ_HUFFMAN_PERMUTATION;
389
15.2k
        continue;
390
79.6k
      }
391
136k
      case JpegInternalsState::READ_HUFFMAN_PERMUTATION: {
392
136k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
393
136k
        if (js.i < js.total_count) {
394
121k
          const int nbits = js.p.num_bits();
395
121k
          if (!DecodeLimitedVarint<2>(&js.varint, br, (nbits + 1) >> 1u)) {
396
11.3k
            return BRUNSLI_NOT_ENOUGH_DATA;
397
11.3k
          }
398
109k
          uint8_t value;
399
109k
          if (!js.p.Remove(js.varint.value, &value)) {
400
26
            return BRUNSLI_INVALID_BRN;
401
26
          }
402
109k
          huff->values[js.i] = value;
403
109k
          ++js.i;
404
109k
          continue;
405
109k
        }
406
15.1k
        huff->values[js.total_count] = kJpegHuffmanAlphabetSize;
407
15.1k
        js.stage = JpegInternalsState::HUFFMAN_UPDATE;
408
15.1k
        continue;
409
136k
      }
410
40.5k
      case JpegInternalsState::HUFFMAN_UPDATE: {
411
        // This stage does not perform reading -> transient.
412
40.5k
        if (jpg->huffman_code.back().is_last) {
413
21.7k
          js.terminal_huffman_code_count++;
414
21.7k
        }
415
40.5k
        if (js.is_known_last_huffman_code) {
416
17.9k
          js.p.Clear();
417
17.9k
          return BRUNSLI_OK;
418
17.9k
        }
419
22.5k
        if (jpg->huffman_code.size() >= kMaxDHTMarkers) {
420
          // Too many Huffman codes for a valid bit-stream. Normally, a jpeg
421
          // file can have any arbitrary number of DHT, DQT, etc. But i prefer
422
          // we force a reasonable lower bound instead of open door to likely
423
          // forged BRN input.
424
2
          return BRUNSLI_INVALID_BRN;
425
2
        }
426
22.5k
        js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
427
22.5k
        continue;
428
22.5k
      }
429
0
      default:
430
0
        return BRUNSLI_DECOMPRESSION_ERROR;
431
377k
    }
432
377k
  }
433
0
  return BRUNSLI_OK;
434
62.2k
}
435
436
91.1k
BrunsliStatus DecodeScanInfo(State* state, JPEGData* jpg) {
437
91.1k
  InternalState& s = *state->internal;
438
91.1k
  JpegInternalsState& js = s.internals;
439
91.1k
  BrunsliBitReader* br = &js.br;
440
441
91.1k
  const auto maybe_add_zero_run = [&js, jpg] () {
442
43.0k
    if (js.last_num > 0) {
443
30.8k
      JPEGScanInfo::ExtraZeroRunInfo info;
444
30.8k
      info.block_idx = js.last_block_idx;
445
30.8k
      info.num_extra_zero_runs = js.last_num;
446
30.8k
      jpg->scan_info[js.i].extra_zero_runs.push_back(info);
447
30.8k
      js.last_num = 0;
448
30.8k
    }
449
43.0k
  };
450
451
436k
  while (true) {
452
436k
    switch (js.stage) {
453
39.0k
      case JpegInternalsState::READ_SCAN_COMMON: {
454
39.0k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
455
39.0k
        if (!BrunsliBitReaderCanRead(br, 22)) return BRUNSLI_NOT_ENOUGH_DATA;
456
15.9k
        si->Ss = BrunsliBitReaderRead(br, 6);
457
15.9k
        si->Se = BrunsliBitReaderRead(br, 6);
458
15.9k
        si->Ah = BrunsliBitReaderRead(br, 4);
459
15.9k
        si->Al = BrunsliBitReaderRead(br, 4);
460
15.9k
        si->num_components = BrunsliBitReaderRead(br, 2) + 1;
461
15.9k
        js.j = 0;
462
15.9k
        js.stage = JpegInternalsState::READ_SCAN_COMPONENT;
463
15.9k
        continue;
464
39.0k
      }
465
78.8k
      case JpegInternalsState::READ_SCAN_COMPONENT: {
466
78.8k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
467
78.8k
        if (js.j < si->num_components) {
468
62.9k
          if (!BrunsliBitReaderCanRead(br, 6)) return BRUNSLI_NOT_ENOUGH_DATA;
469
37.8k
          si->components[js.j].comp_idx = BrunsliBitReaderRead(br, 2);
470
37.8k
          si->components[js.j].dc_tbl_idx = BrunsliBitReaderRead(br, 2);
471
37.8k
          si->components[js.j].ac_tbl_idx = BrunsliBitReaderRead(br, 2);
472
37.8k
          js.j++;
473
37.8k
        } else {
474
15.8k
          js.last_block_idx = -1;
475
15.8k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
476
15.8k
        }
477
53.6k
        continue;
478
78.8k
      }
479
80.5k
      case JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION: {
480
80.5k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
481
72.9k
        if (BrunsliBitReaderRead(br, 1)) {
482
57.1k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_DATA;
483
57.1k
        } else {
484
15.7k
          js.last_block_idx = 0;
485
15.7k
          js.last_num = 0;
486
15.7k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
487
15.7k
        }
488
72.9k
        continue;
489
80.5k
      }
490
61.1k
      case JpegInternalsState::READ_SCAN_RESET_POINT_DATA: {
491
61.1k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
492
61.1k
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
493
57.1k
        int block_idx =
494
57.1k
            js.last_block_idx + static_cast<int>(js.varint.value) + 1;
495
57.1k
        si->reset_points.emplace_back(block_idx);
496
57.1k
        js.last_block_idx = block_idx;
497
        // TODO(eustas): limit to exact number of blocks.
498
57.1k
        if (js.last_block_idx > (1 << 30)) {
499
          // At most 8K x 8K x num_channels blocks are expected. That is,
500
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
501
          // image.
502
7
          return BRUNSLI_INVALID_BRN;
503
7
        }
504
57.1k
        js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
505
57.1k
        continue;
506
57.1k
      }
507
85.8k
      case JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION: {
508
85.8k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
509
85.2k
        if (BrunsliBitReaderRead(br, 1)) {
510
69.5k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_DATA;
511
69.5k
        } else {
512
15.6k
          maybe_add_zero_run();
513
15.6k
          ++js.i;
514
15.6k
          if (js.i < js.num_scans) {
515
6.86k
            js.stage = JpegInternalsState::READ_SCAN_COMMON;
516
6.86k
            continue;
517
6.86k
          }
518
8.78k
          return BRUNSLI_OK;
519
15.6k
        }
520
69.5k
        continue;
521
85.2k
      }
522
91.2k
      case JpegInternalsState::READ_SCAN_ZERO_RUN_DATA: {
523
91.2k
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
524
69.4k
        int block_idx = js.last_block_idx + static_cast<int>(js.varint.value);
525
69.4k
        if (block_idx > js.last_block_idx) maybe_add_zero_run();
526
69.4k
        ++js.last_num;
527
69.4k
        js.last_block_idx = block_idx;
528
        // TODO(eustas): limit to exact number of blocks.
529
69.4k
        if (js.last_block_idx > (1 << 30)) {
530
          // At most 8K x 8K x num_channels blocks are expected. That is,
531
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
532
          // image.
533
3
          return BRUNSLI_INVALID_BRN;
534
3
        }
535
69.4k
        js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
536
69.4k
        continue;
537
69.4k
      }
538
0
      default: return BRUNSLI_DECOMPRESSION_ERROR;
539
436k
    }
540
436k
  }
541
91.1k
}
542
543
static bool BRUNSLI_NOINLINE DecodeCoeffOrder(uint32_t* order, BitSource* br,
544
10.0k
                                              WordSource* in) {
545
10.0k
  uint32_t lehmer[kDCTBlockSize] = {0};
546
10.0k
  static const int kSpan = 16;
547
49.9k
  for (int i = 0; i < kDCTBlockSize; i += kSpan) {
548
39.9k
    if (!br->ReadBits(1, in)) continue;  // span is all-zero
549
4.25k
    const int start = (i > 0) ? i : 1;
550
4.25k
    const int end = i + kSpan;
551
69.1k
    for (int j = start; j < end; ++j) {
552
64.8k
      uint32_t v = 0;
553
82.2k
      while (v <= kDCTBlockSize) {
554
82.1k
        const uint32_t bits = br->ReadBits(3, in);
555
82.1k
        v += bits;
556
82.1k
        if (bits < 7) break;
557
82.1k
      }
558
64.8k
      if (v > kDCTBlockSize) return false;
559
64.8k
      lehmer[j] = v;
560
64.8k
    }
561
4.25k
  }
562
9.99k
  int end = kDCTBlockSize - 1;
563
591k
  while (end >= 1 && lehmer[end] == 0) {
564
581k
    --end;
565
581k
  }
566
9.99k
  if (lehmer[end] == 1) return false;
567
47.9k
  for (int i = 1; i <= end; ++i) {
568
38.3k
    if (lehmer[i] == 0) return false;
569
38.0k
    --lehmer[i];
570
38.0k
  }
571
9.67k
  if (!DecodeLehmerCode(lehmer, kDCTBlockSize, order)) return false;
572
627k
  for (int k = 0; k < kDCTBlockSize; ++k) {
573
617k
    order[k] = kJPEGNaturalOrder[order[k]];
574
617k
  }
575
9.65k
  return true;
576
9.67k
}
577
578
/** Reads 0..6 words from |in| and returns the value in the range 0..63. */
579
static size_t DecodeNumNonzeros(Prob* p, BinaryArithmeticDecoder* ac,
580
2.98M
                                WordSource* in) {
581
  // To simplity BST navigation, we use 1-based indexing.
582
2.98M
  Prob* bst = p - 1;
583
2.98M
  size_t ctx = 1;
584
585
20.8M
  for (size_t b = 0; b < kNumNonZeroBits; ++b) {
586
17.9M
    const int bit = ac->ReadBit(bst[ctx].get_proba(), in);
587
17.9M
    bst[ctx].Add(bit);
588
17.9M
    ctx = 2 * ctx + bit;
589
17.9M
  }
590
591
  // Leaf index in the level corresponds to the resuling value.
592
2.98M
  size_t val = ctx - (1u << kNumNonZeroBits);
593
2.98M
  BRUNSLI_DCHECK(val <= kNumNonZeroTreeSize);
594
2.98M
  return val;
595
2.98M
}
596
597
135k
void EnsureSubdecodersInitialized(State* state, WordSource* in) {
598
135k
  InternalState& s = *state->internal;
599
135k
  if (!s.subdecoders_initialized) {
600
19.5k
    s.ans_decoder.Init(in);
601
19.5k
    s.bit_reader.Init(in);
602
19.5k
    s.arith_decoder.Init(in);
603
19.5k
    s.subdecoders_initialized = true;
604
19.5k
  }
605
135k
}
606
607
18.9k
bool FinalizeSubdecoders(State* state) {
608
18.9k
  InternalState& s = *state->internal;
609
18.9k
  if (!s.ans_decoder.CheckCRC()) return false;
610
17.9k
  if (!s.bit_reader.Finish()) return false;
611
17.8k
  s.subdecoders_initialized = false;
612
17.8k
  return true;
613
17.9k
}
614
615
95.9k
BrunsliStatus DecodeDC(State* state, WordSource* in) {
616
95.9k
  const std::vector<ComponentMeta>& meta = state->meta;
617
95.9k
  const size_t num_components = meta.size();
618
95.9k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
619
95.9k
  InternalState& s = *state->internal;
620
95.9k
  AcDcState& ac_dc_state = s.ac_dc;
621
622
95.9k
  std::vector<ComponentStateDC>& comps = ac_dc_state.dc;
623
95.9k
  if (comps.empty()) {
624
10.3k
    comps.resize(num_components);
625
21.7k
    for (size_t c = 0; c < num_components; ++c) {
626
11.3k
      comps[c].SetWidth(meta[c].width_in_blocks);
627
11.3k
    }
628
10.3k
  }
629
630
95.9k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
631
29.0k
  EnsureSubdecodersInitialized(state, in);
632
29.0k
  ANSDecoder ans = s.ans_decoder;
633
29.0k
  BitSource br = s.bit_reader;
634
29.0k
  BinaryArithmeticDecoder ac = s.arith_decoder;
635
636
  // We decode DC components in the following interleaved manner:
637
  //   v_samp[0] rows from component 0
638
  //   v_samp[1] rows from component 1
639
  //   v_samp[2] rows from component 2
640
  //   v_samp[3] rows from component 3 (if present)
641
  //
642
  // E.g. in a YUV420 image, we decode 2 rows of DC components from Y and then
643
  // 1 row of DC components from U and 1 row of DC components from V.
644
281k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
645
527k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
646
275k
      ComponentStateDC* c = &comps[i];
647
275k
      const ComponentMeta& m = meta[i];
648
275k
      const uint8_t* context_map = state->context_map + i * kNumAvrgContexts;
649
275k
      const int ac_stride = static_cast<int>(m.ac_stride);
650
275k
      const size_t b_stride = m.b_stride;
651
275k
      const int width = m.width_in_blocks;
652
275k
      int y = mcu_y * m.v_samp + ac_dc_state.next_iy;
653
275k
      int* const prev_sgn = &c->prev_sign[1];
654
275k
      int* const prev_abs = &c->prev_abs_coeff[2];
655
977k
      for (int iy = ac_dc_state.next_iy; iy < m.v_samp; ++iy, ++y) {
656
721k
        coeff_t* coeffs =
657
721k
            m.ac_coeffs + y * ac_stride + ac_dc_state.next_x * kDCTBlockSize;
658
721k
        uint8_t* block_state =
659
721k
            m.block_state + y * b_stride + ac_dc_state.next_x;
660
63.5M
        for (int x = ac_dc_state.next_x; x < width; ++x) {
661
62.8M
          if (BRUNSLI_PREDICT_FALSE(!in->CanRead(6))) {
662
18.9k
            ac_dc_state.next_mcu_y = mcu_y;
663
18.9k
            ac_dc_state.next_component = i;
664
18.9k
            ac_dc_state.next_iy = iy;
665
18.9k
            ac_dc_state.next_x = x;
666
18.9k
            s.ans_decoder = ans;
667
18.9k
            s.bit_reader = br;
668
18.9k
            s.arith_decoder = ac;
669
18.9k
            return BRUNSLI_NOT_ENOUGH_DATA;
670
18.9k
          }
671
62.7M
          const int is_empty_ctx =
672
62.7M
              IsEmptyBlockContext(&c->prev_is_nonempty[1], x);
673
62.7M
          Prob* BRUNSLI_RESTRICT is_empty_p =
674
62.7M
              &c->is_empty_block_prob[is_empty_ctx];
675
62.7M
          const bool is_empty_block = !ac.ReadBit(is_empty_p->get_proba(), in);
676
62.7M
          is_empty_p->Add(!is_empty_block);
677
62.7M
          c->prev_is_nonempty[x + 1] = !is_empty_block;
678
62.7M
          *block_state = is_empty_block;
679
62.7M
          int abs_val = 0;
680
62.7M
          int sign = 0;
681
62.7M
          if (!is_empty_block) {
682
13.7M
            Prob* BRUNSLI_RESTRICT p_is_zero = &c->is_zero_prob;
683
13.7M
            int is_zero = ac.ReadBit(p_is_zero->get_proba(), in);
684
13.7M
            p_is_zero->Add(is_zero);
685
13.7M
            if (!is_zero) {
686
2.80M
              const int avg_ctx = WeightedAverageContextDC(prev_abs, x);
687
2.80M
              const int sign_ctx = prev_sgn[x] * 3 + prev_sgn[x - 1];
688
2.80M
              Prob* BRUNSLI_RESTRICT sign_p = &c->sign_prob[sign_ctx];
689
2.80M
              sign = ac.ReadBit(sign_p->get_proba(), in);
690
2.80M
              sign_p->Add(sign);
691
2.80M
              const int entropy_ix = context_map[avg_ctx];
692
2.80M
              int code = ans.ReadSymbol(state->entropy_codes[entropy_ix], in);
693
2.80M
              if (code < kNumDirectCodes) {
694
411k
                abs_val = code + 1;
695
2.39M
              } else {
696
2.39M
                int nbits = code - kNumDirectCodes;
697
2.39M
                Prob* BRUNSLI_RESTRICT p_first_extra_bit =
698
2.39M
                    &c->first_extra_bit_prob[nbits];
699
2.39M
                int first_extra_bit =
700
2.39M
                    ac.ReadBit(p_first_extra_bit->get_proba(), in);
701
2.39M
                p_first_extra_bit->Add(first_extra_bit);
702
2.39M
                int extra_bits_val = first_extra_bit << nbits;
703
2.39M
                if (nbits > 0) {
704
2.17M
                  extra_bits_val |= static_cast<int>(br.ReadBits(nbits, in));
705
2.17M
                }
706
2.39M
                abs_val = kNumDirectCodes - 1 + (2 << nbits) + extra_bits_val;
707
2.39M
              }
708
2.80M
            }
709
13.7M
          }
710
62.7M
          prev_abs[x] = abs_val;
711
62.7M
          prev_sgn[x] = abs_val ? sign + 1 : 0;
712
62.7M
          coeffs[0] = ((1 - 2 * sign) * abs_val +
713
62.7M
                       PredictWithAdaptiveMedian(coeffs, x, y, ac_stride));
714
62.7M
          block_state++;
715
62.7M
          coeffs += kDCTBlockSize;
716
62.7M
        }
717
702k
        ac_dc_state.next_x = 0;
718
702k
      }
719
256k
      ac_dc_state.next_iy = 0;
720
256k
    }
721
252k
    ac_dc_state.next_component = 0;
722
252k
  }
723
724
  // Prepare for AC decoding.
725
10.0k
  ac_dc_state.next_mcu_y = 0;
726
10.0k
  ac_dc_state.next_component = 0;
727
10.0k
  ac_dc_state.next_iy = 0;
728
10.0k
  ac_dc_state.next_x = 0;
729
730
10.0k
  comps.clear();
731
10.0k
  comps.shrink_to_fit();
732
733
10.0k
  s.ans_decoder = ans;
734
10.0k
  s.bit_reader = br;
735
10.0k
  s.arith_decoder = ac;
736
10.0k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
737
738
9.62k
  return BRUNSLI_OK;
739
10.0k
}
740
741
static void BRUNSLI_NOINLINE DecodeEmptyAcBlock(
742
17.1M
    int* BRUNSLI_RESTRICT prev_sgn, int* BRUNSLI_RESTRICT prev_abs) {
743
1.09G
  for (int k = 1; k < kDCTBlockSize; ++k) {
744
1.07G
    prev_sgn[k] = 0;
745
1.07G
    prev_abs[k] = 0;
746
1.07G
  }
747
17.1M
}
748
749
/** All the necessary things for decoding AC block. */
750
struct AcBlockCookie {
751
  int x;
752
  int y;
753
  uint8_t* BRUNSLI_RESTRICT prev_num_nonzeros;
754
  int* BRUNSLI_RESTRICT prev_sgn;
755
  int* BRUNSLI_RESTRICT prev_abs;
756
  Prob* BRUNSLI_RESTRICT num_nonzero_prob;
757
758
  BinaryArithmeticDecoder* BRUNSLI_RESTRICT ac;
759
  WordSource* BRUNSLI_RESTRICT in;
760
  ANSDecoder* BRUNSLI_RESTRICT ans;
761
  BitSource* BRUNSLI_RESTRICT br;
762
763
  coeff_t* BRUNSLI_RESTRICT coeffs;
764
  const coeff_t* BRUNSLI_RESTRICT prev_row_coeffs;
765
  const coeff_t* BRUNSLI_RESTRICT prev_col_coeffs;
766
  Prob* BRUNSLI_RESTRICT is_zero_prob;
767
  const uint32_t* BRUNSLI_RESTRICT order;
768
  const uint8_t* BRUNSLI_RESTRICT context_modes;
769
  const int* BRUNSLI_RESTRICT mult_col;
770
  const int* BRUNSLI_RESTRICT mult_row;
771
  int prev_row_delta;
772
  Prob* BRUNSLI_RESTRICT sign_prob;
773
  size_t context_bits;
774
  const uint8_t* BRUNSLI_RESTRICT context_map;
775
  const ANSDecodingData* BRUNSLI_RESTRICT entropy_codes;
776
  Prob* BRUNSLI_RESTRICT first_extra_bit_prob;
777
};
778
779
2.98M
static size_t BRUNSLI_NOINLINE DecodeAcBlock(const AcBlockCookie& cookie) {
780
2.98M
  AcBlockCookie c = cookie;
781
782
2.98M
  BinaryArithmeticDecoder ac = *c.ac;
783
2.98M
  WordSource* in = c.in;
784
2.98M
  ANSDecoder ans = *c.ans;
785
2.98M
  BitSource br = *c.br;
786
787
2.98M
  size_t num_nonzeros = 0;
788
789
2.98M
  const uint8_t nonzero_ctx = NumNonzerosContext(c.prev_num_nonzeros, c.x, c.y);
790
2.98M
  size_t last_nz = DecodeNumNonzeros(
791
2.98M
      c.num_nonzero_prob + kNumNonZeroTreeSize * nonzero_ctx, &ac, in);
792
150M
  for (size_t k = last_nz + 1; k < kDCTBlockSize; ++k) {
793
147M
    c.prev_sgn[k] = 0;
794
147M
    c.prev_abs[k] = 0;
795
147M
  }
796
43.1M
  for (size_t k = last_nz; k > 0; --k) {
797
40.1M
    int is_zero = 0;
798
40.1M
    if (k < last_nz) {
799
39.0M
      size_t bucket = kNonzeroBuckets[num_nonzeros - 1];
800
39.0M
      size_t is_zero_ctx = bucket * kDCTBlockSize + k;
801
39.0M
      Prob& p = c.is_zero_prob[is_zero_ctx];
802
39.0M
      is_zero = ac.ReadBit(p.get_proba(), in);
803
39.0M
      p.Add(is_zero);
804
39.0M
    }
805
40.1M
    int abs_val = 0;
806
40.1M
    int sign = 1;
807
40.1M
    const int k_nat = c.order[k];
808
40.1M
    if (!is_zero) {
809
9.08M
      size_t context_type = c.context_modes[k_nat];
810
9.08M
      size_t avg_ctx = 0;
811
9.08M
      size_t sign_ctx = kMaxAverageContext;
812
9.08M
      if ((context_type & 1) && (c.y > 0)) {
813
1.76M
        size_t offset = k_nat & 7;
814
1.76M
        ACPredictContextRow(c.prev_row_coeffs + offset, c.coeffs + offset,
815
1.76M
                            c.mult_col + offset * 8, &avg_ctx, &sign_ctx);
816
7.32M
      } else if ((context_type & 2) && (c.x > 0)) {
817
2.05M
        size_t offset = k_nat & ~7;
818
2.05M
        ACPredictContextCol(c.prev_col_coeffs + offset, c.coeffs + offset,
819
2.05M
                            c.mult_row + offset, &avg_ctx, &sign_ctx);
820
5.27M
      } else if (!context_type) {
821
5.14M
        avg_ctx = WeightedAverageContext(c.prev_abs + k, c.prev_row_delta);
822
5.14M
        sign_ctx =
823
5.14M
            c.prev_sgn[k] * 3 + c.prev_sgn[static_cast<int>(k) - kDCTBlockSize];
824
5.14M
      }
825
9.08M
      sign_ctx = sign_ctx * kDCTBlockSize + k;
826
9.08M
      Prob& sign_p = c.sign_prob[sign_ctx];
827
9.08M
      sign = ac.ReadBit(sign_p.get_proba(), in);
828
9.08M
      sign_p.Add(sign);
829
9.08M
      c.prev_sgn[k] = sign + 1;
830
9.08M
      sign = 1 - 2 * sign;
831
9.08M
      const size_t z_dens_ctx =
832
9.08M
          ZeroDensityContext(num_nonzeros, k, c.context_bits);
833
9.08M
      size_t histo_ix = z_dens_ctx * kNumAvrgContexts + avg_ctx;
834
9.08M
      size_t entropy_ix = c.context_map[histo_ix];
835
9.08M
      int code = ans.ReadSymbol(c.entropy_codes[entropy_ix], in);
836
9.08M
      if (code < kNumDirectCodes) {
837
4.69M
        abs_val = code + 1;
838
4.69M
      } else {
839
4.38M
        int nbits = code - kNumDirectCodes;
840
4.38M
        Prob& p = c.first_extra_bit_prob[k * 10 + nbits];
841
4.38M
        int first_extra_bit = ac.ReadBit(p.get_proba(), in);
842
4.38M
        p.Add(first_extra_bit);
843
4.38M
        int extra_bits_val = first_extra_bit << nbits;
844
4.38M
        if (nbits > 0) {
845
3.62M
          extra_bits_val |= br.ReadBits(nbits, in);
846
3.62M
        }
847
4.38M
        abs_val = kNumDirectCodes - 1 + (2u << nbits) + extra_bits_val;
848
4.38M
      }
849
9.08M
      ++num_nonzeros;
850
31.0M
    } else {
851
31.0M
      c.prev_sgn[k] = 0;
852
31.0M
    }
853
40.1M
    int coeff = sign * abs_val;
854
40.1M
    c.coeffs[k_nat] = coeff;
855
40.1M
    c.prev_abs[k] = abs_val;
856
40.1M
  }
857
858
2.98M
  *c.ans = ans;
859
2.98M
  *c.br = br;
860
2.98M
  *c.ac = ac;
861
862
2.98M
  return num_nonzeros;
863
2.98M
}
864
865
178k
BrunsliStatus DecodeAC(State* state, WordSource* in) {
866
178k
  const std::vector<ComponentMeta>& meta = state->meta;
867
178k
  const size_t num_components = meta.size();
868
178k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
869
178k
  InternalState& s = *state->internal;
870
178k
  AcDcState& ac_dc_state = s.ac_dc;
871
872
178k
  std::vector<ComponentState>& comps = ac_dc_state.ac;
873
178k
  if (comps.empty()) {
874
9.51k
    comps.resize(num_components);
875
19.8k
    for (size_t c = 0; c < num_components; ++c) {
876
10.3k
      comps[c].SetWidth(meta[c].width_in_blocks);
877
10.3k
      ComputeACPredictMultipliers(&meta[c].quant[0], comps[c].mult_row,
878
10.3k
                                  comps[c].mult_col);
879
10.3k
    }
880
9.51k
  }
881
882
178k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
883
106k
  EnsureSubdecodersInitialized(state, in);
884
885
106k
  if (!ac_dc_state.ac_coeffs_order_decoded) {
886
77.1k
    while (ac_dc_state.next_component < num_components) {
887
68.1k
      if (!in->CanRead(121)) return BRUNSLI_NOT_ENOUGH_DATA;
888
10.0k
      if (!DecodeCoeffOrder(comps[ac_dc_state.next_component].order,
889
10.0k
                            &s.bit_reader, in)) {
890
353
        return BRUNSLI_INVALID_BRN;
891
353
      }
892
9.65k
      ac_dc_state.next_component++;
893
9.65k
    }
894
8.99k
    ac_dc_state.next_component = 0;
895
8.99k
    ac_dc_state.ac_coeffs_order_decoded = true;
896
8.99k
  }
897
898
47.7k
  AcBlockCookie c;
899
47.7k
  c.ac = &s.arith_decoder;
900
47.7k
  c.in = in;
901
47.7k
  c.ans = &s.ans_decoder;
902
47.7k
  c.br = &s.bit_reader;
903
47.7k
  c.entropy_codes = state->entropy_codes;
904
47.7k
  c.context_modes =
905
47.7k
      kContextAlgorithm + (state->use_legacy_context_model ? 64 : 0);
906
907
259k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
908
463k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
909
251k
      ComponentState& cst = comps[i];
910
251k
      c.prev_num_nonzeros = cst.prev_num_nonzeros.data();
911
251k
      c.num_nonzero_prob = cst.num_nonzero_prob;
912
251k
      c.is_zero_prob = cst.is_zero_prob.data();
913
251k
      c.order = cst.order;
914
251k
      c.mult_col = cst.mult_col;
915
251k
      c.mult_row = cst.mult_row;
916
251k
      c.sign_prob = cst.sign_prob.data();
917
251k
      c.first_extra_bit_prob = cst.first_extra_bit_prob.data();
918
251k
      const ComponentMeta& m = meta[i];
919
251k
      c.context_map = state->context_map + m.context_offset * kNumAvrgContexts;
920
251k
      c.context_bits = m.context_bits;
921
251k
      const int width = m.width_in_blocks;
922
251k
      const size_t ac_stride = m.ac_stride;
923
251k
      const size_t b_stride = m.b_stride;
924
251k
      const int next_iy = ac_dc_state.next_iy;
925
251k
      c.y = mcu_y * m.v_samp + next_iy;
926
251k
      c.prev_row_delta = (1 - 2 * (c.y & 1u)) * (width + 3) * kDCTBlockSize;
927
864k
      for (int iy = next_iy; iy < m.v_samp; ++iy, ++c.y) {
928
651k
        const int next_x = ac_dc_state.next_x;
929
651k
        const size_t block_offset = next_x * kDCTBlockSize;
930
651k
        c.coeffs = m.ac_coeffs + c.y * ac_stride + block_offset;
931
651k
        c.prev_row_coeffs = c.coeffs - ac_stride;
932
651k
        c.prev_col_coeffs = c.coeffs - kDCTBlockSize;
933
651k
        const uint8_t* block_state = m.block_state + c.y * b_stride + next_x;
934
651k
        c.prev_sgn = &cst.prev_sign[kDCTBlockSize] + block_offset;
935
651k
        c.prev_abs = &cst.prev_abs_coeff[((c.y & 1u) * (width + 3) + 2) *
936
651k
                                         kDCTBlockSize] +
937
651k
                     block_offset;
938
20.7M
        for (c.x = next_x; c.x < width; ++c.x) {
939
20.1M
          bool is_empty = *(block_state++);
940
20.1M
          if (!is_empty) {
941
3.02M
            if (BRUNSLI_PREDICT_FALSE(!in->CanRead(297))) {
942
38.8k
              ac_dc_state.next_mcu_y = mcu_y;
943
38.8k
              ac_dc_state.next_component = i;
944
38.8k
              ac_dc_state.next_iy = iy;
945
38.8k
              ac_dc_state.next_x = c.x;
946
38.8k
              return BRUNSLI_NOT_ENOUGH_DATA;
947
38.8k
            }
948
2.98M
            size_t num_nonzeros = DecodeAcBlock(c);
949
2.98M
            BRUNSLI_DCHECK(num_nonzeros <= kNumNonZeroTreeSize);
950
2.98M
            c.prev_num_nonzeros[c.x] = static_cast<uint8_t>(num_nonzeros);
951
17.1M
          } else {
952
17.1M
            DecodeEmptyAcBlock(c.prev_sgn, c.prev_abs);
953
17.1M
            c.prev_num_nonzeros[c.x] = 0;
954
17.1M
          }
955
20.1M
          c.coeffs += kDCTBlockSize;
956
20.1M
          c.prev_sgn += kDCTBlockSize;
957
20.1M
          c.prev_abs += kDCTBlockSize;
958
20.1M
          c.prev_row_coeffs += kDCTBlockSize;
959
20.1M
          c.prev_col_coeffs += kDCTBlockSize;
960
20.1M
        }
961
613k
        c.prev_row_delta *= -1;
962
613k
        ac_dc_state.next_x = 0;
963
613k
      }
964
212k
      ac_dc_state.next_iy = 0;
965
212k
    }
966
211k
    ac_dc_state.next_component = 0;
967
211k
  }
968
8.89k
  ac_dc_state.next_mcu_y = 0;
969
970
8.89k
  comps.clear();
971
8.89k
  comps.shrink_to_fit();
972
973
8.89k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
974
975
8.24k
  return BRUNSLI_OK;
976
8.89k
}
977
978
668k
static bool CheckCanRead(State* state, size_t required) {
979
  // TODO(eustas): dcheck len > pos
980
668k
  size_t available = state->len - state->pos;
981
668k
  return required <= available;
982
668k
}
983
984
335k
static bool CheckCanReadByte(State* state) {
985
  // TODO(eustas): dcheck len > pos
986
335k
  return state->pos != state->len;
987
335k
}
988
989
206k
static uint8_t ReadByte(State* state) {
990
  // TODO(eustas): dcheck len > pos
991
206k
  return state->data[state->pos++];
992
206k
}
993
994
403k
static uint8_t PeekByte(State* state, size_t offset) {
995
  // TODO(eustas): dcheck overflow.
996
403k
  return state->data[state->pos + offset];
997
403k
}
998
999
1.49M
static void SkipBytes(State* state, size_t len) {
1000
  // TODO(eustas): dcheck overflow.
1001
1.49M
  state->pos += len;
1002
1.49M
}
1003
1004
3.42M
static size_t GetBytesAvailable(State* state) {
1005
  // TODO(eustas): dcheck len > pos
1006
3.42M
  return state->len - state->pos;
1007
3.42M
}
1008
1009
943k
static size_t SkipAvailableBytes(State* state, size_t len) {
1010
943k
  size_t available = GetBytesAvailable(state);
1011
943k
  size_t skip_bytes = std::min(available, len);
1012
943k
  state->pos += skip_bytes;
1013
943k
  return skip_bytes;
1014
943k
}
1015
1016
387k
static BrunsliStatus DecodeBase128(State* state, size_t* val) {
1017
387k
  *val = 0;
1018
387k
  uint64_t b = 0x80;
1019
387k
  size_t i = 0;
1020
790k
  while ((i < 9) && (b & 0x80u)) {
1021
553k
    if (!CheckCanRead(state, i + 1)) return BRUNSLI_NOT_ENOUGH_DATA;
1022
403k
    b = PeekByte(state, i);
1023
403k
    *val |= (b & 0x7Fu) << (i * 7);
1024
403k
    ++i;
1025
403k
  }
1026
236k
  SkipBytes(state, i);
1027
236k
  return ((b & 0x80u) == 0) ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1028
387k
}
1029
1030
2.29M
static Stage Fail(State* state, BrunsliStatus result) {
1031
2.29M
  InternalState& s = *state->internal;
1032
2.29M
  s.result = result;
1033
  // Preserve current stage for continuation / error reporting.
1034
2.29M
  s.last_stage = state->stage;
1035
2.29M
  return Stage::ERROR;
1036
2.29M
}
1037
1038
335k
static BrunsliStatus ReadTag(State* state, SectionState* section) {
1039
335k
  if (!CheckCanReadByte(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1040
206k
  const uint8_t marker = ReadByte(state);
1041
1042
206k
  const size_t tag = marker >> 3u;
1043
206k
  if (tag == 0 || tag > 15) return BRUNSLI_INVALID_BRN;
1044
205k
  section->tag = tag;
1045
1046
205k
  const size_t wiring_type = marker & 0x7u;
1047
205k
  if (wiring_type != kBrunsliWiringTypeVarint &&
1048
108k
      wiring_type != kBrunsliWiringTypeLengthDelimited) {
1049
44
    return BRUNSLI_INVALID_BRN;
1050
44
  }
1051
205k
  section->is_section = (wiring_type == kBrunsliWiringTypeLengthDelimited);
1052
1053
205k
  const uint32_t tag_bit = 1u << tag;
1054
205k
  if (section->tags_met & tag_bit) {
1055
28
    BRUNSLI_LOG_ERROR() << "Duplicate marker " << std::hex
1056
28
                        << static_cast<int>(marker) << BRUNSLI_ENDL();
1057
28
    return BRUNSLI_INVALID_BRN;
1058
28
  }
1059
205k
  section->tags_met |= tag_bit;
1060
1061
205k
  return BRUNSLI_OK;
1062
205k
}
1063
1064
170k
static BrunsliStatus EnterSection(State* state, SectionState* section) {
1065
170k
  size_t section_size;
1066
170k
  BrunsliStatus status = DecodeBase128(state, &section_size);
1067
170k
  if (status != BRUNSLI_OK) return status;
1068
99.5k
  section->is_active = true;
1069
99.5k
  section->remaining = section_size;
1070
99.5k
  section->milestone = state->pos;
1071
99.5k
  section->projected_end = state->pos + section->remaining;
1072
99.5k
  return BRUNSLI_OK;
1073
170k
}
1074
1075
26.4k
static void LeaveSection(SectionState* section) {
1076
26.4k
  section->is_active = false;
1077
26.4k
}
1078
1079
2.94M
static bool IsOutOfSectionBounds(State* state) {
1080
2.94M
  return state->pos > state->internal->section.projected_end;
1081
2.94M
}
1082
1083
2.94M
static size_t RemainingSectionLength(State* state) {
1084
  // TODO(eustas): remove this check?
1085
2.94M
  if (IsOutOfSectionBounds(state)) return 0;
1086
2.93M
  return state->internal->section.projected_end - state->pos;
1087
2.94M
}
1088
1089
304k
static bool IsAtSectionBoundary(State* state) {
1090
304k
  return state->pos == state->internal->section.projected_end;
1091
304k
}
1092
1093
114k
Stage VerifySignature(State* state) {
1094
114k
  InternalState& s = *state->internal;
1095
1096
114k
  if (!CheckCanRead(state, kBrunsliSignatureSize)) {
1097
86.2k
    return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1098
86.2k
  }
1099
27.7k
  const bool is_signature_ok =
1100
27.7k
      (memcmp(state->data + state->pos, kBrunsliSignature,
1101
27.7k
              kBrunsliSignatureSize) != 0);
1102
27.7k
  state->pos += kBrunsliSignatureSize;
1103
27.7k
  s.section.tags_met |= 1u << kBrunsliSignatureTag;
1104
27.7k
  if (is_signature_ok) return Fail(state, BRUNSLI_INVALID_BRN);
1105
27.6k
  return Stage::HEADER;
1106
27.7k
}
1107
1108
// Parses the brunsli header starting at data[*pos] and fills in *jpg.
1109
// Sets *pos to the position after the header.
1110
// Returns BRUNSLI_OK, unless the data is not valid brunsli byte stream
1111
// or is truncated.
1112
1.11M
Stage DecodeHeader(State* state, JPEGData* jpg) {
1113
1.11M
  InternalState& s = *state->internal;
1114
1.11M
  HeaderState& hs = s.header;
1115
1116
1.44M
  while (hs.stage != HeaderState::DONE) {
1117
1.42M
    switch (hs.stage) {
1118
56.2k
      case HeaderState::READ_TAG: {
1119
56.2k
        BrunsliStatus status = ReadTag(state, &s.section);
1120
56.2k
        if (status != BRUNSLI_OK) return Fail(state, status);
1121
27.5k
        if (s.section.tag != kBrunsliHeaderTag || !s.section.is_section) {
1122
10
          return Fail(state, BRUNSLI_INVALID_BRN);
1123
10
        }
1124
27.5k
        hs.stage = HeaderState::ENTER_SECTION;
1125
27.5k
        break;
1126
27.5k
      }
1127
1128
42.5k
      case HeaderState::ENTER_SECTION: {
1129
42.5k
        BrunsliStatus status = EnterSection(state, &s.section);
1130
42.5k
        if (status != BRUNSLI_OK) return Fail(state, status);
1131
27.5k
        hs.stage = HeaderState::ITEM_READ_TAG;
1132
27.5k
        break;
1133
42.5k
      }
1134
1135
189k
      case HeaderState::ITEM_READ_TAG: {
1136
189k
        if (IsAtSectionBoundary(state)) {
1137
26.9k
          hs.stage = HeaderState::FINALE;
1138
26.9k
          break;
1139
26.9k
        }
1140
162k
        BrunsliStatus status = ReadTag(state, &hs.section);
1141
162k
        if (status != BRUNSLI_OK) return Fail(state, status);
1142
106k
        const uint32_t tag_bit = 1u << hs.section.tag;
1143
106k
        if (hs.section.is_section) {
1144
9.13k
          if (kKnownHeaderVarintTags & tag_bit) {
1145
8.96k
            Fail(state, BRUNSLI_INVALID_BRN);
1146
8.96k
          }
1147
9.13k
          hs.stage = HeaderState::ITEM_ENTER_SECTION;
1148
9.13k
          break;
1149
9.13k
        }
1150
96.9k
        hs.stage = HeaderState::ITEM_READ_VALUE;
1151
96.9k
        break;
1152
106k
      }
1153
1154
15.0k
      case HeaderState::ITEM_ENTER_SECTION: {
1155
15.0k
        BrunsliStatus status = DecodeBase128(state, &hs.remaining_skip_length);
1156
15.0k
        if (status != BRUNSLI_OK) return Fail(state, status);
1157
9.10k
        hs.stage = HeaderState::ITEM_SKIP_CONTENTS;
1158
9.10k
        break;
1159
15.0k
      }
1160
1161
943k
      case HeaderState::ITEM_SKIP_CONTENTS: {
1162
943k
        size_t bytes_skipped =
1163
943k
            SkipAvailableBytes(state, hs.remaining_skip_length);
1164
943k
        hs.remaining_skip_length -= bytes_skipped;
1165
943k
        if (hs.remaining_skip_length > 0) {
1166
934k
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1167
934k
        }
1168
8.85k
        hs.stage = HeaderState::ITEM_READ_TAG;
1169
8.85k
        break;
1170
943k
      }
1171
1172
149k
      case HeaderState::ITEM_READ_VALUE: {
1173
149k
        size_t value;
1174
149k
        BrunsliStatus status = DecodeBase128(state, &value);
1175
149k
        if (status != BRUNSLI_OK) return Fail(state, status);
1176
96.8k
        hs.varint_values[hs.section.tag] = value;
1177
96.8k
        hs.stage = HeaderState::ITEM_READ_TAG;
1178
96.8k
        break;
1179
149k
      }
1180
1181
26.9k
      case HeaderState::FINALE: {
1182
26.9k
        const bool has_version =
1183
26.9k
            hs.section.tags_met & (1u << kBrunsliHeaderVersionCompTag);
1184
26.9k
        if (!has_version) return Fail(state, BRUNSLI_INVALID_BRN);
1185
26.9k
        const size_t version_and_comp_count =
1186
26.9k
            hs.varint_values[kBrunsliHeaderVersionCompTag];
1187
1188
26.9k
        const size_t version = version_and_comp_count >> 2u;
1189
26.9k
        jpg->version = static_cast<int>(version);
1190
1191
26.9k
        if (version == 1) {  // fallback mode
1192
          // TODO(eustas): do we need this?
1193
612
          jpg->width = 0;
1194
612
          jpg->height = 0;
1195
612
          hs.stage = HeaderState::DONE;
1196
612
          break;
1197
612
        }
1198
1199
        // Wrong mode = fallback + something.
1200
26.3k
        if ((version & 1u) != 0) {
1201
35
          return Fail(state, BRUNSLI_INVALID_BRN);
1202
35
        }
1203
        // Unknown mode - only 3 bits are defined.
1204
26.2k
        if ((version & ~0x7u) != 0) {
1205
77
          return Fail(state, BRUNSLI_INVALID_BRN);
1206
77
        }
1207
1208
        // Otherwise regular brunsli.
1209
26.2k
        state->use_legacy_context_model = !(version & 2);
1210
1211
        // Do not allow "original_jpg" for regular Brunsli files.
1212
26.2k
        s.section.tags_met |= 1u << kBrunsliOriginalJpgTag;
1213
1214
26.2k
        const bool has_width =
1215
26.2k
            hs.section.tags_met & (1u << kBrunsliHeaderWidthTag);
1216
26.2k
        if (!has_width) return Fail(state, BRUNSLI_INVALID_BRN);
1217
26.2k
        const size_t width = hs.varint_values[kBrunsliHeaderWidthTag];
1218
26.2k
        const bool has_height =
1219
26.2k
            hs.section.tags_met & (1u << kBrunsliHeaderHeightTag);
1220
26.2k
        if (!has_height) return Fail(state, BRUNSLI_INVALID_BRN);
1221
26.2k
        const size_t height = hs.varint_values[kBrunsliHeaderHeightTag];
1222
1223
26.2k
        if (width == 0 || height == 0) return Fail(state, BRUNSLI_INVALID_BRN);
1224
26.1k
        if (width > kMaxDimPixels || height > kMaxDimPixels) {
1225
295
          return Fail(state, BRUNSLI_INVALID_BRN);
1226
295
        }
1227
25.9k
        jpg->width = static_cast<int>(width);
1228
25.9k
        jpg->height = static_cast<int>(height);
1229
1230
25.9k
        const size_t num_components = (version_and_comp_count & 3u) + 1u;
1231
25.9k
        jpg->components.resize(num_components);
1232
1233
25.9k
        const bool has_subsampling =
1234
25.9k
            hs.section.tags_met & (1u << kBrunsliHeaderSubsamplingTag);
1235
25.9k
        if (!has_subsampling) return Fail(state, BRUNSLI_INVALID_BRN);
1236
25.8k
        size_t subsampling_code =
1237
25.8k
            hs.varint_values[kBrunsliHeaderSubsamplingTag];
1238
1239
66.8k
        for (size_t i = 0; i < jpg->components.size(); ++i) {
1240
41.0k
          JPEGComponent* c = &jpg->components[i];
1241
41.0k
          c->v_samp_factor = (subsampling_code & 0xFu) + 1;
1242
41.0k
          subsampling_code >>= 4u;
1243
41.0k
          c->h_samp_factor = (subsampling_code & 0xFu) + 1;
1244
41.0k
          subsampling_code >>= 4u;
1245
41.0k
          if (c->v_samp_factor > kBrunsliMaxSampling) {
1246
2
            return Fail(state, BRUNSLI_INVALID_BRN);
1247
2
          }
1248
41.0k
          if (c->h_samp_factor > kBrunsliMaxSampling) {
1249
2
            return Fail(state, BRUNSLI_INVALID_BRN);
1250
2
          }
1251
41.0k
        }
1252
25.8k
        if (!UpdateSubsamplingDerivatives(jpg)) {
1253
2
          return Fail(state, BRUNSLI_INVALID_BRN);
1254
2
        }
1255
1256
25.8k
        PrepareMeta(jpg, state);
1257
1258
25.8k
        hs.stage = HeaderState::DONE;
1259
25.8k
        break;
1260
25.8k
      }
1261
1262
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
1263
1.42M
    }
1264
1.42M
  }
1265
1266
26.4k
  LeaveSection(&s.section);
1267
26.4k
  return (jpg->version == kFallbackVersion) ? Stage::FALLBACK : Stage::SECTION;
1268
1.11M
}
1269
1270
188k
static BrunsliStatus DecodeMetaDataSection(State* state, JPEGData* jpg) {
1271
188k
  InternalState& s = *state->internal;
1272
188k
  MetadataState& ms = s.metadata;
1273
1274
188k
  if (ms.decompression_stage == MetadataDecompressionStage::DONE) {
1275
0
    return BRUNSLI_INVALID_BRN;
1276
0
  }
1277
1278
188k
  if (ms.decompression_stage == MetadataDecompressionStage::INITIAL) {
1279
6.45k
    if (IsAtSectionBoundary(state)) {
1280
6
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1281
6
      return BRUNSLI_OK;
1282
6
    }
1283
6.45k
    if (RemainingSectionLength(state) == 1) {
1284
128
      if (!CheckCanReadByte(state)) {
1285
51
        return BRUNSLI_NOT_ENOUGH_DATA;
1286
51
      }
1287
77
      uint8_t data[1];
1288
77
      data[0] = ReadByte(state);
1289
77
      bool ok = ProcessMetaData(data, 1, &ms, jpg) && ms.CanFinish();
1290
77
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1291
77
      return ok ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1292
128
    }
1293
6.32k
    ms.decompression_stage =
1294
6.32k
        MetadataDecompressionStage::READ_LENGTH;
1295
6.32k
  }
1296
1297
187k
  if (ms.decompression_stage == MetadataDecompressionStage::READ_LENGTH) {
1298
11.7k
    BrunsliStatus status = DecodeBase128(state, &ms.metadata_size);
1299
11.7k
    if (status != BRUNSLI_OK) return status;
1300
    // TODO(eustas): ms.metadata_size should be limited to avoid "zip-bombs".
1301
6.17k
    if (IsOutOfSectionBounds(state)) return BRUNSLI_INVALID_BRN;
1302
6.17k
    if (RemainingSectionLength(state) == 0) return BRUNSLI_INVALID_BRN;
1303
6.17k
    ms.brotli = BrotliDecoderCreateInstance(nullptr, nullptr, nullptr);
1304
6.17k
    if (ms.brotli == nullptr) return BRUNSLI_DECOMPRESSION_ERROR;
1305
6.17k
    ms.decompression_stage = MetadataDecompressionStage::DECOMPRESSING;
1306
6.17k
  }
1307
1308
182k
  if (ms.decompression_stage == MetadataDecompressionStage::DECOMPRESSING) {
1309
    // Free Brotli decoder and return result
1310
182k
    const auto finish_decompression = [&ms] (BrunsliStatus result) {
1311
2.99k
      BRUNSLI_DCHECK(ms.brotli != nullptr);
1312
2.99k
      BrotliDecoderDestroyInstance(ms.brotli);
1313
2.99k
      ms.brotli = nullptr;
1314
2.99k
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1315
2.99k
      return result;
1316
2.99k
    };
1317
1318
366k
    while (true) {
1319
366k
      size_t available_bytes =
1320
366k
          std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1321
366k
      size_t available_in = available_bytes;
1322
366k
      const uint8_t* next_in = state->data + state->pos;
1323
366k
      size_t available_out = 0;
1324
366k
      BrotliDecoderResult result = BrotliDecoderDecompressStream(
1325
366k
          ms.brotli, &available_in, &next_in, &available_out, nullptr, nullptr);
1326
366k
      if (result == BROTLI_DECODER_RESULT_ERROR) {
1327
1.38k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1328
1.38k
      }
1329
364k
      size_t chunk_size = 0;
1330
364k
      const uint8_t* chunk_data =
1331
364k
          BrotliDecoderTakeOutput(ms.brotli, &chunk_size);
1332
364k
      ms.decompressed_size += chunk_size;
1333
364k
      if (ms.decompressed_size > ms.metadata_size) {
1334
1.05k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1335
1.05k
      }
1336
363k
      size_t consumed_bytes = available_bytes - available_in;
1337
363k
      SkipBytes(state, consumed_bytes);
1338
363k
      bool chunk_ok = ProcessMetaData(chunk_data, chunk_size, &ms, jpg);
1339
363k
      if (!chunk_ok) return finish_decompression(BRUNSLI_INVALID_BRN);
1340
363k
      if (result == BROTLI_DECODER_RESULT_SUCCESS) {
1341
305
        if (RemainingSectionLength(state) != 0) {
1342
215
          return finish_decompression(BRUNSLI_INVALID_BRN);
1343
215
        }
1344
90
        if (ms.decompressed_size != ms.metadata_size) {
1345
86
          return finish_decompression(BRUNSLI_INVALID_BRN);
1346
86
        }
1347
4
        if (!ms.CanFinish()) return finish_decompression(BRUNSLI_INVALID_BRN);
1348
3
        return finish_decompression(BRUNSLI_OK);
1349
4
      }
1350
363k
      if (result == BROTLI_DECODER_RESULT_NEEDS_MORE_OUTPUT) continue;
1351
179k
      BRUNSLI_DCHECK(result == BROTLI_DECODER_RESULT_NEEDS_MORE_INPUT);
1352
179k
      if (RemainingSectionLength(state) == 0) {
1353
28
        return finish_decompression(BRUNSLI_INVALID_BRN);
1354
28
      }
1355
179k
      return BRUNSLI_NOT_ENOUGH_DATA;
1356
179k
    }
1357
182k
  }
1358
1359
  // Unreachable.
1360
0
  BRUNSLI_DCHECK(false);
1361
0
  return BRUNSLI_DECOMPRESSION_ERROR;
1362
182k
}
1363
1364
/**
1365
 * Wraps result, depending on the state of input.
1366
 *
1367
 * If parser needs more data, but section data is depleted,
1368
 * then input is corrupted.
1369
 */
1370
611k
static BrunsliStatus CheckBoundary(State* state, BrunsliStatus result) {
1371
611k
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
1372
552k
    bool last = (RemainingSectionLength(state) <= GetBytesAvailable(state));
1373
552k
    return last ? BRUNSLI_INVALID_BRN : BRUNSLI_NOT_ENOUGH_DATA;
1374
552k
  } else {
1375
59.6k
    return result;
1376
59.6k
  }
1377
611k
}
1378
1379
595k
static void PrepareBitReader(BrunsliBitReader* br, State* state) {
1380
595k
  size_t chunk_len =
1381
595k
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1382
595k
  BrunsliBitReaderResume(br, state->data + state->pos, chunk_len);
1383
595k
  BRUNSLI_DCHECK(BrunsliBitReaderIsHealthy(br));
1384
595k
}
1385
1386
/**
1387
 * Marks data used by bit-reader as consumed.
1388
 */
1389
static BrunsliStatus SuspendBitReader(BrunsliBitReader* br, State* state,
1390
595k
                                      BrunsliStatus result) {
1391
595k
  size_t chunk_len =
1392
595k
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1393
595k
  size_t unused_bytes = BrunsliBitReaderSuspend(br);
1394
595k
  size_t consumed_bytes = chunk_len - unused_bytes;
1395
595k
  SkipBytes(state, consumed_bytes);
1396
595k
  result = CheckBoundary(state, result);
1397
  // Once BitReader becomes unhealthy, further decoding should be impossible.
1398
595k
  BRUNSLI_DCHECK(
1399
595k
      BrunsliBitReaderIsHealthy(br) ||
1400
595k
      ((result != BRUNSLI_OK) && (result != BRUNSLI_NOT_ENOUGH_DATA)));
1401
595k
  return result;
1402
595k
}
1403
1404
502k
static BrunsliStatus DecodeJPEGInternalsSection(State* state, JPEGData* jpg) {
1405
502k
  InternalState& s = *state->internal;
1406
502k
  JpegInternalsState& js = s.internals;
1407
502k
  BrunsliBitReader* br = &js.br;
1408
1409
502k
  if (js.stage == JpegInternalsState::INIT) {
1410
19.0k
    BrunsliBitReaderInit(br);
1411
19.0k
    js.stage = JpegInternalsState::READ_MARKERS;
1412
19.0k
  }
1413
502k
  PrepareBitReader(br, state);
1414
1415
502k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1416
502k
    return SuspendBitReader(br, state, result);
1417
502k
  };
1418
1419
502k
  if (js.stage == JpegInternalsState::READ_MARKERS) {
1420
2.51M
    while (true) {
1421
2.51M
      if (!BrunsliBitReaderCanRead(br, 6)) {
1422
316k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1423
316k
      }
1424
2.19M
      uint8_t marker = 0xc0 + BrunsliBitReaderRead(br, 6);
1425
2.19M
      jpg->marker_order.push_back(marker);
1426
2.19M
      if (marker == 0xc4) ++js.dht_count;
1427
2.19M
      if (marker == 0xdd) js.have_dri = true;
1428
2.19M
      if (marker == 0xda) ++js.num_scans;
1429
2.19M
      if (marker == 0xd9) break;
1430
2.19M
    }
1431
18.6k
    js.stage = JpegInternalsState::READ_DRI;
1432
18.6k
  }
1433
1434
186k
  if (js.stage == JpegInternalsState::READ_DRI) {
1435
22.0k
    if (js.have_dri) {
1436
6.48k
      if (!BrunsliBitReaderCanRead(br, 16)) {
1437
3.58k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1438
3.58k
      }
1439
2.90k
      jpg->restart_interval = BrunsliBitReaderRead(br, 16);
1440
2.90k
    }
1441
18.5k
    js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
1442
18.5k
  }
1443
1444
182k
  if (js.stage & JpegInternalsState::DECODE_HUFFMAN_MASK) {
1445
62.2k
    BrunsliStatus status = DecodeHuffmanCode(state, jpg);
1446
62.2k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1447
17.9k
    js.stage = JpegInternalsState::PREPARE_READ_SCANS;
1448
17.9k
  }
1449
1450
138k
  if (js.stage == JpegInternalsState::PREPARE_READ_SCANS) {
1451
17.9k
    if (js.dht_count != js.terminal_huffman_code_count) {
1452
237
      BRUNSLI_LOG_ERROR() << "Invalid number of DHT markers" << BRUNSLI_ENDL();
1453
237
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1454
237
    }
1455
17.7k
    if (js.num_scans > 0) {
1456
9.24k
      jpg->scan_info.resize(js.num_scans);
1457
9.24k
      js.i = 0;
1458
9.24k
      js.stage = JpegInternalsState::READ_SCAN_COMMON;
1459
9.24k
    } else {
1460
8.50k
      js.stage = JpegInternalsState::READ_NUM_QUANT;
1461
8.50k
    }
1462
17.7k
  }
1463
1464
138k
  if (js.stage & JpegInternalsState::DECODE_SCAN_MASK) {
1465
91.1k
    BrunsliStatus status = DecodeScanInfo(state, jpg);
1466
91.1k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1467
8.78k
    js.stage = JpegInternalsState::READ_NUM_QUANT;
1468
8.78k
  }
1469
1470
55.6k
  if (js.stage == JpegInternalsState::READ_NUM_QUANT) {
1471
18.5k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1472
1.41k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1473
1.41k
    }
1474
17.0k
    int num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1475
17.0k
    jpg->quant.resize(num_quant_tables);
1476
17.0k
    js.i = 0;
1477
17.0k
    js.stage = JpegInternalsState::READ_QUANT;
1478
17.0k
  }
1479
1480
71.4k
  while (js.stage == JpegInternalsState::READ_QUANT) {
1481
43.3k
    if (js.i >= jpg->quant.size()) {
1482
16.6k
      js.stage = JpegInternalsState::READ_COMP_ID_SCHEME;
1483
16.6k
      break;
1484
16.6k
    }
1485
    // 6 or 7 bits are used, but we know that at least one more bit is
1486
    // guaranteed to be used by varint out of the loop.
1487
26.6k
    if (!BrunsliBitReaderCanRead(br, 7)) {
1488
9.33k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1489
9.33k
    }
1490
17.3k
    JPEGQuantTable* q = &jpg->quant[js.i];
1491
17.3k
    q->index = BrunsliBitReaderRead(br, 2);
1492
17.3k
    q->is_last = (js.i == jpg->quant.size() - 1) || BrunsliBitReaderRead(br, 1);
1493
17.3k
    q->precision = BrunsliBitReaderRead(br, 4);
1494
17.3k
    if (q->precision > 1) {
1495
212
      BRUNSLI_LOG_ERROR() << "Invalid quantization table precision: "
1496
212
                          << q->precision << BRUNSLI_ENDL();
1497
212
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1498
212
    }
1499
    // note that q->values[] are initialized to invalid 0 values.
1500
17.1k
    ++js.i;
1501
17.1k
  }
1502
1503
44.7k
  if (js.stage == JpegInternalsState::READ_COMP_ID_SCHEME) {
1504
16.7k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1505
214
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1506
214
    }
1507
16.5k
    int comp_ids = BrunsliBitReaderRead(br, 2);
1508
16.5k
    static const size_t kMinRequiredComponents[4] = {
1509
16.5k
        3 /* Ids123*/, 1 /* IdsGray */, 3 /* IdsRGB */, 0 /* IdsCustom */
1510
16.5k
    };
1511
16.5k
    if (jpg->components.size() < kMinRequiredComponents[comp_ids]) {
1512
21
      BRUNSLI_LOG_ERROR() << "Insufficient number of components for ColorId #"
1513
21
                          << comp_ids << BRUNSLI_ENDL();
1514
21
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1515
21
    }
1516
16.4k
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1517
16.4k
    if (comp_ids == kComponentIds123) {
1518
679
      jpg->components[0].id = 1;
1519
679
      jpg->components[1].id = 2;
1520
679
      jpg->components[2].id = 3;
1521
15.8k
    } else if (comp_ids == kComponentIdsGray) {
1522
14.8k
      jpg->components[0].id = 1;
1523
14.8k
    } else if (comp_ids == kComponentIdsRGB) {
1524
65
      jpg->components[0].id = 'R';
1525
65
      jpg->components[1].id = 'G';
1526
65
      jpg->components[2].id = 'B';
1527
894
    } else {
1528
894
      BRUNSLI_DCHECK(comp_ids == kComponentIdsCustom);
1529
894
      js.i = 0;
1530
894
      js.stage = JpegInternalsState::READ_COMP_ID;
1531
894
    }
1532
16.4k
  }
1533
1534
44.4k
  if (js.stage == JpegInternalsState::READ_COMP_ID) {
1535
2.35k
    while (js.i < jpg->components.size()) {
1536
1.51k
      if (!BrunsliBitReaderCanRead(br, 8)) {
1537
627
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1538
627
      }
1539
885
      jpg->components[js.i].id = BrunsliBitReaderRead(br, 8);
1540
885
      ++js.i;
1541
885
    }
1542
844
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1543
844
  }
1544
1545
43.8k
  if (js.stage == JpegInternalsState::READ_NUM_PADDING_BITS) {
1546
    // TODO(eustas): sanitize: should not be bigger than
1547
    //               7 x (num_scans + num_blocks / dri)
1548
    // security: limit is 32b for n_size
1549
17.0k
    if (!DecodeLimitedVarint<8>(&js.varint, br, 4)) {
1550
683
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1551
683
    }
1552
16.3k
    js.num_padding_bits = js.varint.value;
1553
16.3k
    jpg->has_zero_padding_bit = (js.num_padding_bits > 0);
1554
16.3k
    if (js.num_padding_bits > PaddingBitsLimit(*jpg)) {
1555
60
      BRUNSLI_LOG_ERROR() << "Suspicious number of padding bits "
1556
60
                          << js.num_padding_bits << BRUNSLI_ENDL();
1557
60
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1558
60
    }
1559
16.2k
    js.i = 0;
1560
16.2k
    js.stage = JpegInternalsState::READ_PADDING_BITS;
1561
16.2k
  }
1562
1563
43.1k
  if (js.stage == JpegInternalsState::READ_PADDING_BITS) {
1564
91.3k
    while (js.i < js.num_padding_bits) {
1565
75.1k
      if (!BrunsliBitReaderCanRead(br, 1)) {
1566
7.42k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1567
7.42k
      }
1568
67.6k
      jpg->padding_bits.emplace_back(BrunsliBitReaderRead(br, 1));
1569
67.6k
      ++js.i;
1570
67.6k
    }
1571
16.2k
    suspend_bit_reader(BRUNSLI_OK);
1572
16.2k
    BrunsliBitReaderFinish(br);
1573
16.2k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1574
16.1k
    js.i = 0;
1575
16.1k
    js.stage = JpegInternalsState::ITERATE_MARKERS;
1576
19.4k
  } else {
1577
    // no-op
1578
19.4k
    suspend_bit_reader(BRUNSLI_OK);
1579
19.4k
  }
1580
1581
1.09M
  while (true) {
1582
1.09M
    switch (js.stage) {
1583
1.01M
      case JpegInternalsState::ITERATE_MARKERS: {
1584
1.01M
        if (js.i >= jpg->marker_order.size()) {
1585
15.6k
          js.stage = JpegInternalsState::DONE;
1586
999k
        } else if (jpg->marker_order[js.i] == 0xFF) {
1587
24.4k
          js.stage = JpegInternalsState::READ_INTERMARKER_LENGTH;
1588
974k
        } else {
1589
974k
          ++js.i;
1590
974k
        }
1591
1.01M
        continue;
1592
0
      }
1593
1594
40.7k
      case JpegInternalsState::READ_INTERMARKER_LENGTH: {
1595
40.7k
        BrunsliStatus status = DecodeBase128(state, &js.intermarker_length);
1596
40.7k
        if (status != BRUNSLI_OK) return CheckBoundary(state, status);
1597
24.3k
        if (js.intermarker_length > RemainingSectionLength(state)) {
1598
111
          return BRUNSLI_INVALID_BRN;
1599
111
        }
1600
24.2k
        jpg->inter_marker_data.emplace_back();
1601
24.2k
        js.stage = JpegInternalsState::READ_INTERMARKER_DATA;
1602
24.2k
        continue;
1603
24.3k
      }
1604
1605
27.4k
      case JpegInternalsState::READ_INTERMARKER_DATA: {
1606
27.4k
        auto& dest = jpg->inter_marker_data.back();
1607
27.4k
        size_t piece_limit = js.intermarker_length - dest.size();
1608
27.4k
        size_t piece_size = std::min(piece_limit, GetBytesAvailable(state));
1609
27.4k
        Append(&dest, state->data + state->pos, piece_size);
1610
27.4k
        SkipBytes(state, piece_size);
1611
27.4k
        if (dest.size() < js.intermarker_length) {
1612
3.43k
          BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
1613
3.43k
          BRUNSLI_DCHECK(RemainingSectionLength(state) > 0);
1614
3.43k
          return BRUNSLI_NOT_ENOUGH_DATA;
1615
3.43k
        }
1616
23.9k
        ++js.i;
1617
23.9k
        js.stage = JpegInternalsState::ITERATE_MARKERS;
1618
23.9k
        continue;
1619
27.4k
      }
1620
1621
15.6k
      default: { /* no-op */ }
1622
1.09M
    }
1623
15.6k
    break;  // no matching stage has been found; exit the loop.
1624
1.09M
  }
1625
1626
15.6k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1627
1628
15.4k
  return BRUNSLI_OK;
1629
15.6k
}
1630
1631
26.0k
static BrunsliStatus DecodeQuantDataSection(State* state, JPEGData* jpg) {
1632
26.0k
  InternalState& s = *state->internal;
1633
26.0k
  QuantDataState& qs = s.quant;
1634
26.0k
  BrunsliBitReader* br = &qs.br;
1635
1636
26.0k
  if (qs.stage == QuantDataState::INIT) {
1637
13.1k
    BrunsliBitReaderInit(br);
1638
13.1k
    qs.stage = QuantDataState::READ_NUM_QUANT;
1639
13.1k
  }
1640
26.0k
  PrepareBitReader(br, state);
1641
1642
26.0k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1643
26.0k
    return SuspendBitReader(br, state, result);
1644
26.0k
  };
1645
1646
26.0k
  if (qs.stage == QuantDataState::READ_NUM_QUANT) {
1647
21.0k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1648
8.13k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1649
8.13k
    }
1650
12.9k
    size_t num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1651
12.9k
    if (jpg->quant.size() != num_quant_tables) {
1652
224
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1653
224
    }
1654
12.6k
    qs.predictor.resize(kDCTBlockSize);
1655
12.6k
    qs.i = 0;
1656
12.6k
    qs.stage = QuantDataState::READ_STOCK;
1657
12.6k
  }
1658
1659
128k
  while (true) {
1660
128k
    switch (qs.stage) {
1661
24.0k
      case QuantDataState::READ_STOCK: {
1662
24.0k
        if (qs.i >= jpg->quant.size()) {
1663
11.0k
          std::vector<uint8_t>().swap(qs.predictor);
1664
11.0k
          qs.i = 0;
1665
11.0k
          qs.stage = QuantDataState::READ_QUANT_IDX;
1666
11.0k
          continue;
1667
11.0k
        }
1668
        // Depending on еру 1-st bit, it is guaranteed that we will need to read
1669
        // at least 3 or 6 more bits.
1670
13.0k
        if (!BrunsliBitReaderCanRead(br, 4)) {
1671
205
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1672
205
        }
1673
12.8k
        qs.data_precision = 0;
1674
12.8k
        bool is_short = !BrunsliBitReaderRead(br, 1);
1675
12.8k
        if (is_short) {
1676
11.1k
          const size_t short_code = BrunsliBitReaderRead(br, 3);
1677
11.1k
          int32_t* table = jpg->quant[qs.i].values.data();
1678
11.1k
          size_t selector = (qs.i > 0) ? 1 : 0;
1679
723k
          for (size_t k = 0; k < kDCTBlockSize; ++k) {
1680
712k
            table[k] = kStockQuantizationTables[selector][short_code][k];
1681
712k
          }
1682
11.1k
          qs.stage = QuantDataState::UPDATE;
1683
11.1k
        } else {
1684
1.67k
          qs.stage = QuantDataState::READ_Q_FACTOR;
1685
1.67k
        }
1686
12.8k
        continue;
1687
13.0k
      }
1688
1689
2.35k
      case QuantDataState::READ_Q_FACTOR: {
1690
2.35k
        if (!BrunsliBitReaderCanRead(br, 6)) {
1691
901
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1692
901
        }
1693
1.45k
        const uint32_t q_factor = BrunsliBitReaderRead(br, 6);
1694
1.45k
        FillQuantMatrix(qs.i > 0, q_factor, qs.predictor.data());
1695
1.45k
        qs.j = 0;
1696
1.45k
        qs.delta = 0;
1697
1.45k
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1698
1.45k
        continue;
1699
2.35k
      }
1700
1701
32.9k
      case QuantDataState::READ_DIFF_IS_ZERO: {
1702
32.9k
        if (qs.j >= kDCTBlockSize) {
1703
376
          qs.stage = QuantDataState::UPDATE;
1704
376
          continue;
1705
376
        }
1706
32.5k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1707
2.06k
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1708
2.06k
        }
1709
30.4k
        if (BrunsliBitReaderRead(br, 1)) {
1710
6.92k
          qs.stage = QuantDataState::READ_DIFF_SIGN;
1711
23.5k
        } else {
1712
23.5k
          qs.stage = QuantDataState::APPLY_DIFF;
1713
23.5k
        }
1714
30.4k
        continue;
1715
32.5k
      }
1716
1717
7.16k
      case QuantDataState::READ_DIFF_SIGN: {
1718
7.16k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1719
462
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1720
462
        }
1721
6.70k
        qs.sign = BrunsliBitReaderRead(br, 1) ? -1 : 1;
1722
6.70k
        qs.stage = QuantDataState::READ_DIFF;
1723
6.70k
        continue;
1724
7.16k
      }
1725
1726
8.78k
      case QuantDataState::READ_DIFF: {
1727
8.78k
        if (!DecodeVarint(&qs.vs, br, 16)) {
1728
2.31k
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1729
2.31k
        }
1730
6.47k
        int diff = static_cast<int>(qs.vs.value) + 1;
1731
6.47k
        qs.delta += qs.sign * diff;
1732
6.47k
        qs.stage = QuantDataState::APPLY_DIFF;
1733
6.47k
        continue;
1734
8.78k
      }
1735
1736
30.0k
      case QuantDataState::APPLY_DIFF: {
1737
30.0k
        const int k = kJPEGNaturalOrder[qs.j];
1738
30.0k
        const int quant_value = qs.predictor[k] + qs.delta;
1739
30.0k
        jpg->quant[qs.i].values[k] = quant_value;
1740
30.0k
        if (quant_value <= 0) {
1741
193
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1742
193
        }
1743
29.8k
        if (quant_value >= 256) {
1744
15.5k
          qs.data_precision = 1;
1745
15.5k
        }
1746
29.8k
        if (quant_value >= 65536) {
1747
146
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1748
146
        }
1749
29.7k
        ++qs.j;
1750
29.7k
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1751
29.7k
        continue;
1752
29.8k
      }
1753
1754
11.5k
      case QuantDataState::UPDATE: {
1755
11.5k
        if (jpg->quant[qs.i].precision < qs.data_precision) {
1756
169
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1757
169
        }
1758
        // jpg->quant[qs.i].precision > qs.data_precision means that original
1759
        // JPEG1 was inefficiently encoded.
1760
11.3k
        ++qs.i;
1761
11.3k
        qs.stage = QuantDataState::READ_STOCK;
1762
11.3k
        continue;
1763
11.5k
      }
1764
1765
11.2k
      default: { /* no-op */ }
1766
128k
    }
1767
11.2k
    break;  // no matching stage has been found; exit the loop.
1768
128k
  }
1769
1770
33.9k
  while (qs.stage == QuantDataState::READ_QUANT_IDX) {
1771
23.2k
    if (qs.i >= jpg->components.size()) {
1772
10.6k
      qs.stage = QuantDataState::FINISH;
1773
10.6k
      continue;
1774
10.6k
    }
1775
12.6k
    JPEGComponent* c = &jpg->components[qs.i];
1776
12.6k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1777
453
       return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1778
453
    }
1779
12.1k
    c->quant_idx = BrunsliBitReaderRead(br, 2);
1780
12.1k
    if (c->quant_idx >= jpg->quant.size()) {
1781
168
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1782
168
    }
1783
11.9k
    ++qs.i;
1784
11.9k
  }
1785
1786
10.6k
  BRUNSLI_DCHECK(qs.stage == QuantDataState::FINISH);
1787
10.6k
  suspend_bit_reader(BRUNSLI_OK);
1788
10.6k
  BrunsliBitReaderFinish(br);
1789
10.6k
  if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1790
10.6k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1791
10.4k
  return BRUNSLI_OK;
1792
10.6k
}
1793
1794
66.5k
static BrunsliStatus DecodeHistogramDataSection(State* state, JPEGData* jpg) {
1795
66.5k
  InternalState& s = *state->internal;
1796
66.5k
  HistogramDataState& hs = s.histogram;
1797
66.5k
  BrunsliBitReader* br = &hs.br;
1798
1799
66.5k
  if (hs.stage == HistogramDataState::INIT) {
1800
12.7k
    BrunsliBitReaderInit(br);
1801
12.7k
    BRUNSLI_DCHECK(!jpg->components.empty());
1802
12.7k
    s.num_contexts = jpg->components.size();
1803
12.7k
    hs.stage = HistogramDataState::READ_SCHEME;
1804
    /* Optimization: hint arena about maximal used alphabet size: 272.
1805
     * 648 = 272 + 376, where 376 is a "universal" overhead for max-15-bit
1806
     * root-8-bit 2-level Huffman tables. */
1807
12.7k
    hs.arena.reserve(648);
1808
12.7k
  }
1809
66.5k
  PrepareBitReader(br, state);
1810
66.5k
  if (RemainingSectionLength(state) <= GetBytesAvailable(state)) {
1811
    // If end of section is reachable, then we could parse the remainings in
1812
    // non-streaming mode.
1813
11.3k
    BrunsliBitReaderSetOptimistic(br);
1814
11.3k
  }
1815
66.5k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1816
66.5k
    return SuspendBitReader(br, state, result);
1817
66.5k
  };
1818
1819
66.5k
  if (hs.stage == HistogramDataState::READ_SCHEME) {
1820
20.6k
    const size_t num_components = jpg->components.size();
1821
20.6k
    BRUNSLI_DCHECK(num_components <= 4);
1822
20.6k
    if (!BrunsliBitReaderCanRead(br, 3 * num_components)) {
1823
8.04k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1824
8.04k
    }
1825
26.5k
    for (size_t i = 0; i < num_components; ++i) {
1826
14.0k
      size_t scheme = BrunsliBitReaderRead(br, 3);
1827
14.0k
      if (scheme >= kNumSchemes) return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1828
13.9k
      ComponentMeta& m = state->meta[i];
1829
13.9k
      m.context_bits = scheme;
1830
13.9k
      m.context_offset = s.num_contexts;
1831
13.9k
      s.num_contexts += kNumNonzeroContextSkip[scheme];
1832
13.9k
    }
1833
12.4k
    if (!BrunsliBitReaderIsHealthy(br)) {
1834
11
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1835
11
    }
1836
12.4k
    hs.stage = HistogramDataState::READ_NUM_HISTOGRAMS;
1837
12.4k
  }
1838
1839
58.3k
  if (hs.stage == HistogramDataState::READ_NUM_HISTOGRAMS) {
1840
19.5k
    if (!BrunsliBitReaderCanRead(br, 11)) {
1841
7.17k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1842
7.17k
    }
1843
12.3k
    s.num_histograms = DecodeVarLenUint8(br) + 1;
1844
12.3k
    if (!BrunsliBitReaderIsHealthy(br)) {
1845
15
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1846
15
    }
1847
12.3k
    if (s.shallow_histograms) {
1848
0
      hs.stage = HistogramDataState::SKIP_CONTENT;
1849
12.3k
    } else {
1850
12.3k
      s.context_map_.resize(s.num_contexts * kNumAvrgContexts);
1851
12.3k
      state->context_map = s.context_map_.data();
1852
12.3k
      s.entropy_codes_.resize(s.num_histograms);
1853
12.3k
      state->entropy_codes = s.entropy_codes_.data();
1854
12.3k
      if (s.num_histograms > 1) {
1855
2.12k
        hs.stage = HistogramDataState::READ_CONTEXT_MAP_CODE;
1856
10.2k
      } else {
1857
10.2k
        hs.i = 0;
1858
10.2k
        hs.counts.resize(kCoeffAlphabetSize);
1859
10.2k
        hs.stage = HistogramDataState::READ_HISTOGRAMS;
1860
10.2k
      }
1861
12.3k
    }
1862
12.3k
  }
1863
1864
51.1k
  if (hs.stage == HistogramDataState::SKIP_CONTENT) {
1865
0
    suspend_bit_reader(BRUNSLI_OK);
1866
0
    if (!BrunsliBitReaderIsHealthy(br)) {
1867
0
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1868
0
    }
1869
0
    SkipAvailableBytes(state, RemainingSectionLength(state));
1870
0
    if (!IsAtSectionBoundary(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1871
0
    hs.stage = HistogramDataState::DONE;
1872
0
  }
1873
1874
51.1k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP_CODE) {
1875
24.9k
    if (!BrunsliBitReaderCanRead(br, 207 + s.num_histograms * 8)) {
1876
23.0k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1877
23.0k
    }
1878
1.94k
    hs.max_run_length_prefix = 0;
1879
1.94k
    bool use_rle_for_zeros = !!BrunsliBitReaderRead(br, 1);
1880
1.94k
    if (use_rle_for_zeros) {
1881
618
      hs.max_run_length_prefix = BrunsliBitReaderRead(br, 4) + 1;
1882
618
    }
1883
1.94k
    size_t alphabet_size = s.num_histograms + hs.max_run_length_prefix;
1884
1.94k
    hs.entropy.reset(new HuffmanDecodingData);
1885
1.94k
    if (!hs.entropy->ReadFromBitStream(alphabet_size, br, &hs.arena)) {
1886
505
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1887
505
    }
1888
1.43k
    hs.i = 0;
1889
1.43k
    hs.stage = HistogramDataState::READ_CONTEXT_MAP;
1890
1.43k
  }
1891
1892
27.6k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP) {
1893
5.57k
    BrunsliStatus status = DecodeContextMap(
1894
5.57k
        *hs.entropy, hs.max_run_length_prefix, &hs.i, &s.context_map_, br);
1895
5.57k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1896
953
    hs.i = 0;
1897
953
    hs.counts.resize(kCoeffAlphabetSize);
1898
953
    hs.stage = HistogramDataState::READ_HISTOGRAMS;
1899
953
  }
1900
1901
23.0k
  if (hs.stage == HistogramDataState::READ_HISTOGRAMS) {
1902
43.2k
    while (hs.i < s.num_histograms) {
1903
32.7k
      if (!BrunsliBitReaderCanRead(br, 9 + kCoeffAlphabetSize * 11)) {
1904
12.1k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1905
12.1k
      }
1906
20.6k
      if (!ReadHistogram(BRUNSLI_ANS_LOG_TAB_SIZE, &hs.counts, br)) {
1907
346
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1908
346
      }
1909
20.2k
      if (!s.entropy_codes_[hs.i].Init(hs.counts)) {
1910
0
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1911
0
      }
1912
20.2k
      ++hs.i;
1913
20.2k
    }
1914
10.5k
    hs.entropy.reset();
1915
10.5k
    std::vector<uint32_t>().swap(hs.counts);
1916
10.5k
    suspend_bit_reader(BRUNSLI_OK);
1917
10.5k
    BrunsliBitReaderFinish(br);
1918
10.5k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1919
10.5k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1920
10.4k
    hs.stage = HistogramDataState::DONE;
1921
10.4k
  }
1922
1923
10.4k
  hs.arena.reset();
1924
10.4k
  BRUNSLI_DCHECK(hs.stage == HistogramDataState::DONE);
1925
10.4k
  return BRUNSLI_OK;
1926
23.0k
}
1927
1928
95.9k
static BrunsliStatus DecodeDCDataSection(State* state) {
1929
95.9k
  size_t available = GetBytesAvailable(state) & ~1;
1930
95.9k
  size_t limit = RemainingSectionLength(state);
1931
95.9k
  BRUNSLI_DCHECK((limit & 1) == 0);
1932
95.9k
  size_t chunk_len = std::min(available, limit);
1933
  // If end of section is reachable, then we could parse the remainings in
1934
  // non-streaming mode.
1935
95.9k
  bool is_last_chunk = (chunk_len == limit);
1936
95.9k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1937
1938
95.9k
  BrunsliStatus status = DecodeDC(state, &in);
1939
1940
95.9k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1941
95.9k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1942
95.5k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1943
95.5k
  SkipBytes(state, in.pos_);
1944
95.5k
  if (is_last_chunk) {
1945
9.54k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1946
9.54k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1947
9.54k
  }
1948
95.4k
  return status;
1949
95.5k
}
1950
1951
178k
static BrunsliStatus DecodeACDataSection(State* state) {
1952
178k
  size_t available = GetBytesAvailable(state) & ~1;
1953
178k
  size_t limit = RemainingSectionLength(state);
1954
178k
  BRUNSLI_DCHECK((limit & 1) == 0);
1955
178k
  size_t chunk_len = std::min(available, limit);
1956
  // If end of section is reachable, then we could parse the remainings in
1957
  // non-streaming mode.
1958
178k
  bool is_last_chunk = (chunk_len == limit);
1959
178k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1960
1961
178k
  BrunsliStatus status = DecodeAC(state, &in);
1962
1963
178k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1964
178k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1965
177k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1966
177k
  SkipBytes(state, in.pos_);
1967
177k
  if (is_last_chunk) {
1968
8.32k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1969
8.32k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1970
8.32k
  }
1971
177k
  return status;
1972
177k
}
1973
1974
2.76k
static Stage DecodeOriginalJpg(State* state, JPEGData* jpg) {
1975
2.76k
  InternalState& s = *state->internal;
1976
2.76k
  FallbackState& fs = s.fallback;
1977
1978
3.88k
  while (fs.stage != FallbackState::DONE) {
1979
3.83k
    switch (fs.stage) {
1980
874
      case FallbackState::READ_TAG: {
1981
874
        BrunsliStatus status = ReadTag(state, &s.section);
1982
874
        if (status != BRUNSLI_OK) return Fail(state, status);
1983
581
        if (s.section.tag != kBrunsliOriginalJpgTag || !s.section.is_section) {
1984
12
          return Fail(state, BRUNSLI_INVALID_BRN);
1985
12
        }
1986
569
        fs.stage = FallbackState::ENTER_SECTION;
1987
569
        break;
1988
581
      }
1989
1990
1.64k
      case FallbackState::ENTER_SECTION: {
1991
1.64k
        BrunsliStatus status = EnterSection(state, &s.section);
1992
1.64k
        if (status != BRUNSLI_OK) return Fail(state, status);
1993
509
        jpg->original_jpg_size = s.section.remaining;
1994
        // Edge case - empty payload.
1995
509
        if (jpg->original_jpg_size == 0) {
1996
4
          jpg->original_jpg = nullptr;
1997
4
          fs.stage = FallbackState::DONE;
1998
4
          break;
1999
4
        }
2000
505
        fs.stage = FallbackState::READ_CONTENTS;
2001
505
        break;
2002
509
      }
2003
2004
1.31k
      case FallbackState::READ_CONTENTS: {
2005
1.31k
        size_t chunk_size = GetBytesAvailable(state);
2006
1.31k
        if (chunk_size == 0) {
2007
          // TODO(eustas): dcheck s.section.remaining != 0
2008
468
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2009
468
        }
2010
        // Check if it is possible to avoid copy.
2011
848
        const uint8_t* src = state->data + state->pos;
2012
848
        if (fs.storage.empty()) {
2013
349
          if (chunk_size >= jpg->original_jpg_size) {
2014
38
            jpg->original_jpg = src;
2015
38
            SkipBytes(state, jpg->original_jpg_size);
2016
38
            fs.stage = FallbackState::DONE;
2017
38
            break;
2018
38
          }
2019
349
        }
2020
        // Otherwise, copy input.
2021
810
        size_t remaining = jpg->original_jpg_size - fs.storage.size();
2022
810
        size_t to_copy = std::min(chunk_size, remaining);
2023
810
        fs.storage.insert(fs.storage.cend(), src, src + to_copy);
2024
810
        SkipBytes(state, to_copy);
2025
810
        if (fs.storage.size() == jpg->original_jpg_size) {
2026
8
          jpg->original_jpg = fs.storage.data();
2027
8
          fs.stage = FallbackState::DONE;
2028
8
          break;
2029
8
        }
2030
        // TODO(eustas): dcheck GetBytesAvailable(state) == 0
2031
802
        return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2032
810
      }
2033
2034
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2035
3.83k
    }
2036
3.83k
  }
2037
2038
50
  LeaveSection(&s.section);
2039
50
  return Stage::DONE;
2040
2.76k
}
2041
2042
171k
static Stage ParseSection(State* state) {
2043
171k
  InternalState& s = *state->internal;
2044
171k
  SectionHeaderState& sh = s.section_header;
2045
2046
171k
  Stage result = Stage::ERROR;
2047
2048
314k
  while (sh.stage != SectionHeaderState::DONE) {
2049
242k
    switch (sh.stage) {
2050
116k
      case SectionHeaderState::READ_TAG: {
2051
116k
        BrunsliStatus status = ReadTag(state, &s.section);
2052
116k
        if (status == BRUNSLI_NOT_ENOUGH_DATA) {
2053
44.9k
          if (HasSection(state, kBrunsliACDataTag)) return Stage::DONE;
2054
44.9k
        }
2055
116k
        if (status != BRUNSLI_OK) return Fail(state, status);
2056
71.6k
        if (s.section.is_section) {
2057
71.5k
          sh.stage = SectionHeaderState::ENTER_SECTION;
2058
71.5k
          continue;
2059
71.5k
        }
2060
60
        const uint32_t tag_bit = 1u << s.section.tag;
2061
60
        const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2062
60
        if (is_known_section_tag) return Fail(state, BRUNSLI_INVALID_BRN);
2063
58
        sh.stage = SectionHeaderState::READ_VALUE;
2064
58
        continue;
2065
60
      }
2066
2067
124
      case SectionHeaderState::READ_VALUE: {
2068
        // No known varint tags on top level.
2069
124
        size_t sink;
2070
124
        BrunsliStatus status = DecodeBase128(state, &sink);
2071
124
        if (status != BRUNSLI_OK) return Fail(state, status);
2072
44
        result = Stage::SECTION;
2073
44
        sh.stage = SectionHeaderState::DONE;
2074
44
        continue;
2075
124
      }
2076
2077
125k
      case SectionHeaderState::ENTER_SECTION: {
2078
125k
        BrunsliStatus status = EnterSection(state, &s.section);
2079
125k
        if (status != BRUNSLI_OK) return Fail(state, status);
2080
71.5k
        result = Stage::SECTION_BODY;
2081
71.5k
        sh.stage = SectionHeaderState::DONE;
2082
71.5k
        continue;
2083
125k
      }
2084
2085
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2086
242k
    }
2087
242k
  }
2088
2089
71.6k
  sh.stage = SectionHeaderState::READ_TAG;
2090
71.6k
  BRUNSLI_DCHECK(result != Stage::ERROR);
2091
71.6k
  return result;
2092
171k
}
2093
2094
1.05M
static Stage ProcessSection(State* state, JPEGData* jpg) {
2095
1.05M
  InternalState& s = *state->internal;
2096
2097
1.05M
  const int32_t tag_bit = 1u << s.section.tag;
2098
1.05M
  const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2099
2100
1.05M
  const bool skip_section =
2101
1.05M
      !is_known_section_tag || (state->skip_tags & tag_bit);
2102
2103
1.05M
  if (skip_section) {
2104
    // Skip section content.
2105
614
    size_t to_skip =
2106
614
        std::min(GetBytesAvailable(state), RemainingSectionLength(state));
2107
614
    state->pos += to_skip;
2108
614
    if (RemainingSectionLength(state) != 0) {
2109
579
      BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
2110
579
      return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2111
579
    }
2112
35
    return Stage::SECTION;
2113
614
  }
2114
2115
1.05M
  switch (s.section.tag) {
2116
188k
    case kBrunsliMetaDataTag: {
2117
188k
      BrunsliStatus status = DecodeMetaDataSection(state, jpg);
2118
188k
      if (status != BRUNSLI_OK) return Fail(state, status);
2119
54
      break;
2120
188k
    }
2121
2122
502k
    case kBrunsliJPEGInternalsTag: {
2123
502k
      BrunsliStatus status = DecodeJPEGInternalsSection(state, jpg);
2124
502k
      if (status != BRUNSLI_OK) return Fail(state, status);
2125
15.4k
      break;
2126
502k
    }
2127
2128
26.0k
    case kBrunsliQuantDataTag: {
2129
26.0k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2130
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2131
2
      }
2132
26.0k
      BrunsliStatus status = DecodeQuantDataSection(state, jpg);
2133
26.0k
      if (status != BRUNSLI_OK) return Fail(state, status);
2134
10.4k
      break;
2135
26.0k
    }
2136
2137
66.5k
    case kBrunsliHistogramDataTag: {
2138
66.5k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2139
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2140
2
      }
2141
66.5k
      BrunsliStatus status = DecodeHistogramDataSection(state, jpg);
2142
66.5k
      if (status != BRUNSLI_OK) return Fail(state, status);
2143
10.4k
      break;
2144
66.5k
    }
2145
2146
95.9k
    case kBrunsliDCDataTag: {
2147
95.9k
      if (!HasSection(state, kBrunsliHistogramDataTag)) {
2148
3
        return Fail(state, BRUNSLI_INVALID_BRN);
2149
3
      }
2150
95.9k
      if (!HasSection(state, kBrunsliQuantDataTag)) {
2151
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2152
2
      }
2153
      // This section reads input word by word.
2154
95.9k
      if ((RemainingSectionLength(state) & 1) != 0) {
2155
4
        return Fail(state, BRUNSLI_INVALID_BRN);
2156
4
      }
2157
95.9k
      internal::dec::WarmupMeta(jpg, state);
2158
95.9k
      BrunsliStatus status = DecodeDCDataSection(state);
2159
95.9k
      if (status != BRUNSLI_OK) return Fail(state, status);
2160
9.60k
      break;
2161
95.9k
    }
2162
2163
178k
    case kBrunsliACDataTag: {
2164
178k
      if (!HasSection(state, kBrunsliDCDataTag)) {
2165
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2166
2
      }
2167
      // This section reads input word by word.
2168
178k
      if ((RemainingSectionLength(state) & 1) != 0) {
2169
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2170
2
      }
2171
178k
      internal::dec::WarmupMeta(jpg, state);
2172
178k
      BrunsliStatus status = DecodeACDataSection(state);
2173
178k
      if (status != BRUNSLI_OK) return Fail(state, status);
2174
8.20k
      break;
2175
178k
    }
2176
2177
8.20k
    default:
2178
      /* Unreachable */
2179
0
      return Fail(state, BRUNSLI_INVALID_BRN);
2180
1.05M
  }
2181
2182
54.2k
  if (!IsAtSectionBoundary(state)) {
2183
89
    return Fail(state, BRUNSLI_INVALID_BRN);
2184
89
  }
2185
2186
  // Nothing is expected after the AC data.
2187
54.1k
  if (s.section.tag == kBrunsliACDataTag) {
2188
8.20k
    return Stage::DONE;
2189
8.20k
  }
2190
2191
45.9k
  return Stage::SECTION;
2192
54.1k
}
2193
2194
namespace internal {
2195
namespace dec {
2196
2197
25.8k
bool UpdateSubsamplingDerivatives(JPEGData* jpg) {
2198
66.8k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2199
41.0k
    JPEGComponent* c = &jpg->components[i];
2200
41.0k
    jpg->max_h_samp_factor = std::max(jpg->max_h_samp_factor, c->h_samp_factor);
2201
41.0k
    jpg->max_v_samp_factor = std::max(jpg->max_v_samp_factor, c->v_samp_factor);
2202
41.0k
  }
2203
25.8k
  jpg->MCU_rows = DivCeil(jpg->height, jpg->max_v_samp_factor * 8);
2204
25.8k
  jpg->MCU_cols = DivCeil(jpg->width, jpg->max_h_samp_factor * 8);
2205
66.8k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2206
41.0k
    JPEGComponent* c = &jpg->components[i];
2207
41.0k
    c->width_in_blocks = jpg->MCU_cols * c->h_samp_factor;
2208
41.0k
    c->height_in_blocks = jpg->MCU_rows * c->v_samp_factor;
2209
    // 8205 == max[ceil((65535 / (i * 8)) * i) for i in range(1, 16 + 1)]
2210
41.0k
    BRUNSLI_DCHECK(c->width_in_blocks <= 8205);
2211
41.0k
    BRUNSLI_DCHECK(c->height_in_blocks <= 8205);
2212
41.0k
    uint32_t num_blocks = c->width_in_blocks * c->height_in_blocks;
2213
41.0k
    if (num_blocks > kBrunsliMaxNumBlocks) {
2214
2
      return false;
2215
2
    }
2216
41.0k
    c->num_blocks = num_blocks;
2217
41.0k
  }
2218
25.8k
  return true;
2219
25.8k
}
2220
2221
25.8k
void PrepareMeta(const JPEGData* jpg, State* state) {
2222
25.8k
  InternalState& s = *state->internal;
2223
2224
25.8k
  size_t num_components = jpg->components.size();
2225
25.8k
  s.block_state_.resize(num_components);
2226
25.8k
  std::vector<ComponentMeta>& meta = state->meta;
2227
25.8k
  meta.resize(num_components);
2228
66.8k
  for (size_t i = 0; i < num_components; ++i) {
2229
41.0k
    const JPEGComponent& c = jpg->components[i];
2230
41.0k
    ComponentMeta& m = meta[i];
2231
41.0k
    m.h_samp = c.h_samp_factor;
2232
41.0k
    m.v_samp = c.v_samp_factor;
2233
41.0k
    m.width_in_blocks = jpg->MCU_cols * m.h_samp;
2234
41.0k
    m.height_in_blocks = jpg->MCU_rows * m.v_samp;
2235
41.0k
  }
2236
25.8k
}
2237
2238
274k
void WarmupMeta(JPEGData* jpg, State* state) {
2239
274k
  InternalState& s = *state->internal;
2240
274k
  std::vector<ComponentMeta>& meta = state->meta;
2241
274k
  const size_t num_components = meta.size();
2242
2243
274k
  if (!state->is_storage_allocated) {
2244
10.3k
    state->is_storage_allocated = true;
2245
21.7k
    for (size_t i = 0; i < num_components; ++i) {
2246
11.3k
      size_t num_blocks = meta[i].width_in_blocks * meta[i].height_in_blocks;
2247
11.3k
      jpg->components[i].coeffs.resize(num_blocks * kDCTBlockSize);
2248
11.3k
      s.block_state_[i].resize(num_blocks);
2249
11.3k
      meta[i].block_state = s.block_state_[i].data();
2250
11.3k
    }
2251
10.3k
  }
2252
2253
274k
  if (!s.is_meta_warm) {
2254
10.3k
    s.is_meta_warm = true;
2255
21.7k
    for (size_t c = 0; c < num_components; ++c) {
2256
11.3k
      ComponentMeta& m = meta[c];
2257
11.3k
      const JPEGQuantTable& q = jpg->quant[jpg->components[c].quant_idx];
2258
11.3k
      m.ac_coeffs = jpg->components[c].coeffs.data();
2259
11.3k
      m.ac_stride = m.width_in_blocks * kDCTBlockSize;
2260
11.3k
      m.b_stride = m.width_in_blocks;
2261
11.3k
      memcpy(m.quant.data(), q.values.data(),
2262
11.3k
             kDCTBlockSize * sizeof(m.quant[0]));
2263
11.3k
    }
2264
10.3k
  }
2265
274k
}
2266
2267
2.29M
BrunsliStatus DoProcessJpeg(State* state, JPEGData* jpg) {
2268
4.75M
  while (true) {
2269
4.75M
    switch (state->stage) {
2270
114k
      case Stage::SIGNATURE:
2271
114k
        state->stage = VerifySignature(state);
2272
114k
        break;
2273
2274
1.11M
      case Stage::HEADER:
2275
1.11M
        state->stage = DecodeHeader(state, jpg);
2276
1.11M
        break;
2277
2278
2.76k
      case Stage::FALLBACK:
2279
2.76k
        state->stage = DecodeOriginalJpg(state, jpg);
2280
2.76k
        break;
2281
2282
171k
      case Stage::SECTION:
2283
171k
        state->stage = ParseSection(state);
2284
171k
        break;
2285
2286
1.05M
      case Stage::SECTION_BODY:
2287
1.05M
        state->stage = ProcessSection(state, jpg);
2288
1.05M
        break;
2289
2290
8.25k
      case Stage::DONE:
2291
        // It is expected that there is no garbage after the valid brunsli
2292
        // stream.
2293
8.25k
        if (state->pos != state->len) {
2294
30
          state->stage = Fail(state, BRUNSLI_INVALID_BRN);
2295
30
          break;
2296
30
        }
2297
8.22k
        return BRUNSLI_OK;
2298
2299
2.28M
      case Stage::ERROR:
2300
2.28M
        return state->internal->result;
2301
2302
0
      default:
2303
        /* Unreachable */
2304
0
        state->stage = Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2305
0
        break;
2306
4.75M
    }
2307
4.75M
  }
2308
2.29M
}
2309
2310
/** Adds new input to buffer. */
2311
2.24M
void ChargeBuffer(State* state) {
2312
2.24M
  InternalState& s = *state->internal;
2313
2.24M
  Buffer& b = s.buffer;
2314
2315
2.24M
  b.borrowed_len = 0;
2316
2.24M
  b.external_data = state->data;
2317
2.24M
  b.external_pos = state->pos;
2318
2.24M
  b.external_len = state->len;
2319
2.24M
}
2320
2321
constexpr size_t kBufferMaxReadAhead = 600;
2322
2323
/** Sets input source either to buffered, or to external data. */
2324
2.29M
void LoadInput(State* state) {
2325
2.29M
  InternalState& s = *state->internal;
2326
2.29M
  Buffer& b = s.buffer;
2327
2328
  // No data buffered. Just pass external data as is.
2329
2.29M
  if (b.data_len == 0) {
2330
1.90M
    state->data = b.external_data;
2331
1.90M
    state->pos = b.external_pos;
2332
1.90M
    state->len = b.external_len;
2333
1.90M
    return;
2334
1.90M
  }
2335
2336
392k
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2337
2338
  // Otherwise use buffered data.
2339
392k
  size_t available = b.external_len - b.external_pos;
2340
  // Always try to borrow as much as parser could require. This way, when
2341
  // buffer is unable to provide enough input, we could switch to unbuffered
2342
  // input.
2343
392k
  b.borrowed_len = std::min(kBufferMaxReadAhead, available);
2344
392k
  memcpy(b.data.data() + b.data_len, b.external_data + b.external_pos,
2345
392k
         b.borrowed_len);
2346
392k
  state->data = b.data.data();
2347
392k
  state->pos = 0;
2348
392k
  state->len = b.data_len + b.borrowed_len;
2349
392k
}
2350
2351
/**
2352
 * Cancel borrowed bytes, if any.
2353
 *
2354
 * Returns false, if it is impossible to continue parsing.
2355
 */
2356
2.29M
bool UnloadInput(State* state, BrunsliStatus result) {
2357
2.29M
  InternalState& s = *state->internal;
2358
2.29M
  Buffer& b = s.buffer;
2359
2360
  // Non-buffered input; put tail to buffer.
2361
2.29M
  if (state->data == b.external_data) {
2362
1.90M
    b.external_pos = state->pos;
2363
1.90M
    BRUNSLI_DCHECK(b.external_pos <= b.external_len);
2364
1.90M
    if (result != BRUNSLI_NOT_ENOUGH_DATA) return true;
2365
1.89M
    BRUNSLI_DCHECK(b.data_len == 0);
2366
1.89M
    size_t available = b.external_len - b.external_pos;
2367
1.89M
    BRUNSLI_DCHECK(available < kBufferMaxReadAhead);
2368
1.89M
    if (b.data.empty()) b.data.resize(2 * kBufferMaxReadAhead);
2369
1.89M
    b.data_len = available;
2370
1.89M
    memcpy(b.data.data(), b.external_data + b.external_pos, b.data_len);
2371
1.89M
    b.external_pos += available;
2372
1.89M
    return false;
2373
1.90M
  }
2374
2375
  // Buffer depleted; switch to non-buffered input.
2376
392k
  if (state->pos >= b.data_len) {
2377
51.1k
    size_t used_borrowed_bytes = state->pos - b.data_len;
2378
51.1k
    b.data_len = 0;
2379
51.1k
    b.external_pos += used_borrowed_bytes;
2380
51.1k
    return true;
2381
51.1k
  }
2382
2383
  // Buffer not depleted; either problem discovered was already buffered data,
2384
  // or extra input was too-short.
2385
341k
  b.data_len -= state->pos;
2386
341k
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
2387
    // We couldn't have taken more bytes.
2388
340k
    BRUNSLI_DCHECK(b.external_pos + b.borrowed_len == b.external_len);
2389
    // Remaining piece is not too large.
2390
340k
    BRUNSLI_DCHECK(b.data_len + b.borrowed_len < kBufferMaxReadAhead);
2391
340k
    b.data_len += b.borrowed_len;
2392
340k
    b.external_pos += b.borrowed_len;
2393
340k
  }
2394
341k
  BRUNSLI_DCHECK(!b.data.empty());
2395
341k
  if (state->pos > 0 && b.data_len > 0) {
2396
15.6k
    memmove(b.data.data(), b.data.data() + state->pos, b.data_len);
2397
15.6k
  }
2398
341k
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2399
2400
341k
  return (result != BRUNSLI_NOT_ENOUGH_DATA);
2401
392k
}
2402
2403
/** Sets back user-provided input. */
2404
2.24M
void UnchargeBuffer(State* state) {
2405
2.24M
  InternalState& s = *state->internal;
2406
2.24M
  Buffer& b = s.buffer;
2407
2408
2.24M
  state->data = b.external_data;
2409
2.24M
  state->pos = b.external_pos;
2410
2.24M
  state->len = b.external_len;
2411
2.24M
}
2412
2413
2.24M
BrunsliStatus ProcessJpeg(State* state, JPEGData* jpg) {
2414
2.24M
  InternalState& s = *state->internal;
2415
2416
2.24M
  if (state->pos > state->len) return BRUNSLI_INVALID_PARAM;
2417
2.24M
  ChargeBuffer(state);
2418
2419
2.24M
  BrunsliStatus result = BRUNSLI_NOT_ENOUGH_DATA;
2420
2.31M
  while (result == BRUNSLI_NOT_ENOUGH_DATA) {
2421
2.29M
    if (state->stage == Stage::ERROR) {
2422
      // General error -> no recovery.
2423
2.26M
      if (s.result != BRUNSLI_NOT_ENOUGH_DATA) return s.result;
2424
      // Continue parsing.
2425
2.26M
      s.result = BRUNSLI_OK;
2426
2.26M
      state->stage = s.last_stage;
2427
2.26M
      s.last_stage = Stage::ERROR;
2428
2.26M
    }
2429
2430
2.29M
    LoadInput(state);
2431
2.29M
    if (s.section.is_active) {
2432
2.10M
      s.section.milestone = state->pos;
2433
2.10M
      s.section.projected_end = s.section.milestone + s.section.remaining;
2434
2.10M
    }
2435
2436
2.29M
    s.section.tags_met |= state->tags_met;
2437
2.29M
    result = DoProcessJpeg(state, jpg);
2438
2439
2.29M
    if (s.section.is_active) {
2440
      // TODO(eustas): dcheck state->pos > s.section.milestone
2441
2.12M
      size_t processed_len = state->pos - s.section.milestone;
2442
      // TODO(eustas): dcheck processed_len < s.section.remaining
2443
2.12M
      s.section.remaining -= processed_len;
2444
2.12M
    }
2445
2446
2.29M
    if (!UnloadInput(state, result)) break;
2447
2.29M
  }
2448
2.24M
  UnchargeBuffer(state);
2449
2.24M
  return result;
2450
2.24M
}
2451
2452
}  // namespace dec
2453
}  // namespace internal
2454
2455
BrunsliStatus BrunsliDecodeJpeg(const uint8_t* data, const size_t len,
2456
13.3k
                                JPEGData* jpg) {
2457
13.3k
  if (!data) return BRUNSLI_INVALID_PARAM;
2458
2459
13.3k
  State state;
2460
13.3k
  state.data = data;
2461
13.3k
  state.len = len;
2462
2463
13.3k
  return internal::dec::ProcessJpeg(&state, jpg);
2464
13.3k
}
2465
2466
size_t BrunsliEstimateDecoderPeakMemoryUsage(const uint8_t* data,
2467
0
                                             const size_t len) {
2468
0
  if (!data) return BRUNSLI_INVALID_PARAM;
2469
2470
0
  State state;
2471
0
  state.data = data;
2472
0
  state.len = len;
2473
0
  state.skip_tags = ~(1u << kBrunsliHistogramDataTag);
2474
0
  InternalState& s = *state.internal;
2475
0
  s.shallow_histograms = true;
2476
2477
0
  JPEGData jpg;
2478
0
  BrunsliStatus status = internal::dec::ProcessJpeg(&state, &jpg);
2479
2480
0
  if (status != BRUNSLI_OK) return 0;
2481
2482
0
  size_t out_size = 2 * len;
2483
0
  size_t total_num_blocks = 0;
2484
0
  size_t component_state_size = 0;
2485
0
  for (size_t i = 0; i < jpg.components.size(); ++i) {
2486
0
    const JPEGComponent& c = jpg.components[i];
2487
0
    total_num_blocks += c.num_blocks;
2488
0
    component_state_size += ComponentState::SizeInBytes(c.width_in_blocks);
2489
0
  }
2490
0
  size_t jpeg_data_size = total_num_blocks * kDCTBlockSize * sizeof(coeff_t);
2491
0
  size_t context_map_size = s.num_contexts * kNumAvrgContexts * sizeof(int32_t);
2492
0
  size_t histogram_size = s.num_histograms * sizeof(ANSDecodingData);
2493
0
  size_t decode_peak = context_map_size + histogram_size + component_state_size;
2494
0
  size_t jpeg_writer_size = (1u << 17u) + (1u << 16u) * sizeof(int32_t);
2495
0
  return (out_size + jpeg_data_size + std::max(decode_peak, jpeg_writer_size));
2496
0
}
2497
2498
0
BrunsliDecoder::BrunsliDecoder() {
2499
0
  jpg_.reset(new JPEGData);
2500
0
  state_.reset(new State);
2501
0
}
2502
2503
0
BrunsliDecoder::~BrunsliDecoder() {}
2504
2505
BrunsliDecoder::Status BrunsliDecoder::Decode(size_t* available_in,
2506
                                              const uint8_t** next_in,
2507
                                              size_t* available_out,
2508
0
                                              uint8_t** next_out) {
2509
0
  JPEGData* jpg = jpg_.get();
2510
0
  BRUNSLI_DCHECK(jpg);
2511
0
  State* state = state_.get();
2512
0
  BRUNSLI_DCHECK(state);
2513
2514
0
  state->data = *next_in;
2515
0
  state->pos = 0;
2516
0
  state->len = *available_in;
2517
0
  BrunsliStatus parse_status = internal::dec::ProcessJpeg(state, jpg);
2518
0
  size_t consumed_bytes = state->pos;
2519
0
  *available_in -= consumed_bytes;
2520
0
  *next_in += consumed_bytes;
2521
2522
0
  if ((parse_status != BRUNSLI_OK) &&
2523
0
      (parse_status != BRUNSLI_NOT_ENOUGH_DATA)) {
2524
0
    return BrunsliDecoder::ERROR;
2525
0
  }
2526
2527
  // All the input given input should be consumed.
2528
0
  BRUNSLI_DCHECK(*available_in == 0);
2529
2530
0
  SerializationStatus serialization_status =
2531
0
      SerializeJpeg(state, *jpg, available_out, next_out);
2532
0
  if (serialization_status == SerializationStatus::ERROR) {
2533
0
    return BrunsliDecoder::ERROR;
2534
0
  }
2535
2536
0
  switch (serialization_status) {
2537
0
    case SerializationStatus::DONE:
2538
      // Should be impossible to finish serialization without finishing parsing.
2539
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_OK);
2540
0
      return BrunsliDecoder::DONE;
2541
2542
0
    case SerializationStatus::NEEDS_MORE_INPUT:
2543
      // If serializer says that data is incomplete, parser should say the same.
2544
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_NOT_ENOUGH_DATA);
2545
0
      return BrunsliDecoder::NEEDS_MORE_INPUT;
2546
2547
0
    case SerializationStatus::NEEDS_MORE_OUTPUT:
2548
      // TODO(eustas): make sure that serializer could produce more bytes
2549
      //               without providing more bytes to parser
2550
0
      BRUNSLI_DCHECK(*available_out == 0);
2551
0
      return BrunsliDecoder::NEEDS_MORE_OUTPUT;
2552
2553
0
    case SerializationStatus::ERROR:
2554
0
      return BrunsliDecoder::ERROR;
2555
2556
0
    default:
2557
      /* Unreachable */
2558
0
      BRUNSLI_DCHECK(false);
2559
0
      return BrunsliDecoder::ERROR;
2560
0
  }
2561
0
}
2562
2563
}  // namespace brunsli