Coverage Report

Created: 2025-07-18 06:08

/src/brunsli/c/dec/brunsli_decode.cc
Line
Count
Source (jump to first uncovered line)
1
// Copyright (c) Google LLC 2019
2
//
3
// Use of this source code is governed by an MIT-style
4
// license that can be found in the LICENSE file or at
5
// https://opensource.org/licenses/MIT.
6
7
#include <brunsli/brunsli_decode.h>
8
9
#include <algorithm>
10
#include <cstdlib>
11
#include <cstring>
12
#include <iterator>
13
#include <string>
14
#include <vector>
15
16
#include <brotli/decode.h>
17
#include "../common/constants.h"
18
#include "../common/context.h"
19
#include <brunsli/jpeg_data.h>
20
#include "../common/lehmer_code.h"
21
#include "../common/platform.h"
22
#include "../common/predict.h"
23
#include "../common/quant_matrix.h"
24
#include <brunsli/status.h>
25
#include <brunsli/types.h>
26
#include "./ans_decode.h"
27
#include "./arith_decode.h"
28
#include "./bit_reader.h"
29
#include "./brunsli_input.h"
30
#include "./context_map_decode.h"
31
#include "./histogram_decode.h"
32
#include "./huffman_table.h"
33
#include <brunsli/jpeg_data_writer.h>
34
#include "./state.h"
35
#include "./state_internal.h"
36
37
namespace brunsli {
38
39
using ::brunsli::internal::dec::AcDcState;
40
using ::brunsli::internal::dec::BlockI32;
41
using ::brunsli::internal::dec::Buffer;
42
using ::brunsli::internal::dec::ComponentMeta;
43
using ::brunsli::internal::dec::FallbackState;
44
using ::brunsli::internal::dec::HeaderState;
45
using ::brunsli::internal::dec::HistogramDataState;
46
using ::brunsli::internal::dec::InternalState;
47
using ::brunsli::internal::dec::JpegInternalsState;
48
using ::brunsli::internal::dec::MetadataDecompressionStage;
49
using ::brunsli::internal::dec::MetadataState;
50
using ::brunsli::internal::dec::PrepareMeta;
51
using ::brunsli::internal::dec::QuantDataState;
52
using ::brunsli::internal::dec::SectionHeaderState;
53
using ::brunsli::internal::dec::SectionState;
54
using ::brunsli::internal::dec::SerializationStatus;
55
using ::brunsli::internal::dec::Stage;
56
using ::brunsli::internal::dec::State;
57
using ::brunsli::internal::dec::UpdateSubsamplingDerivatives;
58
using ::brunsli::internal::dec::VarintState;
59
60
static const int kNumDirectCodes = 8;
61
static const int kCoeffAlphabetSize = kNumDirectCodes + 10;
62
63
static const uint32_t kKnownSectionTags =
64
    (1u << kBrunsliSignatureTag) | (1u << kBrunsliHeaderTag) |
65
    (1u << kBrunsliMetaDataTag) | (1u << kBrunsliJPEGInternalsTag) |
66
    (1u << kBrunsliQuantDataTag) | (1u << kBrunsliHistogramDataTag) |
67
    (1u << kBrunsliDCDataTag) | (1u << kBrunsliACDataTag) |
68
    (1u << kBrunsliOriginalJpgTag);
69
70
static const uint32_t kKnownHeaderVarintTags =
71
    (1u << kBrunsliHeaderWidthTag) | (1u << kBrunsliHeaderHeightTag) |
72
    (1u << kBrunsliHeaderVersionCompTag) | (1u << kBrunsliHeaderSubsamplingTag);
73
74
0
bool IsBrunsli(const uint8_t* data, const size_t len) {
75
0
  static const uint8_t kSignature[6] = {
76
0
      /* marker */ 0x0A,
77
0
      /* length */ 0x04, 0x42, 0xD2, 0xD5, 0x4E};
78
0
  static const size_t kSignatureLen = sizeof(kSignature);
79
0
  if (len < kSignatureLen) return false;
80
0
  return (memcmp(kSignature, data, kSignatureLen) == 0);
81
0
}
82
83
// Returns ceil(a/b).
84
60.8k
inline int DivCeil(int a, int b) { return (a + b - 1) / b; }
85
86
// Decodes a number in the range [0..255], by reading 1 - 11 bits.
87
13.9k
inline uint32_t DecodeVarLenUint8(BrunsliBitReader* br) {
88
13.9k
  if (BrunsliBitReaderRead(br, 1)) {
89
2.56k
    uint32_t nbits = BrunsliBitReaderRead(br, 3);
90
2.56k
    if (nbits == 0) {
91
1.22k
      return 1u;
92
1.34k
    } else {
93
1.34k
      return BrunsliBitReaderRead(br, nbits) + (1u << nbits);
94
1.34k
    }
95
2.56k
  }
96
11.4k
  return 0;
97
13.9k
}
98
99
11.2M
bool DecodeVarint(VarintState* s, BrunsliBitReader* br, size_t max_bits) {
100
11.2M
  if (s->stage == VarintState::INIT) {
101
10.4M
    s->value = 0;
102
10.4M
    s->i = 0;
103
10.4M
    s->stage = VarintState::READ_CONTINUATION;
104
10.4M
  }
105
106
25.3M
  while (true) {
107
25.3M
    switch (s->stage) {
108
18.2M
      case VarintState::READ_CONTINUATION: {
109
18.2M
        if (s->i >= max_bits) {
110
1.75k
          s->stage = VarintState::INIT;
111
1.75k
          return true;
112
1.75k
        }
113
18.2M
        if (s->i + 1 != max_bits) {
114
18.2M
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
115
17.5M
          if (!BrunsliBitReaderRead(br, 1)) {
116
10.4M
            s->stage = VarintState::INIT;
117
10.4M
            return true;
118
10.4M
          }
119
17.5M
        }
120
7.07M
        s->stage = VarintState::READ_DATA;
121
7.07M
        continue;
122
18.2M
      }
123
7.08M
      case VarintState::READ_DATA: {
124
7.08M
        if (!BrunsliBitReaderCanRead(br, 1)) return false;
125
7.07M
        size_t next_bit = BrunsliBitReaderRead(br, 1);
126
7.07M
        s->value |= next_bit << s->i;
127
7.07M
        ++s->i;
128
7.07M
        s->stage = VarintState::READ_CONTINUATION;
129
7.07M
        continue;
130
7.08M
      }
131
0
      default: {
132
0
        BRUNSLI_CHECK(false);
133
0
        return false;
134
7.08M
      }
135
25.3M
    }
136
25.3M
  }
137
11.2M
}
138
139
template <size_t kChunkSize>
140
bool DecodeLimitedVarint(VarintState* s, BrunsliBitReader* br,
141
162k
                         size_t max_symbols) {
142
162k
  if (s->stage == VarintState::INIT) {
143
147k
    s->value = 0;
144
147k
    s->i = 0;
145
147k
    s->stage = VarintState::READ_CONTINUATION;
146
147k
  }
147
243k
  while (true) {
148
243k
    switch (s->stage) {
149
198k
      case VarintState::READ_CONTINUATION: {
150
198k
        if (s->i < max_symbols) {
151
193k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
183k
          if (BrunsliBitReaderRead(br, 1)) {
153
40.3k
            s->stage = VarintState::READ_DATA;
154
40.3k
            continue;
155
40.3k
          }
156
183k
        }
157
147k
        s->stage = VarintState::INIT;
158
147k
        return true;
159
198k
      }
160
45.4k
      case VarintState::READ_DATA: {
161
45.4k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
40.2k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
40.2k
        s->value |= next_bits << (s->i * kChunkSize);
164
40.2k
        ++s->i;
165
40.2k
        s->stage = VarintState::READ_CONTINUATION;
166
40.2k
        continue;
167
45.4k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
45.4k
      }
172
243k
    }
173
243k
  }
174
162k
}
bool brunsli::DecodeLimitedVarint<2ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
143k
                         size_t max_symbols) {
142
143k
  if (s->stage == VarintState::INIT) {
143
128k
    s->value = 0;
144
128k
    s->i = 0;
145
128k
    s->stage = VarintState::READ_CONTINUATION;
146
128k
  }
147
220k
  while (true) {
148
220k
    switch (s->stage) {
149
177k
      case VarintState::READ_CONTINUATION: {
150
177k
        if (s->i < max_symbols) {
151
173k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
163k
          if (BrunsliBitReaderRead(br, 1)) {
153
38.5k
            s->stage = VarintState::READ_DATA;
154
38.5k
            continue;
155
38.5k
          }
156
163k
        }
157
128k
        s->stage = VarintState::INIT;
158
128k
        return true;
159
177k
      }
160
42.9k
      case VarintState::READ_DATA: {
161
42.9k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
38.5k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
38.5k
        s->value |= next_bits << (s->i * kChunkSize);
164
38.5k
        ++s->i;
165
38.5k
        s->stage = VarintState::READ_CONTINUATION;
166
38.5k
        continue;
167
42.9k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
42.9k
      }
172
220k
    }
173
220k
  }
174
143k
}
bool brunsli::DecodeLimitedVarint<8ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
19.7k
                         size_t max_symbols) {
142
19.7k
  if (s->stage == VarintState::INIT) {
143
18.9k
    s->value = 0;
144
18.9k
    s->i = 0;
145
18.9k
    s->stage = VarintState::READ_CONTINUATION;
146
18.9k
  }
147
23.1k
  while (true) {
148
23.1k
    switch (s->stage) {
149
20.6k
      case VarintState::READ_CONTINUATION: {
150
20.6k
        if (s->i < max_symbols) {
151
20.5k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
20.5k
          if (BrunsliBitReaderRead(br, 1)) {
153
1.79k
            s->stage = VarintState::READ_DATA;
154
1.79k
            continue;
155
1.79k
          }
156
20.5k
        }
157
18.7k
        s->stage = VarintState::INIT;
158
18.7k
        return true;
159
20.6k
      }
160
2.55k
      case VarintState::READ_DATA: {
161
2.55k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
1.66k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
1.66k
        s->value |= next_bits << (s->i * kChunkSize);
164
1.66k
        ++s->i;
165
1.66k
        s->stage = VarintState::READ_CONTINUATION;
166
1.66k
        continue;
167
2.55k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
2.55k
      }
172
23.1k
    }
173
23.1k
  }
174
19.7k
}
175
176
38.3k
std::vector<uint8_t> GenerateApp0Marker(uint8_t app0_status) {
177
38.3k
  std::vector<uint8_t> app0_marker(AppData_0xe0, AppData_0xe0 + 17);
178
38.3k
  app0_marker[9] = app0_status & 1u ? 2 : 1;
179
38.3k
  app0_status >>= 1u;
180
38.3k
  app0_marker[10] = app0_status & 0x3u;
181
38.3k
  app0_status >>= 2u;
182
38.3k
  uint16_t x_dens = kApp0Densities[app0_status];
183
38.3k
  app0_marker[11] = app0_marker[13] = x_dens >> 8u;
184
38.3k
  app0_marker[12] = app0_marker[14] = x_dens & 0xFFu;
185
38.3k
  return app0_marker;
186
38.3k
}
187
188
14.0k
std::vector<uint8_t> GenerateAppMarker(uint8_t marker, uint8_t code) {
189
14.0k
  std::vector<uint8_t> s;
190
14.0k
  if (marker == 0x80) {
191
5.13k
    s = std::vector<uint8_t>(AppData_0xe2, AppData_0xe2 + 3161);
192
5.13k
    s[84] = code;
193
8.86k
  } else if (marker == 0x81) {
194
3.36k
    s = std::vector<uint8_t>(AppData_0xec, AppData_0xec + 18);
195
3.36k
    s[15] = code;
196
5.50k
  } else {
197
5.50k
    BRUNSLI_DCHECK(marker == 0x82);
198
5.50k
    s = std::vector<uint8_t>(AppData_0xee, AppData_0xee + 15);
199
5.50k
    s[10] = code;
200
5.50k
  }
201
14.0k
  return s;
202
14.0k
}
203
204
bool ProcessMetaData(const uint8_t* data, size_t len, MetadataState* state,
205
830k
                     JPEGData* jpg) {
206
830k
  size_t pos = 0;
207
1.75M
  while (pos < len) {
208
922k
    switch (state->stage) {
209
103k
      case MetadataState::READ_MARKER: {
210
103k
        state->marker = static_cast<uint8_t>(data[pos++]);
211
103k
        if (state->marker == 0xD9) {
212
357
          jpg->tail_data = std::vector<uint8_t>();
213
357
          state->stage = MetadataState::READ_TAIL;
214
357
          continue;
215
103k
        } else if (state->marker < 0x40) {
216
38.3k
          state->short_marker_count++;
217
38.3k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
218
16
            return false;
219
16
          }
220
38.3k
          jpg->app_data.push_back(GenerateApp0Marker(state->marker));
221
38.3k
          continue;
222
65.2k
        } else if (state->marker >= 0x80 && state->marker <= 0x82) {
223
14.0k
          state->short_marker_count++;
224
14.0k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
225
5
            return false;
226
5
          }
227
14.0k
          state->stage = MetadataState::READ_CODE;
228
14.0k
          continue;
229
14.0k
        }
230
        // Otherwise - mutlibyte sequence.
231
51.1k
        if ((state->marker != 0xFE) && ((state->marker >> 4u) != 0x0E)) {
232
233
          return false;
233
233
        }
234
50.9k
        state->stage = MetadataState::READ_LENGTH_HI;
235
50.9k
        continue;
236
51.1k
      }
237
238
158k
      case MetadataState::READ_TAIL: {
239
158k
        Append(&jpg->tail_data, data + pos, data + len);
240
158k
        pos = len;
241
158k
        continue;
242
51.1k
      }
243
244
14.0k
      case MetadataState::READ_CODE: {
245
14.0k
        const uint8_t code = data[pos++];
246
14.0k
        jpg->app_data.push_back(GenerateAppMarker(state->marker, code));
247
14.0k
        state->stage = MetadataState::READ_MARKER;
248
14.0k
        continue;
249
51.1k
      }
250
251
50.9k
      case MetadataState::READ_LENGTH_HI: {
252
50.9k
        state->length_hi = data[pos++];
253
50.9k
        state->stage = MetadataState::READ_LENGTH_LO;
254
50.9k
        continue;
255
51.1k
      }
256
257
50.9k
      case MetadataState::READ_LENGTH_LO: {
258
50.9k
        const uint8_t lo = data[pos++];
259
50.9k
        size_t marker_len = (state->length_hi << 8u) + lo;
260
50.9k
        if (marker_len < 2) return false;
261
50.9k
        state->remaining_multibyte_length = marker_len - 2;
262
50.9k
        uint8_t head[3] = {state->marker, state->length_hi, lo};
263
50.9k
        auto* dest = (state->marker == 0xFE) ? &jpg->com_data : &jpg->app_data;
264
50.9k
        size_t delta = (state->marker == 0xFE) ? 0 : state->short_marker_count;
265
50.9k
        if (dest->size() - delta >= kBrunsliMultibyteMarkerLimit) {
266
5
          return false;
267
5
        }
268
50.9k
        dest->emplace_back(head, head + 3);
269
50.9k
        state->multibyte_sink = &dest->back();
270
        // Turn state machine to default state in case there is no payload in
271
        // multibyte sequence. This is important when such a sequence concludes
272
        // the input.
273
50.9k
        state->stage = (state->remaining_multibyte_length > 0)
274
50.9k
                           ? MetadataState::READ_MULTIBYTE
275
50.9k
                           : MetadataState::READ_MARKER;
276
50.9k
        continue;
277
50.9k
      }
278
279
544k
      case MetadataState::READ_MULTIBYTE: {
280
544k
        size_t chunk_size =
281
544k
            std::min(state->remaining_multibyte_length, len - pos);
282
544k
        Append(state->multibyte_sink, data + pos, chunk_size);
283
544k
        state->remaining_multibyte_length -= chunk_size;
284
544k
        pos += chunk_size;
285
544k
        if (state->remaining_multibyte_length == 0) {
286
48.5k
          state->stage = MetadataState::READ_MARKER;
287
48.5k
        }
288
544k
        continue;
289
50.9k
      }
290
291
0
      default: return false;
292
922k
    }
293
922k
  }
294
830k
  return true;
295
830k
}
296
297
73.0k
static BrunsliStatus DecodeHuffmanCode(State* state, JPEGData* jpg) {
298
73.0k
  InternalState& s = *state->internal;
299
73.0k
  JpegInternalsState& js = s.internals;
300
73.0k
  BrunsliBitReader* br = &js.br;
301
302
463k
  while (true) {
303
463k
    switch (js.stage) {
304
53.1k
      case JpegInternalsState::READ_HUFFMAN_LAST: {
305
53.1k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
306
51.1k
        js.is_known_last_huffman_code = BrunsliBitReaderRead(br, 1);
307
51.1k
        jpg->huffman_code.emplace_back();
308
51.1k
        js.stage = JpegInternalsState::READ_HUFFMAN_SIMPLE;
309
51.1k
        continue;
310
53.1k
      }
311
71.7k
      case JpegInternalsState::READ_HUFFMAN_SIMPLE: {
312
71.7k
        if (!BrunsliBitReaderCanRead(br, 5 + !js.is_known_last_huffman_code)) {
313
20.9k
          return BRUNSLI_NOT_ENOUGH_DATA;
314
20.9k
        }
315
50.8k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
316
317
50.8k
        huff->slot_id = BrunsliBitReaderRead(br, 2);
318
50.8k
        js.is_dc_table = (BrunsliBitReaderRead(br, 1) == 0);
319
50.8k
        huff->slot_id += js.is_dc_table ? 0 : 0x10;
320
50.8k
        huff->is_last =
321
50.8k
            js.is_known_last_huffman_code || BrunsliBitReaderRead(br, 1);
322
50.8k
        huff->counts[0] = 0;
323
50.8k
        int found_match = BrunsliBitReaderRead(br, 1);
324
50.8k
        if (found_match) {
325
30.5k
          if (js.is_dc_table) {
326
16.6k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
327
16.6k
            memcpy(&huff->counts[1], kStockDCHuffmanCodeCounts[huff_table_idx],
328
16.6k
                   sizeof(kStockDCHuffmanCodeCounts[0]));
329
16.6k
            memcpy(&huff->values[0], kStockDCHuffmanCodeValues[huff_table_idx],
330
16.6k
                   sizeof(kStockDCHuffmanCodeValues[0]));
331
16.6k
          } else {
332
13.9k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
333
13.9k
            memcpy(&huff->counts[1], kStockACHuffmanCodeCounts[huff_table_idx],
334
13.9k
                   sizeof(kStockACHuffmanCodeCounts[0]));
335
13.9k
            memcpy(&huff->values[0], kStockACHuffmanCodeValues[huff_table_idx],
336
13.9k
                   sizeof(kStockACHuffmanCodeValues[0]));
337
13.9k
          }
338
30.5k
          js.stage = JpegInternalsState::HUFFMAN_UPDATE;
339
30.5k
        } else {
340
          // One less bit is used than requested, but it is guaranteed to be
341
          // consumed in complex Huffman code case.
342
20.2k
          js.p.Init(js.is_dc_table
343
20.2k
                        ? std::vector<uint8_t>(kDefaultDCValues,
344
14.4k
                                               std::end(kDefaultDCValues))
345
20.2k
                        : std::vector<uint8_t>(kDefaultACValues,
346
5.82k
                                               std::end(kDefaultACValues)));
347
20.2k
          js.stage = JpegInternalsState::READ_HUFFMAN_MAX_LEN;
348
20.2k
        }
349
50.8k
        continue;
350
71.7k
      }
351
23.7k
      case JpegInternalsState::READ_HUFFMAN_MAX_LEN: {
352
23.7k
        if (!BrunsliBitReaderCanRead(br, 4)) return BRUNSLI_NOT_ENOUGH_DATA;
353
20.2k
        js.max_len = BrunsliBitReaderRead(br, 4) + 1;
354
20.2k
        js.total_count = 0;
355
20.2k
        js.max_count =
356
20.2k
            js.is_dc_table ? kJpegDCAlphabetSize : kJpegHuffmanAlphabetSize;
357
20.2k
        js.space = (1u << kJpegHuffmanMaxBitLength) -
358
20.2k
                   (1u << (kJpegHuffmanMaxBitLength - js.max_len));
359
20.2k
        js.i = 1;
360
20.2k
        js.stage = JpegInternalsState::READ_HUFFMAN_COUNT;
361
20.2k
        continue;
362
23.7k
      }
363
101k
      case JpegInternalsState::READ_HUFFMAN_COUNT: {
364
101k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
365
101k
        if (js.i <= js.max_len) {
366
81.4k
          size_t shift = kJpegHuffmanMaxBitLength - js.i;
367
81.4k
          size_t count_limit =
368
81.4k
              std::min(js.max_count - js.total_count, js.space >> shift);
369
81.4k
          if (count_limit > 0) {
370
77.9k
            int nbits =
371
77.9k
                Log2FloorNonZero(static_cast<uint32_t>(count_limit)) + 1;
372
77.9k
            if (!BrunsliBitReaderCanRead(br, nbits)) {
373
10.8k
              return BRUNSLI_NOT_ENOUGH_DATA;
374
10.8k
            }
375
67.1k
            size_t count = BrunsliBitReaderRead(br, nbits);
376
67.1k
            if (count > count_limit) {
377
9
              return BRUNSLI_INVALID_BRN;
378
9
            }
379
67.1k
            huff->counts[js.i] = static_cast<int>(count);
380
67.1k
            js.total_count += count;
381
67.1k
            js.space -= count * (static_cast<size_t>(1) << shift);
382
67.1k
          }
383
70.6k
          ++js.i;
384
70.6k
          continue;
385
81.4k
        }
386
20.0k
        ++huff->counts[js.max_len];
387
20.0k
        js.i = 0;
388
20.0k
        js.stage = JpegInternalsState::READ_HUFFMAN_PERMUTATION;
389
20.0k
        continue;
390
101k
      }
391
163k
      case JpegInternalsState::READ_HUFFMAN_PERMUTATION: {
392
163k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
393
163k
        if (js.i < js.total_count) {
394
143k
          const int nbits = js.p.num_bits();
395
143k
          if (!DecodeLimitedVarint<2>(&js.varint, br, (nbits + 1) >> 1u)) {
396
14.4k
            return BRUNSLI_NOT_ENOUGH_DATA;
397
14.4k
          }
398
128k
          uint8_t value;
399
128k
          if (!js.p.Remove(js.varint.value, &value)) {
400
11
            return BRUNSLI_INVALID_BRN;
401
11
          }
402
128k
          huff->values[js.i] = value;
403
128k
          ++js.i;
404
128k
          continue;
405
128k
        }
406
19.9k
        huff->values[js.total_count] = kJpegHuffmanAlphabetSize;
407
19.9k
        js.stage = JpegInternalsState::HUFFMAN_UPDATE;
408
19.9k
        continue;
409
163k
      }
410
50.5k
      case JpegInternalsState::HUFFMAN_UPDATE: {
411
        // This stage does not perform reading -> transient.
412
50.5k
        if (jpg->huffman_code.back().is_last) {
413
25.6k
          js.terminal_huffman_code_count++;
414
25.6k
        }
415
50.5k
        if (js.is_known_last_huffman_code) {
416
21.1k
          js.p.Clear();
417
21.1k
          return BRUNSLI_OK;
418
21.1k
        }
419
29.3k
        if (jpg->huffman_code.size() >= kMaxDHTMarkers) {
420
          // Too many Huffman codes for a valid bit-stream. Normally, a jpeg
421
          // file can have any arbitrary number of DHT, DQT, etc. But i prefer
422
          // we force a reasonable lower bound instead of open door to likely
423
          // forged BRN input.
424
2
          return BRUNSLI_INVALID_BRN;
425
2
        }
426
29.3k
        js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
427
29.3k
        continue;
428
29.3k
      }
429
0
      default:
430
0
        return BRUNSLI_DECOMPRESSION_ERROR;
431
463k
    }
432
463k
  }
433
0
  return BRUNSLI_OK;
434
73.0k
}
435
436
1.74M
BrunsliStatus DecodeScanInfo(State* state, JPEGData* jpg) {
437
1.74M
  InternalState& s = *state->internal;
438
1.74M
  JpegInternalsState& js = s.internals;
439
1.74M
  BrunsliBitReader* br = &js.br;
440
441
4.50M
  const auto maybe_add_zero_run = [&js, jpg] () {
442
4.50M
    if (js.last_num > 0) {
443
4.48M
      JPEGScanInfo::ExtraZeroRunInfo info;
444
4.48M
      info.block_idx = js.last_block_idx;
445
4.48M
      info.num_extra_zero_runs = js.last_num;
446
4.48M
      jpg->scan_info[js.i].extra_zero_runs.push_back(info);
447
4.48M
      js.last_num = 0;
448
4.48M
    }
449
4.50M
  };
450
451
23.0M
  while (true) {
452
23.0M
    switch (js.stage) {
453
172k
      case JpegInternalsState::READ_SCAN_COMMON: {
454
172k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
455
172k
        if (!BrunsliBitReaderCanRead(br, 22)) return BRUNSLI_NOT_ENOUGH_DATA;
456
54.2k
        si->Ss = BrunsliBitReaderRead(br, 6);
457
54.2k
        si->Se = BrunsliBitReaderRead(br, 6);
458
54.2k
        si->Ah = BrunsliBitReaderRead(br, 4);
459
54.2k
        si->Al = BrunsliBitReaderRead(br, 4);
460
54.2k
        si->num_components = BrunsliBitReaderRead(br, 2) + 1;
461
54.2k
        js.j = 0;
462
54.2k
        js.stage = JpegInternalsState::READ_SCAN_COMPONENT;
463
54.2k
        continue;
464
172k
      }
465
291k
      case JpegInternalsState::READ_SCAN_COMPONENT: {
466
291k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
467
291k
        if (js.j < si->num_components) {
468
237k
          if (!BrunsliBitReaderCanRead(br, 6)) return BRUNSLI_NOT_ENOUGH_DATA;
469
118k
          si->components[js.j].comp_idx = BrunsliBitReaderRead(br, 2);
470
118k
          si->components[js.j].dc_tbl_idx = BrunsliBitReaderRead(br, 2);
471
118k
          si->components[js.j].ac_tbl_idx = BrunsliBitReaderRead(br, 2);
472
118k
          js.j++;
473
118k
        } else {
474
54.1k
          js.last_block_idx = -1;
475
54.1k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
476
54.1k
        }
477
172k
        continue;
478
291k
      }
479
5.59M
      case JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION: {
480
5.59M
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
481
4.98M
        if (BrunsliBitReaderRead(br, 1)) {
482
4.93M
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_DATA;
483
4.93M
        } else {
484
53.9k
          js.last_block_idx = 0;
485
53.9k
          js.last_num = 0;
486
53.9k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
487
53.9k
        }
488
4.98M
        continue;
489
5.59M
      }
490
4.94M
      case JpegInternalsState::READ_SCAN_RESET_POINT_DATA: {
491
4.94M
        JPEGScanInfo* si = &jpg->scan_info[js.i];
492
4.94M
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
493
4.93M
        int block_idx =
494
4.93M
            js.last_block_idx + static_cast<int>(js.varint.value) + 1;
495
4.93M
        si->reset_points.emplace_back(block_idx);
496
4.93M
        js.last_block_idx = block_idx;
497
        // TODO(eustas): limit to exact number of blocks.
498
4.93M
        if (js.last_block_idx > (1 << 30)) {
499
          // At most 8K x 8K x num_channels blocks are expected. That is,
500
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
501
          // image.
502
12
          return BRUNSLI_INVALID_BRN;
503
12
        }
504
4.93M
        js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
505
4.93M
        continue;
506
4.93M
      }
507
5.74M
      case JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION: {
508
5.74M
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
509
5.59M
        if (BrunsliBitReaderRead(br, 1)) {
510
5.53M
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_DATA;
511
5.53M
        } else {
512
53.7k
          maybe_add_zero_run();
513
53.7k
          ++js.i;
514
53.7k
          if (js.i < js.num_scans) {
515
44.2k
            js.stage = JpegInternalsState::READ_SCAN_COMMON;
516
44.2k
            continue;
517
44.2k
          }
518
9.51k
          return BRUNSLI_OK;
519
53.7k
        }
520
5.53M
        continue;
521
5.59M
      }
522
6.26M
      case JpegInternalsState::READ_SCAN_ZERO_RUN_DATA: {
523
6.26M
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
524
5.53M
        int block_idx = js.last_block_idx + static_cast<int>(js.varint.value);
525
5.53M
        if (block_idx > js.last_block_idx) maybe_add_zero_run();
526
5.53M
        ++js.last_num;
527
5.53M
        js.last_block_idx = block_idx;
528
        // TODO(eustas): limit to exact number of blocks.
529
5.53M
        if (js.last_block_idx > (1 << 30)) {
530
          // At most 8K x 8K x num_channels blocks are expected. That is,
531
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
532
          // image.
533
2
          return BRUNSLI_INVALID_BRN;
534
2
        }
535
5.53M
        js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
536
5.53M
        continue;
537
5.53M
      }
538
0
      default: return BRUNSLI_DECOMPRESSION_ERROR;
539
23.0M
    }
540
23.0M
  }
541
1.74M
}
542
543
static bool BRUNSLI_NOINLINE DecodeCoeffOrder(uint32_t* order, BitSource* br,
544
11.0k
                                              WordSource* in) {
545
11.0k
  uint32_t lehmer[kDCTBlockSize] = {0};
546
11.0k
  static const int kSpan = 16;
547
55.3k
  for (int i = 0; i < kDCTBlockSize; i += kSpan) {
548
44.2k
    if (!br->ReadBits(1, in)) continue;  // span is all-zero
549
5.25k
    const int start = (i > 0) ? i : 1;
550
5.25k
    const int end = i + kSpan;
551
85.4k
    for (int j = start; j < end; ++j) {
552
80.1k
      uint32_t v = 0;
553
102k
      while (v <= kDCTBlockSize) {
554
102k
        const uint32_t bits = br->ReadBits(3, in);
555
102k
        v += bits;
556
102k
        if (bits < 7) break;
557
102k
      }
558
80.1k
      if (v > kDCTBlockSize) return false;
559
80.1k
      lehmer[j] = v;
560
80.1k
    }
561
5.25k
  }
562
11.0k
  int end = kDCTBlockSize - 1;
563
648k
  while (end >= 1 && lehmer[end] == 0) {
564
637k
    --end;
565
637k
  }
566
11.0k
  if (lehmer[end] == 1) return false;
567
56.7k
  for (int i = 1; i <= end; ++i) {
568
46.1k
    if (lehmer[i] == 0) return false;
569
45.7k
    --lehmer[i];
570
45.7k
  }
571
10.6k
  if (!DecodeLehmerCode(lehmer, kDCTBlockSize, order)) return false;
572
687k
  for (int k = 0; k < kDCTBlockSize; ++k) {
573
677k
    order[k] = kJPEGNaturalOrder[order[k]];
574
677k
  }
575
10.5k
  return true;
576
10.6k
}
577
578
/** Reads 0..6 words from |in| and returns the value in the range 0..63. */
579
static size_t DecodeNumNonzeros(Prob* p, BinaryArithmeticDecoder* ac,
580
3.11M
                                WordSource* in) {
581
  // To simplity BST navigation, we use 1-based indexing.
582
3.11M
  Prob* bst = p - 1;
583
3.11M
  size_t ctx = 1;
584
585
21.8M
  for (size_t b = 0; b < kNumNonZeroBits; ++b) {
586
18.7M
    const int bit = ac->ReadBit(bst[ctx].get_proba(), in);
587
18.7M
    bst[ctx].Add(bit);
588
18.7M
    ctx = 2 * ctx + bit;
589
18.7M
  }
590
591
  // Leaf index in the level corresponds to the resuling value.
592
3.11M
  size_t val = ctx - (1u << kNumNonZeroBits);
593
3.11M
  BRUNSLI_DCHECK(val <= kNumNonZeroTreeSize);
594
3.11M
  return val;
595
3.11M
}
596
597
121k
void EnsureSubdecodersInitialized(State* state, WordSource* in) {
598
121k
  InternalState& s = *state->internal;
599
121k
  if (!s.subdecoders_initialized) {
600
21.5k
    s.ans_decoder.Init(in);
601
21.5k
    s.bit_reader.Init(in);
602
21.5k
    s.arith_decoder.Init(in);
603
21.5k
    s.subdecoders_initialized = true;
604
21.5k
  }
605
121k
}
606
607
20.7k
bool FinalizeSubdecoders(State* state) {
608
20.7k
  InternalState& s = *state->internal;
609
20.7k
  if (!s.ans_decoder.CheckCRC()) return false;
610
19.5k
  if (!s.bit_reader.Finish()) return false;
611
19.4k
  s.subdecoders_initialized = false;
612
19.4k
  return true;
613
19.5k
}
614
615
94.3k
BrunsliStatus DecodeDC(State* state, WordSource* in) {
616
94.3k
  const std::vector<ComponentMeta>& meta = state->meta;
617
94.3k
  const size_t num_components = meta.size();
618
94.3k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
619
94.3k
  InternalState& s = *state->internal;
620
94.3k
  AcDcState& ac_dc_state = s.ac_dc;
621
622
94.3k
  std::vector<ComponentStateDC>& comps = ac_dc_state.dc;
623
94.3k
  if (comps.empty()) {
624
11.5k
    comps.resize(num_components);
625
24.3k
    for (size_t c = 0; c < num_components; ++c) {
626
12.8k
      comps[c].SetWidth(meta[c].width_in_blocks);
627
12.8k
    }
628
11.5k
  }
629
630
94.3k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
631
26.4k
  EnsureSubdecodersInitialized(state, in);
632
26.4k
  ANSDecoder ans = s.ans_decoder;
633
26.4k
  BitSource br = s.bit_reader;
634
26.4k
  BinaryArithmeticDecoder ac = s.arith_decoder;
635
636
  // We decode DC components in the following interleaved manner:
637
  //   v_samp[0] rows from component 0
638
  //   v_samp[1] rows from component 1
639
  //   v_samp[2] rows from component 2
640
  //   v_samp[3] rows from component 3 (if present)
641
  //
642
  // E.g. in a YUV420 image, we decode 2 rows of DC components from Y and then
643
  // 1 row of DC components from U and 1 row of DC components from V.
644
287k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
645
539k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
646
279k
      ComponentStateDC* c = &comps[i];
647
279k
      const ComponentMeta& m = meta[i];
648
279k
      const uint8_t* context_map = state->context_map + i * kNumAvrgContexts;
649
279k
      const int ac_stride = static_cast<int>(m.ac_stride);
650
279k
      const size_t b_stride = m.b_stride;
651
279k
      const int width = m.width_in_blocks;
652
279k
      int y = mcu_y * m.v_samp + ac_dc_state.next_iy;
653
279k
      int* const prev_sgn = &c->prev_sign[1];
654
279k
      int* const prev_abs = &c->prev_abs_coeff[2];
655
1.03M
      for (int iy = ac_dc_state.next_iy; iy < m.v_samp; ++iy, ++y) {
656
768k
        coeff_t* coeffs =
657
768k
            m.ac_coeffs + y * ac_stride + ac_dc_state.next_x * kDCTBlockSize;
658
768k
        uint8_t* block_state =
659
768k
            m.block_state + y * b_stride + ac_dc_state.next_x;
660
76.3M
        for (int x = ac_dc_state.next_x; x < width; ++x) {
661
75.5M
          if (BRUNSLI_PREDICT_FALSE(!in->CanRead(6))) {
662
15.3k
            ac_dc_state.next_mcu_y = mcu_y;
663
15.3k
            ac_dc_state.next_component = i;
664
15.3k
            ac_dc_state.next_iy = iy;
665
15.3k
            ac_dc_state.next_x = x;
666
15.3k
            s.ans_decoder = ans;
667
15.3k
            s.bit_reader = br;
668
15.3k
            s.arith_decoder = ac;
669
15.3k
            return BRUNSLI_NOT_ENOUGH_DATA;
670
15.3k
          }
671
75.5M
          const int is_empty_ctx =
672
75.5M
              IsEmptyBlockContext(&c->prev_is_nonempty[1], x);
673
75.5M
          Prob* BRUNSLI_RESTRICT is_empty_p =
674
75.5M
              &c->is_empty_block_prob[is_empty_ctx];
675
75.5M
          const bool is_empty_block = !ac.ReadBit(is_empty_p->get_proba(), in);
676
75.5M
          is_empty_p->Add(!is_empty_block);
677
75.5M
          c->prev_is_nonempty[x + 1] = !is_empty_block;
678
75.5M
          *block_state = is_empty_block;
679
75.5M
          int abs_val = 0;
680
75.5M
          int sign = 0;
681
75.5M
          if (!is_empty_block) {
682
11.8M
            Prob* BRUNSLI_RESTRICT p_is_zero = &c->is_zero_prob;
683
11.8M
            int is_zero = ac.ReadBit(p_is_zero->get_proba(), in);
684
11.8M
            p_is_zero->Add(is_zero);
685
11.8M
            if (!is_zero) {
686
2.19M
              const int avg_ctx = WeightedAverageContextDC(prev_abs, x);
687
2.19M
              const int sign_ctx = prev_sgn[x] * 3 + prev_sgn[x - 1];
688
2.19M
              Prob* BRUNSLI_RESTRICT sign_p = &c->sign_prob[sign_ctx];
689
2.19M
              sign = ac.ReadBit(sign_p->get_proba(), in);
690
2.19M
              sign_p->Add(sign);
691
2.19M
              const int entropy_ix = context_map[avg_ctx];
692
2.19M
              int code = ans.ReadSymbol(state->entropy_codes[entropy_ix], in);
693
2.19M
              if (code < kNumDirectCodes) {
694
782k
                abs_val = code + 1;
695
1.41M
              } else {
696
1.41M
                int nbits = code - kNumDirectCodes;
697
1.41M
                Prob* BRUNSLI_RESTRICT p_first_extra_bit =
698
1.41M
                    &c->first_extra_bit_prob[nbits];
699
1.41M
                int first_extra_bit =
700
1.41M
                    ac.ReadBit(p_first_extra_bit->get_proba(), in);
701
1.41M
                p_first_extra_bit->Add(first_extra_bit);
702
1.41M
                int extra_bits_val = first_extra_bit << nbits;
703
1.41M
                if (nbits > 0) {
704
1.25M
                  extra_bits_val |= static_cast<int>(br.ReadBits(nbits, in));
705
1.25M
                }
706
1.41M
                abs_val = kNumDirectCodes - 1 + (2 << nbits) + extra_bits_val;
707
1.41M
              }
708
2.19M
            }
709
11.8M
          }
710
75.5M
          prev_abs[x] = abs_val;
711
75.5M
          prev_sgn[x] = abs_val ? sign + 1 : 0;
712
75.5M
          coeffs[0] = ((1 - 2 * sign) * abs_val +
713
75.5M
                       PredictWithAdaptiveMedian(coeffs, x, y, ac_stride));
714
75.5M
          block_state++;
715
75.5M
          coeffs += kDCTBlockSize;
716
75.5M
        }
717
752k
        ac_dc_state.next_x = 0;
718
752k
      }
719
263k
      ac_dc_state.next_iy = 0;
720
263k
    }
721
260k
    ac_dc_state.next_component = 0;
722
260k
  }
723
724
  // Prepare for AC decoding.
725
11.1k
  ac_dc_state.next_mcu_y = 0;
726
11.1k
  ac_dc_state.next_component = 0;
727
11.1k
  ac_dc_state.next_iy = 0;
728
11.1k
  ac_dc_state.next_x = 0;
729
730
11.1k
  comps.clear();
731
11.1k
  comps.shrink_to_fit();
732
733
11.1k
  s.ans_decoder = ans;
734
11.1k
  s.bit_reader = br;
735
11.1k
  s.arith_decoder = ac;
736
11.1k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
737
738
10.6k
  return BRUNSLI_OK;
739
11.1k
}
740
741
static void BRUNSLI_NOINLINE DecodeEmptyAcBlock(
742
19.5M
    int* BRUNSLI_RESTRICT prev_sgn, int* BRUNSLI_RESTRICT prev_abs) {
743
1.24G
  for (int k = 1; k < kDCTBlockSize; ++k) {
744
1.23G
    prev_sgn[k] = 0;
745
1.23G
    prev_abs[k] = 0;
746
1.23G
  }
747
19.5M
}
748
749
/** All the necessary things for decoding AC block. */
750
struct AcBlockCookie {
751
  int x;
752
  int y;
753
  uint8_t* BRUNSLI_RESTRICT prev_num_nonzeros;
754
  int* BRUNSLI_RESTRICT prev_sgn;
755
  int* BRUNSLI_RESTRICT prev_abs;
756
  Prob* BRUNSLI_RESTRICT num_nonzero_prob;
757
758
  BinaryArithmeticDecoder* BRUNSLI_RESTRICT ac;
759
  WordSource* BRUNSLI_RESTRICT in;
760
  ANSDecoder* BRUNSLI_RESTRICT ans;
761
  BitSource* BRUNSLI_RESTRICT br;
762
763
  coeff_t* BRUNSLI_RESTRICT coeffs;
764
  const coeff_t* BRUNSLI_RESTRICT prev_row_coeffs;
765
  const coeff_t* BRUNSLI_RESTRICT prev_col_coeffs;
766
  Prob* BRUNSLI_RESTRICT is_zero_prob;
767
  const uint32_t* BRUNSLI_RESTRICT order;
768
  const uint8_t* BRUNSLI_RESTRICT context_modes;
769
  const int* BRUNSLI_RESTRICT mult_col;
770
  const int* BRUNSLI_RESTRICT mult_row;
771
  int prev_row_delta;
772
  Prob* BRUNSLI_RESTRICT sign_prob;
773
  size_t context_bits;
774
  const uint8_t* BRUNSLI_RESTRICT context_map;
775
  const ANSDecodingData* BRUNSLI_RESTRICT entropy_codes;
776
  Prob* BRUNSLI_RESTRICT first_extra_bit_prob;
777
};
778
779
3.11M
static size_t BRUNSLI_NOINLINE DecodeAcBlock(const AcBlockCookie& cookie) {
780
3.11M
  AcBlockCookie c = cookie;
781
782
3.11M
  BinaryArithmeticDecoder ac = *c.ac;
783
3.11M
  WordSource* in = c.in;
784
3.11M
  ANSDecoder ans = *c.ans;
785
3.11M
  BitSource br = *c.br;
786
787
3.11M
  size_t num_nonzeros = 0;
788
789
3.11M
  const uint8_t nonzero_ctx = NumNonzerosContext(c.prev_num_nonzeros, c.x, c.y);
790
3.11M
  size_t last_nz = DecodeNumNonzeros(
791
3.11M
      c.num_nonzero_prob + kNumNonZeroTreeSize * nonzero_ctx, &ac, in);
792
167M
  for (size_t k = last_nz + 1; k < kDCTBlockSize; ++k) {
793
164M
    c.prev_sgn[k] = 0;
794
164M
    c.prev_abs[k] = 0;
795
164M
  }
796
35.2M
  for (size_t k = last_nz; k > 0; --k) {
797
32.1M
    int is_zero = 0;
798
32.1M
    if (k < last_nz) {
799
31.2M
      size_t bucket = kNonzeroBuckets[num_nonzeros - 1];
800
31.2M
      size_t is_zero_ctx = bucket * kDCTBlockSize + k;
801
31.2M
      Prob& p = c.is_zero_prob[is_zero_ctx];
802
31.2M
      is_zero = ac.ReadBit(p.get_proba(), in);
803
31.2M
      p.Add(is_zero);
804
31.2M
    }
805
32.1M
    int abs_val = 0;
806
32.1M
    int sign = 1;
807
32.1M
    const int k_nat = c.order[k];
808
32.1M
    if (!is_zero) {
809
5.93M
      size_t context_type = c.context_modes[k_nat];
810
5.93M
      size_t avg_ctx = 0;
811
5.93M
      size_t sign_ctx = kMaxAverageContext;
812
5.93M
      if ((context_type & 1) && (c.y > 0)) {
813
1.13M
        size_t offset = k_nat & 7;
814
1.13M
        ACPredictContextRow(c.prev_row_coeffs + offset, c.coeffs + offset,
815
1.13M
                            c.mult_col + offset * 8, &avg_ctx, &sign_ctx);
816
4.79M
      } else if ((context_type & 2) && (c.x > 0)) {
817
1.30M
        size_t offset = k_nat & ~7;
818
1.30M
        ACPredictContextCol(c.prev_col_coeffs + offset, c.coeffs + offset,
819
1.30M
                            c.mult_row + offset, &avg_ctx, &sign_ctx);
820
3.49M
      } else if (!context_type) {
821
3.39M
        avg_ctx = WeightedAverageContext(c.prev_abs + k, c.prev_row_delta);
822
3.39M
        sign_ctx =
823
3.39M
            c.prev_sgn[k] * 3 + c.prev_sgn[static_cast<int>(k) - kDCTBlockSize];
824
3.39M
      }
825
5.93M
      sign_ctx = sign_ctx * kDCTBlockSize + k;
826
5.93M
      Prob& sign_p = c.sign_prob[sign_ctx];
827
5.93M
      sign = ac.ReadBit(sign_p.get_proba(), in);
828
5.93M
      sign_p.Add(sign);
829
5.93M
      c.prev_sgn[k] = sign + 1;
830
5.93M
      sign = 1 - 2 * sign;
831
5.93M
      const size_t z_dens_ctx =
832
5.93M
          ZeroDensityContext(num_nonzeros, k, c.context_bits);
833
5.93M
      size_t histo_ix = z_dens_ctx * kNumAvrgContexts + avg_ctx;
834
5.93M
      size_t entropy_ix = c.context_map[histo_ix];
835
5.93M
      int code = ans.ReadSymbol(c.entropy_codes[entropy_ix], in);
836
5.93M
      if (code < kNumDirectCodes) {
837
3.23M
        abs_val = code + 1;
838
3.23M
      } else {
839
2.69M
        int nbits = code - kNumDirectCodes;
840
2.69M
        Prob& p = c.first_extra_bit_prob[k * 10 + nbits];
841
2.69M
        int first_extra_bit = ac.ReadBit(p.get_proba(), in);
842
2.69M
        p.Add(first_extra_bit);
843
2.69M
        int extra_bits_val = first_extra_bit << nbits;
844
2.69M
        if (nbits > 0) {
845
2.46M
          extra_bits_val |= br.ReadBits(nbits, in);
846
2.46M
        }
847
2.69M
        abs_val = kNumDirectCodes - 1 + (2u << nbits) + extra_bits_val;
848
2.69M
      }
849
5.93M
      ++num_nonzeros;
850
26.2M
    } else {
851
26.2M
      c.prev_sgn[k] = 0;
852
26.2M
    }
853
32.1M
    int coeff = sign * abs_val;
854
32.1M
    c.coeffs[k_nat] = coeff;
855
32.1M
    c.prev_abs[k] = abs_val;
856
32.1M
  }
857
858
3.11M
  *c.ans = ans;
859
3.11M
  *c.br = br;
860
3.11M
  *c.ac = ac;
861
862
3.11M
  return num_nonzeros;
863
3.11M
}
864
865
168k
BrunsliStatus DecodeAC(State* state, WordSource* in) {
866
168k
  const std::vector<ComponentMeta>& meta = state->meta;
867
168k
  const size_t num_components = meta.size();
868
168k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
869
168k
  InternalState& s = *state->internal;
870
168k
  AcDcState& ac_dc_state = s.ac_dc;
871
872
168k
  std::vector<ComponentState>& comps = ac_dc_state.ac;
873
168k
  if (comps.empty()) {
874
10.4k
    comps.resize(num_components);
875
22.0k
    for (size_t c = 0; c < num_components; ++c) {
876
11.5k
      comps[c].SetWidth(meta[c].width_in_blocks);
877
11.5k
      ComputeACPredictMultipliers(&meta[c].quant[0], comps[c].mult_row,
878
11.5k
                                  comps[c].mult_col);
879
11.5k
    }
880
10.4k
  }
881
882
168k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
883
95.4k
  EnsureSubdecodersInitialized(state, in);
884
885
95.4k
  if (!ac_dc_state.ac_coeffs_order_decoded) {
886
78.4k
    while (ac_dc_state.next_component < num_components) {
887
68.7k
      if (!in->CanRead(121)) return BRUNSLI_NOT_ENOUGH_DATA;
888
11.0k
      if (!DecodeCoeffOrder(comps[ac_dc_state.next_component].order,
889
11.0k
                            &s.bit_reader, in)) {
890
492
        return BRUNSLI_INVALID_BRN;
891
492
      }
892
10.5k
      ac_dc_state.next_component++;
893
10.5k
    }
894
9.72k
    ac_dc_state.next_component = 0;
895
9.72k
    ac_dc_state.ac_coeffs_order_decoded = true;
896
9.72k
  }
897
898
37.2k
  AcBlockCookie c;
899
37.2k
  c.ac = &s.arith_decoder;
900
37.2k
  c.in = in;
901
37.2k
  c.ans = &s.ans_decoder;
902
37.2k
  c.br = &s.bit_reader;
903
37.2k
  c.entropy_codes = state->entropy_codes;
904
37.2k
  c.context_modes =
905
37.2k
      kContextAlgorithm + (state->use_legacy_context_model ? 64 : 0);
906
907
242k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
908
438k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
909
233k
      ComponentState& cst = comps[i];
910
233k
      c.prev_num_nonzeros = cst.prev_num_nonzeros.data();
911
233k
      c.num_nonzero_prob = cst.num_nonzero_prob;
912
233k
      c.is_zero_prob = cst.is_zero_prob.data();
913
233k
      c.order = cst.order;
914
233k
      c.mult_col = cst.mult_col;
915
233k
      c.mult_row = cst.mult_row;
916
233k
      c.sign_prob = cst.sign_prob.data();
917
233k
      c.first_extra_bit_prob = cst.first_extra_bit_prob.data();
918
233k
      const ComponentMeta& m = meta[i];
919
233k
      c.context_map = state->context_map + m.context_offset * kNumAvrgContexts;
920
233k
      c.context_bits = m.context_bits;
921
233k
      const int width = m.width_in_blocks;
922
233k
      const size_t ac_stride = m.ac_stride;
923
233k
      const size_t b_stride = m.b_stride;
924
233k
      const int next_iy = ac_dc_state.next_iy;
925
233k
      c.y = mcu_y * m.v_samp + next_iy;
926
233k
      c.prev_row_delta = (1 - 2 * (c.y & 1u)) * (width + 3) * kDCTBlockSize;
927
868k
      for (int iy = next_iy; iy < m.v_samp; ++iy, ++c.y) {
928
662k
        const int next_x = ac_dc_state.next_x;
929
662k
        const size_t block_offset = next_x * kDCTBlockSize;
930
662k
        c.coeffs = m.ac_coeffs + c.y * ac_stride + block_offset;
931
662k
        c.prev_row_coeffs = c.coeffs - ac_stride;
932
662k
        c.prev_col_coeffs = c.coeffs - kDCTBlockSize;
933
662k
        const uint8_t* block_state = m.block_state + c.y * b_stride + next_x;
934
662k
        c.prev_sgn = &cst.prev_sign[kDCTBlockSize] + block_offset;
935
662k
        c.prev_abs = &cst.prev_abs_coeff[((c.y & 1u) * (width + 3) + 2) *
936
662k
                                         kDCTBlockSize] +
937
662k
                     block_offset;
938
23.3M
        for (c.x = next_x; c.x < width; ++c.x) {
939
22.6M
          bool is_empty = *(block_state++);
940
22.6M
          if (!is_empty) {
941
3.14M
            if (BRUNSLI_PREDICT_FALSE(!in->CanRead(297))) {
942
27.6k
              ac_dc_state.next_mcu_y = mcu_y;
943
27.6k
              ac_dc_state.next_component = i;
944
27.6k
              ac_dc_state.next_iy = iy;
945
27.6k
              ac_dc_state.next_x = c.x;
946
27.6k
              return BRUNSLI_NOT_ENOUGH_DATA;
947
27.6k
            }
948
3.11M
            size_t num_nonzeros = DecodeAcBlock(c);
949
3.11M
            BRUNSLI_DCHECK(num_nonzeros <= kNumNonZeroTreeSize);
950
3.11M
            c.prev_num_nonzeros[c.x] = static_cast<uint8_t>(num_nonzeros);
951
19.5M
          } else {
952
19.5M
            DecodeEmptyAcBlock(c.prev_sgn, c.prev_abs);
953
19.5M
            c.prev_num_nonzeros[c.x] = 0;
954
19.5M
          }
955
22.6M
          c.coeffs += kDCTBlockSize;
956
22.6M
          c.prev_sgn += kDCTBlockSize;
957
22.6M
          c.prev_abs += kDCTBlockSize;
958
22.6M
          c.prev_row_coeffs += kDCTBlockSize;
959
22.6M
          c.prev_col_coeffs += kDCTBlockSize;
960
22.6M
        }
961
634k
        c.prev_row_delta *= -1;
962
634k
        ac_dc_state.next_x = 0;
963
634k
      }
964
205k
      ac_dc_state.next_iy = 0;
965
205k
    }
966
205k
    ac_dc_state.next_component = 0;
967
205k
  }
968
9.66k
  ac_dc_state.next_mcu_y = 0;
969
970
9.66k
  comps.clear();
971
9.66k
  comps.shrink_to_fit();
972
973
9.66k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
974
975
8.83k
  return BRUNSLI_OK;
976
9.66k
}
977
978
809k
static bool CheckCanRead(State* state, size_t required) {
979
  // TODO(eustas): dcheck len > pos
980
809k
  size_t available = state->len - state->pos;
981
809k
  return required <= available;
982
809k
}
983
984
377k
static bool CheckCanReadByte(State* state) {
985
  // TODO(eustas): dcheck len > pos
986
377k
  return state->pos != state->len;
987
377k
}
988
989
239k
static uint8_t ReadByte(State* state) {
990
  // TODO(eustas): dcheck len > pos
991
239k
  return state->data[state->pos++];
992
239k
}
993
994
506k
static uint8_t PeekByte(State* state, size_t offset) {
995
  // TODO(eustas): dcheck overflow.
996
506k
  return state->data[state->pos + offset];
997
506k
}
998
999
6.59M
static void SkipBytes(State* state, size_t len) {
1000
  // TODO(eustas): dcheck overflow.
1001
6.59M
  state->pos += len;
1002
6.59M
}
1003
1004
16.7M
static size_t GetBytesAvailable(State* state) {
1005
  // TODO(eustas): dcheck len > pos
1006
16.7M
  return state->len - state->pos;
1007
16.7M
}
1008
1009
11.4k
static size_t SkipAvailableBytes(State* state, size_t len) {
1010
11.4k
  size_t available = GetBytesAvailable(state);
1011
11.4k
  size_t skip_bytes = std::min(available, len);
1012
11.4k
  state->pos += skip_bytes;
1013
11.4k
  return skip_bytes;
1014
11.4k
}
1015
1016
459k
static BrunsliStatus DecodeBase128(State* state, size_t* val) {
1017
459k
  *val = 0;
1018
459k
  uint64_t b = 0x80;
1019
459k
  size_t i = 0;
1020
965k
  while ((i < 9) && (b & 0x80u)) {
1021
684k
    if (!CheckCanRead(state, i + 1)) return BRUNSLI_NOT_ENOUGH_DATA;
1022
506k
    b = PeekByte(state, i);
1023
506k
    *val |= (b & 0x7Fu) << (i * 7);
1024
506k
    ++i;
1025
506k
  }
1026
281k
  SkipBytes(state, i);
1027
281k
  return ((b & 0x80u) == 0) ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1028
459k
}
1029
1030
6.24M
static Stage Fail(State* state, BrunsliStatus result) {
1031
6.24M
  InternalState& s = *state->internal;
1032
6.24M
  s.result = result;
1033
  // Preserve current stage for continuation / error reporting.
1034
6.24M
  s.last_stage = state->stage;
1035
6.24M
  return Stage::ERROR;
1036
6.24M
}
1037
1038
377k
static BrunsliStatus ReadTag(State* state, SectionState* section) {
1039
377k
  if (!CheckCanReadByte(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1040
239k
  const uint8_t marker = ReadByte(state);
1041
1042
239k
  const size_t tag = marker >> 3u;
1043
239k
  if (tag == 0 || tag > 15) return BRUNSLI_INVALID_BRN;
1044
239k
  section->tag = tag;
1045
1046
239k
  const size_t wiring_type = marker & 0x7u;
1047
239k
  if (wiring_type != kBrunsliWiringTypeVarint &&
1048
239k
      wiring_type != kBrunsliWiringTypeLengthDelimited) {
1049
48
    return BRUNSLI_INVALID_BRN;
1050
48
  }
1051
239k
  section->is_section = (wiring_type == kBrunsliWiringTypeLengthDelimited);
1052
1053
239k
  const uint32_t tag_bit = 1u << tag;
1054
239k
  if (section->tags_met & tag_bit) {
1055
31
    BRUNSLI_LOG_ERROR() << "Duplicate marker " << std::hex
1056
31
                        << static_cast<int>(marker) << BRUNSLI_ENDL();
1057
31
    return BRUNSLI_INVALID_BRN;
1058
31
  }
1059
239k
  section->tags_met |= tag_bit;
1060
1061
239k
  return BRUNSLI_OK;
1062
239k
}
1063
1064
189k
static BrunsliStatus EnterSection(State* state, SectionState* section) {
1065
189k
  size_t section_size;
1066
189k
  BrunsliStatus status = DecodeBase128(state, &section_size);
1067
189k
  if (status != BRUNSLI_OK) return status;
1068
114k
  section->is_active = true;
1069
114k
  section->remaining = section_size;
1070
114k
  section->milestone = state->pos;
1071
114k
  section->projected_end = state->pos + section->remaining;
1072
114k
  return BRUNSLI_OK;
1073
189k
}
1074
1075
31.1k
static void LeaveSection(SectionState* section) {
1076
31.1k
  section->is_active = false;
1077
31.1k
}
1078
1079
17.4M
static bool IsOutOfSectionBounds(State* state) {
1080
17.4M
  return state->pos > state->internal->section.projected_end;
1081
17.4M
}
1082
1083
17.4M
static size_t RemainingSectionLength(State* state) {
1084
  // TODO(eustas): remove this check?
1085
17.4M
  if (IsOutOfSectionBounds(state)) return 0;
1086
17.4M
  return state->internal->section.projected_end - state->pos;
1087
17.4M
}
1088
1089
345k
static bool IsAtSectionBoundary(State* state) {
1090
345k
  return state->pos == state->internal->section.projected_end;
1091
345k
}
1092
1093
124k
Stage VerifySignature(State* state) {
1094
124k
  InternalState& s = *state->internal;
1095
1096
124k
  if (!CheckCanRead(state, kBrunsliSignatureSize)) {
1097
92.3k
    return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1098
92.3k
  }
1099
32.4k
  const bool is_signature_ok =
1100
32.4k
      (memcmp(state->data + state->pos, kBrunsliSignature,
1101
32.4k
              kBrunsliSignatureSize) != 0);
1102
32.4k
  state->pos += kBrunsliSignatureSize;
1103
32.4k
  s.section.tags_met |= 1u << kBrunsliSignatureTag;
1104
32.4k
  if (is_signature_ok) return Fail(state, BRUNSLI_INVALID_BRN);
1105
32.3k
  return Stage::HEADER;
1106
32.4k
}
1107
1108
// Parses the brunsli header starting at data[*pos] and fills in *jpg.
1109
// Sets *pos to the position after the header.
1110
// Returns BRUNSLI_OK, unless the data is not valid brunsli byte stream
1111
// or is truncated.
1112
202k
Stage DecodeHeader(State* state, JPEGData* jpg) {
1113
202k
  InternalState& s = *state->internal;
1114
202k
  HeaderState& hs = s.header;
1115
1116
589k
  while (hs.stage != HeaderState::DONE) {
1117
558k
    switch (hs.stage) {
1118
63.0k
      case HeaderState::READ_TAG: {
1119
63.0k
        BrunsliStatus status = ReadTag(state, &s.section);
1120
63.0k
        if (status != BRUNSLI_OK) return Fail(state, status);
1121
32.2k
        if (s.section.tag != kBrunsliHeaderTag || !s.section.is_section) {
1122
12
          return Fail(state, BRUNSLI_INVALID_BRN);
1123
12
        }
1124
32.2k
        hs.stage = HeaderState::ENTER_SECTION;
1125
32.2k
        break;
1126
32.2k
      }
1127
1128
48.2k
      case HeaderState::ENTER_SECTION: {
1129
48.2k
        BrunsliStatus status = EnterSection(state, &s.section);
1130
48.2k
        if (status != BRUNSLI_OK) return Fail(state, status);
1131
32.2k
        hs.stage = HeaderState::ITEM_READ_TAG;
1132
32.2k
        break;
1133
48.2k
      }
1134
1135
216k
      case HeaderState::ITEM_READ_TAG: {
1136
216k
        if (IsAtSectionBoundary(state)) {
1137
31.6k
          hs.stage = HeaderState::FINALE;
1138
31.6k
          break;
1139
31.6k
        }
1140
184k
        BrunsliStatus status = ReadTag(state, &hs.section);
1141
184k
        if (status != BRUNSLI_OK) return Fail(state, status);
1142
124k
        const uint32_t tag_bit = 1u << hs.section.tag;
1143
124k
        if (hs.section.is_section) {
1144
10.6k
          if (kKnownHeaderVarintTags & tag_bit) {
1145
10.5k
            Fail(state, BRUNSLI_INVALID_BRN);
1146
10.5k
          }
1147
10.6k
          hs.stage = HeaderState::ITEM_ENTER_SECTION;
1148
10.6k
          break;
1149
10.6k
        }
1150
114k
        hs.stage = HeaderState::ITEM_READ_VALUE;
1151
114k
        break;
1152
124k
      }
1153
1154
16.8k
      case HeaderState::ITEM_ENTER_SECTION: {
1155
16.8k
        BrunsliStatus status = DecodeBase128(state, &hs.remaining_skip_length);
1156
16.8k
        if (status != BRUNSLI_OK) return Fail(state, status);
1157
10.6k
        hs.stage = HeaderState::ITEM_SKIP_CONTENTS;
1158
10.6k
        break;
1159
16.8k
      }
1160
1161
11.4k
      case HeaderState::ITEM_SKIP_CONTENTS: {
1162
11.4k
        size_t bytes_skipped =
1163
11.4k
            SkipAvailableBytes(state, hs.remaining_skip_length);
1164
11.4k
        hs.remaining_skip_length -= bytes_skipped;
1165
11.4k
        if (hs.remaining_skip_length > 0) {
1166
1.01k
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1167
1.01k
        }
1168
10.3k
        hs.stage = HeaderState::ITEM_READ_TAG;
1169
10.3k
        break;
1170
11.4k
      }
1171
1172
170k
      case HeaderState::ITEM_READ_VALUE: {
1173
170k
        size_t value;
1174
170k
        BrunsliStatus status = DecodeBase128(state, &value);
1175
170k
        if (status != BRUNSLI_OK) return Fail(state, status);
1176
114k
        hs.varint_values[hs.section.tag] = value;
1177
114k
        hs.stage = HeaderState::ITEM_READ_TAG;
1178
114k
        break;
1179
170k
      }
1180
1181
31.6k
      case HeaderState::FINALE: {
1182
31.6k
        const bool has_version =
1183
31.6k
            hs.section.tags_met & (1u << kBrunsliHeaderVersionCompTag);
1184
31.6k
        if (!has_version) return Fail(state, BRUNSLI_INVALID_BRN);
1185
31.6k
        const size_t version_and_comp_count =
1186
31.6k
            hs.varint_values[kBrunsliHeaderVersionCompTag];
1187
1188
31.6k
        const size_t version = version_and_comp_count >> 2u;
1189
31.6k
        jpg->version = static_cast<int>(version);
1190
1191
31.6k
        if (version == 1) {  // fallback mode
1192
          // TODO(eustas): do we need this?
1193
647
          jpg->width = 0;
1194
647
          jpg->height = 0;
1195
647
          hs.stage = HeaderState::DONE;
1196
647
          break;
1197
647
        }
1198
1199
        // Wrong mode = fallback + something.
1200
31.0k
        if ((version & 1u) != 0) {
1201
36
          return Fail(state, BRUNSLI_INVALID_BRN);
1202
36
        }
1203
        // Unknown mode - only 3 bits are defined.
1204
30.9k
        if ((version & ~0x7u) != 0) {
1205
94
          return Fail(state, BRUNSLI_INVALID_BRN);
1206
94
        }
1207
1208
        // Otherwise regular brunsli.
1209
30.8k
        state->use_legacy_context_model = !(version & 2);
1210
1211
        // Do not allow "original_jpg" for regular Brunsli files.
1212
30.8k
        s.section.tags_met |= 1u << kBrunsliOriginalJpgTag;
1213
1214
30.8k
        const bool has_width =
1215
30.8k
            hs.section.tags_met & (1u << kBrunsliHeaderWidthTag);
1216
30.8k
        if (!has_width) return Fail(state, BRUNSLI_INVALID_BRN);
1217
30.8k
        const size_t width = hs.varint_values[kBrunsliHeaderWidthTag];
1218
30.8k
        const bool has_height =
1219
30.8k
            hs.section.tags_met & (1u << kBrunsliHeaderHeightTag);
1220
30.8k
        if (!has_height) return Fail(state, BRUNSLI_INVALID_BRN);
1221
30.8k
        const size_t height = hs.varint_values[kBrunsliHeaderHeightTag];
1222
1223
30.8k
        if (width == 0 || height == 0) return Fail(state, BRUNSLI_INVALID_BRN);
1224
30.8k
        if (width > kMaxDimPixels || height > kMaxDimPixels) {
1225
358
          return Fail(state, BRUNSLI_INVALID_BRN);
1226
358
        }
1227
30.5k
        jpg->width = static_cast<int>(width);
1228
30.5k
        jpg->height = static_cast<int>(height);
1229
1230
30.5k
        const size_t num_components = (version_and_comp_count & 3u) + 1u;
1231
30.5k
        jpg->components.resize(num_components);
1232
1233
30.5k
        const bool has_subsampling =
1234
30.5k
            hs.section.tags_met & (1u << kBrunsliHeaderSubsamplingTag);
1235
30.5k
        if (!has_subsampling) return Fail(state, BRUNSLI_INVALID_BRN);
1236
30.4k
        size_t subsampling_code =
1237
30.4k
            hs.varint_values[kBrunsliHeaderSubsamplingTag];
1238
1239
79.1k
        for (size_t i = 0; i < jpg->components.size(); ++i) {
1240
48.6k
          JPEGComponent* c = &jpg->components[i];
1241
48.6k
          c->v_samp_factor = (subsampling_code & 0xFu) + 1;
1242
48.6k
          subsampling_code >>= 4u;
1243
48.6k
          c->h_samp_factor = (subsampling_code & 0xFu) + 1;
1244
48.6k
          subsampling_code >>= 4u;
1245
48.6k
          if (c->v_samp_factor > kBrunsliMaxSampling) {
1246
2
            return Fail(state, BRUNSLI_INVALID_BRN);
1247
2
          }
1248
48.6k
          if (c->h_samp_factor > kBrunsliMaxSampling) {
1249
2
            return Fail(state, BRUNSLI_INVALID_BRN);
1250
2
          }
1251
48.6k
        }
1252
30.4k
        if (!UpdateSubsamplingDerivatives(jpg)) {
1253
5
          return Fail(state, BRUNSLI_INVALID_BRN);
1254
5
        }
1255
1256
30.4k
        PrepareMeta(jpg, state);
1257
1258
30.4k
        hs.stage = HeaderState::DONE;
1259
30.4k
        break;
1260
30.4k
      }
1261
1262
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
1263
558k
    }
1264
558k
  }
1265
1266
31.0k
  LeaveSection(&s.section);
1267
31.0k
  return (jpg->version == kFallbackVersion) ? Stage::FALLBACK : Stage::SECTION;
1268
202k
}
1269
1270
477k
static BrunsliStatus DecodeMetaDataSection(State* state, JPEGData* jpg) {
1271
477k
  InternalState& s = *state->internal;
1272
477k
  MetadataState& ms = s.metadata;
1273
1274
477k
  if (ms.decompression_stage == MetadataDecompressionStage::DONE) {
1275
0
    return BRUNSLI_INVALID_BRN;
1276
0
  }
1277
1278
477k
  if (ms.decompression_stage == MetadataDecompressionStage::INITIAL) {
1279
7.71k
    if (IsAtSectionBoundary(state)) {
1280
7
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1281
7
      return BRUNSLI_OK;
1282
7
    }
1283
7.70k
    if (RemainingSectionLength(state) == 1) {
1284
142
      if (!CheckCanReadByte(state)) {
1285
45
        return BRUNSLI_NOT_ENOUGH_DATA;
1286
45
      }
1287
97
      uint8_t data[1];
1288
97
      data[0] = ReadByte(state);
1289
97
      bool ok = ProcessMetaData(data, 1, &ms, jpg) && ms.CanFinish();
1290
97
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1291
97
      return ok ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1292
142
    }
1293
7.56k
    ms.decompression_stage =
1294
7.56k
        MetadataDecompressionStage::READ_LENGTH;
1295
7.56k
  }
1296
1297
477k
  if (ms.decompression_stage == MetadataDecompressionStage::READ_LENGTH) {
1298
13.9k
    BrunsliStatus status = DecodeBase128(state, &ms.metadata_size);
1299
13.9k
    if (status != BRUNSLI_OK) return status;
1300
    // TODO(eustas): ms.metadata_size should be limited to avoid "zip-bombs".
1301
7.40k
    if (IsOutOfSectionBounds(state)) return BRUNSLI_INVALID_BRN;
1302
7.39k
    if (RemainingSectionLength(state) == 0) return BRUNSLI_INVALID_BRN;
1303
7.39k
    ms.brotli = BrotliDecoderCreateInstance(nullptr, nullptr, nullptr);
1304
7.39k
    if (ms.brotli == nullptr) return BRUNSLI_DECOMPRESSION_ERROR;
1305
7.39k
    ms.decompression_stage = MetadataDecompressionStage::DECOMPRESSING;
1306
7.39k
  }
1307
1308
470k
  if (ms.decompression_stage == MetadataDecompressionStage::DECOMPRESSING) {
1309
    // Free Brotli decoder and return result
1310
470k
    const auto finish_decompression = [&ms] (BrunsliStatus result) {
1311
3.54k
      BRUNSLI_DCHECK(ms.brotli != nullptr);
1312
3.54k
      BrotliDecoderDestroyInstance(ms.brotli);
1313
3.54k
      ms.brotli = nullptr;
1314
3.54k
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1315
3.54k
      return result;
1316
3.54k
    };
1317
1318
833k
    while (true) {
1319
833k
      size_t available_bytes =
1320
833k
          std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1321
833k
      size_t available_in = available_bytes;
1322
833k
      const uint8_t* next_in = state->data + state->pos;
1323
833k
      size_t available_out = 0;
1324
833k
      BrotliDecoderResult result = BrotliDecoderDecompressStream(
1325
833k
          ms.brotli, &available_in, &next_in, &available_out, nullptr, nullptr);
1326
833k
      if (result == BROTLI_DECODER_RESULT_ERROR) {
1327
1.65k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1328
1.65k
      }
1329
831k
      size_t chunk_size = 0;
1330
831k
      const uint8_t* chunk_data =
1331
831k
          BrotliDecoderTakeOutput(ms.brotli, &chunk_size);
1332
831k
      ms.decompressed_size += chunk_size;
1333
831k
      if (ms.decompressed_size > ms.metadata_size) {
1334
1.25k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1335
1.25k
      }
1336
830k
      size_t consumed_bytes = available_bytes - available_in;
1337
830k
      SkipBytes(state, consumed_bytes);
1338
830k
      bool chunk_ok = ProcessMetaData(chunk_data, chunk_size, &ms, jpg);
1339
830k
      if (!chunk_ok) return finish_decompression(BRUNSLI_INVALID_BRN);
1340
830k
      if (result == BROTLI_DECODER_RESULT_SUCCESS) {
1341
353
        if (RemainingSectionLength(state) != 0) {
1342
218
          return finish_decompression(BRUNSLI_INVALID_BRN);
1343
218
        }
1344
135
        if (ms.decompressed_size != ms.metadata_size) {
1345
128
          return finish_decompression(BRUNSLI_INVALID_BRN);
1346
128
        }
1347
7
        if (!ms.CanFinish()) return finish_decompression(BRUNSLI_INVALID_BRN);
1348
5
        return finish_decompression(BRUNSLI_OK);
1349
7
      }
1350
829k
      if (result == BROTLI_DECODER_RESULT_NEEDS_MORE_OUTPUT) continue;
1351
467k
      BRUNSLI_DCHECK(result == BROTLI_DECODER_RESULT_NEEDS_MORE_INPUT);
1352
467k
      if (RemainingSectionLength(state) == 0) {
1353
48
        return finish_decompression(BRUNSLI_INVALID_BRN);
1354
48
      }
1355
467k
      return BRUNSLI_NOT_ENOUGH_DATA;
1356
467k
    }
1357
470k
  }
1358
1359
  // Unreachable.
1360
0
  BRUNSLI_DCHECK(false);
1361
0
  return BRUNSLI_DECOMPRESSION_ERROR;
1362
470k
}
1363
1364
/**
1365
 * Wraps result, depending on the state of input.
1366
 *
1367
 * If parser needs more data, but section data is depleted,
1368
 * then input is corrupted.
1369
 */
1370
5.21M
static BrunsliStatus CheckBoundary(State* state, BrunsliStatus result) {
1371
5.21M
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
1372
5.12M
    bool last = (RemainingSectionLength(state) <= GetBytesAvailable(state));
1373
5.12M
    return last ? BRUNSLI_INVALID_BRN : BRUNSLI_NOT_ENOUGH_DATA;
1374
5.12M
  } else {
1375
83.7k
    return result;
1376
83.7k
  }
1377
5.21M
}
1378
1379
5.17M
static void PrepareBitReader(BrunsliBitReader* br, State* state) {
1380
5.17M
  size_t chunk_len =
1381
5.17M
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1382
5.17M
  BrunsliBitReaderResume(br, state->data + state->pos, chunk_len);
1383
5.17M
  BRUNSLI_DCHECK(BrunsliBitReaderIsHealthy(br));
1384
5.17M
}
1385
1386
/**
1387
 * Marks data used by bit-reader as consumed.
1388
 */
1389
static BrunsliStatus SuspendBitReader(BrunsliBitReader* br, State* state,
1390
5.17M
                                      BrunsliStatus result) {
1391
5.17M
  size_t chunk_len =
1392
5.17M
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1393
5.17M
  size_t unused_bytes = BrunsliBitReaderSuspend(br);
1394
5.17M
  size_t consumed_bytes = chunk_len - unused_bytes;
1395
5.17M
  SkipBytes(state, consumed_bytes);
1396
5.17M
  result = CheckBoundary(state, result);
1397
  // Once BitReader becomes unhealthy, further decoding should be impossible.
1398
5.17M
  BRUNSLI_DCHECK(
1399
5.17M
      BrunsliBitReaderIsHealthy(br) ||
1400
5.17M
      ((result != BRUNSLI_OK) && (result != BRUNSLI_NOT_ENOUGH_DATA)));
1401
5.17M
  return result;
1402
5.17M
}
1403
1404
5.07M
static BrunsliStatus DecodeJPEGInternalsSection(State* state, JPEGData* jpg) {
1405
5.07M
  InternalState& s = *state->internal;
1406
5.07M
  JpegInternalsState& js = s.internals;
1407
5.07M
  BrunsliBitReader* br = &js.br;
1408
1409
5.07M
  if (js.stage == JpegInternalsState::INIT) {
1410
22.3k
    BrunsliBitReaderInit(br);
1411
22.3k
    js.stage = JpegInternalsState::READ_MARKERS;
1412
22.3k
  }
1413
5.07M
  PrepareBitReader(br, state);
1414
1415
5.07M
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1416
5.07M
    return SuspendBitReader(br, state, result);
1417
5.07M
  };
1418
1419
5.07M
  if (js.stage == JpegInternalsState::READ_MARKERS) {
1420
14.9M
    while (true) {
1421
14.9M
      if (!BrunsliBitReaderCanRead(br, 6)) {
1422
2.67M
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1423
2.67M
      }
1424
12.2M
      uint8_t marker = 0xc0 + BrunsliBitReaderRead(br, 6);
1425
12.2M
      jpg->marker_order.push_back(marker);
1426
12.2M
      if (marker == 0xc4) ++js.dht_count;
1427
12.2M
      if (marker == 0xdd) js.have_dri = true;
1428
12.2M
      if (marker == 0xda) ++js.num_scans;
1429
12.2M
      if (marker == 0xd9) break;
1430
12.2M
    }
1431
21.9k
    js.stage = JpegInternalsState::READ_DRI;
1432
21.9k
  }
1433
1434
2.39M
  if (js.stage == JpegInternalsState::READ_DRI) {
1435
25.3k
    if (js.have_dri) {
1436
6.77k
      if (!BrunsliBitReaderCanRead(br, 16)) {
1437
3.59k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1438
3.59k
      }
1439
3.18k
      jpg->restart_interval = BrunsliBitReaderRead(br, 16);
1440
3.18k
    }
1441
21.7k
    js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
1442
21.7k
  }
1443
1444
2.38M
  if (js.stage & JpegInternalsState::DECODE_HUFFMAN_MASK) {
1445
73.0k
    BrunsliStatus status = DecodeHuffmanCode(state, jpg);
1446
73.0k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1447
21.1k
    js.stage = JpegInternalsState::PREPARE_READ_SCANS;
1448
21.1k
  }
1449
1450
2.33M
  if (js.stage == JpegInternalsState::PREPARE_READ_SCANS) {
1451
21.1k
    if (js.dht_count != js.terminal_huffman_code_count) {
1452
340
      BRUNSLI_LOG_ERROR() << "Invalid number of DHT markers" << BRUNSLI_ENDL();
1453
340
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1454
340
    }
1455
20.8k
    if (js.num_scans > 0) {
1456
10.2k
      jpg->scan_info.resize(js.num_scans);
1457
10.2k
      js.i = 0;
1458
10.2k
      js.stage = JpegInternalsState::READ_SCAN_COMMON;
1459
10.5k
    } else {
1460
10.5k
      js.stage = JpegInternalsState::READ_NUM_QUANT;
1461
10.5k
    }
1462
20.8k
  }
1463
1464
2.33M
  if (js.stage & JpegInternalsState::DECODE_SCAN_MASK) {
1465
1.74M
    BrunsliStatus status = DecodeScanInfo(state, jpg);
1466
1.74M
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1467
9.51k
    js.stage = JpegInternalsState::READ_NUM_QUANT;
1468
9.51k
  }
1469
1470
600k
  if (js.stage == JpegInternalsState::READ_NUM_QUANT) {
1471
21.2k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1472
1.39k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1473
1.39k
    }
1474
19.8k
    int num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1475
19.8k
    jpg->quant.resize(num_quant_tables);
1476
19.8k
    js.i = 0;
1477
19.8k
    js.stage = JpegInternalsState::READ_QUANT;
1478
19.8k
  }
1479
1480
618k
  while (js.stage == JpegInternalsState::READ_QUANT) {
1481
49.4k
    if (js.i >= jpg->quant.size()) {
1482
19.2k
      js.stage = JpegInternalsState::READ_COMP_ID_SCHEME;
1483
19.2k
      break;
1484
19.2k
    }
1485
    // 6 or 7 bits are used, but we know that at least one more bit is
1486
    // guaranteed to be used by varint out of the loop.
1487
30.2k
    if (!BrunsliBitReaderCanRead(br, 7)) {
1488
10.0k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1489
10.0k
    }
1490
20.2k
    JPEGQuantTable* q = &jpg->quant[js.i];
1491
20.2k
    q->index = BrunsliBitReaderRead(br, 2);
1492
20.2k
    q->is_last = (js.i == jpg->quant.size() - 1) || BrunsliBitReaderRead(br, 1);
1493
20.2k
    q->precision = BrunsliBitReaderRead(br, 4);
1494
20.2k
    if (q->precision > 1) {
1495
303
      BRUNSLI_LOG_ERROR() << "Invalid quantization table precision: "
1496
303
                          << q->precision << BRUNSLI_ENDL();
1497
303
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1498
303
    }
1499
    // note that q->values[] are initialized to invalid 0 values.
1500
19.8k
    ++js.i;
1501
19.8k
  }
1502
1503
588k
  if (js.stage == JpegInternalsState::READ_COMP_ID_SCHEME) {
1504
19.2k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1505
233
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1506
233
    }
1507
19.0k
    int comp_ids = BrunsliBitReaderRead(br, 2);
1508
19.0k
    static const size_t kMinRequiredComponents[4] = {
1509
19.0k
        3 /* Ids123*/, 1 /* IdsGray */, 3 /* IdsRGB */, 0 /* IdsCustom */
1510
19.0k
    };
1511
19.0k
    if (jpg->components.size() < kMinRequiredComponents[comp_ids]) {
1512
42
      BRUNSLI_LOG_ERROR() << "Insufficient number of components for ColorId #"
1513
42
                          << comp_ids << BRUNSLI_ENDL();
1514
42
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1515
42
    }
1516
18.9k
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1517
18.9k
    if (comp_ids == kComponentIds123) {
1518
816
      jpg->components[0].id = 1;
1519
816
      jpg->components[1].id = 2;
1520
816
      jpg->components[2].id = 3;
1521
18.1k
    } else if (comp_ids == kComponentIdsGray) {
1522
16.8k
      jpg->components[0].id = 1;
1523
16.8k
    } else if (comp_ids == kComponentIdsRGB) {
1524
148
      jpg->components[0].id = 'R';
1525
148
      jpg->components[1].id = 'G';
1526
148
      jpg->components[2].id = 'B';
1527
1.14k
    } else {
1528
1.14k
      BRUNSLI_DCHECK(comp_ids == kComponentIdsCustom);
1529
1.14k
      js.i = 0;
1530
1.14k
      js.stage = JpegInternalsState::READ_COMP_ID;
1531
1.14k
    }
1532
18.9k
  }
1533
1534
588k
  if (js.stage == JpegInternalsState::READ_COMP_ID) {
1535
2.92k
    while (js.i < jpg->components.size()) {
1536
1.85k
      if (!BrunsliBitReaderCanRead(br, 8)) {
1537
717
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1538
717
      }
1539
1.13k
      jpg->components[js.i].id = BrunsliBitReaderRead(br, 8);
1540
1.13k
      ++js.i;
1541
1.13k
    }
1542
1.07k
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1543
1.07k
  }
1544
1545
587k
  if (js.stage == JpegInternalsState::READ_NUM_PADDING_BITS) {
1546
    // TODO(eustas): sanitize: should not be bigger than
1547
    //               7 x (num_scans + num_blocks / dri)
1548
    // security: limit is 32b for n_size
1549
19.7k
    if (!DecodeLimitedVarint<8>(&js.varint, br, 4)) {
1550
922
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1551
922
    }
1552
18.7k
    js.num_padding_bits = js.varint.value;
1553
18.7k
    jpg->has_zero_padding_bit = (js.num_padding_bits > 0);
1554
18.7k
    if (js.num_padding_bits > PaddingBitsLimit(*jpg)) {
1555
107
      BRUNSLI_LOG_ERROR() << "Suspicious number of padding bits "
1556
107
                          << js.num_padding_bits << BRUNSLI_ENDL();
1557
107
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1558
107
    }
1559
18.6k
    js.i = 0;
1560
18.6k
    js.stage = JpegInternalsState::READ_PADDING_BITS;
1561
18.6k
  }
1562
1563
586k
  if (js.stage == JpegInternalsState::READ_PADDING_BITS) {
1564
6.82M
    while (js.i < js.num_padding_bits) {
1565
6.80M
      if (!BrunsliBitReaderCanRead(br, 1)) {
1566
529k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1567
529k
      }
1568
6.27M
      jpg->padding_bits.emplace_back(BrunsliBitReaderRead(br, 1));
1569
6.27M
      ++js.i;
1570
6.27M
    }
1571
18.5k
    suspend_bit_reader(BRUNSLI_OK);
1572
18.5k
    BrunsliBitReaderFinish(br);
1573
18.5k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1574
18.5k
    js.i = 0;
1575
18.5k
    js.stage = JpegInternalsState::ITERATE_MARKERS;
1576
38.0k
  } else {
1577
    // no-op
1578
38.0k
    suspend_bit_reader(BRUNSLI_OK);
1579
38.0k
  }
1580
1581
443k
  while (true) {
1582
443k
    switch (js.stage) {
1583
318k
      case JpegInternalsState::ITERATE_MARKERS: {
1584
318k
        if (js.i >= jpg->marker_order.size()) {
1585
17.9k
          js.stage = JpegInternalsState::DONE;
1586
300k
        } else if (jpg->marker_order[js.i] == 0xFF) {
1587
34.6k
          js.stage = JpegInternalsState::READ_INTERMARKER_LENGTH;
1588
265k
        } else {
1589
265k
          ++js.i;
1590
265k
        }
1591
318k
        continue;
1592
0
      }
1593
1594
67.9k
      case JpegInternalsState::READ_INTERMARKER_LENGTH: {
1595
67.9k
        BrunsliStatus status = DecodeBase128(state, &js.intermarker_length);
1596
67.9k
        if (status != BRUNSLI_OK) return CheckBoundary(state, status);
1597
34.4k
        if (js.intermarker_length > RemainingSectionLength(state)) {
1598
140
          return BRUNSLI_INVALID_BRN;
1599
140
        }
1600
34.2k
        jpg->inter_marker_data.emplace_back();
1601
34.2k
        js.stage = JpegInternalsState::READ_INTERMARKER_DATA;
1602
34.2k
        continue;
1603
34.4k
      }
1604
1605
39.0k
      case JpegInternalsState::READ_INTERMARKER_DATA: {
1606
39.0k
        auto& dest = jpg->inter_marker_data.back();
1607
39.0k
        size_t piece_limit = js.intermarker_length - dest.size();
1608
39.0k
        size_t piece_size = std::min(piece_limit, GetBytesAvailable(state));
1609
39.0k
        Append(&dest, state->data + state->pos, piece_size);
1610
39.0k
        SkipBytes(state, piece_size);
1611
39.0k
        if (dest.size() < js.intermarker_length) {
1612
4.92k
          BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
1613
4.92k
          BRUNSLI_DCHECK(RemainingSectionLength(state) > 0);
1614
4.92k
          return BRUNSLI_NOT_ENOUGH_DATA;
1615
4.92k
        }
1616
34.1k
        ++js.i;
1617
34.1k
        js.stage = JpegInternalsState::ITERATE_MARKERS;
1618
34.1k
        continue;
1619
39.0k
      }
1620
1621
17.9k
      default: { /* no-op */ }
1622
443k
    }
1623
17.9k
    break;  // no matching stage has been found; exit the loop.
1624
443k
  }
1625
1626
17.9k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1627
1628
17.7k
  return BRUNSLI_OK;
1629
17.9k
}
1630
1631
27.8k
static BrunsliStatus DecodeQuantDataSection(State* state, JPEGData* jpg) {
1632
27.8k
  InternalState& s = *state->internal;
1633
27.8k
  QuantDataState& qs = s.quant;
1634
27.8k
  BrunsliBitReader* br = &qs.br;
1635
1636
27.8k
  if (qs.stage == QuantDataState::INIT) {
1637
14.6k
    BrunsliBitReaderInit(br);
1638
14.6k
    qs.stage = QuantDataState::READ_NUM_QUANT;
1639
14.6k
  }
1640
27.8k
  PrepareBitReader(br, state);
1641
1642
27.8k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1643
27.8k
    return SuspendBitReader(br, state, result);
1644
27.8k
  };
1645
1646
27.8k
  if (qs.stage == QuantDataState::READ_NUM_QUANT) {
1647
22.8k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1648
8.47k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1649
8.47k
    }
1650
14.4k
    size_t num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1651
14.4k
    if (jpg->quant.size() != num_quant_tables) {
1652
183
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1653
183
    }
1654
14.2k
    qs.predictor.resize(kDCTBlockSize);
1655
14.2k
    qs.i = 0;
1656
14.2k
    qs.stage = QuantDataState::READ_STOCK;
1657
14.2k
  }
1658
1659
137k
  while (true) {
1660
137k
    switch (qs.stage) {
1661
26.8k
      case QuantDataState::READ_STOCK: {
1662
26.8k
        if (qs.i >= jpg->quant.size()) {
1663
12.2k
          std::vector<uint8_t>().swap(qs.predictor);
1664
12.2k
          qs.i = 0;
1665
12.2k
          qs.stage = QuantDataState::READ_QUANT_IDX;
1666
12.2k
          continue;
1667
12.2k
        }
1668
        // Depending on еру 1-st bit, it is guaranteed that we will need to read
1669
        // at least 3 or 6 more bits.
1670
14.6k
        if (!BrunsliBitReaderCanRead(br, 4)) {
1671
264
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1672
264
        }
1673
14.3k
        qs.data_precision = 0;
1674
14.3k
        bool is_short = !BrunsliBitReaderRead(br, 1);
1675
14.3k
        if (is_short) {
1676
12.3k
          const size_t short_code = BrunsliBitReaderRead(br, 3);
1677
12.3k
          int32_t* table = jpg->quant[qs.i].values.data();
1678
12.3k
          size_t selector = (qs.i > 0) ? 1 : 0;
1679
805k
          for (size_t k = 0; k < kDCTBlockSize; ++k) {
1680
792k
            table[k] = kStockQuantizationTables[selector][short_code][k];
1681
792k
          }
1682
12.3k
          qs.stage = QuantDataState::UPDATE;
1683
12.3k
        } else {
1684
1.97k
          qs.stage = QuantDataState::READ_Q_FACTOR;
1685
1.97k
        }
1686
14.3k
        continue;
1687
14.6k
      }
1688
1689
2.75k
      case QuantDataState::READ_Q_FACTOR: {
1690
2.75k
        if (!BrunsliBitReaderCanRead(br, 6)) {
1691
1.02k
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1692
1.02k
        }
1693
1.72k
        const uint32_t q_factor = BrunsliBitReaderRead(br, 6);
1694
1.72k
        FillQuantMatrix(qs.i > 0, q_factor, qs.predictor.data());
1695
1.72k
        qs.j = 0;
1696
1.72k
        qs.delta = 0;
1697
1.72k
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1698
1.72k
        continue;
1699
2.75k
      }
1700
1701
35.1k
      case QuantDataState::READ_DIFF_IS_ZERO: {
1702
35.1k
        if (qs.j >= kDCTBlockSize) {
1703
410
          qs.stage = QuantDataState::UPDATE;
1704
410
          continue;
1705
410
        }
1706
34.7k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1707
1.89k
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1708
1.89k
        }
1709
32.8k
        if (BrunsliBitReaderRead(br, 1)) {
1710
6.74k
          qs.stage = QuantDataState::READ_DIFF_SIGN;
1711
26.1k
        } else {
1712
26.1k
          qs.stage = QuantDataState::APPLY_DIFF;
1713
26.1k
        }
1714
32.8k
        continue;
1715
34.7k
      }
1716
1717
6.94k
      case QuantDataState::READ_DIFF_SIGN: {
1718
6.94k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1719
459
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1720
459
        }
1721
6.49k
        qs.sign = BrunsliBitReaderRead(br, 1) ? -1 : 1;
1722
6.49k
        qs.stage = QuantDataState::READ_DIFF;
1723
6.49k
        continue;
1724
6.94k
      }
1725
1726
8.59k
      case QuantDataState::READ_DIFF: {
1727
8.59k
        if (!DecodeVarint(&qs.vs, br, 16)) {
1728
2.39k
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1729
2.39k
        }
1730
6.19k
        int diff = static_cast<int>(qs.vs.value) + 1;
1731
6.19k
        qs.delta += qs.sign * diff;
1732
6.19k
        qs.stage = QuantDataState::APPLY_DIFF;
1733
6.19k
        continue;
1734
8.59k
      }
1735
1736
32.3k
      case QuantDataState::APPLY_DIFF: {
1737
32.3k
        const int k = kJPEGNaturalOrder[qs.j];
1738
32.3k
        const int quant_value = qs.predictor[k] + qs.delta;
1739
32.3k
        jpg->quant[qs.i].values[k] = quant_value;
1740
32.3k
        if (quant_value <= 0) {
1741
244
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1742
244
        }
1743
32.1k
        if (quant_value >= 256) {
1744
16.1k
          qs.data_precision = 1;
1745
16.1k
        }
1746
32.1k
        if (quant_value >= 65536) {
1747
237
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1748
237
        }
1749
31.8k
        ++qs.j;
1750
31.8k
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1751
31.8k
        continue;
1752
32.1k
      }
1753
1754
12.7k
      case QuantDataState::UPDATE: {
1755
12.7k
        if (jpg->quant[qs.i].precision < qs.data_precision) {
1756
211
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1757
211
        }
1758
        // jpg->quant[qs.i].precision > qs.data_precision means that original
1759
        // JPEG1 was inefficiently encoded.
1760
12.5k
        ++qs.i;
1761
12.5k
        qs.stage = QuantDataState::READ_STOCK;
1762
12.5k
        continue;
1763
12.7k
      }
1764
1765
12.4k
      default: { /* no-op */ }
1766
137k
    }
1767
12.4k
    break;  // no matching stage has been found; exit the loop.
1768
137k
  }
1769
1770
37.6k
  while (qs.stage == QuantDataState::READ_QUANT_IDX) {
1771
25.8k
    if (qs.i >= jpg->components.size()) {
1772
11.7k
      qs.stage = QuantDataState::FINISH;
1773
11.7k
      continue;
1774
11.7k
    }
1775
14.0k
    JPEGComponent* c = &jpg->components[qs.i];
1776
14.0k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1777
461
       return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1778
461
    }
1779
13.6k
    c->quant_idx = BrunsliBitReaderRead(br, 2);
1780
13.6k
    if (c->quant_idx >= jpg->quant.size()) {
1781
243
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1782
243
    }
1783
13.3k
    ++qs.i;
1784
13.3k
  }
1785
1786
11.7k
  BRUNSLI_DCHECK(qs.stage == QuantDataState::FINISH);
1787
11.7k
  suspend_bit_reader(BRUNSLI_OK);
1788
11.7k
  BrunsliBitReaderFinish(br);
1789
11.7k
  if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1790
11.7k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1791
11.5k
  return BRUNSLI_OK;
1792
11.7k
}
1793
1794
79.2k
static BrunsliStatus DecodeHistogramDataSection(State* state, JPEGData* jpg) {
1795
79.2k
  InternalState& s = *state->internal;
1796
79.2k
  HistogramDataState& hs = s.histogram;
1797
79.2k
  BrunsliBitReader* br = &hs.br;
1798
1799
79.2k
  if (hs.stage == HistogramDataState::INIT) {
1800
14.6k
    BrunsliBitReaderInit(br);
1801
14.6k
    BRUNSLI_DCHECK(!jpg->components.empty());
1802
14.6k
    s.num_contexts = jpg->components.size();
1803
14.6k
    hs.stage = HistogramDataState::READ_SCHEME;
1804
    /* Optimization: hint arena about maximal used alphabet size: 272.
1805
     * 648 = 272 + 376, where 376 is a "universal" overhead for max-15-bit
1806
     * root-8-bit 2-level Huffman tables. */
1807
14.6k
    hs.arena.reserve(648);
1808
14.6k
  }
1809
79.2k
  PrepareBitReader(br, state);
1810
79.2k
  if (RemainingSectionLength(state) <= GetBytesAvailable(state)) {
1811
    // If end of section is reachable, then we could parse the remainings in
1812
    // non-streaming mode.
1813
12.8k
    BrunsliBitReaderSetOptimistic(br);
1814
12.8k
  }
1815
79.2k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1816
79.2k
    return SuspendBitReader(br, state, result);
1817
79.2k
  };
1818
1819
79.2k
  if (hs.stage == HistogramDataState::READ_SCHEME) {
1820
22.9k
    const size_t num_components = jpg->components.size();
1821
22.9k
    BRUNSLI_DCHECK(num_components <= 4);
1822
22.9k
    if (!BrunsliBitReaderCanRead(br, 3 * num_components)) {
1823
8.47k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1824
8.47k
    }
1825
30.6k
    for (size_t i = 0; i < num_components; ++i) {
1826
16.4k
      size_t scheme = BrunsliBitReaderRead(br, 3);
1827
16.4k
      if (scheme >= kNumSchemes) return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1828
16.2k
      ComponentMeta& m = state->meta[i];
1829
16.2k
      m.context_bits = scheme;
1830
16.2k
      m.context_offset = s.num_contexts;
1831
16.2k
      s.num_contexts += kNumNonzeroContextSkip[scheme];
1832
16.2k
    }
1833
14.2k
    if (!BrunsliBitReaderIsHealthy(br)) {
1834
27
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1835
27
    }
1836
14.2k
    hs.stage = HistogramDataState::READ_NUM_HISTOGRAMS;
1837
14.2k
  }
1838
1839
70.5k
  if (hs.stage == HistogramDataState::READ_NUM_HISTOGRAMS) {
1840
21.5k
    if (!BrunsliBitReaderCanRead(br, 11)) {
1841
7.54k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1842
7.54k
    }
1843
13.9k
    s.num_histograms = DecodeVarLenUint8(br) + 1;
1844
13.9k
    if (!BrunsliBitReaderIsHealthy(br)) {
1845
22
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1846
22
    }
1847
13.9k
    if (s.shallow_histograms) {
1848
0
      hs.stage = HistogramDataState::SKIP_CONTENT;
1849
13.9k
    } else {
1850
13.9k
      s.context_map_.resize(s.num_contexts * kNumAvrgContexts);
1851
13.9k
      state->context_map = s.context_map_.data();
1852
13.9k
      s.entropy_codes_.resize(s.num_histograms);
1853
13.9k
      state->entropy_codes = s.entropy_codes_.data();
1854
13.9k
      if (s.num_histograms > 1) {
1855
2.54k
        hs.stage = HistogramDataState::READ_CONTEXT_MAP_CODE;
1856
11.4k
      } else {
1857
11.4k
        hs.i = 0;
1858
11.4k
        hs.counts.resize(kCoeffAlphabetSize);
1859
11.4k
        hs.stage = HistogramDataState::READ_HISTOGRAMS;
1860
11.4k
      }
1861
13.9k
    }
1862
13.9k
  }
1863
1864
62.9k
  if (hs.stage == HistogramDataState::SKIP_CONTENT) {
1865
0
    suspend_bit_reader(BRUNSLI_OK);
1866
0
    if (!BrunsliBitReaderIsHealthy(br)) {
1867
0
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1868
0
    }
1869
0
    SkipAvailableBytes(state, RemainingSectionLength(state));
1870
0
    if (!IsAtSectionBoundary(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1871
0
    hs.stage = HistogramDataState::DONE;
1872
0
  }
1873
1874
62.9k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP_CODE) {
1875
29.1k
    if (!BrunsliBitReaderCanRead(br, 207 + s.num_histograms * 8)) {
1876
26.8k
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1877
26.8k
    }
1878
2.29k
    hs.max_run_length_prefix = 0;
1879
2.29k
    bool use_rle_for_zeros = !!BrunsliBitReaderRead(br, 1);
1880
2.29k
    if (use_rle_for_zeros) {
1881
885
      hs.max_run_length_prefix = BrunsliBitReaderRead(br, 4) + 1;
1882
885
    }
1883
2.29k
    size_t alphabet_size = s.num_histograms + hs.max_run_length_prefix;
1884
2.29k
    hs.entropy.reset(new HuffmanDecodingData);
1885
2.29k
    if (!hs.entropy->ReadFromBitStream(alphabet_size, br, &hs.arena)) {
1886
653
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1887
653
    }
1888
1.63k
    hs.i = 0;
1889
1.63k
    hs.stage = HistogramDataState::READ_CONTEXT_MAP;
1890
1.63k
  }
1891
1892
35.4k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP) {
1893
7.60k
    BrunsliStatus status = DecodeContextMap(
1894
7.60k
        *hs.entropy, hs.max_run_length_prefix, &hs.i, &s.context_map_, br);
1895
7.60k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1896
1.02k
    hs.i = 0;
1897
1.02k
    hs.counts.resize(kCoeffAlphabetSize);
1898
1.02k
    hs.stage = HistogramDataState::READ_HISTOGRAMS;
1899
1.02k
  }
1900
1901
28.8k
  if (hs.stage == HistogramDataState::READ_HISTOGRAMS) {
1902
52.4k
    while (hs.i < s.num_histograms) {
1903
40.7k
      if (!BrunsliBitReaderCanRead(br, 9 + kCoeffAlphabetSize * 11)) {
1904
16.7k
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1905
16.7k
      }
1906
24.0k
      if (!ReadHistogram(BRUNSLI_ANS_LOG_TAB_SIZE, &hs.counts, br)) {
1907
415
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1908
415
      }
1909
23.5k
      if (!s.entropy_codes_[hs.i].Init(hs.counts)) {
1910
0
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1911
0
      }
1912
23.5k
      ++hs.i;
1913
23.5k
    }
1914
11.7k
    hs.entropy.reset();
1915
11.7k
    std::vector<uint32_t>().swap(hs.counts);
1916
11.7k
    suspend_bit_reader(BRUNSLI_OK);
1917
11.7k
    BrunsliBitReaderFinish(br);
1918
11.7k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1919
11.6k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1920
11.5k
    hs.stage = HistogramDataState::DONE;
1921
11.5k
  }
1922
1923
11.5k
  hs.arena.reset();
1924
11.5k
  BRUNSLI_DCHECK(hs.stage == HistogramDataState::DONE);
1925
11.5k
  return BRUNSLI_OK;
1926
28.8k
}
1927
1928
94.3k
static BrunsliStatus DecodeDCDataSection(State* state) {
1929
94.3k
  size_t available = GetBytesAvailable(state) & ~1;
1930
94.3k
  size_t limit = RemainingSectionLength(state);
1931
94.3k
  BRUNSLI_DCHECK((limit & 1) == 0);
1932
94.3k
  size_t chunk_len = std::min(available, limit);
1933
  // If end of section is reachable, then we could parse the remainings in
1934
  // non-streaming mode.
1935
94.3k
  bool is_last_chunk = (chunk_len == limit);
1936
94.3k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1937
1938
94.3k
  BrunsliStatus status = DecodeDC(state, &in);
1939
1940
94.3k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1941
94.3k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1942
93.8k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1943
93.8k
  SkipBytes(state, in.pos_);
1944
93.8k
  if (is_last_chunk) {
1945
10.5k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1946
10.5k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1947
10.5k
  }
1948
93.8k
  return status;
1949
93.8k
}
1950
1951
168k
static BrunsliStatus DecodeACDataSection(State* state) {
1952
168k
  size_t available = GetBytesAvailable(state) & ~1;
1953
168k
  size_t limit = RemainingSectionLength(state);
1954
168k
  BRUNSLI_DCHECK((limit & 1) == 0);
1955
168k
  size_t chunk_len = std::min(available, limit);
1956
  // If end of section is reachable, then we could parse the remainings in
1957
  // non-streaming mode.
1958
168k
  bool is_last_chunk = (chunk_len == limit);
1959
168k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1960
1961
168k
  BrunsliStatus status = DecodeAC(state, &in);
1962
1963
168k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1964
168k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1965
167k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1966
167k
  SkipBytes(state, in.pos_);
1967
167k
  if (is_last_chunk) {
1968
8.97k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1969
8.97k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1970
8.97k
  }
1971
167k
  return status;
1972
167k
}
1973
1974
2.81k
static Stage DecodeOriginalJpg(State* state, JPEGData* jpg) {
1975
2.81k
  InternalState& s = *state->internal;
1976
2.81k
  FallbackState& fs = s.fallback;
1977
1978
3.99k
  while (fs.stage != FallbackState::DONE) {
1979
3.94k
    switch (fs.stage) {
1980
902
      case FallbackState::READ_TAG: {
1981
902
        BrunsliStatus status = ReadTag(state, &s.section);
1982
902
        if (status != BRUNSLI_OK) return Fail(state, status);
1983
614
        if (s.section.tag != kBrunsliOriginalJpgTag || !s.section.is_section) {
1984
14
          return Fail(state, BRUNSLI_INVALID_BRN);
1985
14
        }
1986
600
        fs.stage = FallbackState::ENTER_SECTION;
1987
600
        break;
1988
614
      }
1989
1990
1.64k
      case FallbackState::ENTER_SECTION: {
1991
1.64k
        BrunsliStatus status = EnterSection(state, &s.section);
1992
1.64k
        if (status != BRUNSLI_OK) return Fail(state, status);
1993
530
        jpg->original_jpg_size = s.section.remaining;
1994
        // Edge case - empty payload.
1995
530
        if (jpg->original_jpg_size == 0) {
1996
6
          jpg->original_jpg = nullptr;
1997
6
          fs.stage = FallbackState::DONE;
1998
6
          break;
1999
6
        }
2000
524
        fs.stage = FallbackState::READ_CONTENTS;
2001
524
        break;
2002
530
      }
2003
2004
1.39k
      case FallbackState::READ_CONTENTS: {
2005
1.39k
        size_t chunk_size = GetBytesAvailable(state);
2006
1.39k
        if (chunk_size == 0) {
2007
          // TODO(eustas): dcheck s.section.remaining != 0
2008
464
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2009
464
        }
2010
        // Check if it is possible to avoid copy.
2011
932
        const uint8_t* src = state->data + state->pos;
2012
932
        if (fs.storage.empty()) {
2013
364
          if (chunk_size >= jpg->original_jpg_size) {
2014
38
            jpg->original_jpg = src;
2015
38
            SkipBytes(state, jpg->original_jpg_size);
2016
38
            fs.stage = FallbackState::DONE;
2017
38
            break;
2018
38
          }
2019
364
        }
2020
        // Otherwise, copy input.
2021
894
        size_t remaining = jpg->original_jpg_size - fs.storage.size();
2022
894
        size_t to_copy = std::min(chunk_size, remaining);
2023
894
        fs.storage.insert(fs.storage.cend(), src, src + to_copy);
2024
894
        SkipBytes(state, to_copy);
2025
894
        if (fs.storage.size() == jpg->original_jpg_size) {
2026
11
          jpg->original_jpg = fs.storage.data();
2027
11
          fs.stage = FallbackState::DONE;
2028
11
          break;
2029
11
        }
2030
        // TODO(eustas): dcheck GetBytesAvailable(state) == 0
2031
883
        return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2032
894
      }
2033
2034
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2035
3.94k
    }
2036
3.94k
  }
2037
2038
55
  LeaveSection(&s.section);
2039
55
  return Stage::DONE;
2040
2.81k
}
2041
2042
187k
static Stage ParseSection(State* state) {
2043
187k
  InternalState& s = *state->internal;
2044
187k
  SectionHeaderState& sh = s.section_header;
2045
2046
187k
  Stage result = Stage::ERROR;
2047
2048
350k
  while (sh.stage != SectionHeaderState::DONE) {
2049
268k
    switch (sh.stage) {
2050
128k
      case SectionHeaderState::READ_TAG: {
2051
128k
        BrunsliStatus status = ReadTag(state, &s.section);
2052
128k
        if (status == BRUNSLI_NOT_ENOUGH_DATA) {
2053
46.8k
          if (HasSection(state, kBrunsliACDataTag)) return Stage::DONE;
2054
46.8k
        }
2055
128k
        if (status != BRUNSLI_OK) return Fail(state, status);
2056
81.7k
        if (s.section.is_section) {
2057
81.6k
          sh.stage = SectionHeaderState::ENTER_SECTION;
2058
81.6k
          continue;
2059
81.6k
        }
2060
92
        const uint32_t tag_bit = 1u << s.section.tag;
2061
92
        const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2062
92
        if (is_known_section_tag) return Fail(state, BRUNSLI_INVALID_BRN);
2063
88
        sh.stage = SectionHeaderState::READ_VALUE;
2064
88
        continue;
2065
92
      }
2066
2067
218
      case SectionHeaderState::READ_VALUE: {
2068
        // No known varint tags on top level.
2069
218
        size_t sink;
2070
218
        BrunsliStatus status = DecodeBase128(state, &sink);
2071
218
        if (status != BRUNSLI_OK) return Fail(state, status);
2072
74
        result = Stage::SECTION;
2073
74
        sh.stage = SectionHeaderState::DONE;
2074
74
        continue;
2075
218
      }
2076
2077
140k
      case SectionHeaderState::ENTER_SECTION: {
2078
140k
        BrunsliStatus status = EnterSection(state, &s.section);
2079
140k
        if (status != BRUNSLI_OK) return Fail(state, status);
2080
81.6k
        result = Stage::SECTION_BODY;
2081
81.6k
        sh.stage = SectionHeaderState::DONE;
2082
81.6k
        continue;
2083
140k
      }
2084
2085
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2086
268k
    }
2087
268k
  }
2088
2089
81.7k
  sh.stage = SectionHeaderState::READ_TAG;
2090
81.7k
  BRUNSLI_DCHECK(result != Stage::ERROR);
2091
81.7k
  return result;
2092
187k
}
2093
2094
5.92M
static Stage ProcessSection(State* state, JPEGData* jpg) {
2095
5.92M
  InternalState& s = *state->internal;
2096
2097
5.92M
  const int32_t tag_bit = 1u << s.section.tag;
2098
5.92M
  const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2099
2100
5.92M
  const bool skip_section =
2101
5.92M
      !is_known_section_tag || (state->skip_tags & tag_bit);
2102
2103
5.92M
  if (skip_section) {
2104
    // Skip section content.
2105
617
    size_t to_skip =
2106
617
        std::min(GetBytesAvailable(state), RemainingSectionLength(state));
2107
617
    state->pos += to_skip;
2108
617
    if (RemainingSectionLength(state) != 0) {
2109
557
      BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
2110
557
      return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2111
557
    }
2112
60
    return Stage::SECTION;
2113
617
  }
2114
2115
5.92M
  switch (s.section.tag) {
2116
477k
    case kBrunsliMetaDataTag: {
2117
477k
      BrunsliStatus status = DecodeMetaDataSection(state, jpg);
2118
477k
      if (status != BRUNSLI_OK) return Fail(state, status);
2119
72
      break;
2120
477k
    }
2121
2122
5.07M
    case kBrunsliJPEGInternalsTag: {
2123
5.07M
      BrunsliStatus status = DecodeJPEGInternalsSection(state, jpg);
2124
5.07M
      if (status != BRUNSLI_OK) return Fail(state, status);
2125
17.7k
      break;
2126
5.07M
    }
2127
2128
27.8k
    case kBrunsliQuantDataTag: {
2129
27.8k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2130
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2131
2
      }
2132
27.8k
      BrunsliStatus status = DecodeQuantDataSection(state, jpg);
2133
27.8k
      if (status != BRUNSLI_OK) return Fail(state, status);
2134
11.5k
      break;
2135
27.8k
    }
2136
2137
79.2k
    case kBrunsliHistogramDataTag: {
2138
79.2k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2139
2
        return Fail(state, BRUNSLI_INVALID_BRN);
2140
2
      }
2141
79.2k
      BrunsliStatus status = DecodeHistogramDataSection(state, jpg);
2142
79.2k
      if (status != BRUNSLI_OK) return Fail(state, status);
2143
11.5k
      break;
2144
79.2k
    }
2145
2146
94.3k
    case kBrunsliDCDataTag: {
2147
94.3k
      if (!HasSection(state, kBrunsliHistogramDataTag)) {
2148
3
        return Fail(state, BRUNSLI_INVALID_BRN);
2149
3
      }
2150
94.3k
      if (!HasSection(state, kBrunsliQuantDataTag)) {
2151
3
        return Fail(state, BRUNSLI_INVALID_BRN);
2152
3
      }
2153
      // This section reads input word by word.
2154
94.3k
      if ((RemainingSectionLength(state) & 1) != 0) {
2155
4
        return Fail(state, BRUNSLI_INVALID_BRN);
2156
4
      }
2157
94.3k
      internal::dec::WarmupMeta(jpg, state);
2158
94.3k
      BrunsliStatus status = DecodeDCDataSection(state);
2159
94.3k
      if (status != BRUNSLI_OK) return Fail(state, status);
2160
10.5k
      break;
2161
94.3k
    }
2162
2163
168k
    case kBrunsliACDataTag: {
2164
168k
      if (!HasSection(state, kBrunsliDCDataTag)) {
2165
3
        return Fail(state, BRUNSLI_INVALID_BRN);
2166
3
      }
2167
      // This section reads input word by word.
2168
168k
      if ((RemainingSectionLength(state) & 1) != 0) {
2169
7
        return Fail(state, BRUNSLI_INVALID_BRN);
2170
7
      }
2171
168k
      internal::dec::WarmupMeta(jpg, state);
2172
168k
      BrunsliStatus status = DecodeACDataSection(state);
2173
168k
      if (status != BRUNSLI_OK) return Fail(state, status);
2174
8.79k
      break;
2175
168k
    }
2176
2177
8.79k
    default:
2178
      /* Unreachable */
2179
0
      return Fail(state, BRUNSLI_INVALID_BRN);
2180
5.92M
  }
2181
2182
60.3k
  if (!IsAtSectionBoundary(state)) {
2183
117
    return Fail(state, BRUNSLI_INVALID_BRN);
2184
117
  }
2185
2186
  // Nothing is expected after the AC data.
2187
60.2k
  if (s.section.tag == kBrunsliACDataTag) {
2188
8.79k
    return Stage::DONE;
2189
8.79k
  }
2190
2191
51.4k
  return Stage::SECTION;
2192
60.2k
}
2193
2194
namespace internal {
2195
namespace dec {
2196
2197
30.4k
bool UpdateSubsamplingDerivatives(JPEGData* jpg) {
2198
79.1k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2199
48.6k
    JPEGComponent* c = &jpg->components[i];
2200
48.6k
    jpg->max_h_samp_factor = std::max(jpg->max_h_samp_factor, c->h_samp_factor);
2201
48.6k
    jpg->max_v_samp_factor = std::max(jpg->max_v_samp_factor, c->v_samp_factor);
2202
48.6k
  }
2203
30.4k
  jpg->MCU_rows = DivCeil(jpg->height, jpg->max_v_samp_factor * 8);
2204
30.4k
  jpg->MCU_cols = DivCeil(jpg->width, jpg->max_h_samp_factor * 8);
2205
79.1k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2206
48.6k
    JPEGComponent* c = &jpg->components[i];
2207
48.6k
    c->width_in_blocks = jpg->MCU_cols * c->h_samp_factor;
2208
48.6k
    c->height_in_blocks = jpg->MCU_rows * c->v_samp_factor;
2209
    // 8205 == max[ceil((65535 / (i * 8)) * i) for i in range(1, 16 + 1)]
2210
48.6k
    BRUNSLI_DCHECK(c->width_in_blocks <= 8205);
2211
48.6k
    BRUNSLI_DCHECK(c->height_in_blocks <= 8205);
2212
48.6k
    uint32_t num_blocks = c->width_in_blocks * c->height_in_blocks;
2213
48.6k
    if (num_blocks > kBrunsliMaxNumBlocks) {
2214
5
      return false;
2215
5
    }
2216
48.6k
    c->num_blocks = num_blocks;
2217
48.6k
  }
2218
30.4k
  return true;
2219
30.4k
}
2220
2221
30.4k
void PrepareMeta(const JPEGData* jpg, State* state) {
2222
30.4k
  InternalState& s = *state->internal;
2223
2224
30.4k
  size_t num_components = jpg->components.size();
2225
30.4k
  s.block_state_.resize(num_components);
2226
30.4k
  std::vector<ComponentMeta>& meta = state->meta;
2227
30.4k
  meta.resize(num_components);
2228
79.1k
  for (size_t i = 0; i < num_components; ++i) {
2229
48.6k
    const JPEGComponent& c = jpg->components[i];
2230
48.6k
    ComponentMeta& m = meta[i];
2231
48.6k
    m.h_samp = c.h_samp_factor;
2232
48.6k
    m.v_samp = c.v_samp_factor;
2233
48.6k
    m.width_in_blocks = jpg->MCU_cols * m.h_samp;
2234
48.6k
    m.height_in_blocks = jpg->MCU_rows * m.v_samp;
2235
48.6k
  }
2236
30.4k
}
2237
2238
263k
void WarmupMeta(JPEGData* jpg, State* state) {
2239
263k
  InternalState& s = *state->internal;
2240
263k
  std::vector<ComponentMeta>& meta = state->meta;
2241
263k
  const size_t num_components = meta.size();
2242
2243
263k
  if (!state->is_storage_allocated) {
2244
11.5k
    state->is_storage_allocated = true;
2245
24.3k
    for (size_t i = 0; i < num_components; ++i) {
2246
12.8k
      size_t num_blocks = meta[i].width_in_blocks * meta[i].height_in_blocks;
2247
12.8k
      jpg->components[i].coeffs.resize(num_blocks * kDCTBlockSize);
2248
12.8k
      s.block_state_[i].resize(num_blocks);
2249
12.8k
      meta[i].block_state = s.block_state_[i].data();
2250
12.8k
    }
2251
11.5k
  }
2252
2253
263k
  if (!s.is_meta_warm) {
2254
11.5k
    s.is_meta_warm = true;
2255
24.3k
    for (size_t c = 0; c < num_components; ++c) {
2256
12.8k
      ComponentMeta& m = meta[c];
2257
12.8k
      const JPEGQuantTable& q = jpg->quant[jpg->components[c].quant_idx];
2258
12.8k
      m.ac_coeffs = jpg->components[c].coeffs.data();
2259
12.8k
      m.ac_stride = m.width_in_blocks * kDCTBlockSize;
2260
12.8k
      m.b_stride = m.width_in_blocks;
2261
12.8k
      memcpy(m.quant.data(), q.values.data(),
2262
12.8k
             kDCTBlockSize * sizeof(m.quant[0]));
2263
12.8k
    }
2264
11.5k
  }
2265
263k
}
2266
2267
6.24M
BrunsliStatus DoProcessJpeg(State* state, JPEGData* jpg) {
2268
12.6M
  while (true) {
2269
12.6M
    switch (state->stage) {
2270
124k
      case Stage::SIGNATURE:
2271
124k
        state->stage = VerifySignature(state);
2272
124k
        break;
2273
2274
202k
      case Stage::HEADER:
2275
202k
        state->stage = DecodeHeader(state, jpg);
2276
202k
        break;
2277
2278
2.81k
      case Stage::FALLBACK:
2279
2.81k
        state->stage = DecodeOriginalJpg(state, jpg);
2280
2.81k
        break;
2281
2282
187k
      case Stage::SECTION:
2283
187k
        state->stage = ParseSection(state);
2284
187k
        break;
2285
2286
5.92M
      case Stage::SECTION_BODY:
2287
5.92M
        state->stage = ProcessSection(state, jpg);
2288
5.92M
        break;
2289
2290
8.84k
      case Stage::DONE:
2291
        // It is expected that there is no garbage after the valid brunsli
2292
        // stream.
2293
8.84k
        if (state->pos != state->len) {
2294
31
          state->stage = Fail(state, BRUNSLI_INVALID_BRN);
2295
31
          break;
2296
31
        }
2297
8.81k
        return BRUNSLI_OK;
2298
2299
6.23M
      case Stage::ERROR:
2300
6.23M
        return state->internal->result;
2301
2302
0
      default:
2303
        /* Unreachable */
2304
0
        state->stage = Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2305
0
        break;
2306
12.6M
    }
2307
12.6M
  }
2308
6.24M
}
2309
2310
/** Adds new input to buffer. */
2311
6.15M
void ChargeBuffer(State* state) {
2312
6.15M
  InternalState& s = *state->internal;
2313
6.15M
  Buffer& b = s.buffer;
2314
2315
6.15M
  b.borrowed_len = 0;
2316
6.15M
  b.external_data = state->data;
2317
6.15M
  b.external_pos = state->pos;
2318
6.15M
  b.external_len = state->len;
2319
6.15M
}
2320
2321
constexpr size_t kBufferMaxReadAhead = 600;
2322
2323
/** Sets input source either to buffered, or to external data. */
2324
6.24M
void LoadInput(State* state) {
2325
6.24M
  InternalState& s = *state->internal;
2326
6.24M
  Buffer& b = s.buffer;
2327
2328
  // No data buffered. Just pass external data as is.
2329
6.24M
  if (b.data_len == 0) {
2330
5.77M
    state->data = b.external_data;
2331
5.77M
    state->pos = b.external_pos;
2332
5.77M
    state->len = b.external_len;
2333
5.77M
    return;
2334
5.77M
  }
2335
2336
468k
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2337
2338
  // Otherwise use buffered data.
2339
468k
  size_t available = b.external_len - b.external_pos;
2340
  // Always try to borrow as much as parser could require. This way, when
2341
  // buffer is unable to provide enough input, we could switch to unbuffered
2342
  // input.
2343
468k
  b.borrowed_len = std::min(kBufferMaxReadAhead, available);
2344
468k
  memcpy(b.data.data() + b.data_len, b.external_data + b.external_pos,
2345
468k
         b.borrowed_len);
2346
468k
  state->data = b.data.data();
2347
468k
  state->pos = 0;
2348
468k
  state->len = b.data_len + b.borrowed_len;
2349
468k
}
2350
2351
/**
2352
 * Cancel borrowed bytes, if any.
2353
 *
2354
 * Returns false, if it is impossible to continue parsing.
2355
 */
2356
6.24M
bool UnloadInput(State* state, BrunsliStatus result) {
2357
6.24M
  InternalState& s = *state->internal;
2358
6.24M
  Buffer& b = s.buffer;
2359
2360
  // Non-buffered input; put tail to buffer.
2361
6.24M
  if (state->data == b.external_data) {
2362
5.77M
    b.external_pos = state->pos;
2363
5.77M
    BRUNSLI_DCHECK(b.external_pos <= b.external_len);
2364
5.77M
    if (result != BRUNSLI_NOT_ENOUGH_DATA) return true;
2365
5.75M
    BRUNSLI_DCHECK(b.data_len == 0);
2366
5.75M
    size_t available = b.external_len - b.external_pos;
2367
5.75M
    BRUNSLI_DCHECK(available < kBufferMaxReadAhead);
2368
5.75M
    if (b.data.empty()) b.data.resize(2 * kBufferMaxReadAhead);
2369
5.75M
    b.data_len = available;
2370
5.75M
    memcpy(b.data.data(), b.external_data + b.external_pos, b.data_len);
2371
5.75M
    b.external_pos += available;
2372
5.75M
    return false;
2373
5.77M
  }
2374
2375
  // Buffer depleted; switch to non-buffered input.
2376
468k
  if (state->pos >= b.data_len) {
2377
89.9k
    size_t used_borrowed_bytes = state->pos - b.data_len;
2378
89.9k
    b.data_len = 0;
2379
89.9k
    b.external_pos += used_borrowed_bytes;
2380
89.9k
    return true;
2381
89.9k
  }
2382
2383
  // Buffer not depleted; either problem discovered was already buffered data,
2384
  // or extra input was too-short.
2385
378k
  b.data_len -= state->pos;
2386
378k
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
2387
    // We couldn't have taken more bytes.
2388
377k
    BRUNSLI_DCHECK(b.external_pos + b.borrowed_len == b.external_len);
2389
    // Remaining piece is not too large.
2390
377k
    BRUNSLI_DCHECK(b.data_len + b.borrowed_len < kBufferMaxReadAhead);
2391
377k
    b.data_len += b.borrowed_len;
2392
377k
    b.external_pos += b.borrowed_len;
2393
377k
  }
2394
378k
  BRUNSLI_DCHECK(!b.data.empty());
2395
378k
  if (state->pos > 0 && b.data_len > 0) {
2396
11.0k
    memmove(b.data.data(), b.data.data() + state->pos, b.data_len);
2397
11.0k
  }
2398
378k
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2399
2400
378k
  return (result != BRUNSLI_NOT_ENOUGH_DATA);
2401
468k
}
2402
2403
/** Sets back user-provided input. */
2404
6.15M
void UnchargeBuffer(State* state) {
2405
6.15M
  InternalState& s = *state->internal;
2406
6.15M
  Buffer& b = s.buffer;
2407
2408
6.15M
  state->data = b.external_data;
2409
6.15M
  state->pos = b.external_pos;
2410
6.15M
  state->len = b.external_len;
2411
6.15M
}
2412
2413
6.15M
BrunsliStatus ProcessJpeg(State* state, JPEGData* jpg) {
2414
6.15M
  InternalState& s = *state->internal;
2415
2416
6.15M
  if (state->pos > state->len) return BRUNSLI_INVALID_PARAM;
2417
6.15M
  ChargeBuffer(state);
2418
2419
6.15M
  BrunsliStatus result = BRUNSLI_NOT_ENOUGH_DATA;
2420
6.26M
  while (result == BRUNSLI_NOT_ENOUGH_DATA) {
2421
6.24M
    if (state->stage == Stage::ERROR) {
2422
      // General error -> no recovery.
2423
6.20M
      if (s.result != BRUNSLI_NOT_ENOUGH_DATA) return s.result;
2424
      // Continue parsing.
2425
6.20M
      s.result = BRUNSLI_OK;
2426
6.20M
      state->stage = s.last_stage;
2427
6.20M
      s.last_stage = Stage::ERROR;
2428
6.20M
    }
2429
2430
6.24M
    LoadInput(state);
2431
6.24M
    if (s.section.is_active) {
2432
6.03M
      s.section.milestone = state->pos;
2433
6.03M
      s.section.projected_end = s.section.milestone + s.section.remaining;
2434
6.03M
    }
2435
2436
6.24M
    s.section.tags_met |= state->tags_met;
2437
6.24M
    result = DoProcessJpeg(state, jpg);
2438
2439
6.24M
    if (s.section.is_active) {
2440
      // TODO(eustas): dcheck state->pos > s.section.milestone
2441
6.06M
      size_t processed_len = state->pos - s.section.milestone;
2442
      // TODO(eustas): dcheck processed_len < s.section.remaining
2443
6.06M
      s.section.remaining -= processed_len;
2444
6.06M
    }
2445
2446
6.24M
    if (!UnloadInput(state, result)) break;
2447
6.24M
  }
2448
6.15M
  UnchargeBuffer(state);
2449
6.15M
  return result;
2450
6.15M
}
2451
2452
}  // namespace dec
2453
}  // namespace internal
2454
2455
BrunsliStatus BrunsliDecodeJpeg(const uint8_t* data, const size_t len,
2456
17.0k
                                JPEGData* jpg) {
2457
17.0k
  if (!data) return BRUNSLI_INVALID_PARAM;
2458
2459
17.0k
  State state;
2460
17.0k
  state.data = data;
2461
17.0k
  state.len = len;
2462
2463
17.0k
  return internal::dec::ProcessJpeg(&state, jpg);
2464
17.0k
}
2465
2466
size_t BrunsliEstimateDecoderPeakMemoryUsage(const uint8_t* data,
2467
0
                                             const size_t len) {
2468
0
  if (!data) return BRUNSLI_INVALID_PARAM;
2469
2470
0
  State state;
2471
0
  state.data = data;
2472
0
  state.len = len;
2473
0
  state.skip_tags = ~(1u << kBrunsliHistogramDataTag);
2474
0
  InternalState& s = *state.internal;
2475
0
  s.shallow_histograms = true;
2476
2477
0
  JPEGData jpg;
2478
0
  BrunsliStatus status = internal::dec::ProcessJpeg(&state, &jpg);
2479
2480
0
  if (status != BRUNSLI_OK) return 0;
2481
2482
0
  size_t out_size = 2 * len;
2483
0
  size_t total_num_blocks = 0;
2484
0
  size_t component_state_size = 0;
2485
0
  for (size_t i = 0; i < jpg.components.size(); ++i) {
2486
0
    const JPEGComponent& c = jpg.components[i];
2487
0
    total_num_blocks += c.num_blocks;
2488
0
    component_state_size += ComponentState::SizeInBytes(c.width_in_blocks);
2489
0
  }
2490
0
  size_t jpeg_data_size = total_num_blocks * kDCTBlockSize * sizeof(coeff_t);
2491
0
  size_t context_map_size = s.num_contexts * kNumAvrgContexts * sizeof(int32_t);
2492
0
  size_t histogram_size = s.num_histograms * sizeof(ANSDecodingData);
2493
0
  size_t decode_peak = context_map_size + histogram_size + component_state_size;
2494
0
  size_t jpeg_writer_size = (1u << 17u) + (1u << 16u) * sizeof(int32_t);
2495
0
  return (out_size + jpeg_data_size + std::max(decode_peak, jpeg_writer_size));
2496
0
}
2497
2498
0
BrunsliDecoder::BrunsliDecoder() {
2499
0
  jpg_.reset(new JPEGData);
2500
0
  state_.reset(new State);
2501
0
}
2502
2503
0
BrunsliDecoder::~BrunsliDecoder() {}
2504
2505
BrunsliDecoder::Status BrunsliDecoder::Decode(size_t* available_in,
2506
                                              const uint8_t** next_in,
2507
                                              size_t* available_out,
2508
0
                                              uint8_t** next_out) {
2509
0
  JPEGData* jpg = jpg_.get();
2510
0
  BRUNSLI_DCHECK(jpg);
2511
0
  State* state = state_.get();
2512
0
  BRUNSLI_DCHECK(state);
2513
2514
0
  state->data = *next_in;
2515
0
  state->pos = 0;
2516
0
  state->len = *available_in;
2517
0
  BrunsliStatus parse_status = internal::dec::ProcessJpeg(state, jpg);
2518
0
  size_t consumed_bytes = state->pos;
2519
0
  *available_in -= consumed_bytes;
2520
0
  *next_in += consumed_bytes;
2521
2522
0
  if ((parse_status != BRUNSLI_OK) &&
2523
0
      (parse_status != BRUNSLI_NOT_ENOUGH_DATA)) {
2524
0
    return BrunsliDecoder::ERROR;
2525
0
  }
2526
2527
  // All the input given input should be consumed.
2528
0
  BRUNSLI_DCHECK(*available_in == 0);
2529
2530
0
  SerializationStatus serialization_status =
2531
0
      SerializeJpeg(state, *jpg, available_out, next_out);
2532
0
  if (serialization_status == SerializationStatus::ERROR) {
2533
0
    return BrunsliDecoder::ERROR;
2534
0
  }
2535
2536
0
  switch (serialization_status) {
2537
0
    case SerializationStatus::DONE:
2538
      // Should be impossible to finish serialization without finishing parsing.
2539
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_OK);
2540
0
      return BrunsliDecoder::DONE;
2541
2542
0
    case SerializationStatus::NEEDS_MORE_INPUT:
2543
      // If serializer says that data is incomplete, parser should say the same.
2544
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_NOT_ENOUGH_DATA);
2545
0
      return BrunsliDecoder::NEEDS_MORE_INPUT;
2546
2547
0
    case SerializationStatus::NEEDS_MORE_OUTPUT:
2548
      // TODO(eustas): make sure that serializer could produce more bytes
2549
      //               without providing more bytes to parser
2550
0
      BRUNSLI_DCHECK(*available_out == 0);
2551
0
      return BrunsliDecoder::NEEDS_MORE_OUTPUT;
2552
2553
0
    case SerializationStatus::ERROR:
2554
0
      return BrunsliDecoder::ERROR;
2555
2556
0
    default:
2557
      /* Unreachable */
2558
0
      BRUNSLI_DCHECK(false);
2559
0
      return BrunsliDecoder::ERROR;
2560
0
  }
2561
0
}
2562
2563
}  // namespace brunsli