Coverage Report

Created: 2025-11-11 06:34

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/brunsli/c/dec/brunsli_decode.cc
Line
Count
Source
1
// Copyright (c) Google LLC 2019
2
//
3
// Use of this source code is governed by an MIT-style
4
// license that can be found in the LICENSE file or at
5
// https://opensource.org/licenses/MIT.
6
7
#include <brunsli/brunsli_decode.h>
8
9
#include <algorithm>
10
#include <cstdlib>
11
#include <cstring>
12
#include <iterator>
13
#include <string>
14
#include <vector>
15
16
#include <brotli/decode.h>
17
#include "../common/constants.h"
18
#include "../common/context.h"
19
#include <brunsli/jpeg_data.h>
20
#include "../common/lehmer_code.h"
21
#include "../common/platform.h"
22
#include "../common/predict.h"
23
#include "../common/quant_matrix.h"
24
#include <brunsli/status.h>
25
#include <brunsli/types.h>
26
#include "./ans_decode.h"
27
#include "./arith_decode.h"
28
#include "./bit_reader.h"
29
#include "./brunsli_input.h"
30
#include "./context_map_decode.h"
31
#include "./histogram_decode.h"
32
#include "./huffman_table.h"
33
#include <brunsli/jpeg_data_writer.h>
34
#include "./state.h"
35
#include "./state_internal.h"
36
37
namespace brunsli {
38
39
using ::brunsli::internal::dec::AcDcState;
40
using ::brunsli::internal::dec::BlockI32;
41
using ::brunsli::internal::dec::Buffer;
42
using ::brunsli::internal::dec::ComponentMeta;
43
using ::brunsli::internal::dec::FallbackState;
44
using ::brunsli::internal::dec::HeaderState;
45
using ::brunsli::internal::dec::HistogramDataState;
46
using ::brunsli::internal::dec::InternalState;
47
using ::brunsli::internal::dec::JpegInternalsState;
48
using ::brunsli::internal::dec::MetadataDecompressionStage;
49
using ::brunsli::internal::dec::MetadataState;
50
using ::brunsli::internal::dec::PrepareMeta;
51
using ::brunsli::internal::dec::QuantDataState;
52
using ::brunsli::internal::dec::SectionHeaderState;
53
using ::brunsli::internal::dec::SectionState;
54
using ::brunsli::internal::dec::SerializationStatus;
55
using ::brunsli::internal::dec::Stage;
56
using ::brunsli::internal::dec::State;
57
using ::brunsli::internal::dec::UpdateSubsamplingDerivatives;
58
using ::brunsli::internal::dec::VarintState;
59
60
static const int kNumDirectCodes = 8;
61
static const int kCoeffAlphabetSize = kNumDirectCodes + 10;
62
63
static const uint32_t kKnownSectionTags =
64
    (1u << kBrunsliSignatureTag) | (1u << kBrunsliHeaderTag) |
65
    (1u << kBrunsliMetaDataTag) | (1u << kBrunsliJPEGInternalsTag) |
66
    (1u << kBrunsliQuantDataTag) | (1u << kBrunsliHistogramDataTag) |
67
    (1u << kBrunsliDCDataTag) | (1u << kBrunsliACDataTag) |
68
    (1u << kBrunsliOriginalJpgTag);
69
70
static const uint32_t kKnownHeaderVarintTags =
71
    (1u << kBrunsliHeaderWidthTag) | (1u << kBrunsliHeaderHeightTag) |
72
    (1u << kBrunsliHeaderVersionCompTag) | (1u << kBrunsliHeaderSubsamplingTag);
73
74
0
bool IsBrunsli(const uint8_t* data, const size_t len) {
75
0
  static const uint8_t kSignature[6] = {
76
0
      /* marker */ 0x0A,
77
0
      /* length */ 0x04, 0x42, 0xD2, 0xD5, 0x4E};
78
0
  static const size_t kSignatureLen = sizeof(kSignature);
79
0
  if (len < kSignatureLen) return false;
80
0
  return (memcmp(kSignature, data, kSignatureLen) == 0);
81
0
}
82
83
// Returns ceil(a/b).
84
31.4k
inline int DivCeil(int a, int b) { return (a + b - 1) / b; }
85
86
// Decodes a number in the range [0..255], by reading 1 - 11 bits.
87
7.11k
inline uint32_t DecodeVarLenUint8(BrunsliBitReader* br) {
88
7.11k
  if (BrunsliBitReaderRead(br, 1)) {
89
1.23k
    uint32_t nbits = BrunsliBitReaderRead(br, 3);
90
1.23k
    if (nbits == 0) {
91
587
      return 1u;
92
645
    } else {
93
645
      return BrunsliBitReaderRead(br, nbits) + (1u << nbits);
94
645
    }
95
1.23k
  }
96
5.88k
  return 0;
97
7.11k
}
98
99
99.8k
bool DecodeVarint(VarintState* s, BrunsliBitReader* br, size_t max_bits) {
100
99.8k
  if (s->stage == VarintState::INIT) {
101
99.8k
    s->value = 0;
102
99.8k
    s->i = 0;
103
99.8k
    s->stage = VarintState::READ_CONTINUATION;
104
99.8k
  }
105
106
317k
  while (true) {
107
317k
    switch (s->stage) {
108
208k
      case VarintState::READ_CONTINUATION: {
109
208k
        if (s->i >= max_bits) {
110
736
          s->stage = VarintState::INIT;
111
736
          return true;
112
736
        }
113
207k
        if (s->i + 1 != max_bits) {
114
207k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
115
206k
          if (!BrunsliBitReaderRead(br, 1)) {
116
98.9k
            s->stage = VarintState::INIT;
117
98.9k
            return true;
118
98.9k
          }
119
206k
        }
120
108k
        s->stage = VarintState::READ_DATA;
121
108k
        continue;
122
207k
      }
123
108k
      case VarintState::READ_DATA: {
124
108k
        if (!BrunsliBitReaderCanRead(br, 1)) return false;
125
108k
        size_t next_bit = BrunsliBitReaderRead(br, 1);
126
108k
        s->value |= next_bit << s->i;
127
108k
        ++s->i;
128
108k
        s->stage = VarintState::READ_CONTINUATION;
129
108k
        continue;
130
108k
      }
131
0
      default: {
132
0
        BRUNSLI_CHECK(false);
133
0
        return false;
134
108k
      }
135
317k
    }
136
317k
  }
137
99.8k
}
138
139
template <size_t kChunkSize>
140
bool DecodeLimitedVarint(VarintState* s, BrunsliBitReader* br,
141
102k
                         size_t max_symbols) {
142
102k
  if (s->stage == VarintState::INIT) {
143
102k
    s->value = 0;
144
102k
    s->i = 0;
145
102k
    s->stage = VarintState::READ_CONTINUATION;
146
102k
  }
147
142k
  while (true) {
148
142k
    switch (s->stage) {
149
122k
      case VarintState::READ_CONTINUATION: {
150
122k
        if (s->i < max_symbols) {
151
120k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
120k
          if (BrunsliBitReaderRead(br, 1)) {
153
20.4k
            s->stage = VarintState::READ_DATA;
154
20.4k
            continue;
155
20.4k
          }
156
120k
        }
157
101k
        s->stage = VarintState::INIT;
158
101k
        return true;
159
122k
      }
160
20.4k
      case VarintState::READ_DATA: {
161
20.4k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
20.3k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
20.3k
        s->value |= next_bits << (s->i * kChunkSize);
164
20.3k
        ++s->i;
165
20.3k
        s->stage = VarintState::READ_CONTINUATION;
166
20.3k
        continue;
167
20.4k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
20.4k
      }
172
142k
    }
173
142k
  }
174
102k
}
bool brunsli::DecodeLimitedVarint<2ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
92.4k
                         size_t max_symbols) {
142
92.4k
  if (s->stage == VarintState::INIT) {
143
92.4k
    s->value = 0;
144
92.4k
    s->i = 0;
145
92.4k
    s->stage = VarintState::READ_CONTINUATION;
146
92.4k
  }
147
131k
  while (true) {
148
131k
    switch (s->stage) {
149
112k
      case VarintState::READ_CONTINUATION: {
150
112k
        if (s->i < max_symbols) {
151
109k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
109k
          if (BrunsliBitReaderRead(br, 1)) {
153
19.6k
            s->stage = VarintState::READ_DATA;
154
19.6k
            continue;
155
19.6k
          }
156
109k
        }
157
92.3k
        s->stage = VarintState::INIT;
158
92.3k
        return true;
159
112k
      }
160
19.6k
      case VarintState::READ_DATA: {
161
19.6k
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
19.6k
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
19.6k
        s->value |= next_bits << (s->i * kChunkSize);
164
19.6k
        ++s->i;
165
19.6k
        s->stage = VarintState::READ_CONTINUATION;
166
19.6k
        continue;
167
19.6k
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
19.6k
      }
172
131k
    }
173
131k
  }
174
92.4k
}
bool brunsli::DecodeLimitedVarint<8ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long)
Line
Count
Source
141
9.69k
                         size_t max_symbols) {
142
9.69k
  if (s->stage == VarintState::INIT) {
143
9.69k
    s->value = 0;
144
9.69k
    s->i = 0;
145
9.69k
    s->stage = VarintState::READ_CONTINUATION;
146
9.69k
  }
147
11.1k
  while (true) {
148
11.1k
    switch (s->stage) {
149
10.3k
      case VarintState::READ_CONTINUATION: {
150
10.3k
        if (s->i < max_symbols) {
151
10.3k
          if (!BrunsliBitReaderCanRead(br, 1)) return false;
152
10.3k
          if (BrunsliBitReaderRead(br, 1)) {
153
746
            s->stage = VarintState::READ_DATA;
154
746
            continue;
155
746
          }
156
10.3k
        }
157
9.60k
        s->stage = VarintState::INIT;
158
9.60k
        return true;
159
10.3k
      }
160
746
      case VarintState::READ_DATA: {
161
746
        if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false;
162
700
        size_t next_bits = BrunsliBitReaderRead(br, kChunkSize);
163
700
        s->value |= next_bits << (s->i * kChunkSize);
164
700
        ++s->i;
165
700
        s->stage = VarintState::READ_CONTINUATION;
166
700
        continue;
167
746
      }
168
0
      default: {
169
0
        BRUNSLI_CHECK(false);
170
0
        return false;
171
746
      }
172
11.1k
    }
173
11.1k
  }
174
9.69k
}
175
176
11.9k
std::vector<uint8_t> GenerateApp0Marker(uint8_t app0_status) {
177
11.9k
  std::vector<uint8_t> app0_marker(AppData_0xe0, AppData_0xe0 + 17);
178
11.9k
  app0_marker[9] = app0_status & 1u ? 2 : 1;
179
11.9k
  app0_status >>= 1u;
180
11.9k
  app0_marker[10] = app0_status & 0x3u;
181
11.9k
  app0_status >>= 2u;
182
11.9k
  uint16_t x_dens = kApp0Densities[app0_status];
183
11.9k
  app0_marker[11] = app0_marker[13] = x_dens >> 8u;
184
11.9k
  app0_marker[12] = app0_marker[14] = x_dens & 0xFFu;
185
11.9k
  return app0_marker;
186
11.9k
}
187
188
4.05k
std::vector<uint8_t> GenerateAppMarker(uint8_t marker, uint8_t code) {
189
4.05k
  std::vector<uint8_t> s;
190
4.05k
  if (marker == 0x80) {
191
2.88k
    s = std::vector<uint8_t>(AppData_0xe2, AppData_0xe2 + 3161);
192
2.88k
    s[84] = code;
193
2.88k
  } else if (marker == 0x81) {
194
756
    s = std::vector<uint8_t>(AppData_0xec, AppData_0xec + 18);
195
756
    s[15] = code;
196
756
  } else {
197
409
    BRUNSLI_DCHECK(marker == 0x82);
198
409
    s = std::vector<uint8_t>(AppData_0xee, AppData_0xee + 15);
199
409
    s[10] = code;
200
409
  }
201
4.05k
  return s;
202
4.05k
}
203
204
bool ProcessMetaData(const uint8_t* data, size_t len, MetadataState* state,
205
151k
                     JPEGData* jpg) {
206
151k
  size_t pos = 0;
207
395k
  while (pos < len) {
208
244k
    switch (state->stage) {
209
35.6k
      case MetadataState::READ_MARKER: {
210
35.6k
        state->marker = static_cast<uint8_t>(data[pos++]);
211
35.6k
        if (state->marker == 0xD9) {
212
151
          jpg->tail_data = std::vector<uint8_t>();
213
151
          state->stage = MetadataState::READ_TAIL;
214
151
          continue;
215
35.4k
        } else if (state->marker < 0x40) {
216
11.9k
          state->short_marker_count++;
217
11.9k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
218
9
            return false;
219
9
          }
220
11.9k
          jpg->app_data.push_back(GenerateApp0Marker(state->marker));
221
11.9k
          continue;
222
23.4k
        } else if (state->marker >= 0x80 && state->marker <= 0x82) {
223
4.07k
          state->short_marker_count++;
224
4.07k
          if (state->short_marker_count > kBrunsliShortMarkerLimit) {
225
1
            return false;
226
1
          }
227
4.07k
          state->stage = MetadataState::READ_CODE;
228
4.07k
          continue;
229
4.07k
        }
230
        // Otherwise - mutlibyte sequence.
231
19.4k
        if ((state->marker != 0xFE) && ((state->marker >> 4u) != 0x0E)) {
232
142
          return false;
233
142
        }
234
19.2k
        state->stage = MetadataState::READ_LENGTH_HI;
235
19.2k
        continue;
236
19.4k
      }
237
238
31.3k
      case MetadataState::READ_TAIL: {
239
31.3k
        Append(&jpg->tail_data, data + pos, data + len);
240
31.3k
        pos = len;
241
31.3k
        continue;
242
19.4k
      }
243
244
4.05k
      case MetadataState::READ_CODE: {
245
4.05k
        const uint8_t code = data[pos++];
246
4.05k
        jpg->app_data.push_back(GenerateAppMarker(state->marker, code));
247
4.05k
        state->stage = MetadataState::READ_MARKER;
248
4.05k
        continue;
249
19.4k
      }
250
251
19.2k
      case MetadataState::READ_LENGTH_HI: {
252
19.2k
        state->length_hi = data[pos++];
253
19.2k
        state->stage = MetadataState::READ_LENGTH_LO;
254
19.2k
        continue;
255
19.4k
      }
256
257
19.2k
      case MetadataState::READ_LENGTH_LO: {
258
19.2k
        const uint8_t lo = data[pos++];
259
19.2k
        size_t marker_len = (state->length_hi << 8u) + lo;
260
19.2k
        if (marker_len < 2) return false;
261
19.2k
        state->remaining_multibyte_length = marker_len - 2;
262
19.2k
        uint8_t head[3] = {state->marker, state->length_hi, lo};
263
19.2k
        auto* dest = (state->marker == 0xFE) ? &jpg->com_data : &jpg->app_data;
264
19.2k
        size_t delta = (state->marker == 0xFE) ? 0 : state->short_marker_count;
265
19.2k
        if (dest->size() - delta >= kBrunsliMultibyteMarkerLimit) {
266
2
          return false;
267
2
        }
268
19.2k
        dest->emplace_back(head, head + 3);
269
19.2k
        state->multibyte_sink = &dest->back();
270
        // Turn state machine to default state in case there is no payload in
271
        // multibyte sequence. This is important when such a sequence concludes
272
        // the input.
273
19.2k
        state->stage = (state->remaining_multibyte_length > 0)
274
19.2k
                           ? MetadataState::READ_MULTIBYTE
275
19.2k
                           : MetadataState::READ_MARKER;
276
19.2k
        continue;
277
19.2k
      }
278
279
134k
      case MetadataState::READ_MULTIBYTE: {
280
134k
        size_t chunk_size =
281
134k
            std::min(state->remaining_multibyte_length, len - pos);
282
134k
        Append(state->multibyte_sink, data + pos, chunk_size);
283
134k
        state->remaining_multibyte_length -= chunk_size;
284
134k
        pos += chunk_size;
285
134k
        if (state->remaining_multibyte_length == 0) {
286
17.6k
          state->stage = MetadataState::READ_MARKER;
287
17.6k
        }
288
134k
        continue;
289
19.2k
      }
290
291
0
      default: return false;
292
244k
    }
293
244k
  }
294
151k
  return true;
295
151k
}
296
297
11.1k
static BrunsliStatus DecodeHuffmanCode(State* state, JPEGData* jpg) {
298
11.1k
  InternalState& s = *state->internal;
299
11.1k
  JpegInternalsState& js = s.internals;
300
11.1k
  BrunsliBitReader* br = &js.br;
301
302
238k
  while (true) {
303
238k
    switch (js.stage) {
304
26.3k
      case JpegInternalsState::READ_HUFFMAN_LAST: {
305
26.3k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
306
26.3k
        js.is_known_last_huffman_code = BrunsliBitReaderRead(br, 1);
307
26.3k
        jpg->huffman_code.emplace_back();
308
26.3k
        js.stage = JpegInternalsState::READ_HUFFMAN_SIMPLE;
309
26.3k
        continue;
310
26.3k
      }
311
26.3k
      case JpegInternalsState::READ_HUFFMAN_SIMPLE: {
312
26.3k
        if (!BrunsliBitReaderCanRead(br, 5 + !js.is_known_last_huffman_code)) {
313
174
          return BRUNSLI_NOT_ENOUGH_DATA;
314
174
        }
315
26.1k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
316
317
26.1k
        huff->slot_id = BrunsliBitReaderRead(br, 2);
318
26.1k
        js.is_dc_table = (BrunsliBitReaderRead(br, 1) == 0);
319
26.1k
        huff->slot_id += js.is_dc_table ? 0 : 0x10;
320
26.1k
        huff->is_last =
321
26.1k
            js.is_known_last_huffman_code || BrunsliBitReaderRead(br, 1);
322
26.1k
        huff->counts[0] = 0;
323
26.1k
        int found_match = BrunsliBitReaderRead(br, 1);
324
26.1k
        if (found_match) {
325
16.1k
          if (js.is_dc_table) {
326
8.31k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
327
8.31k
            memcpy(&huff->counts[1], kStockDCHuffmanCodeCounts[huff_table_idx],
328
8.31k
                   sizeof(kStockDCHuffmanCodeCounts[0]));
329
8.31k
            memcpy(&huff->values[0], kStockDCHuffmanCodeValues[huff_table_idx],
330
8.31k
                   sizeof(kStockDCHuffmanCodeValues[0]));
331
8.31k
          } else {
332
7.84k
            int huff_table_idx = BrunsliBitReaderRead(br, 1);
333
7.84k
            memcpy(&huff->counts[1], kStockACHuffmanCodeCounts[huff_table_idx],
334
7.84k
                   sizeof(kStockACHuffmanCodeCounts[0]));
335
7.84k
            memcpy(&huff->values[0], kStockACHuffmanCodeValues[huff_table_idx],
336
7.84k
                   sizeof(kStockACHuffmanCodeValues[0]));
337
7.84k
          }
338
16.1k
          js.stage = JpegInternalsState::HUFFMAN_UPDATE;
339
16.1k
        } else {
340
          // One less bit is used than requested, but it is guaranteed to be
341
          // consumed in complex Huffman code case.
342
10.0k
          js.p.Init(js.is_dc_table
343
10.0k
                        ? std::vector<uint8_t>(kDefaultDCValues,
344
7.10k
                                               std::end(kDefaultDCValues))
345
10.0k
                        : std::vector<uint8_t>(kDefaultACValues,
346
2.90k
                                               std::end(kDefaultACValues)));
347
10.0k
          js.stage = JpegInternalsState::READ_HUFFMAN_MAX_LEN;
348
10.0k
        }
349
26.1k
        continue;
350
26.3k
      }
351
10.0k
      case JpegInternalsState::READ_HUFFMAN_MAX_LEN: {
352
10.0k
        if (!BrunsliBitReaderCanRead(br, 4)) return BRUNSLI_NOT_ENOUGH_DATA;
353
9.97k
        js.max_len = BrunsliBitReaderRead(br, 4) + 1;
354
9.97k
        js.total_count = 0;
355
9.97k
        js.max_count =
356
9.97k
            js.is_dc_table ? kJpegDCAlphabetSize : kJpegHuffmanAlphabetSize;
357
9.97k
        js.space = (1u << kJpegHuffmanMaxBitLength) -
358
9.97k
                   (1u << (kJpegHuffmanMaxBitLength - js.max_len));
359
9.97k
        js.i = 1;
360
9.97k
        js.stage = JpegInternalsState::READ_HUFFMAN_COUNT;
361
9.97k
        continue;
362
10.0k
      }
363
47.6k
      case JpegInternalsState::READ_HUFFMAN_COUNT: {
364
47.6k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
365
47.6k
        if (js.i <= js.max_len) {
366
37.7k
          size_t shift = kJpegHuffmanMaxBitLength - js.i;
367
37.7k
          size_t count_limit =
368
37.7k
              std::min(js.max_count - js.total_count, js.space >> shift);
369
37.7k
          if (count_limit > 0) {
370
35.8k
            int nbits =
371
35.8k
                Log2FloorNonZero(static_cast<uint32_t>(count_limit)) + 1;
372
35.8k
            if (!BrunsliBitReaderCanRead(br, nbits)) {
373
46
              return BRUNSLI_NOT_ENOUGH_DATA;
374
46
            }
375
35.7k
            size_t count = BrunsliBitReaderRead(br, nbits);
376
35.7k
            if (count > count_limit) {
377
7
              return BRUNSLI_INVALID_BRN;
378
7
            }
379
35.7k
            huff->counts[js.i] = static_cast<int>(count);
380
35.7k
            js.total_count += count;
381
35.7k
            js.space -= count * (static_cast<size_t>(1) << shift);
382
35.7k
          }
383
37.7k
          ++js.i;
384
37.7k
          continue;
385
37.7k
        }
386
9.91k
        ++huff->counts[js.max_len];
387
9.91k
        js.i = 0;
388
9.91k
        js.stage = JpegInternalsState::READ_HUFFMAN_PERMUTATION;
389
9.91k
        continue;
390
47.6k
      }
391
102k
      case JpegInternalsState::READ_HUFFMAN_PERMUTATION: {
392
102k
        JPEGHuffmanCode* huff = &jpg->huffman_code.back();
393
102k
        if (js.i < js.total_count) {
394
92.4k
          const int nbits = js.p.num_bits();
395
92.4k
          if (!DecodeLimitedVarint<2>(&js.varint, br, (nbits + 1) >> 1u)) {
396
60
            return BRUNSLI_NOT_ENOUGH_DATA;
397
60
          }
398
92.3k
          uint8_t value;
399
92.3k
          if (!js.p.Remove(js.varint.value, &value)) {
400
12
            return BRUNSLI_INVALID_BRN;
401
12
          }
402
92.3k
          huff->values[js.i] = value;
403
92.3k
          ++js.i;
404
92.3k
          continue;
405
92.3k
        }
406
9.84k
        huff->values[js.total_count] = kJpegHuffmanAlphabetSize;
407
9.84k
        js.stage = JpegInternalsState::HUFFMAN_UPDATE;
408
9.84k
        continue;
409
102k
      }
410
26.0k
      case JpegInternalsState::HUFFMAN_UPDATE: {
411
        // This stage does not perform reading -> transient.
412
26.0k
        if (jpg->huffman_code.back().is_last) {
413
12.9k
          js.terminal_huffman_code_count++;
414
12.9k
        }
415
26.0k
        if (js.is_known_last_huffman_code) {
416
10.7k
          js.p.Clear();
417
10.7k
          return BRUNSLI_OK;
418
10.7k
        }
419
15.2k
        if (jpg->huffman_code.size() >= kMaxDHTMarkers) {
420
          // Too many Huffman codes for a valid bit-stream. Normally, a jpeg
421
          // file can have any arbitrary number of DHT, DQT, etc. But i prefer
422
          // we force a reasonable lower bound instead of open door to likely
423
          // forged BRN input.
424
1
          return BRUNSLI_INVALID_BRN;
425
1
        }
426
15.2k
        js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
427
15.2k
        continue;
428
15.2k
      }
429
0
      default:
430
0
        return BRUNSLI_DECOMPRESSION_ERROR;
431
238k
    }
432
238k
  }
433
0
  return BRUNSLI_OK;
434
11.1k
}
435
436
5.00k
BrunsliStatus DecodeScanInfo(State* state, JPEGData* jpg) {
437
5.00k
  InternalState& s = *state->internal;
438
5.00k
  JpegInternalsState& js = s.internals;
439
5.00k
  BrunsliBitReader* br = &js.br;
440
441
25.5k
  const auto maybe_add_zero_run = [&js, jpg] () {
442
25.5k
    if (js.last_num > 0) {
443
18.9k
      JPEGScanInfo::ExtraZeroRunInfo info;
444
18.9k
      info.block_idx = js.last_block_idx;
445
18.9k
      info.num_extra_zero_runs = js.last_num;
446
18.9k
      jpg->scan_info[js.i].extra_zero_runs.push_back(info);
447
18.9k
      js.last_num = 0;
448
18.9k
    }
449
25.5k
  };
450
451
250k
  while (true) {
452
250k
    switch (js.stage) {
453
9.10k
      case JpegInternalsState::READ_SCAN_COMMON: {
454
9.10k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
455
9.10k
        if (!BrunsliBitReaderCanRead(br, 22)) return BRUNSLI_NOT_ENOUGH_DATA;
456
8.94k
        si->Ss = BrunsliBitReaderRead(br, 6);
457
8.94k
        si->Se = BrunsliBitReaderRead(br, 6);
458
8.94k
        si->Ah = BrunsliBitReaderRead(br, 4);
459
8.94k
        si->Al = BrunsliBitReaderRead(br, 4);
460
8.94k
        si->num_components = BrunsliBitReaderRead(br, 2) + 1;
461
8.94k
        js.j = 0;
462
8.94k
        js.stage = JpegInternalsState::READ_SCAN_COMPONENT;
463
8.94k
        continue;
464
9.10k
      }
465
29.6k
      case JpegInternalsState::READ_SCAN_COMPONENT: {
466
29.6k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
467
29.6k
        if (js.j < si->num_components) {
468
20.7k
          if (!BrunsliBitReaderCanRead(br, 6)) return BRUNSLI_NOT_ENOUGH_DATA;
469
20.6k
          si->components[js.j].comp_idx = BrunsliBitReaderRead(br, 2);
470
20.6k
          si->components[js.j].dc_tbl_idx = BrunsliBitReaderRead(br, 2);
471
20.6k
          si->components[js.j].ac_tbl_idx = BrunsliBitReaderRead(br, 2);
472
20.6k
          js.j++;
473
20.6k
        } else {
474
8.91k
          js.last_block_idx = -1;
475
8.91k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
476
8.91k
        }
477
29.6k
        continue;
478
29.6k
      }
479
66.2k
      case JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION: {
480
66.2k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
481
66.2k
        if (BrunsliBitReaderRead(br, 1)) {
482
57.4k
          js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_DATA;
483
57.4k
        } else {
484
8.83k
          js.last_block_idx = 0;
485
8.83k
          js.last_num = 0;
486
8.83k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
487
8.83k
        }
488
66.2k
        continue;
489
66.2k
      }
490
57.4k
      case JpegInternalsState::READ_SCAN_RESET_POINT_DATA: {
491
57.4k
        JPEGScanInfo* si = &jpg->scan_info[js.i];
492
57.4k
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
493
57.3k
        int block_idx =
494
57.3k
            js.last_block_idx + static_cast<int>(js.varint.value) + 1;
495
57.3k
        si->reset_points.emplace_back(block_idx);
496
57.3k
        js.last_block_idx = block_idx;
497
        // TODO(eustas): limit to exact number of blocks.
498
57.3k
        if (js.last_block_idx > (1 << 30)) {
499
          // At most 8K x 8K x num_channels blocks are expected. That is,
500
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
501
          // image.
502
1
          return BRUNSLI_INVALID_BRN;
503
1
        }
504
57.3k
        js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION;
505
57.3k
        continue;
506
57.3k
      }
507
48.5k
      case JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION: {
508
48.5k
        if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA;
509
48.5k
        if (BrunsliBitReaderRead(br, 1)) {
510
39.7k
          js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_DATA;
511
39.7k
        } else {
512
8.79k
          maybe_add_zero_run();
513
8.79k
          ++js.i;
514
8.79k
          if (js.i < js.num_scans) {
515
4.09k
            js.stage = JpegInternalsState::READ_SCAN_COMMON;
516
4.09k
            continue;
517
4.09k
          }
518
4.69k
          return BRUNSLI_OK;
519
8.79k
        }
520
39.7k
        continue;
521
48.5k
      }
522
39.7k
      case JpegInternalsState::READ_SCAN_ZERO_RUN_DATA: {
523
39.7k
        if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA;
524
39.7k
        int block_idx = js.last_block_idx + static_cast<int>(js.varint.value);
525
39.7k
        if (block_idx > js.last_block_idx) maybe_add_zero_run();
526
39.7k
        ++js.last_num;
527
39.7k
        js.last_block_idx = block_idx;
528
        // TODO(eustas): limit to exact number of blocks.
529
39.7k
        if (js.last_block_idx > (1 << 30)) {
530
          // At most 8K x 8K x num_channels blocks are expected. That is,
531
          // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane
532
          // image.
533
2
          return BRUNSLI_INVALID_BRN;
534
2
        }
535
39.7k
        js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION;
536
39.7k
        continue;
537
39.7k
      }
538
0
      default: return BRUNSLI_DECOMPRESSION_ERROR;
539
250k
    }
540
250k
  }
541
5.00k
}
542
543
static bool BRUNSLI_NOINLINE DecodeCoeffOrder(uint32_t* order, BitSource* br,
544
5.63k
                                              WordSource* in) {
545
5.63k
  uint32_t lehmer[kDCTBlockSize] = {0};
546
5.63k
  static const int kSpan = 16;
547
28.1k
  for (int i = 0; i < kDCTBlockSize; i += kSpan) {
548
22.5k
    if (!br->ReadBits(1, in)) continue;  // span is all-zero
549
2.59k
    const int start = (i > 0) ? i : 1;
550
2.59k
    const int end = i + kSpan;
551
42.2k
    for (int j = start; j < end; ++j) {
552
39.6k
      uint32_t v = 0;
553
50.9k
      while (v <= kDCTBlockSize) {
554
50.9k
        const uint32_t bits = br->ReadBits(3, in);
555
50.9k
        v += bits;
556
50.9k
        if (bits < 7) break;
557
50.9k
      }
558
39.6k
      if (v > kDCTBlockSize) return false;
559
39.6k
      lehmer[j] = v;
560
39.6k
    }
561
2.59k
  }
562
5.62k
  int end = kDCTBlockSize - 1;
563
328k
  while (end >= 1 && lehmer[end] == 0) {
564
322k
    --end;
565
322k
  }
566
5.62k
  if (lehmer[end] == 1) return false;
567
29.9k
  for (int i = 1; i <= end; ++i) {
568
24.5k
    if (lehmer[i] == 0) return false;
569
24.3k
    --lehmer[i];
570
24.3k
  }
571
5.40k
  if (!DecodeLehmerCode(lehmer, kDCTBlockSize, order)) return false;
572
350k
  for (int k = 0; k < kDCTBlockSize; ++k) {
573
344k
    order[k] = kJPEGNaturalOrder[order[k]];
574
344k
  }
575
5.38k
  return true;
576
5.40k
}
577
578
/** Reads 0..6 words from |in| and returns the value in the range 0..63. */
579
static size_t DecodeNumNonzeros(Prob* p, BinaryArithmeticDecoder* ac,
580
1.84M
                                WordSource* in) {
581
  // To simplity BST navigation, we use 1-based indexing.
582
1.84M
  Prob* bst = p - 1;
583
1.84M
  size_t ctx = 1;
584
585
12.8M
  for (size_t b = 0; b < kNumNonZeroBits; ++b) {
586
11.0M
    const int bit = ac->ReadBit(bst[ctx].get_proba(), in);
587
11.0M
    bst[ctx].Add(bit);
588
11.0M
    ctx = 2 * ctx + bit;
589
11.0M
  }
590
591
  // Leaf index in the level corresponds to the resuling value.
592
1.84M
  size_t val = ctx - (1u << kNumNonZeroBits);
593
1.84M
  BRUNSLI_DCHECK(val <= kNumNonZeroTreeSize);
594
1.84M
  return val;
595
1.84M
}
596
597
10.9k
void EnsureSubdecodersInitialized(State* state, WordSource* in) {
598
10.9k
  InternalState& s = *state->internal;
599
10.9k
  if (!s.subdecoders_initialized) {
600
10.9k
    s.ans_decoder.Init(in);
601
10.9k
    s.bit_reader.Init(in);
602
10.9k
    s.arith_decoder.Init(in);
603
10.9k
    s.subdecoders_initialized = true;
604
10.9k
  }
605
10.9k
}
606
607
10.5k
bool FinalizeSubdecoders(State* state) {
608
10.5k
  InternalState& s = *state->internal;
609
10.5k
  if (!s.ans_decoder.CheckCRC()) return false;
610
9.79k
  if (!s.bit_reader.Finish()) return false;
611
9.76k
  s.subdecoders_initialized = false;
612
9.76k
  return true;
613
9.79k
}
614
615
5.88k
BrunsliStatus DecodeDC(State* state, WordSource* in) {
616
5.88k
  const std::vector<ComponentMeta>& meta = state->meta;
617
5.88k
  const size_t num_components = meta.size();
618
5.88k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
619
5.88k
  InternalState& s = *state->internal;
620
5.88k
  AcDcState& ac_dc_state = s.ac_dc;
621
622
5.88k
  std::vector<ComponentStateDC>& comps = ac_dc_state.dc;
623
5.88k
  if (comps.empty()) {
624
5.88k
    comps.resize(num_components);
625
12.4k
    for (size_t c = 0; c < num_components; ++c) {
626
6.51k
      comps[c].SetWidth(meta[c].width_in_blocks);
627
6.51k
    }
628
5.88k
  }
629
630
5.88k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
631
5.76k
  EnsureSubdecodersInitialized(state, in);
632
5.76k
  ANSDecoder ans = s.ans_decoder;
633
5.76k
  BitSource br = s.bit_reader;
634
5.76k
  BinaryArithmeticDecoder ac = s.arith_decoder;
635
636
  // We decode DC components in the following interleaved manner:
637
  //   v_samp[0] rows from component 0
638
  //   v_samp[1] rows from component 1
639
  //   v_samp[2] rows from component 2
640
  //   v_samp[3] rows from component 3 (if present)
641
  //
642
  // E.g. in a YUV420 image, we decode 2 rows of DC components from Y and then
643
  // 1 row of DC components from U and 1 row of DC components from V.
644
123k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
645
238k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
646
120k
      ComponentStateDC* c = &comps[i];
647
120k
      const ComponentMeta& m = meta[i];
648
120k
      const uint8_t* context_map = state->context_map + i * kNumAvrgContexts;
649
120k
      const int ac_stride = static_cast<int>(m.ac_stride);
650
120k
      const size_t b_stride = m.b_stride;
651
120k
      const int width = m.width_in_blocks;
652
120k
      int y = mcu_y * m.v_samp + ac_dc_state.next_iy;
653
120k
      int* const prev_sgn = &c->prev_sign[1];
654
120k
      int* const prev_abs = &c->prev_abs_coeff[2];
655
488k
      for (int iy = ac_dc_state.next_iy; iy < m.v_samp; ++iy, ++y) {
656
367k
        coeff_t* coeffs =
657
367k
            m.ac_coeffs + y * ac_stride + ac_dc_state.next_x * kDCTBlockSize;
658
367k
        uint8_t* block_state =
659
367k
            m.block_state + y * b_stride + ac_dc_state.next_x;
660
48.3M
        for (int x = ac_dc_state.next_x; x < width; ++x) {
661
48.0M
          if (BRUNSLI_PREDICT_FALSE(!in->CanRead(6))) {
662
97
            ac_dc_state.next_mcu_y = mcu_y;
663
97
            ac_dc_state.next_component = i;
664
97
            ac_dc_state.next_iy = iy;
665
97
            ac_dc_state.next_x = x;
666
97
            s.ans_decoder = ans;
667
97
            s.bit_reader = br;
668
97
            s.arith_decoder = ac;
669
97
            return BRUNSLI_NOT_ENOUGH_DATA;
670
97
          }
671
48.0M
          const int is_empty_ctx =
672
48.0M
              IsEmptyBlockContext(&c->prev_is_nonempty[1], x);
673
48.0M
          Prob* BRUNSLI_RESTRICT is_empty_p =
674
48.0M
              &c->is_empty_block_prob[is_empty_ctx];
675
48.0M
          const bool is_empty_block = !ac.ReadBit(is_empty_p->get_proba(), in);
676
48.0M
          is_empty_p->Add(!is_empty_block);
677
48.0M
          c->prev_is_nonempty[x + 1] = !is_empty_block;
678
48.0M
          *block_state = is_empty_block;
679
48.0M
          int abs_val = 0;
680
48.0M
          int sign = 0;
681
48.0M
          if (!is_empty_block) {
682
12.2M
            Prob* BRUNSLI_RESTRICT p_is_zero = &c->is_zero_prob;
683
12.2M
            int is_zero = ac.ReadBit(p_is_zero->get_proba(), in);
684
12.2M
            p_is_zero->Add(is_zero);
685
12.2M
            if (!is_zero) {
686
4.09M
              const int avg_ctx = WeightedAverageContextDC(prev_abs, x);
687
4.09M
              const int sign_ctx = prev_sgn[x] * 3 + prev_sgn[x - 1];
688
4.09M
              Prob* BRUNSLI_RESTRICT sign_p = &c->sign_prob[sign_ctx];
689
4.09M
              sign = ac.ReadBit(sign_p->get_proba(), in);
690
4.09M
              sign_p->Add(sign);
691
4.09M
              const int entropy_ix = context_map[avg_ctx];
692
4.09M
              int code = ans.ReadSymbol(state->entropy_codes[entropy_ix], in);
693
4.09M
              if (code < kNumDirectCodes) {
694
600k
                abs_val = code + 1;
695
3.49M
              } else {
696
3.49M
                int nbits = code - kNumDirectCodes;
697
3.49M
                Prob* BRUNSLI_RESTRICT p_first_extra_bit =
698
3.49M
                    &c->first_extra_bit_prob[nbits];
699
3.49M
                int first_extra_bit =
700
3.49M
                    ac.ReadBit(p_first_extra_bit->get_proba(), in);
701
3.49M
                p_first_extra_bit->Add(first_extra_bit);
702
3.49M
                int extra_bits_val = first_extra_bit << nbits;
703
3.49M
                if (nbits > 0) {
704
3.38M
                  extra_bits_val |= static_cast<int>(br.ReadBits(nbits, in));
705
3.38M
                }
706
3.49M
                abs_val = kNumDirectCodes - 1 + (2 << nbits) + extra_bits_val;
707
3.49M
              }
708
4.09M
            }
709
12.2M
          }
710
48.0M
          prev_abs[x] = abs_val;
711
48.0M
          prev_sgn[x] = abs_val ? sign + 1 : 0;
712
48.0M
          coeffs[0] = ((1 - 2 * sign) * abs_val +
713
48.0M
                       PredictWithAdaptiveMedian(coeffs, x, y, ac_stride));
714
48.0M
          block_state++;
715
48.0M
          coeffs += kDCTBlockSize;
716
48.0M
        }
717
367k
        ac_dc_state.next_x = 0;
718
367k
      }
719
120k
      ac_dc_state.next_iy = 0;
720
120k
    }
721
117k
    ac_dc_state.next_component = 0;
722
117k
  }
723
724
  // Prepare for AC decoding.
725
5.66k
  ac_dc_state.next_mcu_y = 0;
726
5.66k
  ac_dc_state.next_component = 0;
727
5.66k
  ac_dc_state.next_iy = 0;
728
5.66k
  ac_dc_state.next_x = 0;
729
730
5.66k
  comps.clear();
731
5.66k
  comps.shrink_to_fit();
732
733
5.66k
  s.ans_decoder = ans;
734
5.66k
  s.bit_reader = br;
735
5.66k
  s.arith_decoder = ac;
736
5.66k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
737
738
5.36k
  return BRUNSLI_OK;
739
5.66k
}
740
741
static void BRUNSLI_NOINLINE DecodeEmptyAcBlock(
742
9.46M
    int* BRUNSLI_RESTRICT prev_sgn, int* BRUNSLI_RESTRICT prev_abs) {
743
605M
  for (int k = 1; k < kDCTBlockSize; ++k) {
744
596M
    prev_sgn[k] = 0;
745
596M
    prev_abs[k] = 0;
746
596M
  }
747
9.46M
}
748
749
/** All the necessary things for decoding AC block. */
750
struct AcBlockCookie {
751
  int x;
752
  int y;
753
  uint8_t* BRUNSLI_RESTRICT prev_num_nonzeros;
754
  int* BRUNSLI_RESTRICT prev_sgn;
755
  int* BRUNSLI_RESTRICT prev_abs;
756
  Prob* BRUNSLI_RESTRICT num_nonzero_prob;
757
758
  BinaryArithmeticDecoder* BRUNSLI_RESTRICT ac;
759
  WordSource* BRUNSLI_RESTRICT in;
760
  ANSDecoder* BRUNSLI_RESTRICT ans;
761
  BitSource* BRUNSLI_RESTRICT br;
762
763
  coeff_t* BRUNSLI_RESTRICT coeffs;
764
  const coeff_t* BRUNSLI_RESTRICT prev_row_coeffs;
765
  const coeff_t* BRUNSLI_RESTRICT prev_col_coeffs;
766
  Prob* BRUNSLI_RESTRICT is_zero_prob;
767
  const uint32_t* BRUNSLI_RESTRICT order;
768
  const uint8_t* BRUNSLI_RESTRICT context_modes;
769
  const int* BRUNSLI_RESTRICT mult_col;
770
  const int* BRUNSLI_RESTRICT mult_row;
771
  int prev_row_delta;
772
  Prob* BRUNSLI_RESTRICT sign_prob;
773
  size_t context_bits;
774
  const uint8_t* BRUNSLI_RESTRICT context_map;
775
  const ANSDecodingData* BRUNSLI_RESTRICT entropy_codes;
776
  Prob* BRUNSLI_RESTRICT first_extra_bit_prob;
777
};
778
779
1.84M
static size_t BRUNSLI_NOINLINE DecodeAcBlock(const AcBlockCookie& cookie) {
780
1.84M
  AcBlockCookie c = cookie;
781
782
1.84M
  BinaryArithmeticDecoder ac = *c.ac;
783
1.84M
  WordSource* in = c.in;
784
1.84M
  ANSDecoder ans = *c.ans;
785
1.84M
  BitSource br = *c.br;
786
787
1.84M
  size_t num_nonzeros = 0;
788
789
1.84M
  const uint8_t nonzero_ctx = NumNonzerosContext(c.prev_num_nonzeros, c.x, c.y);
790
1.84M
  size_t last_nz = DecodeNumNonzeros(
791
1.84M
      c.num_nonzero_prob + kNumNonZeroTreeSize * nonzero_ctx, &ac, in);
792
94.1M
  for (size_t k = last_nz + 1; k < kDCTBlockSize; ++k) {
793
92.2M
    c.prev_sgn[k] = 0;
794
92.2M
    c.prev_abs[k] = 0;
795
92.2M
  }
796
25.5M
  for (size_t k = last_nz; k > 0; --k) {
797
23.7M
    int is_zero = 0;
798
23.7M
    if (k < last_nz) {
799
22.9M
      size_t bucket = kNonzeroBuckets[num_nonzeros - 1];
800
22.9M
      size_t is_zero_ctx = bucket * kDCTBlockSize + k;
801
22.9M
      Prob& p = c.is_zero_prob[is_zero_ctx];
802
22.9M
      is_zero = ac.ReadBit(p.get_proba(), in);
803
22.9M
      p.Add(is_zero);
804
22.9M
    }
805
23.7M
    int abs_val = 0;
806
23.7M
    int sign = 1;
807
23.7M
    const int k_nat = c.order[k];
808
23.7M
    if (!is_zero) {
809
6.90M
      size_t context_type = c.context_modes[k_nat];
810
6.90M
      size_t avg_ctx = 0;
811
6.90M
      size_t sign_ctx = kMaxAverageContext;
812
6.90M
      if ((context_type & 1) && (c.y > 0)) {
813
1.43M
        size_t offset = k_nat & 7;
814
1.43M
        ACPredictContextRow(c.prev_row_coeffs + offset, c.coeffs + offset,
815
1.43M
                            c.mult_col + offset * 8, &avg_ctx, &sign_ctx);
816
5.46M
      } else if ((context_type & 2) && (c.x > 0)) {
817
1.58M
        size_t offset = k_nat & ~7;
818
1.58M
        ACPredictContextCol(c.prev_col_coeffs + offset, c.coeffs + offset,
819
1.58M
                            c.mult_row + offset, &avg_ctx, &sign_ctx);
820
3.88M
      } else if (!context_type) {
821
3.78M
        avg_ctx = WeightedAverageContext(c.prev_abs + k, c.prev_row_delta);
822
3.78M
        sign_ctx =
823
3.78M
            c.prev_sgn[k] * 3 + c.prev_sgn[static_cast<int>(k) - kDCTBlockSize];
824
3.78M
      }
825
6.90M
      sign_ctx = sign_ctx * kDCTBlockSize + k;
826
6.90M
      Prob& sign_p = c.sign_prob[sign_ctx];
827
6.90M
      sign = ac.ReadBit(sign_p.get_proba(), in);
828
6.90M
      sign_p.Add(sign);
829
6.90M
      c.prev_sgn[k] = sign + 1;
830
6.90M
      sign = 1 - 2 * sign;
831
6.90M
      const size_t z_dens_ctx =
832
6.90M
          ZeroDensityContext(num_nonzeros, k, c.context_bits);
833
6.90M
      size_t histo_ix = z_dens_ctx * kNumAvrgContexts + avg_ctx;
834
6.90M
      size_t entropy_ix = c.context_map[histo_ix];
835
6.90M
      int code = ans.ReadSymbol(c.entropy_codes[entropy_ix], in);
836
6.90M
      if (code < kNumDirectCodes) {
837
3.44M
        abs_val = code + 1;
838
3.45M
      } else {
839
3.45M
        int nbits = code - kNumDirectCodes;
840
3.45M
        Prob& p = c.first_extra_bit_prob[k * 10 + nbits];
841
3.45M
        int first_extra_bit = ac.ReadBit(p.get_proba(), in);
842
3.45M
        p.Add(first_extra_bit);
843
3.45M
        int extra_bits_val = first_extra_bit << nbits;
844
3.45M
        if (nbits > 0) {
845
2.82M
          extra_bits_val |= br.ReadBits(nbits, in);
846
2.82M
        }
847
3.45M
        abs_val = kNumDirectCodes - 1 + (2u << nbits) + extra_bits_val;
848
3.45M
      }
849
6.90M
      ++num_nonzeros;
850
16.8M
    } else {
851
16.8M
      c.prev_sgn[k] = 0;
852
16.8M
    }
853
23.7M
    int coeff = sign * abs_val;
854
23.7M
    c.coeffs[k_nat] = coeff;
855
23.7M
    c.prev_abs[k] = abs_val;
856
23.7M
  }
857
858
1.84M
  *c.ans = ans;
859
1.84M
  *c.br = br;
860
1.84M
  *c.ac = ac;
861
862
1.84M
  return num_nonzeros;
863
1.84M
}
864
865
5.28k
BrunsliStatus DecodeAC(State* state, WordSource* in) {
866
5.28k
  const std::vector<ComponentMeta>& meta = state->meta;
867
5.28k
  const size_t num_components = meta.size();
868
5.28k
  const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp;
869
5.28k
  InternalState& s = *state->internal;
870
5.28k
  AcDcState& ac_dc_state = s.ac_dc;
871
872
5.28k
  std::vector<ComponentState>& comps = ac_dc_state.ac;
873
5.28k
  if (comps.empty()) {
874
5.28k
    comps.resize(num_components);
875
11.1k
    for (size_t c = 0; c < num_components; ++c) {
876
5.83k
      comps[c].SetWidth(meta[c].width_in_blocks);
877
5.83k
      ComputeACPredictMultipliers(&meta[c].quant[0], comps[c].mult_row,
878
5.83k
                                  comps[c].mult_col);
879
5.83k
    }
880
5.28k
  }
881
882
5.28k
  if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA;
883
5.18k
  EnsureSubdecodersInitialized(state, in);
884
885
5.18k
  if (!ac_dc_state.ac_coeffs_order_decoded) {
886
10.5k
    while (ac_dc_state.next_component < num_components) {
887
5.63k
      if (!in->CanRead(121)) return BRUNSLI_NOT_ENOUGH_DATA;
888
5.63k
      if (!DecodeCoeffOrder(comps[ac_dc_state.next_component].order,
889
5.63k
                            &s.bit_reader, in)) {
890
248
        return BRUNSLI_INVALID_BRN;
891
248
      }
892
5.38k
      ac_dc_state.next_component++;
893
5.38k
    }
894
4.93k
    ac_dc_state.next_component = 0;
895
4.93k
    ac_dc_state.ac_coeffs_order_decoded = true;
896
4.93k
  }
897
898
4.93k
  AcBlockCookie c;
899
4.93k
  c.ac = &s.arith_decoder;
900
4.93k
  c.in = in;
901
4.93k
  c.ans = &s.ans_decoder;
902
4.93k
  c.br = &s.bit_reader;
903
4.93k
  c.entropy_codes = state->entropy_codes;
904
4.93k
  c.context_modes =
905
4.93k
      kContextAlgorithm + (state->use_legacy_context_model ? 64 : 0);
906
907
97.0k
  for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) {
908
184k
    for (size_t i = ac_dc_state.next_component; i < num_components; ++i) {
909
92.4k
      ComponentState& cst = comps[i];
910
92.4k
      c.prev_num_nonzeros = cst.prev_num_nonzeros.data();
911
92.4k
      c.num_nonzero_prob = cst.num_nonzero_prob;
912
92.4k
      c.is_zero_prob = cst.is_zero_prob.data();
913
92.4k
      c.order = cst.order;
914
92.4k
      c.mult_col = cst.mult_col;
915
92.4k
      c.mult_row = cst.mult_row;
916
92.4k
      c.sign_prob = cst.sign_prob.data();
917
92.4k
      c.first_extra_bit_prob = cst.first_extra_bit_prob.data();
918
92.4k
      const ComponentMeta& m = meta[i];
919
92.4k
      c.context_map = state->context_map + m.context_offset * kNumAvrgContexts;
920
92.4k
      c.context_bits = m.context_bits;
921
92.4k
      const int width = m.width_in_blocks;
922
92.4k
      const size_t ac_stride = m.ac_stride;
923
92.4k
      const size_t b_stride = m.b_stride;
924
92.4k
      const int next_iy = ac_dc_state.next_iy;
925
92.4k
      c.y = mcu_y * m.v_samp + next_iy;
926
92.4k
      c.prev_row_delta = (1 - 2 * (c.y & 1u)) * (width + 3) * kDCTBlockSize;
927
394k
      for (int iy = next_iy; iy < m.v_samp; ++iy, ++c.y) {
928
302k
        const int next_x = ac_dc_state.next_x;
929
302k
        const size_t block_offset = next_x * kDCTBlockSize;
930
302k
        c.coeffs = m.ac_coeffs + c.y * ac_stride + block_offset;
931
302k
        c.prev_row_coeffs = c.coeffs - ac_stride;
932
302k
        c.prev_col_coeffs = c.coeffs - kDCTBlockSize;
933
302k
        const uint8_t* block_state = m.block_state + c.y * b_stride + next_x;
934
302k
        c.prev_sgn = &cst.prev_sign[kDCTBlockSize] + block_offset;
935
302k
        c.prev_abs = &cst.prev_abs_coeff[((c.y & 1u) * (width + 3) + 2) *
936
302k
                                         kDCTBlockSize] +
937
302k
                     block_offset;
938
11.6M
        for (c.x = next_x; c.x < width; ++c.x) {
939
11.3M
          bool is_empty = *(block_state++);
940
11.3M
          if (!is_empty) {
941
1.84M
            if (BRUNSLI_PREDICT_FALSE(!in->CanRead(297))) {
942
66
              ac_dc_state.next_mcu_y = mcu_y;
943
66
              ac_dc_state.next_component = i;
944
66
              ac_dc_state.next_iy = iy;
945
66
              ac_dc_state.next_x = c.x;
946
66
              return BRUNSLI_NOT_ENOUGH_DATA;
947
66
            }
948
1.84M
            size_t num_nonzeros = DecodeAcBlock(c);
949
1.84M
            BRUNSLI_DCHECK(num_nonzeros <= kNumNonZeroTreeSize);
950
1.84M
            c.prev_num_nonzeros[c.x] = static_cast<uint8_t>(num_nonzeros);
951
9.46M
          } else {
952
9.46M
            DecodeEmptyAcBlock(c.prev_sgn, c.prev_abs);
953
9.46M
            c.prev_num_nonzeros[c.x] = 0;
954
9.46M
          }
955
11.3M
          c.coeffs += kDCTBlockSize;
956
11.3M
          c.prev_sgn += kDCTBlockSize;
957
11.3M
          c.prev_abs += kDCTBlockSize;
958
11.3M
          c.prev_row_coeffs += kDCTBlockSize;
959
11.3M
          c.prev_col_coeffs += kDCTBlockSize;
960
11.3M
        }
961
301k
        c.prev_row_delta *= -1;
962
301k
        ac_dc_state.next_x = 0;
963
301k
      }
964
92.3k
      ac_dc_state.next_iy = 0;
965
92.3k
    }
966
92.0k
    ac_dc_state.next_component = 0;
967
92.0k
  }
968
4.86k
  ac_dc_state.next_mcu_y = 0;
969
970
4.86k
  comps.clear();
971
4.86k
  comps.shrink_to_fit();
972
973
4.86k
  if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN;
974
975
4.40k
  return BRUNSLI_OK;
976
4.86k
}
977
978
208k
static bool CheckCanRead(State* state, size_t required) {
979
  // TODO(eustas): dcheck len > pos
980
208k
  size_t available = state->len - state->pos;
981
208k
  return required <= available;
982
208k
}
983
984
123k
static bool CheckCanReadByte(State* state) {
985
  // TODO(eustas): dcheck len > pos
986
123k
  return state->pos != state->len;
987
123k
}
988
989
123k
static uint8_t ReadByte(State* state) {
990
  // TODO(eustas): dcheck len > pos
991
123k
  return state->data[state->pos++];
992
123k
}
993
994
191k
static uint8_t PeekByte(State* state, size_t offset) {
995
  // TODO(eustas): dcheck overflow.
996
191k
  return state->data[state->pos + offset];
997
191k
}
998
999
368k
static void SkipBytes(State* state, size_t len) {
1000
  // TODO(eustas): dcheck overflow.
1001
368k
  state->pos += len;
1002
368k
}
1003
1004
259k
static size_t GetBytesAvailable(State* state) {
1005
  // TODO(eustas): dcheck len > pos
1006
259k
  return state->len - state->pos;
1007
259k
}
1008
1009
4.63k
static size_t SkipAvailableBytes(State* state, size_t len) {
1010
4.63k
  size_t available = GetBytesAvailable(state);
1011
4.63k
  size_t skip_bytes = std::min(available, len);
1012
4.63k
  state->pos += skip_bytes;
1013
4.63k
  return skip_bytes;
1014
4.63k
}
1015
1016
154k
static BrunsliStatus DecodeBase128(State* state, size_t* val) {
1017
154k
  *val = 0;
1018
154k
  uint64_t b = 0x80;
1019
154k
  size_t i = 0;
1020
345k
  while ((i < 9) && (b & 0x80u)) {
1021
191k
    if (!CheckCanRead(state, i + 1)) return BRUNSLI_NOT_ENOUGH_DATA;
1022
191k
    b = PeekByte(state, i);
1023
191k
    *val |= (b & 0x7Fu) << (i * 7);
1024
191k
    ++i;
1025
191k
  }
1026
153k
  SkipBytes(state, i);
1027
153k
  return ((b & 0x80u) == 0) ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1028
154k
}
1029
1030
16.9k
static Stage Fail(State* state, BrunsliStatus result) {
1031
16.9k
  InternalState& s = *state->internal;
1032
16.9k
  s.result = result;
1033
  // Preserve current stage for continuation / error reporting.
1034
16.9k
  s.last_stage = state->stage;
1035
16.9k
  return Stage::ERROR;
1036
16.9k
}
1037
1038
123k
static BrunsliStatus ReadTag(State* state, SectionState* section) {
1039
123k
  if (!CheckCanReadByte(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1040
123k
  const uint8_t marker = ReadByte(state);
1041
1042
123k
  const size_t tag = marker >> 3u;
1043
123k
  if (tag == 0 || tag > 15) return BRUNSLI_INVALID_BRN;
1044
123k
  section->tag = tag;
1045
1046
123k
  const size_t wiring_type = marker & 0x7u;
1047
123k
  if (wiring_type != kBrunsliWiringTypeVarint &&
1048
63.5k
      wiring_type != kBrunsliWiringTypeLengthDelimited) {
1049
19
    return BRUNSLI_INVALID_BRN;
1050
19
  }
1051
123k
  section->is_section = (wiring_type == kBrunsliWiringTypeLengthDelimited);
1052
1053
123k
  const uint32_t tag_bit = 1u << tag;
1054
123k
  if (section->tags_met & tag_bit) {
1055
13
    BRUNSLI_LOG_ERROR() << "Duplicate marker " << std::hex
1056
13
                        << static_cast<int>(marker) << BRUNSLI_ENDL();
1057
13
    return BRUNSLI_INVALID_BRN;
1058
13
  }
1059
123k
  section->tags_met |= tag_bit;
1060
1061
123k
  return BRUNSLI_OK;
1062
123k
}
1063
1064
58.8k
static BrunsliStatus EnterSection(State* state, SectionState* section) {
1065
58.8k
  size_t section_size;
1066
58.8k
  BrunsliStatus status = DecodeBase128(state, &section_size);
1067
58.8k
  if (status != BRUNSLI_OK) return status;
1068
58.7k
  section->is_active = true;
1069
58.7k
  section->remaining = section_size;
1070
58.7k
  section->milestone = state->pos;
1071
58.7k
  section->projected_end = state->pos + section->remaining;
1072
58.7k
  return BRUNSLI_OK;
1073
58.8k
}
1074
1075
16.1k
static void LeaveSection(SectionState* section) {
1076
16.1k
  section->is_active = false;
1077
16.1k
}
1078
1079
279k
static bool IsOutOfSectionBounds(State* state) {
1080
279k
  return state->pos > state->internal->section.projected_end;
1081
279k
}
1082
1083
275k
static size_t RemainingSectionLength(State* state) {
1084
  // TODO(eustas): remove this check?
1085
275k
  if (IsOutOfSectionBounds(state)) return 0;
1086
267k
  return state->internal->section.projected_end - state->pos;
1087
275k
}
1088
1089
146k
static bool IsAtSectionBoundary(State* state) {
1090
146k
  return state->pos == state->internal->section.projected_end;
1091
146k
}
1092
1093
16.8k
Stage VerifySignature(State* state) {
1094
16.8k
  InternalState& s = *state->internal;
1095
1096
16.8k
  if (!CheckCanRead(state, kBrunsliSignatureSize)) {
1097
5
    return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1098
5
  }
1099
16.8k
  const bool is_signature_ok =
1100
16.8k
      (memcmp(state->data + state->pos, kBrunsliSignature,
1101
16.8k
              kBrunsliSignatureSize) != 0);
1102
16.8k
  state->pos += kBrunsliSignatureSize;
1103
16.8k
  s.section.tags_met |= 1u << kBrunsliSignatureTag;
1104
16.8k
  if (is_signature_ok) return Fail(state, BRUNSLI_INVALID_BRN);
1105
16.7k
  return Stage::HEADER;
1106
16.8k
}
1107
1108
// Parses the brunsli header starting at data[*pos] and fills in *jpg.
1109
// Sets *pos to the position after the header.
1110
// Returns BRUNSLI_OK, unless the data is not valid brunsli byte stream
1111
// or is truncated.
1112
16.7k
Stage DecodeHeader(State* state, JPEGData* jpg) {
1113
16.7k
  InternalState& s = *state->internal;
1114
16.7k
  HeaderState& hs = s.header;
1115
1116
216k
  while (hs.stage != HeaderState::DONE) {
1117
199k
    switch (hs.stage) {
1118
16.7k
      case HeaderState::READ_TAG: {
1119
16.7k
        BrunsliStatus status = ReadTag(state, &s.section);
1120
16.7k
        if (status != BRUNSLI_OK) return Fail(state, status);
1121
16.7k
        if (s.section.tag != kBrunsliHeaderTag || !s.section.is_section) {
1122
7
          return Fail(state, BRUNSLI_INVALID_BRN);
1123
7
        }
1124
16.7k
        hs.stage = HeaderState::ENTER_SECTION;
1125
16.7k
        break;
1126
16.7k
      }
1127
1128
16.7k
      case HeaderState::ENTER_SECTION: {
1129
16.7k
        BrunsliStatus status = EnterSection(state, &s.section);
1130
16.7k
        if (status != BRUNSLI_OK) return Fail(state, status);
1131
16.6k
        hs.stage = HeaderState::ITEM_READ_TAG;
1132
16.6k
        break;
1133
16.7k
      }
1134
1135
80.9k
      case HeaderState::ITEM_READ_TAG: {
1136
80.9k
        if (IsAtSectionBoundary(state)) {
1137
16.3k
          hs.stage = HeaderState::FINALE;
1138
16.3k
          break;
1139
16.3k
        }
1140
64.6k
        BrunsliStatus status = ReadTag(state, &hs.section);
1141
64.6k
        if (status != BRUNSLI_OK) return Fail(state, status);
1142
64.4k
        const uint32_t tag_bit = 1u << hs.section.tag;
1143
64.4k
        if (hs.section.is_section) {
1144
4.64k
          if (kKnownHeaderVarintTags & tag_bit) {
1145
4.51k
            Fail(state, BRUNSLI_INVALID_BRN);
1146
4.51k
          }
1147
4.64k
          hs.stage = HeaderState::ITEM_ENTER_SECTION;
1148
4.64k
          break;
1149
4.64k
        }
1150
59.8k
        hs.stage = HeaderState::ITEM_READ_VALUE;
1151
59.8k
        break;
1152
64.4k
      }
1153
1154
4.64k
      case HeaderState::ITEM_ENTER_SECTION: {
1155
4.64k
        BrunsliStatus status = DecodeBase128(state, &hs.remaining_skip_length);
1156
4.64k
        if (status != BRUNSLI_OK) return Fail(state, status);
1157
4.63k
        hs.stage = HeaderState::ITEM_SKIP_CONTENTS;
1158
4.63k
        break;
1159
4.64k
      }
1160
1161
4.63k
      case HeaderState::ITEM_SKIP_CONTENTS: {
1162
4.63k
        size_t bytes_skipped =
1163
4.63k
            SkipAvailableBytes(state, hs.remaining_skip_length);
1164
4.63k
        hs.remaining_skip_length -= bytes_skipped;
1165
4.63k
        if (hs.remaining_skip_length > 0) {
1166
124
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
1167
124
        }
1168
4.50k
        hs.stage = HeaderState::ITEM_READ_TAG;
1169
4.50k
        break;
1170
4.63k
      }
1171
1172
59.8k
      case HeaderState::ITEM_READ_VALUE: {
1173
59.8k
        size_t value;
1174
59.8k
        BrunsliStatus status = DecodeBase128(state, &value);
1175
59.8k
        if (status != BRUNSLI_OK) return Fail(state, status);
1176
59.8k
        hs.varint_values[hs.section.tag] = value;
1177
59.8k
        hs.stage = HeaderState::ITEM_READ_TAG;
1178
59.8k
        break;
1179
59.8k
      }
1180
1181
16.3k
      case HeaderState::FINALE: {
1182
16.3k
        const bool has_version =
1183
16.3k
            hs.section.tags_met & (1u << kBrunsliHeaderVersionCompTag);
1184
16.3k
        if (!has_version) return Fail(state, BRUNSLI_INVALID_BRN);
1185
16.3k
        const size_t version_and_comp_count =
1186
16.3k
            hs.varint_values[kBrunsliHeaderVersionCompTag];
1187
1188
16.3k
        const size_t version = version_and_comp_count >> 2u;
1189
16.3k
        jpg->version = static_cast<int>(version);
1190
1191
16.3k
        if (version == 1) {  // fallback mode
1192
          // TODO(eustas): do we need this?
1193
356
          jpg->width = 0;
1194
356
          jpg->height = 0;
1195
356
          hs.stage = HeaderState::DONE;
1196
356
          break;
1197
356
        }
1198
1199
        // Wrong mode = fallback + something.
1200
16.0k
        if ((version & 1u) != 0) {
1201
18
          return Fail(state, BRUNSLI_INVALID_BRN);
1202
18
        }
1203
        // Unknown mode - only 3 bits are defined.
1204
15.9k
        if ((version & ~0x7u) != 0) {
1205
49
          return Fail(state, BRUNSLI_INVALID_BRN);
1206
49
        }
1207
1208
        // Otherwise regular brunsli.
1209
15.9k
        state->use_legacy_context_model = !(version & 2);
1210
1211
        // Do not allow "original_jpg" for regular Brunsli files.
1212
15.9k
        s.section.tags_met |= 1u << kBrunsliOriginalJpgTag;
1213
1214
15.9k
        const bool has_width =
1215
15.9k
            hs.section.tags_met & (1u << kBrunsliHeaderWidthTag);
1216
15.9k
        if (!has_width) return Fail(state, BRUNSLI_INVALID_BRN);
1217
15.9k
        const size_t width = hs.varint_values[kBrunsliHeaderWidthTag];
1218
15.9k
        const bool has_height =
1219
15.9k
            hs.section.tags_met & (1u << kBrunsliHeaderHeightTag);
1220
15.9k
        if (!has_height) return Fail(state, BRUNSLI_INVALID_BRN);
1221
15.9k
        const size_t height = hs.varint_values[kBrunsliHeaderHeightTag];
1222
1223
15.9k
        if (width == 0 || height == 0) return Fail(state, BRUNSLI_INVALID_BRN);
1224
15.9k
        if (width > kMaxDimPixels || height > kMaxDimPixels) {
1225
175
          return Fail(state, BRUNSLI_INVALID_BRN);
1226
175
        }
1227
15.7k
        jpg->width = static_cast<int>(width);
1228
15.7k
        jpg->height = static_cast<int>(height);
1229
1230
15.7k
        const size_t num_components = (version_and_comp_count & 3u) + 1u;
1231
15.7k
        jpg->components.resize(num_components);
1232
1233
15.7k
        const bool has_subsampling =
1234
15.7k
            hs.section.tags_met & (1u << kBrunsliHeaderSubsamplingTag);
1235
15.7k
        if (!has_subsampling) return Fail(state, BRUNSLI_INVALID_BRN);
1236
15.7k
        size_t subsampling_code =
1237
15.7k
            hs.varint_values[kBrunsliHeaderSubsamplingTag];
1238
1239
42.6k
        for (size_t i = 0; i < jpg->components.size(); ++i) {
1240
26.9k
          JPEGComponent* c = &jpg->components[i];
1241
26.9k
          c->v_samp_factor = (subsampling_code & 0xFu) + 1;
1242
26.9k
          subsampling_code >>= 4u;
1243
26.9k
          c->h_samp_factor = (subsampling_code & 0xFu) + 1;
1244
26.9k
          subsampling_code >>= 4u;
1245
26.9k
          if (c->v_samp_factor > kBrunsliMaxSampling) {
1246
1
            return Fail(state, BRUNSLI_INVALID_BRN);
1247
1
          }
1248
26.9k
          if (c->h_samp_factor > kBrunsliMaxSampling) {
1249
1
            return Fail(state, BRUNSLI_INVALID_BRN);
1250
1
          }
1251
26.9k
        }
1252
15.7k
        if (!UpdateSubsamplingDerivatives(jpg)) {
1253
1
          return Fail(state, BRUNSLI_INVALID_BRN);
1254
1
        }
1255
1256
15.7k
        PrepareMeta(jpg, state);
1257
1258
15.7k
        hs.stage = HeaderState::DONE;
1259
15.7k
        break;
1260
15.7k
      }
1261
1262
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
1263
199k
    }
1264
199k
  }
1265
1266
16.0k
  LeaveSection(&s.section);
1267
16.0k
  return (jpg->version == kFallbackVersion) ? Stage::FALLBACK : Stage::SECTION;
1268
16.7k
}
1269
1270
4.09k
static BrunsliStatus DecodeMetaDataSection(State* state, JPEGData* jpg) {
1271
4.09k
  InternalState& s = *state->internal;
1272
4.09k
  MetadataState& ms = s.metadata;
1273
1274
4.09k
  if (ms.decompression_stage == MetadataDecompressionStage::DONE) {
1275
0
    return BRUNSLI_INVALID_BRN;
1276
0
  }
1277
1278
4.09k
  if (ms.decompression_stage == MetadataDecompressionStage::INITIAL) {
1279
4.09k
    if (IsAtSectionBoundary(state)) {
1280
3
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1281
3
      return BRUNSLI_OK;
1282
3
    }
1283
4.09k
    if (RemainingSectionLength(state) == 1) {
1284
44
      if (!CheckCanReadByte(state)) {
1285
1
        return BRUNSLI_NOT_ENOUGH_DATA;
1286
1
      }
1287
43
      uint8_t data[1];
1288
43
      data[0] = ReadByte(state);
1289
43
      bool ok = ProcessMetaData(data, 1, &ms, jpg) && ms.CanFinish();
1290
43
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1291
43
      return ok ? BRUNSLI_OK : BRUNSLI_INVALID_BRN;
1292
44
    }
1293
4.05k
    ms.decompression_stage =
1294
4.05k
        MetadataDecompressionStage::READ_LENGTH;
1295
4.05k
  }
1296
1297
4.05k
  if (ms.decompression_stage == MetadataDecompressionStage::READ_LENGTH) {
1298
4.05k
    BrunsliStatus status = DecodeBase128(state, &ms.metadata_size);
1299
4.05k
    if (status != BRUNSLI_OK) return status;
1300
    // TODO(eustas): ms.metadata_size should be limited to avoid "zip-bombs".
1301
3.96k
    if (IsOutOfSectionBounds(state)) return BRUNSLI_INVALID_BRN;
1302
3.96k
    if (RemainingSectionLength(state) == 0) return BRUNSLI_INVALID_BRN;
1303
3.96k
    ms.brotli = BrotliDecoderCreateInstance(nullptr, nullptr, nullptr);
1304
3.96k
    if (ms.brotli == nullptr) return BRUNSLI_DECOMPRESSION_ERROR;
1305
3.96k
    ms.decompression_stage = MetadataDecompressionStage::DECOMPRESSING;
1306
3.96k
  }
1307
1308
3.96k
  if (ms.decompression_stage == MetadataDecompressionStage::DECOMPRESSING) {
1309
    // Free Brotli decoder and return result
1310
3.96k
    const auto finish_decompression = [&ms] (BrunsliStatus result) {
1311
2.40k
      BRUNSLI_DCHECK(ms.brotli != nullptr);
1312
2.40k
      BrotliDecoderDestroyInstance(ms.brotli);
1313
2.40k
      ms.brotli = nullptr;
1314
2.40k
      ms.decompression_stage = MetadataDecompressionStage::DONE;
1315
2.40k
      return result;
1316
2.40k
    };
1317
1318
153k
    while (true) {
1319
153k
      size_t available_bytes =
1320
153k
          std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1321
153k
      size_t available_in = available_bytes;
1322
153k
      const uint8_t* next_in = state->data + state->pos;
1323
153k
      size_t available_out = 0;
1324
153k
      BrotliDecoderResult result = BrotliDecoderDecompressStream(
1325
153k
          ms.brotli, &available_in, &next_in, &available_out, nullptr, nullptr);
1326
153k
      if (result == BROTLI_DECODER_RESULT_ERROR) {
1327
1.03k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1328
1.03k
      }
1329
152k
      size_t chunk_size = 0;
1330
152k
      const uint8_t* chunk_data =
1331
152k
          BrotliDecoderTakeOutput(ms.brotli, &chunk_size);
1332
152k
      ms.decompressed_size += chunk_size;
1333
152k
      if (ms.decompressed_size > ms.metadata_size) {
1334
1.03k
        return finish_decompression(BRUNSLI_INVALID_BRN);
1335
1.03k
      }
1336
151k
      size_t consumed_bytes = available_bytes - available_in;
1337
151k
      SkipBytes(state, consumed_bytes);
1338
151k
      bool chunk_ok = ProcessMetaData(chunk_data, chunk_size, &ms, jpg);
1339
151k
      if (!chunk_ok) return finish_decompression(BRUNSLI_INVALID_BRN);
1340
151k
      if (result == BROTLI_DECODER_RESULT_SUCCESS) {
1341
187
        if (RemainingSectionLength(state) != 0) {
1342
118
          return finish_decompression(BRUNSLI_INVALID_BRN);
1343
118
        }
1344
69
        if (ms.decompressed_size != ms.metadata_size) {
1345
64
          return finish_decompression(BRUNSLI_INVALID_BRN);
1346
64
        }
1347
5
        if (!ms.CanFinish()) return finish_decompression(BRUNSLI_INVALID_BRN);
1348
3
        return finish_decompression(BRUNSLI_OK);
1349
5
      }
1350
150k
      if (result == BROTLI_DECODER_RESULT_NEEDS_MORE_OUTPUT) continue;
1351
1.56k
      BRUNSLI_DCHECK(result == BROTLI_DECODER_RESULT_NEEDS_MORE_INPUT);
1352
1.56k
      if (RemainingSectionLength(state) == 0) {
1353
14
        return finish_decompression(BRUNSLI_INVALID_BRN);
1354
14
      }
1355
1.55k
      return BRUNSLI_NOT_ENOUGH_DATA;
1356
1.56k
    }
1357
3.96k
  }
1358
1359
  // Unreachable.
1360
0
  BRUNSLI_DCHECK(false);
1361
0
  return BRUNSLI_DECOMPRESSION_ERROR;
1362
3.96k
}
1363
1364
/**
1365
 * Wraps result, depending on the state of input.
1366
 *
1367
 * If parser needs more data, but section data is depleted,
1368
 * then input is corrupted.
1369
 */
1370
26.5k
static BrunsliStatus CheckBoundary(State* state, BrunsliStatus result) {
1371
26.5k
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
1372
3.26k
    bool last = (RemainingSectionLength(state) <= GetBytesAvailable(state));
1373
3.26k
    return last ? BRUNSLI_INVALID_BRN : BRUNSLI_NOT_ENOUGH_DATA;
1374
23.2k
  } else {
1375
23.2k
    return result;
1376
23.2k
  }
1377
26.5k
}
1378
1379
26.3k
static void PrepareBitReader(BrunsliBitReader* br, State* state) {
1380
26.3k
  size_t chunk_len =
1381
26.3k
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1382
26.3k
  BrunsliBitReaderResume(br, state->data + state->pos, chunk_len);
1383
26.3k
  BRUNSLI_DCHECK(BrunsliBitReaderIsHealthy(br));
1384
26.3k
}
1385
1386
/**
1387
 * Marks data used by bit-reader as consumed.
1388
 */
1389
static BrunsliStatus SuspendBitReader(BrunsliBitReader* br, State* state,
1390
26.3k
                                      BrunsliStatus result) {
1391
26.3k
  size_t chunk_len =
1392
26.3k
      std::min(GetBytesAvailable(state), RemainingSectionLength(state));
1393
26.3k
  size_t unused_bytes = BrunsliBitReaderSuspend(br);
1394
26.3k
  size_t consumed_bytes = chunk_len - unused_bytes;
1395
26.3k
  SkipBytes(state, consumed_bytes);
1396
26.3k
  result = CheckBoundary(state, result);
1397
  // Once BitReader becomes unhealthy, further decoding should be impossible.
1398
26.3k
  BRUNSLI_DCHECK(
1399
26.3k
      BrunsliBitReaderIsHealthy(br) ||
1400
26.3k
      ((result != BRUNSLI_OK) && (result != BRUNSLI_NOT_ENOUGH_DATA)));
1401
26.3k
  return result;
1402
26.3k
}
1403
1404
11.4k
static BrunsliStatus DecodeJPEGInternalsSection(State* state, JPEGData* jpg) {
1405
11.4k
  InternalState& s = *state->internal;
1406
11.4k
  JpegInternalsState& js = s.internals;
1407
11.4k
  BrunsliBitReader* br = &js.br;
1408
1409
11.4k
  if (js.stage == JpegInternalsState::INIT) {
1410
11.4k
    BrunsliBitReaderInit(br);
1411
11.4k
    js.stage = JpegInternalsState::READ_MARKERS;
1412
11.4k
  }
1413
11.4k
  PrepareBitReader(br, state);
1414
1415
11.4k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1416
11.4k
    return SuspendBitReader(br, state, result);
1417
11.4k
  };
1418
1419
11.4k
  if (js.stage == JpegInternalsState::READ_MARKERS) {
1420
3.00M
    while (true) {
1421
3.00M
      if (!BrunsliBitReaderCanRead(br, 6)) {
1422
187
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1423
187
      }
1424
3.00M
      uint8_t marker = 0xc0 + BrunsliBitReaderRead(br, 6);
1425
3.00M
      jpg->marker_order.push_back(marker);
1426
3.00M
      if (marker == 0xc4) ++js.dht_count;
1427
3.00M
      if (marker == 0xdd) js.have_dri = true;
1428
3.00M
      if (marker == 0xda) ++js.num_scans;
1429
3.00M
      if (marker == 0xd9) break;
1430
3.00M
    }
1431
11.2k
    js.stage = JpegInternalsState::READ_DRI;
1432
11.2k
  }
1433
1434
11.2k
  if (js.stage == JpegInternalsState::READ_DRI) {
1435
11.2k
    if (js.have_dri) {
1436
1.51k
      if (!BrunsliBitReaderCanRead(br, 16)) {
1437
132
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1438
132
      }
1439
1.37k
      jpg->restart_interval = BrunsliBitReaderRead(br, 16);
1440
1.37k
    }
1441
11.1k
    js.stage = JpegInternalsState::READ_HUFFMAN_LAST;
1442
11.1k
  }
1443
1444
11.1k
  if (js.stage & JpegInternalsState::DECODE_HUFFMAN_MASK) {
1445
11.1k
    BrunsliStatus status = DecodeHuffmanCode(state, jpg);
1446
11.1k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1447
10.7k
    js.stage = JpegInternalsState::PREPARE_READ_SCANS;
1448
10.7k
  }
1449
1450
10.7k
  if (js.stage == JpegInternalsState::PREPARE_READ_SCANS) {
1451
10.7k
    if (js.dht_count != js.terminal_huffman_code_count) {
1452
149
      BRUNSLI_LOG_ERROR() << "Invalid number of DHT markers" << BRUNSLI_ENDL();
1453
149
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1454
149
    }
1455
10.6k
    if (js.num_scans > 0) {
1456
5.00k
      jpg->scan_info.resize(js.num_scans);
1457
5.00k
      js.i = 0;
1458
5.00k
      js.stage = JpegInternalsState::READ_SCAN_COMMON;
1459
5.62k
    } else {
1460
5.62k
      js.stage = JpegInternalsState::READ_NUM_QUANT;
1461
5.62k
    }
1462
10.6k
  }
1463
1464
10.6k
  if (js.stage & JpegInternalsState::DECODE_SCAN_MASK) {
1465
5.00k
    BrunsliStatus status = DecodeScanInfo(state, jpg);
1466
5.00k
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1467
4.69k
    js.stage = JpegInternalsState::READ_NUM_QUANT;
1468
4.69k
  }
1469
1470
10.3k
  if (js.stage == JpegInternalsState::READ_NUM_QUANT) {
1471
10.3k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1472
167
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1473
167
    }
1474
10.1k
    int num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1475
10.1k
    jpg->quant.resize(num_quant_tables);
1476
10.1k
    js.i = 0;
1477
10.1k
    js.stage = JpegInternalsState::READ_QUANT;
1478
10.1k
  }
1479
1480
20.2k
  while (js.stage == JpegInternalsState::READ_QUANT) {
1481
20.2k
    if (js.i >= jpg->quant.size()) {
1482
9.85k
      js.stage = JpegInternalsState::READ_COMP_ID_SCHEME;
1483
9.85k
      break;
1484
9.85k
    }
1485
    // 6 or 7 bits are used, but we know that at least one more bit is
1486
    // guaranteed to be used by varint out of the loop.
1487
10.3k
    if (!BrunsliBitReaderCanRead(br, 7)) {
1488
166
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1489
166
    }
1490
10.1k
    JPEGQuantTable* q = &jpg->quant[js.i];
1491
10.1k
    q->index = BrunsliBitReaderRead(br, 2);
1492
10.1k
    q->is_last = (js.i == jpg->quant.size() - 1) || BrunsliBitReaderRead(br, 1);
1493
10.1k
    q->precision = BrunsliBitReaderRead(br, 4);
1494
10.1k
    if (q->precision > 1) {
1495
132
      BRUNSLI_LOG_ERROR() << "Invalid quantization table precision: "
1496
132
                          << q->precision << BRUNSLI_ENDL();
1497
132
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1498
132
    }
1499
    // note that q->values[] are initialized to invalid 0 values.
1500
10.0k
    ++js.i;
1501
10.0k
  }
1502
1503
9.85k
  if (js.stage == JpegInternalsState::READ_COMP_ID_SCHEME) {
1504
9.85k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1505
131
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1506
131
    }
1507
9.72k
    int comp_ids = BrunsliBitReaderRead(br, 2);
1508
9.72k
    static const size_t kMinRequiredComponents[4] = {
1509
9.72k
        3 /* Ids123*/, 1 /* IdsGray */, 3 /* IdsRGB */, 0 /* IdsCustom */
1510
9.72k
    };
1511
9.72k
    if (jpg->components.size() < kMinRequiredComponents[comp_ids]) {
1512
3
      BRUNSLI_LOG_ERROR() << "Insufficient number of components for ColorId #"
1513
3
                          << comp_ids << BRUNSLI_ENDL();
1514
3
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1515
3
    }
1516
9.72k
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1517
9.72k
    if (comp_ids == kComponentIds123) {
1518
493
      jpg->components[0].id = 1;
1519
493
      jpg->components[1].id = 2;
1520
493
      jpg->components[2].id = 3;
1521
9.23k
    } else if (comp_ids == kComponentIdsGray) {
1522
8.79k
      jpg->components[0].id = 1;
1523
8.79k
    } else if (comp_ids == kComponentIdsRGB) {
1524
33
      jpg->components[0].id = 'R';
1525
33
      jpg->components[1].id = 'G';
1526
33
      jpg->components[2].id = 'B';
1527
405
    } else {
1528
405
      BRUNSLI_DCHECK(comp_ids == kComponentIdsCustom);
1529
405
      js.i = 0;
1530
405
      js.stage = JpegInternalsState::READ_COMP_ID;
1531
405
    }
1532
9.72k
  }
1533
1534
9.72k
  if (js.stage == JpegInternalsState::READ_COMP_ID) {
1535
803
    while (js.i < jpg->components.size()) {
1536
425
      if (!BrunsliBitReaderCanRead(br, 8)) {
1537
27
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1538
27
      }
1539
398
      jpg->components[js.i].id = BrunsliBitReaderRead(br, 8);
1540
398
      ++js.i;
1541
398
    }
1542
378
    js.stage = JpegInternalsState::READ_NUM_PADDING_BITS;
1543
378
  }
1544
1545
9.69k
  if (js.stage == JpegInternalsState::READ_NUM_PADDING_BITS) {
1546
    // TODO(eustas): sanitize: should not be bigger than
1547
    //               7 x (num_scans + num_blocks / dri)
1548
    // security: limit is 32b for n_size
1549
9.69k
    if (!DecodeLimitedVarint<8>(&js.varint, br, 4)) {
1550
95
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1551
95
    }
1552
9.60k
    js.num_padding_bits = js.varint.value;
1553
9.60k
    jpg->has_zero_padding_bit = (js.num_padding_bits > 0);
1554
9.60k
    if (js.num_padding_bits > PaddingBitsLimit(*jpg)) {
1555
42
      BRUNSLI_LOG_ERROR() << "Suspicious number of padding bits "
1556
42
                          << js.num_padding_bits << BRUNSLI_ENDL();
1557
42
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1558
42
    }
1559
9.56k
    js.i = 0;
1560
9.56k
    js.stage = JpegInternalsState::READ_PADDING_BITS;
1561
9.56k
  }
1562
1563
9.56k
  if (js.stage == JpegInternalsState::READ_PADDING_BITS) {
1564
67.6k
    while (js.i < js.num_padding_bits) {
1565
58.1k
      if (!BrunsliBitReaderCanRead(br, 1)) {
1566
22
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1567
22
      }
1568
58.1k
      jpg->padding_bits.emplace_back(BrunsliBitReaderRead(br, 1));
1569
58.1k
      ++js.i;
1570
58.1k
    }
1571
9.53k
    suspend_bit_reader(BRUNSLI_OK);
1572
9.53k
    BrunsliBitReaderFinish(br);
1573
9.53k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1574
9.52k
    js.i = 0;
1575
9.52k
    js.stage = JpegInternalsState::ITERATE_MARKERS;
1576
9.52k
  } else {
1577
    // no-op
1578
0
    suspend_bit_reader(BRUNSLI_OK);
1579
0
  }
1580
1581
2.27M
  while (true) {
1582
2.27M
    switch (js.stage) {
1583
2.21M
      case JpegInternalsState::ITERATE_MARKERS: {
1584
2.21M
        if (js.i >= jpg->marker_order.size()) {
1585
9.17k
          js.stage = JpegInternalsState::DONE;
1586
2.20M
        } else if (jpg->marker_order[js.i] == 0xFF) {
1587
26.6k
          js.stage = JpegInternalsState::READ_INTERMARKER_LENGTH;
1588
2.17M
        } else {
1589
2.17M
          ++js.i;
1590
2.17M
        }
1591
2.21M
        continue;
1592
0
      }
1593
1594
26.6k
      case JpegInternalsState::READ_INTERMARKER_LENGTH: {
1595
26.6k
        BrunsliStatus status = DecodeBase128(state, &js.intermarker_length);
1596
26.6k
        if (status != BRUNSLI_OK) return CheckBoundary(state, status);
1597
26.4k
        if (js.intermarker_length > RemainingSectionLength(state)) {
1598
77
          return BRUNSLI_INVALID_BRN;
1599
77
        }
1600
26.3k
        jpg->inter_marker_data.emplace_back();
1601
26.3k
        js.stage = JpegInternalsState::READ_INTERMARKER_DATA;
1602
26.3k
        continue;
1603
26.4k
      }
1604
1605
26.3k
      case JpegInternalsState::READ_INTERMARKER_DATA: {
1606
26.3k
        auto& dest = jpg->inter_marker_data.back();
1607
26.3k
        size_t piece_limit = js.intermarker_length - dest.size();
1608
26.3k
        size_t piece_size = std::min(piece_limit, GetBytesAvailable(state));
1609
26.3k
        Append(&dest, state->data + state->pos, piece_size);
1610
26.3k
        SkipBytes(state, piece_size);
1611
26.3k
        if (dest.size() < js.intermarker_length) {
1612
128
          BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
1613
128
          BRUNSLI_DCHECK(RemainingSectionLength(state) > 0);
1614
128
          return BRUNSLI_NOT_ENOUGH_DATA;
1615
128
        }
1616
26.2k
        ++js.i;
1617
26.2k
        js.stage = JpegInternalsState::ITERATE_MARKERS;
1618
26.2k
        continue;
1619
26.3k
      }
1620
1621
9.17k
      default: { /* no-op */ }
1622
2.27M
    }
1623
9.17k
    break;  // no matching stage has been found; exit the loop.
1624
2.27M
  }
1625
1626
9.17k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1627
1628
9.01k
  return BRUNSLI_OK;
1629
9.17k
}
1630
1631
7.57k
static BrunsliStatus DecodeQuantDataSection(State* state, JPEGData* jpg) {
1632
7.57k
  InternalState& s = *state->internal;
1633
7.57k
  QuantDataState& qs = s.quant;
1634
7.57k
  BrunsliBitReader* br = &qs.br;
1635
1636
7.57k
  if (qs.stage == QuantDataState::INIT) {
1637
7.57k
    BrunsliBitReaderInit(br);
1638
7.57k
    qs.stage = QuantDataState::READ_NUM_QUANT;
1639
7.57k
  }
1640
7.57k
  PrepareBitReader(br, state);
1641
1642
7.57k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1643
7.57k
    return SuspendBitReader(br, state, result);
1644
7.57k
  };
1645
1646
7.57k
  if (qs.stage == QuantDataState::READ_NUM_QUANT) {
1647
7.57k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1648
142
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1649
142
    }
1650
7.43k
    size_t num_quant_tables = BrunsliBitReaderRead(br, 2) + 1;
1651
7.43k
    if (jpg->quant.size() != num_quant_tables) {
1652
130
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1653
130
    }
1654
7.30k
    qs.predictor.resize(kDCTBlockSize);
1655
7.30k
    qs.i = 0;
1656
7.30k
    qs.stage = QuantDataState::READ_STOCK;
1657
7.30k
  }
1658
1659
68.3k
  while (true) {
1660
68.3k
    switch (qs.stage) {
1661
13.7k
      case QuantDataState::READ_STOCK: {
1662
13.7k
        if (qs.i >= jpg->quant.size()) {
1663
6.28k
          std::vector<uint8_t>().swap(qs.predictor);
1664
6.28k
          qs.i = 0;
1665
6.28k
          qs.stage = QuantDataState::READ_QUANT_IDX;
1666
6.28k
          continue;
1667
6.28k
        }
1668
        // Depending on еру 1-st bit, it is guaranteed that we will need to read
1669
        // at least 3 or 6 more bits.
1670
7.47k
        if (!BrunsliBitReaderCanRead(br, 4)) {
1671
131
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1672
131
        }
1673
7.34k
        qs.data_precision = 0;
1674
7.34k
        bool is_short = !BrunsliBitReaderRead(br, 1);
1675
7.34k
        if (is_short) {
1676
6.33k
          const size_t short_code = BrunsliBitReaderRead(br, 3);
1677
6.33k
          int32_t* table = jpg->quant[qs.i].values.data();
1678
6.33k
          size_t selector = (qs.i > 0) ? 1 : 0;
1679
411k
          for (size_t k = 0; k < kDCTBlockSize; ++k) {
1680
405k
            table[k] = kStockQuantizationTables[selector][short_code][k];
1681
405k
          }
1682
6.33k
          qs.stage = QuantDataState::UPDATE;
1683
6.33k
        } else {
1684
1.01k
          qs.stage = QuantDataState::READ_Q_FACTOR;
1685
1.01k
        }
1686
7.34k
        continue;
1687
7.47k
      }
1688
1689
1.01k
      case QuantDataState::READ_Q_FACTOR: {
1690
1.01k
        if (!BrunsliBitReaderCanRead(br, 6)) {
1691
150
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1692
150
        }
1693
861
        const uint32_t q_factor = BrunsliBitReaderRead(br, 6);
1694
861
        FillQuantMatrix(qs.i > 0, q_factor, qs.predictor.data());
1695
861
        qs.j = 0;
1696
861
        qs.delta = 0;
1697
861
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1698
861
        continue;
1699
1.01k
      }
1700
1701
17.9k
      case QuantDataState::READ_DIFF_IS_ZERO: {
1702
17.9k
        if (qs.j >= kDCTBlockSize) {
1703
230
          qs.stage = QuantDataState::UPDATE;
1704
230
          continue;
1705
230
        }
1706
17.7k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1707
158
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1708
158
        }
1709
17.5k
        if (BrunsliBitReaderRead(br, 1)) {
1710
2.82k
          qs.stage = QuantDataState::READ_DIFF_SIGN;
1711
14.7k
        } else {
1712
14.7k
          qs.stage = QuantDataState::APPLY_DIFF;
1713
14.7k
        }
1714
17.5k
        continue;
1715
17.7k
      }
1716
1717
2.82k
      case QuantDataState::READ_DIFF_SIGN: {
1718
2.82k
        if (!BrunsliBitReaderCanRead(br, 1)) {
1719
152
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1720
152
        }
1721
2.67k
        qs.sign = BrunsliBitReaderRead(br, 1) ? -1 : 1;
1722
2.67k
        qs.stage = QuantDataState::READ_DIFF;
1723
2.67k
        continue;
1724
2.82k
      }
1725
1726
2.67k
      case QuantDataState::READ_DIFF: {
1727
2.67k
        if (!DecodeVarint(&qs.vs, br, 16)) {
1728
133
          return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1729
133
        }
1730
2.54k
        int diff = static_cast<int>(qs.vs.value) + 1;
1731
2.54k
        qs.delta += qs.sign * diff;
1732
2.54k
        qs.stage = QuantDataState::APPLY_DIFF;
1733
2.54k
        continue;
1734
2.67k
      }
1735
1736
17.2k
      case QuantDataState::APPLY_DIFF: {
1737
17.2k
        const int k = kJPEGNaturalOrder[qs.j];
1738
17.2k
        const int quant_value = qs.predictor[k] + qs.delta;
1739
17.2k
        jpg->quant[qs.i].values[k] = quant_value;
1740
17.2k
        if (quant_value <= 0) {
1741
100
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1742
100
        }
1743
17.1k
        if (quant_value >= 256) {
1744
10.4k
          qs.data_precision = 1;
1745
10.4k
        }
1746
17.1k
        if (quant_value >= 65536) {
1747
88
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1748
88
        }
1749
17.0k
        ++qs.j;
1750
17.0k
        qs.stage = QuantDataState::READ_DIFF_IS_ZERO;
1751
17.0k
        continue;
1752
17.1k
      }
1753
1754
6.56k
      case QuantDataState::UPDATE: {
1755
6.56k
        if (jpg->quant[qs.i].precision < qs.data_precision) {
1756
108
          return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1757
108
        }
1758
        // jpg->quant[qs.i].precision > qs.data_precision means that original
1759
        // JPEG1 was inefficiently encoded.
1760
6.45k
        ++qs.i;
1761
6.45k
        qs.stage = QuantDataState::READ_STOCK;
1762
6.45k
        continue;
1763
6.56k
      }
1764
1765
6.28k
      default: { /* no-op */ }
1766
68.3k
    }
1767
6.28k
    break;  // no matching stage has been found; exit the loop.
1768
68.3k
  }
1769
1770
19.1k
  while (qs.stage == QuantDataState::READ_QUANT_IDX) {
1771
13.1k
    if (qs.i >= jpg->components.size()) {
1772
6.04k
      qs.stage = QuantDataState::FINISH;
1773
6.04k
      continue;
1774
6.04k
    }
1775
7.08k
    JPEGComponent* c = &jpg->components[qs.i];
1776
7.08k
    if (!BrunsliBitReaderCanRead(br, 2)) {
1777
153
       return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1778
153
    }
1779
6.93k
    c->quant_idx = BrunsliBitReaderRead(br, 2);
1780
6.93k
    if (c->quant_idx >= jpg->quant.size()) {
1781
93
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1782
93
    }
1783
6.83k
    ++qs.i;
1784
6.83k
  }
1785
1786
6.04k
  BRUNSLI_DCHECK(qs.stage == QuantDataState::FINISH);
1787
6.04k
  suspend_bit_reader(BRUNSLI_OK);
1788
6.04k
  BrunsliBitReaderFinish(br);
1789
6.04k
  if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1790
6.03k
  if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1791
5.92k
  return BRUNSLI_OK;
1792
6.03k
}
1793
1794
7.35k
static BrunsliStatus DecodeHistogramDataSection(State* state, JPEGData* jpg) {
1795
7.35k
  InternalState& s = *state->internal;
1796
7.35k
  HistogramDataState& hs = s.histogram;
1797
7.35k
  BrunsliBitReader* br = &hs.br;
1798
1799
7.35k
  if (hs.stage == HistogramDataState::INIT) {
1800
7.35k
    BrunsliBitReaderInit(br);
1801
7.35k
    BRUNSLI_DCHECK(!jpg->components.empty());
1802
7.35k
    s.num_contexts = jpg->components.size();
1803
7.35k
    hs.stage = HistogramDataState::READ_SCHEME;
1804
    /* Optimization: hint arena about maximal used alphabet size: 272.
1805
     * 648 = 272 + 376, where 376 is a "universal" overhead for max-15-bit
1806
     * root-8-bit 2-level Huffman tables. */
1807
7.35k
    hs.arena.reserve(648);
1808
7.35k
  }
1809
7.35k
  PrepareBitReader(br, state);
1810
7.35k
  if (RemainingSectionLength(state) <= GetBytesAvailable(state)) {
1811
    // If end of section is reachable, then we could parse the remainings in
1812
    // non-streaming mode.
1813
6.57k
    BrunsliBitReaderSetOptimistic(br);
1814
6.57k
  }
1815
7.35k
  const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus {
1816
7.35k
    return SuspendBitReader(br, state, result);
1817
7.35k
  };
1818
1819
7.35k
  if (hs.stage == HistogramDataState::READ_SCHEME) {
1820
7.35k
    const size_t num_components = jpg->components.size();
1821
7.35k
    BRUNSLI_DCHECK(num_components <= 4);
1822
7.35k
    if (!BrunsliBitReaderCanRead(br, 3 * num_components)) {
1823
142
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1824
142
    }
1825
15.3k
    for (size_t i = 0; i < num_components; ++i) {
1826
8.21k
      size_t scheme = BrunsliBitReaderRead(br, 3);
1827
8.21k
      if (scheme >= kNumSchemes) return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1828
8.13k
      ComponentMeta& m = state->meta[i];
1829
8.13k
      m.context_bits = scheme;
1830
8.13k
      m.context_offset = s.num_contexts;
1831
8.13k
      s.num_contexts += kNumNonzeroContextSkip[scheme];
1832
8.13k
    }
1833
7.13k
    if (!BrunsliBitReaderIsHealthy(br)) {
1834
11
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1835
11
    }
1836
7.12k
    hs.stage = HistogramDataState::READ_NUM_HISTOGRAMS;
1837
7.12k
  }
1838
1839
7.12k
  if (hs.stage == HistogramDataState::READ_NUM_HISTOGRAMS) {
1840
7.12k
    if (!BrunsliBitReaderCanRead(br, 11)) {
1841
3
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1842
3
    }
1843
7.11k
    s.num_histograms = DecodeVarLenUint8(br) + 1;
1844
7.11k
    if (!BrunsliBitReaderIsHealthy(br)) {
1845
17
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1846
17
    }
1847
7.10k
    if (s.shallow_histograms) {
1848
0
      hs.stage = HistogramDataState::SKIP_CONTENT;
1849
7.10k
    } else {
1850
7.10k
      s.context_map_.resize(s.num_contexts * kNumAvrgContexts);
1851
7.10k
      state->context_map = s.context_map_.data();
1852
7.10k
      s.entropy_codes_.resize(s.num_histograms);
1853
7.10k
      state->entropy_codes = s.entropy_codes_.data();
1854
7.10k
      if (s.num_histograms > 1) {
1855
1.21k
        hs.stage = HistogramDataState::READ_CONTEXT_MAP_CODE;
1856
5.88k
      } else {
1857
5.88k
        hs.i = 0;
1858
5.88k
        hs.counts.resize(kCoeffAlphabetSize);
1859
5.88k
        hs.stage = HistogramDataState::READ_HISTOGRAMS;
1860
5.88k
      }
1861
7.10k
    }
1862
7.10k
  }
1863
1864
7.10k
  if (hs.stage == HistogramDataState::SKIP_CONTENT) {
1865
0
    suspend_bit_reader(BRUNSLI_OK);
1866
0
    if (!BrunsliBitReaderIsHealthy(br)) {
1867
0
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1868
0
    }
1869
0
    SkipAvailableBytes(state, RemainingSectionLength(state));
1870
0
    if (!IsAtSectionBoundary(state)) return BRUNSLI_NOT_ENOUGH_DATA;
1871
0
    hs.stage = HistogramDataState::DONE;
1872
0
  }
1873
1874
7.10k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP_CODE) {
1875
1.21k
    if (!BrunsliBitReaderCanRead(br, 207 + s.num_histograms * 8)) {
1876
92
      return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1877
92
    }
1878
1.12k
    hs.max_run_length_prefix = 0;
1879
1.12k
    bool use_rle_for_zeros = !!BrunsliBitReaderRead(br, 1);
1880
1.12k
    if (use_rle_for_zeros) {
1881
399
      hs.max_run_length_prefix = BrunsliBitReaderRead(br, 4) + 1;
1882
399
    }
1883
1.12k
    size_t alphabet_size = s.num_histograms + hs.max_run_length_prefix;
1884
1.12k
    hs.entropy.reset(new HuffmanDecodingData);
1885
1.12k
    if (!hs.entropy->ReadFromBitStream(alphabet_size, br, &hs.arena)) {
1886
314
      return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1887
314
    }
1888
809
    hs.i = 0;
1889
809
    hs.stage = HistogramDataState::READ_CONTEXT_MAP;
1890
809
  }
1891
1892
6.69k
  if (hs.stage == HistogramDataState::READ_CONTEXT_MAP) {
1893
809
    BrunsliStatus status = DecodeContextMap(
1894
809
        *hs.entropy, hs.max_run_length_prefix, &hs.i, &s.context_map_, br);
1895
809
    if (status != BRUNSLI_OK) return suspend_bit_reader(status);
1896
496
    hs.i = 0;
1897
496
    hs.counts.resize(kCoeffAlphabetSize);
1898
496
    hs.stage = HistogramDataState::READ_HISTOGRAMS;
1899
496
  }
1900
1901
6.38k
  if (hs.stage == HistogramDataState::READ_HISTOGRAMS) {
1902
17.8k
    while (hs.i < s.num_histograms) {
1903
11.8k
      if (!BrunsliBitReaderCanRead(br, 9 + kCoeffAlphabetSize * 11)) {
1904
165
        return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA);
1905
165
      }
1906
11.6k
      if (!ReadHistogram(BRUNSLI_ANS_LOG_TAB_SIZE, &hs.counts, br)) {
1907
237
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1908
237
      }
1909
11.4k
      if (!s.entropy_codes_[hs.i].Init(hs.counts)) {
1910
0
        return suspend_bit_reader(BRUNSLI_INVALID_BRN);
1911
0
      }
1912
11.4k
      ++hs.i;
1913
11.4k
    }
1914
5.98k
    hs.entropy.reset();
1915
5.98k
    std::vector<uint32_t>().swap(hs.counts);
1916
5.98k
    suspend_bit_reader(BRUNSLI_OK);
1917
5.98k
    BrunsliBitReaderFinish(br);
1918
5.98k
    if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN;
1919
5.96k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1920
5.91k
    hs.stage = HistogramDataState::DONE;
1921
5.91k
  }
1922
1923
5.91k
  hs.arena.reset();
1924
5.91k
  BRUNSLI_DCHECK(hs.stage == HistogramDataState::DONE);
1925
5.91k
  return BRUNSLI_OK;
1926
6.38k
}
1927
1928
5.88k
static BrunsliStatus DecodeDCDataSection(State* state) {
1929
5.88k
  size_t available = GetBytesAvailable(state) & ~1;
1930
5.88k
  size_t limit = RemainingSectionLength(state);
1931
5.88k
  BRUNSLI_DCHECK((limit & 1) == 0);
1932
5.88k
  size_t chunk_len = std::min(available, limit);
1933
  // If end of section is reachable, then we could parse the remainings in
1934
  // non-streaming mode.
1935
5.88k
  bool is_last_chunk = (chunk_len == limit);
1936
5.88k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1937
1938
5.88k
  BrunsliStatus status = DecodeDC(state, &in);
1939
1940
5.88k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1941
5.88k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1942
5.61k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1943
5.61k
  SkipBytes(state, in.pos_);
1944
5.61k
  if (is_last_chunk) {
1945
5.30k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1946
5.30k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1947
5.30k
  }
1948
5.60k
  return status;
1949
5.61k
}
1950
1951
5.28k
static BrunsliStatus DecodeACDataSection(State* state) {
1952
5.28k
  size_t available = GetBytesAvailable(state) & ~1;
1953
5.28k
  size_t limit = RemainingSectionLength(state);
1954
5.28k
  BRUNSLI_DCHECK((limit & 1) == 0);
1955
5.28k
  size_t chunk_len = std::min(available, limit);
1956
  // If end of section is reachable, then we could parse the remainings in
1957
  // non-streaming mode.
1958
5.28k
  bool is_last_chunk = (chunk_len == limit);
1959
5.28k
  WordSource in(state->data + state->pos, chunk_len, is_last_chunk);
1960
1961
5.28k
  BrunsliStatus status = DecodeAC(state, &in);
1962
1963
5.28k
  BRUNSLI_DCHECK((in.pos_ & 1) == 0);
1964
5.28k
  if (in.error_) return BRUNSLI_INVALID_BRN;
1965
4.69k
  BRUNSLI_DCHECK(in.pos_ <= chunk_len);
1966
4.69k
  SkipBytes(state, in.pos_);
1967
4.69k
  if (is_last_chunk) {
1968
4.48k
    BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA);
1969
4.48k
    if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN;
1970
4.48k
  }
1971
4.62k
  return status;
1972
4.69k
}
1973
1974
356
static Stage DecodeOriginalJpg(State* state, JPEGData* jpg) {
1975
356
  InternalState& s = *state->internal;
1976
356
  FallbackState& fs = s.fallback;
1977
1978
1.03k
  while (fs.stage != FallbackState::DONE) {
1979
981
    switch (fs.stage) {
1980
356
      case FallbackState::READ_TAG: {
1981
356
        BrunsliStatus status = ReadTag(state, &s.section);
1982
356
        if (status != BRUNSLI_OK) return Fail(state, status);
1983
338
        if (s.section.tag != kBrunsliOriginalJpgTag || !s.section.is_section) {
1984
6
          return Fail(state, BRUNSLI_INVALID_BRN);
1985
6
        }
1986
332
        fs.stage = FallbackState::ENTER_SECTION;
1987
332
        break;
1988
338
      }
1989
1990
332
      case FallbackState::ENTER_SECTION: {
1991
332
        BrunsliStatus status = EnterSection(state, &s.section);
1992
332
        if (status != BRUNSLI_OK) return Fail(state, status);
1993
297
        jpg->original_jpg_size = s.section.remaining;
1994
        // Edge case - empty payload.
1995
297
        if (jpg->original_jpg_size == 0) {
1996
4
          jpg->original_jpg = nullptr;
1997
4
          fs.stage = FallbackState::DONE;
1998
4
          break;
1999
4
        }
2000
293
        fs.stage = FallbackState::READ_CONTENTS;
2001
293
        break;
2002
297
      }
2003
2004
293
      case FallbackState::READ_CONTENTS: {
2005
293
        size_t chunk_size = GetBytesAvailable(state);
2006
293
        if (chunk_size == 0) {
2007
          // TODO(eustas): dcheck s.section.remaining != 0
2008
79
          return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2009
79
        }
2010
        // Check if it is possible to avoid copy.
2011
214
        const uint8_t* src = state->data + state->pos;
2012
214
        if (fs.storage.empty()) {
2013
214
          if (chunk_size >= jpg->original_jpg_size) {
2014
53
            jpg->original_jpg = src;
2015
53
            SkipBytes(state, jpg->original_jpg_size);
2016
53
            fs.stage = FallbackState::DONE;
2017
53
            break;
2018
53
          }
2019
214
        }
2020
        // Otherwise, copy input.
2021
161
        size_t remaining = jpg->original_jpg_size - fs.storage.size();
2022
161
        size_t to_copy = std::min(chunk_size, remaining);
2023
161
        fs.storage.insert(fs.storage.cend(), src, src + to_copy);
2024
161
        SkipBytes(state, to_copy);
2025
161
        if (fs.storage.size() == jpg->original_jpg_size) {
2026
0
          jpg->original_jpg = fs.storage.data();
2027
0
          fs.stage = FallbackState::DONE;
2028
0
          break;
2029
0
        }
2030
        // TODO(eustas): dcheck GetBytesAvailable(state) == 0
2031
161
        return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2032
161
      }
2033
2034
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2035
981
    }
2036
981
  }
2037
2038
57
  LeaveSection(&s.section);
2039
57
  return Stage::DONE;
2040
356
}
2041
2042
41.9k
static Stage ParseSection(State* state) {
2043
41.9k
  InternalState& s = *state->internal;
2044
41.9k
  SectionHeaderState& sh = s.section_header;
2045
2046
41.9k
  Stage result = Stage::ERROR;
2047
2048
125k
  while (sh.stage != SectionHeaderState::DONE) {
2049
83.8k
    switch (sh.stage) {
2050
41.9k
      case SectionHeaderState::READ_TAG: {
2051
41.9k
        BrunsliStatus status = ReadTag(state, &s.section);
2052
41.9k
        if (status == BRUNSLI_NOT_ENOUGH_DATA) {
2053
79
          if (HasSection(state, kBrunsliACDataTag)) return Stage::DONE;
2054
79
        }
2055
41.9k
        if (status != BRUNSLI_OK) return Fail(state, status);
2056
41.8k
        if (s.section.is_section) {
2057
41.8k
          sh.stage = SectionHeaderState::ENTER_SECTION;
2058
41.8k
          continue;
2059
41.8k
        }
2060
32
        const uint32_t tag_bit = 1u << s.section.tag;
2061
32
        const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2062
32
        if (is_known_section_tag) return Fail(state, BRUNSLI_INVALID_BRN);
2063
30
        sh.stage = SectionHeaderState::READ_VALUE;
2064
30
        continue;
2065
32
      }
2066
2067
30
      case SectionHeaderState::READ_VALUE: {
2068
        // No known varint tags on top level.
2069
30
        size_t sink;
2070
30
        BrunsliStatus status = DecodeBase128(state, &sink);
2071
30
        if (status != BRUNSLI_OK) return Fail(state, status);
2072
24
        result = Stage::SECTION;
2073
24
        sh.stage = SectionHeaderState::DONE;
2074
24
        continue;
2075
30
      }
2076
2077
41.8k
      case SectionHeaderState::ENTER_SECTION: {
2078
41.8k
        BrunsliStatus status = EnterSection(state, &s.section);
2079
41.8k
        if (status != BRUNSLI_OK) return Fail(state, status);
2080
41.8k
        result = Stage::SECTION_BODY;
2081
41.8k
        sh.stage = SectionHeaderState::DONE;
2082
41.8k
        continue;
2083
41.8k
      }
2084
2085
0
      default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2086
83.8k
    }
2087
83.8k
  }
2088
2089
41.8k
  sh.stage = SectionHeaderState::READ_TAG;
2090
41.8k
  BRUNSLI_DCHECK(result != Stage::ERROR);
2091
41.8k
  return result;
2092
41.9k
}
2093
2094
41.8k
static Stage ProcessSection(State* state, JPEGData* jpg) {
2095
41.8k
  InternalState& s = *state->internal;
2096
2097
41.8k
  const int32_t tag_bit = 1u << s.section.tag;
2098
41.8k
  const bool is_known_section_tag = kKnownSectionTags & tag_bit;
2099
2100
41.8k
  const bool skip_section =
2101
41.8k
      !is_known_section_tag || (state->skip_tags & tag_bit);
2102
2103
41.8k
  if (skip_section) {
2104
    // Skip section content.
2105
159
    size_t to_skip =
2106
159
        std::min(GetBytesAvailable(state), RemainingSectionLength(state));
2107
159
    state->pos += to_skip;
2108
159
    if (RemainingSectionLength(state) != 0) {
2109
122
      BRUNSLI_DCHECK(GetBytesAvailable(state) == 0);
2110
122
      return Fail(state, BRUNSLI_NOT_ENOUGH_DATA);
2111
122
    }
2112
37
    return Stage::SECTION;
2113
159
  }
2114
2115
41.6k
  switch (s.section.tag) {
2116
4.09k
    case kBrunsliMetaDataTag: {
2117
4.09k
      BrunsliStatus status = DecodeMetaDataSection(state, jpg);
2118
4.09k
      if (status != BRUNSLI_OK) return Fail(state, status);
2119
32
      break;
2120
4.09k
    }
2121
2122
11.4k
    case kBrunsliJPEGInternalsTag: {
2123
11.4k
      BrunsliStatus status = DecodeJPEGInternalsSection(state, jpg);
2124
11.4k
      if (status != BRUNSLI_OK) return Fail(state, status);
2125
9.01k
      break;
2126
11.4k
    }
2127
2128
9.01k
    case kBrunsliQuantDataTag: {
2129
7.57k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2130
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2131
1
      }
2132
7.57k
      BrunsliStatus status = DecodeQuantDataSection(state, jpg);
2133
7.57k
      if (status != BRUNSLI_OK) return Fail(state, status);
2134
5.92k
      break;
2135
7.57k
    }
2136
2137
7.35k
    case kBrunsliHistogramDataTag: {
2138
7.35k
      if (!HasSection(state, kBrunsliJPEGInternalsTag)) {
2139
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2140
1
      }
2141
7.35k
      BrunsliStatus status = DecodeHistogramDataSection(state, jpg);
2142
7.35k
      if (status != BRUNSLI_OK) return Fail(state, status);
2143
5.91k
      break;
2144
7.35k
    }
2145
2146
5.91k
    case kBrunsliDCDataTag: {
2147
5.89k
      if (!HasSection(state, kBrunsliHistogramDataTag)) {
2148
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2149
1
      }
2150
5.89k
      if (!HasSection(state, kBrunsliQuantDataTag)) {
2151
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2152
1
      }
2153
      // This section reads input word by word.
2154
5.89k
      if ((RemainingSectionLength(state) & 1) != 0) {
2155
8
        return Fail(state, BRUNSLI_INVALID_BRN);
2156
8
      }
2157
5.88k
      internal::dec::WarmupMeta(jpg, state);
2158
5.88k
      BrunsliStatus status = DecodeDCDataSection(state);
2159
5.88k
      if (status != BRUNSLI_OK) return Fail(state, status);
2160
5.34k
      break;
2161
5.88k
    }
2162
2163
5.34k
    case kBrunsliACDataTag: {
2164
5.28k
      if (!HasSection(state, kBrunsliDCDataTag)) {
2165
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2166
1
      }
2167
      // This section reads input word by word.
2168
5.28k
      if ((RemainingSectionLength(state) & 1) != 0) {
2169
1
        return Fail(state, BRUNSLI_INVALID_BRN);
2170
1
      }
2171
5.28k
      internal::dec::WarmupMeta(jpg, state);
2172
5.28k
      BrunsliStatus status = DecodeACDataSection(state);
2173
5.28k
      if (status != BRUNSLI_OK) return Fail(state, status);
2174
4.37k
      break;
2175
5.28k
    }
2176
2177
4.37k
    default:
2178
      /* Unreachable */
2179
0
      return Fail(state, BRUNSLI_INVALID_BRN);
2180
41.6k
  }
2181
2182
30.6k
  if (!IsAtSectionBoundary(state)) {
2183
59
    return Fail(state, BRUNSLI_INVALID_BRN);
2184
59
  }
2185
2186
  // Nothing is expected after the AC data.
2187
30.5k
  if (s.section.tag == kBrunsliACDataTag) {
2188
4.37k
    return Stage::DONE;
2189
4.37k
  }
2190
2191
26.1k
  return Stage::SECTION;
2192
30.5k
}
2193
2194
namespace internal {
2195
namespace dec {
2196
2197
15.7k
bool UpdateSubsamplingDerivatives(JPEGData* jpg) {
2198
42.6k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2199
26.9k
    JPEGComponent* c = &jpg->components[i];
2200
26.9k
    jpg->max_h_samp_factor = std::max(jpg->max_h_samp_factor, c->h_samp_factor);
2201
26.9k
    jpg->max_v_samp_factor = std::max(jpg->max_v_samp_factor, c->v_samp_factor);
2202
26.9k
  }
2203
15.7k
  jpg->MCU_rows = DivCeil(jpg->height, jpg->max_v_samp_factor * 8);
2204
15.7k
  jpg->MCU_cols = DivCeil(jpg->width, jpg->max_h_samp_factor * 8);
2205
42.6k
  for (size_t i = 0; i < jpg->components.size(); ++i) {
2206
26.9k
    JPEGComponent* c = &jpg->components[i];
2207
26.9k
    c->width_in_blocks = jpg->MCU_cols * c->h_samp_factor;
2208
26.9k
    c->height_in_blocks = jpg->MCU_rows * c->v_samp_factor;
2209
    // 8205 == max[ceil((65535 / (i * 8)) * i) for i in range(1, 16 + 1)]
2210
26.9k
    BRUNSLI_DCHECK(c->width_in_blocks <= 8205);
2211
26.9k
    BRUNSLI_DCHECK(c->height_in_blocks <= 8205);
2212
26.9k
    uint32_t num_blocks = c->width_in_blocks * c->height_in_blocks;
2213
26.9k
    if (num_blocks > kBrunsliMaxNumBlocks) {
2214
1
      return false;
2215
1
    }
2216
26.9k
    c->num_blocks = num_blocks;
2217
26.9k
  }
2218
15.7k
  return true;
2219
15.7k
}
2220
2221
15.7k
void PrepareMeta(const JPEGData* jpg, State* state) {
2222
15.7k
  InternalState& s = *state->internal;
2223
2224
15.7k
  size_t num_components = jpg->components.size();
2225
15.7k
  s.block_state_.resize(num_components);
2226
15.7k
  std::vector<ComponentMeta>& meta = state->meta;
2227
15.7k
  meta.resize(num_components);
2228
42.6k
  for (size_t i = 0; i < num_components; ++i) {
2229
26.9k
    const JPEGComponent& c = jpg->components[i];
2230
26.9k
    ComponentMeta& m = meta[i];
2231
26.9k
    m.h_samp = c.h_samp_factor;
2232
26.9k
    m.v_samp = c.v_samp_factor;
2233
26.9k
    m.width_in_blocks = jpg->MCU_cols * m.h_samp;
2234
26.9k
    m.height_in_blocks = jpg->MCU_rows * m.v_samp;
2235
26.9k
  }
2236
15.7k
}
2237
2238
11.1k
void WarmupMeta(JPEGData* jpg, State* state) {
2239
11.1k
  InternalState& s = *state->internal;
2240
11.1k
  std::vector<ComponentMeta>& meta = state->meta;
2241
11.1k
  const size_t num_components = meta.size();
2242
2243
11.1k
  if (!state->is_storage_allocated) {
2244
5.88k
    state->is_storage_allocated = true;
2245
12.4k
    for (size_t i = 0; i < num_components; ++i) {
2246
6.51k
      size_t num_blocks = meta[i].width_in_blocks * meta[i].height_in_blocks;
2247
6.51k
      jpg->components[i].coeffs.resize(num_blocks * kDCTBlockSize);
2248
6.51k
      s.block_state_[i].resize(num_blocks);
2249
6.51k
      meta[i].block_state = s.block_state_[i].data();
2250
6.51k
    }
2251
5.88k
  }
2252
2253
11.1k
  if (!s.is_meta_warm) {
2254
5.88k
    s.is_meta_warm = true;
2255
12.4k
    for (size_t c = 0; c < num_components; ++c) {
2256
6.51k
      ComponentMeta& m = meta[c];
2257
6.51k
      const JPEGQuantTable& q = jpg->quant[jpg->components[c].quant_idx];
2258
6.51k
      m.ac_coeffs = jpg->components[c].coeffs.data();
2259
6.51k
      m.ac_stride = m.width_in_blocks * kDCTBlockSize;
2260
6.51k
      m.b_stride = m.width_in_blocks;
2261
6.51k
      memcpy(m.quant.data(), q.values.data(),
2262
6.51k
             kDCTBlockSize * sizeof(m.quant[0]));
2263
6.51k
    }
2264
5.88k
  }
2265
11.1k
}
2266
2267
16.8k
BrunsliStatus DoProcessJpeg(State* state, JPEGData* jpg) {
2268
134k
  while (true) {
2269
134k
    switch (state->stage) {
2270
16.8k
      case Stage::SIGNATURE:
2271
16.8k
        state->stage = VerifySignature(state);
2272
16.8k
        break;
2273
2274
16.7k
      case Stage::HEADER:
2275
16.7k
        state->stage = DecodeHeader(state, jpg);
2276
16.7k
        break;
2277
2278
356
      case Stage::FALLBACK:
2279
356
        state->stage = DecodeOriginalJpg(state, jpg);
2280
356
        break;
2281
2282
41.9k
      case Stage::SECTION:
2283
41.9k
        state->stage = ParseSection(state);
2284
41.9k
        break;
2285
2286
41.8k
      case Stage::SECTION_BODY:
2287
41.8k
        state->stage = ProcessSection(state, jpg);
2288
41.8k
        break;
2289
2290
4.43k
      case Stage::DONE:
2291
        // It is expected that there is no garbage after the valid brunsli
2292
        // stream.
2293
4.43k
        if (state->pos != state->len) {
2294
44
          state->stage = Fail(state, BRUNSLI_INVALID_BRN);
2295
44
          break;
2296
44
        }
2297
4.39k
        return BRUNSLI_OK;
2298
2299
12.4k
      case Stage::ERROR:
2300
12.4k
        return state->internal->result;
2301
2302
0
      default:
2303
        /* Unreachable */
2304
0
        state->stage = Fail(state, BRUNSLI_DECOMPRESSION_ERROR);
2305
0
        break;
2306
134k
    }
2307
134k
  }
2308
16.8k
}
2309
2310
/** Adds new input to buffer. */
2311
16.8k
void ChargeBuffer(State* state) {
2312
16.8k
  InternalState& s = *state->internal;
2313
16.8k
  Buffer& b = s.buffer;
2314
2315
16.8k
  b.borrowed_len = 0;
2316
16.8k
  b.external_data = state->data;
2317
16.8k
  b.external_pos = state->pos;
2318
16.8k
  b.external_len = state->len;
2319
16.8k
}
2320
2321
constexpr size_t kBufferMaxReadAhead = 600;
2322
2323
/** Sets input source either to buffered, or to external data. */
2324
16.8k
void LoadInput(State* state) {
2325
16.8k
  InternalState& s = *state->internal;
2326
16.8k
  Buffer& b = s.buffer;
2327
2328
  // No data buffered. Just pass external data as is.
2329
16.8k
  if (b.data_len == 0) {
2330
16.8k
    state->data = b.external_data;
2331
16.8k
    state->pos = b.external_pos;
2332
16.8k
    state->len = b.external_len;
2333
16.8k
    return;
2334
16.8k
  }
2335
2336
0
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2337
2338
  // Otherwise use buffered data.
2339
0
  size_t available = b.external_len - b.external_pos;
2340
  // Always try to borrow as much as parser could require. This way, when
2341
  // buffer is unable to provide enough input, we could switch to unbuffered
2342
  // input.
2343
0
  b.borrowed_len = std::min(kBufferMaxReadAhead, available);
2344
0
  memcpy(b.data.data() + b.data_len, b.external_data + b.external_pos,
2345
0
         b.borrowed_len);
2346
0
  state->data = b.data.data();
2347
0
  state->pos = 0;
2348
0
  state->len = b.data_len + b.borrowed_len;
2349
0
}
2350
2351
/**
2352
 * Cancel borrowed bytes, if any.
2353
 *
2354
 * Returns false, if it is impossible to continue parsing.
2355
 */
2356
16.8k
bool UnloadInput(State* state, BrunsliStatus result) {
2357
16.8k
  InternalState& s = *state->internal;
2358
16.8k
  Buffer& b = s.buffer;
2359
2360
  // Non-buffered input; put tail to buffer.
2361
16.8k
  if (state->data == b.external_data) {
2362
16.8k
    b.external_pos = state->pos;
2363
16.8k
    BRUNSLI_DCHECK(b.external_pos <= b.external_len);
2364
16.8k
    if (result != BRUNSLI_NOT_ENOUGH_DATA) return true;
2365
6.12k
    BRUNSLI_DCHECK(b.data_len == 0);
2366
6.12k
    size_t available = b.external_len - b.external_pos;
2367
6.12k
    BRUNSLI_DCHECK(available < kBufferMaxReadAhead);
2368
6.12k
    if (b.data.empty()) b.data.resize(2 * kBufferMaxReadAhead);
2369
6.12k
    b.data_len = available;
2370
6.12k
    memcpy(b.data.data(), b.external_data + b.external_pos, b.data_len);
2371
6.12k
    b.external_pos += available;
2372
6.12k
    return false;
2373
16.8k
  }
2374
2375
  // Buffer depleted; switch to non-buffered input.
2376
0
  if (state->pos >= b.data_len) {
2377
0
    size_t used_borrowed_bytes = state->pos - b.data_len;
2378
0
    b.data_len = 0;
2379
0
    b.external_pos += used_borrowed_bytes;
2380
0
    return true;
2381
0
  }
2382
2383
  // Buffer not depleted; either problem discovered was already buffered data,
2384
  // or extra input was too-short.
2385
0
  b.data_len -= state->pos;
2386
0
  if (result == BRUNSLI_NOT_ENOUGH_DATA) {
2387
    // We couldn't have taken more bytes.
2388
0
    BRUNSLI_DCHECK(b.external_pos + b.borrowed_len == b.external_len);
2389
    // Remaining piece is not too large.
2390
0
    BRUNSLI_DCHECK(b.data_len + b.borrowed_len < kBufferMaxReadAhead);
2391
0
    b.data_len += b.borrowed_len;
2392
0
    b.external_pos += b.borrowed_len;
2393
0
  }
2394
0
  BRUNSLI_DCHECK(!b.data.empty());
2395
0
  if (state->pos > 0 && b.data_len > 0) {
2396
0
    memmove(b.data.data(), b.data.data() + state->pos, b.data_len);
2397
0
  }
2398
0
  BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead);
2399
2400
0
  return (result != BRUNSLI_NOT_ENOUGH_DATA);
2401
0
}
2402
2403
/** Sets back user-provided input. */
2404
16.8k
void UnchargeBuffer(State* state) {
2405
16.8k
  InternalState& s = *state->internal;
2406
16.8k
  Buffer& b = s.buffer;
2407
2408
16.8k
  state->data = b.external_data;
2409
16.8k
  state->pos = b.external_pos;
2410
16.8k
  state->len = b.external_len;
2411
16.8k
}
2412
2413
16.8k
BrunsliStatus ProcessJpeg(State* state, JPEGData* jpg) {
2414
16.8k
  InternalState& s = *state->internal;
2415
2416
16.8k
  if (state->pos > state->len) return BRUNSLI_INVALID_PARAM;
2417
16.8k
  ChargeBuffer(state);
2418
2419
16.8k
  BrunsliStatus result = BRUNSLI_NOT_ENOUGH_DATA;
2420
27.4k
  while (result == BRUNSLI_NOT_ENOUGH_DATA) {
2421
16.8k
    if (state->stage == Stage::ERROR) {
2422
      // General error -> no recovery.
2423
0
      if (s.result != BRUNSLI_NOT_ENOUGH_DATA) return s.result;
2424
      // Continue parsing.
2425
0
      s.result = BRUNSLI_OK;
2426
0
      state->stage = s.last_stage;
2427
0
      s.last_stage = Stage::ERROR;
2428
0
    }
2429
2430
16.8k
    LoadInput(state);
2431
16.8k
    if (s.section.is_active) {
2432
0
      s.section.milestone = state->pos;
2433
0
      s.section.projected_end = s.section.milestone + s.section.remaining;
2434
0
    }
2435
2436
16.8k
    s.section.tags_met |= state->tags_met;
2437
16.8k
    result = DoProcessJpeg(state, jpg);
2438
2439
16.8k
    if (s.section.is_active) {
2440
      // TODO(eustas): dcheck state->pos > s.section.milestone
2441
16.4k
      size_t processed_len = state->pos - s.section.milestone;
2442
      // TODO(eustas): dcheck processed_len < s.section.remaining
2443
16.4k
      s.section.remaining -= processed_len;
2444
16.4k
    }
2445
2446
16.8k
    if (!UnloadInput(state, result)) break;
2447
16.8k
  }
2448
16.8k
  UnchargeBuffer(state);
2449
16.8k
  return result;
2450
16.8k
}
2451
2452
}  // namespace dec
2453
}  // namespace internal
2454
2455
BrunsliStatus BrunsliDecodeJpeg(const uint8_t* data, const size_t len,
2456
16.8k
                                JPEGData* jpg) {
2457
16.8k
  if (!data) return BRUNSLI_INVALID_PARAM;
2458
2459
16.8k
  State state;
2460
16.8k
  state.data = data;
2461
16.8k
  state.len = len;
2462
2463
16.8k
  return internal::dec::ProcessJpeg(&state, jpg);
2464
16.8k
}
2465
2466
size_t BrunsliEstimateDecoderPeakMemoryUsage(const uint8_t* data,
2467
0
                                             const size_t len) {
2468
0
  if (!data) return BRUNSLI_INVALID_PARAM;
2469
2470
0
  State state;
2471
0
  state.data = data;
2472
0
  state.len = len;
2473
0
  state.skip_tags = ~(1u << kBrunsliHistogramDataTag);
2474
0
  InternalState& s = *state.internal;
2475
0
  s.shallow_histograms = true;
2476
2477
0
  JPEGData jpg;
2478
0
  BrunsliStatus status = internal::dec::ProcessJpeg(&state, &jpg);
2479
2480
0
  if (status != BRUNSLI_OK) return 0;
2481
2482
0
  size_t out_size = 2 * len;
2483
0
  size_t total_num_blocks = 0;
2484
0
  size_t component_state_size = 0;
2485
0
  for (size_t i = 0; i < jpg.components.size(); ++i) {
2486
0
    const JPEGComponent& c = jpg.components[i];
2487
0
    total_num_blocks += c.num_blocks;
2488
0
    component_state_size += ComponentState::SizeInBytes(c.width_in_blocks);
2489
0
  }
2490
0
  size_t jpeg_data_size = total_num_blocks * kDCTBlockSize * sizeof(coeff_t);
2491
0
  size_t context_map_size = s.num_contexts * kNumAvrgContexts * sizeof(int32_t);
2492
0
  size_t histogram_size = s.num_histograms * sizeof(ANSDecodingData);
2493
0
  size_t decode_peak = context_map_size + histogram_size + component_state_size;
2494
0
  size_t jpeg_writer_size = (1u << 17u) + (1u << 16u) * sizeof(int32_t);
2495
0
  return (out_size + jpeg_data_size + std::max(decode_peak, jpeg_writer_size));
2496
0
}
2497
2498
0
BrunsliDecoder::BrunsliDecoder() {
2499
0
  jpg_.reset(new JPEGData);
2500
0
  state_.reset(new State);
2501
0
}
2502
2503
0
BrunsliDecoder::~BrunsliDecoder() {}
2504
2505
BrunsliDecoder::Status BrunsliDecoder::Decode(size_t* available_in,
2506
                                              const uint8_t** next_in,
2507
                                              size_t* available_out,
2508
0
                                              uint8_t** next_out) {
2509
0
  JPEGData* jpg = jpg_.get();
2510
0
  BRUNSLI_DCHECK(jpg);
2511
0
  State* state = state_.get();
2512
0
  BRUNSLI_DCHECK(state);
2513
2514
0
  state->data = *next_in;
2515
0
  state->pos = 0;
2516
0
  state->len = *available_in;
2517
0
  BrunsliStatus parse_status = internal::dec::ProcessJpeg(state, jpg);
2518
0
  size_t consumed_bytes = state->pos;
2519
0
  *available_in -= consumed_bytes;
2520
0
  *next_in += consumed_bytes;
2521
2522
0
  if ((parse_status != BRUNSLI_OK) &&
2523
0
      (parse_status != BRUNSLI_NOT_ENOUGH_DATA)) {
2524
0
    return BrunsliDecoder::ERROR;
2525
0
  }
2526
2527
  // All the input given input should be consumed.
2528
0
  BRUNSLI_DCHECK(*available_in == 0);
2529
2530
0
  SerializationStatus serialization_status =
2531
0
      SerializeJpeg(state, *jpg, available_out, next_out);
2532
0
  if (serialization_status == SerializationStatus::ERROR) {
2533
0
    return BrunsliDecoder::ERROR;
2534
0
  }
2535
2536
0
  switch (serialization_status) {
2537
0
    case SerializationStatus::DONE:
2538
      // Should be impossible to finish serialization without finishing parsing.
2539
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_OK);
2540
0
      return BrunsliDecoder::DONE;
2541
2542
0
    case SerializationStatus::NEEDS_MORE_INPUT:
2543
      // If serializer says that data is incomplete, parser should say the same.
2544
0
      BRUNSLI_DCHECK(parse_status == BRUNSLI_NOT_ENOUGH_DATA);
2545
0
      return BrunsliDecoder::NEEDS_MORE_INPUT;
2546
2547
0
    case SerializationStatus::NEEDS_MORE_OUTPUT:
2548
      // TODO(eustas): make sure that serializer could produce more bytes
2549
      //               without providing more bytes to parser
2550
0
      BRUNSLI_DCHECK(*available_out == 0);
2551
0
      return BrunsliDecoder::NEEDS_MORE_OUTPUT;
2552
2553
0
    case SerializationStatus::ERROR:
2554
0
      return BrunsliDecoder::ERROR;
2555
2556
0
    default:
2557
      /* Unreachable */
2558
0
      BRUNSLI_DCHECK(false);
2559
0
      return BrunsliDecoder::ERROR;
2560
0
  }
2561
0
}
2562
2563
}  // namespace brunsli