/src/brunsli/c/dec/brunsli_decode.cc
Line | Count | Source (jump to first uncovered line) |
1 | | // Copyright (c) Google LLC 2019 |
2 | | // |
3 | | // Use of this source code is governed by an MIT-style |
4 | | // license that can be found in the LICENSE file or at |
5 | | // https://opensource.org/licenses/MIT. |
6 | | |
7 | | #include <brunsli/brunsli_decode.h> |
8 | | |
9 | | #include <algorithm> |
10 | | #include <cstdlib> |
11 | | #include <cstring> |
12 | | #include <iterator> |
13 | | #include <string> |
14 | | #include <vector> |
15 | | |
16 | | #include <brotli/decode.h> |
17 | | #include "../common/constants.h" |
18 | | #include "../common/context.h" |
19 | | #include <brunsli/jpeg_data.h> |
20 | | #include "../common/lehmer_code.h" |
21 | | #include "../common/platform.h" |
22 | | #include "../common/predict.h" |
23 | | #include "../common/quant_matrix.h" |
24 | | #include <brunsli/status.h> |
25 | | #include <brunsli/types.h> |
26 | | #include "./ans_decode.h" |
27 | | #include "./arith_decode.h" |
28 | | #include "./bit_reader.h" |
29 | | #include "./brunsli_input.h" |
30 | | #include "./context_map_decode.h" |
31 | | #include "./histogram_decode.h" |
32 | | #include "./huffman_table.h" |
33 | | #include <brunsli/jpeg_data_writer.h> |
34 | | #include "./state.h" |
35 | | #include "./state_internal.h" |
36 | | |
37 | | namespace brunsli { |
38 | | |
39 | | using ::brunsli::internal::dec::AcDcState; |
40 | | using ::brunsli::internal::dec::BlockI32; |
41 | | using ::brunsli::internal::dec::Buffer; |
42 | | using ::brunsli::internal::dec::ComponentMeta; |
43 | | using ::brunsli::internal::dec::FallbackState; |
44 | | using ::brunsli::internal::dec::HeaderState; |
45 | | using ::brunsli::internal::dec::HistogramDataState; |
46 | | using ::brunsli::internal::dec::InternalState; |
47 | | using ::brunsli::internal::dec::JpegInternalsState; |
48 | | using ::brunsli::internal::dec::MetadataDecompressionStage; |
49 | | using ::brunsli::internal::dec::MetadataState; |
50 | | using ::brunsli::internal::dec::PrepareMeta; |
51 | | using ::brunsli::internal::dec::QuantDataState; |
52 | | using ::brunsli::internal::dec::SectionHeaderState; |
53 | | using ::brunsli::internal::dec::SectionState; |
54 | | using ::brunsli::internal::dec::SerializationStatus; |
55 | | using ::brunsli::internal::dec::Stage; |
56 | | using ::brunsli::internal::dec::State; |
57 | | using ::brunsli::internal::dec::UpdateSubsamplingDerivatives; |
58 | | using ::brunsli::internal::dec::VarintState; |
59 | | |
60 | | static const int kNumDirectCodes = 8; |
61 | | static const int kCoeffAlphabetSize = kNumDirectCodes + 10; |
62 | | |
63 | | static const uint32_t kKnownSectionTags = |
64 | | (1u << kBrunsliSignatureTag) | (1u << kBrunsliHeaderTag) | |
65 | | (1u << kBrunsliMetaDataTag) | (1u << kBrunsliJPEGInternalsTag) | |
66 | | (1u << kBrunsliQuantDataTag) | (1u << kBrunsliHistogramDataTag) | |
67 | | (1u << kBrunsliDCDataTag) | (1u << kBrunsliACDataTag) | |
68 | | (1u << kBrunsliOriginalJpgTag); |
69 | | |
70 | | static const uint32_t kKnownHeaderVarintTags = |
71 | | (1u << kBrunsliHeaderWidthTag) | (1u << kBrunsliHeaderHeightTag) | |
72 | | (1u << kBrunsliHeaderVersionCompTag) | (1u << kBrunsliHeaderSubsamplingTag); |
73 | | |
74 | 0 | bool IsBrunsli(const uint8_t* data, const size_t len) { |
75 | 0 | static const uint8_t kSignature[6] = { |
76 | 0 | /* marker */ 0x0A, |
77 | 0 | /* length */ 0x04, 0x42, 0xD2, 0xD5, 0x4E}; |
78 | 0 | static const size_t kSignatureLen = sizeof(kSignature); |
79 | 0 | if (len < kSignatureLen) return false; |
80 | 0 | return (memcmp(kSignature, data, kSignatureLen) == 0); |
81 | 0 | } |
82 | | |
83 | | // Returns ceil(a/b). |
84 | 60.8k | inline int DivCeil(int a, int b) { return (a + b - 1) / b; } |
85 | | |
86 | | // Decodes a number in the range [0..255], by reading 1 - 11 bits. |
87 | 13.9k | inline uint32_t DecodeVarLenUint8(BrunsliBitReader* br) { |
88 | 13.9k | if (BrunsliBitReaderRead(br, 1)) { |
89 | 2.56k | uint32_t nbits = BrunsliBitReaderRead(br, 3); |
90 | 2.56k | if (nbits == 0) { |
91 | 1.22k | return 1u; |
92 | 1.34k | } else { |
93 | 1.34k | return BrunsliBitReaderRead(br, nbits) + (1u << nbits); |
94 | 1.34k | } |
95 | 2.56k | } |
96 | 11.4k | return 0; |
97 | 13.9k | } |
98 | | |
99 | 11.2M | bool DecodeVarint(VarintState* s, BrunsliBitReader* br, size_t max_bits) { |
100 | 11.2M | if (s->stage == VarintState::INIT) { |
101 | 10.4M | s->value = 0; |
102 | 10.4M | s->i = 0; |
103 | 10.4M | s->stage = VarintState::READ_CONTINUATION; |
104 | 10.4M | } |
105 | | |
106 | 25.3M | while (true) { |
107 | 25.3M | switch (s->stage) { |
108 | 18.2M | case VarintState::READ_CONTINUATION: { |
109 | 18.2M | if (s->i >= max_bits) { |
110 | 1.75k | s->stage = VarintState::INIT; |
111 | 1.75k | return true; |
112 | 1.75k | } |
113 | 18.2M | if (s->i + 1 != max_bits) { |
114 | 18.2M | if (!BrunsliBitReaderCanRead(br, 1)) return false; |
115 | 17.5M | if (!BrunsliBitReaderRead(br, 1)) { |
116 | 10.4M | s->stage = VarintState::INIT; |
117 | 10.4M | return true; |
118 | 10.4M | } |
119 | 17.5M | } |
120 | 7.07M | s->stage = VarintState::READ_DATA; |
121 | 7.07M | continue; |
122 | 18.2M | } |
123 | 7.08M | case VarintState::READ_DATA: { |
124 | 7.08M | if (!BrunsliBitReaderCanRead(br, 1)) return false; |
125 | 7.07M | size_t next_bit = BrunsliBitReaderRead(br, 1); |
126 | 7.07M | s->value |= next_bit << s->i; |
127 | 7.07M | ++s->i; |
128 | 7.07M | s->stage = VarintState::READ_CONTINUATION; |
129 | 7.07M | continue; |
130 | 7.08M | } |
131 | 0 | default: { |
132 | 0 | BRUNSLI_CHECK(false); |
133 | 0 | return false; |
134 | 7.08M | } |
135 | 25.3M | } |
136 | 25.3M | } |
137 | 11.2M | } |
138 | | |
139 | | template <size_t kChunkSize> |
140 | | bool DecodeLimitedVarint(VarintState* s, BrunsliBitReader* br, |
141 | 162k | size_t max_symbols) { |
142 | 162k | if (s->stage == VarintState::INIT) { |
143 | 147k | s->value = 0; |
144 | 147k | s->i = 0; |
145 | 147k | s->stage = VarintState::READ_CONTINUATION; |
146 | 147k | } |
147 | 243k | while (true) { |
148 | 243k | switch (s->stage) { |
149 | 198k | case VarintState::READ_CONTINUATION: { |
150 | 198k | if (s->i < max_symbols) { |
151 | 193k | if (!BrunsliBitReaderCanRead(br, 1)) return false; |
152 | 183k | if (BrunsliBitReaderRead(br, 1)) { |
153 | 40.3k | s->stage = VarintState::READ_DATA; |
154 | 40.3k | continue; |
155 | 40.3k | } |
156 | 183k | } |
157 | 147k | s->stage = VarintState::INIT; |
158 | 147k | return true; |
159 | 198k | } |
160 | 45.4k | case VarintState::READ_DATA: { |
161 | 45.4k | if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false; |
162 | 40.2k | size_t next_bits = BrunsliBitReaderRead(br, kChunkSize); |
163 | 40.2k | s->value |= next_bits << (s->i * kChunkSize); |
164 | 40.2k | ++s->i; |
165 | 40.2k | s->stage = VarintState::READ_CONTINUATION; |
166 | 40.2k | continue; |
167 | 45.4k | } |
168 | 0 | default: { |
169 | 0 | BRUNSLI_CHECK(false); |
170 | 0 | return false; |
171 | 45.4k | } |
172 | 243k | } |
173 | 243k | } |
174 | 162k | } bool brunsli::DecodeLimitedVarint<2ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long) Line | Count | Source | 141 | 143k | size_t max_symbols) { | 142 | 143k | if (s->stage == VarintState::INIT) { | 143 | 128k | s->value = 0; | 144 | 128k | s->i = 0; | 145 | 128k | s->stage = VarintState::READ_CONTINUATION; | 146 | 128k | } | 147 | 220k | while (true) { | 148 | 220k | switch (s->stage) { | 149 | 177k | case VarintState::READ_CONTINUATION: { | 150 | 177k | if (s->i < max_symbols) { | 151 | 173k | if (!BrunsliBitReaderCanRead(br, 1)) return false; | 152 | 163k | if (BrunsliBitReaderRead(br, 1)) { | 153 | 38.5k | s->stage = VarintState::READ_DATA; | 154 | 38.5k | continue; | 155 | 38.5k | } | 156 | 163k | } | 157 | 128k | s->stage = VarintState::INIT; | 158 | 128k | return true; | 159 | 177k | } | 160 | 42.9k | case VarintState::READ_DATA: { | 161 | 42.9k | if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false; | 162 | 38.5k | size_t next_bits = BrunsliBitReaderRead(br, kChunkSize); | 163 | 38.5k | s->value |= next_bits << (s->i * kChunkSize); | 164 | 38.5k | ++s->i; | 165 | 38.5k | s->stage = VarintState::READ_CONTINUATION; | 166 | 38.5k | continue; | 167 | 42.9k | } | 168 | 0 | default: { | 169 | 0 | BRUNSLI_CHECK(false); | 170 | 0 | return false; | 171 | 42.9k | } | 172 | 220k | } | 173 | 220k | } | 174 | 143k | } |
bool brunsli::DecodeLimitedVarint<8ul>(brunsli::internal::dec::VarintState*, brunsli::BrunsliBitReader*, unsigned long) Line | Count | Source | 141 | 19.7k | size_t max_symbols) { | 142 | 19.7k | if (s->stage == VarintState::INIT) { | 143 | 18.9k | s->value = 0; | 144 | 18.9k | s->i = 0; | 145 | 18.9k | s->stage = VarintState::READ_CONTINUATION; | 146 | 18.9k | } | 147 | 23.1k | while (true) { | 148 | 23.1k | switch (s->stage) { | 149 | 20.6k | case VarintState::READ_CONTINUATION: { | 150 | 20.6k | if (s->i < max_symbols) { | 151 | 20.5k | if (!BrunsliBitReaderCanRead(br, 1)) return false; | 152 | 20.5k | if (BrunsliBitReaderRead(br, 1)) { | 153 | 1.79k | s->stage = VarintState::READ_DATA; | 154 | 1.79k | continue; | 155 | 1.79k | } | 156 | 20.5k | } | 157 | 18.7k | s->stage = VarintState::INIT; | 158 | 18.7k | return true; | 159 | 20.6k | } | 160 | 2.55k | case VarintState::READ_DATA: { | 161 | 2.55k | if (!BrunsliBitReaderCanRead(br, kChunkSize)) return false; | 162 | 1.66k | size_t next_bits = BrunsliBitReaderRead(br, kChunkSize); | 163 | 1.66k | s->value |= next_bits << (s->i * kChunkSize); | 164 | 1.66k | ++s->i; | 165 | 1.66k | s->stage = VarintState::READ_CONTINUATION; | 166 | 1.66k | continue; | 167 | 2.55k | } | 168 | 0 | default: { | 169 | 0 | BRUNSLI_CHECK(false); | 170 | 0 | return false; | 171 | 2.55k | } | 172 | 23.1k | } | 173 | 23.1k | } | 174 | 19.7k | } |
|
175 | | |
176 | 38.3k | std::vector<uint8_t> GenerateApp0Marker(uint8_t app0_status) { |
177 | 38.3k | std::vector<uint8_t> app0_marker(AppData_0xe0, AppData_0xe0 + 17); |
178 | 38.3k | app0_marker[9] = app0_status & 1u ? 2 : 1; |
179 | 38.3k | app0_status >>= 1u; |
180 | 38.3k | app0_marker[10] = app0_status & 0x3u; |
181 | 38.3k | app0_status >>= 2u; |
182 | 38.3k | uint16_t x_dens = kApp0Densities[app0_status]; |
183 | 38.3k | app0_marker[11] = app0_marker[13] = x_dens >> 8u; |
184 | 38.3k | app0_marker[12] = app0_marker[14] = x_dens & 0xFFu; |
185 | 38.3k | return app0_marker; |
186 | 38.3k | } |
187 | | |
188 | 14.0k | std::vector<uint8_t> GenerateAppMarker(uint8_t marker, uint8_t code) { |
189 | 14.0k | std::vector<uint8_t> s; |
190 | 14.0k | if (marker == 0x80) { |
191 | 5.13k | s = std::vector<uint8_t>(AppData_0xe2, AppData_0xe2 + 3161); |
192 | 5.13k | s[84] = code; |
193 | 8.86k | } else if (marker == 0x81) { |
194 | 3.36k | s = std::vector<uint8_t>(AppData_0xec, AppData_0xec + 18); |
195 | 3.36k | s[15] = code; |
196 | 5.50k | } else { |
197 | 5.50k | BRUNSLI_DCHECK(marker == 0x82); |
198 | 5.50k | s = std::vector<uint8_t>(AppData_0xee, AppData_0xee + 15); |
199 | 5.50k | s[10] = code; |
200 | 5.50k | } |
201 | 14.0k | return s; |
202 | 14.0k | } |
203 | | |
204 | | bool ProcessMetaData(const uint8_t* data, size_t len, MetadataState* state, |
205 | 830k | JPEGData* jpg) { |
206 | 830k | size_t pos = 0; |
207 | 1.75M | while (pos < len) { |
208 | 922k | switch (state->stage) { |
209 | 103k | case MetadataState::READ_MARKER: { |
210 | 103k | state->marker = static_cast<uint8_t>(data[pos++]); |
211 | 103k | if (state->marker == 0xD9) { |
212 | 357 | jpg->tail_data = std::vector<uint8_t>(); |
213 | 357 | state->stage = MetadataState::READ_TAIL; |
214 | 357 | continue; |
215 | 103k | } else if (state->marker < 0x40) { |
216 | 38.3k | state->short_marker_count++; |
217 | 38.3k | if (state->short_marker_count > kBrunsliShortMarkerLimit) { |
218 | 16 | return false; |
219 | 16 | } |
220 | 38.3k | jpg->app_data.push_back(GenerateApp0Marker(state->marker)); |
221 | 38.3k | continue; |
222 | 65.2k | } else if (state->marker >= 0x80 && state->marker <= 0x82) { |
223 | 14.0k | state->short_marker_count++; |
224 | 14.0k | if (state->short_marker_count > kBrunsliShortMarkerLimit) { |
225 | 5 | return false; |
226 | 5 | } |
227 | 14.0k | state->stage = MetadataState::READ_CODE; |
228 | 14.0k | continue; |
229 | 14.0k | } |
230 | | // Otherwise - mutlibyte sequence. |
231 | 51.1k | if ((state->marker != 0xFE) && ((state->marker >> 4u) != 0x0E)) { |
232 | 233 | return false; |
233 | 233 | } |
234 | 50.9k | state->stage = MetadataState::READ_LENGTH_HI; |
235 | 50.9k | continue; |
236 | 51.1k | } |
237 | | |
238 | 158k | case MetadataState::READ_TAIL: { |
239 | 158k | Append(&jpg->tail_data, data + pos, data + len); |
240 | 158k | pos = len; |
241 | 158k | continue; |
242 | 51.1k | } |
243 | | |
244 | 14.0k | case MetadataState::READ_CODE: { |
245 | 14.0k | const uint8_t code = data[pos++]; |
246 | 14.0k | jpg->app_data.push_back(GenerateAppMarker(state->marker, code)); |
247 | 14.0k | state->stage = MetadataState::READ_MARKER; |
248 | 14.0k | continue; |
249 | 51.1k | } |
250 | | |
251 | 50.9k | case MetadataState::READ_LENGTH_HI: { |
252 | 50.9k | state->length_hi = data[pos++]; |
253 | 50.9k | state->stage = MetadataState::READ_LENGTH_LO; |
254 | 50.9k | continue; |
255 | 51.1k | } |
256 | | |
257 | 50.9k | case MetadataState::READ_LENGTH_LO: { |
258 | 50.9k | const uint8_t lo = data[pos++]; |
259 | 50.9k | size_t marker_len = (state->length_hi << 8u) + lo; |
260 | 50.9k | if (marker_len < 2) return false; |
261 | 50.9k | state->remaining_multibyte_length = marker_len - 2; |
262 | 50.9k | uint8_t head[3] = {state->marker, state->length_hi, lo}; |
263 | 50.9k | auto* dest = (state->marker == 0xFE) ? &jpg->com_data : &jpg->app_data; |
264 | 50.9k | size_t delta = (state->marker == 0xFE) ? 0 : state->short_marker_count; |
265 | 50.9k | if (dest->size() - delta >= kBrunsliMultibyteMarkerLimit) { |
266 | 5 | return false; |
267 | 5 | } |
268 | 50.9k | dest->emplace_back(head, head + 3); |
269 | 50.9k | state->multibyte_sink = &dest->back(); |
270 | | // Turn state machine to default state in case there is no payload in |
271 | | // multibyte sequence. This is important when such a sequence concludes |
272 | | // the input. |
273 | 50.9k | state->stage = (state->remaining_multibyte_length > 0) |
274 | 50.9k | ? MetadataState::READ_MULTIBYTE |
275 | 50.9k | : MetadataState::READ_MARKER; |
276 | 50.9k | continue; |
277 | 50.9k | } |
278 | | |
279 | 544k | case MetadataState::READ_MULTIBYTE: { |
280 | 544k | size_t chunk_size = |
281 | 544k | std::min(state->remaining_multibyte_length, len - pos); |
282 | 544k | Append(state->multibyte_sink, data + pos, chunk_size); |
283 | 544k | state->remaining_multibyte_length -= chunk_size; |
284 | 544k | pos += chunk_size; |
285 | 544k | if (state->remaining_multibyte_length == 0) { |
286 | 48.5k | state->stage = MetadataState::READ_MARKER; |
287 | 48.5k | } |
288 | 544k | continue; |
289 | 50.9k | } |
290 | | |
291 | 0 | default: return false; |
292 | 922k | } |
293 | 922k | } |
294 | 830k | return true; |
295 | 830k | } |
296 | | |
297 | 73.0k | static BrunsliStatus DecodeHuffmanCode(State* state, JPEGData* jpg) { |
298 | 73.0k | InternalState& s = *state->internal; |
299 | 73.0k | JpegInternalsState& js = s.internals; |
300 | 73.0k | BrunsliBitReader* br = &js.br; |
301 | | |
302 | 463k | while (true) { |
303 | 463k | switch (js.stage) { |
304 | 53.1k | case JpegInternalsState::READ_HUFFMAN_LAST: { |
305 | 53.1k | if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA; |
306 | 51.1k | js.is_known_last_huffman_code = BrunsliBitReaderRead(br, 1); |
307 | 51.1k | jpg->huffman_code.emplace_back(); |
308 | 51.1k | js.stage = JpegInternalsState::READ_HUFFMAN_SIMPLE; |
309 | 51.1k | continue; |
310 | 53.1k | } |
311 | 71.7k | case JpegInternalsState::READ_HUFFMAN_SIMPLE: { |
312 | 71.7k | if (!BrunsliBitReaderCanRead(br, 5 + !js.is_known_last_huffman_code)) { |
313 | 20.9k | return BRUNSLI_NOT_ENOUGH_DATA; |
314 | 20.9k | } |
315 | 50.8k | JPEGHuffmanCode* huff = &jpg->huffman_code.back(); |
316 | | |
317 | 50.8k | huff->slot_id = BrunsliBitReaderRead(br, 2); |
318 | 50.8k | js.is_dc_table = (BrunsliBitReaderRead(br, 1) == 0); |
319 | 50.8k | huff->slot_id += js.is_dc_table ? 0 : 0x10; |
320 | 50.8k | huff->is_last = |
321 | 50.8k | js.is_known_last_huffman_code || BrunsliBitReaderRead(br, 1); |
322 | 50.8k | huff->counts[0] = 0; |
323 | 50.8k | int found_match = BrunsliBitReaderRead(br, 1); |
324 | 50.8k | if (found_match) { |
325 | 30.5k | if (js.is_dc_table) { |
326 | 16.6k | int huff_table_idx = BrunsliBitReaderRead(br, 1); |
327 | 16.6k | memcpy(&huff->counts[1], kStockDCHuffmanCodeCounts[huff_table_idx], |
328 | 16.6k | sizeof(kStockDCHuffmanCodeCounts[0])); |
329 | 16.6k | memcpy(&huff->values[0], kStockDCHuffmanCodeValues[huff_table_idx], |
330 | 16.6k | sizeof(kStockDCHuffmanCodeValues[0])); |
331 | 16.6k | } else { |
332 | 13.9k | int huff_table_idx = BrunsliBitReaderRead(br, 1); |
333 | 13.9k | memcpy(&huff->counts[1], kStockACHuffmanCodeCounts[huff_table_idx], |
334 | 13.9k | sizeof(kStockACHuffmanCodeCounts[0])); |
335 | 13.9k | memcpy(&huff->values[0], kStockACHuffmanCodeValues[huff_table_idx], |
336 | 13.9k | sizeof(kStockACHuffmanCodeValues[0])); |
337 | 13.9k | } |
338 | 30.5k | js.stage = JpegInternalsState::HUFFMAN_UPDATE; |
339 | 30.5k | } else { |
340 | | // One less bit is used than requested, but it is guaranteed to be |
341 | | // consumed in complex Huffman code case. |
342 | 20.2k | js.p.Init(js.is_dc_table |
343 | 20.2k | ? std::vector<uint8_t>(kDefaultDCValues, |
344 | 14.4k | std::end(kDefaultDCValues)) |
345 | 20.2k | : std::vector<uint8_t>(kDefaultACValues, |
346 | 5.82k | std::end(kDefaultACValues))); |
347 | 20.2k | js.stage = JpegInternalsState::READ_HUFFMAN_MAX_LEN; |
348 | 20.2k | } |
349 | 50.8k | continue; |
350 | 71.7k | } |
351 | 23.7k | case JpegInternalsState::READ_HUFFMAN_MAX_LEN: { |
352 | 23.7k | if (!BrunsliBitReaderCanRead(br, 4)) return BRUNSLI_NOT_ENOUGH_DATA; |
353 | 20.2k | js.max_len = BrunsliBitReaderRead(br, 4) + 1; |
354 | 20.2k | js.total_count = 0; |
355 | 20.2k | js.max_count = |
356 | 20.2k | js.is_dc_table ? kJpegDCAlphabetSize : kJpegHuffmanAlphabetSize; |
357 | 20.2k | js.space = (1u << kJpegHuffmanMaxBitLength) - |
358 | 20.2k | (1u << (kJpegHuffmanMaxBitLength - js.max_len)); |
359 | 20.2k | js.i = 1; |
360 | 20.2k | js.stage = JpegInternalsState::READ_HUFFMAN_COUNT; |
361 | 20.2k | continue; |
362 | 23.7k | } |
363 | 101k | case JpegInternalsState::READ_HUFFMAN_COUNT: { |
364 | 101k | JPEGHuffmanCode* huff = &jpg->huffman_code.back(); |
365 | 101k | if (js.i <= js.max_len) { |
366 | 81.4k | size_t shift = kJpegHuffmanMaxBitLength - js.i; |
367 | 81.4k | size_t count_limit = |
368 | 81.4k | std::min(js.max_count - js.total_count, js.space >> shift); |
369 | 81.4k | if (count_limit > 0) { |
370 | 77.9k | int nbits = |
371 | 77.9k | Log2FloorNonZero(static_cast<uint32_t>(count_limit)) + 1; |
372 | 77.9k | if (!BrunsliBitReaderCanRead(br, nbits)) { |
373 | 10.8k | return BRUNSLI_NOT_ENOUGH_DATA; |
374 | 10.8k | } |
375 | 67.1k | size_t count = BrunsliBitReaderRead(br, nbits); |
376 | 67.1k | if (count > count_limit) { |
377 | 9 | return BRUNSLI_INVALID_BRN; |
378 | 9 | } |
379 | 67.1k | huff->counts[js.i] = static_cast<int>(count); |
380 | 67.1k | js.total_count += count; |
381 | 67.1k | js.space -= count * (static_cast<size_t>(1) << shift); |
382 | 67.1k | } |
383 | 70.6k | ++js.i; |
384 | 70.6k | continue; |
385 | 81.4k | } |
386 | 20.0k | ++huff->counts[js.max_len]; |
387 | 20.0k | js.i = 0; |
388 | 20.0k | js.stage = JpegInternalsState::READ_HUFFMAN_PERMUTATION; |
389 | 20.0k | continue; |
390 | 101k | } |
391 | 163k | case JpegInternalsState::READ_HUFFMAN_PERMUTATION: { |
392 | 163k | JPEGHuffmanCode* huff = &jpg->huffman_code.back(); |
393 | 163k | if (js.i < js.total_count) { |
394 | 143k | const int nbits = js.p.num_bits(); |
395 | 143k | if (!DecodeLimitedVarint<2>(&js.varint, br, (nbits + 1) >> 1u)) { |
396 | 14.4k | return BRUNSLI_NOT_ENOUGH_DATA; |
397 | 14.4k | } |
398 | 128k | uint8_t value; |
399 | 128k | if (!js.p.Remove(js.varint.value, &value)) { |
400 | 11 | return BRUNSLI_INVALID_BRN; |
401 | 11 | } |
402 | 128k | huff->values[js.i] = value; |
403 | 128k | ++js.i; |
404 | 128k | continue; |
405 | 128k | } |
406 | 19.9k | huff->values[js.total_count] = kJpegHuffmanAlphabetSize; |
407 | 19.9k | js.stage = JpegInternalsState::HUFFMAN_UPDATE; |
408 | 19.9k | continue; |
409 | 163k | } |
410 | 50.5k | case JpegInternalsState::HUFFMAN_UPDATE: { |
411 | | // This stage does not perform reading -> transient. |
412 | 50.5k | if (jpg->huffman_code.back().is_last) { |
413 | 25.6k | js.terminal_huffman_code_count++; |
414 | 25.6k | } |
415 | 50.5k | if (js.is_known_last_huffman_code) { |
416 | 21.1k | js.p.Clear(); |
417 | 21.1k | return BRUNSLI_OK; |
418 | 21.1k | } |
419 | 29.3k | if (jpg->huffman_code.size() >= kMaxDHTMarkers) { |
420 | | // Too many Huffman codes for a valid bit-stream. Normally, a jpeg |
421 | | // file can have any arbitrary number of DHT, DQT, etc. But i prefer |
422 | | // we force a reasonable lower bound instead of open door to likely |
423 | | // forged BRN input. |
424 | 2 | return BRUNSLI_INVALID_BRN; |
425 | 2 | } |
426 | 29.3k | js.stage = JpegInternalsState::READ_HUFFMAN_LAST; |
427 | 29.3k | continue; |
428 | 29.3k | } |
429 | 0 | default: |
430 | 0 | return BRUNSLI_DECOMPRESSION_ERROR; |
431 | 463k | } |
432 | 463k | } |
433 | 0 | return BRUNSLI_OK; |
434 | 73.0k | } |
435 | | |
436 | 1.74M | BrunsliStatus DecodeScanInfo(State* state, JPEGData* jpg) { |
437 | 1.74M | InternalState& s = *state->internal; |
438 | 1.74M | JpegInternalsState& js = s.internals; |
439 | 1.74M | BrunsliBitReader* br = &js.br; |
440 | | |
441 | 4.50M | const auto maybe_add_zero_run = [&js, jpg] () { |
442 | 4.50M | if (js.last_num > 0) { |
443 | 4.48M | JPEGScanInfo::ExtraZeroRunInfo info; |
444 | 4.48M | info.block_idx = js.last_block_idx; |
445 | 4.48M | info.num_extra_zero_runs = js.last_num; |
446 | 4.48M | jpg->scan_info[js.i].extra_zero_runs.push_back(info); |
447 | 4.48M | js.last_num = 0; |
448 | 4.48M | } |
449 | 4.50M | }; |
450 | | |
451 | 23.0M | while (true) { |
452 | 23.0M | switch (js.stage) { |
453 | 172k | case JpegInternalsState::READ_SCAN_COMMON: { |
454 | 172k | JPEGScanInfo* si = &jpg->scan_info[js.i]; |
455 | 172k | if (!BrunsliBitReaderCanRead(br, 22)) return BRUNSLI_NOT_ENOUGH_DATA; |
456 | 54.2k | si->Ss = BrunsliBitReaderRead(br, 6); |
457 | 54.2k | si->Se = BrunsliBitReaderRead(br, 6); |
458 | 54.2k | si->Ah = BrunsliBitReaderRead(br, 4); |
459 | 54.2k | si->Al = BrunsliBitReaderRead(br, 4); |
460 | 54.2k | si->num_components = BrunsliBitReaderRead(br, 2) + 1; |
461 | 54.2k | js.j = 0; |
462 | 54.2k | js.stage = JpegInternalsState::READ_SCAN_COMPONENT; |
463 | 54.2k | continue; |
464 | 172k | } |
465 | 291k | case JpegInternalsState::READ_SCAN_COMPONENT: { |
466 | 291k | JPEGScanInfo* si = &jpg->scan_info[js.i]; |
467 | 291k | if (js.j < si->num_components) { |
468 | 237k | if (!BrunsliBitReaderCanRead(br, 6)) return BRUNSLI_NOT_ENOUGH_DATA; |
469 | 118k | si->components[js.j].comp_idx = BrunsliBitReaderRead(br, 2); |
470 | 118k | si->components[js.j].dc_tbl_idx = BrunsliBitReaderRead(br, 2); |
471 | 118k | si->components[js.j].ac_tbl_idx = BrunsliBitReaderRead(br, 2); |
472 | 118k | js.j++; |
473 | 118k | } else { |
474 | 54.1k | js.last_block_idx = -1; |
475 | 54.1k | js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION; |
476 | 54.1k | } |
477 | 172k | continue; |
478 | 291k | } |
479 | 5.59M | case JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION: { |
480 | 5.59M | if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA; |
481 | 4.98M | if (BrunsliBitReaderRead(br, 1)) { |
482 | 4.93M | js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_DATA; |
483 | 4.93M | } else { |
484 | 53.9k | js.last_block_idx = 0; |
485 | 53.9k | js.last_num = 0; |
486 | 53.9k | js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION; |
487 | 53.9k | } |
488 | 4.98M | continue; |
489 | 5.59M | } |
490 | 4.94M | case JpegInternalsState::READ_SCAN_RESET_POINT_DATA: { |
491 | 4.94M | JPEGScanInfo* si = &jpg->scan_info[js.i]; |
492 | 4.94M | if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA; |
493 | 4.93M | int block_idx = |
494 | 4.93M | js.last_block_idx + static_cast<int>(js.varint.value) + 1; |
495 | 4.93M | si->reset_points.emplace_back(block_idx); |
496 | 4.93M | js.last_block_idx = block_idx; |
497 | | // TODO(eustas): limit to exact number of blocks. |
498 | 4.93M | if (js.last_block_idx > (1 << 30)) { |
499 | | // At most 8K x 8K x num_channels blocks are expected. That is, |
500 | | // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane |
501 | | // image. |
502 | 12 | return BRUNSLI_INVALID_BRN; |
503 | 12 | } |
504 | 4.93M | js.stage = JpegInternalsState::READ_SCAN_RESET_POINT_CONTINUATION; |
505 | 4.93M | continue; |
506 | 4.93M | } |
507 | 5.74M | case JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION: { |
508 | 5.74M | if (!BrunsliBitReaderCanRead(br, 1)) return BRUNSLI_NOT_ENOUGH_DATA; |
509 | 5.59M | if (BrunsliBitReaderRead(br, 1)) { |
510 | 5.53M | js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_DATA; |
511 | 5.53M | } else { |
512 | 53.7k | maybe_add_zero_run(); |
513 | 53.7k | ++js.i; |
514 | 53.7k | if (js.i < js.num_scans) { |
515 | 44.2k | js.stage = JpegInternalsState::READ_SCAN_COMMON; |
516 | 44.2k | continue; |
517 | 44.2k | } |
518 | 9.51k | return BRUNSLI_OK; |
519 | 53.7k | } |
520 | 5.53M | continue; |
521 | 5.59M | } |
522 | 6.26M | case JpegInternalsState::READ_SCAN_ZERO_RUN_DATA: { |
523 | 6.26M | if (!DecodeVarint(&js.varint, br, 28)) return BRUNSLI_NOT_ENOUGH_DATA; |
524 | 5.53M | int block_idx = js.last_block_idx + static_cast<int>(js.varint.value); |
525 | 5.53M | if (block_idx > js.last_block_idx) maybe_add_zero_run(); |
526 | 5.53M | ++js.last_num; |
527 | 5.53M | js.last_block_idx = block_idx; |
528 | | // TODO(eustas): limit to exact number of blocks. |
529 | 5.53M | if (js.last_block_idx > (1 << 30)) { |
530 | | // At most 8K x 8K x num_channels blocks are expected. That is, |
531 | | // typically, 1.5 * 2^27. 2^30 should be sufficient for any sane |
532 | | // image. |
533 | 2 | return BRUNSLI_INVALID_BRN; |
534 | 2 | } |
535 | 5.53M | js.stage = JpegInternalsState::READ_SCAN_ZERO_RUN_CONTINUATION; |
536 | 5.53M | continue; |
537 | 5.53M | } |
538 | 0 | default: return BRUNSLI_DECOMPRESSION_ERROR; |
539 | 23.0M | } |
540 | 23.0M | } |
541 | 1.74M | } |
542 | | |
543 | | static bool BRUNSLI_NOINLINE DecodeCoeffOrder(uint32_t* order, BitSource* br, |
544 | 11.0k | WordSource* in) { |
545 | 11.0k | uint32_t lehmer[kDCTBlockSize] = {0}; |
546 | 11.0k | static const int kSpan = 16; |
547 | 55.3k | for (int i = 0; i < kDCTBlockSize; i += kSpan) { |
548 | 44.2k | if (!br->ReadBits(1, in)) continue; // span is all-zero |
549 | 5.25k | const int start = (i > 0) ? i : 1; |
550 | 5.25k | const int end = i + kSpan; |
551 | 85.4k | for (int j = start; j < end; ++j) { |
552 | 80.1k | uint32_t v = 0; |
553 | 102k | while (v <= kDCTBlockSize) { |
554 | 102k | const uint32_t bits = br->ReadBits(3, in); |
555 | 102k | v += bits; |
556 | 102k | if (bits < 7) break; |
557 | 102k | } |
558 | 80.1k | if (v > kDCTBlockSize) return false; |
559 | 80.1k | lehmer[j] = v; |
560 | 80.1k | } |
561 | 5.25k | } |
562 | 11.0k | int end = kDCTBlockSize - 1; |
563 | 648k | while (end >= 1 && lehmer[end] == 0) { |
564 | 637k | --end; |
565 | 637k | } |
566 | 11.0k | if (lehmer[end] == 1) return false; |
567 | 56.7k | for (int i = 1; i <= end; ++i) { |
568 | 46.1k | if (lehmer[i] == 0) return false; |
569 | 45.7k | --lehmer[i]; |
570 | 45.7k | } |
571 | 10.6k | if (!DecodeLehmerCode(lehmer, kDCTBlockSize, order)) return false; |
572 | 687k | for (int k = 0; k < kDCTBlockSize; ++k) { |
573 | 677k | order[k] = kJPEGNaturalOrder[order[k]]; |
574 | 677k | } |
575 | 10.5k | return true; |
576 | 10.6k | } |
577 | | |
578 | | /** Reads 0..6 words from |in| and returns the value in the range 0..63. */ |
579 | | static size_t DecodeNumNonzeros(Prob* p, BinaryArithmeticDecoder* ac, |
580 | 3.11M | WordSource* in) { |
581 | | // To simplity BST navigation, we use 1-based indexing. |
582 | 3.11M | Prob* bst = p - 1; |
583 | 3.11M | size_t ctx = 1; |
584 | | |
585 | 21.8M | for (size_t b = 0; b < kNumNonZeroBits; ++b) { |
586 | 18.7M | const int bit = ac->ReadBit(bst[ctx].get_proba(), in); |
587 | 18.7M | bst[ctx].Add(bit); |
588 | 18.7M | ctx = 2 * ctx + bit; |
589 | 18.7M | } |
590 | | |
591 | | // Leaf index in the level corresponds to the resuling value. |
592 | 3.11M | size_t val = ctx - (1u << kNumNonZeroBits); |
593 | 3.11M | BRUNSLI_DCHECK(val <= kNumNonZeroTreeSize); |
594 | 3.11M | return val; |
595 | 3.11M | } |
596 | | |
597 | 121k | void EnsureSubdecodersInitialized(State* state, WordSource* in) { |
598 | 121k | InternalState& s = *state->internal; |
599 | 121k | if (!s.subdecoders_initialized) { |
600 | 21.5k | s.ans_decoder.Init(in); |
601 | 21.5k | s.bit_reader.Init(in); |
602 | 21.5k | s.arith_decoder.Init(in); |
603 | 21.5k | s.subdecoders_initialized = true; |
604 | 21.5k | } |
605 | 121k | } |
606 | | |
607 | 20.7k | bool FinalizeSubdecoders(State* state) { |
608 | 20.7k | InternalState& s = *state->internal; |
609 | 20.7k | if (!s.ans_decoder.CheckCRC()) return false; |
610 | 19.5k | if (!s.bit_reader.Finish()) return false; |
611 | 19.4k | s.subdecoders_initialized = false; |
612 | 19.4k | return true; |
613 | 19.5k | } |
614 | | |
615 | 94.3k | BrunsliStatus DecodeDC(State* state, WordSource* in) { |
616 | 94.3k | const std::vector<ComponentMeta>& meta = state->meta; |
617 | 94.3k | const size_t num_components = meta.size(); |
618 | 94.3k | const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp; |
619 | 94.3k | InternalState& s = *state->internal; |
620 | 94.3k | AcDcState& ac_dc_state = s.ac_dc; |
621 | | |
622 | 94.3k | std::vector<ComponentStateDC>& comps = ac_dc_state.dc; |
623 | 94.3k | if (comps.empty()) { |
624 | 11.5k | comps.resize(num_components); |
625 | 24.3k | for (size_t c = 0; c < num_components; ++c) { |
626 | 12.8k | comps[c].SetWidth(meta[c].width_in_blocks); |
627 | 12.8k | } |
628 | 11.5k | } |
629 | | |
630 | 94.3k | if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA; |
631 | 26.4k | EnsureSubdecodersInitialized(state, in); |
632 | 26.4k | ANSDecoder ans = s.ans_decoder; |
633 | 26.4k | BitSource br = s.bit_reader; |
634 | 26.4k | BinaryArithmeticDecoder ac = s.arith_decoder; |
635 | | |
636 | | // We decode DC components in the following interleaved manner: |
637 | | // v_samp[0] rows from component 0 |
638 | | // v_samp[1] rows from component 1 |
639 | | // v_samp[2] rows from component 2 |
640 | | // v_samp[3] rows from component 3 (if present) |
641 | | // |
642 | | // E.g. in a YUV420 image, we decode 2 rows of DC components from Y and then |
643 | | // 1 row of DC components from U and 1 row of DC components from V. |
644 | 287k | for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) { |
645 | 539k | for (size_t i = ac_dc_state.next_component; i < num_components; ++i) { |
646 | 279k | ComponentStateDC* c = &comps[i]; |
647 | 279k | const ComponentMeta& m = meta[i]; |
648 | 279k | const uint8_t* context_map = state->context_map + i * kNumAvrgContexts; |
649 | 279k | const int ac_stride = static_cast<int>(m.ac_stride); |
650 | 279k | const size_t b_stride = m.b_stride; |
651 | 279k | const int width = m.width_in_blocks; |
652 | 279k | int y = mcu_y * m.v_samp + ac_dc_state.next_iy; |
653 | 279k | int* const prev_sgn = &c->prev_sign[1]; |
654 | 279k | int* const prev_abs = &c->prev_abs_coeff[2]; |
655 | 1.03M | for (int iy = ac_dc_state.next_iy; iy < m.v_samp; ++iy, ++y) { |
656 | 768k | coeff_t* coeffs = |
657 | 768k | m.ac_coeffs + y * ac_stride + ac_dc_state.next_x * kDCTBlockSize; |
658 | 768k | uint8_t* block_state = |
659 | 768k | m.block_state + y * b_stride + ac_dc_state.next_x; |
660 | 76.3M | for (int x = ac_dc_state.next_x; x < width; ++x) { |
661 | 75.5M | if (BRUNSLI_PREDICT_FALSE(!in->CanRead(6))) { |
662 | 15.3k | ac_dc_state.next_mcu_y = mcu_y; |
663 | 15.3k | ac_dc_state.next_component = i; |
664 | 15.3k | ac_dc_state.next_iy = iy; |
665 | 15.3k | ac_dc_state.next_x = x; |
666 | 15.3k | s.ans_decoder = ans; |
667 | 15.3k | s.bit_reader = br; |
668 | 15.3k | s.arith_decoder = ac; |
669 | 15.3k | return BRUNSLI_NOT_ENOUGH_DATA; |
670 | 15.3k | } |
671 | 75.5M | const int is_empty_ctx = |
672 | 75.5M | IsEmptyBlockContext(&c->prev_is_nonempty[1], x); |
673 | 75.5M | Prob* BRUNSLI_RESTRICT is_empty_p = |
674 | 75.5M | &c->is_empty_block_prob[is_empty_ctx]; |
675 | 75.5M | const bool is_empty_block = !ac.ReadBit(is_empty_p->get_proba(), in); |
676 | 75.5M | is_empty_p->Add(!is_empty_block); |
677 | 75.5M | c->prev_is_nonempty[x + 1] = !is_empty_block; |
678 | 75.5M | *block_state = is_empty_block; |
679 | 75.5M | int abs_val = 0; |
680 | 75.5M | int sign = 0; |
681 | 75.5M | if (!is_empty_block) { |
682 | 11.8M | Prob* BRUNSLI_RESTRICT p_is_zero = &c->is_zero_prob; |
683 | 11.8M | int is_zero = ac.ReadBit(p_is_zero->get_proba(), in); |
684 | 11.8M | p_is_zero->Add(is_zero); |
685 | 11.8M | if (!is_zero) { |
686 | 2.19M | const int avg_ctx = WeightedAverageContextDC(prev_abs, x); |
687 | 2.19M | const int sign_ctx = prev_sgn[x] * 3 + prev_sgn[x - 1]; |
688 | 2.19M | Prob* BRUNSLI_RESTRICT sign_p = &c->sign_prob[sign_ctx]; |
689 | 2.19M | sign = ac.ReadBit(sign_p->get_proba(), in); |
690 | 2.19M | sign_p->Add(sign); |
691 | 2.19M | const int entropy_ix = context_map[avg_ctx]; |
692 | 2.19M | int code = ans.ReadSymbol(state->entropy_codes[entropy_ix], in); |
693 | 2.19M | if (code < kNumDirectCodes) { |
694 | 782k | abs_val = code + 1; |
695 | 1.41M | } else { |
696 | 1.41M | int nbits = code - kNumDirectCodes; |
697 | 1.41M | Prob* BRUNSLI_RESTRICT p_first_extra_bit = |
698 | 1.41M | &c->first_extra_bit_prob[nbits]; |
699 | 1.41M | int first_extra_bit = |
700 | 1.41M | ac.ReadBit(p_first_extra_bit->get_proba(), in); |
701 | 1.41M | p_first_extra_bit->Add(first_extra_bit); |
702 | 1.41M | int extra_bits_val = first_extra_bit << nbits; |
703 | 1.41M | if (nbits > 0) { |
704 | 1.25M | extra_bits_val |= static_cast<int>(br.ReadBits(nbits, in)); |
705 | 1.25M | } |
706 | 1.41M | abs_val = kNumDirectCodes - 1 + (2 << nbits) + extra_bits_val; |
707 | 1.41M | } |
708 | 2.19M | } |
709 | 11.8M | } |
710 | 75.5M | prev_abs[x] = abs_val; |
711 | 75.5M | prev_sgn[x] = abs_val ? sign + 1 : 0; |
712 | 75.5M | coeffs[0] = ((1 - 2 * sign) * abs_val + |
713 | 75.5M | PredictWithAdaptiveMedian(coeffs, x, y, ac_stride)); |
714 | 75.5M | block_state++; |
715 | 75.5M | coeffs += kDCTBlockSize; |
716 | 75.5M | } |
717 | 752k | ac_dc_state.next_x = 0; |
718 | 752k | } |
719 | 263k | ac_dc_state.next_iy = 0; |
720 | 263k | } |
721 | 260k | ac_dc_state.next_component = 0; |
722 | 260k | } |
723 | | |
724 | | // Prepare for AC decoding. |
725 | 11.1k | ac_dc_state.next_mcu_y = 0; |
726 | 11.1k | ac_dc_state.next_component = 0; |
727 | 11.1k | ac_dc_state.next_iy = 0; |
728 | 11.1k | ac_dc_state.next_x = 0; |
729 | | |
730 | 11.1k | comps.clear(); |
731 | 11.1k | comps.shrink_to_fit(); |
732 | | |
733 | 11.1k | s.ans_decoder = ans; |
734 | 11.1k | s.bit_reader = br; |
735 | 11.1k | s.arith_decoder = ac; |
736 | 11.1k | if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN; |
737 | | |
738 | 10.6k | return BRUNSLI_OK; |
739 | 11.1k | } |
740 | | |
741 | | static void BRUNSLI_NOINLINE DecodeEmptyAcBlock( |
742 | 19.5M | int* BRUNSLI_RESTRICT prev_sgn, int* BRUNSLI_RESTRICT prev_abs) { |
743 | 1.24G | for (int k = 1; k < kDCTBlockSize; ++k) { |
744 | 1.23G | prev_sgn[k] = 0; |
745 | 1.23G | prev_abs[k] = 0; |
746 | 1.23G | } |
747 | 19.5M | } |
748 | | |
749 | | /** All the necessary things for decoding AC block. */ |
750 | | struct AcBlockCookie { |
751 | | int x; |
752 | | int y; |
753 | | uint8_t* BRUNSLI_RESTRICT prev_num_nonzeros; |
754 | | int* BRUNSLI_RESTRICT prev_sgn; |
755 | | int* BRUNSLI_RESTRICT prev_abs; |
756 | | Prob* BRUNSLI_RESTRICT num_nonzero_prob; |
757 | | |
758 | | BinaryArithmeticDecoder* BRUNSLI_RESTRICT ac; |
759 | | WordSource* BRUNSLI_RESTRICT in; |
760 | | ANSDecoder* BRUNSLI_RESTRICT ans; |
761 | | BitSource* BRUNSLI_RESTRICT br; |
762 | | |
763 | | coeff_t* BRUNSLI_RESTRICT coeffs; |
764 | | const coeff_t* BRUNSLI_RESTRICT prev_row_coeffs; |
765 | | const coeff_t* BRUNSLI_RESTRICT prev_col_coeffs; |
766 | | Prob* BRUNSLI_RESTRICT is_zero_prob; |
767 | | const uint32_t* BRUNSLI_RESTRICT order; |
768 | | const uint8_t* BRUNSLI_RESTRICT context_modes; |
769 | | const int* BRUNSLI_RESTRICT mult_col; |
770 | | const int* BRUNSLI_RESTRICT mult_row; |
771 | | int prev_row_delta; |
772 | | Prob* BRUNSLI_RESTRICT sign_prob; |
773 | | size_t context_bits; |
774 | | const uint8_t* BRUNSLI_RESTRICT context_map; |
775 | | const ANSDecodingData* BRUNSLI_RESTRICT entropy_codes; |
776 | | Prob* BRUNSLI_RESTRICT first_extra_bit_prob; |
777 | | }; |
778 | | |
779 | 3.11M | static size_t BRUNSLI_NOINLINE DecodeAcBlock(const AcBlockCookie& cookie) { |
780 | 3.11M | AcBlockCookie c = cookie; |
781 | | |
782 | 3.11M | BinaryArithmeticDecoder ac = *c.ac; |
783 | 3.11M | WordSource* in = c.in; |
784 | 3.11M | ANSDecoder ans = *c.ans; |
785 | 3.11M | BitSource br = *c.br; |
786 | | |
787 | 3.11M | size_t num_nonzeros = 0; |
788 | | |
789 | 3.11M | const uint8_t nonzero_ctx = NumNonzerosContext(c.prev_num_nonzeros, c.x, c.y); |
790 | 3.11M | size_t last_nz = DecodeNumNonzeros( |
791 | 3.11M | c.num_nonzero_prob + kNumNonZeroTreeSize * nonzero_ctx, &ac, in); |
792 | 167M | for (size_t k = last_nz + 1; k < kDCTBlockSize; ++k) { |
793 | 164M | c.prev_sgn[k] = 0; |
794 | 164M | c.prev_abs[k] = 0; |
795 | 164M | } |
796 | 35.2M | for (size_t k = last_nz; k > 0; --k) { |
797 | 32.1M | int is_zero = 0; |
798 | 32.1M | if (k < last_nz) { |
799 | 31.2M | size_t bucket = kNonzeroBuckets[num_nonzeros - 1]; |
800 | 31.2M | size_t is_zero_ctx = bucket * kDCTBlockSize + k; |
801 | 31.2M | Prob& p = c.is_zero_prob[is_zero_ctx]; |
802 | 31.2M | is_zero = ac.ReadBit(p.get_proba(), in); |
803 | 31.2M | p.Add(is_zero); |
804 | 31.2M | } |
805 | 32.1M | int abs_val = 0; |
806 | 32.1M | int sign = 1; |
807 | 32.1M | const int k_nat = c.order[k]; |
808 | 32.1M | if (!is_zero) { |
809 | 5.93M | size_t context_type = c.context_modes[k_nat]; |
810 | 5.93M | size_t avg_ctx = 0; |
811 | 5.93M | size_t sign_ctx = kMaxAverageContext; |
812 | 5.93M | if ((context_type & 1) && (c.y > 0)) { |
813 | 1.13M | size_t offset = k_nat & 7; |
814 | 1.13M | ACPredictContextRow(c.prev_row_coeffs + offset, c.coeffs + offset, |
815 | 1.13M | c.mult_col + offset * 8, &avg_ctx, &sign_ctx); |
816 | 4.79M | } else if ((context_type & 2) && (c.x > 0)) { |
817 | 1.30M | size_t offset = k_nat & ~7; |
818 | 1.30M | ACPredictContextCol(c.prev_col_coeffs + offset, c.coeffs + offset, |
819 | 1.30M | c.mult_row + offset, &avg_ctx, &sign_ctx); |
820 | 3.49M | } else if (!context_type) { |
821 | 3.39M | avg_ctx = WeightedAverageContext(c.prev_abs + k, c.prev_row_delta); |
822 | 3.39M | sign_ctx = |
823 | 3.39M | c.prev_sgn[k] * 3 + c.prev_sgn[static_cast<int>(k) - kDCTBlockSize]; |
824 | 3.39M | } |
825 | 5.93M | sign_ctx = sign_ctx * kDCTBlockSize + k; |
826 | 5.93M | Prob& sign_p = c.sign_prob[sign_ctx]; |
827 | 5.93M | sign = ac.ReadBit(sign_p.get_proba(), in); |
828 | 5.93M | sign_p.Add(sign); |
829 | 5.93M | c.prev_sgn[k] = sign + 1; |
830 | 5.93M | sign = 1 - 2 * sign; |
831 | 5.93M | const size_t z_dens_ctx = |
832 | 5.93M | ZeroDensityContext(num_nonzeros, k, c.context_bits); |
833 | 5.93M | size_t histo_ix = z_dens_ctx * kNumAvrgContexts + avg_ctx; |
834 | 5.93M | size_t entropy_ix = c.context_map[histo_ix]; |
835 | 5.93M | int code = ans.ReadSymbol(c.entropy_codes[entropy_ix], in); |
836 | 5.93M | if (code < kNumDirectCodes) { |
837 | 3.23M | abs_val = code + 1; |
838 | 3.23M | } else { |
839 | 2.69M | int nbits = code - kNumDirectCodes; |
840 | 2.69M | Prob& p = c.first_extra_bit_prob[k * 10 + nbits]; |
841 | 2.69M | int first_extra_bit = ac.ReadBit(p.get_proba(), in); |
842 | 2.69M | p.Add(first_extra_bit); |
843 | 2.69M | int extra_bits_val = first_extra_bit << nbits; |
844 | 2.69M | if (nbits > 0) { |
845 | 2.46M | extra_bits_val |= br.ReadBits(nbits, in); |
846 | 2.46M | } |
847 | 2.69M | abs_val = kNumDirectCodes - 1 + (2u << nbits) + extra_bits_val; |
848 | 2.69M | } |
849 | 5.93M | ++num_nonzeros; |
850 | 26.2M | } else { |
851 | 26.2M | c.prev_sgn[k] = 0; |
852 | 26.2M | } |
853 | 32.1M | int coeff = sign * abs_val; |
854 | 32.1M | c.coeffs[k_nat] = coeff; |
855 | 32.1M | c.prev_abs[k] = abs_val; |
856 | 32.1M | } |
857 | | |
858 | 3.11M | *c.ans = ans; |
859 | 3.11M | *c.br = br; |
860 | 3.11M | *c.ac = ac; |
861 | | |
862 | 3.11M | return num_nonzeros; |
863 | 3.11M | } |
864 | | |
865 | 168k | BrunsliStatus DecodeAC(State* state, WordSource* in) { |
866 | 168k | const std::vector<ComponentMeta>& meta = state->meta; |
867 | 168k | const size_t num_components = meta.size(); |
868 | 168k | const int mcu_rows = meta[0].height_in_blocks / meta[0].v_samp; |
869 | 168k | InternalState& s = *state->internal; |
870 | 168k | AcDcState& ac_dc_state = s.ac_dc; |
871 | | |
872 | 168k | std::vector<ComponentState>& comps = ac_dc_state.ac; |
873 | 168k | if (comps.empty()) { |
874 | 10.4k | comps.resize(num_components); |
875 | 22.0k | for (size_t c = 0; c < num_components; ++c) { |
876 | 11.5k | comps[c].SetWidth(meta[c].width_in_blocks); |
877 | 11.5k | ComputeACPredictMultipliers(&meta[c].quant[0], comps[c].mult_row, |
878 | 11.5k | comps[c].mult_col); |
879 | 11.5k | } |
880 | 10.4k | } |
881 | | |
882 | 168k | if (!in->CanRead(5)) return BRUNSLI_NOT_ENOUGH_DATA; |
883 | 95.4k | EnsureSubdecodersInitialized(state, in); |
884 | | |
885 | 95.4k | if (!ac_dc_state.ac_coeffs_order_decoded) { |
886 | 78.4k | while (ac_dc_state.next_component < num_components) { |
887 | 68.7k | if (!in->CanRead(121)) return BRUNSLI_NOT_ENOUGH_DATA; |
888 | 11.0k | if (!DecodeCoeffOrder(comps[ac_dc_state.next_component].order, |
889 | 11.0k | &s.bit_reader, in)) { |
890 | 492 | return BRUNSLI_INVALID_BRN; |
891 | 492 | } |
892 | 10.5k | ac_dc_state.next_component++; |
893 | 10.5k | } |
894 | 9.72k | ac_dc_state.next_component = 0; |
895 | 9.72k | ac_dc_state.ac_coeffs_order_decoded = true; |
896 | 9.72k | } |
897 | | |
898 | 37.2k | AcBlockCookie c; |
899 | 37.2k | c.ac = &s.arith_decoder; |
900 | 37.2k | c.in = in; |
901 | 37.2k | c.ans = &s.ans_decoder; |
902 | 37.2k | c.br = &s.bit_reader; |
903 | 37.2k | c.entropy_codes = state->entropy_codes; |
904 | 37.2k | c.context_modes = |
905 | 37.2k | kContextAlgorithm + (state->use_legacy_context_model ? 64 : 0); |
906 | | |
907 | 242k | for (int mcu_y = ac_dc_state.next_mcu_y; mcu_y < mcu_rows; ++mcu_y) { |
908 | 438k | for (size_t i = ac_dc_state.next_component; i < num_components; ++i) { |
909 | 233k | ComponentState& cst = comps[i]; |
910 | 233k | c.prev_num_nonzeros = cst.prev_num_nonzeros.data(); |
911 | 233k | c.num_nonzero_prob = cst.num_nonzero_prob; |
912 | 233k | c.is_zero_prob = cst.is_zero_prob.data(); |
913 | 233k | c.order = cst.order; |
914 | 233k | c.mult_col = cst.mult_col; |
915 | 233k | c.mult_row = cst.mult_row; |
916 | 233k | c.sign_prob = cst.sign_prob.data(); |
917 | 233k | c.first_extra_bit_prob = cst.first_extra_bit_prob.data(); |
918 | 233k | const ComponentMeta& m = meta[i]; |
919 | 233k | c.context_map = state->context_map + m.context_offset * kNumAvrgContexts; |
920 | 233k | c.context_bits = m.context_bits; |
921 | 233k | const int width = m.width_in_blocks; |
922 | 233k | const size_t ac_stride = m.ac_stride; |
923 | 233k | const size_t b_stride = m.b_stride; |
924 | 233k | const int next_iy = ac_dc_state.next_iy; |
925 | 233k | c.y = mcu_y * m.v_samp + next_iy; |
926 | 233k | c.prev_row_delta = (1 - 2 * (c.y & 1u)) * (width + 3) * kDCTBlockSize; |
927 | 868k | for (int iy = next_iy; iy < m.v_samp; ++iy, ++c.y) { |
928 | 662k | const int next_x = ac_dc_state.next_x; |
929 | 662k | const size_t block_offset = next_x * kDCTBlockSize; |
930 | 662k | c.coeffs = m.ac_coeffs + c.y * ac_stride + block_offset; |
931 | 662k | c.prev_row_coeffs = c.coeffs - ac_stride; |
932 | 662k | c.prev_col_coeffs = c.coeffs - kDCTBlockSize; |
933 | 662k | const uint8_t* block_state = m.block_state + c.y * b_stride + next_x; |
934 | 662k | c.prev_sgn = &cst.prev_sign[kDCTBlockSize] + block_offset; |
935 | 662k | c.prev_abs = &cst.prev_abs_coeff[((c.y & 1u) * (width + 3) + 2) * |
936 | 662k | kDCTBlockSize] + |
937 | 662k | block_offset; |
938 | 23.3M | for (c.x = next_x; c.x < width; ++c.x) { |
939 | 22.6M | bool is_empty = *(block_state++); |
940 | 22.6M | if (!is_empty) { |
941 | 3.14M | if (BRUNSLI_PREDICT_FALSE(!in->CanRead(297))) { |
942 | 27.6k | ac_dc_state.next_mcu_y = mcu_y; |
943 | 27.6k | ac_dc_state.next_component = i; |
944 | 27.6k | ac_dc_state.next_iy = iy; |
945 | 27.6k | ac_dc_state.next_x = c.x; |
946 | 27.6k | return BRUNSLI_NOT_ENOUGH_DATA; |
947 | 27.6k | } |
948 | 3.11M | size_t num_nonzeros = DecodeAcBlock(c); |
949 | 3.11M | BRUNSLI_DCHECK(num_nonzeros <= kNumNonZeroTreeSize); |
950 | 3.11M | c.prev_num_nonzeros[c.x] = static_cast<uint8_t>(num_nonzeros); |
951 | 19.5M | } else { |
952 | 19.5M | DecodeEmptyAcBlock(c.prev_sgn, c.prev_abs); |
953 | 19.5M | c.prev_num_nonzeros[c.x] = 0; |
954 | 19.5M | } |
955 | 22.6M | c.coeffs += kDCTBlockSize; |
956 | 22.6M | c.prev_sgn += kDCTBlockSize; |
957 | 22.6M | c.prev_abs += kDCTBlockSize; |
958 | 22.6M | c.prev_row_coeffs += kDCTBlockSize; |
959 | 22.6M | c.prev_col_coeffs += kDCTBlockSize; |
960 | 22.6M | } |
961 | 634k | c.prev_row_delta *= -1; |
962 | 634k | ac_dc_state.next_x = 0; |
963 | 634k | } |
964 | 205k | ac_dc_state.next_iy = 0; |
965 | 205k | } |
966 | 205k | ac_dc_state.next_component = 0; |
967 | 205k | } |
968 | 9.66k | ac_dc_state.next_mcu_y = 0; |
969 | | |
970 | 9.66k | comps.clear(); |
971 | 9.66k | comps.shrink_to_fit(); |
972 | | |
973 | 9.66k | if (!FinalizeSubdecoders(state)) return BRUNSLI_INVALID_BRN; |
974 | | |
975 | 8.83k | return BRUNSLI_OK; |
976 | 9.66k | } |
977 | | |
978 | 809k | static bool CheckCanRead(State* state, size_t required) { |
979 | | // TODO(eustas): dcheck len > pos |
980 | 809k | size_t available = state->len - state->pos; |
981 | 809k | return required <= available; |
982 | 809k | } |
983 | | |
984 | 377k | static bool CheckCanReadByte(State* state) { |
985 | | // TODO(eustas): dcheck len > pos |
986 | 377k | return state->pos != state->len; |
987 | 377k | } |
988 | | |
989 | 239k | static uint8_t ReadByte(State* state) { |
990 | | // TODO(eustas): dcheck len > pos |
991 | 239k | return state->data[state->pos++]; |
992 | 239k | } |
993 | | |
994 | 506k | static uint8_t PeekByte(State* state, size_t offset) { |
995 | | // TODO(eustas): dcheck overflow. |
996 | 506k | return state->data[state->pos + offset]; |
997 | 506k | } |
998 | | |
999 | 6.59M | static void SkipBytes(State* state, size_t len) { |
1000 | | // TODO(eustas): dcheck overflow. |
1001 | 6.59M | state->pos += len; |
1002 | 6.59M | } |
1003 | | |
1004 | 16.7M | static size_t GetBytesAvailable(State* state) { |
1005 | | // TODO(eustas): dcheck len > pos |
1006 | 16.7M | return state->len - state->pos; |
1007 | 16.7M | } |
1008 | | |
1009 | 11.4k | static size_t SkipAvailableBytes(State* state, size_t len) { |
1010 | 11.4k | size_t available = GetBytesAvailable(state); |
1011 | 11.4k | size_t skip_bytes = std::min(available, len); |
1012 | 11.4k | state->pos += skip_bytes; |
1013 | 11.4k | return skip_bytes; |
1014 | 11.4k | } |
1015 | | |
1016 | 459k | static BrunsliStatus DecodeBase128(State* state, size_t* val) { |
1017 | 459k | *val = 0; |
1018 | 459k | uint64_t b = 0x80; |
1019 | 459k | size_t i = 0; |
1020 | 965k | while ((i < 9) && (b & 0x80u)) { |
1021 | 684k | if (!CheckCanRead(state, i + 1)) return BRUNSLI_NOT_ENOUGH_DATA; |
1022 | 506k | b = PeekByte(state, i); |
1023 | 506k | *val |= (b & 0x7Fu) << (i * 7); |
1024 | 506k | ++i; |
1025 | 506k | } |
1026 | 281k | SkipBytes(state, i); |
1027 | 281k | return ((b & 0x80u) == 0) ? BRUNSLI_OK : BRUNSLI_INVALID_BRN; |
1028 | 459k | } |
1029 | | |
1030 | 6.24M | static Stage Fail(State* state, BrunsliStatus result) { |
1031 | 6.24M | InternalState& s = *state->internal; |
1032 | 6.24M | s.result = result; |
1033 | | // Preserve current stage for continuation / error reporting. |
1034 | 6.24M | s.last_stage = state->stage; |
1035 | 6.24M | return Stage::ERROR; |
1036 | 6.24M | } |
1037 | | |
1038 | 377k | static BrunsliStatus ReadTag(State* state, SectionState* section) { |
1039 | 377k | if (!CheckCanReadByte(state)) return BRUNSLI_NOT_ENOUGH_DATA; |
1040 | 239k | const uint8_t marker = ReadByte(state); |
1041 | | |
1042 | 239k | const size_t tag = marker >> 3u; |
1043 | 239k | if (tag == 0 || tag > 15) return BRUNSLI_INVALID_BRN; |
1044 | 239k | section->tag = tag; |
1045 | | |
1046 | 239k | const size_t wiring_type = marker & 0x7u; |
1047 | 239k | if (wiring_type != kBrunsliWiringTypeVarint && |
1048 | 239k | wiring_type != kBrunsliWiringTypeLengthDelimited) { |
1049 | 48 | return BRUNSLI_INVALID_BRN; |
1050 | 48 | } |
1051 | 239k | section->is_section = (wiring_type == kBrunsliWiringTypeLengthDelimited); |
1052 | | |
1053 | 239k | const uint32_t tag_bit = 1u << tag; |
1054 | 239k | if (section->tags_met & tag_bit) { |
1055 | 31 | BRUNSLI_LOG_ERROR() << "Duplicate marker " << std::hex |
1056 | 31 | << static_cast<int>(marker) << BRUNSLI_ENDL(); |
1057 | 31 | return BRUNSLI_INVALID_BRN; |
1058 | 31 | } |
1059 | 239k | section->tags_met |= tag_bit; |
1060 | | |
1061 | 239k | return BRUNSLI_OK; |
1062 | 239k | } |
1063 | | |
1064 | 189k | static BrunsliStatus EnterSection(State* state, SectionState* section) { |
1065 | 189k | size_t section_size; |
1066 | 189k | BrunsliStatus status = DecodeBase128(state, §ion_size); |
1067 | 189k | if (status != BRUNSLI_OK) return status; |
1068 | 114k | section->is_active = true; |
1069 | 114k | section->remaining = section_size; |
1070 | 114k | section->milestone = state->pos; |
1071 | 114k | section->projected_end = state->pos + section->remaining; |
1072 | 114k | return BRUNSLI_OK; |
1073 | 189k | } |
1074 | | |
1075 | 31.1k | static void LeaveSection(SectionState* section) { |
1076 | 31.1k | section->is_active = false; |
1077 | 31.1k | } |
1078 | | |
1079 | 17.4M | static bool IsOutOfSectionBounds(State* state) { |
1080 | 17.4M | return state->pos > state->internal->section.projected_end; |
1081 | 17.4M | } |
1082 | | |
1083 | 17.4M | static size_t RemainingSectionLength(State* state) { |
1084 | | // TODO(eustas): remove this check? |
1085 | 17.4M | if (IsOutOfSectionBounds(state)) return 0; |
1086 | 17.4M | return state->internal->section.projected_end - state->pos; |
1087 | 17.4M | } |
1088 | | |
1089 | 345k | static bool IsAtSectionBoundary(State* state) { |
1090 | 345k | return state->pos == state->internal->section.projected_end; |
1091 | 345k | } |
1092 | | |
1093 | 124k | Stage VerifySignature(State* state) { |
1094 | 124k | InternalState& s = *state->internal; |
1095 | | |
1096 | 124k | if (!CheckCanRead(state, kBrunsliSignatureSize)) { |
1097 | 92.3k | return Fail(state, BRUNSLI_NOT_ENOUGH_DATA); |
1098 | 92.3k | } |
1099 | 32.4k | const bool is_signature_ok = |
1100 | 32.4k | (memcmp(state->data + state->pos, kBrunsliSignature, |
1101 | 32.4k | kBrunsliSignatureSize) != 0); |
1102 | 32.4k | state->pos += kBrunsliSignatureSize; |
1103 | 32.4k | s.section.tags_met |= 1u << kBrunsliSignatureTag; |
1104 | 32.4k | if (is_signature_ok) return Fail(state, BRUNSLI_INVALID_BRN); |
1105 | 32.3k | return Stage::HEADER; |
1106 | 32.4k | } |
1107 | | |
1108 | | // Parses the brunsli header starting at data[*pos] and fills in *jpg. |
1109 | | // Sets *pos to the position after the header. |
1110 | | // Returns BRUNSLI_OK, unless the data is not valid brunsli byte stream |
1111 | | // or is truncated. |
1112 | 202k | Stage DecodeHeader(State* state, JPEGData* jpg) { |
1113 | 202k | InternalState& s = *state->internal; |
1114 | 202k | HeaderState& hs = s.header; |
1115 | | |
1116 | 589k | while (hs.stage != HeaderState::DONE) { |
1117 | 558k | switch (hs.stage) { |
1118 | 63.0k | case HeaderState::READ_TAG: { |
1119 | 63.0k | BrunsliStatus status = ReadTag(state, &s.section); |
1120 | 63.0k | if (status != BRUNSLI_OK) return Fail(state, status); |
1121 | 32.2k | if (s.section.tag != kBrunsliHeaderTag || !s.section.is_section) { |
1122 | 12 | return Fail(state, BRUNSLI_INVALID_BRN); |
1123 | 12 | } |
1124 | 32.2k | hs.stage = HeaderState::ENTER_SECTION; |
1125 | 32.2k | break; |
1126 | 32.2k | } |
1127 | | |
1128 | 48.2k | case HeaderState::ENTER_SECTION: { |
1129 | 48.2k | BrunsliStatus status = EnterSection(state, &s.section); |
1130 | 48.2k | if (status != BRUNSLI_OK) return Fail(state, status); |
1131 | 32.2k | hs.stage = HeaderState::ITEM_READ_TAG; |
1132 | 32.2k | break; |
1133 | 48.2k | } |
1134 | | |
1135 | 216k | case HeaderState::ITEM_READ_TAG: { |
1136 | 216k | if (IsAtSectionBoundary(state)) { |
1137 | 31.6k | hs.stage = HeaderState::FINALE; |
1138 | 31.6k | break; |
1139 | 31.6k | } |
1140 | 184k | BrunsliStatus status = ReadTag(state, &hs.section); |
1141 | 184k | if (status != BRUNSLI_OK) return Fail(state, status); |
1142 | 124k | const uint32_t tag_bit = 1u << hs.section.tag; |
1143 | 124k | if (hs.section.is_section) { |
1144 | 10.6k | if (kKnownHeaderVarintTags & tag_bit) { |
1145 | 10.5k | Fail(state, BRUNSLI_INVALID_BRN); |
1146 | 10.5k | } |
1147 | 10.6k | hs.stage = HeaderState::ITEM_ENTER_SECTION; |
1148 | 10.6k | break; |
1149 | 10.6k | } |
1150 | 114k | hs.stage = HeaderState::ITEM_READ_VALUE; |
1151 | 114k | break; |
1152 | 124k | } |
1153 | | |
1154 | 16.8k | case HeaderState::ITEM_ENTER_SECTION: { |
1155 | 16.8k | BrunsliStatus status = DecodeBase128(state, &hs.remaining_skip_length); |
1156 | 16.8k | if (status != BRUNSLI_OK) return Fail(state, status); |
1157 | 10.6k | hs.stage = HeaderState::ITEM_SKIP_CONTENTS; |
1158 | 10.6k | break; |
1159 | 16.8k | } |
1160 | | |
1161 | 11.4k | case HeaderState::ITEM_SKIP_CONTENTS: { |
1162 | 11.4k | size_t bytes_skipped = |
1163 | 11.4k | SkipAvailableBytes(state, hs.remaining_skip_length); |
1164 | 11.4k | hs.remaining_skip_length -= bytes_skipped; |
1165 | 11.4k | if (hs.remaining_skip_length > 0) { |
1166 | 1.01k | return Fail(state, BRUNSLI_NOT_ENOUGH_DATA); |
1167 | 1.01k | } |
1168 | 10.3k | hs.stage = HeaderState::ITEM_READ_TAG; |
1169 | 10.3k | break; |
1170 | 11.4k | } |
1171 | | |
1172 | 170k | case HeaderState::ITEM_READ_VALUE: { |
1173 | 170k | size_t value; |
1174 | 170k | BrunsliStatus status = DecodeBase128(state, &value); |
1175 | 170k | if (status != BRUNSLI_OK) return Fail(state, status); |
1176 | 114k | hs.varint_values[hs.section.tag] = value; |
1177 | 114k | hs.stage = HeaderState::ITEM_READ_TAG; |
1178 | 114k | break; |
1179 | 170k | } |
1180 | | |
1181 | 31.6k | case HeaderState::FINALE: { |
1182 | 31.6k | const bool has_version = |
1183 | 31.6k | hs.section.tags_met & (1u << kBrunsliHeaderVersionCompTag); |
1184 | 31.6k | if (!has_version) return Fail(state, BRUNSLI_INVALID_BRN); |
1185 | 31.6k | const size_t version_and_comp_count = |
1186 | 31.6k | hs.varint_values[kBrunsliHeaderVersionCompTag]; |
1187 | | |
1188 | 31.6k | const size_t version = version_and_comp_count >> 2u; |
1189 | 31.6k | jpg->version = static_cast<int>(version); |
1190 | | |
1191 | 31.6k | if (version == 1) { // fallback mode |
1192 | | // TODO(eustas): do we need this? |
1193 | 647 | jpg->width = 0; |
1194 | 647 | jpg->height = 0; |
1195 | 647 | hs.stage = HeaderState::DONE; |
1196 | 647 | break; |
1197 | 647 | } |
1198 | | |
1199 | | // Wrong mode = fallback + something. |
1200 | 31.0k | if ((version & 1u) != 0) { |
1201 | 36 | return Fail(state, BRUNSLI_INVALID_BRN); |
1202 | 36 | } |
1203 | | // Unknown mode - only 3 bits are defined. |
1204 | 30.9k | if ((version & ~0x7u) != 0) { |
1205 | 94 | return Fail(state, BRUNSLI_INVALID_BRN); |
1206 | 94 | } |
1207 | | |
1208 | | // Otherwise regular brunsli. |
1209 | 30.8k | state->use_legacy_context_model = !(version & 2); |
1210 | | |
1211 | | // Do not allow "original_jpg" for regular Brunsli files. |
1212 | 30.8k | s.section.tags_met |= 1u << kBrunsliOriginalJpgTag; |
1213 | | |
1214 | 30.8k | const bool has_width = |
1215 | 30.8k | hs.section.tags_met & (1u << kBrunsliHeaderWidthTag); |
1216 | 30.8k | if (!has_width) return Fail(state, BRUNSLI_INVALID_BRN); |
1217 | 30.8k | const size_t width = hs.varint_values[kBrunsliHeaderWidthTag]; |
1218 | 30.8k | const bool has_height = |
1219 | 30.8k | hs.section.tags_met & (1u << kBrunsliHeaderHeightTag); |
1220 | 30.8k | if (!has_height) return Fail(state, BRUNSLI_INVALID_BRN); |
1221 | 30.8k | const size_t height = hs.varint_values[kBrunsliHeaderHeightTag]; |
1222 | | |
1223 | 30.8k | if (width == 0 || height == 0) return Fail(state, BRUNSLI_INVALID_BRN); |
1224 | 30.8k | if (width > kMaxDimPixels || height > kMaxDimPixels) { |
1225 | 358 | return Fail(state, BRUNSLI_INVALID_BRN); |
1226 | 358 | } |
1227 | 30.5k | jpg->width = static_cast<int>(width); |
1228 | 30.5k | jpg->height = static_cast<int>(height); |
1229 | | |
1230 | 30.5k | const size_t num_components = (version_and_comp_count & 3u) + 1u; |
1231 | 30.5k | jpg->components.resize(num_components); |
1232 | | |
1233 | 30.5k | const bool has_subsampling = |
1234 | 30.5k | hs.section.tags_met & (1u << kBrunsliHeaderSubsamplingTag); |
1235 | 30.5k | if (!has_subsampling) return Fail(state, BRUNSLI_INVALID_BRN); |
1236 | 30.4k | size_t subsampling_code = |
1237 | 30.4k | hs.varint_values[kBrunsliHeaderSubsamplingTag]; |
1238 | | |
1239 | 79.1k | for (size_t i = 0; i < jpg->components.size(); ++i) { |
1240 | 48.6k | JPEGComponent* c = &jpg->components[i]; |
1241 | 48.6k | c->v_samp_factor = (subsampling_code & 0xFu) + 1; |
1242 | 48.6k | subsampling_code >>= 4u; |
1243 | 48.6k | c->h_samp_factor = (subsampling_code & 0xFu) + 1; |
1244 | 48.6k | subsampling_code >>= 4u; |
1245 | 48.6k | if (c->v_samp_factor > kBrunsliMaxSampling) { |
1246 | 2 | return Fail(state, BRUNSLI_INVALID_BRN); |
1247 | 2 | } |
1248 | 48.6k | if (c->h_samp_factor > kBrunsliMaxSampling) { |
1249 | 2 | return Fail(state, BRUNSLI_INVALID_BRN); |
1250 | 2 | } |
1251 | 48.6k | } |
1252 | 30.4k | if (!UpdateSubsamplingDerivatives(jpg)) { |
1253 | 5 | return Fail(state, BRUNSLI_INVALID_BRN); |
1254 | 5 | } |
1255 | | |
1256 | 30.4k | PrepareMeta(jpg, state); |
1257 | | |
1258 | 30.4k | hs.stage = HeaderState::DONE; |
1259 | 30.4k | break; |
1260 | 30.4k | } |
1261 | | |
1262 | 0 | default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR); |
1263 | 558k | } |
1264 | 558k | } |
1265 | | |
1266 | 31.0k | LeaveSection(&s.section); |
1267 | 31.0k | return (jpg->version == kFallbackVersion) ? Stage::FALLBACK : Stage::SECTION; |
1268 | 202k | } |
1269 | | |
1270 | 477k | static BrunsliStatus DecodeMetaDataSection(State* state, JPEGData* jpg) { |
1271 | 477k | InternalState& s = *state->internal; |
1272 | 477k | MetadataState& ms = s.metadata; |
1273 | | |
1274 | 477k | if (ms.decompression_stage == MetadataDecompressionStage::DONE) { |
1275 | 0 | return BRUNSLI_INVALID_BRN; |
1276 | 0 | } |
1277 | | |
1278 | 477k | if (ms.decompression_stage == MetadataDecompressionStage::INITIAL) { |
1279 | 7.71k | if (IsAtSectionBoundary(state)) { |
1280 | 7 | ms.decompression_stage = MetadataDecompressionStage::DONE; |
1281 | 7 | return BRUNSLI_OK; |
1282 | 7 | } |
1283 | 7.70k | if (RemainingSectionLength(state) == 1) { |
1284 | 142 | if (!CheckCanReadByte(state)) { |
1285 | 45 | return BRUNSLI_NOT_ENOUGH_DATA; |
1286 | 45 | } |
1287 | 97 | uint8_t data[1]; |
1288 | 97 | data[0] = ReadByte(state); |
1289 | 97 | bool ok = ProcessMetaData(data, 1, &ms, jpg) && ms.CanFinish(); |
1290 | 97 | ms.decompression_stage = MetadataDecompressionStage::DONE; |
1291 | 97 | return ok ? BRUNSLI_OK : BRUNSLI_INVALID_BRN; |
1292 | 142 | } |
1293 | 7.56k | ms.decompression_stage = |
1294 | 7.56k | MetadataDecompressionStage::READ_LENGTH; |
1295 | 7.56k | } |
1296 | | |
1297 | 477k | if (ms.decompression_stage == MetadataDecompressionStage::READ_LENGTH) { |
1298 | 13.9k | BrunsliStatus status = DecodeBase128(state, &ms.metadata_size); |
1299 | 13.9k | if (status != BRUNSLI_OK) return status; |
1300 | | // TODO(eustas): ms.metadata_size should be limited to avoid "zip-bombs". |
1301 | 7.40k | if (IsOutOfSectionBounds(state)) return BRUNSLI_INVALID_BRN; |
1302 | 7.39k | if (RemainingSectionLength(state) == 0) return BRUNSLI_INVALID_BRN; |
1303 | 7.39k | ms.brotli = BrotliDecoderCreateInstance(nullptr, nullptr, nullptr); |
1304 | 7.39k | if (ms.brotli == nullptr) return BRUNSLI_DECOMPRESSION_ERROR; |
1305 | 7.39k | ms.decompression_stage = MetadataDecompressionStage::DECOMPRESSING; |
1306 | 7.39k | } |
1307 | | |
1308 | 470k | if (ms.decompression_stage == MetadataDecompressionStage::DECOMPRESSING) { |
1309 | | // Free Brotli decoder and return result |
1310 | 470k | const auto finish_decompression = [&ms] (BrunsliStatus result) { |
1311 | 3.54k | BRUNSLI_DCHECK(ms.brotli != nullptr); |
1312 | 3.54k | BrotliDecoderDestroyInstance(ms.brotli); |
1313 | 3.54k | ms.brotli = nullptr; |
1314 | 3.54k | ms.decompression_stage = MetadataDecompressionStage::DONE; |
1315 | 3.54k | return result; |
1316 | 3.54k | }; |
1317 | | |
1318 | 833k | while (true) { |
1319 | 833k | size_t available_bytes = |
1320 | 833k | std::min(GetBytesAvailable(state), RemainingSectionLength(state)); |
1321 | 833k | size_t available_in = available_bytes; |
1322 | 833k | const uint8_t* next_in = state->data + state->pos; |
1323 | 833k | size_t available_out = 0; |
1324 | 833k | BrotliDecoderResult result = BrotliDecoderDecompressStream( |
1325 | 833k | ms.brotli, &available_in, &next_in, &available_out, nullptr, nullptr); |
1326 | 833k | if (result == BROTLI_DECODER_RESULT_ERROR) { |
1327 | 1.65k | return finish_decompression(BRUNSLI_INVALID_BRN); |
1328 | 1.65k | } |
1329 | 831k | size_t chunk_size = 0; |
1330 | 831k | const uint8_t* chunk_data = |
1331 | 831k | BrotliDecoderTakeOutput(ms.brotli, &chunk_size); |
1332 | 831k | ms.decompressed_size += chunk_size; |
1333 | 831k | if (ms.decompressed_size > ms.metadata_size) { |
1334 | 1.25k | return finish_decompression(BRUNSLI_INVALID_BRN); |
1335 | 1.25k | } |
1336 | 830k | size_t consumed_bytes = available_bytes - available_in; |
1337 | 830k | SkipBytes(state, consumed_bytes); |
1338 | 830k | bool chunk_ok = ProcessMetaData(chunk_data, chunk_size, &ms, jpg); |
1339 | 830k | if (!chunk_ok) return finish_decompression(BRUNSLI_INVALID_BRN); |
1340 | 830k | if (result == BROTLI_DECODER_RESULT_SUCCESS) { |
1341 | 353 | if (RemainingSectionLength(state) != 0) { |
1342 | 218 | return finish_decompression(BRUNSLI_INVALID_BRN); |
1343 | 218 | } |
1344 | 135 | if (ms.decompressed_size != ms.metadata_size) { |
1345 | 128 | return finish_decompression(BRUNSLI_INVALID_BRN); |
1346 | 128 | } |
1347 | 7 | if (!ms.CanFinish()) return finish_decompression(BRUNSLI_INVALID_BRN); |
1348 | 5 | return finish_decompression(BRUNSLI_OK); |
1349 | 7 | } |
1350 | 829k | if (result == BROTLI_DECODER_RESULT_NEEDS_MORE_OUTPUT) continue; |
1351 | 467k | BRUNSLI_DCHECK(result == BROTLI_DECODER_RESULT_NEEDS_MORE_INPUT); |
1352 | 467k | if (RemainingSectionLength(state) == 0) { |
1353 | 48 | return finish_decompression(BRUNSLI_INVALID_BRN); |
1354 | 48 | } |
1355 | 467k | return BRUNSLI_NOT_ENOUGH_DATA; |
1356 | 467k | } |
1357 | 470k | } |
1358 | | |
1359 | | // Unreachable. |
1360 | 0 | BRUNSLI_DCHECK(false); |
1361 | 0 | return BRUNSLI_DECOMPRESSION_ERROR; |
1362 | 470k | } |
1363 | | |
1364 | | /** |
1365 | | * Wraps result, depending on the state of input. |
1366 | | * |
1367 | | * If parser needs more data, but section data is depleted, |
1368 | | * then input is corrupted. |
1369 | | */ |
1370 | 5.21M | static BrunsliStatus CheckBoundary(State* state, BrunsliStatus result) { |
1371 | 5.21M | if (result == BRUNSLI_NOT_ENOUGH_DATA) { |
1372 | 5.12M | bool last = (RemainingSectionLength(state) <= GetBytesAvailable(state)); |
1373 | 5.12M | return last ? BRUNSLI_INVALID_BRN : BRUNSLI_NOT_ENOUGH_DATA; |
1374 | 5.12M | } else { |
1375 | 83.7k | return result; |
1376 | 83.7k | } |
1377 | 5.21M | } |
1378 | | |
1379 | 5.17M | static void PrepareBitReader(BrunsliBitReader* br, State* state) { |
1380 | 5.17M | size_t chunk_len = |
1381 | 5.17M | std::min(GetBytesAvailable(state), RemainingSectionLength(state)); |
1382 | 5.17M | BrunsliBitReaderResume(br, state->data + state->pos, chunk_len); |
1383 | 5.17M | BRUNSLI_DCHECK(BrunsliBitReaderIsHealthy(br)); |
1384 | 5.17M | } |
1385 | | |
1386 | | /** |
1387 | | * Marks data used by bit-reader as consumed. |
1388 | | */ |
1389 | | static BrunsliStatus SuspendBitReader(BrunsliBitReader* br, State* state, |
1390 | 5.17M | BrunsliStatus result) { |
1391 | 5.17M | size_t chunk_len = |
1392 | 5.17M | std::min(GetBytesAvailable(state), RemainingSectionLength(state)); |
1393 | 5.17M | size_t unused_bytes = BrunsliBitReaderSuspend(br); |
1394 | 5.17M | size_t consumed_bytes = chunk_len - unused_bytes; |
1395 | 5.17M | SkipBytes(state, consumed_bytes); |
1396 | 5.17M | result = CheckBoundary(state, result); |
1397 | | // Once BitReader becomes unhealthy, further decoding should be impossible. |
1398 | 5.17M | BRUNSLI_DCHECK( |
1399 | 5.17M | BrunsliBitReaderIsHealthy(br) || |
1400 | 5.17M | ((result != BRUNSLI_OK) && (result != BRUNSLI_NOT_ENOUGH_DATA))); |
1401 | 5.17M | return result; |
1402 | 5.17M | } |
1403 | | |
1404 | 5.07M | static BrunsliStatus DecodeJPEGInternalsSection(State* state, JPEGData* jpg) { |
1405 | 5.07M | InternalState& s = *state->internal; |
1406 | 5.07M | JpegInternalsState& js = s.internals; |
1407 | 5.07M | BrunsliBitReader* br = &js.br; |
1408 | | |
1409 | 5.07M | if (js.stage == JpegInternalsState::INIT) { |
1410 | 22.3k | BrunsliBitReaderInit(br); |
1411 | 22.3k | js.stage = JpegInternalsState::READ_MARKERS; |
1412 | 22.3k | } |
1413 | 5.07M | PrepareBitReader(br, state); |
1414 | | |
1415 | 5.07M | const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus { |
1416 | 5.07M | return SuspendBitReader(br, state, result); |
1417 | 5.07M | }; |
1418 | | |
1419 | 5.07M | if (js.stage == JpegInternalsState::READ_MARKERS) { |
1420 | 14.9M | while (true) { |
1421 | 14.9M | if (!BrunsliBitReaderCanRead(br, 6)) { |
1422 | 2.67M | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1423 | 2.67M | } |
1424 | 12.2M | uint8_t marker = 0xc0 + BrunsliBitReaderRead(br, 6); |
1425 | 12.2M | jpg->marker_order.push_back(marker); |
1426 | 12.2M | if (marker == 0xc4) ++js.dht_count; |
1427 | 12.2M | if (marker == 0xdd) js.have_dri = true; |
1428 | 12.2M | if (marker == 0xda) ++js.num_scans; |
1429 | 12.2M | if (marker == 0xd9) break; |
1430 | 12.2M | } |
1431 | 21.9k | js.stage = JpegInternalsState::READ_DRI; |
1432 | 21.9k | } |
1433 | | |
1434 | 2.39M | if (js.stage == JpegInternalsState::READ_DRI) { |
1435 | 25.3k | if (js.have_dri) { |
1436 | 6.77k | if (!BrunsliBitReaderCanRead(br, 16)) { |
1437 | 3.59k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1438 | 3.59k | } |
1439 | 3.18k | jpg->restart_interval = BrunsliBitReaderRead(br, 16); |
1440 | 3.18k | } |
1441 | 21.7k | js.stage = JpegInternalsState::READ_HUFFMAN_LAST; |
1442 | 21.7k | } |
1443 | | |
1444 | 2.38M | if (js.stage & JpegInternalsState::DECODE_HUFFMAN_MASK) { |
1445 | 73.0k | BrunsliStatus status = DecodeHuffmanCode(state, jpg); |
1446 | 73.0k | if (status != BRUNSLI_OK) return suspend_bit_reader(status); |
1447 | 21.1k | js.stage = JpegInternalsState::PREPARE_READ_SCANS; |
1448 | 21.1k | } |
1449 | | |
1450 | 2.33M | if (js.stage == JpegInternalsState::PREPARE_READ_SCANS) { |
1451 | 21.1k | if (js.dht_count != js.terminal_huffman_code_count) { |
1452 | 340 | BRUNSLI_LOG_ERROR() << "Invalid number of DHT markers" << BRUNSLI_ENDL(); |
1453 | 340 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1454 | 340 | } |
1455 | 20.8k | if (js.num_scans > 0) { |
1456 | 10.2k | jpg->scan_info.resize(js.num_scans); |
1457 | 10.2k | js.i = 0; |
1458 | 10.2k | js.stage = JpegInternalsState::READ_SCAN_COMMON; |
1459 | 10.5k | } else { |
1460 | 10.5k | js.stage = JpegInternalsState::READ_NUM_QUANT; |
1461 | 10.5k | } |
1462 | 20.8k | } |
1463 | | |
1464 | 2.33M | if (js.stage & JpegInternalsState::DECODE_SCAN_MASK) { |
1465 | 1.74M | BrunsliStatus status = DecodeScanInfo(state, jpg); |
1466 | 1.74M | if (status != BRUNSLI_OK) return suspend_bit_reader(status); |
1467 | 9.51k | js.stage = JpegInternalsState::READ_NUM_QUANT; |
1468 | 9.51k | } |
1469 | | |
1470 | 600k | if (js.stage == JpegInternalsState::READ_NUM_QUANT) { |
1471 | 21.2k | if (!BrunsliBitReaderCanRead(br, 2)) { |
1472 | 1.39k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1473 | 1.39k | } |
1474 | 19.8k | int num_quant_tables = BrunsliBitReaderRead(br, 2) + 1; |
1475 | 19.8k | jpg->quant.resize(num_quant_tables); |
1476 | 19.8k | js.i = 0; |
1477 | 19.8k | js.stage = JpegInternalsState::READ_QUANT; |
1478 | 19.8k | } |
1479 | | |
1480 | 618k | while (js.stage == JpegInternalsState::READ_QUANT) { |
1481 | 49.4k | if (js.i >= jpg->quant.size()) { |
1482 | 19.2k | js.stage = JpegInternalsState::READ_COMP_ID_SCHEME; |
1483 | 19.2k | break; |
1484 | 19.2k | } |
1485 | | // 6 or 7 bits are used, but we know that at least one more bit is |
1486 | | // guaranteed to be used by varint out of the loop. |
1487 | 30.2k | if (!BrunsliBitReaderCanRead(br, 7)) { |
1488 | 10.0k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1489 | 10.0k | } |
1490 | 20.2k | JPEGQuantTable* q = &jpg->quant[js.i]; |
1491 | 20.2k | q->index = BrunsliBitReaderRead(br, 2); |
1492 | 20.2k | q->is_last = (js.i == jpg->quant.size() - 1) || BrunsliBitReaderRead(br, 1); |
1493 | 20.2k | q->precision = BrunsliBitReaderRead(br, 4); |
1494 | 20.2k | if (q->precision > 1) { |
1495 | 303 | BRUNSLI_LOG_ERROR() << "Invalid quantization table precision: " |
1496 | 303 | << q->precision << BRUNSLI_ENDL(); |
1497 | 303 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1498 | 303 | } |
1499 | | // note that q->values[] are initialized to invalid 0 values. |
1500 | 19.8k | ++js.i; |
1501 | 19.8k | } |
1502 | | |
1503 | 588k | if (js.stage == JpegInternalsState::READ_COMP_ID_SCHEME) { |
1504 | 19.2k | if (!BrunsliBitReaderCanRead(br, 2)) { |
1505 | 233 | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1506 | 233 | } |
1507 | 19.0k | int comp_ids = BrunsliBitReaderRead(br, 2); |
1508 | 19.0k | static const size_t kMinRequiredComponents[4] = { |
1509 | 19.0k | 3 /* Ids123*/, 1 /* IdsGray */, 3 /* IdsRGB */, 0 /* IdsCustom */ |
1510 | 19.0k | }; |
1511 | 19.0k | if (jpg->components.size() < kMinRequiredComponents[comp_ids]) { |
1512 | 42 | BRUNSLI_LOG_ERROR() << "Insufficient number of components for ColorId #" |
1513 | 42 | << comp_ids << BRUNSLI_ENDL(); |
1514 | 42 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1515 | 42 | } |
1516 | 18.9k | js.stage = JpegInternalsState::READ_NUM_PADDING_BITS; |
1517 | 18.9k | if (comp_ids == kComponentIds123) { |
1518 | 816 | jpg->components[0].id = 1; |
1519 | 816 | jpg->components[1].id = 2; |
1520 | 816 | jpg->components[2].id = 3; |
1521 | 18.1k | } else if (comp_ids == kComponentIdsGray) { |
1522 | 16.8k | jpg->components[0].id = 1; |
1523 | 16.8k | } else if (comp_ids == kComponentIdsRGB) { |
1524 | 148 | jpg->components[0].id = 'R'; |
1525 | 148 | jpg->components[1].id = 'G'; |
1526 | 148 | jpg->components[2].id = 'B'; |
1527 | 1.14k | } else { |
1528 | 1.14k | BRUNSLI_DCHECK(comp_ids == kComponentIdsCustom); |
1529 | 1.14k | js.i = 0; |
1530 | 1.14k | js.stage = JpegInternalsState::READ_COMP_ID; |
1531 | 1.14k | } |
1532 | 18.9k | } |
1533 | | |
1534 | 588k | if (js.stage == JpegInternalsState::READ_COMP_ID) { |
1535 | 2.92k | while (js.i < jpg->components.size()) { |
1536 | 1.85k | if (!BrunsliBitReaderCanRead(br, 8)) { |
1537 | 717 | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1538 | 717 | } |
1539 | 1.13k | jpg->components[js.i].id = BrunsliBitReaderRead(br, 8); |
1540 | 1.13k | ++js.i; |
1541 | 1.13k | } |
1542 | 1.07k | js.stage = JpegInternalsState::READ_NUM_PADDING_BITS; |
1543 | 1.07k | } |
1544 | | |
1545 | 587k | if (js.stage == JpegInternalsState::READ_NUM_PADDING_BITS) { |
1546 | | // TODO(eustas): sanitize: should not be bigger than |
1547 | | // 7 x (num_scans + num_blocks / dri) |
1548 | | // security: limit is 32b for n_size |
1549 | 19.7k | if (!DecodeLimitedVarint<8>(&js.varint, br, 4)) { |
1550 | 922 | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1551 | 922 | } |
1552 | 18.7k | js.num_padding_bits = js.varint.value; |
1553 | 18.7k | jpg->has_zero_padding_bit = (js.num_padding_bits > 0); |
1554 | 18.7k | if (js.num_padding_bits > PaddingBitsLimit(*jpg)) { |
1555 | 107 | BRUNSLI_LOG_ERROR() << "Suspicious number of padding bits " |
1556 | 107 | << js.num_padding_bits << BRUNSLI_ENDL(); |
1557 | 107 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1558 | 107 | } |
1559 | 18.6k | js.i = 0; |
1560 | 18.6k | js.stage = JpegInternalsState::READ_PADDING_BITS; |
1561 | 18.6k | } |
1562 | | |
1563 | 586k | if (js.stage == JpegInternalsState::READ_PADDING_BITS) { |
1564 | 6.82M | while (js.i < js.num_padding_bits) { |
1565 | 6.80M | if (!BrunsliBitReaderCanRead(br, 1)) { |
1566 | 529k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1567 | 529k | } |
1568 | 6.27M | jpg->padding_bits.emplace_back(BrunsliBitReaderRead(br, 1)); |
1569 | 6.27M | ++js.i; |
1570 | 6.27M | } |
1571 | 18.5k | suspend_bit_reader(BRUNSLI_OK); |
1572 | 18.5k | BrunsliBitReaderFinish(br); |
1573 | 18.5k | if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN; |
1574 | 18.5k | js.i = 0; |
1575 | 18.5k | js.stage = JpegInternalsState::ITERATE_MARKERS; |
1576 | 38.0k | } else { |
1577 | | // no-op |
1578 | 38.0k | suspend_bit_reader(BRUNSLI_OK); |
1579 | 38.0k | } |
1580 | | |
1581 | 443k | while (true) { |
1582 | 443k | switch (js.stage) { |
1583 | 318k | case JpegInternalsState::ITERATE_MARKERS: { |
1584 | 318k | if (js.i >= jpg->marker_order.size()) { |
1585 | 17.9k | js.stage = JpegInternalsState::DONE; |
1586 | 300k | } else if (jpg->marker_order[js.i] == 0xFF) { |
1587 | 34.6k | js.stage = JpegInternalsState::READ_INTERMARKER_LENGTH; |
1588 | 265k | } else { |
1589 | 265k | ++js.i; |
1590 | 265k | } |
1591 | 318k | continue; |
1592 | 0 | } |
1593 | | |
1594 | 67.9k | case JpegInternalsState::READ_INTERMARKER_LENGTH: { |
1595 | 67.9k | BrunsliStatus status = DecodeBase128(state, &js.intermarker_length); |
1596 | 67.9k | if (status != BRUNSLI_OK) return CheckBoundary(state, status); |
1597 | 34.4k | if (js.intermarker_length > RemainingSectionLength(state)) { |
1598 | 140 | return BRUNSLI_INVALID_BRN; |
1599 | 140 | } |
1600 | 34.2k | jpg->inter_marker_data.emplace_back(); |
1601 | 34.2k | js.stage = JpegInternalsState::READ_INTERMARKER_DATA; |
1602 | 34.2k | continue; |
1603 | 34.4k | } |
1604 | | |
1605 | 39.0k | case JpegInternalsState::READ_INTERMARKER_DATA: { |
1606 | 39.0k | auto& dest = jpg->inter_marker_data.back(); |
1607 | 39.0k | size_t piece_limit = js.intermarker_length - dest.size(); |
1608 | 39.0k | size_t piece_size = std::min(piece_limit, GetBytesAvailable(state)); |
1609 | 39.0k | Append(&dest, state->data + state->pos, piece_size); |
1610 | 39.0k | SkipBytes(state, piece_size); |
1611 | 39.0k | if (dest.size() < js.intermarker_length) { |
1612 | 4.92k | BRUNSLI_DCHECK(GetBytesAvailable(state) == 0); |
1613 | 4.92k | BRUNSLI_DCHECK(RemainingSectionLength(state) > 0); |
1614 | 4.92k | return BRUNSLI_NOT_ENOUGH_DATA; |
1615 | 4.92k | } |
1616 | 34.1k | ++js.i; |
1617 | 34.1k | js.stage = JpegInternalsState::ITERATE_MARKERS; |
1618 | 34.1k | continue; |
1619 | 39.0k | } |
1620 | | |
1621 | 17.9k | default: { /* no-op */ } |
1622 | 443k | } |
1623 | 17.9k | break; // no matching stage has been found; exit the loop. |
1624 | 443k | } |
1625 | | |
1626 | 17.9k | if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN; |
1627 | | |
1628 | 17.7k | return BRUNSLI_OK; |
1629 | 17.9k | } |
1630 | | |
1631 | 27.8k | static BrunsliStatus DecodeQuantDataSection(State* state, JPEGData* jpg) { |
1632 | 27.8k | InternalState& s = *state->internal; |
1633 | 27.8k | QuantDataState& qs = s.quant; |
1634 | 27.8k | BrunsliBitReader* br = &qs.br; |
1635 | | |
1636 | 27.8k | if (qs.stage == QuantDataState::INIT) { |
1637 | 14.6k | BrunsliBitReaderInit(br); |
1638 | 14.6k | qs.stage = QuantDataState::READ_NUM_QUANT; |
1639 | 14.6k | } |
1640 | 27.8k | PrepareBitReader(br, state); |
1641 | | |
1642 | 27.8k | const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus { |
1643 | 27.8k | return SuspendBitReader(br, state, result); |
1644 | 27.8k | }; |
1645 | | |
1646 | 27.8k | if (qs.stage == QuantDataState::READ_NUM_QUANT) { |
1647 | 22.8k | if (!BrunsliBitReaderCanRead(br, 2)) { |
1648 | 8.47k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1649 | 8.47k | } |
1650 | 14.4k | size_t num_quant_tables = BrunsliBitReaderRead(br, 2) + 1; |
1651 | 14.4k | if (jpg->quant.size() != num_quant_tables) { |
1652 | 183 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1653 | 183 | } |
1654 | 14.2k | qs.predictor.resize(kDCTBlockSize); |
1655 | 14.2k | qs.i = 0; |
1656 | 14.2k | qs.stage = QuantDataState::READ_STOCK; |
1657 | 14.2k | } |
1658 | | |
1659 | 137k | while (true) { |
1660 | 137k | switch (qs.stage) { |
1661 | 26.8k | case QuantDataState::READ_STOCK: { |
1662 | 26.8k | if (qs.i >= jpg->quant.size()) { |
1663 | 12.2k | std::vector<uint8_t>().swap(qs.predictor); |
1664 | 12.2k | qs.i = 0; |
1665 | 12.2k | qs.stage = QuantDataState::READ_QUANT_IDX; |
1666 | 12.2k | continue; |
1667 | 12.2k | } |
1668 | | // Depending on еру 1-st bit, it is guaranteed that we will need to read |
1669 | | // at least 3 or 6 more bits. |
1670 | 14.6k | if (!BrunsliBitReaderCanRead(br, 4)) { |
1671 | 264 | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1672 | 264 | } |
1673 | 14.3k | qs.data_precision = 0; |
1674 | 14.3k | bool is_short = !BrunsliBitReaderRead(br, 1); |
1675 | 14.3k | if (is_short) { |
1676 | 12.3k | const size_t short_code = BrunsliBitReaderRead(br, 3); |
1677 | 12.3k | int32_t* table = jpg->quant[qs.i].values.data(); |
1678 | 12.3k | size_t selector = (qs.i > 0) ? 1 : 0; |
1679 | 805k | for (size_t k = 0; k < kDCTBlockSize; ++k) { |
1680 | 792k | table[k] = kStockQuantizationTables[selector][short_code][k]; |
1681 | 792k | } |
1682 | 12.3k | qs.stage = QuantDataState::UPDATE; |
1683 | 12.3k | } else { |
1684 | 1.97k | qs.stage = QuantDataState::READ_Q_FACTOR; |
1685 | 1.97k | } |
1686 | 14.3k | continue; |
1687 | 14.6k | } |
1688 | | |
1689 | 2.75k | case QuantDataState::READ_Q_FACTOR: { |
1690 | 2.75k | if (!BrunsliBitReaderCanRead(br, 6)) { |
1691 | 1.02k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1692 | 1.02k | } |
1693 | 1.72k | const uint32_t q_factor = BrunsliBitReaderRead(br, 6); |
1694 | 1.72k | FillQuantMatrix(qs.i > 0, q_factor, qs.predictor.data()); |
1695 | 1.72k | qs.j = 0; |
1696 | 1.72k | qs.delta = 0; |
1697 | 1.72k | qs.stage = QuantDataState::READ_DIFF_IS_ZERO; |
1698 | 1.72k | continue; |
1699 | 2.75k | } |
1700 | | |
1701 | 35.1k | case QuantDataState::READ_DIFF_IS_ZERO: { |
1702 | 35.1k | if (qs.j >= kDCTBlockSize) { |
1703 | 410 | qs.stage = QuantDataState::UPDATE; |
1704 | 410 | continue; |
1705 | 410 | } |
1706 | 34.7k | if (!BrunsliBitReaderCanRead(br, 1)) { |
1707 | 1.89k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1708 | 1.89k | } |
1709 | 32.8k | if (BrunsliBitReaderRead(br, 1)) { |
1710 | 6.74k | qs.stage = QuantDataState::READ_DIFF_SIGN; |
1711 | 26.1k | } else { |
1712 | 26.1k | qs.stage = QuantDataState::APPLY_DIFF; |
1713 | 26.1k | } |
1714 | 32.8k | continue; |
1715 | 34.7k | } |
1716 | | |
1717 | 6.94k | case QuantDataState::READ_DIFF_SIGN: { |
1718 | 6.94k | if (!BrunsliBitReaderCanRead(br, 1)) { |
1719 | 459 | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1720 | 459 | } |
1721 | 6.49k | qs.sign = BrunsliBitReaderRead(br, 1) ? -1 : 1; |
1722 | 6.49k | qs.stage = QuantDataState::READ_DIFF; |
1723 | 6.49k | continue; |
1724 | 6.94k | } |
1725 | | |
1726 | 8.59k | case QuantDataState::READ_DIFF: { |
1727 | 8.59k | if (!DecodeVarint(&qs.vs, br, 16)) { |
1728 | 2.39k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1729 | 2.39k | } |
1730 | 6.19k | int diff = static_cast<int>(qs.vs.value) + 1; |
1731 | 6.19k | qs.delta += qs.sign * diff; |
1732 | 6.19k | qs.stage = QuantDataState::APPLY_DIFF; |
1733 | 6.19k | continue; |
1734 | 8.59k | } |
1735 | | |
1736 | 32.3k | case QuantDataState::APPLY_DIFF: { |
1737 | 32.3k | const int k = kJPEGNaturalOrder[qs.j]; |
1738 | 32.3k | const int quant_value = qs.predictor[k] + qs.delta; |
1739 | 32.3k | jpg->quant[qs.i].values[k] = quant_value; |
1740 | 32.3k | if (quant_value <= 0) { |
1741 | 244 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1742 | 244 | } |
1743 | 32.1k | if (quant_value >= 256) { |
1744 | 16.1k | qs.data_precision = 1; |
1745 | 16.1k | } |
1746 | 32.1k | if (quant_value >= 65536) { |
1747 | 237 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1748 | 237 | } |
1749 | 31.8k | ++qs.j; |
1750 | 31.8k | qs.stage = QuantDataState::READ_DIFF_IS_ZERO; |
1751 | 31.8k | continue; |
1752 | 32.1k | } |
1753 | | |
1754 | 12.7k | case QuantDataState::UPDATE: { |
1755 | 12.7k | if (jpg->quant[qs.i].precision < qs.data_precision) { |
1756 | 211 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1757 | 211 | } |
1758 | | // jpg->quant[qs.i].precision > qs.data_precision means that original |
1759 | | // JPEG1 was inefficiently encoded. |
1760 | 12.5k | ++qs.i; |
1761 | 12.5k | qs.stage = QuantDataState::READ_STOCK; |
1762 | 12.5k | continue; |
1763 | 12.7k | } |
1764 | | |
1765 | 12.4k | default: { /* no-op */ } |
1766 | 137k | } |
1767 | 12.4k | break; // no matching stage has been found; exit the loop. |
1768 | 137k | } |
1769 | | |
1770 | 37.6k | while (qs.stage == QuantDataState::READ_QUANT_IDX) { |
1771 | 25.8k | if (qs.i >= jpg->components.size()) { |
1772 | 11.7k | qs.stage = QuantDataState::FINISH; |
1773 | 11.7k | continue; |
1774 | 11.7k | } |
1775 | 14.0k | JPEGComponent* c = &jpg->components[qs.i]; |
1776 | 14.0k | if (!BrunsliBitReaderCanRead(br, 2)) { |
1777 | 461 | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1778 | 461 | } |
1779 | 13.6k | c->quant_idx = BrunsliBitReaderRead(br, 2); |
1780 | 13.6k | if (c->quant_idx >= jpg->quant.size()) { |
1781 | 243 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1782 | 243 | } |
1783 | 13.3k | ++qs.i; |
1784 | 13.3k | } |
1785 | | |
1786 | 11.7k | BRUNSLI_DCHECK(qs.stage == QuantDataState::FINISH); |
1787 | 11.7k | suspend_bit_reader(BRUNSLI_OK); |
1788 | 11.7k | BrunsliBitReaderFinish(br); |
1789 | 11.7k | if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN; |
1790 | 11.7k | if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN; |
1791 | 11.5k | return BRUNSLI_OK; |
1792 | 11.7k | } |
1793 | | |
1794 | 79.2k | static BrunsliStatus DecodeHistogramDataSection(State* state, JPEGData* jpg) { |
1795 | 79.2k | InternalState& s = *state->internal; |
1796 | 79.2k | HistogramDataState& hs = s.histogram; |
1797 | 79.2k | BrunsliBitReader* br = &hs.br; |
1798 | | |
1799 | 79.2k | if (hs.stage == HistogramDataState::INIT) { |
1800 | 14.6k | BrunsliBitReaderInit(br); |
1801 | 14.6k | BRUNSLI_DCHECK(!jpg->components.empty()); |
1802 | 14.6k | s.num_contexts = jpg->components.size(); |
1803 | 14.6k | hs.stage = HistogramDataState::READ_SCHEME; |
1804 | | /* Optimization: hint arena about maximal used alphabet size: 272. |
1805 | | * 648 = 272 + 376, where 376 is a "universal" overhead for max-15-bit |
1806 | | * root-8-bit 2-level Huffman tables. */ |
1807 | 14.6k | hs.arena.reserve(648); |
1808 | 14.6k | } |
1809 | 79.2k | PrepareBitReader(br, state); |
1810 | 79.2k | if (RemainingSectionLength(state) <= GetBytesAvailable(state)) { |
1811 | | // If end of section is reachable, then we could parse the remainings in |
1812 | | // non-streaming mode. |
1813 | 12.8k | BrunsliBitReaderSetOptimistic(br); |
1814 | 12.8k | } |
1815 | 79.2k | const auto suspend_bit_reader = [&](BrunsliStatus result) -> BrunsliStatus { |
1816 | 79.2k | return SuspendBitReader(br, state, result); |
1817 | 79.2k | }; |
1818 | | |
1819 | 79.2k | if (hs.stage == HistogramDataState::READ_SCHEME) { |
1820 | 22.9k | const size_t num_components = jpg->components.size(); |
1821 | 22.9k | BRUNSLI_DCHECK(num_components <= 4); |
1822 | 22.9k | if (!BrunsliBitReaderCanRead(br, 3 * num_components)) { |
1823 | 8.47k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1824 | 8.47k | } |
1825 | 30.6k | for (size_t i = 0; i < num_components; ++i) { |
1826 | 16.4k | size_t scheme = BrunsliBitReaderRead(br, 3); |
1827 | 16.4k | if (scheme >= kNumSchemes) return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1828 | 16.2k | ComponentMeta& m = state->meta[i]; |
1829 | 16.2k | m.context_bits = scheme; |
1830 | 16.2k | m.context_offset = s.num_contexts; |
1831 | 16.2k | s.num_contexts += kNumNonzeroContextSkip[scheme]; |
1832 | 16.2k | } |
1833 | 14.2k | if (!BrunsliBitReaderIsHealthy(br)) { |
1834 | 27 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1835 | 27 | } |
1836 | 14.2k | hs.stage = HistogramDataState::READ_NUM_HISTOGRAMS; |
1837 | 14.2k | } |
1838 | | |
1839 | 70.5k | if (hs.stage == HistogramDataState::READ_NUM_HISTOGRAMS) { |
1840 | 21.5k | if (!BrunsliBitReaderCanRead(br, 11)) { |
1841 | 7.54k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1842 | 7.54k | } |
1843 | 13.9k | s.num_histograms = DecodeVarLenUint8(br) + 1; |
1844 | 13.9k | if (!BrunsliBitReaderIsHealthy(br)) { |
1845 | 22 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1846 | 22 | } |
1847 | 13.9k | if (s.shallow_histograms) { |
1848 | 0 | hs.stage = HistogramDataState::SKIP_CONTENT; |
1849 | 13.9k | } else { |
1850 | 13.9k | s.context_map_.resize(s.num_contexts * kNumAvrgContexts); |
1851 | 13.9k | state->context_map = s.context_map_.data(); |
1852 | 13.9k | s.entropy_codes_.resize(s.num_histograms); |
1853 | 13.9k | state->entropy_codes = s.entropy_codes_.data(); |
1854 | 13.9k | if (s.num_histograms > 1) { |
1855 | 2.54k | hs.stage = HistogramDataState::READ_CONTEXT_MAP_CODE; |
1856 | 11.4k | } else { |
1857 | 11.4k | hs.i = 0; |
1858 | 11.4k | hs.counts.resize(kCoeffAlphabetSize); |
1859 | 11.4k | hs.stage = HistogramDataState::READ_HISTOGRAMS; |
1860 | 11.4k | } |
1861 | 13.9k | } |
1862 | 13.9k | } |
1863 | | |
1864 | 62.9k | if (hs.stage == HistogramDataState::SKIP_CONTENT) { |
1865 | 0 | suspend_bit_reader(BRUNSLI_OK); |
1866 | 0 | if (!BrunsliBitReaderIsHealthy(br)) { |
1867 | 0 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1868 | 0 | } |
1869 | 0 | SkipAvailableBytes(state, RemainingSectionLength(state)); |
1870 | 0 | if (!IsAtSectionBoundary(state)) return BRUNSLI_NOT_ENOUGH_DATA; |
1871 | 0 | hs.stage = HistogramDataState::DONE; |
1872 | 0 | } |
1873 | | |
1874 | 62.9k | if (hs.stage == HistogramDataState::READ_CONTEXT_MAP_CODE) { |
1875 | 29.1k | if (!BrunsliBitReaderCanRead(br, 207 + s.num_histograms * 8)) { |
1876 | 26.8k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1877 | 26.8k | } |
1878 | 2.29k | hs.max_run_length_prefix = 0; |
1879 | 2.29k | bool use_rle_for_zeros = !!BrunsliBitReaderRead(br, 1); |
1880 | 2.29k | if (use_rle_for_zeros) { |
1881 | 885 | hs.max_run_length_prefix = BrunsliBitReaderRead(br, 4) + 1; |
1882 | 885 | } |
1883 | 2.29k | size_t alphabet_size = s.num_histograms + hs.max_run_length_prefix; |
1884 | 2.29k | hs.entropy.reset(new HuffmanDecodingData); |
1885 | 2.29k | if (!hs.entropy->ReadFromBitStream(alphabet_size, br, &hs.arena)) { |
1886 | 653 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1887 | 653 | } |
1888 | 1.63k | hs.i = 0; |
1889 | 1.63k | hs.stage = HistogramDataState::READ_CONTEXT_MAP; |
1890 | 1.63k | } |
1891 | | |
1892 | 35.4k | if (hs.stage == HistogramDataState::READ_CONTEXT_MAP) { |
1893 | 7.60k | BrunsliStatus status = DecodeContextMap( |
1894 | 7.60k | *hs.entropy, hs.max_run_length_prefix, &hs.i, &s.context_map_, br); |
1895 | 7.60k | if (status != BRUNSLI_OK) return suspend_bit_reader(status); |
1896 | 1.02k | hs.i = 0; |
1897 | 1.02k | hs.counts.resize(kCoeffAlphabetSize); |
1898 | 1.02k | hs.stage = HistogramDataState::READ_HISTOGRAMS; |
1899 | 1.02k | } |
1900 | | |
1901 | 28.8k | if (hs.stage == HistogramDataState::READ_HISTOGRAMS) { |
1902 | 52.4k | while (hs.i < s.num_histograms) { |
1903 | 40.7k | if (!BrunsliBitReaderCanRead(br, 9 + kCoeffAlphabetSize * 11)) { |
1904 | 16.7k | return suspend_bit_reader(BRUNSLI_NOT_ENOUGH_DATA); |
1905 | 16.7k | } |
1906 | 24.0k | if (!ReadHistogram(BRUNSLI_ANS_LOG_TAB_SIZE, &hs.counts, br)) { |
1907 | 415 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1908 | 415 | } |
1909 | 23.5k | if (!s.entropy_codes_[hs.i].Init(hs.counts)) { |
1910 | 0 | return suspend_bit_reader(BRUNSLI_INVALID_BRN); |
1911 | 0 | } |
1912 | 23.5k | ++hs.i; |
1913 | 23.5k | } |
1914 | 11.7k | hs.entropy.reset(); |
1915 | 11.7k | std::vector<uint32_t>().swap(hs.counts); |
1916 | 11.7k | suspend_bit_reader(BRUNSLI_OK); |
1917 | 11.7k | BrunsliBitReaderFinish(br); |
1918 | 11.7k | if (!BrunsliBitReaderIsHealthy(br)) return BRUNSLI_INVALID_BRN; |
1919 | 11.6k | if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN; |
1920 | 11.5k | hs.stage = HistogramDataState::DONE; |
1921 | 11.5k | } |
1922 | | |
1923 | 11.5k | hs.arena.reset(); |
1924 | 11.5k | BRUNSLI_DCHECK(hs.stage == HistogramDataState::DONE); |
1925 | 11.5k | return BRUNSLI_OK; |
1926 | 28.8k | } |
1927 | | |
1928 | 94.3k | static BrunsliStatus DecodeDCDataSection(State* state) { |
1929 | 94.3k | size_t available = GetBytesAvailable(state) & ~1; |
1930 | 94.3k | size_t limit = RemainingSectionLength(state); |
1931 | 94.3k | BRUNSLI_DCHECK((limit & 1) == 0); |
1932 | 94.3k | size_t chunk_len = std::min(available, limit); |
1933 | | // If end of section is reachable, then we could parse the remainings in |
1934 | | // non-streaming mode. |
1935 | 94.3k | bool is_last_chunk = (chunk_len == limit); |
1936 | 94.3k | WordSource in(state->data + state->pos, chunk_len, is_last_chunk); |
1937 | | |
1938 | 94.3k | BrunsliStatus status = DecodeDC(state, &in); |
1939 | | |
1940 | 94.3k | BRUNSLI_DCHECK((in.pos_ & 1) == 0); |
1941 | 94.3k | if (in.error_) return BRUNSLI_INVALID_BRN; |
1942 | 93.8k | BRUNSLI_DCHECK(in.pos_ <= chunk_len); |
1943 | 93.8k | SkipBytes(state, in.pos_); |
1944 | 93.8k | if (is_last_chunk) { |
1945 | 10.5k | BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA); |
1946 | 10.5k | if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN; |
1947 | 10.5k | } |
1948 | 93.8k | return status; |
1949 | 93.8k | } |
1950 | | |
1951 | 168k | static BrunsliStatus DecodeACDataSection(State* state) { |
1952 | 168k | size_t available = GetBytesAvailable(state) & ~1; |
1953 | 168k | size_t limit = RemainingSectionLength(state); |
1954 | 168k | BRUNSLI_DCHECK((limit & 1) == 0); |
1955 | 168k | size_t chunk_len = std::min(available, limit); |
1956 | | // If end of section is reachable, then we could parse the remainings in |
1957 | | // non-streaming mode. |
1958 | 168k | bool is_last_chunk = (chunk_len == limit); |
1959 | 168k | WordSource in(state->data + state->pos, chunk_len, is_last_chunk); |
1960 | | |
1961 | 168k | BrunsliStatus status = DecodeAC(state, &in); |
1962 | | |
1963 | 168k | BRUNSLI_DCHECK((in.pos_ & 1) == 0); |
1964 | 168k | if (in.error_) return BRUNSLI_INVALID_BRN; |
1965 | 167k | BRUNSLI_DCHECK(in.pos_ <= chunk_len); |
1966 | 167k | SkipBytes(state, in.pos_); |
1967 | 167k | if (is_last_chunk) { |
1968 | 8.97k | BRUNSLI_DCHECK(status != BRUNSLI_NOT_ENOUGH_DATA); |
1969 | 8.97k | if (!IsAtSectionBoundary(state)) return BRUNSLI_INVALID_BRN; |
1970 | 8.97k | } |
1971 | 167k | return status; |
1972 | 167k | } |
1973 | | |
1974 | 2.81k | static Stage DecodeOriginalJpg(State* state, JPEGData* jpg) { |
1975 | 2.81k | InternalState& s = *state->internal; |
1976 | 2.81k | FallbackState& fs = s.fallback; |
1977 | | |
1978 | 3.99k | while (fs.stage != FallbackState::DONE) { |
1979 | 3.94k | switch (fs.stage) { |
1980 | 902 | case FallbackState::READ_TAG: { |
1981 | 902 | BrunsliStatus status = ReadTag(state, &s.section); |
1982 | 902 | if (status != BRUNSLI_OK) return Fail(state, status); |
1983 | 614 | if (s.section.tag != kBrunsliOriginalJpgTag || !s.section.is_section) { |
1984 | 14 | return Fail(state, BRUNSLI_INVALID_BRN); |
1985 | 14 | } |
1986 | 600 | fs.stage = FallbackState::ENTER_SECTION; |
1987 | 600 | break; |
1988 | 614 | } |
1989 | | |
1990 | 1.64k | case FallbackState::ENTER_SECTION: { |
1991 | 1.64k | BrunsliStatus status = EnterSection(state, &s.section); |
1992 | 1.64k | if (status != BRUNSLI_OK) return Fail(state, status); |
1993 | 530 | jpg->original_jpg_size = s.section.remaining; |
1994 | | // Edge case - empty payload. |
1995 | 530 | if (jpg->original_jpg_size == 0) { |
1996 | 6 | jpg->original_jpg = nullptr; |
1997 | 6 | fs.stage = FallbackState::DONE; |
1998 | 6 | break; |
1999 | 6 | } |
2000 | 524 | fs.stage = FallbackState::READ_CONTENTS; |
2001 | 524 | break; |
2002 | 530 | } |
2003 | | |
2004 | 1.39k | case FallbackState::READ_CONTENTS: { |
2005 | 1.39k | size_t chunk_size = GetBytesAvailable(state); |
2006 | 1.39k | if (chunk_size == 0) { |
2007 | | // TODO(eustas): dcheck s.section.remaining != 0 |
2008 | 464 | return Fail(state, BRUNSLI_NOT_ENOUGH_DATA); |
2009 | 464 | } |
2010 | | // Check if it is possible to avoid copy. |
2011 | 932 | const uint8_t* src = state->data + state->pos; |
2012 | 932 | if (fs.storage.empty()) { |
2013 | 364 | if (chunk_size >= jpg->original_jpg_size) { |
2014 | 38 | jpg->original_jpg = src; |
2015 | 38 | SkipBytes(state, jpg->original_jpg_size); |
2016 | 38 | fs.stage = FallbackState::DONE; |
2017 | 38 | break; |
2018 | 38 | } |
2019 | 364 | } |
2020 | | // Otherwise, copy input. |
2021 | 894 | size_t remaining = jpg->original_jpg_size - fs.storage.size(); |
2022 | 894 | size_t to_copy = std::min(chunk_size, remaining); |
2023 | 894 | fs.storage.insert(fs.storage.cend(), src, src + to_copy); |
2024 | 894 | SkipBytes(state, to_copy); |
2025 | 894 | if (fs.storage.size() == jpg->original_jpg_size) { |
2026 | 11 | jpg->original_jpg = fs.storage.data(); |
2027 | 11 | fs.stage = FallbackState::DONE; |
2028 | 11 | break; |
2029 | 11 | } |
2030 | | // TODO(eustas): dcheck GetBytesAvailable(state) == 0 |
2031 | 883 | return Fail(state, BRUNSLI_NOT_ENOUGH_DATA); |
2032 | 894 | } |
2033 | | |
2034 | 0 | default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR); |
2035 | 3.94k | } |
2036 | 3.94k | } |
2037 | | |
2038 | 55 | LeaveSection(&s.section); |
2039 | 55 | return Stage::DONE; |
2040 | 2.81k | } |
2041 | | |
2042 | 187k | static Stage ParseSection(State* state) { |
2043 | 187k | InternalState& s = *state->internal; |
2044 | 187k | SectionHeaderState& sh = s.section_header; |
2045 | | |
2046 | 187k | Stage result = Stage::ERROR; |
2047 | | |
2048 | 350k | while (sh.stage != SectionHeaderState::DONE) { |
2049 | 268k | switch (sh.stage) { |
2050 | 128k | case SectionHeaderState::READ_TAG: { |
2051 | 128k | BrunsliStatus status = ReadTag(state, &s.section); |
2052 | 128k | if (status == BRUNSLI_NOT_ENOUGH_DATA) { |
2053 | 46.8k | if (HasSection(state, kBrunsliACDataTag)) return Stage::DONE; |
2054 | 46.8k | } |
2055 | 128k | if (status != BRUNSLI_OK) return Fail(state, status); |
2056 | 81.7k | if (s.section.is_section) { |
2057 | 81.6k | sh.stage = SectionHeaderState::ENTER_SECTION; |
2058 | 81.6k | continue; |
2059 | 81.6k | } |
2060 | 92 | const uint32_t tag_bit = 1u << s.section.tag; |
2061 | 92 | const bool is_known_section_tag = kKnownSectionTags & tag_bit; |
2062 | 92 | if (is_known_section_tag) return Fail(state, BRUNSLI_INVALID_BRN); |
2063 | 88 | sh.stage = SectionHeaderState::READ_VALUE; |
2064 | 88 | continue; |
2065 | 92 | } |
2066 | | |
2067 | 218 | case SectionHeaderState::READ_VALUE: { |
2068 | | // No known varint tags on top level. |
2069 | 218 | size_t sink; |
2070 | 218 | BrunsliStatus status = DecodeBase128(state, &sink); |
2071 | 218 | if (status != BRUNSLI_OK) return Fail(state, status); |
2072 | 74 | result = Stage::SECTION; |
2073 | 74 | sh.stage = SectionHeaderState::DONE; |
2074 | 74 | continue; |
2075 | 218 | } |
2076 | | |
2077 | 140k | case SectionHeaderState::ENTER_SECTION: { |
2078 | 140k | BrunsliStatus status = EnterSection(state, &s.section); |
2079 | 140k | if (status != BRUNSLI_OK) return Fail(state, status); |
2080 | 81.6k | result = Stage::SECTION_BODY; |
2081 | 81.6k | sh.stage = SectionHeaderState::DONE; |
2082 | 81.6k | continue; |
2083 | 140k | } |
2084 | | |
2085 | 0 | default: return Fail(state, BRUNSLI_DECOMPRESSION_ERROR); |
2086 | 268k | } |
2087 | 268k | } |
2088 | | |
2089 | 81.7k | sh.stage = SectionHeaderState::READ_TAG; |
2090 | 81.7k | BRUNSLI_DCHECK(result != Stage::ERROR); |
2091 | 81.7k | return result; |
2092 | 187k | } |
2093 | | |
2094 | 5.92M | static Stage ProcessSection(State* state, JPEGData* jpg) { |
2095 | 5.92M | InternalState& s = *state->internal; |
2096 | | |
2097 | 5.92M | const int32_t tag_bit = 1u << s.section.tag; |
2098 | 5.92M | const bool is_known_section_tag = kKnownSectionTags & tag_bit; |
2099 | | |
2100 | 5.92M | const bool skip_section = |
2101 | 5.92M | !is_known_section_tag || (state->skip_tags & tag_bit); |
2102 | | |
2103 | 5.92M | if (skip_section) { |
2104 | | // Skip section content. |
2105 | 617 | size_t to_skip = |
2106 | 617 | std::min(GetBytesAvailable(state), RemainingSectionLength(state)); |
2107 | 617 | state->pos += to_skip; |
2108 | 617 | if (RemainingSectionLength(state) != 0) { |
2109 | 557 | BRUNSLI_DCHECK(GetBytesAvailable(state) == 0); |
2110 | 557 | return Fail(state, BRUNSLI_NOT_ENOUGH_DATA); |
2111 | 557 | } |
2112 | 60 | return Stage::SECTION; |
2113 | 617 | } |
2114 | | |
2115 | 5.92M | switch (s.section.tag) { |
2116 | 477k | case kBrunsliMetaDataTag: { |
2117 | 477k | BrunsliStatus status = DecodeMetaDataSection(state, jpg); |
2118 | 477k | if (status != BRUNSLI_OK) return Fail(state, status); |
2119 | 72 | break; |
2120 | 477k | } |
2121 | | |
2122 | 5.07M | case kBrunsliJPEGInternalsTag: { |
2123 | 5.07M | BrunsliStatus status = DecodeJPEGInternalsSection(state, jpg); |
2124 | 5.07M | if (status != BRUNSLI_OK) return Fail(state, status); |
2125 | 17.7k | break; |
2126 | 5.07M | } |
2127 | | |
2128 | 27.8k | case kBrunsliQuantDataTag: { |
2129 | 27.8k | if (!HasSection(state, kBrunsliJPEGInternalsTag)) { |
2130 | 2 | return Fail(state, BRUNSLI_INVALID_BRN); |
2131 | 2 | } |
2132 | 27.8k | BrunsliStatus status = DecodeQuantDataSection(state, jpg); |
2133 | 27.8k | if (status != BRUNSLI_OK) return Fail(state, status); |
2134 | 11.5k | break; |
2135 | 27.8k | } |
2136 | | |
2137 | 79.2k | case kBrunsliHistogramDataTag: { |
2138 | 79.2k | if (!HasSection(state, kBrunsliJPEGInternalsTag)) { |
2139 | 2 | return Fail(state, BRUNSLI_INVALID_BRN); |
2140 | 2 | } |
2141 | 79.2k | BrunsliStatus status = DecodeHistogramDataSection(state, jpg); |
2142 | 79.2k | if (status != BRUNSLI_OK) return Fail(state, status); |
2143 | 11.5k | break; |
2144 | 79.2k | } |
2145 | | |
2146 | 94.3k | case kBrunsliDCDataTag: { |
2147 | 94.3k | if (!HasSection(state, kBrunsliHistogramDataTag)) { |
2148 | 3 | return Fail(state, BRUNSLI_INVALID_BRN); |
2149 | 3 | } |
2150 | 94.3k | if (!HasSection(state, kBrunsliQuantDataTag)) { |
2151 | 3 | return Fail(state, BRUNSLI_INVALID_BRN); |
2152 | 3 | } |
2153 | | // This section reads input word by word. |
2154 | 94.3k | if ((RemainingSectionLength(state) & 1) != 0) { |
2155 | 4 | return Fail(state, BRUNSLI_INVALID_BRN); |
2156 | 4 | } |
2157 | 94.3k | internal::dec::WarmupMeta(jpg, state); |
2158 | 94.3k | BrunsliStatus status = DecodeDCDataSection(state); |
2159 | 94.3k | if (status != BRUNSLI_OK) return Fail(state, status); |
2160 | 10.5k | break; |
2161 | 94.3k | } |
2162 | | |
2163 | 168k | case kBrunsliACDataTag: { |
2164 | 168k | if (!HasSection(state, kBrunsliDCDataTag)) { |
2165 | 3 | return Fail(state, BRUNSLI_INVALID_BRN); |
2166 | 3 | } |
2167 | | // This section reads input word by word. |
2168 | 168k | if ((RemainingSectionLength(state) & 1) != 0) { |
2169 | 7 | return Fail(state, BRUNSLI_INVALID_BRN); |
2170 | 7 | } |
2171 | 168k | internal::dec::WarmupMeta(jpg, state); |
2172 | 168k | BrunsliStatus status = DecodeACDataSection(state); |
2173 | 168k | if (status != BRUNSLI_OK) return Fail(state, status); |
2174 | 8.79k | break; |
2175 | 168k | } |
2176 | | |
2177 | 8.79k | default: |
2178 | | /* Unreachable */ |
2179 | 0 | return Fail(state, BRUNSLI_INVALID_BRN); |
2180 | 5.92M | } |
2181 | | |
2182 | 60.3k | if (!IsAtSectionBoundary(state)) { |
2183 | 117 | return Fail(state, BRUNSLI_INVALID_BRN); |
2184 | 117 | } |
2185 | | |
2186 | | // Nothing is expected after the AC data. |
2187 | 60.2k | if (s.section.tag == kBrunsliACDataTag) { |
2188 | 8.79k | return Stage::DONE; |
2189 | 8.79k | } |
2190 | | |
2191 | 51.4k | return Stage::SECTION; |
2192 | 60.2k | } |
2193 | | |
2194 | | namespace internal { |
2195 | | namespace dec { |
2196 | | |
2197 | 30.4k | bool UpdateSubsamplingDerivatives(JPEGData* jpg) { |
2198 | 79.1k | for (size_t i = 0; i < jpg->components.size(); ++i) { |
2199 | 48.6k | JPEGComponent* c = &jpg->components[i]; |
2200 | 48.6k | jpg->max_h_samp_factor = std::max(jpg->max_h_samp_factor, c->h_samp_factor); |
2201 | 48.6k | jpg->max_v_samp_factor = std::max(jpg->max_v_samp_factor, c->v_samp_factor); |
2202 | 48.6k | } |
2203 | 30.4k | jpg->MCU_rows = DivCeil(jpg->height, jpg->max_v_samp_factor * 8); |
2204 | 30.4k | jpg->MCU_cols = DivCeil(jpg->width, jpg->max_h_samp_factor * 8); |
2205 | 79.1k | for (size_t i = 0; i < jpg->components.size(); ++i) { |
2206 | 48.6k | JPEGComponent* c = &jpg->components[i]; |
2207 | 48.6k | c->width_in_blocks = jpg->MCU_cols * c->h_samp_factor; |
2208 | 48.6k | c->height_in_blocks = jpg->MCU_rows * c->v_samp_factor; |
2209 | | // 8205 == max[ceil((65535 / (i * 8)) * i) for i in range(1, 16 + 1)] |
2210 | 48.6k | BRUNSLI_DCHECK(c->width_in_blocks <= 8205); |
2211 | 48.6k | BRUNSLI_DCHECK(c->height_in_blocks <= 8205); |
2212 | 48.6k | uint32_t num_blocks = c->width_in_blocks * c->height_in_blocks; |
2213 | 48.6k | if (num_blocks > kBrunsliMaxNumBlocks) { |
2214 | 5 | return false; |
2215 | 5 | } |
2216 | 48.6k | c->num_blocks = num_blocks; |
2217 | 48.6k | } |
2218 | 30.4k | return true; |
2219 | 30.4k | } |
2220 | | |
2221 | 30.4k | void PrepareMeta(const JPEGData* jpg, State* state) { |
2222 | 30.4k | InternalState& s = *state->internal; |
2223 | | |
2224 | 30.4k | size_t num_components = jpg->components.size(); |
2225 | 30.4k | s.block_state_.resize(num_components); |
2226 | 30.4k | std::vector<ComponentMeta>& meta = state->meta; |
2227 | 30.4k | meta.resize(num_components); |
2228 | 79.1k | for (size_t i = 0; i < num_components; ++i) { |
2229 | 48.6k | const JPEGComponent& c = jpg->components[i]; |
2230 | 48.6k | ComponentMeta& m = meta[i]; |
2231 | 48.6k | m.h_samp = c.h_samp_factor; |
2232 | 48.6k | m.v_samp = c.v_samp_factor; |
2233 | 48.6k | m.width_in_blocks = jpg->MCU_cols * m.h_samp; |
2234 | 48.6k | m.height_in_blocks = jpg->MCU_rows * m.v_samp; |
2235 | 48.6k | } |
2236 | 30.4k | } |
2237 | | |
2238 | 263k | void WarmupMeta(JPEGData* jpg, State* state) { |
2239 | 263k | InternalState& s = *state->internal; |
2240 | 263k | std::vector<ComponentMeta>& meta = state->meta; |
2241 | 263k | const size_t num_components = meta.size(); |
2242 | | |
2243 | 263k | if (!state->is_storage_allocated) { |
2244 | 11.5k | state->is_storage_allocated = true; |
2245 | 24.3k | for (size_t i = 0; i < num_components; ++i) { |
2246 | 12.8k | size_t num_blocks = meta[i].width_in_blocks * meta[i].height_in_blocks; |
2247 | 12.8k | jpg->components[i].coeffs.resize(num_blocks * kDCTBlockSize); |
2248 | 12.8k | s.block_state_[i].resize(num_blocks); |
2249 | 12.8k | meta[i].block_state = s.block_state_[i].data(); |
2250 | 12.8k | } |
2251 | 11.5k | } |
2252 | | |
2253 | 263k | if (!s.is_meta_warm) { |
2254 | 11.5k | s.is_meta_warm = true; |
2255 | 24.3k | for (size_t c = 0; c < num_components; ++c) { |
2256 | 12.8k | ComponentMeta& m = meta[c]; |
2257 | 12.8k | const JPEGQuantTable& q = jpg->quant[jpg->components[c].quant_idx]; |
2258 | 12.8k | m.ac_coeffs = jpg->components[c].coeffs.data(); |
2259 | 12.8k | m.ac_stride = m.width_in_blocks * kDCTBlockSize; |
2260 | 12.8k | m.b_stride = m.width_in_blocks; |
2261 | 12.8k | memcpy(m.quant.data(), q.values.data(), |
2262 | 12.8k | kDCTBlockSize * sizeof(m.quant[0])); |
2263 | 12.8k | } |
2264 | 11.5k | } |
2265 | 263k | } |
2266 | | |
2267 | 6.24M | BrunsliStatus DoProcessJpeg(State* state, JPEGData* jpg) { |
2268 | 12.6M | while (true) { |
2269 | 12.6M | switch (state->stage) { |
2270 | 124k | case Stage::SIGNATURE: |
2271 | 124k | state->stage = VerifySignature(state); |
2272 | 124k | break; |
2273 | | |
2274 | 202k | case Stage::HEADER: |
2275 | 202k | state->stage = DecodeHeader(state, jpg); |
2276 | 202k | break; |
2277 | | |
2278 | 2.81k | case Stage::FALLBACK: |
2279 | 2.81k | state->stage = DecodeOriginalJpg(state, jpg); |
2280 | 2.81k | break; |
2281 | | |
2282 | 187k | case Stage::SECTION: |
2283 | 187k | state->stage = ParseSection(state); |
2284 | 187k | break; |
2285 | | |
2286 | 5.92M | case Stage::SECTION_BODY: |
2287 | 5.92M | state->stage = ProcessSection(state, jpg); |
2288 | 5.92M | break; |
2289 | | |
2290 | 8.84k | case Stage::DONE: |
2291 | | // It is expected that there is no garbage after the valid brunsli |
2292 | | // stream. |
2293 | 8.84k | if (state->pos != state->len) { |
2294 | 31 | state->stage = Fail(state, BRUNSLI_INVALID_BRN); |
2295 | 31 | break; |
2296 | 31 | } |
2297 | 8.81k | return BRUNSLI_OK; |
2298 | | |
2299 | 6.23M | case Stage::ERROR: |
2300 | 6.23M | return state->internal->result; |
2301 | | |
2302 | 0 | default: |
2303 | | /* Unreachable */ |
2304 | 0 | state->stage = Fail(state, BRUNSLI_DECOMPRESSION_ERROR); |
2305 | 0 | break; |
2306 | 12.6M | } |
2307 | 12.6M | } |
2308 | 6.24M | } |
2309 | | |
2310 | | /** Adds new input to buffer. */ |
2311 | 6.15M | void ChargeBuffer(State* state) { |
2312 | 6.15M | InternalState& s = *state->internal; |
2313 | 6.15M | Buffer& b = s.buffer; |
2314 | | |
2315 | 6.15M | b.borrowed_len = 0; |
2316 | 6.15M | b.external_data = state->data; |
2317 | 6.15M | b.external_pos = state->pos; |
2318 | 6.15M | b.external_len = state->len; |
2319 | 6.15M | } |
2320 | | |
2321 | | constexpr size_t kBufferMaxReadAhead = 600; |
2322 | | |
2323 | | /** Sets input source either to buffered, or to external data. */ |
2324 | 6.24M | void LoadInput(State* state) { |
2325 | 6.24M | InternalState& s = *state->internal; |
2326 | 6.24M | Buffer& b = s.buffer; |
2327 | | |
2328 | | // No data buffered. Just pass external data as is. |
2329 | 6.24M | if (b.data_len == 0) { |
2330 | 5.77M | state->data = b.external_data; |
2331 | 5.77M | state->pos = b.external_pos; |
2332 | 5.77M | state->len = b.external_len; |
2333 | 5.77M | return; |
2334 | 5.77M | } |
2335 | | |
2336 | 468k | BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead); |
2337 | | |
2338 | | // Otherwise use buffered data. |
2339 | 468k | size_t available = b.external_len - b.external_pos; |
2340 | | // Always try to borrow as much as parser could require. This way, when |
2341 | | // buffer is unable to provide enough input, we could switch to unbuffered |
2342 | | // input. |
2343 | 468k | b.borrowed_len = std::min(kBufferMaxReadAhead, available); |
2344 | 468k | memcpy(b.data.data() + b.data_len, b.external_data + b.external_pos, |
2345 | 468k | b.borrowed_len); |
2346 | 468k | state->data = b.data.data(); |
2347 | 468k | state->pos = 0; |
2348 | 468k | state->len = b.data_len + b.borrowed_len; |
2349 | 468k | } |
2350 | | |
2351 | | /** |
2352 | | * Cancel borrowed bytes, if any. |
2353 | | * |
2354 | | * Returns false, if it is impossible to continue parsing. |
2355 | | */ |
2356 | 6.24M | bool UnloadInput(State* state, BrunsliStatus result) { |
2357 | 6.24M | InternalState& s = *state->internal; |
2358 | 6.24M | Buffer& b = s.buffer; |
2359 | | |
2360 | | // Non-buffered input; put tail to buffer. |
2361 | 6.24M | if (state->data == b.external_data) { |
2362 | 5.77M | b.external_pos = state->pos; |
2363 | 5.77M | BRUNSLI_DCHECK(b.external_pos <= b.external_len); |
2364 | 5.77M | if (result != BRUNSLI_NOT_ENOUGH_DATA) return true; |
2365 | 5.75M | BRUNSLI_DCHECK(b.data_len == 0); |
2366 | 5.75M | size_t available = b.external_len - b.external_pos; |
2367 | 5.75M | BRUNSLI_DCHECK(available < kBufferMaxReadAhead); |
2368 | 5.75M | if (b.data.empty()) b.data.resize(2 * kBufferMaxReadAhead); |
2369 | 5.75M | b.data_len = available; |
2370 | 5.75M | memcpy(b.data.data(), b.external_data + b.external_pos, b.data_len); |
2371 | 5.75M | b.external_pos += available; |
2372 | 5.75M | return false; |
2373 | 5.77M | } |
2374 | | |
2375 | | // Buffer depleted; switch to non-buffered input. |
2376 | 468k | if (state->pos >= b.data_len) { |
2377 | 89.9k | size_t used_borrowed_bytes = state->pos - b.data_len; |
2378 | 89.9k | b.data_len = 0; |
2379 | 89.9k | b.external_pos += used_borrowed_bytes; |
2380 | 89.9k | return true; |
2381 | 89.9k | } |
2382 | | |
2383 | | // Buffer not depleted; either problem discovered was already buffered data, |
2384 | | // or extra input was too-short. |
2385 | 378k | b.data_len -= state->pos; |
2386 | 378k | if (result == BRUNSLI_NOT_ENOUGH_DATA) { |
2387 | | // We couldn't have taken more bytes. |
2388 | 377k | BRUNSLI_DCHECK(b.external_pos + b.borrowed_len == b.external_len); |
2389 | | // Remaining piece is not too large. |
2390 | 377k | BRUNSLI_DCHECK(b.data_len + b.borrowed_len < kBufferMaxReadAhead); |
2391 | 377k | b.data_len += b.borrowed_len; |
2392 | 377k | b.external_pos += b.borrowed_len; |
2393 | 377k | } |
2394 | 378k | BRUNSLI_DCHECK(!b.data.empty()); |
2395 | 378k | if (state->pos > 0 && b.data_len > 0) { |
2396 | 11.0k | memmove(b.data.data(), b.data.data() + state->pos, b.data_len); |
2397 | 11.0k | } |
2398 | 378k | BRUNSLI_DCHECK(b.data_len <= kBufferMaxReadAhead); |
2399 | | |
2400 | 378k | return (result != BRUNSLI_NOT_ENOUGH_DATA); |
2401 | 468k | } |
2402 | | |
2403 | | /** Sets back user-provided input. */ |
2404 | 6.15M | void UnchargeBuffer(State* state) { |
2405 | 6.15M | InternalState& s = *state->internal; |
2406 | 6.15M | Buffer& b = s.buffer; |
2407 | | |
2408 | 6.15M | state->data = b.external_data; |
2409 | 6.15M | state->pos = b.external_pos; |
2410 | 6.15M | state->len = b.external_len; |
2411 | 6.15M | } |
2412 | | |
2413 | 6.15M | BrunsliStatus ProcessJpeg(State* state, JPEGData* jpg) { |
2414 | 6.15M | InternalState& s = *state->internal; |
2415 | | |
2416 | 6.15M | if (state->pos > state->len) return BRUNSLI_INVALID_PARAM; |
2417 | 6.15M | ChargeBuffer(state); |
2418 | | |
2419 | 6.15M | BrunsliStatus result = BRUNSLI_NOT_ENOUGH_DATA; |
2420 | 6.26M | while (result == BRUNSLI_NOT_ENOUGH_DATA) { |
2421 | 6.24M | if (state->stage == Stage::ERROR) { |
2422 | | // General error -> no recovery. |
2423 | 6.20M | if (s.result != BRUNSLI_NOT_ENOUGH_DATA) return s.result; |
2424 | | // Continue parsing. |
2425 | 6.20M | s.result = BRUNSLI_OK; |
2426 | 6.20M | state->stage = s.last_stage; |
2427 | 6.20M | s.last_stage = Stage::ERROR; |
2428 | 6.20M | } |
2429 | | |
2430 | 6.24M | LoadInput(state); |
2431 | 6.24M | if (s.section.is_active) { |
2432 | 6.03M | s.section.milestone = state->pos; |
2433 | 6.03M | s.section.projected_end = s.section.milestone + s.section.remaining; |
2434 | 6.03M | } |
2435 | | |
2436 | 6.24M | s.section.tags_met |= state->tags_met; |
2437 | 6.24M | result = DoProcessJpeg(state, jpg); |
2438 | | |
2439 | 6.24M | if (s.section.is_active) { |
2440 | | // TODO(eustas): dcheck state->pos > s.section.milestone |
2441 | 6.06M | size_t processed_len = state->pos - s.section.milestone; |
2442 | | // TODO(eustas): dcheck processed_len < s.section.remaining |
2443 | 6.06M | s.section.remaining -= processed_len; |
2444 | 6.06M | } |
2445 | | |
2446 | 6.24M | if (!UnloadInput(state, result)) break; |
2447 | 6.24M | } |
2448 | 6.15M | UnchargeBuffer(state); |
2449 | 6.15M | return result; |
2450 | 6.15M | } |
2451 | | |
2452 | | } // namespace dec |
2453 | | } // namespace internal |
2454 | | |
2455 | | BrunsliStatus BrunsliDecodeJpeg(const uint8_t* data, const size_t len, |
2456 | 17.0k | JPEGData* jpg) { |
2457 | 17.0k | if (!data) return BRUNSLI_INVALID_PARAM; |
2458 | | |
2459 | 17.0k | State state; |
2460 | 17.0k | state.data = data; |
2461 | 17.0k | state.len = len; |
2462 | | |
2463 | 17.0k | return internal::dec::ProcessJpeg(&state, jpg); |
2464 | 17.0k | } |
2465 | | |
2466 | | size_t BrunsliEstimateDecoderPeakMemoryUsage(const uint8_t* data, |
2467 | 0 | const size_t len) { |
2468 | 0 | if (!data) return BRUNSLI_INVALID_PARAM; |
2469 | | |
2470 | 0 | State state; |
2471 | 0 | state.data = data; |
2472 | 0 | state.len = len; |
2473 | 0 | state.skip_tags = ~(1u << kBrunsliHistogramDataTag); |
2474 | 0 | InternalState& s = *state.internal; |
2475 | 0 | s.shallow_histograms = true; |
2476 | |
|
2477 | 0 | JPEGData jpg; |
2478 | 0 | BrunsliStatus status = internal::dec::ProcessJpeg(&state, &jpg); |
2479 | |
|
2480 | 0 | if (status != BRUNSLI_OK) return 0; |
2481 | | |
2482 | 0 | size_t out_size = 2 * len; |
2483 | 0 | size_t total_num_blocks = 0; |
2484 | 0 | size_t component_state_size = 0; |
2485 | 0 | for (size_t i = 0; i < jpg.components.size(); ++i) { |
2486 | 0 | const JPEGComponent& c = jpg.components[i]; |
2487 | 0 | total_num_blocks += c.num_blocks; |
2488 | 0 | component_state_size += ComponentState::SizeInBytes(c.width_in_blocks); |
2489 | 0 | } |
2490 | 0 | size_t jpeg_data_size = total_num_blocks * kDCTBlockSize * sizeof(coeff_t); |
2491 | 0 | size_t context_map_size = s.num_contexts * kNumAvrgContexts * sizeof(int32_t); |
2492 | 0 | size_t histogram_size = s.num_histograms * sizeof(ANSDecodingData); |
2493 | 0 | size_t decode_peak = context_map_size + histogram_size + component_state_size; |
2494 | 0 | size_t jpeg_writer_size = (1u << 17u) + (1u << 16u) * sizeof(int32_t); |
2495 | 0 | return (out_size + jpeg_data_size + std::max(decode_peak, jpeg_writer_size)); |
2496 | 0 | } |
2497 | | |
2498 | 0 | BrunsliDecoder::BrunsliDecoder() { |
2499 | 0 | jpg_.reset(new JPEGData); |
2500 | 0 | state_.reset(new State); |
2501 | 0 | } |
2502 | | |
2503 | 0 | BrunsliDecoder::~BrunsliDecoder() {} |
2504 | | |
2505 | | BrunsliDecoder::Status BrunsliDecoder::Decode(size_t* available_in, |
2506 | | const uint8_t** next_in, |
2507 | | size_t* available_out, |
2508 | 0 | uint8_t** next_out) { |
2509 | 0 | JPEGData* jpg = jpg_.get(); |
2510 | 0 | BRUNSLI_DCHECK(jpg); |
2511 | 0 | State* state = state_.get(); |
2512 | 0 | BRUNSLI_DCHECK(state); |
2513 | |
|
2514 | 0 | state->data = *next_in; |
2515 | 0 | state->pos = 0; |
2516 | 0 | state->len = *available_in; |
2517 | 0 | BrunsliStatus parse_status = internal::dec::ProcessJpeg(state, jpg); |
2518 | 0 | size_t consumed_bytes = state->pos; |
2519 | 0 | *available_in -= consumed_bytes; |
2520 | 0 | *next_in += consumed_bytes; |
2521 | |
|
2522 | 0 | if ((parse_status != BRUNSLI_OK) && |
2523 | 0 | (parse_status != BRUNSLI_NOT_ENOUGH_DATA)) { |
2524 | 0 | return BrunsliDecoder::ERROR; |
2525 | 0 | } |
2526 | | |
2527 | | // All the input given input should be consumed. |
2528 | 0 | BRUNSLI_DCHECK(*available_in == 0); |
2529 | |
|
2530 | 0 | SerializationStatus serialization_status = |
2531 | 0 | SerializeJpeg(state, *jpg, available_out, next_out); |
2532 | 0 | if (serialization_status == SerializationStatus::ERROR) { |
2533 | 0 | return BrunsliDecoder::ERROR; |
2534 | 0 | } |
2535 | | |
2536 | 0 | switch (serialization_status) { |
2537 | 0 | case SerializationStatus::DONE: |
2538 | | // Should be impossible to finish serialization without finishing parsing. |
2539 | 0 | BRUNSLI_DCHECK(parse_status == BRUNSLI_OK); |
2540 | 0 | return BrunsliDecoder::DONE; |
2541 | | |
2542 | 0 | case SerializationStatus::NEEDS_MORE_INPUT: |
2543 | | // If serializer says that data is incomplete, parser should say the same. |
2544 | 0 | BRUNSLI_DCHECK(parse_status == BRUNSLI_NOT_ENOUGH_DATA); |
2545 | 0 | return BrunsliDecoder::NEEDS_MORE_INPUT; |
2546 | | |
2547 | 0 | case SerializationStatus::NEEDS_MORE_OUTPUT: |
2548 | | // TODO(eustas): make sure that serializer could produce more bytes |
2549 | | // without providing more bytes to parser |
2550 | 0 | BRUNSLI_DCHECK(*available_out == 0); |
2551 | 0 | return BrunsliDecoder::NEEDS_MORE_OUTPUT; |
2552 | | |
2553 | 0 | case SerializationStatus::ERROR: |
2554 | 0 | return BrunsliDecoder::ERROR; |
2555 | | |
2556 | 0 | default: |
2557 | | /* Unreachable */ |
2558 | 0 | BRUNSLI_DCHECK(false); |
2559 | 0 | return BrunsliDecoder::ERROR; |
2560 | 0 | } |
2561 | 0 | } |
2562 | | |
2563 | | } // namespace brunsli |