/src/aom/av1/decoder/decodetxb.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | * Copyright (c) 2017, Alliance for Open Media. All rights reserved. |
3 | | * |
4 | | * This source code is subject to the terms of the BSD 2 Clause License and |
5 | | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
6 | | * was not distributed with this source code in the LICENSE file, you can |
7 | | * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
8 | | * Media Patent License 1.0 was not distributed with this source code in the |
9 | | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
10 | | */ |
11 | | |
12 | | #include "av1/decoder/decodetxb.h" |
13 | | |
14 | | #include "aom_ports/mem.h" |
15 | | #include "av1/common/idct.h" |
16 | | #include "av1/common/scan.h" |
17 | | #include "av1/common/txb_common.h" |
18 | | #include "av1/decoder/decodemv.h" |
19 | | |
20 | | #define ACCT_STR __func__ |
21 | | |
22 | 2.71M | static int read_golomb(MACROBLOCKD *xd, aom_reader *r) { |
23 | 2.71M | int x = 1; |
24 | 2.71M | int length = 0; |
25 | 2.71M | int i = 0; |
26 | | |
27 | 11.5M | while (!i) { |
28 | 8.87M | i = aom_read_bit(r, ACCT_STR); |
29 | 8.87M | ++length; |
30 | 8.87M | if (length > 20) { |
31 | 288 | aom_internal_error(xd->error_info, AOM_CODEC_CORRUPT_FRAME, |
32 | 288 | "Invalid length in read_golomb"); |
33 | 288 | break; |
34 | 288 | } |
35 | 8.87M | } |
36 | | |
37 | 8.86M | for (i = 0; i < length - 1; ++i) { |
38 | 6.14M | x <<= 1; |
39 | 6.14M | x += aom_read_bit(r, ACCT_STR); |
40 | 6.14M | } |
41 | | |
42 | 2.71M | return x - 1; |
43 | 2.71M | } |
44 | | |
45 | 6.19M | static inline int rec_eob_pos(const int eob_token, const int extra) { |
46 | 6.19M | int eob = av1_eob_group_start[eob_token]; |
47 | 6.19M | if (eob > 2) { |
48 | 3.54M | eob += extra; |
49 | 3.54M | } |
50 | 6.19M | return eob; |
51 | 6.19M | } |
52 | | |
53 | | static inline int get_dqv(const int16_t *dequant, int coeff_idx, |
54 | 53.3M | const qm_val_t *iqmatrix) { |
55 | 53.3M | int dqv = dequant[!!coeff_idx]; |
56 | 53.3M | if (iqmatrix != NULL) |
57 | 6.25M | dqv = |
58 | 6.25M | ((iqmatrix[coeff_idx] * dqv) + (1 << (AOM_QM_BITS - 1))) >> AOM_QM_BITS; |
59 | 53.3M | return dqv; |
60 | 53.3M | } |
61 | | |
62 | | static inline void read_coeffs_reverse_2d(aom_reader *r, TX_SIZE tx_size, |
63 | | int start_si, int end_si, |
64 | | const int16_t *scan, int bhl, |
65 | | uint8_t *levels, |
66 | | base_cdf_arr base_cdf, |
67 | 3.54M | br_cdf_arr br_cdf) { |
68 | 107M | for (int c = end_si; c >= start_si; --c) { |
69 | 103M | const int pos = scan[c]; |
70 | 103M | const int coeff_ctx = get_lower_levels_ctx_2d(levels, pos, bhl, tx_size); |
71 | 103M | const int nsymbs = 4; |
72 | 103M | int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR); |
73 | 103M | if (level > NUM_BASE_LEVELS) { |
74 | 13.5M | const int br_ctx = get_br_ctx_2d(levels, pos, bhl); |
75 | 13.5M | aom_cdf_prob *cdf = br_cdf[br_ctx]; |
76 | 27.3M | for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
77 | 25.2M | const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
78 | 25.2M | level += k; |
79 | 25.2M | if (k < BR_CDF_SIZE - 1) break; |
80 | 25.2M | } |
81 | 13.5M | } |
82 | 103M | levels[get_padded_idx(pos, bhl)] = level; |
83 | 103M | } |
84 | 3.54M | } |
85 | | |
86 | | static inline void read_coeffs_reverse(aom_reader *r, TX_SIZE tx_size, |
87 | | TX_CLASS tx_class, int start_si, |
88 | | int end_si, const int16_t *scan, int bhl, |
89 | | uint8_t *levels, base_cdf_arr base_cdf, |
90 | 3.68M | br_cdf_arr br_cdf) { |
91 | 11.2M | for (int c = end_si; c >= start_si; --c) { |
92 | 7.54M | const int pos = scan[c]; |
93 | 7.54M | const int coeff_ctx = |
94 | 7.54M | get_lower_levels_ctx(levels, pos, bhl, tx_size, tx_class); |
95 | 7.54M | const int nsymbs = 4; |
96 | 7.54M | int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR); |
97 | 7.54M | if (level > NUM_BASE_LEVELS) { |
98 | 1.81M | const int br_ctx = get_br_ctx(levels, pos, bhl, tx_class); |
99 | 1.81M | aom_cdf_prob *cdf = br_cdf[br_ctx]; |
100 | 4.15M | for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
101 | 3.79M | const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
102 | 3.79M | level += k; |
103 | 3.79M | if (k < BR_CDF_SIZE - 1) break; |
104 | 3.79M | } |
105 | 1.81M | } |
106 | 7.54M | levels[get_padded_idx(pos, bhl)] = level; |
107 | 7.54M | } |
108 | 3.68M | } |
109 | | |
110 | | static uint8_t read_coeffs_txb(const AV1_COMMON *const cm, |
111 | | DecoderCodingBlock *dcb, aom_reader *const r, |
112 | | const int blk_row, const int blk_col, |
113 | | const int plane, const TXB_CTX *const txb_ctx, |
114 | 16.6M | const TX_SIZE tx_size) { |
115 | 16.6M | MACROBLOCKD *const xd = &dcb->xd; |
116 | 16.6M | FRAME_CONTEXT *const ec_ctx = xd->tile_ctx; |
117 | 16.6M | const int32_t max_value = (1 << (7 + xd->bd)) - 1; |
118 | 16.6M | const int32_t min_value = -(1 << (7 + xd->bd)); |
119 | 16.6M | const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
120 | 16.6M | const PLANE_TYPE plane_type = get_plane_type(plane); |
121 | 16.6M | MB_MODE_INFO *const mbmi = xd->mi[0]; |
122 | 16.6M | struct macroblockd_plane *const pd = &xd->plane[plane]; |
123 | 16.6M | const int16_t *const dequant = pd->seg_dequant_QTX[mbmi->segment_id]; |
124 | 16.6M | tran_low_t *const tcoeffs = dcb->dqcoeff_block[plane] + dcb->cb_offset[plane]; |
125 | 16.6M | const int shift = av1_get_tx_scale(tx_size); |
126 | 16.6M | const int bhl = get_txb_bhl(tx_size); |
127 | 16.6M | const int width = get_txb_wide(tx_size); |
128 | 16.6M | const int height = get_txb_high(tx_size); |
129 | 16.6M | int cul_level = 0; |
130 | 16.6M | int dc_val = 0; |
131 | 16.6M | uint8_t levels_buf[TX_PAD_2D]; |
132 | 16.6M | uint8_t *const levels = set_levels(levels_buf, height); |
133 | 16.6M | const int all_zero = aom_read_symbol( |
134 | 16.6M | r, ec_ctx->txb_skip_cdf[txs_ctx][txb_ctx->txb_skip_ctx], 2, ACCT_STR); |
135 | 16.6M | eob_info *eob_data = dcb->eob_data[plane] + dcb->txb_offset[plane]; |
136 | 16.6M | uint16_t *const eob = &(eob_data->eob); |
137 | 16.6M | uint16_t *const max_scan_line = &(eob_data->max_scan_line); |
138 | 16.6M | *max_scan_line = 0; |
139 | 16.6M | *eob = 0; |
140 | | |
141 | | #if CONFIG_INSPECTION |
142 | | if (plane == 0) { |
143 | | const int txk_type_idx = |
144 | | av1_get_txk_type_index(mbmi->bsize, blk_row, blk_col); |
145 | | mbmi->tx_skip[txk_type_idx] = all_zero; |
146 | | } |
147 | | #endif |
148 | | |
149 | 16.6M | if (all_zero) { |
150 | 10.3M | *max_scan_line = 0; |
151 | 10.3M | if (plane == 0) { |
152 | 3.09M | xd->tx_type_map[blk_row * xd->tx_type_map_stride + blk_col] = DCT_DCT; |
153 | 3.09M | } |
154 | 10.3M | return 0; |
155 | 10.3M | } |
156 | | |
157 | 6.33M | if (plane == AOM_PLANE_Y) { |
158 | | // only y plane's tx_type is transmitted |
159 | 3.11M | av1_read_tx_type(cm, xd, blk_row, blk_col, tx_size, r); |
160 | 3.11M | } |
161 | 6.33M | const TX_TYPE tx_type = |
162 | 6.33M | av1_get_tx_type(xd, plane_type, blk_row, blk_col, tx_size, |
163 | 6.33M | cm->features.reduced_tx_set_used); |
164 | 6.33M | const TX_CLASS tx_class = tx_type_to_class[tx_type]; |
165 | 6.33M | const qm_val_t *iqmatrix = |
166 | 6.33M | av1_get_iqmatrix(&cm->quant_params, xd, plane, tx_size, tx_type); |
167 | 6.33M | const SCAN_ORDER *const scan_order = get_scan(tx_size, tx_type); |
168 | 6.33M | const int16_t *const scan = scan_order->scan; |
169 | 6.33M | int eob_extra = 0; |
170 | 6.33M | int eob_pt = 1; |
171 | | |
172 | 6.33M | const int eob_multi_size = txsize_log2_minus4[tx_size]; |
173 | 6.33M | const int eob_multi_ctx = (tx_class == TX_CLASS_2D) ? 0 : 1; |
174 | 6.33M | switch (eob_multi_size) { |
175 | 3.94M | case 0: |
176 | 3.94M | eob_pt = |
177 | 3.94M | aom_read_symbol(r, ec_ctx->eob_flag_cdf16[plane_type][eob_multi_ctx], |
178 | 3.94M | 5, ACCT_STR) + |
179 | 3.94M | 1; |
180 | 3.94M | break; |
181 | 359k | case 1: |
182 | 359k | eob_pt = |
183 | 359k | aom_read_symbol(r, ec_ctx->eob_flag_cdf32[plane_type][eob_multi_ctx], |
184 | 359k | 6, ACCT_STR) + |
185 | 359k | 1; |
186 | 359k | break; |
187 | 867k | case 2: |
188 | 867k | eob_pt = |
189 | 867k | aom_read_symbol(r, ec_ctx->eob_flag_cdf64[plane_type][eob_multi_ctx], |
190 | 867k | 7, ACCT_STR) + |
191 | 867k | 1; |
192 | 867k | break; |
193 | 385k | case 3: |
194 | 385k | eob_pt = |
195 | 385k | aom_read_symbol(r, ec_ctx->eob_flag_cdf128[plane_type][eob_multi_ctx], |
196 | 385k | 8, ACCT_STR) + |
197 | 385k | 1; |
198 | 385k | break; |
199 | 365k | case 4: |
200 | 365k | eob_pt = |
201 | 365k | aom_read_symbol(r, ec_ctx->eob_flag_cdf256[plane_type][eob_multi_ctx], |
202 | 365k | 9, ACCT_STR) + |
203 | 365k | 1; |
204 | 365k | break; |
205 | 120k | case 5: |
206 | 120k | eob_pt = |
207 | 120k | aom_read_symbol(r, ec_ctx->eob_flag_cdf512[plane_type][eob_multi_ctx], |
208 | 120k | 10, ACCT_STR) + |
209 | 120k | 1; |
210 | 120k | break; |
211 | 180k | case 6: |
212 | 180k | default: |
213 | 180k | eob_pt = aom_read_symbol( |
214 | 180k | r, ec_ctx->eob_flag_cdf1024[plane_type][eob_multi_ctx], 11, |
215 | 180k | ACCT_STR) + |
216 | 180k | 1; |
217 | 180k | break; |
218 | 6.33M | } |
219 | | |
220 | 6.20M | const int eob_offset_bits = av1_eob_offset_bits[eob_pt]; |
221 | 6.20M | if (eob_offset_bits > 0) { |
222 | 3.55M | const int eob_ctx = eob_pt - 3; |
223 | 3.55M | int bit = aom_read_symbol( |
224 | 3.55M | r, ec_ctx->eob_extra_cdf[txs_ctx][plane_type][eob_ctx], 2, ACCT_STR); |
225 | 3.55M | if (bit) { |
226 | 2.15M | eob_extra += (1 << (eob_offset_bits - 1)); |
227 | 2.15M | } |
228 | | |
229 | 12.2M | for (int i = 1; i < eob_offset_bits; i++) { |
230 | 8.72M | bit = aom_read_bit(r, ACCT_STR); |
231 | 8.72M | if (bit) { |
232 | 4.79M | eob_extra += (1 << (eob_offset_bits - 1 - i)); |
233 | 4.79M | } |
234 | 8.72M | } |
235 | 3.55M | } |
236 | 6.20M | *eob = rec_eob_pos(eob_pt, eob_extra); |
237 | | |
238 | 6.20M | if (*eob > 1) { |
239 | 3.68M | memset(levels_buf, 0, |
240 | 3.68M | sizeof(*levels_buf) * |
241 | 3.68M | ((height + TX_PAD_HOR) * (width + TX_PAD_VER) + TX_PAD_END)); |
242 | 3.68M | } |
243 | | |
244 | 6.20M | { |
245 | | // Read the non-zero coefficient with scan index eob-1 |
246 | | // TODO(angiebird): Put this into a function |
247 | 6.20M | const int c = *eob - 1; |
248 | 6.20M | const int pos = scan[c]; |
249 | 6.20M | const int coeff_ctx = get_lower_levels_ctx_eob(bhl, width, c); |
250 | 6.20M | const int nsymbs = 3; |
251 | 6.20M | aom_cdf_prob *cdf = |
252 | 6.20M | ec_ctx->coeff_base_eob_cdf[txs_ctx][plane_type][coeff_ctx]; |
253 | 6.20M | int level = aom_read_symbol(r, cdf, nsymbs, ACCT_STR) + 1; |
254 | 6.20M | if (level > NUM_BASE_LEVELS) { |
255 | 597k | const int br_ctx = get_br_ctx_eob(pos, bhl, tx_class); |
256 | 597k | cdf = ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type][br_ctx]; |
257 | 1.72M | for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
258 | 1.49M | const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
259 | 1.49M | level += k; |
260 | 1.49M | if (k < BR_CDF_SIZE - 1) break; |
261 | 1.49M | } |
262 | 597k | } |
263 | 6.20M | levels[get_padded_idx(pos, bhl)] = level; |
264 | 6.20M | } |
265 | 6.20M | if (*eob > 1) { |
266 | 3.68M | base_cdf_arr base_cdf = ec_ctx->coeff_base_cdf[txs_ctx][plane_type]; |
267 | 3.68M | br_cdf_arr br_cdf = |
268 | 3.68M | ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type]; |
269 | 3.68M | if (tx_class == TX_CLASS_2D) { |
270 | 3.54M | read_coeffs_reverse_2d(r, tx_size, 1, *eob - 1 - 1, scan, bhl, levels, |
271 | 3.54M | base_cdf, br_cdf); |
272 | 3.54M | read_coeffs_reverse(r, tx_size, tx_class, 0, 0, scan, bhl, levels, |
273 | 3.54M | base_cdf, br_cdf); |
274 | 3.54M | } else { |
275 | 137k | read_coeffs_reverse(r, tx_size, tx_class, 0, *eob - 1 - 1, scan, bhl, |
276 | 137k | levels, base_cdf, br_cdf); |
277 | 137k | } |
278 | 3.68M | } |
279 | | |
280 | 123M | for (int c = 0; c < *eob; ++c) { |
281 | 117M | const int pos = scan[c]; |
282 | 117M | uint8_t sign; |
283 | 117M | tran_low_t level = levels[get_padded_idx(pos, bhl)]; |
284 | 117M | if (level) { |
285 | 53.3M | *max_scan_line = AOMMAX(*max_scan_line, pos); |
286 | 53.3M | if (c == 0) { |
287 | 5.41M | const int dc_sign_ctx = txb_ctx->dc_sign_ctx; |
288 | 5.41M | sign = aom_read_symbol(r, ec_ctx->dc_sign_cdf[plane_type][dc_sign_ctx], |
289 | 5.41M | 2, ACCT_STR); |
290 | 47.8M | } else { |
291 | 47.8M | sign = aom_read_bit(r, ACCT_STR); |
292 | 47.8M | } |
293 | 53.3M | if (level >= MAX_BASE_BR_RANGE) { |
294 | 2.71M | level += read_golomb(xd, r); |
295 | 2.71M | } |
296 | | |
297 | 53.3M | if (c == 0) dc_val = sign ? -level : level; |
298 | | |
299 | | // Bitmasking to clamp level to valid range: |
300 | | // The valid range for 8/10/12 bit vdieo is at most 14/16/18 bit |
301 | 53.3M | level &= 0xfffff; |
302 | 53.3M | cul_level += level; |
303 | 53.3M | tran_low_t dq_coeff; |
304 | | // Bitmasking to clamp dq_coeff to valid range: |
305 | | // The valid range for 8/10/12 bit video is at most 17/19/21 bit |
306 | 53.3M | dq_coeff = |
307 | 53.3M | (tran_low_t)((int64_t)level * get_dqv(dequant, scan[c], iqmatrix) & |
308 | 53.3M | 0xffffff); |
309 | 53.3M | dq_coeff = dq_coeff >> shift; |
310 | 53.3M | if (sign) { |
311 | 26.4M | dq_coeff = -dq_coeff; |
312 | 26.4M | } |
313 | 53.3M | tcoeffs[pos] = clamp(dq_coeff, min_value, max_value); |
314 | 53.3M | } |
315 | 117M | } |
316 | | |
317 | 6.20M | cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level); |
318 | | |
319 | | // DC value |
320 | 6.20M | set_dc_sign(&cul_level, dc_val); |
321 | | |
322 | 6.20M | return cul_level; |
323 | 6.33M | } |
324 | | |
325 | | void av1_read_coeffs_txb(const AV1_COMMON *const cm, DecoderCodingBlock *dcb, |
326 | | aom_reader *const r, const int plane, const int row, |
327 | 16.6M | const int col, const TX_SIZE tx_size) { |
328 | | #if TXCOEFF_TIMER |
329 | | struct aom_usec_timer timer; |
330 | | aom_usec_timer_start(&timer); |
331 | | #endif |
332 | 16.6M | MACROBLOCKD *const xd = &dcb->xd; |
333 | 16.6M | MB_MODE_INFO *const mbmi = xd->mi[0]; |
334 | 16.6M | struct macroblockd_plane *const pd = &xd->plane[plane]; |
335 | | |
336 | 16.6M | const BLOCK_SIZE bsize = mbmi->bsize; |
337 | 16.6M | assert(bsize < BLOCK_SIZES_ALL); |
338 | 16.6M | const BLOCK_SIZE plane_bsize = |
339 | 16.6M | get_plane_block_size(bsize, pd->subsampling_x, pd->subsampling_y); |
340 | | |
341 | 16.6M | TXB_CTX txb_ctx; |
342 | 16.6M | get_txb_ctx(plane_bsize, tx_size, plane, pd->above_entropy_context + col, |
343 | 16.6M | pd->left_entropy_context + row, &txb_ctx); |
344 | 16.6M | const uint8_t cul_level = |
345 | 16.6M | read_coeffs_txb(cm, dcb, r, row, col, plane, &txb_ctx, tx_size); |
346 | 16.6M | av1_set_entropy_contexts(xd, pd, plane, plane_bsize, tx_size, cul_level, col, |
347 | 16.6M | row); |
348 | | |
349 | 16.6M | if (is_inter_block(mbmi)) { |
350 | 282k | const PLANE_TYPE plane_type = get_plane_type(plane); |
351 | | // tx_type will be read out in av1_read_coeffs_txb_facade |
352 | 282k | const TX_TYPE tx_type = av1_get_tx_type(xd, plane_type, row, col, tx_size, |
353 | 282k | cm->features.reduced_tx_set_used); |
354 | | |
355 | 282k | if (plane == 0) { |
356 | 133k | const int txw = tx_size_wide_unit[tx_size]; |
357 | 133k | const int txh = tx_size_high_unit[tx_size]; |
358 | | // The 16x16 unit is due to the constraint from tx_64x64 which sets the |
359 | | // maximum tx size for chroma as 32x32. Coupled with 4x1 transform block |
360 | | // size, the constraint takes effect in 32x16 / 16x32 size too. To solve |
361 | | // the intricacy, cover all the 16x16 units inside a 64 level transform. |
362 | 133k | if (txw == tx_size_wide_unit[TX_64X64] || |
363 | 133k | txh == tx_size_high_unit[TX_64X64]) { |
364 | 5.94k | const int tx_unit = tx_size_wide_unit[TX_16X16]; |
365 | 5.94k | const int stride = xd->tx_type_map_stride; |
366 | 28.0k | for (int idy = 0; idy < txh; idy += tx_unit) { |
367 | 105k | for (int idx = 0; idx < txw; idx += tx_unit) { |
368 | 83.4k | xd->tx_type_map[(row + idy) * stride + col + idx] = tx_type; |
369 | 83.4k | } |
370 | 22.0k | } |
371 | 5.94k | } |
372 | 133k | } |
373 | 282k | } |
374 | | |
375 | | #if TXCOEFF_TIMER |
376 | | aom_usec_timer_mark(&timer); |
377 | | const int64_t elapsed_time = aom_usec_timer_elapsed(&timer); |
378 | | cm->txcoeff_timer += elapsed_time; |
379 | | ++cm->txb_count; |
380 | | #endif |
381 | 16.6M | } |