/src/aom/av1/decoder/decodetxb.c
Line | Count | Source |
1 | | /* |
2 | | * Copyright (c) 2017, Alliance for Open Media. All rights reserved. |
3 | | * |
4 | | * This source code is subject to the terms of the BSD 2 Clause License and |
5 | | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
6 | | * was not distributed with this source code in the LICENSE file, you can |
7 | | * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
8 | | * Media Patent License 1.0 was not distributed with this source code in the |
9 | | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
10 | | */ |
11 | | |
12 | | #include "av1/decoder/decodetxb.h" |
13 | | |
14 | | #include "aom_ports/mem.h" |
15 | | #include "av1/common/idct.h" |
16 | | #include "av1/common/scan.h" |
17 | | #include "av1/common/txb_common.h" |
18 | | #include "av1/decoder/decodemv.h" |
19 | | |
20 | | #define ACCT_STR __func__ |
21 | | |
22 | 2.99M | static int read_golomb(MACROBLOCKD *xd, aom_reader *r) { |
23 | 2.99M | int x = 1; |
24 | 2.99M | int length = 0; |
25 | 2.99M | int i = 0; |
26 | | |
27 | 9.20M | while (!i) { |
28 | 6.20M | i = aom_read_bit(r, ACCT_STR); |
29 | 6.20M | ++length; |
30 | 6.20M | if (length > 20) { |
31 | 436 | aom_internal_error(xd->error_info, AOM_CODEC_CORRUPT_FRAME, |
32 | 436 | "Invalid length in read_golomb"); |
33 | 436 | } |
34 | 6.20M | } |
35 | | |
36 | 6.19M | for (i = 0; i < length - 1; ++i) { |
37 | 3.20M | x <<= 1; |
38 | 3.20M | x += aom_read_bit(r, ACCT_STR); |
39 | 3.20M | } |
40 | | |
41 | 2.99M | return x - 1; |
42 | 2.99M | } |
43 | | |
44 | 11.2M | static inline int rec_eob_pos(const int eob_token, const int extra) { |
45 | 11.2M | int eob = av1_eob_group_start[eob_token]; |
46 | 11.2M | if (eob > 2) { |
47 | 7.55M | eob += extra; |
48 | 7.55M | } |
49 | 11.2M | return eob; |
50 | 11.2M | } |
51 | | |
52 | | static inline int get_dqv(const int16_t *dequant, int coeff_idx, |
53 | 99.6M | const qm_val_t *iqmatrix) { |
54 | 99.6M | int dqv = dequant[!!coeff_idx]; |
55 | 99.6M | if (iqmatrix != NULL) |
56 | 20.3M | dqv = |
57 | 20.3M | ((iqmatrix[coeff_idx] * dqv) + (1 << (AOM_QM_BITS - 1))) >> AOM_QM_BITS; |
58 | 99.6M | return dqv; |
59 | 99.6M | } |
60 | | |
61 | | static inline void read_coeffs_reverse_2d(aom_reader *r, TX_SIZE tx_size, |
62 | | int start_si, int end_si, |
63 | | const int16_t *scan, int bhl, |
64 | | uint8_t *levels, |
65 | | base_cdf_arr base_cdf, |
66 | 7.40M | br_cdf_arr br_cdf) { |
67 | 220M | for (int c = end_si; c >= start_si; --c) { |
68 | 213M | const int pos = scan[c]; |
69 | 213M | const int coeff_ctx = get_lower_levels_ctx_2d(levels, pos, bhl, tx_size); |
70 | 213M | const int nsymbs = 4; |
71 | 213M | int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR); |
72 | 213M | if (level > NUM_BASE_LEVELS) { |
73 | 21.3M | const int br_ctx = get_br_ctx_2d(levels, pos, bhl); |
74 | 21.3M | aom_cdf_prob *cdf = br_cdf[br_ctx]; |
75 | 39.4M | for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
76 | 36.8M | const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
77 | 36.8M | level += k; |
78 | 36.8M | if (k < BR_CDF_SIZE - 1) break; |
79 | 36.8M | } |
80 | 21.3M | } |
81 | 213M | levels[get_padded_idx(pos, bhl)] = level; |
82 | 213M | } |
83 | 7.40M | } |
84 | | |
85 | | static inline void read_coeffs_reverse(aom_reader *r, TX_SIZE tx_size, |
86 | | TX_CLASS tx_class, int start_si, |
87 | | int end_si, const int16_t *scan, int bhl, |
88 | | uint8_t *levels, base_cdf_arr base_cdf, |
89 | 7.92M | br_cdf_arr br_cdf) { |
90 | 27.5M | for (int c = end_si; c >= start_si; --c) { |
91 | 19.6M | const int pos = scan[c]; |
92 | 19.6M | const int coeff_ctx = |
93 | 19.6M | get_lower_levels_ctx(levels, pos, bhl, tx_size, tx_class); |
94 | 19.6M | const int nsymbs = 4; |
95 | 19.6M | int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR); |
96 | 19.6M | if (level > NUM_BASE_LEVELS) { |
97 | 3.64M | const int br_ctx = get_br_ctx(levels, pos, bhl, tx_class); |
98 | 3.64M | aom_cdf_prob *cdf = br_cdf[br_ctx]; |
99 | 6.99M | for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
100 | 6.58M | const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
101 | 6.58M | level += k; |
102 | 6.58M | if (k < BR_CDF_SIZE - 1) break; |
103 | 6.58M | } |
104 | 3.64M | } |
105 | 19.6M | levels[get_padded_idx(pos, bhl)] = level; |
106 | 19.6M | } |
107 | 7.92M | } |
108 | | |
109 | | static uint8_t read_coeffs_txb(const AV1_COMMON *const cm, |
110 | | DecoderCodingBlock *dcb, aom_reader *const r, |
111 | | const int blk_row, const int blk_col, |
112 | | const int plane, const TXB_CTX *const txb_ctx, |
113 | 21.0M | const TX_SIZE tx_size) { |
114 | 21.0M | MACROBLOCKD *const xd = &dcb->xd; |
115 | 21.0M | FRAME_CONTEXT *const ec_ctx = xd->tile_ctx; |
116 | 21.0M | const int32_t max_value = (1 << (7 + xd->bd)) - 1; |
117 | 21.0M | const int32_t min_value = -(1 << (7 + xd->bd)); |
118 | 21.0M | const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size); |
119 | 21.0M | const PLANE_TYPE plane_type = get_plane_type(plane); |
120 | 21.0M | MB_MODE_INFO *const mbmi = xd->mi[0]; |
121 | 21.0M | struct macroblockd_plane *const pd = &xd->plane[plane]; |
122 | 21.0M | const int16_t *const dequant = pd->seg_dequant_QTX[mbmi->segment_id]; |
123 | 21.0M | tran_low_t *const tcoeffs = dcb->dqcoeff_block[plane] + dcb->cb_offset[plane]; |
124 | 21.0M | const int shift = av1_get_tx_scale(tx_size); |
125 | 21.0M | const int bhl = get_txb_bhl(tx_size); |
126 | 21.0M | const int width = get_txb_wide(tx_size); |
127 | 21.0M | const int height = get_txb_high(tx_size); |
128 | 21.0M | int cul_level = 0; |
129 | 21.0M | int dc_val = 0; |
130 | 21.0M | uint8_t levels_buf[TX_PAD_2D]; |
131 | 21.0M | uint8_t *const levels = set_levels(levels_buf, height); |
132 | 21.0M | const int all_zero = aom_read_symbol( |
133 | 21.0M | r, ec_ctx->txb_skip_cdf[txs_ctx][txb_ctx->txb_skip_ctx], 2, ACCT_STR); |
134 | 21.0M | eob_info *eob_data = dcb->eob_data[plane] + dcb->txb_offset[plane]; |
135 | 21.0M | uint16_t *const eob = &(eob_data->eob); |
136 | 21.0M | uint16_t *const max_scan_line = &(eob_data->max_scan_line); |
137 | 21.0M | *max_scan_line = 0; |
138 | 21.0M | *eob = 0; |
139 | | |
140 | | #if CONFIG_INSPECTION |
141 | | if (plane == 0) { |
142 | | const int txk_type_idx = |
143 | | av1_get_txk_type_index(mbmi->bsize, blk_row, blk_col); |
144 | | mbmi->tx_skip[txk_type_idx] = all_zero; |
145 | | } |
146 | | #endif |
147 | | |
148 | 21.0M | if (all_zero) { |
149 | 9.84M | *max_scan_line = 0; |
150 | 9.84M | if (plane == 0) { |
151 | 2.87M | xd->tx_type_map[blk_row * xd->tx_type_map_stride + blk_col] = DCT_DCT; |
152 | 2.87M | } |
153 | 9.84M | return 0; |
154 | 9.84M | } |
155 | | |
156 | 11.2M | if (plane == AOM_PLANE_Y) { |
157 | | // only y plane's tx_type is transmitted |
158 | 6.69M | av1_read_tx_type(cm, xd, blk_row, blk_col, tx_size, r); |
159 | 6.69M | } |
160 | 11.2M | const TX_TYPE tx_type = |
161 | 11.2M | av1_get_tx_type(xd, plane_type, blk_row, blk_col, tx_size, |
162 | 11.2M | cm->features.reduced_tx_set_used); |
163 | 11.2M | const TX_CLASS tx_class = tx_type_to_class[tx_type]; |
164 | 11.2M | const qm_val_t *iqmatrix = |
165 | 11.2M | av1_get_iqmatrix(&cm->quant_params, xd, plane, tx_size, tx_type); |
166 | 11.2M | const SCAN_ORDER *const scan_order = get_scan(tx_size, tx_type); |
167 | 11.2M | const int16_t *const scan = scan_order->scan; |
168 | 11.2M | int eob_extra = 0; |
169 | 11.2M | int eob_pt = 1; |
170 | | |
171 | 11.2M | const int eob_multi_size = txsize_log2_minus4[tx_size]; |
172 | 11.2M | const int eob_multi_ctx = (tx_class == TX_CLASS_2D) ? 0 : 1; |
173 | 11.2M | switch (eob_multi_size) { |
174 | 4.19M | case 0: |
175 | 4.19M | eob_pt = |
176 | 4.19M | aom_read_symbol(r, ec_ctx->eob_flag_cdf16[plane_type][eob_multi_ctx], |
177 | 4.19M | 5, ACCT_STR) + |
178 | 4.19M | 1; |
179 | 4.19M | break; |
180 | 999k | case 1: |
181 | 999k | eob_pt = |
182 | 999k | aom_read_symbol(r, ec_ctx->eob_flag_cdf32[plane_type][eob_multi_ctx], |
183 | 999k | 6, ACCT_STR) + |
184 | 999k | 1; |
185 | 999k | break; |
186 | 2.41M | case 2: |
187 | 2.41M | eob_pt = |
188 | 2.41M | aom_read_symbol(r, ec_ctx->eob_flag_cdf64[plane_type][eob_multi_ctx], |
189 | 2.41M | 7, ACCT_STR) + |
190 | 2.41M | 1; |
191 | 2.41M | break; |
192 | 891k | case 3: |
193 | 891k | eob_pt = |
194 | 891k | aom_read_symbol(r, ec_ctx->eob_flag_cdf128[plane_type][eob_multi_ctx], |
195 | 891k | 8, ACCT_STR) + |
196 | 891k | 1; |
197 | 891k | break; |
198 | 1.35M | case 4: |
199 | 1.35M | eob_pt = |
200 | 1.35M | aom_read_symbol(r, ec_ctx->eob_flag_cdf256[plane_type][eob_multi_ctx], |
201 | 1.35M | 9, ACCT_STR) + |
202 | 1.35M | 1; |
203 | 1.35M | break; |
204 | 343k | case 5: |
205 | 343k | eob_pt = |
206 | 343k | aom_read_symbol(r, ec_ctx->eob_flag_cdf512[plane_type][eob_multi_ctx], |
207 | 343k | 10, ACCT_STR) + |
208 | 343k | 1; |
209 | 343k | break; |
210 | 1.02M | case 6: |
211 | 1.02M | default: |
212 | 1.02M | eob_pt = aom_read_symbol( |
213 | 1.02M | r, ec_ctx->eob_flag_cdf1024[plane_type][eob_multi_ctx], 11, |
214 | 1.02M | ACCT_STR) + |
215 | 1.02M | 1; |
216 | 1.02M | break; |
217 | 11.2M | } |
218 | | |
219 | 11.2M | const int eob_offset_bits = av1_eob_offset_bits[eob_pt]; |
220 | 11.2M | if (eob_offset_bits > 0) { |
221 | 7.55M | const int eob_ctx = eob_pt - 3; |
222 | 7.55M | int bit = aom_read_symbol( |
223 | 7.55M | r, ec_ctx->eob_extra_cdf[txs_ctx][plane_type][eob_ctx], 2, ACCT_STR); |
224 | 7.55M | if (bit) { |
225 | 3.52M | eob_extra += (1 << (eob_offset_bits - 1)); |
226 | 3.52M | } |
227 | | |
228 | 25.6M | for (int i = 1; i < eob_offset_bits; i++) { |
229 | 18.0M | bit = aom_read_bit(r, ACCT_STR); |
230 | 18.0M | if (bit) { |
231 | 9.09M | eob_extra += (1 << (eob_offset_bits - 1 - i)); |
232 | 9.09M | } |
233 | 18.0M | } |
234 | 7.55M | } |
235 | 11.2M | *eob = rec_eob_pos(eob_pt, eob_extra); |
236 | | |
237 | 11.2M | if (*eob > 1) { |
238 | 7.92M | memset(levels_buf, 0, |
239 | 7.92M | sizeof(*levels_buf) * |
240 | 7.92M | ((height + TX_PAD_HOR) * (width + TX_PAD_VER) + TX_PAD_END)); |
241 | 7.92M | } |
242 | | |
243 | 11.2M | { |
244 | | // Read the non-zero coefficient with scan index eob-1 |
245 | | // TODO(angiebird): Put this into a function |
246 | 11.2M | const int c = *eob - 1; |
247 | 11.2M | const int pos = scan[c]; |
248 | 11.2M | const int coeff_ctx = get_lower_levels_ctx_eob(bhl, width, c); |
249 | 11.2M | const int nsymbs = 3; |
250 | 11.2M | aom_cdf_prob *cdf = |
251 | 11.2M | ec_ctx->coeff_base_eob_cdf[txs_ctx][plane_type][coeff_ctx]; |
252 | 11.2M | int level = aom_read_symbol(r, cdf, nsymbs, ACCT_STR) + 1; |
253 | 11.2M | if (level > NUM_BASE_LEVELS) { |
254 | 478k | const int br_ctx = get_br_ctx_eob(pos, bhl, tx_class); |
255 | 478k | cdf = ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type][br_ctx]; |
256 | 782k | for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) { |
257 | 749k | const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR); |
258 | 749k | level += k; |
259 | 749k | if (k < BR_CDF_SIZE - 1) break; |
260 | 749k | } |
261 | 478k | } |
262 | 11.2M | levels[get_padded_idx(pos, bhl)] = level; |
263 | 11.2M | } |
264 | 11.2M | if (*eob > 1) { |
265 | 7.92M | base_cdf_arr base_cdf = ec_ctx->coeff_base_cdf[txs_ctx][plane_type]; |
266 | 7.92M | br_cdf_arr br_cdf = |
267 | 7.92M | ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type]; |
268 | 7.92M | if (tx_class == TX_CLASS_2D) { |
269 | 7.40M | read_coeffs_reverse_2d(r, tx_size, 1, *eob - 1 - 1, scan, bhl, levels, |
270 | 7.40M | base_cdf, br_cdf); |
271 | 7.40M | read_coeffs_reverse(r, tx_size, tx_class, 0, 0, scan, bhl, levels, |
272 | 7.40M | base_cdf, br_cdf); |
273 | 7.40M | } else { |
274 | 515k | read_coeffs_reverse(r, tx_size, tx_class, 0, *eob - 1 - 1, scan, bhl, |
275 | 515k | levels, base_cdf, br_cdf); |
276 | 515k | } |
277 | 7.92M | } |
278 | | |
279 | 255M | for (int c = 0; c < *eob; ++c) { |
280 | 244M | const int pos = scan[c]; |
281 | 244M | uint8_t sign; |
282 | 244M | tran_low_t level = levels[get_padded_idx(pos, bhl)]; |
283 | 244M | if (level) { |
284 | 99.6M | *max_scan_line = AOMMAX(*max_scan_line, pos); |
285 | 99.6M | if (c == 0) { |
286 | 9.20M | const int dc_sign_ctx = txb_ctx->dc_sign_ctx; |
287 | 9.20M | sign = aom_read_symbol(r, ec_ctx->dc_sign_cdf[plane_type][dc_sign_ctx], |
288 | 9.20M | 2, ACCT_STR); |
289 | 90.4M | } else { |
290 | 90.4M | sign = aom_read_bit(r, ACCT_STR); |
291 | 90.4M | } |
292 | 99.6M | if (level >= MAX_BASE_BR_RANGE) { |
293 | 2.99M | level += read_golomb(xd, r); |
294 | 2.99M | } |
295 | | |
296 | 99.6M | if (c == 0) dc_val = sign ? -level : level; |
297 | | |
298 | | // Bitmasking to clamp level to valid range: |
299 | | // The valid range for 8/10/12 bit video is at most 14/16/18 bit |
300 | 99.6M | level &= 0xfffff; |
301 | 99.6M | cul_level += level; |
302 | 99.6M | tran_low_t dq_coeff; |
303 | | // Bitmasking to clamp dq_coeff to valid range: |
304 | | // The valid range for 8/10/12 bit video is at most 17/19/21 bit |
305 | 99.6M | dq_coeff = |
306 | 99.6M | (tran_low_t)((int64_t)level * get_dqv(dequant, scan[c], iqmatrix) & |
307 | 99.6M | 0xffffff); |
308 | 99.6M | dq_coeff = dq_coeff >> shift; |
309 | 99.6M | if (sign) { |
310 | 48.9M | dq_coeff = -dq_coeff; |
311 | 48.9M | } |
312 | 99.6M | tcoeffs[pos] = clamp(dq_coeff, min_value, max_value); |
313 | 99.6M | } |
314 | 244M | } |
315 | | |
316 | 11.2M | cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level); |
317 | | |
318 | | // DC value |
319 | 11.2M | set_dc_sign(&cul_level, dc_val); |
320 | | |
321 | 11.2M | return cul_level; |
322 | 11.2M | } |
323 | | |
324 | | void av1_read_coeffs_txb(const AV1_COMMON *const cm, DecoderCodingBlock *dcb, |
325 | | aom_reader *const r, const int plane, const int row, |
326 | 21.0M | const int col, const TX_SIZE tx_size) { |
327 | | #if TXCOEFF_TIMER |
328 | | struct aom_usec_timer timer; |
329 | | aom_usec_timer_start(&timer); |
330 | | #endif |
331 | 21.0M | MACROBLOCKD *const xd = &dcb->xd; |
332 | 21.0M | MB_MODE_INFO *const mbmi = xd->mi[0]; |
333 | 21.0M | struct macroblockd_plane *const pd = &xd->plane[plane]; |
334 | | |
335 | 21.0M | const BLOCK_SIZE bsize = mbmi->bsize; |
336 | 21.0M | assert(bsize < BLOCK_SIZES_ALL); |
337 | 21.0M | const BLOCK_SIZE plane_bsize = |
338 | 21.0M | get_plane_block_size(bsize, pd->subsampling_x, pd->subsampling_y); |
339 | | |
340 | 21.0M | TXB_CTX txb_ctx; |
341 | 21.0M | get_txb_ctx(plane_bsize, tx_size, plane, pd->above_entropy_context + col, |
342 | 21.0M | pd->left_entropy_context + row, &txb_ctx); |
343 | | |
344 | 21.0M | assert(dcb->xd.error_info->setjmp); |
345 | 21.0M | const uint8_t cul_level = |
346 | 21.0M | read_coeffs_txb(cm, dcb, r, row, col, plane, &txb_ctx, tx_size); |
347 | 21.0M | av1_set_entropy_contexts(xd, pd, plane, plane_bsize, tx_size, cul_level, col, |
348 | 21.0M | row); |
349 | | |
350 | 21.0M | if (is_inter_block(mbmi)) { |
351 | 286k | const PLANE_TYPE plane_type = get_plane_type(plane); |
352 | | // tx_type will be read out in av1_read_coeffs_txb_facade |
353 | 286k | const TX_TYPE tx_type = av1_get_tx_type(xd, plane_type, row, col, tx_size, |
354 | 286k | cm->features.reduced_tx_set_used); |
355 | | |
356 | 286k | if (plane == 0) { |
357 | 135k | const int txw = tx_size_wide_unit[tx_size]; |
358 | 135k | const int txh = tx_size_high_unit[tx_size]; |
359 | | // The 16x16 unit is due to the constraint from tx_64x64 which sets the |
360 | | // maximum tx size for chroma as 32x32. Coupled with 4x1 transform block |
361 | | // size, the constraint takes effect in 32x16 / 16x32 size too. To solve |
362 | | // the intricacy, cover all the 16x16 units inside a 64 level transform. |
363 | 135k | if (txw == tx_size_wide_unit[TX_64X64] || |
364 | 133k | txh == tx_size_high_unit[TX_64X64]) { |
365 | 1.94k | const int tx_unit = tx_size_wide_unit[TX_16X16]; |
366 | 1.94k | const int stride = xd->tx_type_map_stride; |
367 | 8.89k | for (int idy = 0; idy < txh; idy += tx_unit) { |
368 | 31.2k | for (int idx = 0; idx < txw; idx += tx_unit) { |
369 | 24.3k | xd->tx_type_map[(row + idy) * stride + col + idx] = tx_type; |
370 | 24.3k | } |
371 | 6.95k | } |
372 | 1.94k | } |
373 | 135k | } |
374 | 286k | } |
375 | | |
376 | | #if TXCOEFF_TIMER |
377 | | aom_usec_timer_mark(&timer); |
378 | | const int64_t elapsed_time = aom_usec_timer_elapsed(&timer); |
379 | | cm->txcoeff_timer += elapsed_time; |
380 | | ++cm->txb_count; |
381 | | #endif |
382 | 21.0M | } |