/src/aom/av1/common/mvref_common.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | * Copyright (c) 2016, Alliance for Open Media. All rights reserved. |
3 | | * |
4 | | * This source code is subject to the terms of the BSD 2 Clause License and |
5 | | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
6 | | * was not distributed with this source code in the LICENSE file, you can |
7 | | * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
8 | | * Media Patent License 1.0 was not distributed with this source code in the |
9 | | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
10 | | */ |
11 | | |
12 | | #include <stdlib.h> |
13 | | |
14 | | #include "av1/common/mvref_common.h" |
15 | | #include "av1/common/warped_motion.h" |
16 | | |
17 | | // Although we assign 32 bit integers, every value fits in 15 bits: the |
18 | | // largest entry is 16384 (1 << 14). |
19 | | static const int div_mult[32] = { 0, 16384, 8192, 5461, 4096, 3276, 2730, |
20 | | 2340, 2048, 1820, 1638, 1489, 1365, 1260, |
21 | | 1170, 1092, 1024, 963, 910, 862, 819, |
22 | | 780, 744, 712, 682, 655, 630, 606, |
23 | | 585, 564, 546, 528 }; |
24 | | |
25 | | // TODO(jingning): Consider using a lookup table for (num / den) |
26 | | // altogether. |
27 | 19.7M | void av1_get_mv_projection(MV *output, MV ref, int num, int den) { |
28 | 19.7M | den = AOMMIN(den, MAX_FRAME_DISTANCE); |
29 | 19.7M | num = num > 0 ? AOMMIN(num, MAX_FRAME_DISTANCE) |
30 | 19.7M | : AOMMAX(num, -MAX_FRAME_DISTANCE); |
31 | 19.7M | const int mv_row = |
32 | 19.7M | ROUND_POWER_OF_TWO_SIGNED(ref.row * num * div_mult[den], 14); |
33 | 19.7M | const int mv_col = |
34 | 19.7M | ROUND_POWER_OF_TWO_SIGNED(ref.col * num * div_mult[den], 14); |
35 | 19.7M | const int clamp_max = MV_UPP - 1; |
36 | 19.7M | const int clamp_min = MV_LOW + 1; |
37 | 19.7M | output->row = (int16_t)clamp(mv_row, clamp_min, clamp_max); |
38 | 19.7M | output->col = (int16_t)clamp(mv_col, clamp_min, clamp_max); |
39 | 19.7M | } |
40 | | |
41 | | void av1_copy_frame_mvs(const AV1_COMMON *const cm, |
42 | | const MB_MODE_INFO *const mi, int mi_row, int mi_col, |
43 | 5.05M | int x_mis, int y_mis) { |
44 | 5.05M | const int frame_mvs_stride = ROUND_POWER_OF_TWO(cm->mi_params.mi_cols, 1); |
45 | 5.05M | MV_REF *frame_mvs = |
46 | 5.05M | cm->cur_frame->mvs + (mi_row >> 1) * frame_mvs_stride + (mi_col >> 1); |
47 | 5.05M | x_mis = ROUND_POWER_OF_TWO(x_mis, 1); |
48 | 5.05M | y_mis = ROUND_POWER_OF_TWO(y_mis, 1); |
49 | 5.05M | int w, h; |
50 | | |
51 | 15.9M | for (h = 0; h < y_mis; h++) { |
52 | 10.8M | MV_REF *mv = frame_mvs; |
53 | 63.6M | for (w = 0; w < x_mis; w++) { |
54 | 52.7M | mv->ref_frame = NONE_FRAME; |
55 | 52.7M | mv->mv.as_int = 0; |
56 | | |
57 | 158M | for (int idx = 0; idx < 2; ++idx) { |
58 | 105M | MV_REFERENCE_FRAME ref_frame = mi->ref_frame[idx]; |
59 | 105M | if (ref_frame > INTRA_FRAME) { |
60 | 68.8M | int8_t ref_idx = cm->ref_frame_side[ref_frame]; |
61 | 68.8M | if (ref_idx) continue; |
62 | 56.4M | if ((abs(mi->mv[idx].as_mv.row) > REFMVS_LIMIT) || |
63 | 56.4M | (abs(mi->mv[idx].as_mv.col) > REFMVS_LIMIT)) |
64 | 1.70M | continue; |
65 | 54.7M | mv->ref_frame = ref_frame; |
66 | 54.7M | mv->mv.as_int = mi->mv[idx].as_int; |
67 | 54.7M | } |
68 | 105M | } |
69 | 52.7M | mv++; |
70 | 52.7M | } |
71 | 10.8M | frame_mvs += frame_mvs_stride; |
72 | 10.8M | } |
73 | 5.05M | } |
74 | | |
75 | | static inline void add_ref_mv_candidate( |
76 | | const MB_MODE_INFO *const candidate, const MV_REFERENCE_FRAME rf[2], |
77 | | uint8_t *refmv_count, uint8_t *ref_match_count, uint8_t *newmv_count, |
78 | | CANDIDATE_MV *ref_mv_stack, uint16_t *ref_mv_weight, |
79 | | int_mv *gm_mv_candidates, const WarpedMotionParams *gm_params, |
80 | 24.6M | uint16_t weight) { |
81 | 24.6M | if (!is_inter_block(candidate)) return; |
82 | 21.4M | assert(weight % 2 == 0); |
83 | 21.4M | int index, ref; |
84 | | |
85 | 21.4M | if (rf[1] == NONE_FRAME) { |
86 | | // single reference frame |
87 | 55.3M | for (ref = 0; ref < 2; ++ref) { |
88 | 36.8M | if (candidate->ref_frame[ref] == rf[0]) { |
89 | 15.7M | const int is_gm_block = |
90 | 15.7M | is_global_mv_block(candidate, gm_params[rf[0]].wmtype); |
91 | 15.7M | const int_mv this_refmv = |
92 | 15.7M | is_gm_block ? gm_mv_candidates[0] : get_block_mv(candidate, ref); |
93 | 27.7M | for (index = 0; index < *refmv_count; ++index) { |
94 | 20.3M | if (ref_mv_stack[index].this_mv.as_int == this_refmv.as_int) { |
95 | 8.30M | ref_mv_weight[index] += weight; |
96 | 8.30M | break; |
97 | 8.30M | } |
98 | 20.3M | } |
99 | | |
100 | | // Add a new item to the list. |
101 | 15.7M | if (index == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) { |
102 | 7.34M | ref_mv_stack[index].this_mv = this_refmv; |
103 | 7.34M | ref_mv_weight[index] = weight; |
104 | 7.34M | ++(*refmv_count); |
105 | 7.34M | } |
106 | 15.7M | if (have_newmv_in_inter_mode(candidate->mode)) ++*newmv_count; |
107 | 15.7M | ++*ref_match_count; |
108 | 15.7M | } |
109 | 36.8M | } |
110 | 18.4M | } else { |
111 | | // compound reference frame |
112 | 3.04M | if (candidate->ref_frame[0] == rf[0] && candidate->ref_frame[1] == rf[1]) { |
113 | 1.23M | int_mv this_refmv[2]; |
114 | | |
115 | 3.70M | for (ref = 0; ref < 2; ++ref) { |
116 | 2.46M | if (is_global_mv_block(candidate, gm_params[rf[ref]].wmtype)) |
117 | 55.0k | this_refmv[ref] = gm_mv_candidates[ref]; |
118 | 2.41M | else |
119 | 2.41M | this_refmv[ref] = get_block_mv(candidate, ref); |
120 | 2.46M | } |
121 | | |
122 | 1.90M | for (index = 0; index < *refmv_count; ++index) { |
123 | 1.18M | if ((ref_mv_stack[index].this_mv.as_int == this_refmv[0].as_int) && |
124 | 1.18M | (ref_mv_stack[index].comp_mv.as_int == this_refmv[1].as_int)) { |
125 | 511k | ref_mv_weight[index] += weight; |
126 | 511k | break; |
127 | 511k | } |
128 | 1.18M | } |
129 | | |
130 | | // Add a new item to the list. |
131 | 1.23M | if (index == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) { |
132 | 723k | ref_mv_stack[index].this_mv = this_refmv[0]; |
133 | 723k | ref_mv_stack[index].comp_mv = this_refmv[1]; |
134 | 723k | ref_mv_weight[index] = weight; |
135 | 723k | ++(*refmv_count); |
136 | 723k | } |
137 | 1.23M | if (have_newmv_in_inter_mode(candidate->mode)) ++*newmv_count; |
138 | 1.23M | ++*ref_match_count; |
139 | 1.23M | } |
140 | 3.04M | } |
141 | 21.4M | } |
142 | | |
143 | | static inline void scan_row_mbmi(const AV1_COMMON *cm, const MACROBLOCKD *xd, |
144 | | int mi_col, const MV_REFERENCE_FRAME rf[2], |
145 | | int row_offset, CANDIDATE_MV *ref_mv_stack, |
146 | | uint16_t *ref_mv_weight, uint8_t *refmv_count, |
147 | | uint8_t *ref_match_count, uint8_t *newmv_count, |
148 | | int_mv *gm_mv_candidates, int max_row_offset, |
149 | 8.15M | int *processed_rows) { |
150 | 8.15M | int end_mi = AOMMIN(xd->width, cm->mi_params.mi_cols - mi_col); |
151 | 8.15M | end_mi = AOMMIN(end_mi, mi_size_wide[BLOCK_64X64]); |
152 | 8.15M | const int width_8x8 = mi_size_wide[BLOCK_8X8]; |
153 | 8.15M | const int width_16x16 = mi_size_wide[BLOCK_16X16]; |
154 | 8.15M | int col_offset = 0; |
155 | | // TODO(jingning): Revisit this part after cb4x4 is stable. |
156 | 8.15M | if (abs(row_offset) > 1) { |
157 | 4.49M | col_offset = 1; |
158 | 4.49M | if ((mi_col & 0x01) && xd->width < width_8x8) --col_offset; |
159 | 4.49M | } |
160 | 8.15M | const int use_step_16 = (xd->width >= 16); |
161 | 8.15M | MB_MODE_INFO **const candidate_mi0 = xd->mi + row_offset * xd->mi_stride; |
162 | | |
163 | 17.6M | for (int i = 0; i < end_mi;) { |
164 | 9.47M | const MB_MODE_INFO *const candidate = candidate_mi0[col_offset + i]; |
165 | 9.47M | const int candidate_bsize = candidate->bsize; |
166 | 9.47M | const int n4_w = mi_size_wide[candidate_bsize]; |
167 | 9.47M | int len = AOMMIN(xd->width, n4_w); |
168 | 9.47M | if (use_step_16) |
169 | 362k | len = AOMMAX(width_16x16, len); |
170 | 9.11M | else if (abs(row_offset) > 1) |
171 | 5.13M | len = AOMMAX(len, width_8x8); |
172 | | |
173 | 9.47M | uint16_t weight = 2; |
174 | 9.47M | if (xd->width >= width_8x8 && xd->width <= n4_w) { |
175 | 5.09M | uint16_t inc = AOMMIN(-max_row_offset + row_offset + 1, |
176 | 5.09M | mi_size_high[candidate_bsize]); |
177 | | // Obtain range used in weight calculation. |
178 | 5.09M | weight = AOMMAX(weight, inc); |
179 | | // Update processed rows. |
180 | 5.09M | *processed_rows = inc - row_offset - 1; |
181 | 5.09M | } |
182 | | |
183 | 9.47M | add_ref_mv_candidate(candidate, rf, refmv_count, ref_match_count, |
184 | 9.47M | newmv_count, ref_mv_stack, ref_mv_weight, |
185 | 9.47M | gm_mv_candidates, cm->global_motion, len * weight); |
186 | | |
187 | 9.47M | i += len; |
188 | 9.47M | } |
189 | 8.15M | } |
190 | | |
191 | | static inline void scan_col_mbmi(const AV1_COMMON *cm, const MACROBLOCKD *xd, |
192 | | int mi_row, const MV_REFERENCE_FRAME rf[2], |
193 | | int col_offset, CANDIDATE_MV *ref_mv_stack, |
194 | | uint16_t *ref_mv_weight, uint8_t *refmv_count, |
195 | | uint8_t *ref_match_count, uint8_t *newmv_count, |
196 | | int_mv *gm_mv_candidates, int max_col_offset, |
197 | 8.28M | int *processed_cols) { |
198 | 8.28M | int end_mi = AOMMIN(xd->height, cm->mi_params.mi_rows - mi_row); |
199 | 8.28M | end_mi = AOMMIN(end_mi, mi_size_high[BLOCK_64X64]); |
200 | 8.28M | const int n8_h_8 = mi_size_high[BLOCK_8X8]; |
201 | 8.28M | const int n8_h_16 = mi_size_high[BLOCK_16X16]; |
202 | 8.28M | int i; |
203 | 8.28M | int row_offset = 0; |
204 | 8.28M | if (abs(col_offset) > 1) { |
205 | 4.54M | row_offset = 1; |
206 | 4.54M | if ((mi_row & 0x01) && xd->height < n8_h_8) --row_offset; |
207 | 4.54M | } |
208 | 8.28M | const int use_step_16 = (xd->height >= 16); |
209 | | |
210 | 17.9M | for (i = 0; i < end_mi;) { |
211 | 9.63M | const MB_MODE_INFO *const candidate = |
212 | 9.63M | xd->mi[(row_offset + i) * xd->mi_stride + col_offset]; |
213 | 9.63M | const int candidate_bsize = candidate->bsize; |
214 | 9.63M | const int n4_h = mi_size_high[candidate_bsize]; |
215 | 9.63M | int len = AOMMIN(xd->height, n4_h); |
216 | 9.63M | if (use_step_16) |
217 | 414k | len = AOMMAX(n8_h_16, len); |
218 | 9.22M | else if (abs(col_offset) > 1) |
219 | 5.16M | len = AOMMAX(len, n8_h_8); |
220 | | |
221 | 9.63M | int weight = 2; |
222 | 9.63M | if (xd->height >= n8_h_8 && xd->height <= n4_h) { |
223 | 4.66M | int inc = AOMMIN(-max_col_offset + col_offset + 1, |
224 | 4.66M | mi_size_wide[candidate_bsize]); |
225 | | // Obtain range used in weight calculation. |
226 | 4.66M | weight = AOMMAX(weight, inc); |
227 | | // Update processed cols. |
228 | 4.66M | *processed_cols = inc - col_offset - 1; |
229 | 4.66M | } |
230 | | |
231 | 9.63M | add_ref_mv_candidate(candidate, rf, refmv_count, ref_match_count, |
232 | 9.63M | newmv_count, ref_mv_stack, ref_mv_weight, |
233 | 9.63M | gm_mv_candidates, cm->global_motion, len * weight); |
234 | | |
235 | 9.63M | i += len; |
236 | 9.63M | } |
237 | 8.28M | } |
238 | | |
239 | | static inline void scan_blk_mbmi(const AV1_COMMON *cm, const MACROBLOCKD *xd, |
240 | | const int mi_row, const int mi_col, |
241 | | const MV_REFERENCE_FRAME rf[2], int row_offset, |
242 | | int col_offset, CANDIDATE_MV *ref_mv_stack, |
243 | | uint16_t *ref_mv_weight, |
244 | | uint8_t *ref_match_count, uint8_t *newmv_count, |
245 | | int_mv *gm_mv_candidates, |
246 | 6.03M | uint8_t *refmv_count) { |
247 | 6.03M | const TileInfo *const tile = &xd->tile; |
248 | 6.03M | POSITION mi_pos; |
249 | | |
250 | 6.03M | mi_pos.row = row_offset; |
251 | 6.03M | mi_pos.col = col_offset; |
252 | | |
253 | 6.03M | if (is_inside(tile, mi_col, mi_row, &mi_pos)) { |
254 | 5.55M | const MB_MODE_INFO *const candidate = |
255 | 5.55M | xd->mi[mi_pos.row * xd->mi_stride + mi_pos.col]; |
256 | 5.55M | const int len = mi_size_wide[BLOCK_8X8]; |
257 | | |
258 | 5.55M | add_ref_mv_candidate(candidate, rf, refmv_count, ref_match_count, |
259 | 5.55M | newmv_count, ref_mv_stack, ref_mv_weight, |
260 | 5.55M | gm_mv_candidates, cm->global_motion, 2 * len); |
261 | 5.55M | } // Analyze the motion information of a single 8x8 block. |
262 | 6.03M | } |
263 | | |
264 | | static int has_top_right(const AV1_COMMON *cm, const MACROBLOCKD *xd, |
265 | 5.49M | int mi_row, int mi_col, int bs) { |
266 | 5.49M | const int sb_mi_size = mi_size_wide[cm->seq_params->sb_size]; |
267 | 5.49M | const int mask_row = mi_row & (sb_mi_size - 1); |
268 | 5.49M | const int mask_col = mi_col & (sb_mi_size - 1); |
269 | | |
270 | 5.49M | if (bs > mi_size_wide[BLOCK_64X64]) return 0; |
271 | | |
272 | | // In a split partition, all blocks apart from the bottom right have a top right |
273 | 5.26M | int has_tr = !((mask_row & bs) && (mask_col & bs)); |
274 | | |
275 | | // bs > 0 and bs is a power of 2 |
276 | 5.26M | assert(bs > 0 && !(bs & (bs - 1))); |
277 | | |
278 | | // For each 4x4 group of blocks, when the bottom right is decoded, the blocks |
279 | | // to the right have not been decoded; therefore, the bottom right does |
280 | | // not have a top right. |
281 | 7.88M | while (bs < sb_mi_size) { |
282 | 7.41M | if (mask_col & bs) { |
283 | 3.38M | if ((mask_col & (2 * bs)) && (mask_row & (2 * bs))) { |
284 | 764k | has_tr = 0; |
285 | 764k | break; |
286 | 764k | } |
287 | 4.03M | } else { |
288 | 4.03M | break; |
289 | 4.03M | } |
290 | 2.61M | bs <<= 1; |
291 | 2.61M | } |
292 | | |
293 | | // In a VERTICAL or VERTICAL_4 partition, all partitions before the last one |
294 | | // always have a top right (as the block above will have been decoded). |
295 | 5.26M | if (xd->width < xd->height) { |
296 | 1.15M | if (!xd->is_last_vertical_rect) has_tr = 1; |
297 | 1.15M | } |
298 | | |
299 | | // In a HORIZONTAL or HORIZONTAL_4 partition, partitions after the first one |
300 | | // never have a top right (as the block to the right won't have been decoded). |
301 | 5.26M | if (xd->width > xd->height) { |
302 | 1.82M | if (!xd->is_first_horizontal_rect) has_tr = 0; |
303 | 1.82M | } |
304 | | |
305 | | // The bottom left square of a Vertical A (in the old format) does |
306 | | // not have a top right, as it is decoded before the right-hand |
307 | | // rectangle of the partition. |
308 | 5.26M | if (xd->mi[0]->partition == PARTITION_VERT_A) { |
309 | 209k | if (xd->width == xd->height) |
310 | 136k | if (mask_row & bs) has_tr = 0; |
311 | 209k | } |
312 | | |
313 | 5.26M | return has_tr; |
314 | 5.26M | } |
315 | | |
316 | | static int check_sb_border(const int mi_row, const int mi_col, |
317 | 5.02M | const int row_offset, const int col_offset) { |
318 | 5.02M | const int sb_mi_size = mi_size_wide[BLOCK_64X64]; |
319 | 5.02M | const int row = mi_row & (sb_mi_size - 1); |
320 | 5.02M | const int col = mi_col & (sb_mi_size - 1); |
321 | | |
322 | 5.02M | if (row + row_offset < 0 || row + row_offset >= sb_mi_size || |
323 | 5.02M | col + col_offset < 0 || col + col_offset >= sb_mi_size) |
324 | 1.76M | return 0; |
325 | | |
326 | 3.26M | return 1; |
327 | 5.02M | } |
328 | | |
329 | | static int add_tpl_ref_mv(const AV1_COMMON *cm, const MACROBLOCKD *xd, |
330 | | int mi_row, int mi_col, MV_REFERENCE_FRAME ref_frame, |
331 | | int blk_row, int blk_col, int_mv *gm_mv_candidates, |
332 | | uint8_t *const refmv_count, |
333 | | CANDIDATE_MV ref_mv_stack[MAX_REF_MV_STACK_SIZE], |
334 | | uint16_t ref_mv_weight[MAX_REF_MV_STACK_SIZE], |
335 | 13.9M | int16_t *mode_context) { |
336 | 13.9M | POSITION mi_pos; |
337 | 13.9M | mi_pos.row = (mi_row & 0x01) ? blk_row : blk_row + 1; |
338 | 13.9M | mi_pos.col = (mi_col & 0x01) ? blk_col : blk_col + 1; |
339 | | |
340 | 13.9M | if (!is_inside(&xd->tile, mi_col, mi_row, &mi_pos)) return 0; |
341 | | |
342 | 13.7M | const TPL_MV_REF *prev_frame_mvs = |
343 | 13.7M | cm->tpl_mvs + |
344 | 13.7M | ((mi_row + mi_pos.row) >> 1) * (cm->mi_params.mi_stride >> 1) + |
345 | 13.7M | ((mi_col + mi_pos.col) >> 1); |
346 | 13.7M | if (prev_frame_mvs->mfmv0.as_int == INVALID_MV) return 0; |
347 | | |
348 | 1.35M | MV_REFERENCE_FRAME rf[2]; |
349 | 1.35M | av1_set_ref_frame(rf, ref_frame); |
350 | | |
351 | 1.35M | const uint16_t weight_unit = 1; // mi_size_wide[BLOCK_8X8]; |
352 | 1.35M | const int cur_frame_index = cm->cur_frame->order_hint; |
353 | 1.35M | const RefCntBuffer *const buf_0 = get_ref_frame_buf(cm, rf[0]); |
354 | 1.35M | const int frame0_index = buf_0->order_hint; |
355 | 1.35M | const int cur_offset_0 = get_relative_dist(&cm->seq_params->order_hint_info, |
356 | 1.35M | cur_frame_index, frame0_index); |
357 | 1.35M | int idx; |
358 | 1.35M | const int allow_high_precision_mv = cm->features.allow_high_precision_mv; |
359 | 1.35M | const int force_integer_mv = cm->features.cur_frame_force_integer_mv; |
360 | | |
361 | 1.35M | int_mv this_refmv; |
362 | 1.35M | av1_get_mv_projection(&this_refmv.as_mv, prev_frame_mvs->mfmv0.as_mv, |
363 | 1.35M | cur_offset_0, prev_frame_mvs->ref_frame_offset); |
364 | 1.35M | lower_mv_precision(&this_refmv.as_mv, allow_high_precision_mv, |
365 | 1.35M | force_integer_mv); |
366 | | |
367 | 1.35M | if (rf[1] == NONE_FRAME) { |
368 | 707k | if (blk_row == 0 && blk_col == 0) { |
369 | 99.5k | if (abs(this_refmv.as_mv.row - gm_mv_candidates[0].as_mv.row) >= 16 || |
370 | 99.5k | abs(this_refmv.as_mv.col - gm_mv_candidates[0].as_mv.col) >= 16) |
371 | 62.1k | mode_context[ref_frame] |= (1 << GLOBALMV_OFFSET); |
372 | 99.5k | } |
373 | | |
374 | 1.53M | for (idx = 0; idx < *refmv_count; ++idx) |
375 | 1.40M | if (this_refmv.as_int == ref_mv_stack[idx].this_mv.as_int) break; |
376 | | |
377 | 707k | if (idx < *refmv_count) ref_mv_weight[idx] += 2 * weight_unit; |
378 | | |
379 | 707k | if (idx == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) { |
380 | 133k | ref_mv_stack[idx].this_mv.as_int = this_refmv.as_int; |
381 | 133k | ref_mv_weight[idx] = 2 * weight_unit; |
382 | 133k | ++(*refmv_count); |
383 | 133k | } |
384 | 707k | } else { |
385 | | // Process compound inter mode |
386 | 648k | const RefCntBuffer *const buf_1 = get_ref_frame_buf(cm, rf[1]); |
387 | 648k | const int frame1_index = buf_1->order_hint; |
388 | 648k | const int cur_offset_1 = get_relative_dist(&cm->seq_params->order_hint_info, |
389 | 648k | cur_frame_index, frame1_index); |
390 | 648k | int_mv comp_refmv; |
391 | 648k | av1_get_mv_projection(&comp_refmv.as_mv, prev_frame_mvs->mfmv0.as_mv, |
392 | 648k | cur_offset_1, prev_frame_mvs->ref_frame_offset); |
393 | 648k | lower_mv_precision(&comp_refmv.as_mv, allow_high_precision_mv, |
394 | 648k | force_integer_mv); |
395 | | |
396 | 648k | if (blk_row == 0 && blk_col == 0) { |
397 | 55.9k | if (abs(this_refmv.as_mv.row - gm_mv_candidates[0].as_mv.row) >= 16 || |
398 | 55.9k | abs(this_refmv.as_mv.col - gm_mv_candidates[0].as_mv.col) >= 16 || |
399 | 55.9k | abs(comp_refmv.as_mv.row - gm_mv_candidates[1].as_mv.row) >= 16 || |
400 | 55.9k | abs(comp_refmv.as_mv.col - gm_mv_candidates[1].as_mv.col) >= 16) |
401 | 30.7k | mode_context[ref_frame] |= (1 << GLOBALMV_OFFSET); |
402 | 55.9k | } |
403 | | |
404 | 1.25M | for (idx = 0; idx < *refmv_count; ++idx) { |
405 | 1.17M | if (this_refmv.as_int == ref_mv_stack[idx].this_mv.as_int && |
406 | 1.17M | comp_refmv.as_int == ref_mv_stack[idx].comp_mv.as_int) |
407 | 566k | break; |
408 | 1.17M | } |
409 | | |
410 | 648k | if (idx < *refmv_count) ref_mv_weight[idx] += 2 * weight_unit; |
411 | | |
412 | 648k | if (idx == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) { |
413 | 91.7k | ref_mv_stack[idx].this_mv.as_int = this_refmv.as_int; |
414 | 91.7k | ref_mv_stack[idx].comp_mv.as_int = comp_refmv.as_int; |
415 | 91.7k | ref_mv_weight[idx] = 2 * weight_unit; |
416 | 91.7k | ++(*refmv_count); |
417 | 91.7k | } |
418 | 648k | } |
419 | | |
420 | 1.35M | return 1; |
421 | 13.7M | } |
422 | | |
423 | | static inline void process_compound_ref_mv_candidate( |
424 | | const MB_MODE_INFO *const candidate, const AV1_COMMON *const cm, |
425 | | const MV_REFERENCE_FRAME *const rf, int_mv ref_id[2][2], |
426 | 774k | int ref_id_count[2], int_mv ref_diff[2][2], int ref_diff_count[2]) { |
427 | 2.32M | for (int rf_idx = 0; rf_idx < 2; ++rf_idx) { |
428 | 1.54M | MV_REFERENCE_FRAME can_rf = candidate->ref_frame[rf_idx]; |
429 | | |
430 | 4.64M | for (int cmp_idx = 0; cmp_idx < 2; ++cmp_idx) { |
431 | 3.09M | if (can_rf == rf[cmp_idx] && ref_id_count[cmp_idx] < 2) { |
432 | 827k | ref_id[cmp_idx][ref_id_count[cmp_idx]] = candidate->mv[rf_idx]; |
433 | 827k | ++ref_id_count[cmp_idx]; |
434 | 2.26M | } else if (can_rf > INTRA_FRAME && ref_diff_count[cmp_idx] < 2) { |
435 | 1.16M | int_mv this_mv = candidate->mv[rf_idx]; |
436 | 1.16M | if (cm->ref_frame_sign_bias[can_rf] != |
437 | 1.16M | cm->ref_frame_sign_bias[rf[cmp_idx]]) { |
438 | 300k | this_mv.as_mv.row = -this_mv.as_mv.row; |
439 | 300k | this_mv.as_mv.col = -this_mv.as_mv.col; |
440 | 300k | } |
441 | 1.16M | ref_diff[cmp_idx][ref_diff_count[cmp_idx]] = this_mv; |
442 | 1.16M | ++ref_diff_count[cmp_idx]; |
443 | 1.16M | } |
444 | 3.09M | } |
445 | 1.54M | } |
446 | 774k | } |
447 | | |
448 | | static inline void process_single_ref_mv_candidate( |
449 | | const MB_MODE_INFO *const candidate, const AV1_COMMON *const cm, |
450 | | MV_REFERENCE_FRAME ref_frame, uint8_t *const refmv_count, |
451 | | CANDIDATE_MV ref_mv_stack[MAX_REF_MV_STACK_SIZE], |
452 | 2.72M | uint16_t ref_mv_weight[MAX_REF_MV_STACK_SIZE]) { |
453 | 8.18M | for (int rf_idx = 0; rf_idx < 2; ++rf_idx) { |
454 | 5.45M | if (candidate->ref_frame[rf_idx] > INTRA_FRAME) { |
455 | 2.33M | int_mv this_mv = candidate->mv[rf_idx]; |
456 | 2.33M | if (cm->ref_frame_sign_bias[candidate->ref_frame[rf_idx]] != |
457 | 2.33M | cm->ref_frame_sign_bias[ref_frame]) { |
458 | 66.2k | this_mv.as_mv.row = -this_mv.as_mv.row; |
459 | 66.2k | this_mv.as_mv.col = -this_mv.as_mv.col; |
460 | 66.2k | } |
461 | 2.33M | int stack_idx; |
462 | 2.65M | for (stack_idx = 0; stack_idx < *refmv_count; ++stack_idx) { |
463 | 2.24M | const int_mv stack_mv = ref_mv_stack[stack_idx].this_mv; |
464 | 2.24M | if (this_mv.as_int == stack_mv.as_int) break; |
465 | 2.24M | } |
466 | | |
467 | 2.33M | if (stack_idx == *refmv_count) { |
468 | 408k | ref_mv_stack[stack_idx].this_mv = this_mv; |
469 | | |
470 | | // TODO(jingning): Set an arbitrary small number here. The weight |
471 | | // doesn't matter as long as it is properly initialized. |
472 | 408k | ref_mv_weight[stack_idx] = 2; |
473 | 408k | ++(*refmv_count); |
474 | 408k | } |
475 | 2.33M | } |
476 | 5.45M | } |
477 | 2.72M | } |
478 | | |
479 | | static inline void setup_ref_mv_list( |
480 | | const AV1_COMMON *cm, const MACROBLOCKD *xd, MV_REFERENCE_FRAME ref_frame, |
481 | | uint8_t *const refmv_count, |
482 | | CANDIDATE_MV ref_mv_stack[MAX_REF_MV_STACK_SIZE], |
483 | | uint16_t ref_mv_weight[MAX_REF_MV_STACK_SIZE], |
484 | | int_mv mv_ref_list[MAX_MV_REF_CANDIDATES], int_mv *gm_mv_candidates, |
485 | 3.87M | int mi_row, int mi_col, int16_t *mode_context) { |
486 | 3.87M | const int bs = AOMMAX(xd->width, xd->height); |
487 | 3.87M | const int has_tr = has_top_right(cm, xd, mi_row, mi_col, bs); |
488 | 3.87M | MV_REFERENCE_FRAME rf[2]; |
489 | | |
490 | 3.87M | const TileInfo *const tile = &xd->tile; |
491 | 3.87M | int max_row_offset = 0, max_col_offset = 0; |
492 | 3.87M | const int row_adj = (xd->height < mi_size_high[BLOCK_8X8]) && (mi_row & 0x01); |
493 | 3.87M | const int col_adj = (xd->width < mi_size_wide[BLOCK_8X8]) && (mi_col & 0x01); |
494 | 3.87M | int processed_rows = 0; |
495 | 3.87M | int processed_cols = 0; |
496 | | |
497 | 3.87M | av1_set_ref_frame(rf, ref_frame); |
498 | 3.87M | mode_context[ref_frame] = 0; |
499 | 3.87M | *refmv_count = 0; |
500 | | |
501 | | // Find valid maximum row/col offset. |
502 | 3.87M | if (xd->up_available) { |
503 | 3.65M | max_row_offset = -(MVREF_ROW_COLS << 1) + row_adj; |
504 | | |
505 | 3.65M | if (xd->height < mi_size_high[BLOCK_8X8]) |
506 | 867k | max_row_offset = -(2 << 1) + row_adj; |
507 | | |
508 | 3.65M | max_row_offset = find_valid_row_offset(tile, mi_row, max_row_offset); |
509 | 3.65M | } |
510 | | |
511 | 3.87M | if (xd->left_available) { |
512 | 3.73M | max_col_offset = -(MVREF_ROW_COLS << 1) + col_adj; |
513 | | |
514 | 3.73M | if (xd->width < mi_size_wide[BLOCK_8X8]) |
515 | 709k | max_col_offset = -(2 << 1) + col_adj; |
516 | | |
517 | 3.73M | max_col_offset = find_valid_col_offset(tile, mi_col, max_col_offset); |
518 | 3.73M | } |
519 | | |
520 | 3.87M | uint8_t col_match_count = 0; |
521 | 3.87M | uint8_t row_match_count = 0; |
522 | 3.87M | uint8_t newmv_count = 0; |
523 | | |
524 | | // Scan the first above row mode info. row_offset = -1; |
525 | 3.87M | if (abs(max_row_offset) >= 1) |
526 | 3.65M | scan_row_mbmi(cm, xd, mi_col, rf, -1, ref_mv_stack, ref_mv_weight, |
527 | 3.65M | refmv_count, &row_match_count, &newmv_count, gm_mv_candidates, |
528 | 3.65M | max_row_offset, &processed_rows); |
529 | | // Scan the first left column mode info. col_offset = -1; |
530 | 3.87M | if (abs(max_col_offset) >= 1) |
531 | 3.73M | scan_col_mbmi(cm, xd, mi_row, rf, -1, ref_mv_stack, ref_mv_weight, |
532 | 3.73M | refmv_count, &col_match_count, &newmv_count, gm_mv_candidates, |
533 | 3.73M | max_col_offset, &processed_cols); |
534 | | // Check top-right boundary |
535 | 3.87M | if (has_tr) |
536 | 2.16M | scan_blk_mbmi(cm, xd, mi_row, mi_col, rf, -1, xd->width, ref_mv_stack, |
537 | 2.16M | ref_mv_weight, &row_match_count, &newmv_count, |
538 | 2.16M | gm_mv_candidates, refmv_count); |
539 | | |
540 | 3.87M | const uint8_t nearest_match = (row_match_count > 0) + (col_match_count > 0); |
541 | 3.87M | const uint8_t nearest_refmv_count = *refmv_count; |
542 | | |
543 | | // TODO(yunqing): for comp_search, do it for all 3 cases. |
544 | 9.01M | for (int idx = 0; idx < nearest_refmv_count; ++idx) |
545 | 5.13M | ref_mv_weight[idx] += REF_CAT_LEVEL; |
546 | | |
547 | 3.87M | if (cm->features.allow_ref_frame_mvs) { |
548 | 2.87M | int is_available = 0; |
549 | 2.87M | const int voffset = AOMMAX(mi_size_high[BLOCK_8X8], xd->height); |
550 | 2.87M | const int hoffset = AOMMAX(mi_size_wide[BLOCK_8X8], xd->width); |
551 | 2.87M | const int blk_row_end = AOMMIN(xd->height, mi_size_high[BLOCK_64X64]); |
552 | 2.87M | const int blk_col_end = AOMMIN(xd->width, mi_size_wide[BLOCK_64X64]); |
553 | | |
554 | 2.87M | const int tpl_sample_pos[3][2] = { |
555 | 2.87M | { voffset, -2 }, |
556 | 2.87M | { voffset, hoffset }, |
557 | 2.87M | { voffset - 2, hoffset }, |
558 | 2.87M | }; |
559 | 2.87M | const int allow_extension = (xd->height >= mi_size_high[BLOCK_8X8]) && |
560 | 2.87M | (xd->height < mi_size_high[BLOCK_64X64]) && |
561 | 2.87M | (xd->width >= mi_size_wide[BLOCK_8X8]) && |
562 | 2.87M | (xd->width < mi_size_wide[BLOCK_64X64]); |
563 | | |
564 | 2.87M | const int step_h = (xd->height >= mi_size_high[BLOCK_64X64]) |
565 | 2.87M | ? mi_size_high[BLOCK_16X16] |
566 | 2.87M | : mi_size_high[BLOCK_8X8]; |
567 | 2.87M | const int step_w = (xd->width >= mi_size_wide[BLOCK_64X64]) |
568 | 2.87M | ? mi_size_wide[BLOCK_16X16] |
569 | 2.87M | : mi_size_wide[BLOCK_8X8]; |
570 | | |
571 | 7.81M | for (int blk_row = 0; blk_row < blk_row_end; blk_row += step_h) { |
572 | 15.5M | for (int blk_col = 0; blk_col < blk_col_end; blk_col += step_w) { |
573 | 10.6M | int ret = add_tpl_ref_mv(cm, xd, mi_row, mi_col, ref_frame, blk_row, |
574 | 10.6M | blk_col, gm_mv_candidates, refmv_count, |
575 | 10.6M | ref_mv_stack, ref_mv_weight, mode_context); |
576 | 10.6M | if (blk_row == 0 && blk_col == 0) is_available = ret; |
577 | 10.6M | } |
578 | 4.93M | } |
579 | | |
580 | 2.87M | if (is_available == 0) mode_context[ref_frame] |= (1 << GLOBALMV_OFFSET); |
581 | | |
582 | 7.90M | for (int i = 0; i < 3 && allow_extension; ++i) { |
583 | 5.02M | const int blk_row = tpl_sample_pos[i][0]; |
584 | 5.02M | const int blk_col = tpl_sample_pos[i][1]; |
585 | | |
586 | 5.02M | if (!check_sb_border(mi_row, mi_col, blk_row, blk_col)) continue; |
587 | 3.26M | add_tpl_ref_mv(cm, xd, mi_row, mi_col, ref_frame, blk_row, blk_col, |
588 | 3.26M | gm_mv_candidates, refmv_count, ref_mv_stack, ref_mv_weight, |
589 | 3.26M | mode_context); |
590 | 3.26M | } |
591 | 2.87M | } |
592 | | |
593 | 3.87M | uint8_t dummy_newmv_count = 0; |
594 | | |
595 | | // Scan the second outer area. |
596 | 3.87M | scan_blk_mbmi(cm, xd, mi_row, mi_col, rf, -1, -1, ref_mv_stack, ref_mv_weight, |
597 | 3.87M | &row_match_count, &dummy_newmv_count, gm_mv_candidates, |
598 | 3.87M | refmv_count); |
599 | | |
600 | 11.6M | for (int idx = 2; idx <= MVREF_ROW_COLS; ++idx) { |
601 | 7.75M | const int row_offset = -(idx << 1) + 1 + row_adj; |
602 | 7.75M | const int col_offset = -(idx << 1) + 1 + col_adj; |
603 | | |
604 | 7.75M | if (abs(row_offset) <= abs(max_row_offset) && |
605 | 7.75M | abs(row_offset) > processed_rows) |
606 | 4.49M | scan_row_mbmi(cm, xd, mi_col, rf, row_offset, ref_mv_stack, ref_mv_weight, |
607 | 4.49M | refmv_count, &row_match_count, &dummy_newmv_count, |
608 | 4.49M | gm_mv_candidates, max_row_offset, &processed_rows); |
609 | | |
610 | 7.75M | if (abs(col_offset) <= abs(max_col_offset) && |
611 | 7.75M | abs(col_offset) > processed_cols) |
612 | 4.54M | scan_col_mbmi(cm, xd, mi_row, rf, col_offset, ref_mv_stack, ref_mv_weight, |
613 | 4.54M | refmv_count, &col_match_count, &dummy_newmv_count, |
614 | 4.54M | gm_mv_candidates, max_col_offset, &processed_cols); |
615 | 7.75M | } |
616 | | |
617 | 3.87M | const uint8_t ref_match_count = (row_match_count > 0) + (col_match_count > 0); |
618 | | |
619 | 3.87M | switch (nearest_match) { |
620 | 528k | case 0: |
621 | 528k | if (ref_match_count >= 1) mode_context[ref_frame] |= 1; |
622 | 528k | if (ref_match_count == 1) |
623 | 101k | mode_context[ref_frame] |= (1 << REFMV_OFFSET); |
624 | 427k | else if (ref_match_count >= 2) |
625 | 19.1k | mode_context[ref_frame] |= (2 << REFMV_OFFSET); |
626 | 528k | break; |
627 | 1.13M | case 1: |
628 | 1.13M | mode_context[ref_frame] |= (newmv_count > 0) ? 2 : 3; |
629 | 1.13M | if (ref_match_count == 1) |
630 | 736k | mode_context[ref_frame] |= (3 << REFMV_OFFSET); |
631 | 396k | else if (ref_match_count >= 2) |
632 | 396k | mode_context[ref_frame] |= (4 << REFMV_OFFSET); |
633 | 1.13M | break; |
634 | 2.21M | case 2: |
635 | 2.21M | default: |
636 | 2.21M | if (newmv_count >= 1) |
637 | 1.13M | mode_context[ref_frame] |= 4; |
638 | 1.08M | else |
639 | 1.08M | mode_context[ref_frame] |= 5; |
640 | | |
641 | 2.21M | mode_context[ref_frame] |= (5 << REFMV_OFFSET); |
642 | 2.21M | break; |
643 | 3.87M | } |
644 | | |
645 | | // Rank the likelihood and assign nearest and near mvs. |
646 | 3.87M | int len = nearest_refmv_count; |
647 | 7.85M | while (len > 0) { |
648 | 3.98M | int nr_len = 0; |
649 | 6.05M | for (int idx = 1; idx < len; ++idx) { |
650 | 2.07M | if (ref_mv_weight[idx - 1] < ref_mv_weight[idx]) { |
651 | 748k | const CANDIDATE_MV tmp_mv = ref_mv_stack[idx - 1]; |
652 | 748k | const uint16_t tmp_ref_mv_weight = ref_mv_weight[idx - 1]; |
653 | 748k | ref_mv_stack[idx - 1] = ref_mv_stack[idx]; |
654 | 748k | ref_mv_stack[idx] = tmp_mv; |
655 | 748k | ref_mv_weight[idx - 1] = ref_mv_weight[idx]; |
656 | 748k | ref_mv_weight[idx] = tmp_ref_mv_weight; |
657 | 748k | nr_len = idx; |
658 | 748k | } |
659 | 2.07M | } |
660 | 3.98M | len = nr_len; |
661 | 3.98M | } |
662 | | |
663 | 3.87M | len = *refmv_count; |
664 | 6.05M | while (len > nearest_refmv_count) { |
665 | 2.17M | int nr_len = nearest_refmv_count; |
666 | 3.79M | for (int idx = nearest_refmv_count + 1; idx < len; ++idx) { |
667 | 1.62M | if (ref_mv_weight[idx - 1] < ref_mv_weight[idx]) { |
668 | 497k | const CANDIDATE_MV tmp_mv = ref_mv_stack[idx - 1]; |
669 | 497k | const uint16_t tmp_ref_mv_weight = ref_mv_weight[idx - 1]; |
670 | 497k | ref_mv_stack[idx - 1] = ref_mv_stack[idx]; |
671 | 497k | ref_mv_stack[idx] = tmp_mv; |
672 | 497k | ref_mv_weight[idx - 1] = ref_mv_weight[idx]; |
673 | 497k | ref_mv_weight[idx] = tmp_ref_mv_weight; |
674 | 497k | nr_len = idx; |
675 | 497k | } |
676 | 1.62M | } |
677 | 2.17M | len = nr_len; |
678 | 2.17M | } |
679 | | |
680 | 3.87M | int mi_width = AOMMIN(mi_size_wide[BLOCK_64X64], xd->width); |
681 | 3.87M | mi_width = AOMMIN(mi_width, cm->mi_params.mi_cols - mi_col); |
682 | 3.87M | int mi_height = AOMMIN(mi_size_high[BLOCK_64X64], xd->height); |
683 | 3.87M | mi_height = AOMMIN(mi_height, cm->mi_params.mi_rows - mi_row); |
684 | 3.87M | const int mi_size = AOMMIN(mi_width, mi_height); |
685 | 3.87M | if (rf[1] > NONE_FRAME) { |
686 | | // TODO(jingning, yunqing): Refactor and consolidate the compound and |
687 | | // single reference frame modes. Reduce unnecessary redundancy. |
688 | 607k | if (*refmv_count < MAX_MV_REF_CANDIDATES) { |
689 | 410k | int_mv ref_id[2][2], ref_diff[2][2]; |
690 | 410k | int ref_id_count[2] = { 0 }, ref_diff_count[2] = { 0 }; |
691 | | |
692 | 780k | for (int idx = 0; abs(max_row_offset) >= 1 && idx < mi_size;) { |
693 | 370k | const MB_MODE_INFO *const candidate = xd->mi[-xd->mi_stride + idx]; |
694 | 370k | process_compound_ref_mv_candidate( |
695 | 370k | candidate, cm, rf, ref_id, ref_id_count, ref_diff, ref_diff_count); |
696 | 370k | idx += mi_size_wide[candidate->bsize]; |
697 | 370k | } |
698 | | |
699 | 814k | for (int idx = 0; abs(max_col_offset) >= 1 && idx < mi_size;) { |
700 | 403k | const MB_MODE_INFO *const candidate = xd->mi[idx * xd->mi_stride - 1]; |
701 | 403k | process_compound_ref_mv_candidate( |
702 | 403k | candidate, cm, rf, ref_id, ref_id_count, ref_diff, ref_diff_count); |
703 | 403k | idx += mi_size_high[candidate->bsize]; |
704 | 403k | } |
705 | | |
706 | | // Build up the compound mv predictor |
707 | 410k | int_mv comp_list[MAX_MV_REF_CANDIDATES][2]; |
708 | | |
709 | 1.22M | for (int idx = 0; idx < 2; ++idx) { |
710 | 819k | int comp_idx = 0; |
711 | 819k | for (int list_idx = 0; |
712 | 1.64M | list_idx < ref_id_count[idx] && comp_idx < MAX_MV_REF_CANDIDATES; |
713 | 826k | ++list_idx, ++comp_idx) |
714 | 826k | comp_list[comp_idx][idx] = ref_id[idx][list_idx]; |
715 | 819k | for (int list_idx = 0; |
716 | 1.45M | list_idx < ref_diff_count[idx] && comp_idx < MAX_MV_REF_CANDIDATES; |
717 | 819k | ++list_idx, ++comp_idx) |
718 | 630k | comp_list[comp_idx][idx] = ref_diff[idx][list_idx]; |
719 | 1.00M | for (; comp_idx < MAX_MV_REF_CANDIDATES; ++comp_idx) |
720 | 181k | comp_list[comp_idx][idx] = gm_mv_candidates[idx]; |
721 | 819k | } |
722 | | |
723 | 410k | if (*refmv_count) { |
724 | 234k | assert(*refmv_count == 1); |
725 | 234k | if (comp_list[0][0].as_int == ref_mv_stack[0].this_mv.as_int && |
726 | 234k | comp_list[0][1].as_int == ref_mv_stack[0].comp_mv.as_int) { |
727 | 183k | ref_mv_stack[*refmv_count].this_mv = comp_list[1][0]; |
728 | 183k | ref_mv_stack[*refmv_count].comp_mv = comp_list[1][1]; |
729 | 183k | } else { |
730 | 50.8k | ref_mv_stack[*refmv_count].this_mv = comp_list[0][0]; |
731 | 50.8k | ref_mv_stack[*refmv_count].comp_mv = comp_list[0][1]; |
732 | 50.8k | } |
733 | 234k | ref_mv_weight[*refmv_count] = 2; |
734 | 234k | ++*refmv_count; |
735 | 234k | } else { |
736 | 527k | for (int idx = 0; idx < MAX_MV_REF_CANDIDATES; ++idx) { |
737 | 351k | ref_mv_stack[*refmv_count].this_mv = comp_list[idx][0]; |
738 | 351k | ref_mv_stack[*refmv_count].comp_mv = comp_list[idx][1]; |
739 | 351k | ref_mv_weight[*refmv_count] = 2; |
740 | 351k | ++*refmv_count; |
741 | 351k | } |
742 | 175k | } |
743 | 410k | } |
744 | | |
745 | 607k | assert(*refmv_count >= 2); |
746 | | |
747 | 2.00M | for (int idx = 0; idx < *refmv_count; ++idx) { |
748 | 1.40M | clamp_mv_ref(&ref_mv_stack[idx].this_mv.as_mv, xd->width << MI_SIZE_LOG2, |
749 | 1.40M | xd->height << MI_SIZE_LOG2, xd); |
750 | 1.40M | clamp_mv_ref(&ref_mv_stack[idx].comp_mv.as_mv, xd->width << MI_SIZE_LOG2, |
751 | 1.40M | xd->height << MI_SIZE_LOG2, xd); |
752 | 1.40M | } |
753 | 3.27M | } else { |
754 | | // Handle single reference frame extension |
755 | 4.69M | for (int idx = 0; abs(max_row_offset) >= 1 && idx < mi_size && |
756 | 4.69M | *refmv_count < MAX_MV_REF_CANDIDATES;) { |
757 | 1.42M | const MB_MODE_INFO *const candidate = xd->mi[-xd->mi_stride + idx]; |
758 | 1.42M | process_single_ref_mv_candidate(candidate, cm, ref_frame, refmv_count, |
759 | 1.42M | ref_mv_stack, ref_mv_weight); |
760 | 1.42M | idx += mi_size_wide[candidate->bsize]; |
761 | 1.42M | } |
762 | | |
763 | 4.57M | for (int idx = 0; abs(max_col_offset) >= 1 && idx < mi_size && |
764 | 4.57M | *refmv_count < MAX_MV_REF_CANDIDATES;) { |
765 | 1.30M | const MB_MODE_INFO *const candidate = xd->mi[idx * xd->mi_stride - 1]; |
766 | 1.30M | process_single_ref_mv_candidate(candidate, cm, ref_frame, refmv_count, |
767 | 1.30M | ref_mv_stack, ref_mv_weight); |
768 | 1.30M | idx += mi_size_high[candidate->bsize]; |
769 | 1.30M | } |
770 | | |
771 | 11.1M | for (int idx = 0; idx < *refmv_count; ++idx) { |
772 | 7.88M | clamp_mv_ref(&ref_mv_stack[idx].this_mv.as_mv, xd->width << MI_SIZE_LOG2, |
773 | 7.88M | xd->height << MI_SIZE_LOG2, xd); |
774 | 7.88M | } |
775 | | |
776 | 3.27M | if (mv_ref_list != NULL) { |
777 | 4.52M | for (int idx = *refmv_count; idx < MAX_MV_REF_CANDIDATES; ++idx) |
778 | 1.25M | mv_ref_list[idx].as_int = gm_mv_candidates[0].as_int; |
779 | | |
780 | 8.56M | for (int idx = 0; idx < AOMMIN(MAX_MV_REF_CANDIDATES, *refmv_count); |
781 | 5.29M | ++idx) { |
782 | 5.29M | mv_ref_list[idx].as_int = ref_mv_stack[idx].this_mv.as_int; |
783 | 5.29M | } |
784 | 3.27M | } |
785 | 3.27M | } |
786 | 3.87M | } |
787 | | |
788 | | void av1_find_mv_refs(const AV1_COMMON *cm, const MACROBLOCKD *xd, |
789 | | MB_MODE_INFO *mi, MV_REFERENCE_FRAME ref_frame, |
790 | | uint8_t ref_mv_count[MODE_CTX_REF_FRAMES], |
791 | | CANDIDATE_MV ref_mv_stack[][MAX_REF_MV_STACK_SIZE], |
792 | | uint16_t ref_mv_weight[][MAX_REF_MV_STACK_SIZE], |
793 | | int_mv mv_ref_list[][MAX_MV_REF_CANDIDATES], |
794 | 3.87M | int_mv *global_mvs, int16_t *mode_context) { |
795 | 3.87M | const int mi_row = xd->mi_row; |
796 | 3.87M | const int mi_col = xd->mi_col; |
797 | 3.87M | int_mv gm_mv[2]; |
798 | | |
799 | 3.87M | if (ref_frame == INTRA_FRAME) { |
800 | 61.3k | gm_mv[0].as_int = gm_mv[1].as_int = 0; |
801 | 61.3k | if (global_mvs != NULL) { |
802 | 0 | global_mvs[ref_frame].as_int = INVALID_MV; |
803 | 0 | } |
804 | 3.81M | } else { |
805 | 3.81M | const BLOCK_SIZE bsize = mi->bsize; |
806 | 3.81M | const int allow_high_precision_mv = cm->features.allow_high_precision_mv; |
807 | 3.81M | const int force_integer_mv = cm->features.cur_frame_force_integer_mv; |
808 | 3.81M | if (ref_frame < REF_FRAMES) { |
809 | 3.20M | gm_mv[0] = gm_get_motion_vector(&cm->global_motion[ref_frame], |
810 | 3.20M | allow_high_precision_mv, bsize, mi_col, |
811 | 3.20M | mi_row, force_integer_mv); |
812 | 3.20M | gm_mv[1].as_int = 0; |
813 | 3.20M | if (global_mvs != NULL) global_mvs[ref_frame] = gm_mv[0]; |
814 | 3.20M | } else { |
815 | 605k | MV_REFERENCE_FRAME rf[2]; |
816 | 605k | av1_set_ref_frame(rf, ref_frame); |
817 | 605k | gm_mv[0] = gm_get_motion_vector(&cm->global_motion[rf[0]], |
818 | 605k | allow_high_precision_mv, bsize, mi_col, |
819 | 605k | mi_row, force_integer_mv); |
820 | 605k | gm_mv[1] = gm_get_motion_vector(&cm->global_motion[rf[1]], |
821 | 605k | allow_high_precision_mv, bsize, mi_col, |
822 | 605k | mi_row, force_integer_mv); |
823 | 605k | } |
824 | 3.81M | } |
825 | | |
826 | 3.87M | setup_ref_mv_list(cm, xd, ref_frame, &ref_mv_count[ref_frame], |
827 | 3.87M | ref_mv_stack[ref_frame], ref_mv_weight[ref_frame], |
828 | 3.87M | mv_ref_list ? mv_ref_list[ref_frame] : NULL, gm_mv, mi_row, |
829 | 3.87M | mi_col, mode_context); |
830 | 3.87M | } |
831 | | |
832 | | void av1_find_best_ref_mvs(int allow_hp, int_mv *mvlist, int_mv *nearest_mv, |
833 | 2.41M | int_mv *near_mv, int is_integer) { |
834 | 2.41M | int i; |
835 | | // Make sure all the candidates are properly clamped etc |
836 | 7.25M | for (i = 0; i < MAX_MV_REF_CANDIDATES; ++i) { |
837 | 4.83M | lower_mv_precision(&mvlist[i].as_mv, allow_hp, is_integer); |
838 | 4.83M | } |
839 | 2.41M | *nearest_mv = mvlist[0]; |
840 | 2.41M | *near_mv = mvlist[1]; |
841 | 2.41M | } |
842 | | |
843 | 184k | void av1_setup_frame_buf_refs(AV1_COMMON *cm) { |
844 | 184k | cm->cur_frame->order_hint = cm->current_frame.order_hint; |
845 | 184k | cm->cur_frame->display_order_hint = cm->current_frame.display_order_hint; |
846 | 184k | cm->cur_frame->pyramid_level = cm->current_frame.pyramid_level; |
847 | 184k | cm->cur_frame->filter_level[0] = -1; |
848 | 184k | cm->cur_frame->filter_level[1] = -1; |
849 | 184k | MV_REFERENCE_FRAME ref_frame; |
850 | 1.47M | for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) { |
851 | 1.29M | const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame); |
852 | 1.29M | if (buf != NULL) { |
853 | 480k | cm->cur_frame->ref_order_hints[ref_frame - LAST_FRAME] = buf->order_hint; |
854 | 480k | cm->cur_frame->ref_display_order_hint[ref_frame - LAST_FRAME] = |
855 | 480k | buf->display_order_hint; |
856 | 480k | } |
857 | 1.29M | } |
858 | 184k | } |
859 | | |
860 | 184k | void av1_setup_frame_sign_bias(AV1_COMMON *cm) { |
861 | 184k | MV_REFERENCE_FRAME ref_frame; |
862 | 1.47M | for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) { |
863 | 1.29M | const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame); |
864 | 1.29M | if (cm->seq_params->order_hint_info.enable_order_hint && buf != NULL) { |
865 | 480k | const int ref_order_hint = buf->order_hint; |
866 | 480k | cm->ref_frame_sign_bias[ref_frame] = |
867 | 480k | (get_relative_dist(&cm->seq_params->order_hint_info, ref_order_hint, |
868 | 480k | (int)cm->current_frame.order_hint) <= 0) |
869 | 480k | ? 0 |
870 | 480k | : 1; |
871 | 810k | } else { |
872 | 810k | cm->ref_frame_sign_bias[ref_frame] = 0; |
873 | 810k | } |
874 | 1.29M | } |
875 | 184k | } |
876 | | |
877 | 25.9M | #define MAX_OFFSET_WIDTH 64 |
878 | 28.3M | #define MAX_OFFSET_HEIGHT 0 |
879 | | |
880 | | static int get_block_position(AV1_COMMON *cm, int *mi_r, int *mi_c, int blk_row, |
881 | 17.7M | int blk_col, MV mv, int sign_bias) { |
882 | 17.7M | const int base_blk_row = (blk_row >> 3) << 3; |
883 | 17.7M | const int base_blk_col = (blk_col >> 3) << 3; |
884 | | |
885 | 17.7M | const int row_offset = (mv.row >= 0) ? (mv.row >> (4 + MI_SIZE_LOG2)) |
886 | 17.7M | : -((-mv.row) >> (4 + MI_SIZE_LOG2)); |
887 | | |
888 | 17.7M | const int col_offset = (mv.col >= 0) ? (mv.col >> (4 + MI_SIZE_LOG2)) |
889 | 17.7M | : -((-mv.col) >> (4 + MI_SIZE_LOG2)); |
890 | | |
891 | 17.7M | const int row = |
892 | 17.7M | (sign_bias == 1) ? blk_row - row_offset : blk_row + row_offset; |
893 | 17.7M | const int col = |
894 | 17.7M | (sign_bias == 1) ? blk_col - col_offset : blk_col + col_offset; |
895 | | |
896 | 17.7M | if (row < 0 || row >= (cm->mi_params.mi_rows >> 1) || col < 0 || |
897 | 17.7M | col >= (cm->mi_params.mi_cols >> 1)) |
898 | 3.14M | return 0; |
899 | | |
900 | 14.6M | if (row < base_blk_row - (MAX_OFFSET_HEIGHT >> 3) || |
901 | 14.6M | row >= base_blk_row + 8 + (MAX_OFFSET_HEIGHT >> 3) || |
902 | 14.6M | col < base_blk_col - (MAX_OFFSET_WIDTH >> 3) || |
903 | 14.6M | col >= base_blk_col + 8 + (MAX_OFFSET_WIDTH >> 3)) |
904 | 1.84M | return 0; |
905 | | |
906 | 12.7M | *mi_r = row; |
907 | 12.7M | *mi_c = col; |
908 | | |
909 | 12.7M | return 1; |
910 | 14.6M | } |
911 | | |
912 | | // Note: motion_filed_projection finds motion vectors of current frame's |
913 | | // reference frame, and projects them to current frame. To make it clear, |
914 | | // let's call current frame's reference frame as start frame. |
915 | | // Call Start frame's reference frames as reference frames. |
916 | | // Call ref_offset as frame distances between start frame and its reference |
917 | | // frames. |
918 | | static int motion_field_projection(AV1_COMMON *cm, |
919 | 36.2k | MV_REFERENCE_FRAME start_frame, int dir) { |
920 | 36.2k | TPL_MV_REF *tpl_mvs_base = cm->tpl_mvs; |
921 | 36.2k | int ref_offset[REF_FRAMES] = { 0 }; |
922 | | |
923 | 36.2k | const RefCntBuffer *const start_frame_buf = |
924 | 36.2k | get_ref_frame_buf(cm, start_frame); |
925 | 36.2k | if (start_frame_buf == NULL) return 0; |
926 | | |
927 | 36.2k | if (start_frame_buf->frame_type == KEY_FRAME || |
928 | 36.2k | start_frame_buf->frame_type == INTRA_ONLY_FRAME) |
929 | 20.2k | return 0; |
930 | | |
931 | 16.0k | if (start_frame_buf->mi_rows != cm->mi_params.mi_rows || |
932 | 16.0k | start_frame_buf->mi_cols != cm->mi_params.mi_cols) |
933 | 29 | return 0; |
934 | | |
935 | 16.0k | const int start_frame_order_hint = start_frame_buf->order_hint; |
936 | 16.0k | const unsigned int *const ref_order_hints = |
937 | 16.0k | &start_frame_buf->ref_order_hints[0]; |
938 | 16.0k | const int cur_order_hint = cm->cur_frame->order_hint; |
939 | 16.0k | int start_to_current_frame_offset = get_relative_dist( |
940 | 16.0k | &cm->seq_params->order_hint_info, start_frame_order_hint, cur_order_hint); |
941 | | |
942 | 128k | for (MV_REFERENCE_FRAME rf = LAST_FRAME; rf <= INTER_REFS_PER_FRAME; ++rf) { |
943 | 112k | ref_offset[rf] = get_relative_dist(&cm->seq_params->order_hint_info, |
944 | 112k | start_frame_order_hint, |
945 | 112k | ref_order_hints[rf - LAST_FRAME]); |
946 | 112k | } |
947 | | |
948 | 16.0k | if (dir == 2) start_to_current_frame_offset = -start_to_current_frame_offset; |
949 | | |
950 | 16.0k | MV_REF *mv_ref_base = start_frame_buf->mvs; |
951 | 16.0k | const int mvs_rows = (cm->mi_params.mi_rows + 1) >> 1; |
952 | 16.0k | const int mvs_cols = (cm->mi_params.mi_cols + 1) >> 1; |
953 | | |
954 | 497k | for (int blk_row = 0; blk_row < mvs_rows; ++blk_row) { |
955 | 27.1M | for (int blk_col = 0; blk_col < mvs_cols; ++blk_col) { |
956 | 26.6M | MV_REF *mv_ref = &mv_ref_base[blk_row * mvs_cols + blk_col]; |
957 | 26.6M | MV fwd_mv = mv_ref->mv.as_mv; |
958 | | |
959 | 26.6M | if (mv_ref->ref_frame > INTRA_FRAME) { |
960 | 20.9M | int_mv this_mv; |
961 | 20.9M | int mi_r, mi_c; |
962 | 20.9M | const int ref_frame_offset = ref_offset[mv_ref->ref_frame]; |
963 | | |
964 | 20.9M | int pos_valid = |
965 | 20.9M | abs(ref_frame_offset) <= MAX_FRAME_DISTANCE && |
966 | 20.9M | ref_frame_offset > 0 && |
967 | 20.9M | abs(start_to_current_frame_offset) <= MAX_FRAME_DISTANCE; |
968 | | |
969 | 20.9M | if (pos_valid) { |
970 | 17.7M | av1_get_mv_projection(&this_mv.as_mv, fwd_mv, |
971 | 17.7M | start_to_current_frame_offset, |
972 | 17.7M | ref_frame_offset); |
973 | 17.7M | pos_valid = get_block_position(cm, &mi_r, &mi_c, blk_row, blk_col, |
974 | 17.7M | this_mv.as_mv, dir >> 1); |
975 | 17.7M | } |
976 | | |
977 | 20.9M | if (pos_valid) { |
978 | 12.7M | const int mi_offset = mi_r * (cm->mi_params.mi_stride >> 1) + mi_c; |
979 | | |
980 | 12.7M | tpl_mvs_base[mi_offset].mfmv0.as_mv.row = fwd_mv.row; |
981 | 12.7M | tpl_mvs_base[mi_offset].mfmv0.as_mv.col = fwd_mv.col; |
982 | 12.7M | tpl_mvs_base[mi_offset].ref_frame_offset = ref_frame_offset; |
983 | 12.7M | } |
984 | 20.9M | } |
985 | 26.6M | } |
986 | 481k | } |
987 | | |
988 | 16.0k | return 1; |
989 | 16.0k | } |
990 | | |
991 | | // cm->ref_frame_side is calculated here, and will be used in |
992 | | // av1_copy_frame_mvs() to affect how mvs are copied. |
993 | 163k | void av1_calculate_ref_frame_side(AV1_COMMON *cm) { |
994 | 163k | const OrderHintInfo *const order_hint_info = &cm->seq_params->order_hint_info; |
995 | | |
996 | 163k | memset(cm->ref_frame_side, 0, sizeof(cm->ref_frame_side)); |
997 | 163k | if (!order_hint_info->enable_order_hint) return; |
998 | | |
999 | 117k | const int cur_order_hint = cm->cur_frame->order_hint; |
1000 | | |
1001 | 937k | for (int ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ref_frame++) { |
1002 | 820k | const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame); |
1003 | 820k | int order_hint = 0; |
1004 | | |
1005 | 820k | if (buf != NULL) order_hint = buf->order_hint; |
1006 | | |
1007 | 820k | if (get_relative_dist(order_hint_info, order_hint, cur_order_hint) > 0) |
1008 | 215k | cm->ref_frame_side[ref_frame] = 1; |
1009 | 605k | else if (order_hint == cur_order_hint) |
1010 | 181k | cm->ref_frame_side[ref_frame] = -1; |
1011 | 820k | } |
1012 | 117k | } |
1013 | | |
1014 | 14.0k | void av1_setup_motion_field(AV1_COMMON *cm) { |
1015 | 14.0k | const OrderHintInfo *const order_hint_info = &cm->seq_params->order_hint_info; |
1016 | | |
1017 | 14.0k | if (!order_hint_info->enable_order_hint) return; |
1018 | | |
1019 | 14.0k | TPL_MV_REF *tpl_mvs_base = cm->tpl_mvs; |
1020 | 14.0k | int size = ((cm->mi_params.mi_rows + MAX_MIB_SIZE) >> 1) * |
1021 | 14.0k | (cm->mi_params.mi_stride >> 1); |
1022 | 49.9M | for (int idx = 0; idx < size; ++idx) { |
1023 | 49.9M | tpl_mvs_base[idx].mfmv0.as_int = INVALID_MV; |
1024 | 49.9M | tpl_mvs_base[idx].ref_frame_offset = 0; |
1025 | 49.9M | } |
1026 | | |
1027 | 14.0k | const int cur_order_hint = cm->cur_frame->order_hint; |
1028 | 14.0k | const RefCntBuffer *ref_buf[INTER_REFS_PER_FRAME]; |
1029 | 14.0k | int ref_order_hint[INTER_REFS_PER_FRAME]; |
1030 | | |
1031 | 112k | for (int ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ref_frame++) { |
1032 | 98.4k | const int ref_idx = ref_frame - LAST_FRAME; |
1033 | 98.4k | const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame); |
1034 | 98.4k | int order_hint = 0; |
1035 | | |
1036 | 98.4k | if (buf != NULL) order_hint = buf->order_hint; |
1037 | | |
1038 | 98.4k | ref_buf[ref_idx] = buf; |
1039 | 98.4k | ref_order_hint[ref_idx] = order_hint; |
1040 | 98.4k | } |
1041 | | |
1042 | 14.0k | int ref_stamp = MFMV_STACK_SIZE - 1; |
1043 | | |
1044 | 14.0k | if (ref_buf[LAST_FRAME - LAST_FRAME] != NULL) { |
1045 | 14.0k | const int alt_of_lst_order_hint = |
1046 | 14.0k | ref_buf[LAST_FRAME - LAST_FRAME] |
1047 | 14.0k | ->ref_order_hints[ALTREF_FRAME - LAST_FRAME]; |
1048 | | |
1049 | 14.0k | const int is_lst_overlay = |
1050 | 14.0k | (alt_of_lst_order_hint == ref_order_hint[GOLDEN_FRAME - LAST_FRAME]); |
1051 | 14.0k | if (!is_lst_overlay) motion_field_projection(cm, LAST_FRAME, 2); |
1052 | 14.0k | --ref_stamp; |
1053 | 14.0k | } |
1054 | | |
1055 | 14.0k | if (get_relative_dist(order_hint_info, |
1056 | 14.0k | ref_order_hint[BWDREF_FRAME - LAST_FRAME], |
1057 | 14.0k | cur_order_hint) > 0) { |
1058 | 4.28k | if (motion_field_projection(cm, BWDREF_FRAME, 0)) --ref_stamp; |
1059 | 4.28k | } |
1060 | | |
1061 | 14.0k | if (get_relative_dist(order_hint_info, |
1062 | 14.0k | ref_order_hint[ALTREF2_FRAME - LAST_FRAME], |
1063 | 14.0k | cur_order_hint) > 0) { |
1064 | 4.57k | if (motion_field_projection(cm, ALTREF2_FRAME, 0)) --ref_stamp; |
1065 | 4.57k | } |
1066 | | |
1067 | 14.0k | if (get_relative_dist(order_hint_info, |
1068 | 14.0k | ref_order_hint[ALTREF_FRAME - LAST_FRAME], |
1069 | 14.0k | cur_order_hint) > 0 && |
1070 | 14.0k | ref_stamp >= 0) |
1071 | 4.26k | if (motion_field_projection(cm, ALTREF_FRAME, 0)) --ref_stamp; |
1072 | | |
1073 | 14.0k | if (ref_stamp >= 0) motion_field_projection(cm, LAST2_FRAME, 2); |
1074 | 14.0k | } |
1075 | | |
1076 | | static inline void record_samples(const MB_MODE_INFO *mbmi, int *pts, |
1077 | | int *pts_inref, int row_offset, int sign_r, |
1078 | 4.11M | int col_offset, int sign_c) { |
1079 | 4.11M | const int bw = block_size_wide[mbmi->bsize]; |
1080 | 4.11M | const int bh = block_size_high[mbmi->bsize]; |
1081 | 4.11M | const int x = col_offset * MI_SIZE + sign_c * bw / 2 - 1; |
1082 | 4.11M | const int y = row_offset * MI_SIZE + sign_r * bh / 2 - 1; |
1083 | | |
1084 | 4.11M | pts[0] = GET_MV_SUBPEL(x); |
1085 | 4.11M | pts[1] = GET_MV_SUBPEL(y); |
1086 | 4.11M | pts_inref[0] = pts[0] + mbmi->mv[0].as_mv.col; |
1087 | 4.11M | pts_inref[1] = pts[1] + mbmi->mv[0].as_mv.row; |
1088 | 4.11M | } |
1089 | | |
1090 | | // Select samples according to the motion vector difference. |
1091 | | uint8_t av1_selectSamples(MV *mv, int *pts, int *pts_inref, int len, |
1092 | 176k | BLOCK_SIZE bsize) { |
1093 | 176k | const int bw = block_size_wide[bsize]; |
1094 | 176k | const int bh = block_size_high[bsize]; |
1095 | 176k | const int thresh = clamp(AOMMAX(bw, bh), 16, 112); |
1096 | 176k | uint8_t ret = 0; |
1097 | 176k | assert(len <= LEAST_SQUARES_SAMPLES_MAX); |
1098 | | |
1099 | | // Only keep the samples with MV differences within threshold. |
1100 | 720k | for (int i = 0; i < len; ++i) { |
1101 | 543k | const int diff = abs(pts_inref[2 * i] - pts[2 * i] - mv->col) + |
1102 | 543k | abs(pts_inref[2 * i + 1] - pts[2 * i + 1] - mv->row); |
1103 | 543k | if (diff > thresh) continue; |
1104 | 326k | if (ret != i) { |
1105 | 53.5k | memcpy(pts + 2 * ret, pts + 2 * i, 2 * sizeof(pts[0])); |
1106 | 53.5k | memcpy(pts_inref + 2 * ret, pts_inref + 2 * i, 2 * sizeof(pts_inref[0])); |
1107 | 53.5k | } |
1108 | 326k | ++ret; |
1109 | 326k | } |
1110 | | // Keep at least 1 sample. |
1111 | 176k | return AOMMAX(ret, 1); |
1112 | 176k | } |
1113 | | |
1114 | | // Note: Samples returned are at 1/8-pel precision |
1115 | | // Sample are the neighbor block center point's coordinates relative to the |
1116 | | // left-top pixel of current block. |
1117 | | uint8_t av1_findSamples(const AV1_COMMON *cm, MACROBLOCKD *xd, int *pts, |
1118 | 1.90M | int *pts_inref) { |
1119 | 1.90M | const MB_MODE_INFO *const mbmi0 = xd->mi[0]; |
1120 | 1.90M | const int ref_frame = mbmi0->ref_frame[0]; |
1121 | 1.90M | const int up_available = xd->up_available; |
1122 | 1.90M | const int left_available = xd->left_available; |
1123 | 1.90M | uint8_t np = 0; |
1124 | 1.90M | int do_tl = 1; |
1125 | 1.90M | int do_tr = 1; |
1126 | 1.90M | const int mi_stride = xd->mi_stride; |
1127 | 1.90M | const int mi_row = xd->mi_row; |
1128 | 1.90M | const int mi_col = xd->mi_col; |
1129 | | |
1130 | | // scan the nearest above rows |
1131 | 1.90M | if (up_available) { |
1132 | 1.79M | const int mi_row_offset = -1; |
1133 | 1.79M | const MB_MODE_INFO *mbmi = xd->mi[mi_row_offset * mi_stride]; |
1134 | 1.79M | uint8_t superblock_width = mi_size_wide[mbmi->bsize]; |
1135 | | |
1136 | 1.79M | if (xd->width <= superblock_width) { |
1137 | | // Handle "current block width <= above block width" case. |
1138 | 1.52M | const int col_offset = -mi_col % superblock_width; |
1139 | | |
1140 | 1.52M | if (col_offset < 0) do_tl = 0; |
1141 | 1.52M | if (col_offset + superblock_width > xd->width) do_tr = 0; |
1142 | | |
1143 | 1.52M | if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) { |
1144 | 991k | record_samples(mbmi, pts, pts_inref, 0, -1, col_offset, 1); |
1145 | 991k | pts += 2; |
1146 | 991k | pts_inref += 2; |
1147 | 991k | if (++np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX; |
1148 | 991k | } |
1149 | 1.52M | } else { |
1150 | | // Handle "current block width > above block width" case. |
1151 | 968k | for (int i = 0; i < AOMMIN(xd->width, cm->mi_params.mi_cols - mi_col); |
1152 | 692k | i += superblock_width) { |
1153 | 692k | mbmi = xd->mi[i + mi_row_offset * mi_stride]; |
1154 | 692k | superblock_width = mi_size_wide[mbmi->bsize]; |
1155 | | |
1156 | 692k | if (mbmi->ref_frame[0] == ref_frame && |
1157 | 692k | mbmi->ref_frame[1] == NONE_FRAME) { |
1158 | 448k | record_samples(mbmi, pts, pts_inref, 0, -1, i, 1); |
1159 | 448k | pts += 2; |
1160 | 448k | pts_inref += 2; |
1161 | 448k | if (++np >= LEAST_SQUARES_SAMPLES_MAX) |
1162 | 1.13k | return LEAST_SQUARES_SAMPLES_MAX; |
1163 | 448k | } |
1164 | 692k | } |
1165 | 276k | } |
1166 | 1.79M | } |
1167 | 1.89M | assert(np <= LEAST_SQUARES_SAMPLES_MAX); |
1168 | | |
1169 | | // scan the nearest left columns |
1170 | 1.89M | if (left_available) { |
1171 | 1.82M | const int mi_col_offset = -1; |
1172 | 1.82M | const MB_MODE_INFO *mbmi = xd->mi[mi_col_offset]; |
1173 | 1.82M | uint8_t superblock_height = mi_size_high[mbmi->bsize]; |
1174 | | |
1175 | 1.82M | if (xd->height <= superblock_height) { |
1176 | | // Handle "current block height <= above block height" case. |
1177 | 1.52M | const int row_offset = -mi_row % superblock_height; |
1178 | | |
1179 | 1.52M | if (row_offset < 0) do_tl = 0; |
1180 | | |
1181 | 1.52M | if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) { |
1182 | 986k | record_samples(mbmi, pts, pts_inref, row_offset, 1, 0, -1); |
1183 | 986k | pts += 2; |
1184 | 986k | pts_inref += 2; |
1185 | 986k | np++; |
1186 | 986k | if (np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX; |
1187 | 986k | } |
1188 | 1.52M | } else { |
1189 | | // Handle "current block height > above block height" case. |
1190 | 1.06M | for (int i = 0; i < AOMMIN(xd->height, cm->mi_params.mi_rows - mi_row); |
1191 | 761k | i += superblock_height) { |
1192 | 761k | mbmi = xd->mi[mi_col_offset + i * mi_stride]; |
1193 | 761k | superblock_height = mi_size_high[mbmi->bsize]; |
1194 | | |
1195 | 761k | if (mbmi->ref_frame[0] == ref_frame && |
1196 | 761k | mbmi->ref_frame[1] == NONE_FRAME) { |
1197 | 509k | record_samples(mbmi, pts, pts_inref, i, 1, 0, -1); |
1198 | 509k | pts += 2; |
1199 | 509k | pts_inref += 2; |
1200 | 509k | if (++np >= LEAST_SQUARES_SAMPLES_MAX) |
1201 | 4.01k | return LEAST_SQUARES_SAMPLES_MAX; |
1202 | 509k | } |
1203 | 761k | } |
1204 | 305k | } |
1205 | 1.82M | } |
1206 | 1.89M | assert(np <= LEAST_SQUARES_SAMPLES_MAX); |
1207 | | |
1208 | | // Top-left block |
1209 | 1.89M | if (do_tl && left_available && up_available) { |
1210 | 1.19M | const int mi_row_offset = -1; |
1211 | 1.19M | const int mi_col_offset = -1; |
1212 | 1.19M | MB_MODE_INFO *mbmi = xd->mi[mi_col_offset + mi_row_offset * mi_stride]; |
1213 | | |
1214 | 1.19M | if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) { |
1215 | 739k | record_samples(mbmi, pts, pts_inref, 0, -1, 0, -1); |
1216 | 739k | pts += 2; |
1217 | 739k | pts_inref += 2; |
1218 | 739k | if (++np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX; |
1219 | 739k | } |
1220 | 1.19M | } |
1221 | 1.89M | assert(np <= LEAST_SQUARES_SAMPLES_MAX); |
1222 | | |
1223 | | // Top-right block |
1224 | 1.89M | if (do_tr && |
1225 | 1.89M | has_top_right(cm, xd, mi_row, mi_col, AOMMAX(xd->width, xd->height))) { |
1226 | 822k | const POSITION trb_pos = { -1, xd->width }; |
1227 | 822k | const TileInfo *const tile = &xd->tile; |
1228 | 822k | if (is_inside(tile, mi_col, mi_row, &trb_pos)) { |
1229 | 737k | const int mi_row_offset = -1; |
1230 | 737k | const int mi_col_offset = xd->width; |
1231 | 737k | const MB_MODE_INFO *mbmi = |
1232 | 737k | xd->mi[mi_col_offset + mi_row_offset * mi_stride]; |
1233 | | |
1234 | 737k | if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) { |
1235 | 435k | record_samples(mbmi, pts, pts_inref, 0, -1, xd->width, 1); |
1236 | 435k | if (++np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX; |
1237 | 435k | } |
1238 | 737k | } |
1239 | 822k | } |
1240 | 1.88M | assert(np <= LEAST_SQUARES_SAMPLES_MAX); |
1241 | | |
1242 | 1.88M | return np; |
1243 | 1.88M | } |
1244 | | |
1245 | 168k | void av1_setup_skip_mode_allowed(AV1_COMMON *cm) { |
1246 | 168k | const OrderHintInfo *const order_hint_info = &cm->seq_params->order_hint_info; |
1247 | 168k | SkipModeInfo *const skip_mode_info = &cm->current_frame.skip_mode_info; |
1248 | | |
1249 | 168k | skip_mode_info->skip_mode_allowed = 0; |
1250 | 168k | skip_mode_info->ref_frame_idx_0 = INVALID_IDX; |
1251 | 168k | skip_mode_info->ref_frame_idx_1 = INVALID_IDX; |
1252 | | |
1253 | 168k | if (!order_hint_info->enable_order_hint || frame_is_intra_only(cm) || |
1254 | 168k | cm->current_frame.reference_mode == SINGLE_REFERENCE) |
1255 | 142k | return; |
1256 | | |
1257 | 26.3k | const int cur_order_hint = cm->current_frame.order_hint; |
1258 | 26.3k | int ref_order_hints[2] = { -1, INT_MAX }; |
1259 | 26.3k | int ref_idx[2] = { INVALID_IDX, INVALID_IDX }; |
1260 | | |
1261 | | // Identify the nearest forward and backward references. |
1262 | 211k | for (int i = 0; i < INTER_REFS_PER_FRAME; ++i) { |
1263 | 184k | const RefCntBuffer *const buf = get_ref_frame_buf(cm, LAST_FRAME + i); |
1264 | 184k | if (buf == NULL) continue; |
1265 | | |
1266 | 184k | const int ref_order_hint = buf->order_hint; |
1267 | 184k | if (get_relative_dist(order_hint_info, ref_order_hint, cur_order_hint) < |
1268 | 184k | 0) { |
1269 | | // Forward reference |
1270 | 132k | if (ref_order_hints[0] == -1 || |
1271 | 132k | get_relative_dist(order_hint_info, ref_order_hint, |
1272 | 106k | ref_order_hints[0]) > 0) { |
1273 | 43.4k | ref_order_hints[0] = ref_order_hint; |
1274 | 43.4k | ref_idx[0] = i; |
1275 | 43.4k | } |
1276 | 132k | } else if (get_relative_dist(order_hint_info, ref_order_hint, |
1277 | 52.5k | cur_order_hint) > 0) { |
1278 | | // Backward reference |
1279 | 23.8k | if (ref_order_hints[1] == INT_MAX || |
1280 | 23.8k | get_relative_dist(order_hint_info, ref_order_hint, |
1281 | 12.8k | ref_order_hints[1]) < 0) { |
1282 | 12.3k | ref_order_hints[1] = ref_order_hint; |
1283 | 12.3k | ref_idx[1] = i; |
1284 | 12.3k | } |
1285 | 23.8k | } |
1286 | 184k | } |
1287 | | |
1288 | 26.3k | if (ref_idx[0] != INVALID_IDX && ref_idx[1] != INVALID_IDX) { |
1289 | | // == Bi-directional prediction == |
1290 | 10.3k | skip_mode_info->skip_mode_allowed = 1; |
1291 | 10.3k | skip_mode_info->ref_frame_idx_0 = AOMMIN(ref_idx[0], ref_idx[1]); |
1292 | 10.3k | skip_mode_info->ref_frame_idx_1 = AOMMAX(ref_idx[0], ref_idx[1]); |
1293 | 16.0k | } else if (ref_idx[0] != INVALID_IDX && ref_idx[1] == INVALID_IDX) { |
1294 | | // == Forward prediction only == |
1295 | | // Identify the second nearest forward reference. |
1296 | 15.2k | ref_order_hints[1] = -1; |
1297 | 122k | for (int i = 0; i < INTER_REFS_PER_FRAME; ++i) { |
1298 | 106k | const RefCntBuffer *const buf = get_ref_frame_buf(cm, LAST_FRAME + i); |
1299 | 106k | if (buf == NULL) continue; |
1300 | | |
1301 | 106k | const int ref_order_hint = buf->order_hint; |
1302 | 106k | if ((ref_order_hints[0] != -1 && |
1303 | 106k | get_relative_dist(order_hint_info, ref_order_hint, |
1304 | 106k | ref_order_hints[0]) < 0) && |
1305 | 106k | (ref_order_hints[1] == -1 || |
1306 | 34.1k | get_relative_dist(order_hint_info, ref_order_hint, |
1307 | 20.8k | ref_order_hints[1]) > 0)) { |
1308 | | // Second closest forward reference |
1309 | 18.4k | ref_order_hints[1] = ref_order_hint; |
1310 | 18.4k | ref_idx[1] = i; |
1311 | 18.4k | } |
1312 | 106k | } |
1313 | 15.2k | if (ref_order_hints[1] != -1) { |
1314 | 13.3k | skip_mode_info->skip_mode_allowed = 1; |
1315 | 13.3k | skip_mode_info->ref_frame_idx_0 = AOMMIN(ref_idx[0], ref_idx[1]); |
1316 | 13.3k | skip_mode_info->ref_frame_idx_1 = AOMMAX(ref_idx[0], ref_idx[1]); |
1317 | 13.3k | } |
1318 | 15.2k | } |
1319 | 26.3k | } |
1320 | | |
1321 | | typedef struct { |
1322 | | int map_idx; // frame map index |
1323 | | RefCntBuffer *buf; // frame buffer |
1324 | | int sort_idx; // index based on the offset to be used for sorting |
1325 | | } REF_FRAME_INFO; |
1326 | | |
1327 | | // Compares the sort_idx fields. If they are equal, then compares the map_idx |
1328 | | // fields to break the tie. This ensures a stable sort. |
1329 | 421k | static int compare_ref_frame_info(const void *arg_a, const void *arg_b) { |
1330 | 421k | const REF_FRAME_INFO *info_a = (REF_FRAME_INFO *)arg_a; |
1331 | 421k | const REF_FRAME_INFO *info_b = (REF_FRAME_INFO *)arg_b; |
1332 | | |
1333 | 421k | const int sort_idx_diff = info_a->sort_idx - info_b->sort_idx; |
1334 | 421k | if (sort_idx_diff != 0) return sort_idx_diff; |
1335 | 138k | return info_a->map_idx - info_b->map_idx; |
1336 | 421k | } |
1337 | | |
1338 | | static inline void set_ref_frame_info(int *remapped_ref_idx, int frame_idx, |
1339 | 193k | REF_FRAME_INFO *ref_info) { |
1340 | 193k | assert(frame_idx >= 0 && frame_idx < INTER_REFS_PER_FRAME); |
1341 | | |
1342 | 193k | remapped_ref_idx[frame_idx] = ref_info->map_idx; |
1343 | 193k | } |
1344 | | |
1345 | | void av1_set_frame_refs(AV1_COMMON *const cm, int *remapped_ref_idx, |
1346 | 28.0k | int lst_map_idx, int gld_map_idx) { |
1347 | 28.0k | int lst_frame_sort_idx = -1; |
1348 | 28.0k | int gld_frame_sort_idx = -1; |
1349 | | |
1350 | 28.0k | assert(cm->seq_params->order_hint_info.enable_order_hint); |
1351 | 28.0k | assert(cm->seq_params->order_hint_info.order_hint_bits_minus_1 >= 0); |
1352 | 28.0k | const int cur_order_hint = (int)cm->current_frame.order_hint; |
1353 | 28.0k | const int cur_frame_sort_idx = |
1354 | 28.0k | 1 << cm->seq_params->order_hint_info.order_hint_bits_minus_1; |
1355 | | |
1356 | 28.0k | REF_FRAME_INFO ref_frame_info[REF_FRAMES]; |
1357 | 28.0k | int ref_flag_list[INTER_REFS_PER_FRAME] = { 0, 0, 0, 0, 0, 0, 0 }; |
1358 | | |
1359 | 252k | for (int i = 0; i < REF_FRAMES; ++i) { |
1360 | 224k | const int map_idx = i; |
1361 | | |
1362 | 224k | ref_frame_info[i].map_idx = map_idx; |
1363 | 224k | ref_frame_info[i].sort_idx = -1; |
1364 | | |
1365 | 224k | RefCntBuffer *const buf = cm->ref_frame_map[map_idx]; |
1366 | 224k | ref_frame_info[i].buf = buf; |
1367 | | |
1368 | 224k | if (buf == NULL) continue; |
1369 | | // If this assertion fails, there is a reference leak. |
1370 | 209k | assert(buf->ref_count > 0); |
1371 | | |
1372 | 209k | const int offset = (int)buf->order_hint; |
1373 | 209k | ref_frame_info[i].sort_idx = |
1374 | 209k | (offset == -1) ? -1 |
1375 | 209k | : cur_frame_sort_idx + |
1376 | 209k | get_relative_dist(&cm->seq_params->order_hint_info, |
1377 | 209k | offset, cur_order_hint); |
1378 | 209k | assert(ref_frame_info[i].sort_idx >= -1); |
1379 | | |
1380 | 209k | if (map_idx == lst_map_idx) lst_frame_sort_idx = ref_frame_info[i].sort_idx; |
1381 | 209k | if (map_idx == gld_map_idx) gld_frame_sort_idx = ref_frame_info[i].sort_idx; |
1382 | 209k | } |
1383 | | |
1384 | | // Confirm both LAST_FRAME and GOLDEN_FRAME are valid forward reference |
1385 | | // frames. |
1386 | 28.0k | if (lst_frame_sort_idx == -1 || lst_frame_sort_idx >= cur_frame_sort_idx) { |
1387 | 281 | aom_internal_error(cm->error, AOM_CODEC_CORRUPT_FRAME, |
1388 | 281 | "Inter frame requests a look-ahead frame as LAST"); |
1389 | 281 | } |
1390 | 28.0k | if (gld_frame_sort_idx == -1 || gld_frame_sort_idx >= cur_frame_sort_idx) { |
1391 | 223 | aom_internal_error(cm->error, AOM_CODEC_CORRUPT_FRAME, |
1392 | 223 | "Inter frame requests a look-ahead frame as GOLDEN"); |
1393 | 223 | } |
1394 | | |
1395 | | // Sort ref frames based on their frame_offset values. |
1396 | 28.0k | qsort(ref_frame_info, REF_FRAMES, sizeof(REF_FRAME_INFO), |
1397 | 28.0k | compare_ref_frame_info); |
1398 | | |
1399 | | // Identify forward and backward reference frames. |
1400 | | // Forward reference: offset < order_hint |
1401 | | // Backward reference: offset >= order_hint |
1402 | 28.0k | int fwd_start_idx = 0, fwd_end_idx = REF_FRAMES - 1; |
1403 | | |
1404 | 195k | for (int i = 0; i < REF_FRAMES; i++) { |
1405 | 190k | if (ref_frame_info[i].sort_idx == -1) { |
1406 | 14.7k | fwd_start_idx++; |
1407 | 14.7k | continue; |
1408 | 14.7k | } |
1409 | | |
1410 | 175k | if (ref_frame_info[i].sort_idx >= cur_frame_sort_idx) { |
1411 | 23.2k | fwd_end_idx = i - 1; |
1412 | 23.2k | break; |
1413 | 23.2k | } |
1414 | 175k | } |
1415 | | |
1416 | 28.0k | int bwd_start_idx = fwd_end_idx + 1; |
1417 | 28.0k | int bwd_end_idx = REF_FRAMES - 1; |
1418 | | |
1419 | | // === Backward Reference Frames === |
1420 | | |
1421 | | // == ALTREF_FRAME == |
1422 | 28.0k | if (bwd_start_idx <= bwd_end_idx) { |
1423 | 23.2k | set_ref_frame_info(remapped_ref_idx, ALTREF_FRAME - LAST_FRAME, |
1424 | 23.2k | &ref_frame_info[bwd_end_idx]); |
1425 | 23.2k | ref_flag_list[ALTREF_FRAME - LAST_FRAME] = 1; |
1426 | 23.2k | bwd_end_idx--; |
1427 | 23.2k | } |
1428 | | |
1429 | | // == BWDREF_FRAME == |
1430 | 28.0k | if (bwd_start_idx <= bwd_end_idx) { |
1431 | 14.6k | set_ref_frame_info(remapped_ref_idx, BWDREF_FRAME - LAST_FRAME, |
1432 | 14.6k | &ref_frame_info[bwd_start_idx]); |
1433 | 14.6k | ref_flag_list[BWDREF_FRAME - LAST_FRAME] = 1; |
1434 | 14.6k | bwd_start_idx++; |
1435 | 14.6k | } |
1436 | | |
1437 | | // == ALTREF2_FRAME == |
1438 | 28.0k | if (bwd_start_idx <= bwd_end_idx) { |
1439 | 8.20k | set_ref_frame_info(remapped_ref_idx, ALTREF2_FRAME - LAST_FRAME, |
1440 | 8.20k | &ref_frame_info[bwd_start_idx]); |
1441 | 8.20k | ref_flag_list[ALTREF2_FRAME - LAST_FRAME] = 1; |
1442 | 8.20k | } |
1443 | | |
1444 | | // === Forward Reference Frames === |
1445 | | |
1446 | 180k | for (int i = fwd_start_idx; i <= fwd_end_idx; ++i) { |
1447 | | // == LAST_FRAME == |
1448 | 152k | if (ref_frame_info[i].map_idx == lst_map_idx) { |
1449 | 27.5k | set_ref_frame_info(remapped_ref_idx, LAST_FRAME - LAST_FRAME, |
1450 | 27.5k | &ref_frame_info[i]); |
1451 | 27.5k | ref_flag_list[LAST_FRAME - LAST_FRAME] = 1; |
1452 | 27.5k | } |
1453 | | |
1454 | | // == GOLDEN_FRAME == |
1455 | 152k | if (ref_frame_info[i].map_idx == gld_map_idx) { |
1456 | 27.5k | set_ref_frame_info(remapped_ref_idx, GOLDEN_FRAME - LAST_FRAME, |
1457 | 27.5k | &ref_frame_info[i]); |
1458 | 27.5k | ref_flag_list[GOLDEN_FRAME - LAST_FRAME] = 1; |
1459 | 27.5k | } |
1460 | 152k | } |
1461 | | |
1462 | 28.0k | assert(ref_flag_list[LAST_FRAME - LAST_FRAME] == 1 && |
1463 | 28.0k | ref_flag_list[GOLDEN_FRAME - LAST_FRAME] == 1); |
1464 | | |
1465 | | // == LAST2_FRAME == |
1466 | | // == LAST3_FRAME == |
1467 | | // == BWDREF_FRAME == |
1468 | | // == ALTREF2_FRAME == |
1469 | | // == ALTREF_FRAME == |
1470 | | |
1471 | | // Set up the reference frames in the anti-chronological order. |
1472 | 27.5k | static const MV_REFERENCE_FRAME ref_frame_list[INTER_REFS_PER_FRAME - 2] = { |
1473 | 27.5k | LAST2_FRAME, LAST3_FRAME, BWDREF_FRAME, ALTREF2_FRAME, ALTREF_FRAME |
1474 | 27.5k | }; |
1475 | | |
1476 | 27.5k | int ref_idx; |
1477 | 141k | for (ref_idx = 0; ref_idx < (INTER_REFS_PER_FRAME - 2); ref_idx++) { |
1478 | 120k | const MV_REFERENCE_FRAME ref_frame = ref_frame_list[ref_idx]; |
1479 | | |
1480 | 120k | if (ref_flag_list[ref_frame - LAST_FRAME] == 1) continue; |
1481 | | |
1482 | 115k | while (fwd_start_idx <= fwd_end_idx && |
1483 | 115k | (ref_frame_info[fwd_end_idx].map_idx == lst_map_idx || |
1484 | 108k | ref_frame_info[fwd_end_idx].map_idx == gld_map_idx)) { |
1485 | 28.6k | fwd_end_idx--; |
1486 | 28.6k | } |
1487 | 86.4k | if (fwd_start_idx > fwd_end_idx) break; |
1488 | | |
1489 | 79.6k | set_ref_frame_info(remapped_ref_idx, ref_frame - LAST_FRAME, |
1490 | 79.6k | &ref_frame_info[fwd_end_idx]); |
1491 | 79.6k | ref_flag_list[ref_frame - LAST_FRAME] = 1; |
1492 | | |
1493 | 79.6k | fwd_end_idx--; |
1494 | 79.6k | } |
1495 | | |
1496 | | // Assign all the remaining frame(s), if any, to the earliest reference |
1497 | | // frame. |
1498 | 51.7k | for (; ref_idx < (INTER_REFS_PER_FRAME - 2); ref_idx++) { |
1499 | 24.1k | const MV_REFERENCE_FRAME ref_frame = ref_frame_list[ref_idx]; |
1500 | 24.1k | if (ref_flag_list[ref_frame - LAST_FRAME] == 1) continue; |
1501 | 12.1k | set_ref_frame_info(remapped_ref_idx, ref_frame - LAST_FRAME, |
1502 | 12.1k | &ref_frame_info[fwd_start_idx]); |
1503 | 12.1k | ref_flag_list[ref_frame - LAST_FRAME] = 1; |
1504 | 12.1k | } |
1505 | | |
1506 | 220k | for (int i = 0; i < INTER_REFS_PER_FRAME; i++) { |
1507 | 193k | assert(ref_flag_list[i] == 1); |
1508 | 193k | } |
1509 | 27.5k | } |