Coverage Report

Created: 2025-12-31 06:49

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/aom/av1/common/mvref_common.c
Line
Count
Source
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#include <stdlib.h>
13
14
#include "av1/common/mvref_common.h"
15
#include "av1/common/warped_motion.h"
16
17
// Although we assign 32 bit integers, all the values are strictly under 14
18
// bits.
19
static const int div_mult[32] = { 0,    16384, 8192, 5461, 4096, 3276, 2730,
20
                                  2340, 2048,  1820, 1638, 1489, 1365, 1260,
21
                                  1170, 1092,  1024, 963,  910,  862,  819,
22
                                  780,  744,   712,  682,  655,  630,  606,
23
                                  585,  564,   546,  528 };
24
25
// TODO(jingning): Consider the use of lookup table for (num / den)
26
// altogether.
27
8.94M
void av1_get_mv_projection(MV *output, MV ref, int num, int den) {
28
8.94M
  den = AOMMIN(den, MAX_FRAME_DISTANCE);
29
8.94M
  num = num > 0 ? AOMMIN(num, MAX_FRAME_DISTANCE)
30
8.94M
                : AOMMAX(num, -MAX_FRAME_DISTANCE);
31
8.94M
  const int mv_row =
32
8.94M
      ROUND_POWER_OF_TWO_SIGNED(ref.row * num * div_mult[den], 14);
33
8.94M
  const int mv_col =
34
8.94M
      ROUND_POWER_OF_TWO_SIGNED(ref.col * num * div_mult[den], 14);
35
8.94M
  const int clamp_max = MV_UPP - 1;
36
8.94M
  const int clamp_min = MV_LOW + 1;
37
8.94M
  output->row = (int16_t)clamp(mv_row, clamp_min, clamp_max);
38
8.94M
  output->col = (int16_t)clamp(mv_col, clamp_min, clamp_max);
39
8.94M
}
40
41
void av1_copy_frame_mvs(const AV1_COMMON *const cm,
42
                        const MB_MODE_INFO *const mi, int mi_row, int mi_col,
43
4.30M
                        int x_mis, int y_mis) {
44
4.30M
  const int frame_mvs_stride = ROUND_POWER_OF_TWO(cm->mi_params.mi_cols, 1);
45
4.30M
  MV_REF *frame_mvs =
46
4.30M
      cm->cur_frame->mvs + (mi_row >> 1) * frame_mvs_stride + (mi_col >> 1);
47
4.30M
  x_mis = ROUND_POWER_OF_TWO(x_mis, 1);
48
4.30M
  y_mis = ROUND_POWER_OF_TWO(y_mis, 1);
49
4.30M
  int w, h;
50
51
12.6M
  for (h = 0; h < y_mis; h++) {
52
8.32M
    MV_REF *mv = frame_mvs;
53
41.1M
    for (w = 0; w < x_mis; w++) {
54
32.8M
      mv->ref_frame = NONE_FRAME;
55
32.8M
      mv->mv.as_int = 0;
56
57
98.4M
      for (int idx = 0; idx < 2; ++idx) {
58
65.6M
        MV_REFERENCE_FRAME ref_frame = mi->ref_frame[idx];
59
65.6M
        if (ref_frame > INTRA_FRAME) {
60
39.9M
          int8_t ref_idx = cm->ref_frame_side[ref_frame];
61
39.9M
          if (ref_idx) continue;
62
33.9M
          if ((abs(mi->mv[idx].as_mv.row) > REFMVS_LIMIT) ||
63
32.6M
              (abs(mi->mv[idx].as_mv.col) > REFMVS_LIMIT))
64
2.19M
            continue;
65
31.8M
          mv->ref_frame = ref_frame;
66
31.8M
          mv->mv.as_int = mi->mv[idx].as_int;
67
31.8M
        }
68
65.6M
      }
69
32.8M
      mv++;
70
32.8M
    }
71
8.32M
    frame_mvs += frame_mvs_stride;
72
8.32M
  }
73
4.30M
}
74
75
static inline void add_ref_mv_candidate(
76
    const MB_MODE_INFO *const candidate, const MV_REFERENCE_FRAME rf[2],
77
    uint8_t *refmv_count, uint8_t *ref_match_count, uint8_t *newmv_count,
78
    CANDIDATE_MV *ref_mv_stack, uint16_t *ref_mv_weight,
79
    int_mv *gm_mv_candidates, const WarpedMotionParams *gm_params,
80
20.4M
    uint16_t weight) {
81
20.4M
  if (!is_inter_block(candidate)) return;
82
20.4M
  assert(weight % 2 == 0);
83
17.3M
  int index, ref;
84
85
17.3M
  if (rf[1] == NONE_FRAME) {
86
    // single reference frame
87
46.9M
    for (ref = 0; ref < 2; ++ref) {
88
31.3M
      if (candidate->ref_frame[ref] == rf[0]) {
89
13.2M
        const int is_gm_block =
90
13.2M
            is_global_mv_block(candidate, gm_params[rf[0]].wmtype);
91
13.2M
        const int_mv this_refmv =
92
13.2M
            is_gm_block ? gm_mv_candidates[0] : get_block_mv(candidate, ref);
93
27.0M
        for (index = 0; index < *refmv_count; ++index) {
94
19.7M
          if (ref_mv_stack[index].this_mv.as_int == this_refmv.as_int) {
95
5.85M
            ref_mv_weight[index] += weight;
96
5.85M
            break;
97
5.85M
          }
98
19.7M
        }
99
100
        // Add a new item to the list.
101
13.2M
        if (index == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) {
102
7.29M
          ref_mv_stack[index].this_mv = this_refmv;
103
7.29M
          ref_mv_weight[index] = weight;
104
7.29M
          ++(*refmv_count);
105
7.29M
        }
106
13.2M
        if (have_newmv_in_inter_mode(candidate->mode)) ++*newmv_count;
107
13.2M
        ++*ref_match_count;
108
13.2M
      }
109
31.3M
    }
110
15.6M
  } else {
111
    // compound reference frame
112
1.69M
    if (candidate->ref_frame[0] == rf[0] && candidate->ref_frame[1] == rf[1]) {
113
592k
      int_mv this_refmv[2];
114
115
1.77M
      for (ref = 0; ref < 2; ++ref) {
116
1.18M
        if (is_global_mv_block(candidate, gm_params[rf[ref]].wmtype))
117
24.7k
          this_refmv[ref] = gm_mv_candidates[ref];
118
1.15M
        else
119
1.15M
          this_refmv[ref] = get_block_mv(candidate, ref);
120
1.18M
      }
121
122
857k
      for (index = 0; index < *refmv_count; ++index) {
123
505k
        if ((ref_mv_stack[index].this_mv.as_int == this_refmv[0].as_int) &&
124
275k
            (ref_mv_stack[index].comp_mv.as_int == this_refmv[1].as_int)) {
125
241k
          ref_mv_weight[index] += weight;
126
241k
          break;
127
241k
        }
128
505k
      }
129
130
      // Add a new item to the list.
131
592k
      if (index == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) {
132
350k
        ref_mv_stack[index].this_mv = this_refmv[0];
133
350k
        ref_mv_stack[index].comp_mv = this_refmv[1];
134
350k
        ref_mv_weight[index] = weight;
135
350k
        ++(*refmv_count);
136
350k
      }
137
592k
      if (have_newmv_in_inter_mode(candidate->mode)) ++*newmv_count;
138
592k
      ++*ref_match_count;
139
592k
    }
140
1.69M
  }
141
17.3M
}
142
143
static inline void scan_row_mbmi(const AV1_COMMON *cm, const MACROBLOCKD *xd,
144
                                 int mi_col, const MV_REFERENCE_FRAME rf[2],
145
                                 int row_offset, CANDIDATE_MV *ref_mv_stack,
146
                                 uint16_t *ref_mv_weight, uint8_t *refmv_count,
147
                                 uint8_t *ref_match_count, uint8_t *newmv_count,
148
                                 int_mv *gm_mv_candidates, int max_row_offset,
149
6.78M
                                 int *processed_rows) {
150
6.78M
  int end_mi = AOMMIN(xd->width, cm->mi_params.mi_cols - mi_col);
151
6.78M
  end_mi = AOMMIN(end_mi, mi_size_wide[BLOCK_64X64]);
152
6.78M
  const int width_8x8 = mi_size_wide[BLOCK_8X8];
153
6.78M
  const int width_16x16 = mi_size_wide[BLOCK_16X16];
154
6.78M
  int col_offset = 0;
155
  // TODO(jingning): Revisit this part after cb4x4 is stable.
156
6.78M
  if (abs(row_offset) > 1) {
157
3.81M
    col_offset = 1;
158
3.81M
    if ((mi_col & 0x01) && xd->width < width_8x8) --col_offset;
159
3.81M
  }
160
6.78M
  const int use_step_16 = (xd->width >= 16);
161
6.78M
  MB_MODE_INFO **const candidate_mi0 = xd->mi + row_offset * xd->mi_stride;
162
163
14.6M
  for (int i = 0; i < end_mi;) {
164
7.91M
    const MB_MODE_INFO *const candidate = candidate_mi0[col_offset + i];
165
7.91M
    const int candidate_bsize = candidate->bsize;
166
7.91M
    const int n4_w = mi_size_wide[candidate_bsize];
167
7.91M
    int len = AOMMIN(xd->width, n4_w);
168
7.91M
    if (use_step_16)
169
288k
      len = AOMMAX(width_16x16, len);
170
7.62M
    else if (abs(row_offset) > 1)
171
4.33M
      len = AOMMAX(len, width_8x8);
172
173
7.91M
    uint16_t weight = 2;
174
7.91M
    if (xd->width >= width_8x8 && xd->width <= n4_w) {
175
4.09M
      uint16_t inc = AOMMIN(-max_row_offset + row_offset + 1,
176
4.09M
                            mi_size_high[candidate_bsize]);
177
      // Obtain range used in weight calculation.
178
4.09M
      weight = AOMMAX(weight, inc);
179
      // Update processed rows.
180
4.09M
      *processed_rows = inc - row_offset - 1;
181
4.09M
    }
182
183
7.91M
    add_ref_mv_candidate(candidate, rf, refmv_count, ref_match_count,
184
7.91M
                         newmv_count, ref_mv_stack, ref_mv_weight,
185
7.91M
                         gm_mv_candidates, cm->global_motion, len * weight);
186
187
7.91M
    i += len;
188
7.91M
  }
189
6.78M
}
190
191
static inline void scan_col_mbmi(const AV1_COMMON *cm, const MACROBLOCKD *xd,
192
                                 int mi_row, const MV_REFERENCE_FRAME rf[2],
193
                                 int col_offset, CANDIDATE_MV *ref_mv_stack,
194
                                 uint16_t *ref_mv_weight, uint8_t *refmv_count,
195
                                 uint8_t *ref_match_count, uint8_t *newmv_count,
196
                                 int_mv *gm_mv_candidates, int max_col_offset,
197
6.82M
                                 int *processed_cols) {
198
6.82M
  int end_mi = AOMMIN(xd->height, cm->mi_params.mi_rows - mi_row);
199
6.82M
  end_mi = AOMMIN(end_mi, mi_size_high[BLOCK_64X64]);
200
6.82M
  const int n8_h_8 = mi_size_high[BLOCK_8X8];
201
6.82M
  const int n8_h_16 = mi_size_high[BLOCK_16X16];
202
6.82M
  int i;
203
6.82M
  int row_offset = 0;
204
6.82M
  if (abs(col_offset) > 1) {
205
3.82M
    row_offset = 1;
206
3.82M
    if ((mi_row & 0x01) && xd->height < n8_h_8) --row_offset;
207
3.82M
  }
208
6.82M
  const int use_step_16 = (xd->height >= 16);
209
210
14.8M
  for (i = 0; i < end_mi;) {
211
8.03M
    const MB_MODE_INFO *const candidate =
212
8.03M
        xd->mi[(row_offset + i) * xd->mi_stride + col_offset];
213
8.03M
    const int candidate_bsize = candidate->bsize;
214
8.03M
    const int n4_h = mi_size_high[candidate_bsize];
215
8.03M
    int len = AOMMIN(xd->height, n4_h);
216
8.03M
    if (use_step_16)
217
287k
      len = AOMMAX(n8_h_16, len);
218
7.74M
    else if (abs(col_offset) > 1)
219
4.39M
      len = AOMMAX(len, n8_h_8);
220
221
8.03M
    int weight = 2;
222
8.03M
    if (xd->height >= n8_h_8 && xd->height <= n4_h) {
223
3.72M
      int inc = AOMMIN(-max_col_offset + col_offset + 1,
224
3.72M
                       mi_size_wide[candidate_bsize]);
225
      // Obtain range used in weight calculation.
226
3.72M
      weight = AOMMAX(weight, inc);
227
      // Update processed cols.
228
3.72M
      *processed_cols = inc - col_offset - 1;
229
3.72M
    }
230
231
8.03M
    add_ref_mv_candidate(candidate, rf, refmv_count, ref_match_count,
232
8.03M
                         newmv_count, ref_mv_stack, ref_mv_weight,
233
8.03M
                         gm_mv_candidates, cm->global_motion, len * weight);
234
235
8.03M
    i += len;
236
8.03M
  }
237
6.82M
}
238
239
static inline void scan_blk_mbmi(const AV1_COMMON *cm, const MACROBLOCKD *xd,
240
                                 const int mi_row, const int mi_col,
241
                                 const MV_REFERENCE_FRAME rf[2], int row_offset,
242
                                 int col_offset, CANDIDATE_MV *ref_mv_stack,
243
                                 uint16_t *ref_mv_weight,
244
                                 uint8_t *ref_match_count, uint8_t *newmv_count,
245
                                 int_mv *gm_mv_candidates,
246
4.81M
                                 uint8_t *refmv_count) {
247
4.81M
  const TileInfo *const tile = &xd->tile;
248
4.81M
  POSITION mi_pos;
249
250
4.81M
  mi_pos.row = row_offset;
251
4.81M
  mi_pos.col = col_offset;
252
253
4.81M
  if (is_inside(tile, mi_col, mi_row, &mi_pos)) {
254
4.56M
    const MB_MODE_INFO *const candidate =
255
4.56M
        xd->mi[mi_pos.row * xd->mi_stride + mi_pos.col];
256
4.56M
    const int len = mi_size_wide[BLOCK_8X8];
257
258
4.56M
    add_ref_mv_candidate(candidate, rf, refmv_count, ref_match_count,
259
4.56M
                         newmv_count, ref_mv_stack, ref_mv_weight,
260
4.56M
                         gm_mv_candidates, cm->global_motion, 2 * len);
261
4.56M
  }  // Analyze a single 8x8 block motion information.
262
4.81M
}
263
264
static int has_top_right(const AV1_COMMON *cm, const MACROBLOCKD *xd,
265
4.40M
                         int mi_row, int mi_col, int bs) {
266
4.40M
  const int sb_mi_size = mi_size_wide[cm->seq_params->sb_size];
267
4.40M
  const int mask_row = mi_row & (sb_mi_size - 1);
268
4.40M
  const int mask_col = mi_col & (sb_mi_size - 1);
269
270
4.40M
  if (bs > mi_size_wide[BLOCK_64X64]) return 0;
271
272
  // In a split partition all apart from the bottom right has a top right
273
4.29M
  int has_tr = !((mask_row & bs) && (mask_col & bs));
274
275
  // bs > 0 and bs is a power of 2
276
4.29M
  assert(bs > 0 && !(bs & (bs - 1)));
277
278
  // For each 4x4 group of blocks, when the bottom right is decoded the blocks
279
  // to the right have not been decoded therefore the bottom right does
280
  // not have a top right
281
6.44M
  while (bs < sb_mi_size) {
282
6.13M
    if (mask_col & bs) {
283
2.80M
      if ((mask_col & (2 * bs)) && (mask_row & (2 * bs))) {
284
663k
        has_tr = 0;
285
663k
        break;
286
663k
      }
287
3.32M
    } else {
288
3.32M
      break;
289
3.32M
    }
290
2.14M
    bs <<= 1;
291
2.14M
  }
292
293
  // In a VERTICAL or VERTICAL_4 partition, all partition before the last one
294
  // always have a top right (as the block above will have been decoded).
295
4.30M
  if (xd->width < xd->height) {
296
1.01M
    if (!xd->is_last_vertical_rect) has_tr = 1;
297
1.01M
  }
298
299
  // In a HORIZONTAL or HORIZONTAL_4 partition, partitions after the first one
300
  // never have a top right (as the block to the right won't have been decoded).
301
4.30M
  if (xd->width > xd->height) {
302
1.53M
    if (!xd->is_first_horizontal_rect) has_tr = 0;
303
1.53M
  }
304
305
  // The bottom left square of a Vertical A (in the old format) does
306
  // not have a top right as it is decoded before the right hand
307
  // rectangle of the partition
308
4.30M
  if (xd->mi[0]->partition == PARTITION_VERT_A) {
309
132k
    if (xd->width == xd->height)
310
86.0k
      if (mask_row & bs) has_tr = 0;
311
132k
  }
312
313
4.30M
  return has_tr;
314
4.29M
}
315
316
static int check_sb_border(const int mi_row, const int mi_col,
317
4.59M
                           const int row_offset, const int col_offset) {
318
4.59M
  const int sb_mi_size = mi_size_wide[BLOCK_64X64];
319
4.59M
  const int row = mi_row & (sb_mi_size - 1);
320
4.59M
  const int col = mi_col & (sb_mi_size - 1);
321
322
4.59M
  if (row + row_offset < 0 || row + row_offset >= sb_mi_size ||
323
3.92M
      col + col_offset < 0 || col + col_offset >= sb_mi_size)
324
1.60M
    return 0;
325
326
2.98M
  return 1;
327
4.59M
}
328
329
static int add_tpl_ref_mv(const AV1_COMMON *cm, const MACROBLOCKD *xd,
330
                          int mi_row, int mi_col, MV_REFERENCE_FRAME ref_frame,
331
                          int blk_row, int blk_col, int_mv *gm_mv_candidates,
332
                          uint8_t *const refmv_count,
333
                          CANDIDATE_MV ref_mv_stack[MAX_REF_MV_STACK_SIZE],
334
                          uint16_t ref_mv_weight[MAX_REF_MV_STACK_SIZE],
335
11.9M
                          int16_t *mode_context) {
336
11.9M
  POSITION mi_pos;
337
11.9M
  mi_pos.row = (mi_row & 0x01) ? blk_row : blk_row + 1;
338
11.9M
  mi_pos.col = (mi_col & 0x01) ? blk_col : blk_col + 1;
339
340
11.9M
  if (!is_inside(&xd->tile, mi_col, mi_row, &mi_pos)) return 0;
341
342
11.9M
  const TPL_MV_REF *prev_frame_mvs =
343
11.9M
      cm->tpl_mvs +
344
11.9M
      ((mi_row + mi_pos.row) >> 1) * (cm->mi_params.mi_stride >> 1) +
345
11.9M
      ((mi_col + mi_pos.col) >> 1);
346
11.9M
  if (prev_frame_mvs->mfmv0.as_int == INVALID_MV) return 0;
347
348
856k
  MV_REFERENCE_FRAME rf[2];
349
856k
  av1_set_ref_frame(rf, ref_frame);
350
351
856k
  const uint16_t weight_unit = 1;  // mi_size_wide[BLOCK_8X8];
352
856k
  const int cur_frame_index = cm->cur_frame->order_hint;
353
856k
  const RefCntBuffer *const buf_0 = get_ref_frame_buf(cm, rf[0]);
354
856k
  const int frame0_index = buf_0->order_hint;
355
856k
  const int cur_offset_0 = get_relative_dist(&cm->seq_params->order_hint_info,
356
856k
                                             cur_frame_index, frame0_index);
357
856k
  int idx;
358
856k
  const int allow_high_precision_mv = cm->features.allow_high_precision_mv;
359
856k
  const int force_integer_mv = cm->features.cur_frame_force_integer_mv;
360
361
856k
  int_mv this_refmv;
362
856k
  av1_get_mv_projection(&this_refmv.as_mv, prev_frame_mvs->mfmv0.as_mv,
363
856k
                        cur_offset_0, prev_frame_mvs->ref_frame_offset);
364
856k
  lower_mv_precision(&this_refmv.as_mv, allow_high_precision_mv,
365
856k
                     force_integer_mv);
366
367
856k
  if (rf[1] == NONE_FRAME) {
368
465k
    if (blk_row == 0 && blk_col == 0) {
369
67.1k
      if (abs(this_refmv.as_mv.row - gm_mv_candidates[0].as_mv.row) >= 16 ||
370
59.0k
          abs(this_refmv.as_mv.col - gm_mv_candidates[0].as_mv.col) >= 16)
371
38.9k
        mode_context[ref_frame] |= (1 << GLOBALMV_OFFSET);
372
67.1k
    }
373
374
1.04M
    for (idx = 0; idx < *refmv_count; ++idx)
375
983k
      if (this_refmv.as_int == ref_mv_stack[idx].this_mv.as_int) break;
376
377
465k
    if (idx < *refmv_count) ref_mv_weight[idx] += 2 * weight_unit;
378
379
465k
    if (idx == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) {
380
90.0k
      ref_mv_stack[idx].this_mv.as_int = this_refmv.as_int;
381
90.0k
      ref_mv_weight[idx] = 2 * weight_unit;
382
90.0k
      ++(*refmv_count);
383
90.0k
    }
384
465k
  } else {
385
    // Process compound inter mode
386
390k
    const RefCntBuffer *const buf_1 = get_ref_frame_buf(cm, rf[1]);
387
390k
    const int frame1_index = buf_1->order_hint;
388
390k
    const int cur_offset_1 = get_relative_dist(&cm->seq_params->order_hint_info,
389
390k
                                               cur_frame_index, frame1_index);
390
390k
    int_mv comp_refmv;
391
390k
    av1_get_mv_projection(&comp_refmv.as_mv, prev_frame_mvs->mfmv0.as_mv,
392
390k
                          cur_offset_1, prev_frame_mvs->ref_frame_offset);
393
390k
    lower_mv_precision(&comp_refmv.as_mv, allow_high_precision_mv,
394
390k
                       force_integer_mv);
395
396
390k
    if (blk_row == 0 && blk_col == 0) {
397
35.4k
      if (abs(this_refmv.as_mv.row - gm_mv_candidates[0].as_mv.row) >= 16 ||
398
32.8k
          abs(this_refmv.as_mv.col - gm_mv_candidates[0].as_mv.col) >= 16 ||
399
15.4k
          abs(comp_refmv.as_mv.row - gm_mv_candidates[1].as_mv.row) >= 16 ||
400
15.0k
          abs(comp_refmv.as_mv.col - gm_mv_candidates[1].as_mv.col) >= 16)
401
21.9k
        mode_context[ref_frame] |= (1 << GLOBALMV_OFFSET);
402
35.4k
    }
403
404
844k
    for (idx = 0; idx < *refmv_count; ++idx) {
405
797k
      if (this_refmv.as_int == ref_mv_stack[idx].this_mv.as_int &&
406
350k
          comp_refmv.as_int == ref_mv_stack[idx].comp_mv.as_int)
407
343k
        break;
408
797k
    }
409
410
390k
    if (idx < *refmv_count) ref_mv_weight[idx] += 2 * weight_unit;
411
412
390k
    if (idx == *refmv_count && *refmv_count < MAX_REF_MV_STACK_SIZE) {
413
66.3k
      ref_mv_stack[idx].this_mv.as_int = this_refmv.as_int;
414
66.3k
      ref_mv_stack[idx].comp_mv.as_int = comp_refmv.as_int;
415
66.3k
      ref_mv_weight[idx] = 2 * weight_unit;
416
66.3k
      ++(*refmv_count);
417
66.3k
    }
418
390k
  }
419
420
856k
  return 1;
421
11.9M
}
422
423
static inline void process_compound_ref_mv_candidate(
424
    const MB_MODE_INFO *const candidate, const AV1_COMMON *const cm,
425
    const MV_REFERENCE_FRAME *const rf, int_mv ref_id[2][2],
426
471k
    int ref_id_count[2], int_mv ref_diff[2][2], int ref_diff_count[2]) {
427
1.41M
  for (int rf_idx = 0; rf_idx < 2; ++rf_idx) {
428
941k
    MV_REFERENCE_FRAME can_rf = candidate->ref_frame[rf_idx];
429
430
2.82M
    for (int cmp_idx = 0; cmp_idx < 2; ++cmp_idx) {
431
1.88M
      if (can_rf == rf[cmp_idx] && ref_id_count[cmp_idx] < 2) {
432
491k
        ref_id[cmp_idx][ref_id_count[cmp_idx]] = candidate->mv[rf_idx];
433
491k
        ++ref_id_count[cmp_idx];
434
1.39M
      } else if (can_rf > INTRA_FRAME && ref_diff_count[cmp_idx] < 2) {
435
697k
        int_mv this_mv = candidate->mv[rf_idx];
436
697k
        if (cm->ref_frame_sign_bias[can_rf] !=
437
697k
            cm->ref_frame_sign_bias[rf[cmp_idx]]) {
438
132k
          this_mv.as_mv.row = -this_mv.as_mv.row;
439
132k
          this_mv.as_mv.col = -this_mv.as_mv.col;
440
132k
        }
441
697k
        ref_diff[cmp_idx][ref_diff_count[cmp_idx]] = this_mv;
442
697k
        ++ref_diff_count[cmp_idx];
443
697k
      }
444
1.88M
    }
445
941k
  }
446
471k
}
447
448
static inline void process_single_ref_mv_candidate(
449
    const MB_MODE_INFO *const candidate, const AV1_COMMON *const cm,
450
    MV_REFERENCE_FRAME ref_frame, uint8_t *const refmv_count,
451
    CANDIDATE_MV ref_mv_stack[MAX_REF_MV_STACK_SIZE],
452
1.80M
    uint16_t ref_mv_weight[MAX_REF_MV_STACK_SIZE]) {
453
5.42M
  for (int rf_idx = 0; rf_idx < 2; ++rf_idx) {
454
3.61M
    if (candidate->ref_frame[rf_idx] > INTRA_FRAME) {
455
1.40M
      int_mv this_mv = candidate->mv[rf_idx];
456
1.40M
      if (cm->ref_frame_sign_bias[candidate->ref_frame[rf_idx]] !=
457
1.40M
          cm->ref_frame_sign_bias[ref_frame]) {
458
34.7k
        this_mv.as_mv.row = -this_mv.as_mv.row;
459
34.7k
        this_mv.as_mv.col = -this_mv.as_mv.col;
460
34.7k
      }
461
1.40M
      int stack_idx;
462
1.63M
      for (stack_idx = 0; stack_idx < *refmv_count; ++stack_idx) {
463
1.31M
        const int_mv stack_mv = ref_mv_stack[stack_idx].this_mv;
464
1.31M
        if (this_mv.as_int == stack_mv.as_int) break;
465
1.31M
      }
466
467
1.40M
      if (stack_idx == *refmv_count) {
468
320k
        ref_mv_stack[stack_idx].this_mv = this_mv;
469
470
        // TODO(jingning): Set an arbitrary small number here. The weight
471
        // doesn't matter as long as it is properly initialized.
472
320k
        ref_mv_weight[stack_idx] = 2;
473
320k
        ++(*refmv_count);
474
320k
      }
475
1.40M
    }
476
3.61M
  }
477
1.80M
}
478
479
static inline void setup_ref_mv_list(
480
    const AV1_COMMON *cm, const MACROBLOCKD *xd, MV_REFERENCE_FRAME ref_frame,
481
    uint8_t *const refmv_count,
482
    CANDIDATE_MV ref_mv_stack[MAX_REF_MV_STACK_SIZE],
483
    uint16_t ref_mv_weight[MAX_REF_MV_STACK_SIZE],
484
    int_mv mv_ref_list[MAX_MV_REF_CANDIDATES], int_mv *gm_mv_candidates,
485
3.08M
    int mi_row, int mi_col, int16_t *mode_context) {
486
3.08M
  const int bs = AOMMAX(xd->width, xd->height);
487
3.08M
  const int has_tr = has_top_right(cm, xd, mi_row, mi_col, bs);
488
3.08M
  MV_REFERENCE_FRAME rf[2];
489
490
3.08M
  const TileInfo *const tile = &xd->tile;
491
3.08M
  int max_row_offset = 0, max_col_offset = 0;
492
3.08M
  const int row_adj = (xd->height < mi_size_high[BLOCK_8X8]) && (mi_row & 0x01);
493
3.08M
  const int col_adj = (xd->width < mi_size_wide[BLOCK_8X8]) && (mi_col & 0x01);
494
3.08M
  int processed_rows = 0;
495
3.08M
  int processed_cols = 0;
496
497
3.08M
  av1_set_ref_frame(rf, ref_frame);
498
3.08M
  mode_context[ref_frame] = 0;
499
3.08M
  *refmv_count = 0;
500
501
  // Find valid maximum row/col offset.
502
3.08M
  if (xd->up_available) {
503
2.97M
    max_row_offset = -(MVREF_ROW_COLS << 1) + row_adj;
504
505
2.97M
    if (xd->height < mi_size_high[BLOCK_8X8])
506
727k
      max_row_offset = -(2 << 1) + row_adj;
507
508
2.97M
    max_row_offset = find_valid_row_offset(tile, mi_row, max_row_offset);
509
2.97M
  }
510
511
3.08M
  if (xd->left_available) {
512
3.00M
    max_col_offset = -(MVREF_ROW_COLS << 1) + col_adj;
513
514
3.00M
    if (xd->width < mi_size_wide[BLOCK_8X8])
515
607k
      max_col_offset = -(2 << 1) + col_adj;
516
517
3.00M
    max_col_offset = find_valid_col_offset(tile, mi_col, max_col_offset);
518
3.00M
  }
519
520
3.08M
  uint8_t col_match_count = 0;
521
3.08M
  uint8_t row_match_count = 0;
522
3.08M
  uint8_t newmv_count = 0;
523
524
  // Scan the first above row mode info. row_offset = -1;
525
3.08M
  if (abs(max_row_offset) >= 1)
526
2.97M
    scan_row_mbmi(cm, xd, mi_col, rf, -1, ref_mv_stack, ref_mv_weight,
527
2.97M
                  refmv_count, &row_match_count, &newmv_count, gm_mv_candidates,
528
2.97M
                  max_row_offset, &processed_rows);
529
  // Scan the first left column mode info. col_offset = -1;
530
3.08M
  if (abs(max_col_offset) >= 1)
531
3.00M
    scan_col_mbmi(cm, xd, mi_row, rf, -1, ref_mv_stack, ref_mv_weight,
532
3.00M
                  refmv_count, &col_match_count, &newmv_count, gm_mv_candidates,
533
3.00M
                  max_col_offset, &processed_cols);
534
  // Check top-right boundary
535
3.08M
  if (has_tr)
536
1.72M
    scan_blk_mbmi(cm, xd, mi_row, mi_col, rf, -1, xd->width, ref_mv_stack,
537
1.72M
                  ref_mv_weight, &row_match_count, &newmv_count,
538
1.72M
                  gm_mv_candidates, refmv_count);
539
540
3.08M
  const uint8_t nearest_match = (row_match_count > 0) + (col_match_count > 0);
541
3.08M
  const uint8_t nearest_refmv_count = *refmv_count;
542
543
  // TODO(yunqing): for comp_search, do it for all 3 cases.
544
7.59M
  for (int idx = 0; idx < nearest_refmv_count; ++idx)
545
4.51M
    ref_mv_weight[idx] += REF_CAT_LEVEL;
546
547
3.08M
  if (cm->features.allow_ref_frame_mvs) {
548
2.71M
    int is_available = 0;
549
2.71M
    const int voffset = AOMMAX(mi_size_high[BLOCK_8X8], xd->height);
550
2.71M
    const int hoffset = AOMMAX(mi_size_wide[BLOCK_8X8], xd->width);
551
2.71M
    const int blk_row_end = AOMMIN(xd->height, mi_size_high[BLOCK_64X64]);
552
2.71M
    const int blk_col_end = AOMMIN(xd->width, mi_size_wide[BLOCK_64X64]);
553
554
2.71M
    const int tpl_sample_pos[3][2] = {
555
2.71M
      { voffset, -2 },
556
2.71M
      { voffset, hoffset },
557
2.71M
      { voffset - 2, hoffset },
558
2.71M
    };
559
2.71M
    const int allow_extension = (xd->height >= mi_size_high[BLOCK_8X8]) &&
560
2.07M
                                (xd->height < mi_size_high[BLOCK_64X64]) &&
561
1.97M
                                (xd->width >= mi_size_wide[BLOCK_8X8]) &&
562
1.57M
                                (xd->width < mi_size_wide[BLOCK_64X64]);
563
564
2.71M
    const int step_h = (xd->height >= mi_size_high[BLOCK_64X64])
565
2.71M
                           ? mi_size_high[BLOCK_16X16]
566
2.71M
                           : mi_size_high[BLOCK_8X8];
567
2.71M
    const int step_w = (xd->width >= mi_size_wide[BLOCK_64X64])
568
2.71M
                           ? mi_size_wide[BLOCK_16X16]
569
2.71M
                           : mi_size_wide[BLOCK_8X8];
570
571
7.19M
    for (int blk_row = 0; blk_row < blk_row_end; blk_row += step_h) {
572
13.4M
      for (int blk_col = 0; blk_col < blk_col_end; blk_col += step_w) {
573
9.01M
        int ret = add_tpl_ref_mv(cm, xd, mi_row, mi_col, ref_frame, blk_row,
574
9.01M
                                 blk_col, gm_mv_candidates, refmv_count,
575
9.01M
                                 ref_mv_stack, ref_mv_weight, mode_context);
576
9.01M
        if (blk_row == 0 && blk_col == 0) is_available = ret;
577
9.01M
      }
578
4.47M
    }
579
580
2.71M
    if (is_available == 0) mode_context[ref_frame] |= (1 << GLOBALMV_OFFSET);
581
582
7.31M
    for (int i = 0; i < 3 && allow_extension; ++i) {
583
4.59M
      const int blk_row = tpl_sample_pos[i][0];
584
4.59M
      const int blk_col = tpl_sample_pos[i][1];
585
586
4.59M
      if (!check_sb_border(mi_row, mi_col, blk_row, blk_col)) continue;
587
2.98M
      add_tpl_ref_mv(cm, xd, mi_row, mi_col, ref_frame, blk_row, blk_col,
588
2.98M
                     gm_mv_candidates, refmv_count, ref_mv_stack, ref_mv_weight,
589
2.98M
                     mode_context);
590
2.98M
    }
591
2.71M
  }
592
593
3.08M
  uint8_t dummy_newmv_count = 0;
594
595
  // Scan the second outer area.
596
3.08M
  scan_blk_mbmi(cm, xd, mi_row, mi_col, rf, -1, -1, ref_mv_stack, ref_mv_weight,
597
3.08M
                &row_match_count, &dummy_newmv_count, gm_mv_candidates,
598
3.08M
                refmv_count);
599
600
9.25M
  for (int idx = 2; idx <= MVREF_ROW_COLS; ++idx) {
601
6.16M
    const int row_offset = -(idx << 1) + 1 + row_adj;
602
6.16M
    const int col_offset = -(idx << 1) + 1 + col_adj;
603
604
6.16M
    if (abs(row_offset) <= abs(max_row_offset) &&
605
5.15M
        abs(row_offset) > processed_rows)
606
3.81M
      scan_row_mbmi(cm, xd, mi_col, rf, row_offset, ref_mv_stack, ref_mv_weight,
607
3.81M
                    refmv_count, &row_match_count, &dummy_newmv_count,
608
3.81M
                    gm_mv_candidates, max_row_offset, &processed_rows);
609
610
6.16M
    if (abs(col_offset) <= abs(max_col_offset) &&
611
5.36M
        abs(col_offset) > processed_cols)
612
3.82M
      scan_col_mbmi(cm, xd, mi_row, rf, col_offset, ref_mv_stack, ref_mv_weight,
613
3.82M
                    refmv_count, &col_match_count, &dummy_newmv_count,
614
3.82M
                    gm_mv_candidates, max_col_offset, &processed_cols);
615
6.16M
  }
616
617
3.08M
  const uint8_t ref_match_count = (row_match_count > 0) + (col_match_count > 0);
618
619
3.08M
  switch (nearest_match) {
620
395k
    case 0:
621
395k
      if (ref_match_count >= 1) mode_context[ref_frame] |= 1;
622
395k
      if (ref_match_count == 1)
623
86.2k
        mode_context[ref_frame] |= (1 << REFMV_OFFSET);
624
309k
      else if (ref_match_count >= 2)
625
21.8k
        mode_context[ref_frame] |= (2 << REFMV_OFFSET);
626
395k
      break;
627
972k
    case 1:
628
972k
      mode_context[ref_frame] |= (newmv_count > 0) ? 2 : 3;
629
972k
      if (ref_match_count == 1)
630
569k
        mode_context[ref_frame] |= (3 << REFMV_OFFSET);
631
403k
      else if (ref_match_count >= 2)
632
403k
        mode_context[ref_frame] |= (4 << REFMV_OFFSET);
633
972k
      break;
634
1.72M
    case 2:
635
1.72M
    default:
636
1.72M
      if (newmv_count >= 1)
637
1.18M
        mode_context[ref_frame] |= 4;
638
535k
      else
639
535k
        mode_context[ref_frame] |= 5;
640
641
1.72M
      mode_context[ref_frame] |= (5 << REFMV_OFFSET);
642
1.72M
      break;
643
3.08M
  }
644
645
  // Rank the likelihood and assign nearest and near mvs.
646
3.08M
  int len = nearest_refmv_count;
647
6.43M
  while (len > 0) {
648
3.34M
    int nr_len = 0;
649
5.51M
    for (int idx = 1; idx < len; ++idx) {
650
2.17M
      if (ref_mv_weight[idx - 1] < ref_mv_weight[idx]) {
651
799k
        const CANDIDATE_MV tmp_mv = ref_mv_stack[idx - 1];
652
799k
        const uint16_t tmp_ref_mv_weight = ref_mv_weight[idx - 1];
653
799k
        ref_mv_stack[idx - 1] = ref_mv_stack[idx];
654
799k
        ref_mv_stack[idx] = tmp_mv;
655
799k
        ref_mv_weight[idx - 1] = ref_mv_weight[idx];
656
799k
        ref_mv_weight[idx] = tmp_ref_mv_weight;
657
799k
        nr_len = idx;
658
799k
      }
659
2.17M
    }
660
3.34M
    len = nr_len;
661
3.34M
  }
662
663
3.08M
  len = *refmv_count;
664
5.23M
  while (len > nearest_refmv_count) {
665
2.14M
    int nr_len = nearest_refmv_count;
666
3.97M
    for (int idx = nearest_refmv_count + 1; idx < len; ++idx) {
667
1.82M
      if (ref_mv_weight[idx - 1] < ref_mv_weight[idx]) {
668
531k
        const CANDIDATE_MV tmp_mv = ref_mv_stack[idx - 1];
669
531k
        const uint16_t tmp_ref_mv_weight = ref_mv_weight[idx - 1];
670
531k
        ref_mv_stack[idx - 1] = ref_mv_stack[idx];
671
531k
        ref_mv_stack[idx] = tmp_mv;
672
531k
        ref_mv_weight[idx - 1] = ref_mv_weight[idx];
673
531k
        ref_mv_weight[idx] = tmp_ref_mv_weight;
674
531k
        nr_len = idx;
675
531k
      }
676
1.82M
    }
677
2.14M
    len = nr_len;
678
2.14M
  }
679
680
3.08M
  int mi_width = AOMMIN(mi_size_wide[BLOCK_64X64], xd->width);
681
3.08M
  mi_width = AOMMIN(mi_width, cm->mi_params.mi_cols - mi_col);
682
3.08M
  int mi_height = AOMMIN(mi_size_high[BLOCK_64X64], xd->height);
683
3.08M
  mi_height = AOMMIN(mi_height, cm->mi_params.mi_rows - mi_row);
684
3.08M
  const int mi_size = AOMMIN(mi_width, mi_height);
685
3.08M
  if (rf[1] > NONE_FRAME) {
686
    // TODO(jingning, yunqing): Refactor and consolidate the compound and
687
    // single reference frame modes. Reduce unnecessary redundancy.
688
337k
    if (*refmv_count < MAX_MV_REF_CANDIDATES) {
689
240k
      int_mv ref_id[2][2], ref_diff[2][2];
690
240k
      int ref_id_count[2] = { 0 }, ref_diff_count[2] = { 0 };
691
692
467k
      for (int idx = 0; abs(max_row_offset) >= 1 && idx < mi_size;) {
693
227k
        const MB_MODE_INFO *const candidate = xd->mi[-xd->mi_stride + idx];
694
227k
        process_compound_ref_mv_candidate(
695
227k
            candidate, cm, rf, ref_id, ref_id_count, ref_diff, ref_diff_count);
696
227k
        idx += mi_size_wide[candidate->bsize];
697
227k
      }
698
699
484k
      for (int idx = 0; abs(max_col_offset) >= 1 && idx < mi_size;) {
700
244k
        const MB_MODE_INFO *const candidate = xd->mi[idx * xd->mi_stride - 1];
701
244k
        process_compound_ref_mv_candidate(
702
244k
            candidate, cm, rf, ref_id, ref_id_count, ref_diff, ref_diff_count);
703
244k
        idx += mi_size_high[candidate->bsize];
704
244k
      }
705
706
      // Build up the compound mv predictor
707
240k
      int_mv comp_list[MAX_MV_REF_CANDIDATES][2];
708
709
722k
      for (int idx = 0; idx < 2; ++idx) {
710
481k
        int comp_idx = 0;
711
481k
        for (int list_idx = 0;
712
973k
             list_idx < ref_id_count[idx] && comp_idx < MAX_MV_REF_CANDIDATES;
713
491k
             ++list_idx, ++comp_idx)
714
491k
          comp_list[comp_idx][idx] = ref_id[idx][list_idx];
715
481k
        for (int list_idx = 0;
716
860k
             list_idx < ref_diff_count[idx] && comp_idx < MAX_MV_REF_CANDIDATES;
717
481k
             ++list_idx, ++comp_idx)
718
379k
          comp_list[comp_idx][idx] = ref_diff[idx][list_idx];
719
573k
        for (; comp_idx < MAX_MV_REF_CANDIDATES; ++comp_idx)
720
91.8k
          comp_list[comp_idx][idx] = gm_mv_candidates[idx];
721
481k
      }
722
723
240k
      if (*refmv_count) {
724
138k
        assert(*refmv_count == 1);
725
138k
        if (comp_list[0][0].as_int == ref_mv_stack[0].this_mv.as_int &&
726
115k
            comp_list[0][1].as_int == ref_mv_stack[0].comp_mv.as_int) {
727
106k
          ref_mv_stack[*refmv_count].this_mv = comp_list[1][0];
728
106k
          ref_mv_stack[*refmv_count].comp_mv = comp_list[1][1];
729
106k
        } else {
730
32.3k
          ref_mv_stack[*refmv_count].this_mv = comp_list[0][0];
731
32.3k
          ref_mv_stack[*refmv_count].comp_mv = comp_list[0][1];
732
32.3k
        }
733
138k
        ref_mv_weight[*refmv_count] = 2;
734
138k
        ++*refmv_count;
735
138k
      } else {
736
305k
        for (int idx = 0; idx < MAX_MV_REF_CANDIDATES; ++idx) {
737
203k
          ref_mv_stack[*refmv_count].this_mv = comp_list[idx][0];
738
203k
          ref_mv_stack[*refmv_count].comp_mv = comp_list[idx][1];
739
203k
          ref_mv_weight[*refmv_count] = 2;
740
203k
          ++*refmv_count;
741
203k
        }
742
101k
      }
743
240k
    }
744
745
337k
    assert(*refmv_count >= 2);
746
747
1.09M
    for (int idx = 0; idx < *refmv_count; ++idx) {
748
758k
      clamp_mv_ref(&ref_mv_stack[idx].this_mv.as_mv, xd->width << MI_SIZE_LOG2,
749
758k
                   xd->height << MI_SIZE_LOG2, xd);
750
758k
      clamp_mv_ref(&ref_mv_stack[idx].comp_mv.as_mv, xd->width << MI_SIZE_LOG2,
751
758k
                   xd->height << MI_SIZE_LOG2, xd);
752
758k
    }
753
2.75M
  } else {
754
    // Handle single reference frame extension
755
3.70M
    for (int idx = 0; abs(max_row_offset) >= 1 && idx < mi_size &&
756
2.75M
                      *refmv_count < MAX_MV_REF_CANDIDATES;) {
757
953k
      const MB_MODE_INFO *const candidate = xd->mi[-xd->mi_stride + idx];
758
953k
      process_single_ref_mv_candidate(candidate, cm, ref_frame, refmv_count,
759
953k
                                      ref_mv_stack, ref_mv_weight);
760
953k
      idx += mi_size_wide[candidate->bsize];
761
953k
    }
762
763
3.60M
    for (int idx = 0; abs(max_col_offset) >= 1 && idx < mi_size &&
764
2.76M
                      *refmv_count < MAX_MV_REF_CANDIDATES;) {
765
853k
      const MB_MODE_INFO *const candidate = xd->mi[idx * xd->mi_stride - 1];
766
853k
      process_single_ref_mv_candidate(candidate, cm, ref_frame, refmv_count,
767
853k
                                      ref_mv_stack, ref_mv_weight);
768
853k
      idx += mi_size_high[candidate->bsize];
769
853k
    }
770
771
10.4M
    for (int idx = 0; idx < *refmv_count; ++idx) {
772
7.70M
      clamp_mv_ref(&ref_mv_stack[idx].this_mv.as_mv, xd->width << MI_SIZE_LOG2,
773
7.70M
                   xd->height << MI_SIZE_LOG2, xd);
774
7.70M
    }
775
776
2.75M
    if (mv_ref_list != NULL) {
777
3.55M
      for (int idx = *refmv_count; idx < MAX_MV_REF_CANDIDATES; ++idx)
778
804k
        mv_ref_list[idx].as_int = gm_mv_candidates[0].as_int;
779
780
7.44M
      for (int idx = 0; idx < AOMMIN(MAX_MV_REF_CANDIDATES, *refmv_count);
781
4.69M
           ++idx) {
782
4.69M
        mv_ref_list[idx].as_int = ref_mv_stack[idx].this_mv.as_int;
783
4.69M
      }
784
2.75M
    }
785
2.75M
  }
786
3.08M
}
787
788
void av1_find_mv_refs(const AV1_COMMON *cm, const MACROBLOCKD *xd,
789
                      MB_MODE_INFO *mi, MV_REFERENCE_FRAME ref_frame,
790
                      uint8_t ref_mv_count[MODE_CTX_REF_FRAMES],
791
                      CANDIDATE_MV ref_mv_stack[][MAX_REF_MV_STACK_SIZE],
792
                      uint16_t ref_mv_weight[][MAX_REF_MV_STACK_SIZE],
793
                      int_mv mv_ref_list[][MAX_MV_REF_CANDIDATES],
794
3.08M
                      int_mv *global_mvs, int16_t *mode_context) {
795
3.08M
  const int mi_row = xd->mi_row;
796
3.08M
  const int mi_col = xd->mi_col;
797
3.08M
  int_mv gm_mv[2];
798
799
3.08M
  if (ref_frame == INTRA_FRAME) {
800
23.7k
    gm_mv[0].as_int = gm_mv[1].as_int = 0;
801
23.7k
    if (global_mvs != NULL) {
802
0
      global_mvs[ref_frame].as_int = INVALID_MV;
803
0
    }
804
3.05M
  } else {
805
3.05M
    const BLOCK_SIZE bsize = mi->bsize;
806
3.05M
    const int allow_high_precision_mv = cm->features.allow_high_precision_mv;
807
3.05M
    const int force_integer_mv = cm->features.cur_frame_force_integer_mv;
808
3.05M
    if (ref_frame < REF_FRAMES) {
809
2.72M
      gm_mv[0] = gm_get_motion_vector(&cm->global_motion[ref_frame],
810
2.72M
                                      allow_high_precision_mv, bsize, mi_col,
811
2.72M
                                      mi_row, force_integer_mv);
812
2.72M
      gm_mv[1].as_int = 0;
813
2.72M
      if (global_mvs != NULL) global_mvs[ref_frame] = gm_mv[0];
814
2.72M
    } else {
815
332k
      MV_REFERENCE_FRAME rf[2];
816
332k
      av1_set_ref_frame(rf, ref_frame);
817
332k
      gm_mv[0] = gm_get_motion_vector(&cm->global_motion[rf[0]],
818
332k
                                      allow_high_precision_mv, bsize, mi_col,
819
332k
                                      mi_row, force_integer_mv);
820
332k
      gm_mv[1] = gm_get_motion_vector(&cm->global_motion[rf[1]],
821
332k
                                      allow_high_precision_mv, bsize, mi_col,
822
332k
                                      mi_row, force_integer_mv);
823
332k
    }
824
3.05M
  }
825
826
3.08M
  setup_ref_mv_list(cm, xd, ref_frame, &ref_mv_count[ref_frame],
827
3.08M
                    ref_mv_stack[ref_frame], ref_mv_weight[ref_frame],
828
3.08M
                    mv_ref_list ? mv_ref_list[ref_frame] : NULL, gm_mv, mi_row,
829
3.08M
                    mi_col, mode_context);
830
3.08M
}
831
832
// Passes each of the first MAX_MV_REF_CANDIDATES entries of |mvlist| through
// lower_mv_precision() (using |allow_hp| and |is_integer|), then copies
// entry 0 into |*nearest_mv| and entry 1 into |*near_mv|.
void av1_find_best_ref_mvs(int allow_hp, int_mv *mvlist, int_mv *nearest_mv,
                           int_mv *near_mv, int is_integer) {
  int_mv *const list_end = mvlist + MAX_MV_REF_CANDIDATES;
  for (int_mv *cand = mvlist; cand != list_end; ++cand) {
    lower_mv_precision(&cand->as_mv, allow_hp, is_integer);
  }

  *nearest_mv = mvlist[0];
  *near_mv = mvlist[1];
}
842
843
81.5k
// Copies order-hint bookkeeping from cm->current_frame into cm->cur_frame,
// resets both filter_level entries to -1, and records the order hint and
// display order hint of every reference (LAST_FRAME..ALTREF_FRAME) that has a
// buffer. Slots whose reference buffer is NULL are left untouched.
void av1_setup_frame_buf_refs(AV1_COMMON *cm) {
  cm->cur_frame->order_hint = cm->current_frame.order_hint;
  cm->cur_frame->display_order_hint = cm->current_frame.display_order_hint;
  cm->cur_frame->pyramid_level = cm->current_frame.pyramid_level;
  for (int plane = 0; plane < 2; ++plane) {
    cm->cur_frame->filter_level[plane] = -1;
  }

  for (int slot = 0; slot <= ALTREF_FRAME - LAST_FRAME; ++slot) {
    const RefCntBuffer *const ref_buf = get_ref_frame_buf(cm, LAST_FRAME + slot);
    if (ref_buf == NULL) continue;

    cm->cur_frame->ref_order_hints[slot] = ref_buf->order_hint;
    cm->cur_frame->ref_display_order_hint[slot] = ref_buf->display_order_hint;
  }
}
859
860
81.5k
// Fills cm->ref_frame_sign_bias[] for LAST_FRAME..ALTREF_FRAME.
// An entry is 1 only when order hints are enabled, the reference has a buffer,
// and get_relative_dist(reference hint, current hint) is strictly positive;
// every other case yields 0.
void av1_setup_frame_sign_bias(AV1_COMMON *cm) {
  for (MV_REFERENCE_FRAME ref = LAST_FRAME; ref <= ALTREF_FRAME; ++ref) {
    const RefCntBuffer *const ref_buf = get_ref_frame_buf(cm, ref);
    int bias = 0;

    if (ref_buf != NULL && cm->seq_params->order_hint_info.enable_order_hint) {
      const int ref_hint = ref_buf->order_hint;
      const int dist =
          get_relative_dist(&cm->seq_params->order_hint_info, ref_hint,
                            (int)cm->current_frame.order_hint);
      if (dist > 0) bias = 1;
    }

    cm->ref_frame_sign_bias[ref] = bias;
  }
}
876
877
14.6M
#define MAX_OFFSET_WIDTH 64
878
14.8M
#define MAX_OFFSET_HEIGHT 0
879
880
static int get_block_position(AV1_COMMON *cm, int *mi_r, int *mi_c, int blk_row,
881
7.75M
                              int blk_col, MV mv, int sign_bias) {
882
7.75M
  const int base_blk_row = (blk_row >> 3) << 3;
883
7.75M
  const int base_blk_col = (blk_col >> 3) << 3;
884
885
7.75M
  const int row_offset = (mv.row >= 0) ? (mv.row >> (4 + MI_SIZE_LOG2))
886
7.75M
                                       : -((-mv.row) >> (4 + MI_SIZE_LOG2));
887
888
7.75M
  const int col_offset = (mv.col >= 0) ? (mv.col >> (4 + MI_SIZE_LOG2))
889
7.75M
                                       : -((-mv.col) >> (4 + MI_SIZE_LOG2));
890
891
7.75M
  const int row =
892
7.75M
      (sign_bias == 1) ? blk_row - row_offset : blk_row + row_offset;
893
7.75M
  const int col =
894
7.75M
      (sign_bias == 1) ? blk_col - col_offset : blk_col + col_offset;
895
896
7.75M
  if (row < 0 || row >= (cm->mi_params.mi_rows >> 1) || col < 0 ||
897
7.47M
      col >= (cm->mi_params.mi_cols >> 1))
898
291k
    return 0;
899
900
7.45M
  if (row < base_blk_row - (MAX_OFFSET_HEIGHT >> 3) ||
901
7.39M
      row >= base_blk_row + 8 + (MAX_OFFSET_HEIGHT >> 3) ||
902
7.34M
      col < base_blk_col - (MAX_OFFSET_WIDTH >> 3) ||
903
7.33M
      col >= base_blk_col + 8 + (MAX_OFFSET_WIDTH >> 3))
904
128k
    return 0;
905
906
7.32M
  *mi_r = row;
907
7.32M
  *mi_c = col;
908
909
7.32M
  return 1;
910
7.45M
}
911
912
// Note: motion_filed_projection finds motion vectors of current frame's
913
// reference frame, and projects them to current frame. To make it clear,
914
// let's call current frame's reference frame as start frame.
915
// Call Start frame's reference frames as reference frames.
916
// Call ref_offset as frame distances between start frame and its reference
917
// frames.
918
static int motion_field_projection(AV1_COMMON *cm,
919
16.3k
                                   MV_REFERENCE_FRAME start_frame, int dir) {
920
16.3k
  TPL_MV_REF *tpl_mvs_base = cm->tpl_mvs;
921
16.3k
  int ref_offset[REF_FRAMES] = { 0 };
922
923
16.3k
  const RefCntBuffer *const start_frame_buf =
924
16.3k
      get_ref_frame_buf(cm, start_frame);
925
16.3k
  if (start_frame_buf == NULL) return 0;
926
927
16.3k
  if (start_frame_buf->frame_type == KEY_FRAME ||
928
8.21k
      start_frame_buf->frame_type == INTRA_ONLY_FRAME)
929
8.92k
    return 0;
930
931
7.42k
  if (start_frame_buf->mi_rows != cm->mi_params.mi_rows ||
932
7.41k
      start_frame_buf->mi_cols != cm->mi_params.mi_cols)
933
25
    return 0;
934
935
7.40k
  const int start_frame_order_hint = start_frame_buf->order_hint;
936
7.40k
  const unsigned int *const ref_order_hints =
937
7.40k
      &start_frame_buf->ref_order_hints[0];
938
7.40k
  const int cur_order_hint = cm->cur_frame->order_hint;
939
7.40k
  int start_to_current_frame_offset = get_relative_dist(
940
7.40k
      &cm->seq_params->order_hint_info, start_frame_order_hint, cur_order_hint);
941
942
59.2k
  for (MV_REFERENCE_FRAME rf = LAST_FRAME; rf <= INTER_REFS_PER_FRAME; ++rf) {
943
51.8k
    ref_offset[rf] = get_relative_dist(&cm->seq_params->order_hint_info,
944
51.8k
                                       start_frame_order_hint,
945
51.8k
                                       ref_order_hints[rf - LAST_FRAME]);
946
51.8k
  }
947
948
7.40k
  if (dir == 2) start_to_current_frame_offset = -start_to_current_frame_offset;
949
950
7.40k
  MV_REF *mv_ref_base = start_frame_buf->mvs;
951
7.40k
  const int mvs_rows = (cm->mi_params.mi_rows + 1) >> 1;
952
7.40k
  const int mvs_cols = (cm->mi_params.mi_cols + 1) >> 1;
953
954
203k
  for (int blk_row = 0; blk_row < mvs_rows; ++blk_row) {
955
13.0M
    for (int blk_col = 0; blk_col < mvs_cols; ++blk_col) {
956
12.8M
      MV_REF *mv_ref = &mv_ref_base[blk_row * mvs_cols + blk_col];
957
12.8M
      MV fwd_mv = mv_ref->mv.as_mv;
958
959
12.8M
      if (mv_ref->ref_frame > INTRA_FRAME) {
960
9.17M
        int_mv this_mv;
961
9.17M
        int mi_r, mi_c;
962
9.17M
        const int ref_frame_offset = ref_offset[mv_ref->ref_frame];
963
964
9.17M
        int pos_valid =
965
9.17M
            abs(ref_frame_offset) <= MAX_FRAME_DISTANCE &&
966
7.75M
            ref_frame_offset > 0 &&
967
7.75M
            abs(start_to_current_frame_offset) <= MAX_FRAME_DISTANCE;
968
969
9.17M
        if (pos_valid) {
970
7.75M
          av1_get_mv_projection(&this_mv.as_mv, fwd_mv,
971
7.75M
                                start_to_current_frame_offset,
972
7.75M
                                ref_frame_offset);
973
7.75M
          pos_valid = get_block_position(cm, &mi_r, &mi_c, blk_row, blk_col,
974
7.75M
                                         this_mv.as_mv, dir >> 1);
975
7.75M
        }
976
977
9.17M
        if (pos_valid) {
978
7.32M
          const int mi_offset = mi_r * (cm->mi_params.mi_stride >> 1) + mi_c;
979
980
7.32M
          tpl_mvs_base[mi_offset].mfmv0.as_mv.row = fwd_mv.row;
981
7.32M
          tpl_mvs_base[mi_offset].mfmv0.as_mv.col = fwd_mv.col;
982
7.32M
          tpl_mvs_base[mi_offset].ref_frame_offset = ref_frame_offset;
983
7.32M
        }
984
9.17M
      }
985
12.8M
    }
986
196k
  }
987
988
7.40k
  return 1;
989
7.42k
}
990
991
// cm->ref_frame_side is calculated here, and will be used in
992
// av1_copy_frame_mvs() to affect how mvs are copied.
993
69.3k
void av1_calculate_ref_frame_side(AV1_COMMON *cm) {
994
69.3k
  const OrderHintInfo *const order_hint_info = &cm->seq_params->order_hint_info;
995
996
69.3k
  memset(cm->ref_frame_side, 0, sizeof(cm->ref_frame_side));
997
69.3k
  if (!order_hint_info->enable_order_hint) return;
998
999
48.0k
  const int cur_order_hint = cm->cur_frame->order_hint;
1000
1001
384k
  for (int ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ref_frame++) {
1002
336k
    const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame);
1003
336k
    int order_hint = 0;
1004
1005
336k
    if (buf != NULL) order_hint = buf->order_hint;
1006
1007
336k
    if (get_relative_dist(order_hint_info, order_hint, cur_order_hint) > 0)
1008
98.3k
      cm->ref_frame_side[ref_frame] = 1;
1009
238k
    else if (order_hint == cur_order_hint)
1010
66.8k
      cm->ref_frame_side[ref_frame] = -1;
1011
336k
  }
1012
48.0k
}
1013
1014
6.62k
// Resets cm->tpl_mvs and fills it by calling motion_field_projection() on up
// to MFMV_STACK_SIZE reference frames. Does nothing when order hints are
// disabled.
//
// Order of attempts (ref_stamp counts the remaining budget):
//  1. LAST_FRAME with dir 2, if it has a buffer. The projection is skipped
//     when LAST's recorded ALTREF order hint equals GOLDEN's order hint, but
//     the budget is consumed either way.
//  2. BWDREF_FRAME, then ALTREF2_FRAME, each with dir 0, when its order hint
//     is ahead of the current frame; budget is consumed only on success.
//  3. ALTREF_FRAME with dir 0, same rule, but only while budget remains.
//  4. LAST2_FRAME with dir 2, if budget still remains.
void av1_setup_motion_field(AV1_COMMON *cm) {
  const OrderHintInfo *const hint_info = &cm->seq_params->order_hint_info;
  if (!hint_info->enable_order_hint) return;

  // Mark every projected-MV slot as empty.
  TPL_MV_REF *const tpl_mvs = cm->tpl_mvs;
  const int tpl_count = ((cm->mi_params.mi_rows + MAX_MIB_SIZE) >> 1) *
                        (cm->mi_params.mi_stride >> 1);
  for (int k = 0; k < tpl_count; ++k) {
    tpl_mvs[k].mfmv0.as_int = INVALID_MV;
    tpl_mvs[k].ref_frame_offset = 0;
  }

  const int cur_hint = cm->cur_frame->order_hint;
  const RefCntBuffer *ref_buf[INTER_REFS_PER_FRAME];
  int ref_hint[INTER_REFS_PER_FRAME];

  // Gather each reference's buffer and order hint (0 when there is no buffer).
  for (int slot = 0; slot <= ALTREF_FRAME - LAST_FRAME; ++slot) {
    const RefCntBuffer *const buf = get_ref_frame_buf(cm, LAST_FRAME + slot);
    ref_buf[slot] = buf;
    ref_hint[slot] = (buf != NULL) ? (int)buf->order_hint : 0;
  }

  int ref_stamp = MFMV_STACK_SIZE - 1;

  const RefCntBuffer *const last_buf = ref_buf[LAST_FRAME - LAST_FRAME];
  if (last_buf != NULL) {
    const int alt_of_last_hint =
        last_buf->ref_order_hints[ALTREF_FRAME - LAST_FRAME];
    if (alt_of_last_hint != ref_hint[GOLDEN_FRAME - LAST_FRAME]) {
      motion_field_projection(cm, LAST_FRAME, 2);
    }
    --ref_stamp;
  }

  const MV_REFERENCE_FRAME unguarded_refs[2] = { BWDREF_FRAME, ALTREF2_FRAME };
  for (int k = 0; k < 2; ++k) {
    const MV_REFERENCE_FRAME ref = unguarded_refs[k];
    if (get_relative_dist(hint_info, ref_hint[ref - LAST_FRAME], cur_hint) <=
        0) {
      continue;
    }
    if (motion_field_projection(cm, ref, 0)) --ref_stamp;
  }

  if (ref_stamp >= 0 &&
      get_relative_dist(hint_info, ref_hint[ALTREF_FRAME - LAST_FRAME],
                        cur_hint) > 0) {
    if (motion_field_projection(cm, ALTREF_FRAME, 0)) --ref_stamp;
  }

  if (ref_stamp >= 0) motion_field_projection(cm, LAST2_FRAME, 2);
}
1075
1076
static inline void record_samples(const MB_MODE_INFO *mbmi, int *pts,
1077
                                  int *pts_inref, int row_offset, int sign_r,
1078
3.35M
                                  int col_offset, int sign_c) {
1079
3.35M
  const int bw = block_size_wide[mbmi->bsize];
1080
3.35M
  const int bh = block_size_high[mbmi->bsize];
1081
3.35M
  const int x = col_offset * MI_SIZE + sign_c * bw / 2 - 1;
1082
3.35M
  const int y = row_offset * MI_SIZE + sign_r * bh / 2 - 1;
1083
1084
3.35M
  pts[0] = GET_MV_SUBPEL(x);
1085
3.35M
  pts[1] = GET_MV_SUBPEL(y);
1086
3.35M
  pts_inref[0] = pts[0] + mbmi->mv[0].as_mv.col;
1087
3.35M
  pts_inref[1] = pts[1] + mbmi->mv[0].as_mv.row;
1088
3.35M
}
1089
1090
// Select samples according to the motion vector difference.
1091
uint8_t av1_selectSamples(MV *mv, int *pts, int *pts_inref, int len,
1092
185k
                          BLOCK_SIZE bsize) {
1093
185k
  const int bw = block_size_wide[bsize];
1094
185k
  const int bh = block_size_high[bsize];
1095
185k
  const int thresh = clamp(AOMMAX(bw, bh), 16, 112);
1096
185k
  uint8_t ret = 0;
1097
185k
  assert(len <= LEAST_SQUARES_SAMPLES_MAX);
1098
1099
  // Only keep the samples with MV differences within threshold.
1100
769k
  for (int i = 0; i < len; ++i) {
1101
584k
    const int diff = abs(pts_inref[2 * i] - pts[2 * i] - mv->col) +
1102
584k
                     abs(pts_inref[2 * i + 1] - pts[2 * i + 1] - mv->row);
1103
584k
    if (diff > thresh) continue;
1104
342k
    if (ret != i) {
1105
57.2k
      memcpy(pts + 2 * ret, pts + 2 * i, 2 * sizeof(pts[0]));
1106
57.2k
      memcpy(pts_inref + 2 * ret, pts_inref + 2 * i, 2 * sizeof(pts_inref[0]));
1107
57.2k
    }
1108
342k
    ++ret;
1109
342k
  }
1110
  // Keep at least 1 sample.
1111
185k
  return AOMMAX(ret, 1);
1112
185k
}
1113
1114
// Note: Samples returned are at 1/8-pel precision
1115
// Sample are the neighbor block center point's coordinates relative to the
1116
// left-top pixel of current block.
1117
uint8_t av1_findSamples(const AV1_COMMON *cm, MACROBLOCKD *xd, int *pts,
1118
1.56M
                        int *pts_inref) {
1119
1.56M
  const MB_MODE_INFO *const mbmi0 = xd->mi[0];
1120
1.56M
  const int ref_frame = mbmi0->ref_frame[0];
1121
1.56M
  const int up_available = xd->up_available;
1122
1.56M
  const int left_available = xd->left_available;
1123
1.56M
  uint8_t np = 0;
1124
1.56M
  int do_tl = 1;
1125
1.56M
  int do_tr = 1;
1126
1.56M
  const int mi_stride = xd->mi_stride;
1127
1.56M
  const int mi_row = xd->mi_row;
1128
1.56M
  const int mi_col = xd->mi_col;
1129
1130
  // scan the nearest above rows
1131
1.56M
  if (up_available) {
1132
1.50M
    const int mi_row_offset = -1;
1133
1.50M
    const MB_MODE_INFO *mbmi = xd->mi[mi_row_offset * mi_stride];
1134
1.50M
    uint8_t superblock_width = mi_size_wide[mbmi->bsize];
1135
1136
1.50M
    if (xd->width <= superblock_width) {
1137
      // Handle "current block width <= above block width" case.
1138
1.26M
      const int col_offset = -mi_col % superblock_width;
1139
1140
1.26M
      if (col_offset < 0) do_tl = 0;
1141
1.26M
      if (col_offset + superblock_width > xd->width) do_tr = 0;
1142
1143
1.26M
      if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) {
1144
786k
        record_samples(mbmi, pts, pts_inref, 0, -1, col_offset, 1);
1145
786k
        pts += 2;
1146
786k
        pts_inref += 2;
1147
786k
        if (++np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX;
1148
786k
      }
1149
1.26M
    } else {
1150
      // Handle "current block width > above block width" case.
1151
865k
      for (int i = 0; i < AOMMIN(xd->width, cm->mi_params.mi_cols - mi_col);
1152
624k
           i += superblock_width) {
1153
624k
        mbmi = xd->mi[i + mi_row_offset * mi_stride];
1154
624k
        superblock_width = mi_size_wide[mbmi->bsize];
1155
1156
624k
        if (mbmi->ref_frame[0] == ref_frame &&
1157
427k
            mbmi->ref_frame[1] == NONE_FRAME) {
1158
388k
          record_samples(mbmi, pts, pts_inref, 0, -1, i, 1);
1159
388k
          pts += 2;
1160
388k
          pts_inref += 2;
1161
388k
          if (++np >= LEAST_SQUARES_SAMPLES_MAX)
1162
1.20k
            return LEAST_SQUARES_SAMPLES_MAX;
1163
388k
        }
1164
624k
      }
1165
242k
    }
1166
1.50M
  }
1167
1.56M
  assert(np <= LEAST_SQUARES_SAMPLES_MAX);
1168
1169
  // scan the nearest left columns
1170
1.55M
  if (left_available) {
1171
1.52M
    const int mi_col_offset = -1;
1172
1.52M
    const MB_MODE_INFO *mbmi = xd->mi[mi_col_offset];
1173
1.52M
    uint8_t superblock_height = mi_size_high[mbmi->bsize];
1174
1175
1.52M
    if (xd->height <= superblock_height) {
1176
      // Handle "current block height <= above block height" case.
1177
1.26M
      const int row_offset = -mi_row % superblock_height;
1178
1179
1.26M
      if (row_offset < 0) do_tl = 0;
1180
1181
1.26M
      if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) {
1182
771k
        record_samples(mbmi, pts, pts_inref, row_offset, 1, 0, -1);
1183
771k
        pts += 2;
1184
771k
        pts_inref += 2;
1185
771k
        np++;
1186
771k
        if (np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX;
1187
771k
      }
1188
1.26M
    } else {
1189
      // Handle "current block height > above block height" case.
1190
939k
      for (int i = 0; i < AOMMIN(xd->height, cm->mi_params.mi_rows - mi_row);
1191
676k
           i += superblock_height) {
1192
676k
        mbmi = xd->mi[mi_col_offset + i * mi_stride];
1193
676k
        superblock_height = mi_size_high[mbmi->bsize];
1194
1195
676k
        if (mbmi->ref_frame[0] == ref_frame &&
1196
476k
            mbmi->ref_frame[1] == NONE_FRAME) {
1197
439k
          record_samples(mbmi, pts, pts_inref, i, 1, 0, -1);
1198
439k
          pts += 2;
1199
439k
          pts_inref += 2;
1200
439k
          if (++np >= LEAST_SQUARES_SAMPLES_MAX)
1201
4.02k
            return LEAST_SQUARES_SAMPLES_MAX;
1202
439k
        }
1203
676k
      }
1204
267k
    }
1205
1.52M
  }
1206
1.55M
  assert(np <= LEAST_SQUARES_SAMPLES_MAX);
1207
1208
  // Top-left block
1209
1.55M
  if (do_tl && left_available && up_available) {
1210
1.01M
    const int mi_row_offset = -1;
1211
1.01M
    const int mi_col_offset = -1;
1212
1.01M
    MB_MODE_INFO *mbmi = xd->mi[mi_col_offset + mi_row_offset * mi_stride];
1213
1214
1.01M
    if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) {
1215
609k
      record_samples(mbmi, pts, pts_inref, 0, -1, 0, -1);
1216
609k
      pts += 2;
1217
609k
      pts_inref += 2;
1218
609k
      if (++np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX;
1219
609k
    }
1220
1.01M
  }
1221
1.55M
  assert(np <= LEAST_SQUARES_SAMPLES_MAX);
1222
1223
  // Top-right block
1224
1.55M
  if (do_tr &&
1225
1.32M
      has_top_right(cm, xd, mi_row, mi_col, AOMMAX(xd->width, xd->height))) {
1226
681k
    const POSITION trb_pos = { -1, xd->width };
1227
681k
    const TileInfo *const tile = &xd->tile;
1228
681k
    if (is_inside(tile, mi_col, mi_row, &trb_pos)) {
1229
636k
      const int mi_row_offset = -1;
1230
636k
      const int mi_col_offset = xd->width;
1231
636k
      const MB_MODE_INFO *mbmi =
1232
636k
          xd->mi[mi_col_offset + mi_row_offset * mi_stride];
1233
1234
636k
      if (mbmi->ref_frame[0] == ref_frame && mbmi->ref_frame[1] == NONE_FRAME) {
1235
361k
        record_samples(mbmi, pts, pts_inref, 0, -1, xd->width, 1);
1236
361k
        if (++np >= LEAST_SQUARES_SAMPLES_MAX) return LEAST_SQUARES_SAMPLES_MAX;
1237
361k
      }
1238
636k
    }
1239
681k
  }
1240
1.55M
  assert(np <= LEAST_SQUARES_SAMPLES_MAX);
1241
1242
1.54M
  return np;
1243
1.54M
}
1244
1245
72.6k
// Decides whether skip mode may be used for the current frame and, if so,
// which two references it uses. Results go to
// cm->current_frame.skip_mode_info.
//
// Skip mode stays disallowed (indices INVALID_IDX) when order hints are
// disabled, the frame is intra-only, or reference_mode is SINGLE_REFERENCE.
// Otherwise the nearest forward reference (order hint behind the current
// frame) and nearest backward reference (order hint ahead of it) are located:
//  - both found: skip mode is allowed with that pair;
//  - only a forward one found: the second-nearest forward reference is looked
//    up, and skip mode is allowed if one exists;
//  - otherwise skip mode stays disallowed.
// ref_frame_idx_0 always receives the smaller index of the pair.
void av1_setup_skip_mode_allowed(AV1_COMMON *cm) {
  const OrderHintInfo *const hint_info = &cm->seq_params->order_hint_info;
  SkipModeInfo *const skip_info = &cm->current_frame.skip_mode_info;

  skip_info->skip_mode_allowed = 0;
  skip_info->ref_frame_idx_0 = INVALID_IDX;
  skip_info->ref_frame_idx_1 = INVALID_IDX;

  if (!hint_info->enable_order_hint) return;
  if (frame_is_intra_only(cm)) return;
  if (cm->current_frame.reference_mode == SINGLE_REFERENCE) return;

  const int cur_hint = cm->current_frame.order_hint;
  int fwd_hint = -1;       // -1 means "no forward reference chosen yet"
  int bwd_hint = INT_MAX;  // INT_MAX means "no backward reference chosen yet"
  int fwd_idx = INVALID_IDX;
  int second_idx = INVALID_IDX;

  // Identify the nearest forward and backward references.
  for (int i = 0; i < INTER_REFS_PER_FRAME; ++i) {
    const RefCntBuffer *const buf = get_ref_frame_buf(cm, LAST_FRAME + i);
    if (buf == NULL) continue;

    const int ref_hint = buf->order_hint;
    const int dist_to_cur = get_relative_dist(hint_info, ref_hint, cur_hint);

    if (dist_to_cur < 0) {
      // Forward reference: keep it if it is closer than the current pick.
      if (fwd_hint == -1 ||
          get_relative_dist(hint_info, ref_hint, fwd_hint) > 0) {
        fwd_hint = ref_hint;
        fwd_idx = i;
      }
    } else if (dist_to_cur > 0) {
      // Backward reference: keep it if it is closer than the current pick.
      if (bwd_hint == INT_MAX ||
          get_relative_dist(hint_info, ref_hint, bwd_hint) < 0) {
        bwd_hint = ref_hint;
        second_idx = i;
      }
    }
  }

  // Without a forward reference neither configuration applies.
  if (fwd_idx == INVALID_IDX) return;

  if (second_idx == INVALID_IDX) {
    // == Forward prediction only ==
    // Identify the second nearest forward reference.
    int second_hint = -1;
    for (int i = 0; i < INTER_REFS_PER_FRAME; ++i) {
      const RefCntBuffer *const buf = get_ref_frame_buf(cm, LAST_FRAME + i);
      if (buf == NULL) continue;

      const int ref_hint = buf->order_hint;
      const int behind_nearest =
          fwd_hint != -1 &&
          get_relative_dist(hint_info, ref_hint, fwd_hint) < 0;
      if (!behind_nearest) continue;

      if (second_hint == -1 ||
          get_relative_dist(hint_info, ref_hint, second_hint) > 0) {
        second_hint = ref_hint;
        second_idx = i;
      }
    }
    if (second_hint == -1) return;
  }
  // else: == Bi-directional prediction ==

  skip_info->skip_mode_allowed = 1;
  skip_info->ref_frame_idx_0 = AOMMIN(fwd_idx, second_idx);
  skip_info->ref_frame_idx_1 = AOMMAX(fwd_idx, second_idx);
}
1320
1321
typedef struct {
1322
  int map_idx;        // frame map index
1323
  RefCntBuffer *buf;  // frame buffer
1324
  int sort_idx;       // index based on the offset to be used for sorting
1325
} REF_FRAME_INFO;
1326
1327
// Compares the sort_idx fields. If they are equal, then compares the map_idx
1328
// fields to break the tie. This ensures a stable sort.
1329
163k
static int compare_ref_frame_info(const void *arg_a, const void *arg_b) {
1330
163k
  const REF_FRAME_INFO *info_a = (REF_FRAME_INFO *)arg_a;
1331
163k
  const REF_FRAME_INFO *info_b = (REF_FRAME_INFO *)arg_b;
1332
1333
163k
  const int sort_idx_diff = info_a->sort_idx - info_b->sort_idx;
1334
163k
  if (sort_idx_diff != 0) return sort_idx_diff;
1335
55.7k
  return info_a->map_idx - info_b->map_idx;
1336
163k
}
1337
1338
static inline void set_ref_frame_info(int *remapped_ref_idx, int frame_idx,
1339
74.7k
                                      REF_FRAME_INFO *ref_info) {
1340
74.7k
  assert(frame_idx >= 0 && frame_idx < INTER_REFS_PER_FRAME);
1341
1342
74.7k
  remapped_ref_idx[frame_idx] = ref_info->map_idx;
1343
74.7k
}
1344
1345
// Derives the complete set of inter reference assignments from the two
// explicitly supplied ones (LAST_FRAME and GOLDEN_FRAME).
//
// cm               - codec state; reads cm->ref_frame_map[], the current
//                    frame's order hint and the sequence order-hint settings.
// remapped_ref_idx - output array indexed by (<ref> - LAST_FRAME). When the
//                    function runs to completion, each of the
//                    INTER_REFS_PER_FRAME entries holds a frame-map index.
// lst_map_idx      - frame-map index to use for LAST_FRAME.
// gld_map_idx      - frame-map index to use for GOLDEN_FRAME.
//
// Reports AOM_CODEC_CORRUPT_FRAME through aom_internal_error() when either
// supplied reference is missing or does not precede the current frame
// according to the order hints.
void av1_set_frame_refs(AV1_COMMON *const cm, int *remapped_ref_idx,
                        int lst_map_idx, int gld_map_idx) {
  assert(cm->seq_params->order_hint_info.enable_order_hint);
  assert(cm->seq_params->order_hint_info.order_hint_bits_minus_1 >= 0);

  const int cur_hint = (int)cm->current_frame.order_hint;
  // Sort key of the current frame. A reference's key is this value plus its
  // relative distance to the current frame, so keys below it belong to
  // forward references and keys at or above it to backward references.
  const int cur_sort_key =
      1 << cm->seq_params->order_hint_info.order_hint_bits_minus_1;

  REF_FRAME_INFO slots[REF_FRAMES];
  int assigned[INTER_REFS_PER_FRAME] = { 0 };
  int last_sort_key = -1;
  int golden_sort_key = -1;

  // Collect every frame-map entry together with its sort key.
  for (int map_idx = 0; map_idx < REF_FRAMES; ++map_idx) {
    REF_FRAME_INFO *const slot = &slots[map_idx];
    RefCntBuffer *const buf = cm->ref_frame_map[map_idx];

    slot->map_idx = map_idx;
    slot->sort_idx = -1;
    slot->buf = buf;

    if (buf != NULL) {
      // If this assertion fails, there is a reference leak.
      assert(buf->ref_count > 0);

      const int hint = (int)buf->order_hint;
      if (hint != -1) {
        slot->sort_idx =
            cur_sort_key + get_relative_dist(&cm->seq_params->order_hint_info,
                                             hint, cur_hint);
      }
      assert(slot->sort_idx >= -1);

      if (map_idx == lst_map_idx) last_sort_key = slot->sort_idx;
      if (map_idx == gld_map_idx) golden_sort_key = slot->sort_idx;
    }
  }

  // Confirm both LAST_FRAME and GOLDEN_FRAME are valid forward reference
  // frames.
  // NOTE(review): the code below relies on these checks having passed, so
  // aom_internal_error() presumably does not return here - confirm.
  if (last_sort_key == -1 || last_sort_key >= cur_sort_key) {
    aom_internal_error(cm->error, AOM_CODEC_CORRUPT_FRAME,
                       "Inter frame requests a look-ahead frame as LAST");
  }
  if (golden_sort_key == -1 || golden_sort_key >= cur_sort_key) {
    aom_internal_error(cm->error, AOM_CODEC_CORRUPT_FRAME,
                       "Inter frame requests a look-ahead frame as GOLDEN");
  }

  // Sort ref frames by sort key (ties broken by frame-map index).
  qsort(slots, REF_FRAMES, sizeof(REF_FRAME_INFO), compare_ref_frame_info);

  // Split the sorted array into three runs: entries without a key (-1),
  // forward references [fwd_lo, fwd_hi] and backward references
  // [bwd_lo, bwd_hi].
  //   Forward  reference: sort key <  cur_sort_key
  //   Backward reference: sort key >= cur_sort_key
  int fwd_lo = 0;
  int fwd_hi = REF_FRAMES - 1;
  for (int pos = 0; pos < REF_FRAMES; ++pos) {
    const int key = slots[pos].sort_idx;
    if (key == -1) {
      ++fwd_lo;
    } else if (key >= cur_sort_key) {
      fwd_hi = pos - 1;
      break;
    }
  }

  int bwd_lo = fwd_hi + 1;
  int bwd_hi = REF_FRAMES - 1;

  // === Backward Reference Frames ===

  // == ALTREF_FRAME == takes the backward reference with the largest key.
  if (bwd_lo <= bwd_hi) {
    const int dst = ALTREF_FRAME - LAST_FRAME;
    set_ref_frame_info(remapped_ref_idx, dst, &slots[bwd_hi]);
    assigned[dst] = 1;
    --bwd_hi;
  }

  // == BWDREF_FRAME == takes the backward reference with the smallest key.
  if (bwd_lo <= bwd_hi) {
    const int dst = BWDREF_FRAME - LAST_FRAME;
    set_ref_frame_info(remapped_ref_idx, dst, &slots[bwd_lo]);
    assigned[dst] = 1;
    ++bwd_lo;
  }

  // == ALTREF2_FRAME == takes the next smallest backward reference.
  if (bwd_lo <= bwd_hi) {
    const int dst = ALTREF2_FRAME - LAST_FRAME;
    set_ref_frame_info(remapped_ref_idx, dst, &slots[bwd_lo]);
    assigned[dst] = 1;
  }

  // === Forward Reference Frames ===

  // Locate the supplied LAST_FRAME / GOLDEN_FRAME entries among the forward
  // references. Both tests run for every entry, since the two map indices
  // may be the same.
  for (int pos = fwd_lo; pos <= fwd_hi; ++pos) {
    const int map_idx = slots[pos].map_idx;

    // == LAST_FRAME ==
    if (map_idx == lst_map_idx) {
      set_ref_frame_info(remapped_ref_idx, LAST_FRAME - LAST_FRAME,
                         &slots[pos]);
      assigned[LAST_FRAME - LAST_FRAME] = 1;
    }

    // == GOLDEN_FRAME ==
    if (map_idx == gld_map_idx) {
      set_ref_frame_info(remapped_ref_idx, GOLDEN_FRAME - LAST_FRAME,
                         &slots[pos]);
      assigned[GOLDEN_FRAME - LAST_FRAME] = 1;
    }
  }

  assert(assigned[LAST_FRAME - LAST_FRAME] == 1 &&
         assigned[GOLDEN_FRAME - LAST_FRAME] == 1);

  // Remaining references, in the order in which they are filled:
  // == LAST2_FRAME ==
  // == LAST3_FRAME ==
  // == BWDREF_FRAME ==
  // == ALTREF2_FRAME ==
  // == ALTREF_FRAME ==
  static const MV_REFERENCE_FRAME ref_frame_list[INTER_REFS_PER_FRAME - 2] = {
    LAST2_FRAME, LAST3_FRAME, BWDREF_FRAME, ALTREF2_FRAME, ALTREF_FRAME
  };

  // Set up the reference frames in the anti-chronological order: each still
  // unassigned reference takes the latest remaining forward reference that
  // is neither LAST nor GOLDEN.
  int ref_idx;
  for (ref_idx = 0; ref_idx < (INTER_REFS_PER_FRAME - 2); ref_idx++) {
    const int dst = ref_frame_list[ref_idx] - LAST_FRAME;
    if (assigned[dst]) continue;

    while (fwd_lo <= fwd_hi && (slots[fwd_hi].map_idx == lst_map_idx ||
                                slots[fwd_hi].map_idx == gld_map_idx)) {
      --fwd_hi;
    }
    // Forward references exhausted; the loop below handles the rest.
    if (fwd_lo > fwd_hi) break;

    set_ref_frame_info(remapped_ref_idx, dst, &slots[fwd_hi]);
    assigned[dst] = 1;

    --fwd_hi;
  }

  // Assign all the remaining frame(s), if any, to the earliest reference
  // frame.
  for (; ref_idx < (INTER_REFS_PER_FRAME - 2); ref_idx++) {
    const int dst = ref_frame_list[ref_idx] - LAST_FRAME;
    if (assigned[dst]) continue;

    set_ref_frame_info(remapped_ref_idx, dst, &slots[fwd_lo]);
    assigned[dst] = 1;
  }

  // Every inter reference must have been given a buffer by now.
  for (int i = 0; i < INTER_REFS_PER_FRAME; i++) {
    assert(assigned[i] == 1);
  }
}