Coverage Report

Created: 2026-04-01 07:24

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/aom/av1/encoder/intra_mode_search.c
Line
Count
Source
1
/*
2
 * Copyright (c) 2020, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#include <stdbool.h>
13
14
#include "av1/common/av1_common_int.h"
15
#include "av1/common/cfl.h"
16
#include "av1/common/reconintra.h"
17
18
#include "av1/encoder/intra_mode_search.h"
19
#include "av1/encoder/intra_mode_search_utils.h"
20
#include "av1/encoder/palette.h"
21
#include "av1/encoder/speed_features.h"
22
#include "av1/encoder/tx_search.h"
23
24
// Number of entries in the per-delta-angle rd cost array. Only
// 2 * MAX_ANGLE_DELTA + 1 (i.e. 7) delta angles exist; the two extra entries
// (9 in total) simplify the rd threshold check that prunes delta angles -3
// and 3.
#define SIZE_OF_ANGLE_DELTA_RD_COST_ARRAY ((2 * MAX_ANGLE_DELTA + 1) + 2)
27
28
// The order for evaluating delta angles while processing the luma directional
29
// intra modes. Currently, this order of evaluation is applicable only when
30
// speed feature prune_luma_odd_delta_angles_in_intra is enabled. In this case,
31
// even angles are evaluated first in order to facilitate the pruning of odd
32
// delta angles based on the rd costs of the neighboring delta angles.
33
static const int8_t luma_delta_angles_order[2 * MAX_ANGLE_DELTA] = {
34
  -2, 2, -3, -1, 1, 3,
35
};
36
37
/*!\cond */
38
static const PREDICTION_MODE intra_rd_search_mode_order[INTRA_MODES] = {
39
  DC_PRED,       H_PRED,        V_PRED,    SMOOTH_PRED, PAETH_PRED,
40
  SMOOTH_V_PRED, SMOOTH_H_PRED, D135_PRED, D203_PRED,   D157_PRED,
41
  D67_PRED,      D113_PRED,     D45_PRED,
42
};
43
44
static const UV_PREDICTION_MODE uv_rd_search_mode_order[UV_INTRA_MODES] = {
45
  UV_DC_PRED,     UV_CFL_PRED,   UV_H_PRED,        UV_V_PRED,
46
  UV_SMOOTH_PRED, UV_PAETH_PRED, UV_SMOOTH_V_PRED, UV_SMOOTH_H_PRED,
47
  UV_D135_PRED,   UV_D203_PRED,  UV_D157_PRED,     UV_D67_PRED,
48
  UV_D113_PRED,   UV_D45_PRED,
49
};
50
51
// The bitmask corresponds to the filter intra modes as defined in enums.h
52
// FILTER_INTRA_MODE enumeration type. Setting a bit to 0 in the mask means to
53
// disable the evaluation of corresponding filter intra mode. The table
54
// av1_derived_filter_intra_mode_used_flag is used when speed feature
55
// prune_filter_intra_level is 1. The evaluated filter intra modes are union
56
// of the following:
57
// 1) FILTER_DC_PRED
58
// 2) mode that corresponds to best mode so far of DC_PRED, V_PRED, H_PRED,
59
// D157_PRED and PAETH_PRED. (Eg: FILTER_V_PRED if best mode so far is V_PRED).
60
static const uint8_t av1_derived_filter_intra_mode_used_flag[INTRA_MODES] = {
61
  0x01,  // DC_PRED:           0000 0001
62
  0x03,  // V_PRED:            0000 0011
63
  0x05,  // H_PRED:            0000 0101
64
  0x01,  // D45_PRED:          0000 0001
65
  0x01,  // D135_PRED:         0000 0001
66
  0x01,  // D113_PRED:         0000 0001
67
  0x09,  // D157_PRED:         0000 1001
68
  0x01,  // D203_PRED:         0000 0001
69
  0x01,  // D67_PRED:          0000 0001
70
  0x01,  // SMOOTH_PRED:       0000 0001
71
  0x01,  // SMOOTH_V_PRED:     0000 0001
72
  0x01,  // SMOOTH_H_PRED:     0000 0001
73
  0x11   // PAETH_PRED:        0001 0001
74
};
75
76
// The bitmask corresponds to the chroma intra modes as defined in enums.h
77
// UV_PREDICTION_MODE enumeration type. Setting a bit to 0 in the mask means to
78
// disable the evaluation of corresponding chroma intra mode. The table
79
// av1_derived_chroma_intra_mode_used_flag is used when speed feature
80
// prune_chroma_modes_using_luma_winner is enabled. The evaluated chroma
81
// intra modes are union of the following:
82
// 1) UV_DC_PRED
83
// 2) UV_SMOOTH_PRED
84
// 3) UV_CFL_PRED
85
// 4) mode that corresponds to luma intra mode winner (Eg : UV_V_PRED if luma
86
// intra mode winner is V_PRED).
87
static const uint16_t av1_derived_chroma_intra_mode_used_flag[INTRA_MODES] = {
88
  0x2201,  // DC_PRED:           0010 0010 0000 0001
89
  0x2203,  // V_PRED:            0010 0010 0000 0011
90
  0x2205,  // H_PRED:            0010 0010 0000 0101
91
  0x2209,  // D45_PRED:          0010 0010 0000 1001
92
  0x2211,  // D135_PRED:         0010 0010 0001 0001
93
  0x2221,  // D113_PRED:         0010 0010 0010 0001
94
  0x2241,  // D157_PRED:         0010 0010 0100 0001
95
  0x2281,  // D203_PRED:         0010 0010 1000 0001
96
  0x2301,  // D67_PRED:          0010 0011 0000 0001
97
  0x2201,  // SMOOTH_PRED:       0010 0010 0000 0001
98
  0x2601,  // SMOOTH_V_PRED:     0010 0110 0000 0001
99
  0x2a01,  // SMOOTH_H_PRED:     0010 1010 0000 0001
100
  0x3201   // PAETH_PRED:        0011 0010 0000 0001
101
};
102
103
DECLARE_ALIGNED(16, static const uint8_t, all_zeros[MAX_SB_SIZE]) = { 0 };
104
DECLARE_ALIGNED(16, static const uint16_t,
105
                highbd_all_zeros[MAX_SB_SIZE]) = { 0 };
106
107
int av1_calc_normalized_variance(aom_variance_fn_t vf, const uint8_t *const buf,
108
0
                                 const int stride, const int is_hbd) {
109
0
  unsigned int sse;
110
111
0
  if (is_hbd)
112
0
    return vf(buf, stride, CONVERT_TO_BYTEPTR(highbd_all_zeros), 0, &sse);
113
0
  else
114
0
    return vf(buf, stride, all_zeros, 0, &sse);
115
0
}
116
117
// Computes average of log(1 + variance) across 4x4 sub-blocks for source and
118
// reconstructed blocks.
119
static void compute_avg_log_variance(const AV1_COMP *const cpi, MACROBLOCK *x,
120
                                     const BLOCK_SIZE bs,
121
                                     double *avg_log_src_variance,
122
0
                                     double *avg_log_recon_variance) {
123
0
  const MACROBLOCKD *const xd = &x->e_mbd;
124
0
  const BLOCK_SIZE sb_size = cpi->common.seq_params->sb_size;
125
0
  const int mi_row_in_sb = x->e_mbd.mi_row & (mi_size_high[sb_size] - 1);
126
0
  const int mi_col_in_sb = x->e_mbd.mi_col & (mi_size_wide[sb_size] - 1);
127
0
  const int right_overflow =
128
0
      (xd->mb_to_right_edge < 0) ? ((-xd->mb_to_right_edge) >> 3) : 0;
129
0
  const int bottom_overflow =
130
0
      (xd->mb_to_bottom_edge < 0) ? ((-xd->mb_to_bottom_edge) >> 3) : 0;
131
0
  const int bw = (MI_SIZE * mi_size_wide[bs] - right_overflow);
132
0
  const int bh = (MI_SIZE * mi_size_high[bs] - bottom_overflow);
133
0
  const int is_hbd = is_cur_buf_hbd(xd);
134
135
0
  aom_variance_fn_t vf = cpi->ppi->fn_ptr[BLOCK_4X4].vf;
136
0
  for (int i = 0; i < bh; i += MI_SIZE) {
137
0
    const int r = mi_row_in_sb + (i >> MI_SIZE_LOG2);
138
0
    for (int j = 0; j < bw; j += MI_SIZE) {
139
0
      const int c = mi_col_in_sb + (j >> MI_SIZE_LOG2);
140
0
      const int mi_offset = r * mi_size_wide[sb_size] + c;
141
0
      Block4x4VarInfo *block_4x4_var_info =
142
0
          &x->src_var_info_of_4x4_sub_blocks[mi_offset];
143
0
      int src_var = block_4x4_var_info->var;
144
0
      double log_src_var = block_4x4_var_info->log_var;
145
      // Compute average of log(1 + variance) for the source block from 4x4
146
      // sub-block variance values. Calculate and store 4x4 sub-block variance
147
      // and log(1 + variance), if the values present in
148
      // src_var_of_4x4_sub_blocks are invalid. Reuse the same if it is readily
149
      // available with valid values.
150
0
      if (src_var < 0) {
151
0
        src_var = av1_calc_normalized_variance(
152
0
            vf, x->plane[0].src.buf + i * x->plane[0].src.stride + j,
153
0
            x->plane[0].src.stride, is_hbd);
154
0
        block_4x4_var_info->var = src_var;
155
0
        log_src_var = log1p(src_var / 16.0);
156
0
        block_4x4_var_info->log_var = log_src_var;
157
0
      } else {
158
        // When source variance is already calculated and available for
159
        // retrieval, check if log(1 + variance) is also available. If it is
160
        // available, then retrieve from buffer. Else, calculate the same and
161
        // store to the buffer.
162
0
        if (log_src_var < 0) {
163
0
          log_src_var = log1p(src_var / 16.0);
164
0
          block_4x4_var_info->log_var = log_src_var;
165
0
        }
166
0
      }
167
0
      *avg_log_src_variance += log_src_var;
168
169
0
      const int recon_var = av1_calc_normalized_variance(
170
0
          vf, xd->plane[0].dst.buf + i * xd->plane[0].dst.stride + j,
171
0
          xd->plane[0].dst.stride, is_hbd);
172
0
      *avg_log_recon_variance += log1p(recon_var / 16.0);
173
0
    }
174
0
  }
175
176
0
  const int blocks = (bw * bh) / 16;
177
0
  *avg_log_src_variance /= (double)blocks;
178
0
  *avg_log_recon_variance /= (double)blocks;
179
0
}
180
181
// Returns a factor to be applied to the RD value based on how well the
182
// reconstructed block variance matches the source variance.
183
static double intra_rd_variance_factor(const AV1_COMP *cpi, MACROBLOCK *x,
184
0
                                       BLOCK_SIZE bs) {
185
0
  double threshold = INTRA_RD_VAR_THRESH(cpi->oxcf.speed);
186
  // For non-positive threshold values, the comparison of source and
187
  // reconstructed variances with threshold evaluates to false
188
  // (src_var < threshold/rec_var < threshold) as these metrics are greater than
189
  // than 0. Hence further calculations are skipped.
190
0
  if (threshold <= 0) return 1.0;
191
192
0
  double variance_rd_factor = 1.0;
193
0
  double avg_log_src_variance = 0.0;
194
0
  double avg_log_recon_variance = 0.0;
195
0
  double var_diff = 0.0;
196
197
0
  compute_avg_log_variance(cpi, x, bs, &avg_log_src_variance,
198
0
                           &avg_log_recon_variance);
199
200
  // Dont allow 0 to prevent / 0 below.
201
0
  avg_log_src_variance += 0.000001;
202
0
  avg_log_recon_variance += 0.000001;
203
204
0
  if (avg_log_src_variance >= avg_log_recon_variance) {
205
0
    var_diff = (avg_log_src_variance - avg_log_recon_variance);
206
0
    if ((var_diff > 0.5) && (avg_log_recon_variance < threshold)) {
207
0
      variance_rd_factor = 1.0 + ((var_diff * 2) / avg_log_src_variance);
208
0
    }
209
0
  } else {
210
0
    var_diff = (avg_log_recon_variance - avg_log_src_variance);
211
0
    if ((var_diff > 0.5) && (avg_log_src_variance < threshold)) {
212
0
      variance_rd_factor = 1.0 + (var_diff / (2 * avg_log_src_variance));
213
0
    }
214
0
  }
215
216
  // Limit adjustment;
217
0
  variance_rd_factor = AOMMIN(3.0, variance_rd_factor);
218
219
0
  return variance_rd_factor;
220
0
}
221
/*!\endcond */
222
223
/*!\brief Search for the best filter_intra mode when coding intra frame.
224
 *
225
 * \ingroup intra_mode_search
226
 * \callergraph
227
 * This function loops through all filter_intra modes to find the best one.
228
 *
229
 * \return Returns 1 if a new filter_intra mode is selected; 0 otherwise.
230
 */
231
static int rd_pick_filter_intra_sby(const AV1_COMP *const cpi, MACROBLOCK *x,
232
                                    int *rate, int *rate_tokenonly,
233
                                    int64_t *distortion, uint8_t *skippable,
234
                                    BLOCK_SIZE bsize, int mode_cost,
235
                                    PREDICTION_MODE best_mode_so_far,
236
                                    int64_t *best_rd, int64_t *best_model_rd,
237
0
                                    PICK_MODE_CONTEXT *ctx) {
238
  // Skip the evaluation of filter intra modes.
239
0
  if (cpi->sf.intra_sf.prune_filter_intra_level == 2) return 0;
240
241
0
  MACROBLOCKD *const xd = &x->e_mbd;
242
0
  MB_MODE_INFO *mbmi = xd->mi[0];
243
0
  int filter_intra_selected_flag = 0;
244
0
  FILTER_INTRA_MODE mode;
245
0
  TX_SIZE best_tx_size = TX_8X8;
246
0
  FILTER_INTRA_MODE_INFO filter_intra_mode_info;
247
0
  uint8_t best_tx_type_map[MAX_MIB_SIZE * MAX_MIB_SIZE];
248
0
  av1_zero(filter_intra_mode_info);
249
0
  mbmi->filter_intra_mode_info.use_filter_intra = 1;
250
0
  mbmi->mode = DC_PRED;
251
0
  mbmi->palette_mode_info.palette_size[0] = 0;
252
253
  // Skip the evaluation of filter-intra if cached MB_MODE_INFO does not have
254
  // filter-intra as winner.
255
0
  if (x->use_mb_mode_cache &&
256
0
      !x->mb_mode_cache->filter_intra_mode_info.use_filter_intra)
257
0
    return 0;
258
259
0
  for (mode = 0; mode < FILTER_INTRA_MODES; ++mode) {
260
0
    int64_t this_rd;
261
0
    RD_STATS tokenonly_rd_stats;
262
0
    mbmi->filter_intra_mode_info.filter_intra_mode = mode;
263
264
0
    if ((cpi->sf.intra_sf.prune_filter_intra_level == 1) &&
265
0
        !(av1_derived_filter_intra_mode_used_flag[best_mode_so_far] &
266
0
          (1 << mode)))
267
0
      continue;
268
269
    // Skip the evaluation of modes that do not match with the winner mode in
270
    // x->mb_mode_cache.
271
0
    if (x->use_mb_mode_cache &&
272
0
        mode != x->mb_mode_cache->filter_intra_mode_info.filter_intra_mode)
273
0
      continue;
274
275
0
    if (model_intra_yrd_and_prune(cpi, x, bsize, best_model_rd)) {
276
0
      continue;
277
0
    }
278
0
    av1_pick_uniform_tx_size_type_yrd(cpi, x, &tokenonly_rd_stats, bsize,
279
0
                                      *best_rd);
280
0
    if (tokenonly_rd_stats.rate == INT_MAX) continue;
281
0
    const int this_rate =
282
0
        tokenonly_rd_stats.rate +
283
0
        intra_mode_info_cost_y(cpi, x, mbmi, bsize, mode_cost, 0);
284
0
    this_rd = RDCOST(x->rdmult, this_rate, tokenonly_rd_stats.dist);
285
286
    // Visual quality adjustment based on recon vs source variance.
287
0
    if ((cpi->oxcf.mode == ALLINTRA) && (this_rd != INT64_MAX)) {
288
0
      this_rd = (int64_t)(this_rd * intra_rd_variance_factor(cpi, x, bsize));
289
0
    }
290
291
    // Collect mode stats for multiwinner mode processing
292
0
    const int txfm_search_done = 1;
293
0
    store_winner_mode_stats(
294
0
        &cpi->common, x, mbmi, NULL, NULL, NULL, 0, NULL, bsize, this_rd,
295
0
        cpi->sf.winner_mode_sf.multi_winner_mode_type, txfm_search_done);
296
0
    if (this_rd < *best_rd) {
297
0
      *best_rd = this_rd;
298
0
      best_tx_size = mbmi->tx_size;
299
0
      filter_intra_mode_info = mbmi->filter_intra_mode_info;
300
0
      av1_copy_array(best_tx_type_map, xd->tx_type_map, ctx->num_4x4_blk);
301
0
      memcpy(ctx->blk_skip, x->txfm_search_info.blk_skip,
302
0
             sizeof(x->txfm_search_info.blk_skip[0]) * ctx->num_4x4_blk);
303
0
      *rate = this_rate;
304
0
      *rate_tokenonly = tokenonly_rd_stats.rate;
305
0
      *distortion = tokenonly_rd_stats.dist;
306
0
      *skippable = tokenonly_rd_stats.skip_txfm;
307
0
      filter_intra_selected_flag = 1;
308
0
    }
309
0
  }
310
311
0
  if (filter_intra_selected_flag) {
312
0
    mbmi->mode = DC_PRED;
313
0
    mbmi->tx_size = best_tx_size;
314
0
    mbmi->filter_intra_mode_info = filter_intra_mode_info;
315
0
    av1_copy_array(ctx->tx_type_map, best_tx_type_map, ctx->num_4x4_blk);
316
0
    return 1;
317
0
  } else {
318
0
    return 0;
319
0
  }
320
0
}
321
322
// Builds a histogram of the 8-bit pixel values in the rows x cols region of
// src (rows are stride bytes apart) and counts the distinct values.
//
// val_count must have room for 256 entries; it is cleared first and then
// holds the number of occurrences of each pixel value. *num_colors receives
// the number of pixel values that occur at least once.
void av1_count_colors(const uint8_t *src, int stride, int rows, int cols,
                      int *val_count, int *num_colors) {
  const int num_pix_vals = 1 << 8;
  memset(val_count, 0, num_pix_vals * sizeof(*val_count));

  int distinct = 0;
  for (int r = 0; r < rows; ++r) {
    const uint8_t *const row = src + r * stride;
    for (int c = 0; c < cols; ++c) {
      const int pix = row[c];
      assert(pix < num_pix_vals);
      // A bin going from 0 to 1 means a value seen for the first time.
      if (val_count[pix]++ == 0) ++distinct;
    }
  }
  *num_colors = distinct;
}
339
340
// High bit-depth variant of av1_count_colors().
//
// src8 is converted with CONVERT_TO_SHORTPTR and read as 16-bit samples.
// Two histograms are produced over the rows x cols region:
//  - bin_val_count (256 entries, always written): pixels down-converted to the
//    8-bit domain. *num_color_bins receives the number of non-empty bins.
//  - val_count (1 << bit_depth entries, optional): the actual pixel values.
//    When val_count is not NULL, *num_colors receives the number of distinct
//    values. When val_count is NULL, neither val_count nor num_colors is
//    accessed.
// bit_depth must be in the range [8, 12].
void av1_count_colors_highbd(const uint8_t *src8, int stride, int rows,
                             int cols, int bit_depth, int *val_count,
                             int *bin_val_count, int *num_color_bins,
                             int *num_colors) {
  // A bit depth below 8 would make the down-conversion shift negative.
  assert(bit_depth >= 8 && bit_depth <= 12);
  const int max_bin_val = 1 << 8;
  const int max_pix_val = 1 << bit_depth;
  const int bin_shift = bit_depth - 8;
  const uint16_t *src = CONVERT_TO_SHORTPTR(src8);

  // Size each memset from the buffer that is actually being cleared.
  memset(bin_val_count, 0, max_bin_val * sizeof(bin_val_count[0]));
  if (val_count != NULL)
    memset(val_count, 0, max_pix_val * sizeof(val_count[0]));

  for (int r = 0; r < rows; ++r) {
    for (int c = 0; c < cols; ++c) {
      /*
       * Down-convert the pixels to 8-bit domain before counting.
       * This provides consistency of behavior for palette search
       * between lbd and hbd encodes. This down-converted pixels
       * are only used for calculating the threshold (n).
       */
      const int pix = src[r * stride + c];
      const int this_val = pix >> bin_shift;
      assert(this_val < max_bin_val);
      // Release-build guard: an out-of-range sample is ignored instead of
      // indexing past the end of either histogram.
      if (this_val >= max_bin_val) continue;
      ++bin_val_count[this_val];
      if (val_count != NULL) ++val_count[pix];
    }
  }

  // Count the colors based on 8-bit domain used to gate the palette path
  int n = 0;
  for (int i = 0; i < max_bin_val; ++i) {
    if (bin_val_count[i]) ++n;
  }
  *num_color_bins = n;

  // Count the actual hbd colors used to create top_colors
  if (val_count != NULL) {
    n = 0;
    for (int i = 0; i < max_pix_val; ++i) {
      if (val_count[i]) ++n;
    }
    *num_colors = n;
  }
}
382
383
// Counts the distinct 8-bit pixel values in the rows x cols region of src
// (rows are stride bytes apart), giving up as soon as the count exceeds
// num_colors_threshold.
//
// Returns true if the whole region was scanned without exceeding the
// threshold; *num_colors then holds the exact number of distinct values.
// Returns false on early exit; *num_colors then holds the count reached when
// the scan stopped.
bool av1_count_colors_with_threshold(const uint8_t *src, int stride, int rows,
                                     int cols, int num_colors_threshold,
                                     int *num_colors) {
  bool seen[1 << 8] = { false };
  int distinct = 0;
  *num_colors = 0;

  for (int r = 0; r < rows; ++r) {
    const uint8_t *const row = src + r * stride;
    for (int c = 0; c < cols; ++c) {
      const int pix = row[c];
      if (seen[pix]) continue;

      seen[pix] = true;
      *num_colors = ++distinct;
      // We're over the threshold, so we can exit early
      if (distinct > num_colors_threshold) return false;
    }
  }
  return true;
}
404
405
// Translates a luma search index into a prediction mode and a luma delta
// angle, and stores both in mbmi.
//
// Indices below INTRA_MODE_END select intra_rd_search_mode_order[mode_idx]
// with delta angle 0. The remaining indices enumerate the non-zero delta
// angles, 2 * MAX_ANGLE_DELTA per mode, for consecutive modes starting at
// V_PRED. Within one mode the delta angles are taken from
// luma_delta_angles_order when reorder_delta_angle_eval is non-zero, and in
// ascending order (-MAX_ANGLE_DELTA..-1, 1..MAX_ANGLE_DELTA) otherwise.
void set_y_mode_and_delta_angle(const int mode_idx, MB_MODE_INFO *const mbmi,
                                int reorder_delta_angle_eval) {
  if (mode_idx < INTRA_MODE_END) {
    mbmi->mode = intra_rd_search_mode_order[mode_idx];
    mbmi->angle_delta[PLANE_TYPE_Y] = 0;
    return;
  }

  const int num_nonzero_deltas = MAX_ANGLE_DELTA * 2;
  const int directional_idx = mode_idx - INTRA_MODE_END;
  const int delta_angle_eval_idx = directional_idx % num_nonzero_deltas;
  mbmi->mode = directional_idx / num_nonzero_deltas + V_PRED;

  if (reorder_delta_angle_eval) {
    mbmi->angle_delta[PLANE_TYPE_Y] =
        luma_delta_angles_order[delta_angle_eval_idx];
  } else {
    // The first MAX_ANGLE_DELTA indices map to the negative delta angles;
    // the rest map to the positive ones, skipping over delta angle 0.
    mbmi->angle_delta[PLANE_TYPE_Y] =
        (delta_angle_eval_idx < MAX_ANGLE_DELTA)
            ? (delta_angle_eval_idx - MAX_ANGLE_DELTA)
            : (delta_angle_eval_idx - MAX_ANGLE_DELTA + 1);
  }
}
424
425
static inline int get_model_rd_index_for_pruning(
426
    const MACROBLOCK *const x,
427
0
    const INTRA_MODE_SPEED_FEATURES *const intra_sf) {
428
0
  const int top_intra_model_count_allowed =
429
0
      intra_sf->top_intra_model_count_allowed;
430
0
  if (!intra_sf->adapt_top_model_rd_count_using_neighbors)
431
0
    return top_intra_model_count_allowed - 1;
432
433
0
  const MACROBLOCKD *const xd = &x->e_mbd;
434
0
  const PREDICTION_MODE mode = xd->mi[0]->mode;
435
0
  int model_rd_index_for_pruning = top_intra_model_count_allowed - 1;
436
0
  int is_left_mode_neq_cur_mode = 0, is_above_mode_neq_cur_mode = 0;
437
0
  if (xd->left_available)
438
0
    is_left_mode_neq_cur_mode = xd->left_mbmi->mode != mode;
439
0
  if (xd->up_available)
440
0
    is_above_mode_neq_cur_mode = xd->above_mbmi->mode != mode;
441
  // The pruning of luma intra modes is made more aggressive at lower quantizers
442
  // and vice versa. The value for model_rd_index_for_pruning is derived as
443
  // follows.
444
  // qidx 0 to 127: Reduce the index of a candidate used for comparison only if
445
  // the current mode does not match either of the available neighboring modes.
446
  // qidx 128 to 255: Reduce the index of a candidate used for comparison only
447
  // if the current mode does not match both the available neighboring modes.
448
0
  if (x->qindex <= 127) {
449
0
    if (is_left_mode_neq_cur_mode || is_above_mode_neq_cur_mode)
450
0
      model_rd_index_for_pruning = AOMMAX(model_rd_index_for_pruning - 1, 0);
451
0
  } else {
452
0
    if (is_left_mode_neq_cur_mode && is_above_mode_neq_cur_mode)
453
0
      model_rd_index_for_pruning = AOMMAX(model_rd_index_for_pruning - 1, 0);
454
0
  }
455
0
  return model_rd_index_for_pruning;
456
0
}
457
458
/*! \brief prune luma intra mode based on the model rd.
 *
 * The current model rd is first inserted into the ascending list of top model
 * rds (dropping the last entry). The mode is then pruned when its model rd is
 * larger than the reference entry of that list, or larger than 1.5 times the
 * best model rd.
 *
 * \param[in]     this_model_rd              model rd for current mode.
 * \param[in,out] best_model_rd              Best model RD seen for this block
 *                                           so far. Updated when the current
 *                                           mode is kept and has a smaller
 *                                           model rd.
 * \param[in,out] top_intra_model_rd         Top intra model RD seen for this
 *                                           block so far, in ascending order.
 * \param[in]     max_model_cnt_allowed      The maximum number of top intra
 *                                           model RD allowed.
 * \param[in]     model_rd_index_for_pruning Index of the candidate used for
 *                                           pruning based on model rd.
 *
 * \return 1 if the mode should be pruned, 0 otherwise.
 */
static int prune_intra_y_mode(int64_t this_model_rd, int64_t *best_model_rd,
                              int64_t top_intra_model_rd[],
                              int max_model_cnt_allowed,
                              int model_rd_index_for_pruning) {
  const double thresh_best = 1.50;
  const double thresh_top = 1.00;

  // Locate the first entry that is larger than the current model rd.
  int slot = 0;
  while (slot < max_model_cnt_allowed &&
         this_model_rd >= top_intra_model_rd[slot]) {
    ++slot;
  }
  // Insert there, shifting the tail down by one and dropping the last entry.
  if (slot < max_model_cnt_allowed) {
    for (int k = max_model_cnt_allowed - 1; k > slot; --k) {
      top_intra_model_rd[k] = top_intra_model_rd[k - 1];
    }
    top_intra_model_rd[slot] = this_model_rd;
  }

  // Prune against the reference entry of the top list, once it is populated.
  const int64_t reference_rd = top_intra_model_rd[model_rd_index_for_pruning];
  if (reference_rd != INT64_MAX && this_model_rd > thresh_top * reference_rd) {
    return 1;
  }

  // Prune against the best model rd.
  if (this_model_rd != INT64_MAX &&
      this_model_rd > thresh_best * (*best_model_rd)) {
    return 1;
  }

  if (this_model_rd < *best_model_rd) *best_model_rd = this_model_rd;
  return 0;
}
495
496
// Run RD calculation with given chroma intra prediction angle., and return
497
// the RD cost. Update the best mode info. if the RD cost is the best so far.
498
static int64_t pick_intra_angle_routine_sbuv(
499
    const AV1_COMP *const cpi, MACROBLOCK *x, BLOCK_SIZE bsize,
500
    int rate_overhead, int64_t best_rd_in, int *rate, RD_STATS *rd_stats,
501
0
    int *best_angle_delta, int64_t *best_rd) {
502
0
  MB_MODE_INFO *mbmi = x->e_mbd.mi[0];
503
0
  assert(!is_inter_block(mbmi));
504
0
  int this_rate;
505
0
  int64_t this_rd;
506
0
  RD_STATS tokenonly_rd_stats;
507
508
0
  if (!av1_txfm_uvrd(cpi, x, &tokenonly_rd_stats, bsize, best_rd_in))
509
0
    return INT64_MAX;
510
0
  this_rate = tokenonly_rd_stats.rate +
511
0
              intra_mode_info_cost_uv(cpi, x, mbmi, bsize, rate_overhead);
512
0
  this_rd = RDCOST(x->rdmult, this_rate, tokenonly_rd_stats.dist);
513
0
  if (this_rd < *best_rd) {
514
0
    *best_rd = this_rd;
515
0
    *best_angle_delta = mbmi->angle_delta[PLANE_TYPE_UV];
516
0
    *rate = this_rate;
517
0
    rd_stats->rate = tokenonly_rd_stats.rate;
518
0
    rd_stats->dist = tokenonly_rd_stats.dist;
519
0
    rd_stats->skip_txfm = tokenonly_rd_stats.skip_txfm;
520
0
  }
521
0
  return this_rd;
522
0
}
523
524
/*!\brief Search for the best angle delta for chroma prediction
525
 *
526
 * \ingroup intra_mode_search
527
 * \callergraph
528
 * Given a chroma directional intra prediction mode, this function will try to
529
 * estimate the best delta_angle.
530
 *
531
 * \returns Return if there is a new mode with smaller rdcost than best_rd.
532
 */
533
static int rd_pick_intra_angle_sbuv(const AV1_COMP *const cpi, MACROBLOCK *x,
534
                                    BLOCK_SIZE bsize, int rate_overhead,
535
                                    int64_t best_rd, int *rate,
536
0
                                    RD_STATS *rd_stats) {
537
0
  MACROBLOCKD *const xd = &x->e_mbd;
538
0
  MB_MODE_INFO *mbmi = xd->mi[0];
539
0
  assert(!is_inter_block(mbmi));
540
0
  int i, angle_delta, best_angle_delta = 0;
541
0
  int64_t this_rd, best_rd_in, rd_cost[2 * (MAX_ANGLE_DELTA + 2)];
542
543
0
  rd_stats->rate = INT_MAX;
544
0
  rd_stats->skip_txfm = 0;
545
0
  rd_stats->dist = INT64_MAX;
546
0
  for (i = 0; i < 2 * (MAX_ANGLE_DELTA + 2); ++i) rd_cost[i] = INT64_MAX;
547
548
0
  for (angle_delta = 0; angle_delta <= MAX_ANGLE_DELTA; angle_delta += 2) {
549
0
    for (i = 0; i < 2; ++i) {
550
0
      best_rd_in = (best_rd == INT64_MAX)
551
0
                       ? INT64_MAX
552
0
                       : (best_rd + (best_rd >> ((angle_delta == 0) ? 3 : 5)));
553
0
      mbmi->angle_delta[PLANE_TYPE_UV] = (1 - 2 * i) * angle_delta;
554
0
      this_rd = pick_intra_angle_routine_sbuv(cpi, x, bsize, rate_overhead,
555
0
                                              best_rd_in, rate, rd_stats,
556
0
                                              &best_angle_delta, &best_rd);
557
0
      rd_cost[2 * angle_delta + i] = this_rd;
558
0
      if (angle_delta == 0) {
559
0
        if (this_rd == INT64_MAX) return 0;
560
0
        rd_cost[1] = this_rd;
561
0
        break;
562
0
      }
563
0
    }
564
0
  }
565
566
0
  assert(best_rd != INT64_MAX);
567
0
  for (angle_delta = 1; angle_delta <= MAX_ANGLE_DELTA; angle_delta += 2) {
568
0
    int64_t rd_thresh;
569
0
    for (i = 0; i < 2; ++i) {
570
0
      int skip_search = 0;
571
0
      rd_thresh = best_rd + (best_rd >> 5);
572
0
      if (rd_cost[2 * (angle_delta + 1) + i] > rd_thresh &&
573
0
          rd_cost[2 * (angle_delta - 1) + i] > rd_thresh)
574
0
        skip_search = 1;
575
0
      if (!skip_search) {
576
0
        mbmi->angle_delta[PLANE_TYPE_UV] = (1 - 2 * i) * angle_delta;
577
0
        pick_intra_angle_routine_sbuv(cpi, x, bsize, rate_overhead, best_rd,
578
0
                                      rate, rd_stats, &best_angle_delta,
579
0
                                      &best_rd);
580
0
      }
581
0
    }
582
0
  }
583
584
0
  mbmi->angle_delta[PLANE_TYPE_UV] = best_angle_delta;
585
0
  return rd_stats->rate != INT_MAX;
586
0
}
587
588
// Combines the CfL sign of one chroma plane with the sign of the other plane
// into a joint sign value. `a` is the sign of `plane` and `b` the sign of the
// other plane: for CFL_PRED_U the result is a * CFL_SIGNS + b - 1, otherwise
// the roles are swapped. Every argument is parenthesized so that expression
// arguments (e.g. `s + 1`) expand with the intended precedence.
#define PLANE_SIGN_TO_JOINT_SIGN(plane, a, b)          \
  ((plane) == CFL_PRED_U ? (a) * CFL_SIGNS + (b) - 1   \
                         : (b) * CFL_SIGNS + (a) - 1)
590
591
// Splits a linear CfL index into a sign and an alpha magnitude.
// CFL_INDEX_ZERO maps to (CFL_SIGN_ZERO, 0). An index k steps above it maps
// to (CFL_SIGN_POS, k - 1), and an index k steps below it maps to
// (CFL_SIGN_NEG, k - 1).
static void cfl_idx_to_sign_and_alpha(int cfl_idx, CFL_SIGN_TYPE *cfl_sign,
                                      int *cfl_alpha) {
  const int signed_offset = cfl_idx - CFL_INDEX_ZERO;
  if (signed_offset == 0) {
    *cfl_sign = CFL_SIGN_ZERO;
    *cfl_alpha = 0;
    return;
  }
  *cfl_sign = (signed_offset > 0) ? CFL_SIGN_POS : CFL_SIGN_NEG;
  *cfl_alpha = abs(signed_offset) - 1;
}
602
603
static int64_t cfl_compute_rd(const AV1_COMP *const cpi, MACROBLOCK *x,
604
                              int plane, TX_SIZE tx_size,
605
                              BLOCK_SIZE plane_bsize, int cfl_idx,
606
0
                              int fast_mode, RD_STATS *rd_stats) {
607
0
  assert(IMPLIES(fast_mode, rd_stats == NULL));
608
0
  const AV1_COMMON *const cm = &cpi->common;
609
0
  MACROBLOCKD *const xd = &x->e_mbd;
610
0
  MB_MODE_INFO *const mbmi = xd->mi[0];
611
0
  int cfl_plane = get_cfl_pred_type(plane);
612
0
  CFL_SIGN_TYPE cfl_sign;
613
0
  int cfl_alpha;
614
0
  cfl_idx_to_sign_and_alpha(cfl_idx, &cfl_sign, &cfl_alpha);
615
  // We conly build CFL for a given plane, the other plane's sign is dummy
616
0
  int dummy_sign = CFL_SIGN_NEG;
617
0
  const int8_t orig_cfl_alpha_signs = mbmi->cfl_alpha_signs;
618
0
  const uint8_t orig_cfl_alpha_idx = mbmi->cfl_alpha_idx;
619
0
  mbmi->cfl_alpha_signs =
620
0
      PLANE_SIGN_TO_JOINT_SIGN(cfl_plane, cfl_sign, dummy_sign);
621
0
  mbmi->cfl_alpha_idx = (cfl_alpha << CFL_ALPHABET_SIZE_LOG2) + cfl_alpha;
622
0
  int64_t cfl_cost;
623
0
  if (fast_mode) {
624
0
    cfl_cost =
625
0
        intra_model_rd(cm, x, plane, plane_bsize, tx_size, /*use_hadamard=*/0);
626
0
  } else {
627
0
    av1_init_rd_stats(rd_stats);
628
0
    av1_txfm_rd_in_plane(x, cpi, rd_stats, INT64_MAX, 0, plane, plane_bsize,
629
0
                         tx_size, FTXS_NONE, 0);
630
0
    av1_rd_cost_update(x->rdmult, rd_stats);
631
0
    cfl_cost = rd_stats->rdcost;
632
0
  }
633
0
  mbmi->cfl_alpha_signs = orig_cfl_alpha_signs;
634
0
  mbmi->cfl_alpha_idx = orig_cfl_alpha_idx;
635
0
  return cfl_cost;
636
0
}
637
638
static const int cfl_dir_ls[2] = { 1, -1 };
639
640
// If cfl_search_range is CFL_MAGS_SIZE, return zero. Otherwise return the index
641
// of the best alpha found using intra_model_rd().
642
static int cfl_pick_plane_parameter(const AV1_COMP *const cpi, MACROBLOCK *x,
643
                                    int plane, TX_SIZE tx_size,
644
0
                                    int cfl_search_range) {
645
0
  assert(cfl_search_range >= 1 && cfl_search_range <= CFL_MAGS_SIZE);
646
647
0
  if (cfl_search_range == CFL_MAGS_SIZE) return CFL_INDEX_ZERO;
648
649
0
  const MACROBLOCKD *const xd = &x->e_mbd;
650
0
  const MB_MODE_INFO *const mbmi = xd->mi[0];
651
0
  assert(mbmi->uv_mode == UV_CFL_PRED);
652
0
  const MACROBLOCKD_PLANE *pd = &xd->plane[plane];
653
0
  const BLOCK_SIZE plane_bsize =
654
0
      get_plane_block_size(mbmi->bsize, pd->subsampling_x, pd->subsampling_y);
655
656
0
  int est_best_cfl_idx = CFL_INDEX_ZERO;
657
0
  int fast_mode = 1;
658
0
  int start_cfl_idx = CFL_INDEX_ZERO;
659
0
  int64_t best_cfl_cost = cfl_compute_rd(cpi, x, plane, tx_size, plane_bsize,
660
0
                                         start_cfl_idx, fast_mode, NULL);
661
0
  for (int si = 0; si < 2; ++si) {
662
0
    const int dir = cfl_dir_ls[si];
663
0
    for (int i = 1; i < CFL_MAGS_SIZE; ++i) {
664
0
      int cfl_idx = start_cfl_idx + dir * i;
665
0
      if (cfl_idx < 0 || cfl_idx >= CFL_MAGS_SIZE) break;
666
0
      int64_t cfl_cost = cfl_compute_rd(cpi, x, plane, tx_size, plane_bsize,
667
0
                                        cfl_idx, fast_mode, NULL);
668
0
      if (cfl_cost < best_cfl_cost) {
669
0
        best_cfl_cost = cfl_cost;
670
0
        est_best_cfl_idx = cfl_idx;
671
0
      } else {
672
0
        break;
673
0
      }
674
0
    }
675
0
  }
676
0
  return est_best_cfl_idx;
677
0
}
678
679
// Resets both CfL outputs to 0, the value this file uses to mark the CfL
// parameters as invalid.
static inline void set_invalid_cfl_parameters(uint8_t *best_cfl_alpha_idx,
                                              int8_t *best_cfl_alpha_signs) {
  *best_cfl_alpha_signs = 0;
  *best_cfl_alpha_idx = 0;
}
684
685
static void cfl_pick_plane_rd(const AV1_COMP *const cpi, MACROBLOCK *x,
686
                              int plane, TX_SIZE tx_size, int cfl_search_range,
687
                              RD_STATS cfl_rd_arr[CFL_MAGS_SIZE],
688
0
                              int est_best_cfl_idx) {
689
0
  assert(cfl_search_range >= 1 && cfl_search_range <= CFL_MAGS_SIZE);
690
0
  const MACROBLOCKD *const xd = &x->e_mbd;
691
0
  const MB_MODE_INFO *const mbmi = xd->mi[0];
692
0
  assert(mbmi->uv_mode == UV_CFL_PRED);
693
0
  const MACROBLOCKD_PLANE *pd = &xd->plane[plane];
694
0
  const BLOCK_SIZE plane_bsize =
695
0
      get_plane_block_size(mbmi->bsize, pd->subsampling_x, pd->subsampling_y);
696
697
0
  for (int cfl_idx = 0; cfl_idx < CFL_MAGS_SIZE; ++cfl_idx) {
698
0
    av1_invalid_rd_stats(&cfl_rd_arr[cfl_idx]);
699
0
  }
700
701
0
  int fast_mode = 0;
702
0
  int start_cfl_idx = est_best_cfl_idx;
703
0
  cfl_compute_rd(cpi, x, plane, tx_size, plane_bsize, start_cfl_idx, fast_mode,
704
0
                 &cfl_rd_arr[start_cfl_idx]);
705
706
0
  if (cfl_search_range == 1) return;
707
708
0
  for (int si = 0; si < 2; ++si) {
709
0
    const int dir = cfl_dir_ls[si];
710
0
    for (int i = 1; i < cfl_search_range; ++i) {
711
0
      int cfl_idx = start_cfl_idx + dir * i;
712
0
      if (cfl_idx < 0 || cfl_idx >= CFL_MAGS_SIZE) break;
713
0
      cfl_compute_rd(cpi, x, plane, tx_size, plane_bsize, cfl_idx, fast_mode,
714
0
                     &cfl_rd_arr[cfl_idx]);
715
0
    }
716
0
  }
717
0
}
718
719
/*!\brief Pick the optimal parameters for Chroma to Luma (CFL) component
720
 *
721
 * \ingroup intra_mode_search
722
 * \callergraph
723
 *
724
 * This function will use DCT_DCT followed by computing SATD (sum of absolute
725
 * transformed differences) to estimate the RD score and find the best possible
726
 * CFL parameter.
727
 *
728
 * Then the function will apply a full RD search near the best possible CFL
729
 * parameter to find the best actual CFL parameter.
730
 *
731
 * Side effect:
732
 * We use ths buffers in x->plane[] and xd->plane[] as throw-away buffers for RD
733
 * search.
734
 *
735
 * \param[in] x                Encoder prediction block structure.
736
 * \param[in] cpi              Top-level encoder instance structure.
737
 * \param[in] tx_size          Transform size.
738
 * \param[in] ref_best_rd      Reference best RD.
739
 * \param[in] cfl_search_range The search range of full RD search near the
740
 *                             estimated best CFL parameter.
741
 *
742
 * \param[out]   best_rd_stats          RD stats of the best CFL parameter
743
 * \param[out]   best_cfl_alpha_idx     Best CFL alpha index
744
 * \param[out]   best_cfl_alpha_signs   Best CFL joint signs
745
 *
746
 */
747
static int cfl_rd_pick_alpha(MACROBLOCK *const x, const AV1_COMP *const cpi,
748
                             TX_SIZE tx_size, int64_t ref_best_rd,
749
                             int cfl_search_range, RD_STATS *best_rd_stats,
750
                             uint8_t *best_cfl_alpha_idx,
751
0
                             int8_t *best_cfl_alpha_signs) {
752
0
  assert(cfl_search_range >= 1 && cfl_search_range <= CFL_MAGS_SIZE);
753
0
  const ModeCosts *mode_costs = &x->mode_costs;
754
0
  RD_STATS cfl_rd_arr_u[CFL_MAGS_SIZE];
755
0
  RD_STATS cfl_rd_arr_v[CFL_MAGS_SIZE];
756
0
  MACROBLOCKD *const xd = &x->e_mbd;
757
0
  int est_best_cfl_idx_u, est_best_cfl_idx_v;
758
759
0
  av1_invalid_rd_stats(best_rd_stats);
760
761
  // As the dc pred data is same for different values of alpha, enable the
762
  // caching of dc pred data. Call clear_cfl_dc_pred_cache_flags() before
763
  // returning to avoid the unintentional usage of cached dc pred data.
764
0
  xd->cfl.use_dc_pred_cache = true;
765
  // Evaluate alpha parameter of each chroma plane.
766
0
  est_best_cfl_idx_u =
767
0
      cfl_pick_plane_parameter(cpi, x, 1, tx_size, cfl_search_range);
768
0
  est_best_cfl_idx_v =
769
0
      cfl_pick_plane_parameter(cpi, x, 2, tx_size, cfl_search_range);
770
771
0
  if (cfl_search_range == 1) {
772
    // For cfl_search_range=1, further refinement of alpha is not enabled. Hence
773
    // CfL index=0 for both the chroma planes implies invalid CfL mode.
774
0
    if (est_best_cfl_idx_u == CFL_INDEX_ZERO &&
775
0
        est_best_cfl_idx_v == CFL_INDEX_ZERO) {
776
0
      set_invalid_cfl_parameters(best_cfl_alpha_idx, best_cfl_alpha_signs);
777
0
      clear_cfl_dc_pred_cache_flags(&xd->cfl);
778
0
      return 0;
779
0
    }
780
781
0
    int cfl_alpha_u, cfl_alpha_v;
782
0
    CFL_SIGN_TYPE cfl_sign_u, cfl_sign_v;
783
0
    const MB_MODE_INFO *mbmi = xd->mi[0];
784
0
    cfl_idx_to_sign_and_alpha(est_best_cfl_idx_u, &cfl_sign_u, &cfl_alpha_u);
785
0
    cfl_idx_to_sign_and_alpha(est_best_cfl_idx_v, &cfl_sign_v, &cfl_alpha_v);
786
0
    const int joint_sign = cfl_sign_u * CFL_SIGNS + cfl_sign_v - 1;
787
    // Compute alpha and mode signaling rate.
788
0
    const int rate_overhead =
789
0
        mode_costs->cfl_cost[joint_sign][CFL_PRED_U][cfl_alpha_u] +
790
0
        mode_costs->cfl_cost[joint_sign][CFL_PRED_V][cfl_alpha_v] +
791
0
        mode_costs
792
0
            ->intra_uv_mode_cost[is_cfl_allowed(xd)][mbmi->mode][UV_CFL_PRED];
793
    // Skip the CfL mode evaluation if the RD cost derived using the rate needed
794
    // to signal the CfL mode and alpha parameter exceeds the ref_best_rd.
795
0
    if (RDCOST(x->rdmult, rate_overhead, 0) > ref_best_rd) {
796
0
      set_invalid_cfl_parameters(best_cfl_alpha_idx, best_cfl_alpha_signs);
797
0
      clear_cfl_dc_pred_cache_flags(&xd->cfl);
798
0
      return 0;
799
0
    }
800
0
  }
801
802
  // Compute the rd cost of each chroma plane using the alpha parameters which
803
  // were already evaluated.
804
0
  cfl_pick_plane_rd(cpi, x, 1, tx_size, cfl_search_range, cfl_rd_arr_u,
805
0
                    est_best_cfl_idx_u);
806
0
  cfl_pick_plane_rd(cpi, x, 2, tx_size, cfl_search_range, cfl_rd_arr_v,
807
0
                    est_best_cfl_idx_v);
808
809
0
  clear_cfl_dc_pred_cache_flags(&xd->cfl);
810
811
0
  for (int ui = 0; ui < CFL_MAGS_SIZE; ++ui) {
812
0
    if (cfl_rd_arr_u[ui].rate == INT_MAX) continue;
813
0
    int cfl_alpha_u;
814
0
    CFL_SIGN_TYPE cfl_sign_u;
815
0
    cfl_idx_to_sign_and_alpha(ui, &cfl_sign_u, &cfl_alpha_u);
816
0
    for (int vi = 0; vi < CFL_MAGS_SIZE; ++vi) {
817
0
      if (cfl_rd_arr_v[vi].rate == INT_MAX) continue;
818
0
      int cfl_alpha_v;
819
0
      CFL_SIGN_TYPE cfl_sign_v;
820
0
      cfl_idx_to_sign_and_alpha(vi, &cfl_sign_v, &cfl_alpha_v);
821
      // cfl_sign_u == CFL_SIGN_ZERO && cfl_sign_v == CFL_SIGN_ZERO is not a
822
      // valid parameter for CFL
823
0
      if (cfl_sign_u == CFL_SIGN_ZERO && cfl_sign_v == CFL_SIGN_ZERO) continue;
824
0
      int joint_sign = cfl_sign_u * CFL_SIGNS + cfl_sign_v - 1;
825
0
      RD_STATS rd_stats = cfl_rd_arr_u[ui];
826
0
      av1_merge_rd_stats(&rd_stats, &cfl_rd_arr_v[vi]);
827
0
      if (rd_stats.rate != INT_MAX) {
828
0
        rd_stats.rate +=
829
0
            mode_costs->cfl_cost[joint_sign][CFL_PRED_U][cfl_alpha_u];
830
0
        rd_stats.rate +=
831
0
            mode_costs->cfl_cost[joint_sign][CFL_PRED_V][cfl_alpha_v];
832
0
      }
833
0
      av1_rd_cost_update(x->rdmult, &rd_stats);
834
0
      if (rd_stats.rdcost < best_rd_stats->rdcost) {
835
0
        *best_rd_stats = rd_stats;
836
0
        *best_cfl_alpha_idx =
837
0
            (cfl_alpha_u << CFL_ALPHABET_SIZE_LOG2) + cfl_alpha_v;
838
0
        *best_cfl_alpha_signs = joint_sign;
839
0
      }
840
0
    }
841
0
  }
842
0
  if (best_rd_stats->rdcost >= ref_best_rd) {
843
0
    av1_invalid_rd_stats(best_rd_stats);
844
    // Set invalid CFL parameters here since the rdcost is not better than
845
    // ref_best_rd.
846
0
    set_invalid_cfl_parameters(best_cfl_alpha_idx, best_cfl_alpha_signs);
847
0
    return 0;
848
0
  }
849
0
  return 1;
850
0
}
851
852
static bool should_prune_chroma_smooth_pred_based_on_source_variance(
853
0
    const AV1_COMP *cpi, const MACROBLOCK *x, BLOCK_SIZE bsize) {
854
0
  if (!cpi->sf.intra_sf.prune_smooth_intra_mode_for_chroma) return false;
855
856
  // If the source variance of both chroma planes is less than 20 (empirically
857
  // derived), prune UV_SMOOTH_PRED.
858
0
  for (int i = AOM_PLANE_U; i < av1_num_planes(&cpi->common); i++) {
859
0
    const unsigned int variance = av1_get_perpixel_variance_facade(
860
0
        cpi, &x->e_mbd, &x->plane[i].src, bsize, i);
861
0
    if (variance >= 20) return false;
862
0
  }
863
0
  return true;
864
0
}
865
866
int64_t av1_rd_pick_intra_sbuv_mode(const AV1_COMP *const cpi, MACROBLOCK *x,
867
                                    int *rate, int *rate_tokenonly,
868
                                    int64_t *distortion, uint8_t *skippable,
869
0
                                    BLOCK_SIZE bsize, TX_SIZE max_tx_size) {
870
0
  const AV1_COMMON *const cm = &cpi->common;
871
0
  MACROBLOCKD *xd = &x->e_mbd;
872
0
  MB_MODE_INFO *mbmi = xd->mi[0];
873
0
  assert(!is_inter_block(mbmi));
874
0
  MB_MODE_INFO best_mbmi = *mbmi;
875
0
  int64_t best_rd = INT64_MAX, this_rd;
876
0
  const ModeCosts *mode_costs = &x->mode_costs;
877
0
  const IntraModeCfg *const intra_mode_cfg = &cpi->oxcf.intra_mode_cfg;
878
879
0
  init_sbuv_mode(mbmi);
880
881
  // Return if the current block does not correspond to a chroma block.
882
0
  if (!xd->is_chroma_ref) {
883
0
    *rate = 0;
884
0
    *rate_tokenonly = 0;
885
0
    *distortion = 0;
886
0
    *skippable = 1;
887
0
    return INT64_MAX;
888
0
  }
889
890
  // Only store reconstructed luma when there's chroma RDO. When there's no
891
  // chroma RDO, the reconstructed luma will be stored in encode_superblock().
892
0
  xd->cfl.store_y = store_cfl_required_rdo(cm, x);
893
0
  if (xd->cfl.store_y) {
894
    // Restore reconstructed luma values.
895
    // TODO(chiyotsai@google.com): right now we are re-computing the txfm in
896
    // this function everytime we search through uv modes. There is some
897
    // potential speed up here if we cache the result to avoid redundant
898
    // computation.
899
0
    av1_encode_intra_block_plane(cpi, x, mbmi->bsize, AOM_PLANE_Y,
900
0
                                 DRY_RUN_NORMAL,
901
0
                                 cpi->optimize_seg_arr[mbmi->segment_id]);
902
0
    xd->cfl.store_y = 0;
903
0
  }
904
0
  IntraModeSearchState intra_search_state;
905
0
  init_intra_mode_search_state(&intra_search_state);
906
0
  const CFL_ALLOWED_TYPE cfl_allowed = is_cfl_allowed(xd);
907
908
  // Search through all non-palette modes.
909
0
  for (int mode_idx = 0; mode_idx < UV_INTRA_MODES; ++mode_idx) {
910
0
    int this_rate;
911
0
    RD_STATS tokenonly_rd_stats;
912
0
    UV_PREDICTION_MODE uv_mode = uv_rd_search_mode_order[mode_idx];
913
914
    // Skip the current mode evaluation if the RD cost derived using the mode
915
    // signaling rate exceeds the best_rd so far.
916
0
    const int mode_rate =
917
0
        mode_costs->intra_uv_mode_cost[cfl_allowed][mbmi->mode][uv_mode];
918
0
    if (RDCOST(x->rdmult, mode_rate, 0) > best_rd) continue;
919
920
0
    PREDICTION_MODE intra_mode = get_uv_mode(uv_mode);
921
0
    const int is_diagonal_mode = av1_is_diagonal_mode(intra_mode);
922
0
    const int is_directional_mode = av1_is_directional_mode(intra_mode);
923
924
0
    if (is_diagonal_mode && !cpi->oxcf.intra_mode_cfg.enable_diagonal_intra)
925
0
      continue;
926
0
    if (is_directional_mode &&
927
0
        !cpi->oxcf.intra_mode_cfg.enable_directional_intra)
928
0
      continue;
929
930
0
    if (!(cpi->sf.intra_sf.intra_uv_mode_mask[txsize_sqr_up_map[max_tx_size]] &
931
0
          (1 << uv_mode)))
932
0
      continue;
933
0
    if (!intra_mode_cfg->enable_smooth_intra && uv_mode >= UV_SMOOTH_PRED &&
934
0
        uv_mode <= UV_SMOOTH_H_PRED)
935
0
      continue;
936
937
0
    if (!intra_mode_cfg->enable_paeth_intra && uv_mode == UV_PAETH_PRED)
938
0
      continue;
939
940
0
    assert(mbmi->mode < INTRA_MODES);
941
0
    if (cpi->sf.intra_sf.prune_chroma_modes_using_luma_winner &&
942
0
        !(av1_derived_chroma_intra_mode_used_flag[mbmi->mode] & (1 << uv_mode)))
943
0
      continue;
944
945
0
    mbmi->uv_mode = uv_mode;
946
947
    // Init variables for cfl and angle delta
948
0
    const SPEED_FEATURES *sf = &cpi->sf;
949
0
    mbmi->angle_delta[PLANE_TYPE_UV] = 0;
950
0
    if (uv_mode == UV_CFL_PRED) {
951
0
      if (!cfl_allowed || !intra_mode_cfg->enable_cfl_intra) continue;
952
0
      assert(!is_directional_mode);
953
0
      const TX_SIZE uv_tx_size = av1_get_tx_size(AOM_PLANE_U, xd);
954
0
      if (!cfl_rd_pick_alpha(x, cpi, uv_tx_size, best_rd,
955
0
                             sf->intra_sf.cfl_search_range, &tokenonly_rd_stats,
956
0
                             &mbmi->cfl_alpha_idx, &mbmi->cfl_alpha_signs)) {
957
0
        continue;
958
0
      }
959
0
    } else if (is_directional_mode && av1_use_angle_delta(mbmi->bsize) &&
960
0
               intra_mode_cfg->enable_angle_delta) {
961
0
      if (sf->intra_sf.chroma_intra_pruning_with_hog &&
962
0
          !intra_search_state.dir_mode_skip_mask_ready) {
963
0
        static const float thresh[2][4] = {
964
0
          { -1.2f, 0.0f, 0.0f, 1.2f },    // Interframe
965
0
          { -1.2f, -1.2f, -0.6f, 0.4f },  // Intraframe
966
0
        };
967
0
        const int is_chroma = 1;
968
0
        const int is_intra_frame = frame_is_intra_only(cm);
969
0
        prune_intra_mode_with_hog(
970
0
            x, bsize, cm->seq_params->sb_size,
971
0
            thresh[is_intra_frame]
972
0
                  [sf->intra_sf.chroma_intra_pruning_with_hog - 1],
973
0
            intra_search_state.directional_mode_skip_mask, is_chroma);
974
0
        intra_search_state.dir_mode_skip_mask_ready = 1;
975
0
      }
976
0
      if (intra_search_state.directional_mode_skip_mask[uv_mode]) {
977
0
        continue;
978
0
      }
979
980
      // Search through angle delta
981
0
      const int rate_overhead =
982
0
          mode_costs->intra_uv_mode_cost[cfl_allowed][mbmi->mode][uv_mode];
983
0
      if (!rd_pick_intra_angle_sbuv(cpi, x, bsize, rate_overhead, best_rd,
984
0
                                    &this_rate, &tokenonly_rd_stats))
985
0
        continue;
986
0
    } else {
987
0
      if (uv_mode == UV_SMOOTH_PRED &&
988
0
          should_prune_chroma_smooth_pred_based_on_source_variance(cpi, x,
989
0
                                                                   bsize))
990
0
        continue;
991
992
      // Predict directly if we don't need to search for angle delta.
993
0
      if (!av1_txfm_uvrd(cpi, x, &tokenonly_rd_stats, bsize, best_rd)) {
994
0
        continue;
995
0
      }
996
0
    }
997
0
    const int mode_cost =
998
0
        mode_costs->intra_uv_mode_cost[cfl_allowed][mbmi->mode][uv_mode];
999
0
    this_rate = tokenonly_rd_stats.rate +
1000
0
                intra_mode_info_cost_uv(cpi, x, mbmi, bsize, mode_cost);
1001
0
    this_rd = RDCOST(x->rdmult, this_rate, tokenonly_rd_stats.dist);
1002
1003
0
    if (this_rd < best_rd) {
1004
0
      best_mbmi = *mbmi;
1005
0
      best_rd = this_rd;
1006
0
      *rate = this_rate;
1007
0
      *rate_tokenonly = tokenonly_rd_stats.rate;
1008
0
      *distortion = tokenonly_rd_stats.dist;
1009
0
      *skippable = tokenonly_rd_stats.skip_txfm;
1010
0
    }
1011
0
  }
1012
1013
  // Search palette mode
1014
0
  const int try_palette =
1015
0
      cpi->oxcf.tool_cfg.enable_palette &&
1016
0
      av1_allow_palette(cpi->common.features.allow_screen_content_tools,
1017
0
                        mbmi->bsize);
1018
0
  if (try_palette) {
1019
0
    uint8_t *best_palette_color_map = x->palette_buffer->best_palette_color_map;
1020
0
    av1_rd_pick_palette_intra_sbuv(
1021
0
        cpi, x,
1022
0
        mode_costs->intra_uv_mode_cost[cfl_allowed][mbmi->mode][UV_DC_PRED],
1023
0
        best_palette_color_map, &best_mbmi, &best_rd, rate, rate_tokenonly,
1024
0
        distortion, skippable);
1025
0
  }
1026
1027
0
  *mbmi = best_mbmi;
1028
  // Make sure we actually chose a mode
1029
0
  assert(best_rd < INT64_MAX);
1030
0
  return best_rd;
1031
0
}
1032
1033
// Searches palette mode for luma channel in inter frame.
1034
int av1_search_palette_mode(IntraModeSearchState *intra_search_state,
1035
                            const AV1_COMP *cpi, MACROBLOCK *x,
1036
                            BLOCK_SIZE bsize, unsigned int ref_frame_cost,
1037
                            PICK_MODE_CONTEXT *ctx, RD_STATS *this_rd_cost,
1038
0
                            int64_t best_rd) {
1039
0
  const AV1_COMMON *const cm = &cpi->common;
1040
0
  MB_MODE_INFO *const mbmi = x->e_mbd.mi[0];
1041
0
  PALETTE_MODE_INFO *const pmi = &mbmi->palette_mode_info;
1042
0
  const int num_planes = av1_num_planes(cm);
1043
0
  MACROBLOCKD *const xd = &x->e_mbd;
1044
0
  int rate2 = 0;
1045
0
  int64_t distortion2 = 0, best_rd_palette = best_rd, this_rd;
1046
0
  int skippable = 0;
1047
0
  uint8_t *const best_palette_color_map =
1048
0
      x->palette_buffer->best_palette_color_map;
1049
0
  uint8_t *const color_map = xd->plane[0].color_index_map;
1050
0
  MB_MODE_INFO best_mbmi_palette = *mbmi;
1051
0
  uint8_t best_blk_skip[MAX_MIB_SIZE * MAX_MIB_SIZE];
1052
0
  uint8_t best_tx_type_map[MAX_MIB_SIZE * MAX_MIB_SIZE];
1053
0
  const ModeCosts *mode_costs = &x->mode_costs;
1054
0
  const int *const intra_mode_cost =
1055
0
      mode_costs->mbmode_cost[size_group_lookup[bsize]];
1056
0
  const int rows = block_size_high[bsize];
1057
0
  const int cols = block_size_wide[bsize];
1058
1059
0
  mbmi->mode = DC_PRED;
1060
0
  mbmi->uv_mode = UV_DC_PRED;
1061
0
  mbmi->ref_frame[0] = INTRA_FRAME;
1062
0
  mbmi->ref_frame[1] = NONE_FRAME;
1063
0
  av1_zero(pmi->palette_size);
1064
1065
0
  RD_STATS rd_stats_y;
1066
0
  av1_invalid_rd_stats(&rd_stats_y);
1067
0
  av1_rd_pick_palette_intra_sby(cpi, x, bsize, intra_mode_cost[DC_PRED],
1068
0
                                &best_mbmi_palette, best_palette_color_map,
1069
0
                                &best_rd_palette, &rd_stats_y.rate, NULL,
1070
0
                                &rd_stats_y.dist, &rd_stats_y.skip_txfm, NULL,
1071
0
                                ctx, best_blk_skip, best_tx_type_map);
1072
0
  if (rd_stats_y.rate == INT_MAX || pmi->palette_size[0] == 0) {
1073
0
    this_rd_cost->rdcost = INT64_MAX;
1074
0
    return skippable;
1075
0
  }
1076
1077
0
  memcpy(x->txfm_search_info.blk_skip, best_blk_skip,
1078
0
         sizeof(best_blk_skip[0]) * bsize_to_num_blk(bsize));
1079
0
  av1_copy_array(xd->tx_type_map, best_tx_type_map, ctx->num_4x4_blk);
1080
0
  memcpy(color_map, best_palette_color_map,
1081
0
         rows * cols * sizeof(best_palette_color_map[0]));
1082
1083
0
  skippable = rd_stats_y.skip_txfm;
1084
0
  distortion2 = rd_stats_y.dist;
1085
0
  rate2 = rd_stats_y.rate + ref_frame_cost;
1086
0
  if (num_planes > 1) {
1087
0
    if (intra_search_state->rate_uv_intra == INT_MAX) {
1088
      // We have not found any good uv mode yet, so we need to search for it.
1089
0
      TX_SIZE uv_tx = av1_get_tx_size(AOM_PLANE_U, xd);
1090
0
      av1_rd_pick_intra_sbuv_mode(cpi, x, &intra_search_state->rate_uv_intra,
1091
0
                                  &intra_search_state->rate_uv_tokenonly,
1092
0
                                  &intra_search_state->dist_uvs,
1093
0
                                  &intra_search_state->skip_uvs, bsize, uv_tx);
1094
0
      intra_search_state->mode_uv = mbmi->uv_mode;
1095
0
      intra_search_state->pmi_uv = *pmi;
1096
0
      intra_search_state->uv_angle_delta = mbmi->angle_delta[PLANE_TYPE_UV];
1097
0
    }
1098
1099
    // We have found at least one good uv mode before, so copy and paste it
1100
    // over.
1101
0
    mbmi->uv_mode = intra_search_state->mode_uv;
1102
0
    pmi->palette_size[1] = intra_search_state->pmi_uv.palette_size[1];
1103
0
    if (pmi->palette_size[1] > 0) {
1104
0
      memcpy(pmi->palette_colors + PALETTE_MAX_SIZE,
1105
0
             intra_search_state->pmi_uv.palette_colors + PALETTE_MAX_SIZE,
1106
0
             2 * PALETTE_MAX_SIZE * sizeof(pmi->palette_colors[0]));
1107
0
    }
1108
0
    mbmi->angle_delta[PLANE_TYPE_UV] = intra_search_state->uv_angle_delta;
1109
0
    skippable = skippable && intra_search_state->skip_uvs;
1110
0
    distortion2 += intra_search_state->dist_uvs;
1111
0
    rate2 += intra_search_state->rate_uv_intra;
1112
0
  }
1113
1114
0
  if (skippable) {
1115
0
    rate2 -= rd_stats_y.rate;
1116
0
    if (num_planes > 1) rate2 -= intra_search_state->rate_uv_tokenonly;
1117
0
    rate2 += mode_costs->skip_txfm_cost[av1_get_skip_txfm_context(xd)][1];
1118
0
  } else {
1119
0
    rate2 += mode_costs->skip_txfm_cost[av1_get_skip_txfm_context(xd)][0];
1120
0
  }
1121
0
  this_rd = RDCOST(x->rdmult, rate2, distortion2);
1122
0
  this_rd_cost->rate = rate2;
1123
0
  this_rd_cost->dist = distortion2;
1124
0
  this_rd_cost->rdcost = this_rd;
1125
0
  return skippable;
1126
0
}
1127
1128
void av1_search_palette_mode_luma(const AV1_COMP *cpi, MACROBLOCK *x,
1129
                                  BLOCK_SIZE bsize, unsigned int ref_frame_cost,
1130
                                  PICK_MODE_CONTEXT *ctx,
1131
0
                                  RD_STATS *this_rd_cost, int64_t best_rd) {
1132
0
  MB_MODE_INFO *const mbmi = x->e_mbd.mi[0];
1133
0
  PALETTE_MODE_INFO *const pmi = &mbmi->palette_mode_info;
1134
0
  MACROBLOCKD *const xd = &x->e_mbd;
1135
0
  int64_t best_rd_palette = best_rd, this_rd;
1136
0
  uint8_t *const best_palette_color_map =
1137
0
      x->palette_buffer->best_palette_color_map;
1138
0
  uint8_t *const color_map = xd->plane[0].color_index_map;
1139
0
  MB_MODE_INFO best_mbmi_palette = *mbmi;
1140
0
  uint8_t best_blk_skip[MAX_MIB_SIZE * MAX_MIB_SIZE];
1141
0
  uint8_t best_tx_type_map[MAX_MIB_SIZE * MAX_MIB_SIZE];
1142
0
  const ModeCosts *mode_costs = &x->mode_costs;
1143
0
  const int *const intra_mode_cost =
1144
0
      mode_costs->mbmode_cost[size_group_lookup[bsize]];
1145
0
  const int rows = block_size_high[bsize];
1146
0
  const int cols = block_size_wide[bsize];
1147
1148
0
  mbmi->mode = DC_PRED;
1149
0
  mbmi->uv_mode = UV_DC_PRED;
1150
0
  mbmi->ref_frame[0] = INTRA_FRAME;
1151
0
  mbmi->ref_frame[1] = NONE_FRAME;
1152
0
  av1_zero(pmi->palette_size);
1153
1154
0
  RD_STATS rd_stats_y;
1155
0
  av1_invalid_rd_stats(&rd_stats_y);
1156
0
  av1_rd_pick_palette_intra_sby(cpi, x, bsize, intra_mode_cost[DC_PRED],
1157
0
                                &best_mbmi_palette, best_palette_color_map,
1158
0
                                &best_rd_palette, &rd_stats_y.rate, NULL,
1159
0
                                &rd_stats_y.dist, &rd_stats_y.skip_txfm, NULL,
1160
0
                                ctx, best_blk_skip, best_tx_type_map);
1161
0
  if (rd_stats_y.rate == INT_MAX || pmi->palette_size[0] == 0) {
1162
0
    this_rd_cost->rdcost = INT64_MAX;
1163
0
    return;
1164
0
  }
1165
1166
0
  memcpy(x->txfm_search_info.blk_skip, best_blk_skip,
1167
0
         sizeof(best_blk_skip[0]) * bsize_to_num_blk(bsize));
1168
0
  av1_copy_array(xd->tx_type_map, best_tx_type_map, ctx->num_4x4_blk);
1169
0
  memcpy(color_map, best_palette_color_map,
1170
0
         rows * cols * sizeof(best_palette_color_map[0]));
1171
1172
0
  rd_stats_y.rate += ref_frame_cost;
1173
1174
0
  if (rd_stats_y.skip_txfm) {
1175
0
    rd_stats_y.rate =
1176
0
        ref_frame_cost +
1177
0
        mode_costs->skip_txfm_cost[av1_get_skip_txfm_context(xd)][1];
1178
0
  } else {
1179
0
    rd_stats_y.rate +=
1180
0
        mode_costs->skip_txfm_cost[av1_get_skip_txfm_context(xd)][0];
1181
0
  }
1182
0
  this_rd = RDCOST(x->rdmult, rd_stats_y.rate, rd_stats_y.dist);
1183
0
  this_rd_cost->rate = rd_stats_y.rate;
1184
0
  this_rd_cost->dist = rd_stats_y.dist;
1185
0
  this_rd_cost->rdcost = this_rd;
1186
0
  this_rd_cost->skip_txfm = rd_stats_y.skip_txfm;
1187
0
}
1188
1189
/*!\brief Get the intra prediction by searching through tx_type and tx_size.
1190
 *
1191
 * \ingroup intra_mode_search
1192
 * \callergraph
1193
 * Currently this function is only used in the intra frame code path for
1194
 * winner-mode processing.
1195
 *
1196
 * \return Returns whether the current mode is an improvement over best_rd.
1197
 */
1198
static inline int intra_block_yrd(const AV1_COMP *const cpi, MACROBLOCK *x,
1199
                                  BLOCK_SIZE bsize, const int *bmode_costs,
1200
                                  int64_t *best_rd, int *rate,
1201
                                  int *rate_tokenonly, int64_t *distortion,
1202
                                  uint8_t *skippable, MB_MODE_INFO *best_mbmi,
1203
0
                                  PICK_MODE_CONTEXT *ctx) {
1204
0
  MACROBLOCKD *const xd = &x->e_mbd;
1205
0
  MB_MODE_INFO *const mbmi = xd->mi[0];
1206
0
  RD_STATS rd_stats;
1207
  // In order to improve txfm search, avoid rd based breakouts during winner
1208
  // mode evaluation. Hence passing ref_best_rd as INT64_MAX by default when the
1209
  // speed feature use_rd_based_breakout_for_intra_tx_search is disabled.
1210
0
  int64_t ref_best_rd = cpi->sf.tx_sf.use_rd_based_breakout_for_intra_tx_search
1211
0
                            ? *best_rd
1212
0
                            : INT64_MAX;
1213
0
  av1_pick_uniform_tx_size_type_yrd(cpi, x, &rd_stats, bsize, ref_best_rd);
1214
0
  if (rd_stats.rate == INT_MAX) return 0;
1215
0
  int this_rate_tokenonly = rd_stats.rate;
1216
0
  if (!xd->lossless[mbmi->segment_id] && block_signals_txsize(mbmi->bsize)) {
1217
    // av1_pick_uniform_tx_size_type_yrd above includes the cost of the tx_size
1218
    // in the tokenonly rate, but for intra blocks, tx_size is always coded
1219
    // (prediction granularity), so we account for it in the full rate,
1220
    // not the tokenonly rate.
1221
0
    this_rate_tokenonly -= tx_size_cost(x, bsize, mbmi->tx_size);
1222
0
  }
1223
0
  const int this_rate =
1224
0
      rd_stats.rate +
1225
0
      intra_mode_info_cost_y(cpi, x, mbmi, bsize, bmode_costs[mbmi->mode], 0);
1226
0
  const int64_t this_rd = RDCOST(x->rdmult, this_rate, rd_stats.dist);
1227
0
  if (this_rd < *best_rd) {
1228
0
    *best_mbmi = *mbmi;
1229
0
    *best_rd = this_rd;
1230
0
    *rate = this_rate;
1231
0
    *rate_tokenonly = this_rate_tokenonly;
1232
0
    *distortion = rd_stats.dist;
1233
0
    *skippable = rd_stats.skip_txfm;
1234
0
    av1_copy_array(ctx->blk_skip, x->txfm_search_info.blk_skip,
1235
0
                   ctx->num_4x4_blk);
1236
0
    av1_copy_array(ctx->tx_type_map, xd->tx_type_map, ctx->num_4x4_blk);
1237
0
    return 1;
1238
0
  }
1239
0
  return 0;
1240
0
}
1241
1242
/*!\brief Search for the best filter_intra mode when coding inter frame.
1243
 *
1244
 * \ingroup intra_mode_search
1245
 * \callergraph
1246
 * This function loops through all filter_intra modes to find the best one.
1247
 *
1248
 * \remark Returns nothing, but updates the mbmi and rd_stats.
1249
 */
1250
static inline void handle_filter_intra_mode(const AV1_COMP *cpi, MACROBLOCK *x,
1251
                                            BLOCK_SIZE bsize,
1252
                                            const PICK_MODE_CONTEXT *ctx,
1253
                                            RD_STATS *rd_stats_y, int mode_cost,
1254
                                            int64_t best_rd,
1255
0
                                            int64_t best_rd_so_far) {
1256
0
  MACROBLOCKD *const xd = &x->e_mbd;
1257
0
  MB_MODE_INFO *const mbmi = xd->mi[0];
1258
0
  assert(mbmi->mode == DC_PRED &&
1259
0
         av1_filter_intra_allowed_bsize(&cpi->common, bsize));
1260
1261
0
  RD_STATS rd_stats_y_fi;
1262
0
  int filter_intra_selected_flag = 0;
1263
0
  TX_SIZE best_tx_size = mbmi->tx_size;
1264
0
  FILTER_INTRA_MODE best_fi_mode = FILTER_DC_PRED;
1265
0
  uint8_t best_blk_skip[MAX_MIB_SIZE * MAX_MIB_SIZE];
1266
0
  memcpy(best_blk_skip, x->txfm_search_info.blk_skip,
1267
0
         sizeof(best_blk_skip[0]) * ctx->num_4x4_blk);
1268
0
  uint8_t best_tx_type_map[MAX_MIB_SIZE * MAX_MIB_SIZE];
1269
0
  av1_copy_array(best_tx_type_map, xd->tx_type_map, ctx->num_4x4_blk);
1270
0
  mbmi->filter_intra_mode_info.use_filter_intra = 1;
1271
0
  for (FILTER_INTRA_MODE fi_mode = FILTER_DC_PRED; fi_mode < FILTER_INTRA_MODES;
1272
0
       ++fi_mode) {
1273
0
    mbmi->filter_intra_mode_info.filter_intra_mode = fi_mode;
1274
0
    av1_pick_uniform_tx_size_type_yrd(cpi, x, &rd_stats_y_fi, bsize, best_rd);
1275
0
    if (rd_stats_y_fi.rate == INT_MAX) continue;
1276
0
    const int this_rate_tmp =
1277
0
        rd_stats_y_fi.rate +
1278
0
        intra_mode_info_cost_y(cpi, x, mbmi, bsize, mode_cost, 0);
1279
0
    const int64_t this_rd_tmp =
1280
0
        RDCOST(x->rdmult, this_rate_tmp, rd_stats_y_fi.dist);
1281
1282
0
    if (this_rd_tmp != INT64_MAX && this_rd_tmp / 2 > best_rd) {
1283
0
      break;
1284
0
    }
1285
0
    if (this_rd_tmp < best_rd_so_far) {
1286
0
      best_tx_size = mbmi->tx_size;
1287
0
      av1_copy_array(best_tx_type_map, xd->tx_type_map, ctx->num_4x4_blk);
1288
0
      memcpy(best_blk_skip, x->txfm_search_info.blk_skip,
1289
0
             sizeof(best_blk_skip[0]) * ctx->num_4x4_blk);
1290
0
      best_fi_mode = fi_mode;
1291
0
      *rd_stats_y = rd_stats_y_fi;
1292
0
      filter_intra_selected_flag = 1;
1293
0
      best_rd_so_far = this_rd_tmp;
1294
0
    }
1295
0
  }
1296
1297
0
  mbmi->tx_size = best_tx_size;
1298
0
  av1_copy_array(xd->tx_type_map, best_tx_type_map, ctx->num_4x4_blk);
1299
0
  memcpy(x->txfm_search_info.blk_skip, best_blk_skip,
1300
0
         sizeof(x->txfm_search_info.blk_skip[0]) * ctx->num_4x4_blk);
1301
1302
0
  if (filter_intra_selected_flag) {
1303
0
    mbmi->filter_intra_mode_info.use_filter_intra = 1;
1304
0
    mbmi->filter_intra_mode_info.filter_intra_mode = best_fi_mode;
1305
0
  } else {
1306
0
    mbmi->filter_intra_mode_info.use_filter_intra = 0;
1307
0
  }
1308
0
}
1309
1310
// Evaluate a given luma intra-mode in inter frames.
1311
int av1_handle_intra_y_mode(IntraModeSearchState *intra_search_state,
1312
                            const AV1_COMP *cpi, MACROBLOCK *x,
1313
                            BLOCK_SIZE bsize, unsigned int ref_frame_cost,
1314
                            const PICK_MODE_CONTEXT *ctx, RD_STATS *rd_stats_y,
1315
                            int64_t best_rd, int *mode_cost_y, int64_t *rd_y,
1316
                            int64_t *best_model_rd,
1317
0
                            int64_t top_intra_model_rd[]) {
1318
0
  const AV1_COMMON *cm = &cpi->common;
1319
0
  const INTRA_MODE_SPEED_FEATURES *const intra_sf = &cpi->sf.intra_sf;
1320
0
  MACROBLOCKD *const xd = &x->e_mbd;
1321
0
  MB_MODE_INFO *const mbmi = xd->mi[0];
1322
0
  assert(mbmi->ref_frame[0] == INTRA_FRAME);
1323
0
  const PREDICTION_MODE mode = mbmi->mode;
1324
0
  const ModeCosts *mode_costs = &x->mode_costs;
1325
0
  const int mode_cost =
1326
0
      mode_costs->mbmode_cost[size_group_lookup[bsize]][mode] + ref_frame_cost;
1327
0
  const int skip_ctx = av1_get_skip_txfm_context(xd);
1328
1329
0
  int known_rate = mode_cost;
1330
0
  const int intra_cost_penalty = av1_get_intra_cost_penalty(
1331
0
      cm->quant_params.base_qindex, cm->quant_params.y_dc_delta_q,
1332
0
      cm->seq_params->bit_depth);
1333
1334
0
  if (mode != DC_PRED && mode != PAETH_PRED) known_rate += intra_cost_penalty;
1335
0
  known_rate += AOMMIN(mode_costs->skip_txfm_cost[skip_ctx][0],
1336
0
                       mode_costs->skip_txfm_cost[skip_ctx][1]);
1337
0
  const int64_t known_rd = RDCOST(x->rdmult, known_rate, 0);
1338
0
  if (known_rd > best_rd) {
1339
0
    intra_search_state->skip_intra_modes = 1;
1340
0
    return 0;
1341
0
  }
1342
1343
0
  const int is_directional_mode = av1_is_directional_mode(mode);
1344
0
  if (is_directional_mode && av1_use_angle_delta(bsize) &&
1345
0
      cpi->oxcf.intra_mode_cfg.enable_angle_delta) {
1346
0
    if (intra_sf->intra_pruning_with_hog &&
1347
0
        !intra_search_state->dir_mode_skip_mask_ready) {
1348
0
      const float thresh[4] = { -1.2f, 0.0f, 0.0f, 1.2f };
1349
0
      const int is_chroma = 0;
1350
0
      prune_intra_mode_with_hog(x, bsize, cm->seq_params->sb_size,
1351
0
                                thresh[intra_sf->intra_pruning_with_hog - 1],
1352
0
                                intra_search_state->directional_mode_skip_mask,
1353
0
                                is_chroma);
1354
0
      intra_search_state->dir_mode_skip_mask_ready = 1;
1355
0
    }
1356
0
    if (intra_search_state->directional_mode_skip_mask[mode]) return 0;
1357
0
  }
1358
0
  const TX_SIZE tx_size = AOMMIN(TX_32X32, max_txsize_lookup[bsize]);
1359
0
  const int64_t this_model_rd =
1360
0
      intra_model_rd(&cpi->common, x, 0, bsize, tx_size, /*use_hadamard=*/1);
1361
1362
0
  const int model_rd_index_for_pruning =
1363
0
      get_model_rd_index_for_pruning(x, intra_sf);
1364
1365
0
  if (prune_intra_y_mode(this_model_rd, best_model_rd, top_intra_model_rd,
1366
0
                         intra_sf->top_intra_model_count_allowed,
1367
0
                         model_rd_index_for_pruning))
1368
0
    return 0;
1369
0
  av1_init_rd_stats(rd_stats_y);
1370
0
  av1_pick_uniform_tx_size_type_yrd(cpi, x, rd_stats_y, bsize, best_rd);
1371
1372
  // Pick filter intra modes.
1373
0
  if (mode == DC_PRED && av1_filter_intra_allowed_bsize(cm, bsize)) {
1374
0
    int try_filter_intra = 1;
1375
0
    int64_t best_rd_so_far = INT64_MAX;
1376
0
    if (rd_stats_y->rate != INT_MAX) {
1377
      // best_rd_so_far is the rdcost of DC_PRED without using filter_intra.
1378
      // Later, in filter intra search, best_rd_so_far is used for comparison.
1379
0
      mbmi->filter_intra_mode_info.use_filter_intra = 0;
1380
0
      const int tmp_rate =
1381
0
          rd_stats_y->rate +
1382
0
          intra_mode_info_cost_y(cpi, x, mbmi, bsize, mode_cost, 0);
1383
0
      best_rd_so_far = RDCOST(x->rdmult, tmp_rate, rd_stats_y->dist);
1384
0
      try_filter_intra = (best_rd_so_far / 2) <= best_rd;
1385
0
    } else if (intra_sf->skip_filter_intra_in_inter_frames >= 1) {
1386
      // As rd cost of luma intra dc mode is more than best_rd (i.e.,
1387
      // rd_stats_y->rate = INT_MAX), skip the evaluation of filter intra modes.
1388
0
      try_filter_intra = 0;
1389
0
    }
1390
1391
0
    if (try_filter_intra) {
1392
0
      handle_filter_intra_mode(cpi, x, bsize, ctx, rd_stats_y, mode_cost,
1393
0
                               best_rd, best_rd_so_far);
1394
0
    }
1395
0
  }
1396
1397
0
  if (rd_stats_y->rate == INT_MAX) return 0;
1398
1399
0
  *mode_cost_y = intra_mode_info_cost_y(cpi, x, mbmi, bsize, mode_cost, 0);
1400
0
  const int rate_y = rd_stats_y->skip_txfm
1401
0
                         ? mode_costs->skip_txfm_cost[skip_ctx][1]
1402
0
                         : rd_stats_y->rate;
1403
0
  *rd_y = RDCOST(x->rdmult, rate_y + *mode_cost_y, rd_stats_y->dist);
1404
0
  if (best_rd < (INT64_MAX / 2) && *rd_y > (best_rd + (best_rd >> 2))) {
1405
0
    intra_search_state->skip_intra_modes = 1;
1406
0
    return 0;
1407
0
  }
1408
1409
0
  return 1;
1410
0
}
1411
1412
int av1_search_intra_uv_modes_in_interframe(
1413
    IntraModeSearchState *intra_search_state, const AV1_COMP *cpi,
1414
    MACROBLOCK *x, BLOCK_SIZE bsize, RD_STATS *rd_stats,
1415
0
    const RD_STATS *rd_stats_y, RD_STATS *rd_stats_uv, int64_t best_rd) {
1416
0
  const AV1_COMMON *cm = &cpi->common;
1417
0
  MACROBLOCKD *const xd = &x->e_mbd;
1418
0
  MB_MODE_INFO *const mbmi = xd->mi[0];
1419
0
  assert(mbmi->ref_frame[0] == INTRA_FRAME);
1420
1421
  // TODO(chiyotsai@google.com): Consolidate the chroma search code here with
1422
  // the one in av1_search_palette_mode.
1423
0
  PALETTE_MODE_INFO *const pmi = &mbmi->palette_mode_info;
1424
0
  const int try_palette =
1425
0
      cpi->oxcf.tool_cfg.enable_palette &&
1426
0
      av1_allow_palette(cm->features.allow_screen_content_tools, mbmi->bsize);
1427
1428
0
  assert(intra_search_state->rate_uv_intra == INT_MAX);
1429
0
  if (intra_search_state->rate_uv_intra == INT_MAX) {
1430
    // If no good uv-predictor had been found, search for it.
1431
0
    const TX_SIZE uv_tx = av1_get_tx_size(AOM_PLANE_U, xd);
1432
0
    av1_rd_pick_intra_sbuv_mode(cpi, x, &intra_search_state->rate_uv_intra,
1433
0
                                &intra_search_state->rate_uv_tokenonly,
1434
0
                                &intra_search_state->dist_uvs,
1435
0
                                &intra_search_state->skip_uvs, bsize, uv_tx);
1436
0
    intra_search_state->mode_uv = mbmi->uv_mode;
1437
0
    if (try_palette) intra_search_state->pmi_uv = *pmi;
1438
0
    intra_search_state->uv_angle_delta = mbmi->angle_delta[PLANE_TYPE_UV];
1439
1440
0
    const int uv_rate = intra_search_state->rate_uv_tokenonly;
1441
0
    const int64_t uv_dist = intra_search_state->dist_uvs;
1442
0
    const int64_t uv_rd = RDCOST(x->rdmult, uv_rate, uv_dist);
1443
0
    if (uv_rd > best_rd) {
1444
      // If there is no good intra uv-mode available, we can skip all intra
1445
      // modes.
1446
0
      intra_search_state->skip_intra_modes = 1;
1447
0
      return 0;
1448
0
    }
1449
0
  }
1450
1451
  // If we are here, then the encoder has found at least one good intra uv
1452
  // predictor, so we can directly copy its statistics over.
1453
  // TODO(any): the stats here is not right if the best uv mode is CFL but the
1454
  // best y mode is palette.
1455
0
  rd_stats_uv->rate = intra_search_state->rate_uv_tokenonly;
1456
0
  rd_stats_uv->dist = intra_search_state->dist_uvs;
1457
0
  rd_stats_uv->skip_txfm = intra_search_state->skip_uvs;
1458
0
  rd_stats->skip_txfm = rd_stats_y->skip_txfm && rd_stats_uv->skip_txfm;
1459
0
  mbmi->uv_mode = intra_search_state->mode_uv;
1460
0
  if (try_palette) {
1461
0
    pmi->palette_size[1] = intra_search_state->pmi_uv.palette_size[1];
1462
0
    memcpy(pmi->palette_colors + PALETTE_MAX_SIZE,
1463
0
           intra_search_state->pmi_uv.palette_colors + PALETTE_MAX_SIZE,
1464
0
           2 * PALETTE_MAX_SIZE * sizeof(pmi->palette_colors[0]));
1465
0
  }
1466
0
  mbmi->angle_delta[PLANE_TYPE_UV] = intra_search_state->uv_angle_delta;
1467
1468
0
  return 1;
1469
0
}
1470
1471
// Checks if odd delta angles can be pruned based on rdcosts of even delta
1472
// angles of the corresponding directional mode.
1473
static inline int prune_luma_odd_delta_angles_using_rd_cost(
1474
    const MB_MODE_INFO *const mbmi, const int64_t *const intra_modes_rd_cost,
1475
0
    int64_t best_rd, int prune_luma_odd_delta_angles_in_intra) {
1476
0
  const int luma_delta_angle = mbmi->angle_delta[PLANE_TYPE_Y];
1477
0
  if (!prune_luma_odd_delta_angles_in_intra ||
1478
0
      !av1_is_directional_mode(mbmi->mode) || !(abs(luma_delta_angle) & 1) ||
1479
0
      best_rd == INT64_MAX)
1480
0
    return 0;
1481
1482
0
  const int64_t rd_thresh = best_rd + (best_rd >> 3);
1483
1484
  // Neighbour rdcosts are considered for pruning of odd delta angles as
1485
  // mentioned below:
1486
  // Delta angle      Delta angle rdcost
1487
  // to be pruned     to be considered
1488
  //    -3                   -2
1489
  //    -1                -2, 0
1490
  //     1                 0, 2
1491
  //     3                    2
1492
0
  return intra_modes_rd_cost[luma_delta_angle + MAX_ANGLE_DELTA] > rd_thresh &&
1493
0
         intra_modes_rd_cost[luma_delta_angle + MAX_ANGLE_DELTA + 2] >
1494
0
             rd_thresh;
1495
0
}
1496
1497
// Finds the best non-intrabc mode on an intra frame.
1498
int64_t av1_rd_pick_intra_sby_mode(const AV1_COMP *const cpi, MACROBLOCK *x,
1499
                                   int *rate, int *rate_tokenonly,
1500
                                   int64_t *distortion, uint8_t *skippable,
1501
                                   BLOCK_SIZE bsize, int64_t best_rd,
1502
0
                                   PICK_MODE_CONTEXT *ctx) {
1503
0
  MACROBLOCKD *const xd = &x->e_mbd;
1504
0
  MB_MODE_INFO *const mbmi = xd->mi[0];
1505
0
  assert(!is_inter_block(mbmi));
1506
0
  int64_t best_model_rd = INT64_MAX;
1507
0
  int is_directional_mode;
1508
0
  uint8_t directional_mode_skip_mask[INTRA_MODES] = { 0 };
1509
  // Flag to check rd of any intra mode is better than best_rd passed to this
1510
  // function
1511
0
  int beat_best_rd = 0;
1512
0
  const int *bmode_costs;
1513
0
  const IntraModeCfg *const intra_mode_cfg = &cpi->oxcf.intra_mode_cfg;
1514
0
  PALETTE_MODE_INFO *const pmi = &mbmi->palette_mode_info;
1515
0
  const int try_palette =
1516
0
      cpi->oxcf.tool_cfg.enable_palette &&
1517
0
      av1_allow_palette(cpi->common.features.allow_screen_content_tools,
1518
0
                        mbmi->bsize);
1519
0
  uint8_t *best_palette_color_map =
1520
0
      try_palette ? x->palette_buffer->best_palette_color_map : NULL;
1521
0
  const MB_MODE_INFO *above_mi = xd->above_mbmi;
1522
0
  const MB_MODE_INFO *left_mi = xd->left_mbmi;
1523
0
  const PREDICTION_MODE A = av1_above_block_mode(above_mi);
1524
0
  const PREDICTION_MODE L = av1_left_block_mode(left_mi);
1525
0
  const int above_ctx = intra_mode_context[A];
1526
0
  const int left_ctx = intra_mode_context[L];
1527
0
  bmode_costs = x->mode_costs.y_mode_costs[above_ctx][left_ctx];
1528
1529
0
  mbmi->angle_delta[PLANE_TYPE_Y] = 0;
1530
0
  const INTRA_MODE_SPEED_FEATURES *const intra_sf = &cpi->sf.intra_sf;
1531
0
  if (intra_sf->intra_pruning_with_hog) {
1532
    // Less aggressive thresholds are used here than those used in inter frame
1533
    // encoding in av1_handle_intra_y_mode() because we want key frames/intra
1534
    // frames to have higher quality.
1535
0
    const float thresh[4] = { -1.2f, -1.2f, -0.6f, 0.4f };
1536
0
    const int is_chroma = 0;
1537
0
    prune_intra_mode_with_hog(x, bsize, cpi->common.seq_params->sb_size,
1538
0
                              thresh[intra_sf->intra_pruning_with_hog - 1],
1539
0
                              directional_mode_skip_mask, is_chroma);
1540
0
  }
1541
0
  mbmi->filter_intra_mode_info.use_filter_intra = 0;
1542
0
  pmi->palette_size[0] = 0;
1543
1544
  // Set params for mode evaluation
1545
0
  set_mode_eval_params(cpi, x, MODE_EVAL);
1546
1547
0
  MB_MODE_INFO best_mbmi = *mbmi;
1548
0
  const int max_winner_mode_count =
1549
0
      winner_mode_count_allowed[cpi->sf.winner_mode_sf.multi_winner_mode_type];
1550
0
  zero_winner_mode_stats(bsize, max_winner_mode_count, x->winner_mode_stats);
1551
0
  x->winner_mode_count = 0;
1552
1553
  // Searches the intra-modes except for intrabc, palette, and filter_intra.
1554
0
  int64_t top_intra_model_rd[TOP_INTRA_MODEL_COUNT];
1555
0
  for (int i = 0; i < TOP_INTRA_MODEL_COUNT; i++) {
1556
0
    top_intra_model_rd[i] = INT64_MAX;
1557
0
  }
1558
1559
  // Initialize the rdcost corresponding to all the directional and
1560
  // non-directional intra modes.
1561
  // 1. For directional modes, it stores the rdcost values for delta angles -4,
1562
  // -3, ..., 3, 4.
1563
  // 2. The rdcost value for luma_delta_angle is stored at index
1564
  // luma_delta_angle + MAX_ANGLE_DELTA + 1.
1565
  // 3. The rdcost values for fictitious/nonexistent luma_delta_angle -4 and 4
1566
  // (array indices 0 and 8) are always set to INT64_MAX (the initial value).
1567
0
  int64_t intra_modes_rd_cost[INTRA_MODE_END]
1568
0
                             [SIZE_OF_ANGLE_DELTA_RD_COST_ARRAY];
1569
0
  for (int i = 0; i < INTRA_MODE_END; i++) {
1570
0
    for (int j = 0; j < SIZE_OF_ANGLE_DELTA_RD_COST_ARRAY; j++) {
1571
0
      intra_modes_rd_cost[i][j] = INT64_MAX;
1572
0
    }
1573
0
  }
1574
1575
0
  for (int mode_idx = INTRA_MODE_START; mode_idx < LUMA_MODE_COUNT;
1576
0
       ++mode_idx) {
1577
0
    set_y_mode_and_delta_angle(mode_idx, mbmi,
1578
0
                               intra_sf->prune_luma_odd_delta_angles_in_intra);
1579
0
    RD_STATS this_rd_stats;
1580
0
    int this_rate, this_rate_tokenonly, s;
1581
0
    int is_diagonal_mode;
1582
0
    int64_t this_distortion, this_rd;
1583
0
    const int luma_delta_angle = mbmi->angle_delta[PLANE_TYPE_Y];
1584
1585
0
    is_diagonal_mode = av1_is_diagonal_mode(mbmi->mode);
1586
0
    if (is_diagonal_mode && !intra_mode_cfg->enable_diagonal_intra) continue;
1587
0
    if (av1_is_directional_mode(mbmi->mode) &&
1588
0
        !intra_mode_cfg->enable_directional_intra)
1589
0
      continue;
1590
1591
    // The smooth prediction mode appears to be more frequently picked
1592
    // than horizontal / vertical smooth prediction modes. Hence treat
1593
    // them differently in speed features.
1594
0
    if ((!intra_mode_cfg->enable_smooth_intra ||
1595
0
         intra_sf->disable_smooth_intra) &&
1596
0
        (mbmi->mode == SMOOTH_H_PRED || mbmi->mode == SMOOTH_V_PRED))
1597
0
      continue;
1598
0
    if (!intra_mode_cfg->enable_smooth_intra && mbmi->mode == SMOOTH_PRED)
1599
0
      continue;
1600
1601
    // The functionality of filter intra modes and smooth prediction
1602
    // overlap. Hence smooth prediction is pruned only if all the
1603
    // filter intra modes are enabled.
1604
0
    if (intra_sf->disable_smooth_intra &&
1605
0
        intra_sf->prune_filter_intra_level == 0 && mbmi->mode == SMOOTH_PRED)
1606
0
      continue;
1607
0
    if (!intra_mode_cfg->enable_paeth_intra && mbmi->mode == PAETH_PRED)
1608
0
      continue;
1609
1610
    // Skip the evaluation of modes that do not match with the winner mode in
1611
    // x->mb_mode_cache.
1612
0
    if (x->use_mb_mode_cache && mbmi->mode != x->mb_mode_cache->mode) continue;
1613
1614
0
    is_directional_mode = av1_is_directional_mode(mbmi->mode);
1615
0
    if (is_directional_mode && directional_mode_skip_mask[mbmi->mode]) continue;
1616
0
    if (is_directional_mode &&
1617
0
        !(av1_use_angle_delta(bsize) && intra_mode_cfg->enable_angle_delta) &&
1618
0
        luma_delta_angle != 0)
1619
0
      continue;
1620
1621
    // Use intra_y_mode_mask speed feature to skip intra mode evaluation.
1622
0
    if (!(intra_sf->intra_y_mode_mask[max_txsize_lookup[bsize]] &
1623
0
          (1 << mbmi->mode)))
1624
0
      continue;
1625
1626
0
    if (prune_luma_odd_delta_angles_using_rd_cost(
1627
0
            mbmi, intra_modes_rd_cost[mbmi->mode], best_rd,
1628
0
            intra_sf->prune_luma_odd_delta_angles_in_intra))
1629
0
      continue;
1630
1631
0
    const TX_SIZE tx_size = AOMMIN(TX_32X32, max_txsize_lookup[bsize]);
1632
0
    const int64_t this_model_rd =
1633
0
        intra_model_rd(&cpi->common, x, 0, bsize, tx_size, /*use_hadamard=*/1);
1634
1635
0
    const int model_rd_index_for_pruning =
1636
0
        get_model_rd_index_for_pruning(x, intra_sf);
1637
1638
0
    if (prune_intra_y_mode(this_model_rd, &best_model_rd, top_intra_model_rd,
1639
0
                           intra_sf->top_intra_model_count_allowed,
1640
0
                           model_rd_index_for_pruning))
1641
0
      continue;
1642
1643
    // Builds the actual prediction. The prediction from
1644
    // model_intra_yrd_and_prune was just an estimation that did not take into
1645
    // account the effect of txfm pipeline, so we need to redo it for real
1646
    // here.
1647
0
    av1_pick_uniform_tx_size_type_yrd(cpi, x, &this_rd_stats, bsize, best_rd);
1648
0
    this_rate_tokenonly = this_rd_stats.rate;
1649
0
    this_distortion = this_rd_stats.dist;
1650
0
    s = this_rd_stats.skip_txfm;
1651
1652
0
    if (this_rate_tokenonly == INT_MAX) continue;
1653
1654
0
    if (!xd->lossless[mbmi->segment_id] && block_signals_txsize(mbmi->bsize)) {
1655
      // av1_pick_uniform_tx_size_type_yrd above includes the cost of the
1656
      // tx_size in the tokenonly rate, but for intra blocks, tx_size is always
1657
      // coded (prediction granularity), so we account for it in the full rate,
1658
      // not the tokenonly rate.
1659
0
      this_rate_tokenonly -= tx_size_cost(x, bsize, mbmi->tx_size);
1660
0
    }
1661
0
    this_rate =
1662
0
        this_rd_stats.rate +
1663
0
        intra_mode_info_cost_y(cpi, x, mbmi, bsize, bmode_costs[mbmi->mode], 0);
1664
0
    this_rd = RDCOST(x->rdmult, this_rate, this_distortion);
1665
1666
    // Visual quality adjustment based on recon vs source variance.
1667
0
    if ((cpi->oxcf.mode == ALLINTRA) && (this_rd != INT64_MAX)) {
1668
0
      this_rd = (int64_t)(this_rd * intra_rd_variance_factor(cpi, x, bsize));
1669
0
    }
1670
1671
0
    intra_modes_rd_cost[mbmi->mode][luma_delta_angle + MAX_ANGLE_DELTA + 1] =
1672
0
        this_rd;
1673
1674
    // Collect mode stats for multiwinner mode processing
1675
0
    const int txfm_search_done = 1;
1676
0
    store_winner_mode_stats(
1677
0
        &cpi->common, x, mbmi, NULL, NULL, NULL, 0, NULL, bsize, this_rd,
1678
0
        cpi->sf.winner_mode_sf.multi_winner_mode_type, txfm_search_done);
1679
0
    if (this_rd < best_rd) {
1680
0
      best_mbmi = *mbmi;
1681
0
      best_rd = this_rd;
1682
      // Setting beat_best_rd flag because current mode rd is better than
1683
      // best_rd passed to this function
1684
0
      beat_best_rd = 1;
1685
0
      *rate = this_rate;
1686
0
      *rate_tokenonly = this_rate_tokenonly;
1687
0
      *distortion = this_distortion;
1688
0
      *skippable = s;
1689
0
      memcpy(ctx->blk_skip, x->txfm_search_info.blk_skip,
1690
0
             sizeof(x->txfm_search_info.blk_skip[0]) * ctx->num_4x4_blk);
1691
0
      av1_copy_array(ctx->tx_type_map, xd->tx_type_map, ctx->num_4x4_blk);
1692
0
    }
1693
0
  }
1694
1695
  // Searches palette
1696
0
  if (try_palette) {
1697
0
    av1_rd_pick_palette_intra_sby(
1698
0
        cpi, x, bsize, bmode_costs[DC_PRED], &best_mbmi, best_palette_color_map,
1699
0
        &best_rd, rate, rate_tokenonly, distortion, skippable, &beat_best_rd,
1700
0
        ctx, ctx->blk_skip, ctx->tx_type_map);
1701
0
  }
1702
1703
  // Searches filter_intra
1704
0
  if (beat_best_rd && av1_filter_intra_allowed_bsize(&cpi->common, bsize)) {
1705
0
    if (rd_pick_filter_intra_sby(cpi, x, rate, rate_tokenonly, distortion,
1706
0
                                 skippable, bsize, bmode_costs[DC_PRED],
1707
0
                                 best_mbmi.mode, &best_rd, &best_model_rd,
1708
0
                                 ctx)) {
1709
0
      best_mbmi = *mbmi;
1710
0
    }
1711
0
  }
1712
1713
  // No mode is identified with less rd value than best_rd passed to this
1714
  // function. In such cases winner mode processing is not necessary and return
1715
  // best_rd as INT64_MAX to indicate best mode is not identified
1716
0
  if (!beat_best_rd) return INT64_MAX;
1717
1718
  // In multi-winner mode processing, perform tx search for few best modes
1719
  // identified during mode evaluation. Winner mode processing uses best tx
1720
  // configuration for tx search.
1721
0
  if (cpi->sf.winner_mode_sf.multi_winner_mode_type) {
1722
0
    int best_mode_idx = 0;
1723
0
    int block_width, block_height;
1724
0
    uint8_t *color_map_dst = xd->plane[PLANE_TYPE_Y].color_index_map;
1725
0
    av1_get_block_dimensions(bsize, AOM_PLANE_Y, xd, &block_width,
1726
0
                             &block_height, NULL, NULL);
1727
1728
0
    for (int mode_idx = 0; mode_idx < x->winner_mode_count; mode_idx++) {
1729
0
      *mbmi = x->winner_mode_stats[mode_idx].mbmi;
1730
0
      if (is_winner_mode_processing_enabled(cpi, x, mbmi, 0)) {
1731
        // Restore color_map of palette mode before winner mode processing
1732
0
        if (mbmi->palette_mode_info.palette_size[0] > 0) {
1733
0
          uint8_t *color_map_src =
1734
0
              x->winner_mode_stats[mode_idx].color_index_map;
1735
0
          memcpy(color_map_dst, color_map_src,
1736
0
                 block_width * block_height * sizeof(*color_map_src));
1737
0
        }
1738
        // Set params for winner mode evaluation
1739
0
        set_mode_eval_params(cpi, x, WINNER_MODE_EVAL);
1740
1741
        // Winner mode processing
1742
        // If previous searches use only the default tx type/no R-D optimization
1743
        // of quantized coeffs, do an extra search for the best tx type/better
1744
        // R-D optimization of quantized coeffs
1745
0
        if (intra_block_yrd(cpi, x, bsize, bmode_costs, &best_rd, rate,
1746
0
                            rate_tokenonly, distortion, skippable, &best_mbmi,
1747
0
                            ctx))
1748
0
          best_mode_idx = mode_idx;
1749
0
      }
1750
0
    }
1751
    // Copy color_map of palette mode for final winner mode
1752
0
    if (best_mbmi.palette_mode_info.palette_size[0] > 0) {
1753
0
      uint8_t *color_map_src =
1754
0
          x->winner_mode_stats[best_mode_idx].color_index_map;
1755
0
      memcpy(color_map_dst, color_map_src,
1756
0
             block_width * block_height * sizeof(*color_map_src));
1757
0
    }
1758
0
  } else {
1759
    // If previous searches use only the default tx type/no R-D optimization of
1760
    // quantized coeffs, do an extra search for the best tx type/better R-D
1761
    // optimization of quantized coeffs
1762
0
    if (is_winner_mode_processing_enabled(cpi, x, mbmi, 0)) {
1763
      // Set params for winner mode evaluation
1764
0
      set_mode_eval_params(cpi, x, WINNER_MODE_EVAL);
1765
0
      *mbmi = best_mbmi;
1766
0
      intra_block_yrd(cpi, x, bsize, bmode_costs, &best_rd, rate,
1767
0
                      rate_tokenonly, distortion, skippable, &best_mbmi, ctx);
1768
0
    }
1769
0
  }
1770
0
  *mbmi = best_mbmi;
1771
  av1_copy_array(xd->tx_type_map, ctx->tx_type_map, ctx->num_4x4_blk);
1772
0
  return best_rd;
1773
0
}