Coverage Report

Created: 2026-06-16 07:20

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/aom/av1/encoder/encoder.c
Line
Count
Source
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#include <assert.h>
13
#include <float.h>
14
#include <inttypes.h>
15
#include <limits.h>
16
#include <math.h>
17
#include <stdbool.h>
18
#include <stdint.h>
19
#include <stdio.h>
20
#include <stdlib.h>
21
#include <time.h>
22
23
#include "av1/common/scale.h"
24
#include "config/aom_config.h"
25
#include "config/aom_dsp_rtcd.h"
26
27
#include "aom/aomcx.h"
28
29
#if CONFIG_DENOISE
30
#include "aom_dsp/grain_table.h"
31
#include "aom_dsp/noise_util.h"
32
#include "aom_dsp/noise_model.h"
33
#endif
34
#include "aom_dsp/flow_estimation/corner_detect.h"
35
#include "aom_dsp/psnr.h"
36
#if CONFIG_INTERNAL_STATS
37
#include "aom_dsp/ssim.h"
38
#endif
39
#include "aom_ports/aom_timer.h"
40
#include "aom_ports/mem.h"
41
#include "aom_util/aom_pthread.h"
42
#if CONFIG_BITSTREAM_DEBUG
43
#include "aom_util/debug_util.h"
44
#endif  // CONFIG_BITSTREAM_DEBUG
45
46
#include "av1/common/alloccommon.h"
47
#include "av1/common/debugmodes.h"
48
#include "av1/common/filter.h"
49
#include "av1/common/idct.h"
50
#include "av1/common/reconinter.h"
51
#include "av1/common/reconintra.h"
52
#include "av1/common/resize.h"
53
#include "av1/common/tile_common.h"
54
55
#include "av1/encoder/allintra_vis.h"
56
#include "av1/encoder/aq_complexity.h"
57
#include "av1/encoder/aq_cyclicrefresh.h"
58
#include "av1/encoder/aq_variance.h"
59
#include "av1/encoder/bitstream.h"
60
#if CONFIG_INTERNAL_STATS
61
#include "av1/encoder/blockiness.h"
62
#endif
63
#include "av1/encoder/context_tree.h"
64
#include "av1/encoder/dwt.h"
65
#include "av1/encoder/encodeframe.h"
66
#include "av1/encoder/encodemv.h"
67
#include "av1/encoder/encode_strategy.h"
68
#include "av1/encoder/encoder.h"
69
#include "av1/encoder/encoder_alloc.h"
70
#include "av1/encoder/encoder_utils.h"
71
#include "av1/encoder/encodetxb.h"
72
#include "av1/encoder/ethread.h"
73
#include "av1/encoder/firstpass.h"
74
#include "av1/encoder/hash_motion.h"
75
#include "av1/encoder/hybrid_fwd_txfm.h"
76
#include "av1/encoder/intra_mode_search.h"
77
#include "av1/encoder/mv_prec.h"
78
#include "av1/encoder/pass2_strategy.h"
79
#include "av1/encoder/pickcdef.h"
80
#include "av1/encoder/picklpf.h"
81
#include "av1/encoder/pickrst.h"
82
#include "av1/encoder/random.h"
83
#include "av1/encoder/ratectrl.h"
84
#include "av1/encoder/rc_utils.h"
85
#include "av1/encoder/rd.h"
86
#include "av1/encoder/rdopt.h"
87
#if CONFIG_SALIENCY_MAP
88
#include "av1/encoder/saliency_map.h"
89
#endif
90
#include "av1/encoder/segmentation.h"
91
#include "av1/encoder/speed_features.h"
92
#include "av1/encoder/superres_scale.h"
93
#if CONFIG_THREE_PASS
94
#include "av1/encoder/thirdpass.h"
95
#endif
96
#include "av1/encoder/tpl_model.h"
97
#include "av1/encoder/reconinter_enc.h"
98
#include "av1/encoder/var_based_part.h"
99
100
0
#define DEFAULT_EXPLICIT_ORDER_HINT_BITS 7
101
102
// #define OUTPUT_YUV_REC
103
#ifdef OUTPUT_YUV_REC
104
FILE *yuv_rec_file;
105
#define FILE_NAME_LEN 100
106
#endif
107
108
#ifdef OUTPUT_YUV_DENOISED
109
FILE *yuv_denoised_file = NULL;
110
#endif
111
112
0
static inline void Scale2Ratio(AOM_SCALING_MODE mode, int *hr, int *hs) {
113
0
  switch (mode) {
114
0
    case AOME_NORMAL:
115
0
      *hr = 1;
116
0
      *hs = 1;
117
0
      break;
118
0
    case AOME_FOURFIVE:
119
0
      *hr = 4;
120
0
      *hs = 5;
121
0
      break;
122
0
    case AOME_THREEFIVE:
123
0
      *hr = 3;
124
0
      *hs = 5;
125
0
      break;
126
0
    case AOME_THREEFOUR:
127
0
      *hr = 3;
128
0
      *hs = 4;
129
0
      break;
130
0
    case AOME_ONEFOUR:
131
0
      *hr = 1;
132
0
      *hs = 4;
133
0
      break;
134
0
    case AOME_ONEEIGHT:
135
0
      *hr = 1;
136
0
      *hs = 8;
137
0
      break;
138
0
    case AOME_ONETWO:
139
0
      *hr = 1;
140
0
      *hs = 2;
141
0
      break;
142
0
    case AOME_TWOTHREE:
143
0
      *hr = 2;
144
0
      *hs = 3;
145
0
      break;
146
0
    case AOME_ONETHREE:
147
0
      *hr = 1;
148
0
      *hs = 3;
149
0
      break;
150
0
    default:
151
0
      *hr = 1;
152
0
      *hs = 1;
153
0
      assert(0);
154
0
      break;
155
0
  }
156
0
}
157
158
0
static int check_seg_range(int seg_data[8], int range) {
159
0
  for (int i = 0; i < 8; ++i) {
160
    // Note abs() alone can't be used as the behavior of abs(INT_MIN) is
161
    // undefined.
162
0
    if (seg_data[i] > range || seg_data[i] < -range) {
163
0
      return 0;
164
0
    }
165
0
  }
166
0
  return 1;
167
0
}
168
169
int av1_set_roi_map(AV1_COMP *cpi, unsigned char *map, unsigned int rows,
170
                    unsigned int cols, int delta_q[8], int delta_lf[8],
171
0
                    int skip[8], int ref_frame[8]) {
172
0
  AV1_COMMON *cm = &cpi->common;
173
0
  aom_roi_map_t *roi = &cpi->roi;
174
0
  const int range = 63;
175
0
  const int ref_frame_range = REF_FRAMES;
176
0
  const int skip_range = 1;
177
0
  const int frame_rows = cpi->common.mi_params.mi_rows;
178
0
  const int frame_cols = cpi->common.mi_params.mi_cols;
179
180
  // Check number of rows and columns match
181
0
  if (frame_rows != (int)rows || frame_cols != (int)cols) {
182
0
    return AOM_CODEC_INVALID_PARAM;
183
0
  }
184
185
0
  if (!check_seg_range(delta_q, range) || !check_seg_range(delta_lf, range) ||
186
0
      !check_seg_range(ref_frame, ref_frame_range) ||
187
0
      !check_seg_range(skip, skip_range))
188
0
    return AOM_CODEC_INVALID_PARAM;
189
190
  // Also disable segmentation if no deltas are specified.
191
0
  if (!map ||
192
0
      (!(delta_q[0] | delta_q[1] | delta_q[2] | delta_q[3] | delta_q[4] |
193
0
         delta_q[5] | delta_q[6] | delta_q[7] | delta_lf[0] | delta_lf[1] |
194
0
         delta_lf[2] | delta_lf[3] | delta_lf[4] | delta_lf[5] | delta_lf[6] |
195
0
         delta_lf[7] | skip[0] | skip[1] | skip[2] | skip[3] | skip[4] |
196
0
         skip[5] | skip[6] | skip[7]) &&
197
0
       (ref_frame[0] == -1 && ref_frame[1] == -1 && ref_frame[2] == -1 &&
198
0
        ref_frame[3] == -1 && ref_frame[4] == -1 && ref_frame[5] == -1 &&
199
0
        ref_frame[6] == -1 && ref_frame[7] == -1))) {
200
0
    av1_disable_segmentation(&cm->seg);
201
0
    cpi->roi.enabled = 0;
202
0
    return AOM_CODEC_OK;
203
0
  }
204
205
0
  if (roi->roi_map) {
206
0
    aom_free(roi->roi_map);
207
0
    roi->roi_map = NULL;
208
0
  }
209
0
  roi->roi_map = aom_malloc(rows * cols);
210
0
  if (!roi->roi_map) return AOM_CODEC_MEM_ERROR;
211
212
  // Copy to ROI structure in the compressor.
213
0
  memcpy(roi->roi_map, map, rows * cols);
214
0
  memcpy(&roi->delta_q, delta_q, MAX_SEGMENTS * sizeof(delta_q[0]));
215
0
  memcpy(&roi->delta_lf, delta_lf, MAX_SEGMENTS * sizeof(delta_lf[0]));
216
0
  memcpy(&roi->skip, skip, MAX_SEGMENTS * sizeof(skip[0]));
217
0
  memcpy(&roi->ref_frame, ref_frame, MAX_SEGMENTS * sizeof(ref_frame[0]));
218
0
  roi->enabled = 1;
219
0
  roi->rows = rows;
220
0
  roi->cols = cols;
221
222
0
  return AOM_CODEC_OK;
223
0
}
224
225
int av1_set_active_map(AV1_COMP *cpi, unsigned char *new_map_16x16, int rows,
226
0
                       int cols) {
227
0
  const CommonModeInfoParams *const mi_params = &cpi->common.mi_params;
228
0
  if (rows == mi_params->mb_rows && cols == mi_params->mb_cols) {
229
0
    unsigned char *const active_map_4x4 = cpi->active_map.map;
230
0
    const int mi_rows = mi_params->mi_rows;
231
0
    const int mi_cols = mi_params->mi_cols;
232
0
    cpi->active_map.update = 0;
233
0
    cpi->rc.percent_blocks_inactive = 0;
234
0
    assert(mi_rows % 2 == 0 && mi_rows > 0);
235
0
    assert(mi_cols % 2 == 0 && mi_cols > 0);
236
0
    if (new_map_16x16) {
237
0
      int num_samples = 0;
238
0
      int num_blocks_inactive = 0;
239
0
      for (int r = 0; r < mi_rows; r += 4) {
240
0
        for (int c = 0; c < mi_cols; c += 4) {
241
0
          const uint8_t val = new_map_16x16[(r >> 2) * cols + (c >> 2)]
242
0
                                  ? AM_SEGMENT_ID_ACTIVE
243
0
                                  : AM_SEGMENT_ID_INACTIVE;
244
0
          num_samples++;
245
0
          if (val == AM_SEGMENT_ID_INACTIVE) num_blocks_inactive++;
246
0
          const int row_max = AOMMIN(4, mi_rows - r);
247
0
          const int col_max = AOMMIN(4, mi_cols - c);
248
0
          for (int x = 0; x < row_max; ++x) {
249
0
            for (int y = 0; y < col_max; ++y) {
250
0
              active_map_4x4[(r + x) * mi_cols + (c + y)] = val;
251
0
            }
252
0
          }
253
0
        }
254
0
      }
255
0
      cpi->active_map.enabled = 1;
256
0
      cpi->active_map.update = 1;
257
0
      assert(num_samples);
258
0
      cpi->rc.percent_blocks_inactive =
259
0
          (num_blocks_inactive * 100) / num_samples;
260
0
    }
261
0
    return 0;
262
0
  }
263
264
0
  return -1;
265
0
}
266
267
int av1_get_active_map(AV1_COMP *cpi, unsigned char *new_map_16x16, int rows,
268
0
                       int cols) {
269
0
  const CommonModeInfoParams *const mi_params = &cpi->common.mi_params;
270
0
  if (rows == mi_params->mb_rows && cols == mi_params->mb_cols &&
271
0
      new_map_16x16) {
272
0
    unsigned char *const seg_map_8x8 = cpi->enc_seg.map;
273
0
    const int mi_rows = mi_params->mi_rows;
274
0
    const int mi_cols = mi_params->mi_cols;
275
0
    const int row_scale = mi_size_high_log2[BLOCK_16X16];
276
0
    const int col_scale = mi_size_wide_log2[BLOCK_16X16];
277
0
    assert(mi_rows % 2 == 0);
278
0
    assert(mi_cols % 2 == 0);
279
280
0
    memset(new_map_16x16, !cpi->active_map.enabled, rows * cols);
281
0
    if (cpi->active_map.enabled) {
282
0
      for (int r = 0; r < (mi_rows >> row_scale); ++r) {
283
0
        for (int c = 0; c < (mi_cols >> col_scale); ++c) {
284
          // Cyclic refresh segments are considered active despite not having
285
          // AM_SEGMENT_ID_ACTIVE
286
0
          uint8_t temp = 0;
287
0
          temp |= seg_map_8x8[(2 * r + 0) * mi_cols + (2 * c + 0)] !=
288
0
                  AM_SEGMENT_ID_INACTIVE;
289
0
          temp |= seg_map_8x8[(2 * r + 0) * mi_cols + (2 * c + 1)] !=
290
0
                  AM_SEGMENT_ID_INACTIVE;
291
0
          temp |= seg_map_8x8[(2 * r + 1) * mi_cols + (2 * c + 0)] !=
292
0
                  AM_SEGMENT_ID_INACTIVE;
293
0
          temp |= seg_map_8x8[(2 * r + 1) * mi_cols + (2 * c + 1)] !=
294
0
                  AM_SEGMENT_ID_INACTIVE;
295
0
          new_map_16x16[r * cols + c] |= temp;
296
0
        }
297
0
      }
298
0
    }
299
0
    return 0;
300
0
  }
301
302
0
  return -1;
303
0
}
304
305
0
void av1_initialize_enc(unsigned int usage, enum aom_rc_mode end_usage) {
306
0
  bool is_allintra = usage == ALLINTRA;
307
308
0
  av1_rtcd();
309
0
  aom_dsp_rtcd();
310
0
  aom_scale_rtcd();
311
0
  av1_init_intra_predictors();
312
0
  av1_init_me_luts();
313
0
  if (!is_allintra) av1_init_wedge_masks();
314
0
  if (!is_allintra || end_usage != AOM_Q) av1_rc_init_minq_luts();
315
0
}
316
317
0
void av1_new_framerate(AV1_COMP *cpi, double framerate) {
318
0
  cpi->framerate = framerate < 0.1 ? 30 : framerate;
319
0
  av1_rc_update_framerate(cpi, cpi->common.width, cpi->common.height);
320
0
}
321
322
double av1_get_compression_ratio(const AV1_COMMON *const cm,
323
0
                                 size_t encoded_frame_size) {
324
0
  const int upscaled_width = cm->superres_upscaled_width;
325
0
  const int height = cm->height;
326
0
  const int64_t luma_pic_size = (int64_t)upscaled_width * height;
327
0
  const SequenceHeader *const seq_params = cm->seq_params;
328
0
  const BITSTREAM_PROFILE profile = seq_params->profile;
329
0
  const int pic_size_profile_factor =
330
0
      profile == PROFILE_0 ? 15 : (profile == PROFILE_1 ? 30 : 36);
331
0
  encoded_frame_size =
332
0
      (encoded_frame_size > 129 ? encoded_frame_size - 128 : 1);
333
0
  const int64_t uncompressed_frame_size =
334
0
      (luma_pic_size * pic_size_profile_factor) >> 3;
335
0
  return (double)uncompressed_frame_size / encoded_frame_size;
336
0
}
337
338
static void auto_tile_size_balancing(AV1_COMMON *const cm, int num_sbs,
339
0
                                     int num_tiles_lg, int tile_col_row) {
340
0
  CommonTileParams *const tiles = &cm->tiles;
341
0
  int i, start_sb;
342
0
  int size_sb = num_sbs >> num_tiles_lg;
343
0
  int res_sbs = num_sbs - (size_sb << num_tiles_lg);
344
0
  int num_tiles = 1 << num_tiles_lg;
345
0
  int inc_index = num_tiles - res_sbs;
346
347
0
  tiles->uniform_spacing = 0;
348
349
0
  const int max_size_sb =
350
0
      tile_col_row ? tiles->max_width_sb : tiles->max_height_sb;
351
0
  for (i = 0, start_sb = 0; start_sb < num_sbs && i < MAX_TILE_COLS; ++i) {
352
0
    if (i == inc_index) ++size_sb;
353
0
    if (tile_col_row)
354
0
      tiles->col_start_sb[i] = start_sb;
355
0
    else
356
0
      tiles->row_start_sb[i] = start_sb;
357
358
0
    start_sb += AOMMIN(size_sb, max_size_sb);
359
0
  }
360
361
0
  if (tile_col_row) {
362
0
    tiles->cols = i;
363
0
    tiles->col_start_sb[i] = num_sbs;
364
0
  } else {
365
0
    tiles->rows = i;
366
0
    tiles->row_start_sb[i] = num_sbs;
367
0
  }
368
0
}
369
370
static void set_tile_info(AV1_COMMON *const cm,
371
0
                          const TileConfig *const tile_cfg) {
372
0
  const CommonModeInfoParams *const mi_params = &cm->mi_params;
373
0
  const SequenceHeader *const seq_params = cm->seq_params;
374
0
  CommonTileParams *const tiles = &cm->tiles;
375
0
  int i, start_sb;
376
377
0
  av1_get_tile_limits(cm);
378
379
0
  int sb_cols =
380
0
      CEIL_POWER_OF_TWO(mi_params->mi_cols, seq_params->mib_size_log2);
381
  // configure tile columns
382
0
  if (tile_cfg->tile_width_count == 0 || tile_cfg->tile_height_count == 0) {
383
0
    tiles->uniform_spacing = 1;
384
0
    tiles->log2_cols = AOMMAX(tile_cfg->tile_columns, tiles->min_log2_cols);
385
    // Add a special case to handle super resolution
386
0
    sb_cols = coded_to_superres_mi(sb_cols, cm->superres_scale_denominator);
387
0
    int min_log2_cols = 0;
388
0
    for (; (tiles->max_width_sb << min_log2_cols) <= sb_cols; ++min_log2_cols) {
389
0
    }
390
0
    tiles->log2_cols = AOMMAX(tiles->log2_cols, min_log2_cols);
391
392
0
    tiles->log2_cols = AOMMIN(tiles->log2_cols, tiles->max_log2_cols);
393
0
  } else if (tile_cfg->tile_widths[0] < 0) {
394
0
    auto_tile_size_balancing(cm, sb_cols, tile_cfg->tile_columns, 1);
395
0
  } else {
396
0
    int size_sb, j = 0;
397
0
    tiles->uniform_spacing = 0;
398
0
    for (i = 0, start_sb = 0; start_sb < sb_cols && i < MAX_TILE_COLS; i++) {
399
0
      tiles->col_start_sb[i] = start_sb;
400
0
      size_sb = tile_cfg->tile_widths[j++];
401
0
      if (j >= tile_cfg->tile_width_count) j = 0;
402
0
      start_sb += AOMMIN(size_sb, tiles->max_width_sb);
403
0
    }
404
0
    tiles->cols = i;
405
0
    tiles->col_start_sb[i] = sb_cols;
406
0
  }
407
0
  av1_calculate_tile_cols(seq_params, mi_params->mi_rows, mi_params->mi_cols,
408
0
                          tiles);
409
410
  // configure tile rows
411
0
  int sb_rows =
412
0
      CEIL_POWER_OF_TWO(mi_params->mi_rows, seq_params->mib_size_log2);
413
0
  if (tiles->uniform_spacing) {
414
0
    tiles->log2_rows = AOMMAX(tile_cfg->tile_rows, tiles->min_log2_rows);
415
0
    tiles->log2_rows = AOMMIN(tiles->log2_rows, tiles->max_log2_rows);
416
0
  } else if (tile_cfg->tile_heights[0] < 0) {
417
0
    auto_tile_size_balancing(cm, sb_rows, tile_cfg->tile_rows, 0);
418
0
  } else {
419
0
    int size_sb, j = 0;
420
0
    for (i = 0, start_sb = 0; start_sb < sb_rows && i < MAX_TILE_ROWS; i++) {
421
0
      tiles->row_start_sb[i] = start_sb;
422
0
      size_sb = tile_cfg->tile_heights[j++];
423
0
      if (j >= tile_cfg->tile_height_count) j = 0;
424
0
      start_sb += AOMMIN(size_sb, tiles->max_height_sb);
425
0
    }
426
0
    tiles->rows = i;
427
0
    tiles->row_start_sb[i] = sb_rows;
428
0
  }
429
0
  av1_calculate_tile_rows(seq_params, mi_params->mi_rows, tiles);
430
0
}
431
432
0
void av1_update_frame_size(AV1_COMP *cpi) {
433
0
  AV1_COMMON *const cm = &cpi->common;
434
0
  MACROBLOCKD *const xd = &cpi->td.mb.e_mbd;
435
436
  // Setup mi_params here in case we need more mi's.
437
0
  CommonModeInfoParams *const mi_params = &cm->mi_params;
438
0
  mi_params->set_mb_mi(mi_params, cm->width, cm->height,
439
0
                       cpi->sf.part_sf.default_min_partition_size);
440
441
0
  av1_init_macroblockd(cm, xd);
442
443
0
  if (!cpi->ppi->seq_params_locked)
444
0
    set_sb_size(cm->seq_params,
445
0
                av1_select_sb_size(&cpi->oxcf, cm->width, cm->height,
446
0
                                   cpi->ppi->number_spatial_layers));
447
448
0
  set_tile_info(cm, &cpi->oxcf.tile_cfg);
449
0
}
450
451
static inline int does_level_match(int width, int height, double fps,
452
                                   int lvl_width, int lvl_height,
453
0
                                   double lvl_fps, int lvl_dim_mult) {
454
0
  const int64_t lvl_luma_pels = (int64_t)lvl_width * lvl_height;
455
0
  const double lvl_display_sample_rate = lvl_luma_pels * lvl_fps;
456
0
  const int64_t luma_pels = (int64_t)width * height;
457
0
  const double display_sample_rate = luma_pels * fps;
458
0
  return luma_pels <= lvl_luma_pels &&
459
0
         display_sample_rate <= lvl_display_sample_rate &&
460
0
         width <= lvl_width * lvl_dim_mult &&
461
0
         height <= lvl_height * lvl_dim_mult;
462
0
}
463
464
static void set_bitstream_level_tier(AV1_PRIMARY *const ppi, int width,
465
0
                                     int height, double init_framerate) {
466
0
  SequenceHeader *const seq_params = &ppi->seq_params;
467
0
  const AV1LevelParams *const level_params = &ppi->level_params;
468
  // TODO(any): This is a placeholder function that only addresses dimensions
469
  // and max display sample rates.
470
  // Need to add checks for max bit rate, max decoded luma sample rate, header
471
  // rate, etc. that are not covered by this function.
472
0
  AV1_LEVEL level = SEQ_LEVEL_MAX;
473
0
  if (does_level_match(width, height, init_framerate, 512, 288, 30.0, 4)) {
474
0
    level = SEQ_LEVEL_2_0;
475
0
  } else if (does_level_match(width, height, init_framerate, 704, 396, 30.0,
476
0
                              4)) {
477
0
    level = SEQ_LEVEL_2_1;
478
0
  } else if (does_level_match(width, height, init_framerate, 1088, 612, 30.0,
479
0
                              4)) {
480
0
    level = SEQ_LEVEL_3_0;
481
0
  } else if (does_level_match(width, height, init_framerate, 1376, 774, 30.0,
482
0
                              4)) {
483
0
    level = SEQ_LEVEL_3_1;
484
0
  } else if (does_level_match(width, height, init_framerate, 2048, 1152, 30.0,
485
0
                              3)) {
486
0
    level = SEQ_LEVEL_4_0;
487
0
  } else if (does_level_match(width, height, init_framerate, 2048, 1152, 60.0,
488
0
                              3)) {
489
0
    level = SEQ_LEVEL_4_1;
490
0
  } else if (does_level_match(width, height, init_framerate, 4096, 2176, 30.0,
491
0
                              2)) {
492
0
    level = SEQ_LEVEL_5_0;
493
0
  } else if (does_level_match(width, height, init_framerate, 4096, 2176, 60.0,
494
0
                              2)) {
495
0
    level = SEQ_LEVEL_5_1;
496
0
  } else if (does_level_match(width, height, init_framerate, 4096, 2176, 120.0,
497
0
                              2)) {
498
0
    level = SEQ_LEVEL_5_2;
499
0
  } else if (does_level_match(width, height, init_framerate, 8192, 4352, 30.0,
500
0
                              2)) {
501
0
    level = SEQ_LEVEL_6_0;
502
0
  } else if (does_level_match(width, height, init_framerate, 8192, 4352, 60.0,
503
0
                              2)) {
504
0
    level = SEQ_LEVEL_6_1;
505
0
  } else if (does_level_match(width, height, init_framerate, 8192, 4352, 120.0,
506
0
                              2)) {
507
0
    level = SEQ_LEVEL_6_2;
508
0
  }
509
#if CONFIG_CWG_C013
510
  // TODO(bohanli): currently target level is only working for the 0th operating
511
  // point, so scalable coding is not supported.
512
  else if (level_params->target_seq_level_idx[0] >= SEQ_LEVEL_7_0 &&
513
           level_params->target_seq_level_idx[0] <= SEQ_LEVEL_8_3) {
514
    // Only use level 7.x to 8.x when explicitly asked to.
515
    if (does_level_match(width, height, init_framerate, 16384, 8704, 30.0, 2)) {
516
      level = SEQ_LEVEL_7_0;
517
    } else if (does_level_match(width, height, init_framerate, 16384, 8704,
518
                                60.0, 2)) {
519
      level = SEQ_LEVEL_7_1;
520
    } else if (does_level_match(width, height, init_framerate, 16384, 8704,
521
                                120.0, 2)) {
522
      level = SEQ_LEVEL_7_2;
523
    } else if (does_level_match(width, height, init_framerate, 32768, 17408,
524
                                30.0, 2)) {
525
      level = SEQ_LEVEL_8_0;
526
    } else if (does_level_match(width, height, init_framerate, 32768, 17408,
527
                                60.0, 2)) {
528
      level = SEQ_LEVEL_8_1;
529
    } else if (does_level_match(width, height, init_framerate, 32768, 17408,
530
                                120.0, 2)) {
531
      level = SEQ_LEVEL_8_2;
532
    }
533
  }
534
#endif
535
536
0
  for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) {
537
0
    assert(is_valid_seq_level_idx(level_params->target_seq_level_idx[i]) ||
538
0
           level_params->target_seq_level_idx[i] == SEQ_LEVEL_KEEP_STATS);
539
    // If a higher target level is specified, it is then used rather than the
540
    // inferred one from resolution and framerate.
541
0
    seq_params->seq_level_idx[i] =
542
0
        level_params->target_seq_level_idx[i] < SEQ_LEVELS &&
543
0
                level_params->target_seq_level_idx[i] > level
544
0
            ? level_params->target_seq_level_idx[i]
545
0
            : level;
546
    // Set the maximum parameters for bitrate and buffer size for this profile,
547
    // level, and tier
548
0
    seq_params->op_params[i].bitrate = av1_max_level_bitrate(
549
0
        seq_params->profile, seq_params->seq_level_idx[i], seq_params->tier[i]);
550
    // Level with seq_level_idx = 31 returns a high "dummy" bitrate to pass the
551
    // check
552
0
    if (seq_params->op_params[i].bitrate == 0)
553
0
      aom_internal_error(
554
0
          &ppi->error, AOM_CODEC_UNSUP_BITSTREAM,
555
0
          "AV1 does not support this combination of profile, level, and tier.");
556
    // Buffer size in bits is bitrate in bits/s * 1 s
557
0
    seq_params->op_params[i].buffer_size = seq_params->op_params[i].bitrate;
558
0
  }
559
0
}
560
561
0
void av1_set_svc_seq_params(AV1_PRIMARY *const ppi) {
562
0
  SequenceHeader *const seq = &ppi->seq_params;
563
0
  if (seq->operating_points_cnt_minus_1 == 0) {
564
0
    seq->operating_point_idc[0] = 0;
565
0
    seq->has_nonzero_operating_point_idc = false;
566
0
  } else {
567
    // Set operating_point_idc[] such that the i=0 point corresponds to the
568
    // highest quality operating point (all layers), and subsequent
569
    // operarting points (i > 0) are lower quality corresponding to
570
    // skip decoding enhancement  layers (temporal first).
571
0
    int i = 0;
572
0
    assert(seq->operating_points_cnt_minus_1 ==
573
0
           (int)(ppi->number_spatial_layers * ppi->number_temporal_layers - 1));
574
0
    for (unsigned int sl = 0; sl < ppi->number_spatial_layers; sl++) {
575
0
      for (unsigned int tl = 0; tl < ppi->number_temporal_layers; tl++) {
576
0
        seq->operating_point_idc[i] =
577
0
            (~(~0u << (ppi->number_spatial_layers - sl)) << 8) |
578
0
            ~(~0u << (ppi->number_temporal_layers - tl));
579
0
        assert(seq->operating_point_idc[i] != 0);
580
0
        i++;
581
0
      }
582
0
    }
583
0
    seq->has_nonzero_operating_point_idc = true;
584
0
  }
585
0
}
586
587
static void init_seq_coding_tools(AV1_PRIMARY *const ppi,
588
                                  const AV1EncoderConfig *oxcf,
589
0
                                  int disable_frame_id_numbers) {
590
0
  SequenceHeader *const seq = &ppi->seq_params;
591
0
  const FrameDimensionCfg *const frm_dim_cfg = &oxcf->frm_dim_cfg;
592
0
  const ToolCfg *const tool_cfg = &oxcf->tool_cfg;
593
594
0
  seq->still_picture =
595
0
      !tool_cfg->force_video_mode && (oxcf->input_cfg.limit == 1);
596
0
  seq->reduced_still_picture_hdr =
597
0
      seq->still_picture && !tool_cfg->full_still_picture_hdr;
598
0
  seq->force_screen_content_tools = 2;
599
0
  seq->force_integer_mv = 2;
600
0
  seq->order_hint_info.enable_order_hint = tool_cfg->enable_order_hint;
601
0
  seq->frame_id_numbers_present_flag =
602
0
      !seq->reduced_still_picture_hdr &&
603
0
      !oxcf->tile_cfg.enable_large_scale_tile &&
604
0
      tool_cfg->error_resilient_mode && !disable_frame_id_numbers;
605
0
  if (seq->reduced_still_picture_hdr) {
606
0
    seq->order_hint_info.enable_order_hint = 0;
607
0
    seq->force_screen_content_tools = 2;
608
0
    seq->force_integer_mv = 2;
609
0
  }
610
0
  seq->order_hint_info.order_hint_bits_minus_1 =
611
0
      seq->order_hint_info.enable_order_hint
612
0
          ? DEFAULT_EXPLICIT_ORDER_HINT_BITS - 1
613
0
          : -1;
614
615
0
  seq->max_frame_width = frm_dim_cfg->forced_max_frame_width
616
0
                             ? frm_dim_cfg->forced_max_frame_width
617
0
                             : AOMMAX(seq->max_frame_width, frm_dim_cfg->width);
618
0
  seq->max_frame_height =
619
0
      frm_dim_cfg->forced_max_frame_height
620
0
          ? frm_dim_cfg->forced_max_frame_height
621
0
          : AOMMAX(seq->max_frame_height, frm_dim_cfg->height);
622
0
  seq->num_bits_width =
623
0
      (seq->max_frame_width > 1) ? get_msb(seq->max_frame_width - 1) + 1 : 1;
624
0
  seq->num_bits_height =
625
0
      (seq->max_frame_height > 1) ? get_msb(seq->max_frame_height - 1) + 1 : 1;
626
0
  assert(seq->num_bits_width <= 16);
627
0
  assert(seq->num_bits_height <= 16);
628
629
0
  seq->frame_id_length = FRAME_ID_LENGTH;
630
0
  seq->delta_frame_id_length = DELTA_FRAME_ID_LENGTH;
631
632
0
  seq->enable_dual_filter = tool_cfg->enable_dual_filter;
633
0
  seq->order_hint_info.enable_dist_wtd_comp =
634
0
      oxcf->comp_type_cfg.enable_dist_wtd_comp;
635
0
  seq->order_hint_info.enable_dist_wtd_comp &=
636
0
      seq->order_hint_info.enable_order_hint;
637
0
  seq->order_hint_info.enable_ref_frame_mvs = tool_cfg->ref_frame_mvs_present;
638
0
  seq->order_hint_info.enable_ref_frame_mvs &=
639
0
      seq->order_hint_info.enable_order_hint;
640
0
  seq->enable_superres = oxcf->superres_cfg.enable_superres;
641
0
  seq->enable_cdef = tool_cfg->cdef_control != CDEF_NONE ? 1 : 0;
642
0
  seq->enable_restoration = tool_cfg->enable_restoration;
643
0
  seq->enable_warped_motion = oxcf->motion_mode_cfg.enable_warped_motion;
644
0
  seq->enable_interintra_compound = tool_cfg->enable_interintra_comp;
645
0
  seq->enable_masked_compound = oxcf->comp_type_cfg.enable_masked_comp;
646
0
  seq->enable_intra_edge_filter = oxcf->intra_mode_cfg.enable_intra_edge_filter;
647
0
  seq->enable_filter_intra = oxcf->intra_mode_cfg.enable_filter_intra;
648
649
0
  set_bitstream_level_tier(ppi, frm_dim_cfg->width, frm_dim_cfg->height,
650
0
                           oxcf->input_cfg.init_framerate);
651
0
  av1_set_svc_seq_params(ppi);
652
0
}
653
654
static void init_config_sequence(struct AV1_PRIMARY *ppi,
655
0
                                 const AV1EncoderConfig *oxcf) {
656
0
  SequenceHeader *const seq_params = &ppi->seq_params;
657
0
  const DecoderModelCfg *const dec_model_cfg = &oxcf->dec_model_cfg;
658
0
  const ColorCfg *const color_cfg = &oxcf->color_cfg;
659
660
0
  ppi->use_svc = 0;
661
0
  ppi->number_spatial_layers = 1;
662
0
  ppi->number_temporal_layers = 1;
663
664
0
  seq_params->profile = oxcf->profile;
665
0
  seq_params->bit_depth = oxcf->tool_cfg.bit_depth;
666
0
  seq_params->use_highbitdepth = oxcf->use_highbitdepth;
667
0
  seq_params->color_primaries = color_cfg->color_primaries;
668
0
  seq_params->transfer_characteristics = color_cfg->transfer_characteristics;
669
0
  seq_params->matrix_coefficients = color_cfg->matrix_coefficients;
670
0
  seq_params->monochrome = oxcf->tool_cfg.enable_monochrome;
671
0
  seq_params->chroma_sample_position = color_cfg->chroma_sample_position;
672
0
  seq_params->color_range = color_cfg->color_range;
673
0
  seq_params->timing_info_present = dec_model_cfg->timing_info_present;
674
0
  seq_params->timing_info.num_units_in_display_tick =
675
0
      dec_model_cfg->timing_info.num_units_in_display_tick;
676
0
  seq_params->timing_info.time_scale = dec_model_cfg->timing_info.time_scale;
677
0
  seq_params->timing_info.equal_picture_interval =
678
0
      dec_model_cfg->timing_info.equal_picture_interval;
679
0
  seq_params->timing_info.num_ticks_per_picture =
680
0
      dec_model_cfg->timing_info.num_ticks_per_picture;
681
682
0
  seq_params->display_model_info_present_flag =
683
0
      dec_model_cfg->display_model_info_present_flag;
684
0
  seq_params->decoder_model_info_present_flag =
685
0
      dec_model_cfg->decoder_model_info_present_flag;
686
0
  if (dec_model_cfg->decoder_model_info_present_flag) {
687
    // set the decoder model parameters in schedule mode
688
0
    seq_params->decoder_model_info.num_units_in_decoding_tick =
689
0
        dec_model_cfg->num_units_in_decoding_tick;
690
0
    ppi->buffer_removal_time_present = 1;
691
0
    av1_set_aom_dec_model_info(&seq_params->decoder_model_info);
692
0
    av1_set_dec_model_op_parameters(&seq_params->op_params[0]);
693
0
  } else if (seq_params->timing_info_present &&
694
0
             seq_params->timing_info.equal_picture_interval &&
695
0
             !seq_params->decoder_model_info_present_flag) {
696
    // set the decoder model parameters in resource availability mode
697
0
    av1_set_resource_availability_parameters(&seq_params->op_params[0]);
698
0
  } else {
699
0
    seq_params->op_params[0].initial_display_delay =
700
0
        10;  // Default value (not signaled)
701
0
  }
702
703
0
  if (seq_params->monochrome) {
704
0
    seq_params->subsampling_x = 1;
705
0
    seq_params->subsampling_y = 1;
706
0
  } else if (seq_params->color_primaries == AOM_CICP_CP_BT_709 &&
707
0
             seq_params->transfer_characteristics == AOM_CICP_TC_SRGB &&
708
0
             seq_params->matrix_coefficients == AOM_CICP_MC_IDENTITY) {
709
0
    seq_params->subsampling_x = 0;
710
0
    seq_params->subsampling_y = 0;
711
0
  } else {
712
0
    if (seq_params->profile == 0) {
713
0
      seq_params->subsampling_x = 1;
714
0
      seq_params->subsampling_y = 1;
715
0
    } else if (seq_params->profile == 1) {
716
0
      seq_params->subsampling_x = 0;
717
0
      seq_params->subsampling_y = 0;
718
0
    } else {
719
0
      if (seq_params->bit_depth == AOM_BITS_12) {
720
0
        seq_params->subsampling_x = oxcf->input_cfg.chroma_subsampling_x;
721
0
        seq_params->subsampling_y = oxcf->input_cfg.chroma_subsampling_y;
722
0
      } else {
723
0
        seq_params->subsampling_x = 1;
724
0
        seq_params->subsampling_y = 0;
725
0
      }
726
0
    }
727
0
  }
728
0
  av1_change_config_seq(ppi, oxcf, NULL);
729
0
}
730
731
0
static void init_config(struct AV1_COMP *cpi, const AV1EncoderConfig *oxcf) {
732
0
  AV1_COMMON *const cm = &cpi->common;
733
0
  ResizePendingParams *resize_pending_params = &cpi->resize_pending_params;
734
735
0
  cpi->oxcf = *oxcf;
736
0
  cpi->framerate = oxcf->input_cfg.init_framerate;
737
738
0
  cm->width = oxcf->frm_dim_cfg.width;
739
0
  cm->height = oxcf->frm_dim_cfg.height;
740
0
  cpi->is_dropped_frame = false;
741
742
0
  alloc_compressor_data(cpi);
743
744
0
  cpi->data_alloc_width = cm->width;
745
0
  cpi->data_alloc_height = cm->height;
746
0
  cpi->frame_size_related_setup_done = false;
747
748
  // Single thread case: use counts in common.
749
0
  cpi->td.counts = &cpi->counts;
750
751
  // Init SVC parameters.
752
0
  cpi->svc.number_spatial_layers = 1;
753
0
  cpi->svc.number_temporal_layers = 1;
754
0
  cm->spatial_layer_id = 0;
755
0
  cm->temporal_layer_id = 0;
756
0
  cpi->src_sad_blk_alloc_size = 0;
757
  // Init rtc_ref parameters.
758
0
  cpi->ppi->rtc_ref.set_ref_frame_config = 0;
759
0
  cpi->ppi->rtc_ref.non_reference_frame = 0;
760
0
  cpi->ppi->rtc_ref.ref_frame_comp[0] = 0;
761
0
  cpi->ppi->rtc_ref.ref_frame_comp[1] = 0;
762
0
  cpi->ppi->rtc_ref.ref_frame_comp[2] = 0;
763
764
  // change includes all joint functionality
765
0
  av1_change_config(cpi, oxcf, false);
766
767
0
  cpi->ref_frame_flags = 0;
768
769
  // Reset resize pending flags
770
0
  resize_pending_params->width = 0;
771
0
  resize_pending_params->height = 0;
772
773
  // Setup identity scale factor
774
0
  av1_setup_scale_factors_for_frame(&cm->sf_identity, 1, 1, 1, 1);
775
776
0
  init_buffer_indices(&cpi->force_intpel_info, cm->remapped_ref_idx);
777
778
0
  av1_noise_estimate_init(&cpi->noise_estimate, cm->width, cm->height);
779
0
}
780
781
void av1_change_config_seq(struct AV1_PRIMARY *ppi,
782
                           const AV1EncoderConfig *oxcf,
783
0
                           bool *is_sb_size_changed) {
784
0
  SequenceHeader *const seq_params = &ppi->seq_params;
785
0
  const FrameDimensionCfg *const frm_dim_cfg = &oxcf->frm_dim_cfg;
786
0
  const DecoderModelCfg *const dec_model_cfg = &oxcf->dec_model_cfg;
787
0
  const ColorCfg *const color_cfg = &oxcf->color_cfg;
788
789
0
  if (seq_params->profile != oxcf->profile) seq_params->profile = oxcf->profile;
790
0
  seq_params->bit_depth = oxcf->tool_cfg.bit_depth;
791
0
  seq_params->color_primaries = color_cfg->color_primaries;
792
0
  seq_params->transfer_characteristics = color_cfg->transfer_characteristics;
793
0
  seq_params->matrix_coefficients = color_cfg->matrix_coefficients;
794
0
  seq_params->monochrome = oxcf->tool_cfg.enable_monochrome;
795
0
  seq_params->chroma_sample_position = color_cfg->chroma_sample_position;
796
0
  seq_params->color_range = color_cfg->color_range;
797
798
0
  assert(IMPLIES(seq_params->profile <= PROFILE_1,
799
0
                 seq_params->bit_depth <= AOM_BITS_10));
800
801
0
  seq_params->timing_info_present = dec_model_cfg->timing_info_present;
802
0
  seq_params->timing_info.num_units_in_display_tick =
803
0
      dec_model_cfg->timing_info.num_units_in_display_tick;
804
0
  seq_params->timing_info.time_scale = dec_model_cfg->timing_info.time_scale;
805
0
  seq_params->timing_info.equal_picture_interval =
806
0
      dec_model_cfg->timing_info.equal_picture_interval;
807
0
  seq_params->timing_info.num_ticks_per_picture =
808
0
      dec_model_cfg->timing_info.num_ticks_per_picture;
809
810
0
  seq_params->display_model_info_present_flag =
811
0
      dec_model_cfg->display_model_info_present_flag;
812
0
  seq_params->decoder_model_info_present_flag =
813
0
      dec_model_cfg->decoder_model_info_present_flag;
814
0
  if (dec_model_cfg->decoder_model_info_present_flag) {
815
    // set the decoder model parameters in schedule mode
816
0
    seq_params->decoder_model_info.num_units_in_decoding_tick =
817
0
        dec_model_cfg->num_units_in_decoding_tick;
818
0
    ppi->buffer_removal_time_present = 1;
819
0
    av1_set_aom_dec_model_info(&seq_params->decoder_model_info);
820
0
    av1_set_dec_model_op_parameters(&seq_params->op_params[0]);
821
0
  } else if (seq_params->timing_info_present &&
822
0
             seq_params->timing_info.equal_picture_interval &&
823
0
             !seq_params->decoder_model_info_present_flag) {
824
    // set the decoder model parameters in resource availability mode
825
0
    av1_set_resource_availability_parameters(&seq_params->op_params[0]);
826
0
  } else {
827
0
    seq_params->op_params[0].initial_display_delay =
828
0
        10;  // Default value (not signaled)
829
0
  }
830
831
0
#if !CONFIG_REALTIME_ONLY
832
0
  av1_update_film_grain_parameters_seq(ppi, oxcf);
833
0
#endif
834
835
0
  int sb_size = seq_params->sb_size;
836
  // Superblock size should not be updated after the first key frame.
837
0
  if (!ppi->seq_params_locked) {
838
0
    set_sb_size(seq_params, av1_select_sb_size(oxcf, frm_dim_cfg->width,
839
0
                                               frm_dim_cfg->height,
840
0
                                               ppi->number_spatial_layers));
841
0
    for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i)
842
0
      seq_params->tier[i] = (oxcf->tier_mask >> i) & 1;
843
0
  }
844
0
  if (is_sb_size_changed != NULL && sb_size != seq_params->sb_size)
845
0
    *is_sb_size_changed = true;
846
847
  // Init sequence level coding tools
848
  // This should not be called after the first key frame.
849
  // Note that for SVC encoding the sequence parameters
850
  // (operating_points_cnt_minus_1, operating_point_idc[],
851
  // has_nonzero_operating_point_idc) should be updated whenever the
852
  // number of layers is changed. This is done in the
853
  // ctrl_set_svc_params().
854
0
  if (!ppi->seq_params_locked) {
855
0
    seq_params->operating_points_cnt_minus_1 =
856
0
        (ppi->number_spatial_layers > 1 || ppi->number_temporal_layers > 1)
857
0
            ? ppi->number_spatial_layers * ppi->number_temporal_layers - 1
858
0
            : 0;
859
0
    init_seq_coding_tools(ppi, oxcf,
860
0
                          ppi->use_svc || ppi->rtc_ref.set_ref_frame_config);
861
0
  }
862
0
  seq_params->timing_info_present &= !seq_params->reduced_still_picture_hdr;
863
864
0
#if CONFIG_AV1_HIGHBITDEPTH
865
0
  highbd_set_var_fns(ppi);
866
0
#endif
867
868
0
  set_primary_rc_buffer_sizes(oxcf, ppi);
869
0
}
870
871
void av1_change_config(struct AV1_COMP *cpi, const AV1EncoderConfig *oxcf,
872
0
                       bool is_sb_size_changed) {
873
0
  AV1_COMMON *const cm = &cpi->common;
874
0
  SequenceHeader *const seq_params = cm->seq_params;
875
0
  RATE_CONTROL *const rc = &cpi->rc;
876
0
  PRIMARY_RATE_CONTROL *const p_rc = &cpi->ppi->p_rc;
877
0
  MACROBLOCK *const x = &cpi->td.mb;
878
0
  AV1LevelParams *const level_params = &cpi->ppi->level_params;
879
0
  RefreshFrameInfo *const refresh_frame = &cpi->refresh_frame;
880
0
  const FrameDimensionCfg *const frm_dim_cfg = &cpi->oxcf.frm_dim_cfg;
881
0
  const RateControlCfg *const rc_cfg = &oxcf->rc_cfg;
882
0
  FeatureFlags *const features = &cm->features;
883
0
  const int is_highbitdepth = seq_params->use_highbitdepth;
884
885
  // in case of LAP, lag in frames is set according to number of lap buffers
886
  // calculated at init time. This stores and restores LAP's lag in frames to
887
  // prevent override by new cfg.
888
0
  int lap_lag_in_frames = -1;
889
0
  if (cpi->ppi->lap_enabled && cpi->compressor_stage == LAP_STAGE) {
890
0
    lap_lag_in_frames = cpi->oxcf.gf_cfg.lag_in_frames;
891
0
  }
892
893
0
  cpi->oxcf = *oxcf;
894
895
0
#if !CONFIG_REALTIME_ONLY
896
0
  av1_update_film_grain_parameters(cpi, oxcf);
897
0
#endif
898
899
  // When user provides superres_mode = AOM_SUPERRES_AUTO, we still initialize
900
  // superres mode for current encoding = AOM_SUPERRES_NONE. This is to ensure
901
  // that any analysis (e.g. TPL) happening outside the main encoding loop still
902
  // happens at full resolution.
903
  // This value will later be set appropriately just before main encoding loop.
904
0
  cpi->superres_mode = oxcf->superres_cfg.superres_mode == AOM_SUPERRES_AUTO
905
0
                           ? AOM_SUPERRES_NONE
906
0
                           : oxcf->superres_cfg.superres_mode;  // default
907
0
  x->e_mbd.bd = (int)seq_params->bit_depth;
908
0
  x->e_mbd.global_motion = cm->global_motion;
909
910
0
  memcpy(level_params->target_seq_level_idx, cpi->oxcf.target_seq_level_idx,
911
0
         sizeof(level_params->target_seq_level_idx));
912
0
  level_params->keep_level_stats = 0;
913
0
  for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) {
914
0
    if (level_params->target_seq_level_idx[i] < SEQ_LEVELS ||
915
0
        level_params->target_seq_level_idx[i] == SEQ_LEVEL_KEEP_STATS) {
916
0
      level_params->keep_level_stats |= 1u << i;
917
0
      if (!level_params->level_info[i]) {
918
0
        CHECK_MEM_ERROR(cm, level_params->level_info[i],
919
0
                        aom_calloc(1, sizeof(*level_params->level_info[i])));
920
0
      }
921
0
    }
922
0
  }
923
924
  // TODO(huisu@): level targeting currently only works for the 0th operating
925
  // point, so scalable coding is not supported yet.
926
0
  if (level_params->target_seq_level_idx[0] < SEQ_LEVELS) {
927
    // Adjust encoder config in order to meet target level.
928
0
    config_target_level(cpi, level_params->target_seq_level_idx[0],
929
0
                        seq_params->tier[0]);
930
0
  }
931
932
0
  if (has_no_stats_stage(cpi) && (rc_cfg->mode == AOM_Q)) {
933
0
    p_rc->baseline_gf_interval = FIXED_GF_INTERVAL;
934
0
  } else if (!is_one_pass_rt_params(cpi) ||
935
0
             cm->current_frame.frame_number == 0) {
936
    // For rtc mode: logic for setting the baseline_gf_interval is done
937
    // in av1_get_one_pass_rt_params(), and it should not be reset here in
938
    // change_config(), unless after init_config (first frame).
939
0
    p_rc->baseline_gf_interval = (MIN_GF_INTERVAL + MAX_GF_INTERVAL) / 2;
940
0
  }
941
942
0
  refresh_frame->golden_frame = false;
943
0
  refresh_frame->bwd_ref_frame = false;
944
945
0
  features->refresh_frame_context =
946
0
      (oxcf->tool_cfg.frame_parallel_decoding_mode)
947
0
          ? REFRESH_FRAME_CONTEXT_DISABLED
948
0
          : REFRESH_FRAME_CONTEXT_BACKWARD;
949
0
  if (oxcf->tile_cfg.enable_large_scale_tile)
950
0
    features->refresh_frame_context = REFRESH_FRAME_CONTEXT_DISABLED;
951
952
0
  if (x->palette_buffer == NULL) {
953
0
    CHECK_MEM_ERROR(cm, x->palette_buffer,
954
0
                    aom_memalign(16, sizeof(*x->palette_buffer)));
955
0
  }
956
957
0
  if (x->tmp_conv_dst == NULL) {
958
0
    CHECK_MEM_ERROR(
959
0
        cm, x->tmp_conv_dst,
960
0
        aom_memalign(32, MAX_SB_SIZE * MAX_SB_SIZE * sizeof(*x->tmp_conv_dst)));
961
0
    x->e_mbd.tmp_conv_dst = x->tmp_conv_dst;
962
0
  }
963
  // The buffers 'tmp_pred_bufs[]' and 'comp_rd_buffer' are used in inter frames
964
  // to store intermediate inter mode prediction results and are not required
965
  // for allintra encoding mode. Hence, the memory allocations for these buffers
966
  // are avoided for allintra encoding mode.
967
0
  if (cpi->oxcf.kf_cfg.key_freq_max != 0) {
968
0
    if (x->comp_rd_buffer.pred0 == NULL)
969
0
      alloc_compound_type_rd_buffers(cm->error, &x->comp_rd_buffer);
970
971
0
    for (int i = 0; i < 2; ++i) {
972
0
      if (x->tmp_pred_bufs[i] == NULL) {
973
0
        CHECK_MEM_ERROR(cm, x->tmp_pred_bufs[i],
974
0
                        aom_memalign(32, 2 * MAX_MB_PLANE * MAX_SB_SQUARE *
975
0
                                             sizeof(*x->tmp_pred_bufs[i])));
976
0
        x->e_mbd.tmp_obmc_bufs[i] = x->tmp_pred_bufs[i];
977
0
      }
978
0
    }
979
0
  }
980
981
0
  if (x->upsample_pred == NULL) {
982
0
    CHECK_MEM_ERROR(
983
0
        cm, x->upsample_pred,
984
0
        aom_memalign(16, (1 + is_highbitdepth) * ((MAX_SB_SIZE + 16) + 16) *
985
0
                             MAX_SB_SIZE * sizeof(*x->upsample_pred)));
986
0
    x->e_mbd.tmp_upsample_pred = x->upsample_pred;
987
0
  }
988
989
0
  av1_reset_segment_features(cm);
990
991
0
  av1_set_high_precision_mv(cpi, 1, 0);
992
993
  // Under a configuration change, where maximum_buffer_size may change,
994
  // keep buffer level clipped to the maximum allowed buffer size.
995
0
  p_rc->bits_off_target =
996
0
      AOMMIN(p_rc->bits_off_target, p_rc->maximum_buffer_size);
997
0
  p_rc->buffer_level = AOMMIN(p_rc->buffer_level, p_rc->maximum_buffer_size);
998
999
  // Set up frame rate and related parameters rate control values.
1000
0
  av1_new_framerate(cpi, cpi->framerate);
1001
1002
  // Set absolute upper and lower quality limits
1003
0
  rc->worst_quality = rc_cfg->worst_allowed_q;
1004
0
  rc->best_quality = rc_cfg->best_allowed_q;
1005
1006
  // If lossless has been requested make sure average Q accumulators are reset.
1007
0
  if (is_lossless_requested(&cpi->oxcf.rc_cfg)) {
1008
0
    int i;
1009
0
    for (i = 0; i < FRAME_TYPES; ++i) {
1010
0
      p_rc->avg_frame_qindex[i] = 0;
1011
0
    }
1012
0
  }
1013
1014
0
  features->interp_filter =
1015
0
      oxcf->tile_cfg.enable_large_scale_tile ? EIGHTTAP_REGULAR : SWITCHABLE;
1016
0
  features->switchable_motion_mode = is_switchable_motion_mode_allowed(
1017
0
      features->allow_warped_motion, oxcf->motion_mode_cfg.enable_obmc);
1018
1019
0
  if (frm_dim_cfg->render_width > 0 && frm_dim_cfg->render_height > 0) {
1020
0
    cm->render_width = frm_dim_cfg->render_width;
1021
0
    cm->render_height = frm_dim_cfg->render_height;
1022
0
  } else {
1023
0
    cm->render_width = frm_dim_cfg->width;
1024
0
    cm->render_height = frm_dim_cfg->height;
1025
0
  }
1026
1027
0
  int last_width = cm->width;
1028
0
  int last_height = cm->height;
1029
0
  cm->width = frm_dim_cfg->width;
1030
0
  cm->height = frm_dim_cfg->height;
1031
1032
0
  if (cm->width > cpi->data_alloc_width ||
1033
0
      cm->height > cpi->data_alloc_height || is_sb_size_changed) {
1034
0
    av1_free_context_buffers(cm);
1035
0
    av1_free_shared_coeff_buffer(&cpi->td.shared_coeff_buf);
1036
0
    av1_free_sms_tree(&cpi->td);
1037
0
    av1_free_pmc(cpi->td.firstpass_ctx, av1_num_planes(cm));
1038
0
    cpi->td.firstpass_ctx = NULL;
1039
0
    alloc_compressor_data(cpi);
1040
0
    realloc_segmentation_maps(cpi);
1041
0
    cpi->data_alloc_width = cm->width;
1042
0
    cpi->data_alloc_height = cm->height;
1043
0
    cpi->frame_size_related_setup_done = false;
1044
0
  }
1045
0
  av1_update_frame_size(cpi);
1046
1047
0
  if (cm->width != last_width || cm->height != last_height) {
1048
0
    if (cpi->oxcf.q_cfg.aq_mode == CYCLIC_REFRESH_AQ) {
1049
0
      int mi_rows = cpi->common.mi_params.mi_rows;
1050
0
      int mi_cols = cpi->common.mi_params.mi_cols;
1051
0
      aom_free(cpi->cyclic_refresh->map);
1052
0
      CHECK_MEM_ERROR(
1053
0
          cm, cpi->cyclic_refresh->map,
1054
0
          aom_calloc(mi_rows * mi_cols, sizeof(*cpi->cyclic_refresh->map)));
1055
0
      if (cpi->svc.number_spatial_layers > 1) {
1056
0
        for (int sl = 0; sl < cpi->svc.number_spatial_layers; ++sl) {
1057
0
          const int layer =
1058
0
              LAYER_IDS_TO_IDX(sl, 0, cpi->svc.number_temporal_layers);
1059
0
          LAYER_CONTEXT *const lc = &cpi->svc.layer_context[layer];
1060
0
          lc->sb_index = 0;
1061
0
          lc->actual_num_seg1_blocks = 0;
1062
0
          lc->actual_num_seg2_blocks = 0;
1063
0
          lc->counter_encode_maxq_scene_change = 0;
1064
0
          aom_free(lc->map);
1065
0
          CHECK_MEM_ERROR(cm, lc->map,
1066
0
                          aom_calloc(mi_rows * mi_cols, sizeof(*lc->map)));
1067
0
        }
1068
0
      }
1069
0
    }
1070
0
  }
1071
1072
0
  rc->is_src_frame_alt_ref = 0;
1073
1074
0
  if (!cpi->ppi->rtc_ref.set_ref_frame_config)
1075
0
    cpi->ext_flags.refresh_frame.update_pending = 0;
1076
0
  cpi->ext_flags.refresh_frame_context_pending = 0;
1077
1078
0
  if (cpi->ppi->use_svc)
1079
0
    av1_update_layer_context_change_config(cpi, rc_cfg->target_bandwidth);
1080
1081
0
  check_reset_rc_flag(cpi);
1082
1083
  // restore the value of lag_in_frame for LAP stage.
1084
0
  if (lap_lag_in_frames != -1) {
1085
0
    cpi->oxcf.gf_cfg.lag_in_frames = lap_lag_in_frames;
1086
0
  }
1087
1088
#if CONFIG_REALTIME_ONLY
1089
  assert(!oxcf->tool_cfg.enable_global_motion);
1090
  cpi->alloc_pyramid = false;
1091
#else
1092
0
  cpi->alloc_pyramid = oxcf->tool_cfg.enable_global_motion;
1093
0
#endif  // CONFIG_REALTIME_ONLY
1094
0
}
1095
1096
static inline void init_frame_info(FRAME_INFO *frame_info,
1097
0
                                   const AV1_COMMON *const cm) {
1098
0
  const CommonModeInfoParams *const mi_params = &cm->mi_params;
1099
0
  const SequenceHeader *const seq_params = cm->seq_params;
1100
0
  frame_info->frame_width = cm->width;
1101
0
  frame_info->frame_height = cm->height;
1102
0
  frame_info->mi_cols = mi_params->mi_cols;
1103
0
  frame_info->mi_rows = mi_params->mi_rows;
1104
0
  frame_info->mb_cols = mi_params->mb_cols;
1105
0
  frame_info->mb_rows = mi_params->mb_rows;
1106
0
  frame_info->num_mbs = mi_params->MBs;
1107
0
  frame_info->bit_depth = seq_params->bit_depth;
1108
0
  frame_info->subsampling_x = seq_params->subsampling_x;
1109
0
  frame_info->subsampling_y = seq_params->subsampling_y;
1110
0
}
1111
1112
0
static inline void init_frame_index_set(FRAME_INDEX_SET *frame_index_set) {
1113
0
  frame_index_set->show_frame_count = 0;
1114
0
}
1115
1116
0
static inline void update_counters_for_show_frame(AV1_COMP *const cpi) {
1117
0
  assert(cpi->common.show_frame);
1118
0
  cpi->frame_index_set.show_frame_count++;
1119
0
  cpi->common.current_frame.frame_number++;
1120
0
}
1121
1122
AV1_PRIMARY *av1_create_primary_compressor(
1123
    struct aom_codec_pkt_list *pkt_list_head, int num_lap_buffers,
1124
0
    const AV1EncoderConfig *oxcf) {
1125
0
  AV1_PRIMARY *volatile const ppi = aom_memalign(32, sizeof(AV1_PRIMARY));
1126
0
  if (!ppi) return NULL;
1127
0
  av1_zero(*ppi);
1128
1129
  // The jmp_buf is valid only for the duration of the function that calls
1130
  // setjmp(). Therefore, this function must reset the 'setjmp' field to 0
1131
  // before it returns.
1132
0
  if (setjmp(ppi->error.jmp)) {
1133
0
    ppi->error.setjmp = 0;
1134
0
    av1_remove_primary_compressor(ppi);
1135
0
    return 0;
1136
0
  }
1137
0
  ppi->error.setjmp = 1;
1138
1139
0
  ppi->seq_params_locked = 0;
1140
0
  ppi->lap_enabled = num_lap_buffers > 0;
1141
0
  ppi->output_pkt_list = pkt_list_head;
1142
0
  ppi->b_calculate_psnr = CONFIG_INTERNAL_STATS;
1143
0
  ppi->frames_left = oxcf->input_cfg.limit;
1144
0
  ppi->num_fp_contexts = 1;
1145
1146
0
  init_config_sequence(ppi, oxcf);
1147
1148
#if CONFIG_ENTROPY_STATS
1149
  av1_zero(ppi->aggregate_fc);
1150
#endif  // CONFIG_ENTROPY_STATS
1151
1152
0
  av1_primary_rc_init(oxcf, &ppi->p_rc);
1153
1154
  // For two pass and lag_in_frames > 33 in LAP.
1155
0
  ppi->p_rc.enable_scenecut_detection = ENABLE_SCENECUT_MODE_2;
1156
0
  if (ppi->lap_enabled) {
1157
0
    if ((num_lap_buffers <
1158
0
         (MAX_GF_LENGTH_LAP + SCENE_CUT_KEY_TEST_INTERVAL + 1)) &&
1159
0
        num_lap_buffers >= (MAX_GF_LENGTH_LAP + 3)) {
1160
      /*
1161
       * For lag in frames >= 19 and <33, enable scenecut
1162
       * with limited future frame prediction.
1163
       */
1164
0
      ppi->p_rc.enable_scenecut_detection = ENABLE_SCENECUT_MODE_1;
1165
0
    } else if (num_lap_buffers < (MAX_GF_LENGTH_LAP + 3)) {
1166
      // Disable scenecut when lag_in_frames < 19.
1167
0
      ppi->p_rc.enable_scenecut_detection = DISABLE_SCENECUT;
1168
0
    }
1169
0
  }
1170
1171
0
#define BFP(BT, SDF, SDAF, VF, SVF, SVAF, SDX4DF, SDX3DF) \
1172
0
  ppi->fn_ptr[BT].sdf = SDF;                              \
1173
0
  ppi->fn_ptr[BT].sdaf = SDAF;                            \
1174
0
  ppi->fn_ptr[BT].vf = VF;                                \
1175
0
  ppi->fn_ptr[BT].svf = SVF;                              \
1176
0
  ppi->fn_ptr[BT].svaf = SVAF;                            \
1177
0
  ppi->fn_ptr[BT].sdx4df = SDX4DF;                        \
1178
0
  ppi->fn_ptr[BT].sdx3df = SDX3DF;
1179
1180
// Realtime mode doesn't use 4x rectangular blocks.
1181
0
#if !CONFIG_REALTIME_ONLY
1182
  // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused
1183
  // for 4xN and Nx4 blocks.
1184
0
  BFP(BLOCK_4X16, aom_sad4x16, /*SDAF=*/NULL, aom_variance4x16,
1185
0
      aom_sub_pixel_variance4x16, aom_sub_pixel_avg_variance4x16,
1186
0
      aom_sad4x16x4d, aom_sad4x16x3d)
1187
1188
  // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused
1189
  // for 4xN and Nx4 blocks.
1190
0
  BFP(BLOCK_16X4, aom_sad16x4, /*SDAF=*/NULL, aom_variance16x4,
1191
0
      aom_sub_pixel_variance16x4, aom_sub_pixel_avg_variance16x4,
1192
0
      aom_sad16x4x4d, aom_sad16x4x3d)
1193
1194
0
  BFP(BLOCK_8X32, aom_sad8x32, aom_sad8x32_avg, aom_variance8x32,
1195
0
      aom_sub_pixel_variance8x32, aom_sub_pixel_avg_variance8x32,
1196
0
      aom_sad8x32x4d, aom_sad8x32x3d)
1197
1198
0
  BFP(BLOCK_32X8, aom_sad32x8, aom_sad32x8_avg, aom_variance32x8,
1199
0
      aom_sub_pixel_variance32x8, aom_sub_pixel_avg_variance32x8,
1200
0
      aom_sad32x8x4d, aom_sad32x8x3d)
1201
1202
0
  BFP(BLOCK_16X64, aom_sad16x64, aom_sad16x64_avg, aom_variance16x64,
1203
0
      aom_sub_pixel_variance16x64, aom_sub_pixel_avg_variance16x64,
1204
0
      aom_sad16x64x4d, aom_sad16x64x3d)
1205
1206
0
  BFP(BLOCK_64X16, aom_sad64x16, aom_sad64x16_avg, aom_variance64x16,
1207
0
      aom_sub_pixel_variance64x16, aom_sub_pixel_avg_variance64x16,
1208
0
      aom_sad64x16x4d, aom_sad64x16x3d)
1209
0
#endif  // !CONFIG_REALTIME_ONLY
1210
1211
0
  BFP(BLOCK_128X128, aom_sad128x128, aom_sad128x128_avg, aom_variance128x128,
1212
0
      aom_sub_pixel_variance128x128, aom_sub_pixel_avg_variance128x128,
1213
0
      aom_sad128x128x4d, aom_sad128x128x3d)
1214
1215
0
  BFP(BLOCK_128X64, aom_sad128x64, aom_sad128x64_avg, aom_variance128x64,
1216
0
      aom_sub_pixel_variance128x64, aom_sub_pixel_avg_variance128x64,
1217
0
      aom_sad128x64x4d, aom_sad128x64x3d)
1218
1219
0
  BFP(BLOCK_64X128, aom_sad64x128, aom_sad64x128_avg, aom_variance64x128,
1220
0
      aom_sub_pixel_variance64x128, aom_sub_pixel_avg_variance64x128,
1221
0
      aom_sad64x128x4d, aom_sad64x128x3d)
1222
1223
0
  BFP(BLOCK_32X16, aom_sad32x16, aom_sad32x16_avg, aom_variance32x16,
1224
0
      aom_sub_pixel_variance32x16, aom_sub_pixel_avg_variance32x16,
1225
0
      aom_sad32x16x4d, aom_sad32x16x3d)
1226
1227
0
  BFP(BLOCK_16X32, aom_sad16x32, aom_sad16x32_avg, aom_variance16x32,
1228
0
      aom_sub_pixel_variance16x32, aom_sub_pixel_avg_variance16x32,
1229
0
      aom_sad16x32x4d, aom_sad16x32x3d)
1230
1231
0
  BFP(BLOCK_64X32, aom_sad64x32, aom_sad64x32_avg, aom_variance64x32,
1232
0
      aom_sub_pixel_variance64x32, aom_sub_pixel_avg_variance64x32,
1233
0
      aom_sad64x32x4d, aom_sad64x32x3d)
1234
1235
0
  BFP(BLOCK_32X64, aom_sad32x64, aom_sad32x64_avg, aom_variance32x64,
1236
0
      aom_sub_pixel_variance32x64, aom_sub_pixel_avg_variance32x64,
1237
0
      aom_sad32x64x4d, aom_sad32x64x3d)
1238
1239
0
  BFP(BLOCK_32X32, aom_sad32x32, aom_sad32x32_avg, aom_variance32x32,
1240
0
      aom_sub_pixel_variance32x32, aom_sub_pixel_avg_variance32x32,
1241
0
      aom_sad32x32x4d, aom_sad32x32x3d)
1242
1243
0
  BFP(BLOCK_64X64, aom_sad64x64, aom_sad64x64_avg, aom_variance64x64,
1244
0
      aom_sub_pixel_variance64x64, aom_sub_pixel_avg_variance64x64,
1245
0
      aom_sad64x64x4d, aom_sad64x64x3d)
1246
1247
0
  BFP(BLOCK_16X16, aom_sad16x16, aom_sad16x16_avg, aom_variance16x16,
1248
0
      aom_sub_pixel_variance16x16, aom_sub_pixel_avg_variance16x16,
1249
0
      aom_sad16x16x4d, aom_sad16x16x3d)
1250
1251
0
  BFP(BLOCK_16X8, aom_sad16x8, aom_sad16x8_avg, aom_variance16x8,
1252
0
      aom_sub_pixel_variance16x8, aom_sub_pixel_avg_variance16x8,
1253
0
      aom_sad16x8x4d, aom_sad16x8x3d)
1254
1255
0
  BFP(BLOCK_8X16, aom_sad8x16, aom_sad8x16_avg, aom_variance8x16,
1256
0
      aom_sub_pixel_variance8x16, aom_sub_pixel_avg_variance8x16,
1257
0
      aom_sad8x16x4d, aom_sad8x16x3d)
1258
1259
0
  BFP(BLOCK_8X8, aom_sad8x8, aom_sad8x8_avg, aom_variance8x8,
1260
0
      aom_sub_pixel_variance8x8, aom_sub_pixel_avg_variance8x8, aom_sad8x8x4d,
1261
0
      aom_sad8x8x3d)
1262
1263
  // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused
1264
  // for 4xN and Nx4 blocks.
1265
0
  BFP(BLOCK_8X4, aom_sad8x4, /*SDAF=*/NULL, aom_variance8x4,
1266
0
      aom_sub_pixel_variance8x4, aom_sub_pixel_avg_variance8x4, aom_sad8x4x4d,
1267
0
      aom_sad8x4x3d)
1268
1269
  // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused
1270
  // for 4xN and Nx4 blocks.
1271
0
  BFP(BLOCK_4X8, aom_sad4x8, /*SDAF=*/NULL, aom_variance4x8,
1272
0
      aom_sub_pixel_variance4x8, aom_sub_pixel_avg_variance4x8, aom_sad4x8x4d,
1273
0
      aom_sad4x8x3d)
1274
1275
  // sdaf (used in compound prediction, get_mvpred_compound_sad()) is unused
1276
  // for 4xN and Nx4 blocks.
1277
0
  BFP(BLOCK_4X4, aom_sad4x4, /*SDAF=*/NULL, aom_variance4x4,
1278
0
      aom_sub_pixel_variance4x4, aom_sub_pixel_avg_variance4x4, aom_sad4x4x4d,
1279
0
      aom_sad4x4x3d)
1280
1281
0
#if !CONFIG_REALTIME_ONLY
1282
0
#define OBFP(BT, OSDF, OVF, OSVF) \
1283
0
  ppi->fn_ptr[BT].osdf = OSDF;    \
1284
0
  ppi->fn_ptr[BT].ovf = OVF;      \
1285
0
  ppi->fn_ptr[BT].osvf = OSVF;
1286
1287
0
  OBFP(BLOCK_128X128, aom_obmc_sad128x128, aom_obmc_variance128x128,
1288
0
       aom_obmc_sub_pixel_variance128x128)
1289
0
  OBFP(BLOCK_128X64, aom_obmc_sad128x64, aom_obmc_variance128x64,
1290
0
       aom_obmc_sub_pixel_variance128x64)
1291
0
  OBFP(BLOCK_64X128, aom_obmc_sad64x128, aom_obmc_variance64x128,
1292
0
       aom_obmc_sub_pixel_variance64x128)
1293
0
  OBFP(BLOCK_64X64, aom_obmc_sad64x64, aom_obmc_variance64x64,
1294
0
       aom_obmc_sub_pixel_variance64x64)
1295
0
  OBFP(BLOCK_64X32, aom_obmc_sad64x32, aom_obmc_variance64x32,
1296
0
       aom_obmc_sub_pixel_variance64x32)
1297
0
  OBFP(BLOCK_32X64, aom_obmc_sad32x64, aom_obmc_variance32x64,
1298
0
       aom_obmc_sub_pixel_variance32x64)
1299
0
  OBFP(BLOCK_32X32, aom_obmc_sad32x32, aom_obmc_variance32x32,
1300
0
       aom_obmc_sub_pixel_variance32x32)
1301
0
  OBFP(BLOCK_32X16, aom_obmc_sad32x16, aom_obmc_variance32x16,
1302
0
       aom_obmc_sub_pixel_variance32x16)
1303
0
  OBFP(BLOCK_16X32, aom_obmc_sad16x32, aom_obmc_variance16x32,
1304
0
       aom_obmc_sub_pixel_variance16x32)
1305
0
  OBFP(BLOCK_16X16, aom_obmc_sad16x16, aom_obmc_variance16x16,
1306
0
       aom_obmc_sub_pixel_variance16x16)
1307
0
  OBFP(BLOCK_16X8, aom_obmc_sad16x8, aom_obmc_variance16x8,
1308
0
       aom_obmc_sub_pixel_variance16x8)
1309
0
  OBFP(BLOCK_8X16, aom_obmc_sad8x16, aom_obmc_variance8x16,
1310
0
       aom_obmc_sub_pixel_variance8x16)
1311
0
  OBFP(BLOCK_8X8, aom_obmc_sad8x8, aom_obmc_variance8x8,
1312
0
       aom_obmc_sub_pixel_variance8x8)
1313
0
  OBFP(BLOCK_4X8, aom_obmc_sad4x8, aom_obmc_variance4x8,
1314
0
       aom_obmc_sub_pixel_variance4x8)
1315
0
  OBFP(BLOCK_8X4, aom_obmc_sad8x4, aom_obmc_variance8x4,
1316
0
       aom_obmc_sub_pixel_variance8x4)
1317
0
  OBFP(BLOCK_4X4, aom_obmc_sad4x4, aom_obmc_variance4x4,
1318
0
       aom_obmc_sub_pixel_variance4x4)
1319
0
  OBFP(BLOCK_4X16, aom_obmc_sad4x16, aom_obmc_variance4x16,
1320
0
       aom_obmc_sub_pixel_variance4x16)
1321
0
  OBFP(BLOCK_16X4, aom_obmc_sad16x4, aom_obmc_variance16x4,
1322
0
       aom_obmc_sub_pixel_variance16x4)
1323
0
  OBFP(BLOCK_8X32, aom_obmc_sad8x32, aom_obmc_variance8x32,
1324
0
       aom_obmc_sub_pixel_variance8x32)
1325
0
  OBFP(BLOCK_32X8, aom_obmc_sad32x8, aom_obmc_variance32x8,
1326
0
       aom_obmc_sub_pixel_variance32x8)
1327
0
  OBFP(BLOCK_16X64, aom_obmc_sad16x64, aom_obmc_variance16x64,
1328
0
       aom_obmc_sub_pixel_variance16x64)
1329
0
  OBFP(BLOCK_64X16, aom_obmc_sad64x16, aom_obmc_variance64x16,
1330
0
       aom_obmc_sub_pixel_variance64x16)
1331
0
#endif  // !CONFIG_REALTIME_ONLY
1332
1333
0
#define MBFP(BT, MCSDF, MCSVF)  \
1334
0
  ppi->fn_ptr[BT].msdf = MCSDF; \
1335
0
  ppi->fn_ptr[BT].msvf = MCSVF;
1336
1337
0
  MBFP(BLOCK_128X128, aom_masked_sad128x128,
1338
0
       aom_masked_sub_pixel_variance128x128)
1339
0
  MBFP(BLOCK_128X64, aom_masked_sad128x64, aom_masked_sub_pixel_variance128x64)
1340
0
  MBFP(BLOCK_64X128, aom_masked_sad64x128, aom_masked_sub_pixel_variance64x128)
1341
0
  MBFP(BLOCK_64X64, aom_masked_sad64x64, aom_masked_sub_pixel_variance64x64)
1342
0
  MBFP(BLOCK_64X32, aom_masked_sad64x32, aom_masked_sub_pixel_variance64x32)
1343
0
  MBFP(BLOCK_32X64, aom_masked_sad32x64, aom_masked_sub_pixel_variance32x64)
1344
0
  MBFP(BLOCK_32X32, aom_masked_sad32x32, aom_masked_sub_pixel_variance32x32)
1345
0
  MBFP(BLOCK_32X16, aom_masked_sad32x16, aom_masked_sub_pixel_variance32x16)
1346
0
  MBFP(BLOCK_16X32, aom_masked_sad16x32, aom_masked_sub_pixel_variance16x32)
1347
0
  MBFP(BLOCK_16X16, aom_masked_sad16x16, aom_masked_sub_pixel_variance16x16)
1348
0
  MBFP(BLOCK_16X8, aom_masked_sad16x8, aom_masked_sub_pixel_variance16x8)
1349
0
  MBFP(BLOCK_8X16, aom_masked_sad8x16, aom_masked_sub_pixel_variance8x16)
1350
0
  MBFP(BLOCK_8X8, aom_masked_sad8x8, aom_masked_sub_pixel_variance8x8)
1351
0
  MBFP(BLOCK_4X8, aom_masked_sad4x8, aom_masked_sub_pixel_variance4x8)
1352
0
  MBFP(BLOCK_8X4, aom_masked_sad8x4, aom_masked_sub_pixel_variance8x4)
1353
0
  MBFP(BLOCK_4X4, aom_masked_sad4x4, aom_masked_sub_pixel_variance4x4)
1354
1355
0
#if !CONFIG_REALTIME_ONLY
1356
0
  MBFP(BLOCK_4X16, aom_masked_sad4x16, aom_masked_sub_pixel_variance4x16)
1357
0
  MBFP(BLOCK_16X4, aom_masked_sad16x4, aom_masked_sub_pixel_variance16x4)
1358
0
  MBFP(BLOCK_8X32, aom_masked_sad8x32, aom_masked_sub_pixel_variance8x32)
1359
0
  MBFP(BLOCK_32X8, aom_masked_sad32x8, aom_masked_sub_pixel_variance32x8)
1360
0
  MBFP(BLOCK_16X64, aom_masked_sad16x64, aom_masked_sub_pixel_variance16x64)
1361
0
  MBFP(BLOCK_64X16, aom_masked_sad64x16, aom_masked_sub_pixel_variance64x16)
1362
0
#endif
1363
1364
0
#define SDSFP(BT, SDSF, SDSX4DF) \
1365
0
  ppi->fn_ptr[BT].sdsf = SDSF;   \
1366
0
  ppi->fn_ptr[BT].sdsx4df = SDSX4DF;
1367
1368
0
  SDSFP(BLOCK_128X128, aom_sad_skip_128x128, aom_sad_skip_128x128x4d)
1369
0
  SDSFP(BLOCK_128X64, aom_sad_skip_128x64, aom_sad_skip_128x64x4d)
1370
0
  SDSFP(BLOCK_64X128, aom_sad_skip_64x128, aom_sad_skip_64x128x4d)
1371
0
  SDSFP(BLOCK_64X64, aom_sad_skip_64x64, aom_sad_skip_64x64x4d)
1372
0
  SDSFP(BLOCK_64X32, aom_sad_skip_64x32, aom_sad_skip_64x32x4d)
1373
1374
0
  SDSFP(BLOCK_32X64, aom_sad_skip_32x64, aom_sad_skip_32x64x4d)
1375
0
  SDSFP(BLOCK_32X32, aom_sad_skip_32x32, aom_sad_skip_32x32x4d)
1376
0
  SDSFP(BLOCK_32X16, aom_sad_skip_32x16, aom_sad_skip_32x16x4d)
1377
1378
0
  SDSFP(BLOCK_16X32, aom_sad_skip_16x32, aom_sad_skip_16x32x4d)
1379
0
  SDSFP(BLOCK_16X16, aom_sad_skip_16x16, aom_sad_skip_16x16x4d)
1380
0
  SDSFP(BLOCK_8X16, aom_sad_skip_8x16, aom_sad_skip_8x16x4d)
1381
1382
0
#if !CONFIG_REALTIME_ONLY
1383
0
  SDSFP(BLOCK_64X16, aom_sad_skip_64x16, aom_sad_skip_64x16x4d)
1384
0
  SDSFP(BLOCK_16X64, aom_sad_skip_16x64, aom_sad_skip_16x64x4d)
1385
0
  SDSFP(BLOCK_8X32, aom_sad_skip_8x32, aom_sad_skip_8x32x4d)
1386
0
  SDSFP(BLOCK_4X16, aom_sad_skip_4x16, aom_sad_skip_4x16x4d)
1387
0
#endif
1388
0
#undef SDSFP
1389
1390
0
#if CONFIG_AV1_HIGHBITDEPTH
1391
0
  highbd_set_var_fns(ppi);
1392
0
#endif
1393
1394
0
  {
1395
    // As cm->mi_params is a part of the frame level context (cpi), it is
1396
    // unavailable at this point. mi_params is created as a local temporary
1397
    // variable, to be passed into the functions used for allocating tpl
1398
    // buffers. The values in this variable are populated according to initial
1399
    // width and height of the frame.
1400
0
    CommonModeInfoParams mi_params;
1401
0
    enc_set_mb_mi(&mi_params, oxcf->frm_dim_cfg.width, oxcf->frm_dim_cfg.height,
1402
0
                  BLOCK_4X4);
1403
1404
0
    const BLOCK_SIZE bsize = BLOCK_16X16;
1405
0
    const int w = mi_size_wide[bsize];
1406
0
    const int h = mi_size_high[bsize];
1407
0
    const int num_cols = (mi_params.mi_cols + w - 1) / w;
1408
0
    const int num_rows = (mi_params.mi_rows + h - 1) / h;
1409
0
    AOM_CHECK_MEM_ERROR(
1410
0
        &ppi->error, ppi->tpl_sb_rdmult_scaling_factors,
1411
0
        aom_calloc(num_rows * num_cols,
1412
0
                   sizeof(*ppi->tpl_sb_rdmult_scaling_factors)));
1413
1414
#if CONFIG_INTERNAL_STATS
1415
    ppi->b_calculate_blockiness = 1;
1416
    ppi->b_calculate_consistency = 1;
1417
1418
    for (int i = 0; i <= STAT_ALL; i++) {
1419
      ppi->psnr[0].stat[i] = 0;
1420
      ppi->psnr[1].stat[i] = 0;
1421
1422
      ppi->fastssim.stat[i] = 0;
1423
      ppi->psnrhvs.stat[i] = 0;
1424
    }
1425
1426
    ppi->psnr[0].worst = 100.0;
1427
    ppi->psnr[1].worst = 100.0;
1428
    ppi->worst_ssim = 100.0;
1429
    ppi->worst_ssim_hbd = 100.0;
1430
1431
    ppi->count[0] = 0;
1432
    ppi->count[1] = 0;
1433
    ppi->total_bytes = 0;
1434
1435
    if (ppi->b_calculate_psnr) {
1436
      ppi->total_sq_error[0] = 0;
1437
      ppi->total_samples[0] = 0;
1438
      ppi->total_sq_error[1] = 0;
1439
      ppi->total_samples[1] = 0;
1440
      ppi->total_recode_hits = 0;
1441
      ppi->summed_quality = 0;
1442
      ppi->summed_weights = 0;
1443
      ppi->summed_quality_hbd = 0;
1444
      ppi->summed_weights_hbd = 0;
1445
    }
1446
1447
    ppi->fastssim.worst = 100.0;
1448
    ppi->psnrhvs.worst = 100.0;
1449
1450
    if (ppi->b_calculate_blockiness) {
1451
      ppi->total_blockiness = 0;
1452
      ppi->worst_blockiness = 0.0;
1453
    }
1454
1455
    ppi->total_inconsistency = 0;
1456
    ppi->worst_consistency = 100.0;
1457
    if (ppi->b_calculate_consistency) {
1458
      AOM_CHECK_MEM_ERROR(&ppi->error, ppi->ssim_vars,
1459
                          aom_malloc(sizeof(*ppi->ssim_vars) * 4 *
1460
                                     mi_params.mi_rows * mi_params.mi_cols));
1461
    }
1462
#endif
1463
0
  }
1464
1465
0
  ppi->error.setjmp = 0;
1466
0
  return ppi;
1467
0
}
1468
1469
AV1_COMP *av1_create_compressor(AV1_PRIMARY *ppi, const AV1EncoderConfig *oxcf,
1470
                                BufferPool *const pool, COMPRESSOR_STAGE stage,
1471
0
                                int lap_lag_in_frames) {
1472
0
  AV1_COMP *volatile const cpi = aom_memalign(32, sizeof(AV1_COMP));
1473
1474
0
  if (!cpi) return NULL;
1475
1476
0
  av1_zero(*cpi);
1477
1478
0
  cpi->ppi = ppi;
1479
1480
0
  AV1_COMMON *volatile const cm = &cpi->common;
1481
0
  cm->seq_params = &ppi->seq_params;
1482
0
  cm->error =
1483
0
      (struct aom_internal_error_info *)aom_calloc(1, sizeof(*cm->error));
1484
0
  if (!cm->error) {
1485
0
    aom_free(cpi);
1486
0
    return NULL;
1487
0
  }
1488
1489
  // The jmp_buf is valid only for the duration of the function that calls
1490
  // setjmp(). Therefore, this function must reset the 'setjmp' field to 0
1491
  // before it returns.
1492
0
  if (setjmp(cm->error->jmp)) {
1493
0
    cm->error->setjmp = 0;
1494
0
    av1_remove_compressor(cpi);
1495
0
    return NULL;
1496
0
  }
1497
1498
0
  cm->error->setjmp = 1;
1499
0
  cpi->compressor_stage = stage;
1500
1501
0
  cpi->do_frame_data_update = true;
1502
1503
0
  CommonModeInfoParams *const mi_params = &cm->mi_params;
1504
0
  mi_params->free_mi = enc_free_mi;
1505
0
  mi_params->setup_mi = enc_setup_mi;
1506
0
  mi_params->set_mb_mi =
1507
0
      (oxcf->pass == AOM_RC_FIRST_PASS || cpi->compressor_stage == LAP_STAGE)
1508
0
          ? stat_stage_set_mb_mi
1509
0
          : enc_set_mb_mi;
1510
1511
0
  mi_params->mi_alloc_bsize = BLOCK_4X4;
1512
1513
0
  CHECK_MEM_ERROR(cm, cm->fc,
1514
0
                  (FRAME_CONTEXT *)aom_memalign(32, sizeof(*cm->fc)));
1515
0
  CHECK_MEM_ERROR(
1516
0
      cm, cm->default_frame_context,
1517
0
      (FRAME_CONTEXT *)aom_memalign(32, sizeof(*cm->default_frame_context)));
1518
0
  memset(cm->fc, 0, sizeof(*cm->fc));
1519
0
  memset(cm->default_frame_context, 0, sizeof(*cm->default_frame_context));
1520
1521
0
  cpi->common.buffer_pool = pool;
1522
1523
0
  init_config(cpi, oxcf);
1524
0
  if (cpi->compressor_stage == LAP_STAGE) {
1525
0
    cpi->oxcf.gf_cfg.lag_in_frames = lap_lag_in_frames;
1526
0
  }
1527
1528
0
  av1_rc_init(&cpi->oxcf, &cpi->rc);
1529
1530
0
  init_frame_info(&cpi->frame_info, cm);
1531
0
  init_frame_index_set(&cpi->frame_index_set);
1532
1533
0
  cm->current_frame.frame_number = 0;
1534
0
  cpi->rc.frame_number_encoded = 0;
1535
0
  cpi->rc.prev_frame_is_dropped = 0;
1536
0
  cpi->rc.max_consec_drop = INT_MAX;
1537
0
  cpi->rc.drop_count_consec = 0;
1538
0
  cm->current_frame_id = -1;
1539
0
  cpi->tile_data = NULL;
1540
0
  cpi->last_show_frame_buf = NULL;
1541
0
  realloc_segmentation_maps(cpi);
1542
1543
0
  cpi->refresh_frame.alt_ref_frame = false;
1544
1545
#if CONFIG_SPEED_STATS
1546
  cpi->tx_search_count = 0;
1547
#endif  // CONFIG_SPEED_STATS
1548
1549
0
  cpi->time_stamps.first_ts_start = INT64_MAX;
1550
1551
#ifdef OUTPUT_YUV_REC
1552
  yuv_rec_file = fopen("rec.yuv", "wb");
1553
#endif
1554
#ifdef OUTPUT_YUV_DENOISED
1555
  yuv_denoised_file = fopen("denoised.yuv", "wb");
1556
#endif
1557
1558
0
#if !CONFIG_REALTIME_ONLY
1559
0
  if (is_stat_consumption_stage(cpi)) {
1560
0
    const size_t packet_sz = sizeof(FIRSTPASS_STATS);
1561
0
    const int packets = (int)(oxcf->twopass_stats_in.sz / packet_sz);
1562
1563
0
    if (!cpi->ppi->lap_enabled) {
1564
      /*Re-initialize to stats buffer, populated by application in the case of
1565
       * two pass*/
1566
0
      cpi->ppi->twopass.stats_buf_ctx->stats_in_start =
1567
0
          oxcf->twopass_stats_in.buf;
1568
0
      cpi->twopass_frame.stats_in =
1569
0
          cpi->ppi->twopass.stats_buf_ctx->stats_in_start;
1570
0
      cpi->ppi->twopass.stats_buf_ctx->stats_in_end =
1571
0
          &cpi->ppi->twopass.stats_buf_ctx->stats_in_start[packets - 1];
1572
1573
      // The buffer size is packets - 1 because the last packet is total_stats.
1574
0
      av1_firstpass_info_init(&cpi->ppi->twopass.firstpass_info,
1575
0
                              oxcf->twopass_stats_in.buf, packets - 1);
1576
0
      av1_init_second_pass(cpi);
1577
0
    } else {
1578
0
      av1_firstpass_info_init(&cpi->ppi->twopass.firstpass_info, NULL, 0);
1579
0
      av1_init_single_pass_lap(cpi);
1580
0
    }
1581
0
  }
1582
0
#endif
1583
1584
  // The buffer "obmc_buffer" is used in inter frames for fast obmc search.
1585
  // Hence, the memory allocation for the same is avoided for allintra encoding
1586
  // mode.
1587
0
  if (cpi->oxcf.kf_cfg.key_freq_max != 0)
1588
0
    alloc_obmc_buffers(&cpi->td.mb.obmc_buffer, cm->error);
1589
1590
0
  for (int x = 0; x < 2; x++) {
1591
0
    CHECK_MEM_ERROR(
1592
0
        cm, cpi->td.mb.intrabc_hash_info.hash_value_buffer[x],
1593
0
        (uint32_t *)aom_malloc(
1594
0
            AOM_BUFFER_SIZE_FOR_BLOCK_HASH *
1595
0
            sizeof(*cpi->td.mb.intrabc_hash_info.hash_value_buffer[x])));
1596
0
  }
1597
1598
0
  cpi->td.mb.intrabc_hash_info.crc_initialized = 0;
1599
1600
0
  av1_set_speed_features_framesize_independent(cpi, oxcf->speed);
1601
0
  av1_set_speed_features_framesize_dependent(cpi, oxcf->speed);
1602
1603
0
  int max_mi_cols = mi_params->mi_cols;
1604
0
  int max_mi_rows = mi_params->mi_rows;
1605
0
  if (oxcf->frm_dim_cfg.forced_max_frame_width) {
1606
0
    max_mi_cols = size_in_mi(oxcf->frm_dim_cfg.forced_max_frame_width);
1607
0
  }
1608
0
  if (oxcf->frm_dim_cfg.forced_max_frame_height) {
1609
0
    max_mi_rows = size_in_mi(oxcf->frm_dim_cfg.forced_max_frame_height);
1610
0
  }
1611
1612
0
  const int consec_zero_mv_alloc_size = (max_mi_rows * max_mi_cols) >> 2;
1613
0
  CHECK_MEM_ERROR(
1614
0
      cm, cpi->consec_zero_mv,
1615
0
      aom_calloc(consec_zero_mv_alloc_size, sizeof(*cpi->consec_zero_mv)));
1616
0
  cpi->consec_zero_mv_alloc_size = consec_zero_mv_alloc_size;
1617
1618
0
  cpi->mb_weber_stats = NULL;
1619
0
  cpi->mb_delta_q = NULL;
1620
0
  cpi->palette_pixel_num = 0;
1621
0
  cpi->scaled_last_source_available = 0;
1622
1623
0
  {
1624
0
    const BLOCK_SIZE bsize = BLOCK_16X16;
1625
0
    const int w = mi_size_wide[bsize];
1626
0
    const int h = mi_size_high[bsize];
1627
0
    const int num_cols = (max_mi_cols + w - 1) / w;
1628
0
    const int num_rows = (max_mi_rows + h - 1) / h;
1629
0
    CHECK_MEM_ERROR(cm, cpi->ssim_rdmult_scaling_factors,
1630
0
                    aom_calloc(num_rows * num_cols,
1631
0
                               sizeof(*cpi->ssim_rdmult_scaling_factors)));
1632
0
    CHECK_MEM_ERROR(cm, cpi->tpl_rdmult_scaling_factors,
1633
0
                    aom_calloc(num_rows * num_cols,
1634
0
                               sizeof(*cpi->tpl_rdmult_scaling_factors)));
1635
0
  }
1636
1637
#if CONFIG_TUNE_VMAF
1638
  {
1639
    const BLOCK_SIZE bsize = BLOCK_64X64;
1640
    const int w = mi_size_wide[bsize];
1641
    const int h = mi_size_high[bsize];
1642
    const int num_cols = (mi_params->mi_cols + w - 1) / w;
1643
    const int num_rows = (mi_params->mi_rows + h - 1) / h;
1644
    CHECK_MEM_ERROR(cm, cpi->vmaf_info.rdmult_scaling_factors,
1645
                    aom_calloc(num_rows * num_cols,
1646
                               sizeof(*cpi->vmaf_info.rdmult_scaling_factors)));
1647
    for (int i = 0; i < MAX_ARF_LAYERS; i++) {
1648
      cpi->vmaf_info.last_frame_unsharp_amount[i] = -1.0;
1649
      cpi->vmaf_info.last_frame_ysse[i] = -1.0;
1650
      cpi->vmaf_info.last_frame_vmaf[i] = -1.0;
1651
    }
1652
    cpi->vmaf_info.original_qindex = -1;
1653
    cpi->vmaf_info.vmaf_model = NULL;
1654
  }
1655
#endif
1656
1657
#if CONFIG_TUNE_BUTTERAUGLI
1658
  {
1659
    const int w = mi_size_wide[butteraugli_rdo_bsize];
1660
    const int h = mi_size_high[butteraugli_rdo_bsize];
1661
    const int num_cols = (mi_params->mi_cols + w - 1) / w;
1662
    const int num_rows = (mi_params->mi_rows + h - 1) / h;
1663
    CHECK_MEM_ERROR(
1664
        cm, cpi->butteraugli_info.rdmult_scaling_factors,
1665
        aom_malloc(num_rows * num_cols *
1666
                   sizeof(*cpi->butteraugli_info.rdmult_scaling_factors)));
1667
    memset(&cpi->butteraugli_info.source, 0,
1668
           sizeof(cpi->butteraugli_info.source));
1669
    memset(&cpi->butteraugli_info.resized_source, 0,
1670
           sizeof(cpi->butteraugli_info.resized_source));
1671
    cpi->butteraugli_info.recon_set = false;
1672
  }
1673
#endif
1674
1675
#if CONFIG_SALIENCY_MAP
1676
  {
1677
    CHECK_MEM_ERROR(cm, cpi->saliency_map,
1678
                    (uint8_t *)aom_calloc(cm->height * cm->width,
1679
                                          sizeof(*cpi->saliency_map)));
1680
    // Buffer initialization based on MIN_MIB_SIZE_LOG2 to ensure that
1681
    // cpi->sm_scaling_factor buffer is allocated big enough, since we have no
1682
    // idea of the actual superblock size we are going to use yet.
1683
    const int min_mi_w_sb = (1 << MIN_MIB_SIZE_LOG2);
1684
    const int min_mi_h_sb = (1 << MIN_MIB_SIZE_LOG2);
1685
    const int max_sb_cols =
1686
        (cm->mi_params.mi_cols + min_mi_w_sb - 1) / min_mi_w_sb;
1687
    const int max_sb_rows =
1688
        (cm->mi_params.mi_rows + min_mi_h_sb - 1) / min_mi_h_sb;
1689
    CHECK_MEM_ERROR(cm, cpi->sm_scaling_factor,
1690
                    (double *)aom_calloc(max_sb_rows * max_sb_cols,
1691
                                         sizeof(*cpi->sm_scaling_factor)));
1692
  }
1693
#endif
1694
1695
#if CONFIG_COLLECT_PARTITION_STATS
1696
  av1_zero(cpi->partition_stats);
1697
#endif  // CONFIG_COLLECT_PARTITION_STATS
1698
1699
  // Initialize the members of DeltaQuantParams with INT_MAX to ensure that
1700
  // the quantizer tables are correctly initialized using the default deltaq
1701
  // parameters when av1_init_quantizer is called for the first time.
1702
0
  DeltaQuantParams *const prev_deltaq_params =
1703
0
      &cpi->enc_quant_dequant_params.prev_deltaq_params;
1704
0
  prev_deltaq_params->y_dc_delta_q = INT_MAX;
1705
0
  prev_deltaq_params->u_dc_delta_q = INT_MAX;
1706
0
  prev_deltaq_params->v_dc_delta_q = INT_MAX;
1707
0
  prev_deltaq_params->u_ac_delta_q = INT_MAX;
1708
0
  prev_deltaq_params->v_ac_delta_q = INT_MAX;
1709
1710
0
  av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
1711
0
                     cm->seq_params->bit_depth, cpi->oxcf.algo_cfg.sharpness);
1712
0
  av1_qm_init(&cm->quant_params, av1_num_planes(cm));
1713
1714
0
  av1_loop_filter_init(cm);
1715
0
  cm->superres_scale_denominator = SCALE_NUMERATOR;
1716
0
  cm->superres_upscaled_width = oxcf->frm_dim_cfg.width;
1717
0
  cm->superres_upscaled_height = oxcf->frm_dim_cfg.height;
1718
0
#if !CONFIG_REALTIME_ONLY
1719
0
  av1_loop_restoration_precal();
1720
0
#endif
1721
1722
#if CONFIG_THREE_PASS
1723
  cpi->third_pass_ctx = NULL;
1724
  if (cpi->oxcf.pass == AOM_RC_THIRD_PASS) {
1725
    av1_init_thirdpass_ctx(cm, &cpi->third_pass_ctx, NULL);
1726
  }
1727
#endif
1728
1729
0
  cpi->second_pass_log_stream = NULL;
1730
0
  cpi->use_ducky_encode = 0;
1731
1732
0
  cm->error->setjmp = 0;
1733
0
  return cpi;
1734
0
}
1735
1736
#if CONFIG_INTERNAL_STATS
1737
#define SNPRINT(H, T) snprintf((H) + strlen(H), sizeof(H) - strlen(H), (T))
1738
1739
#define SNPRINT2(H, T, V) \
1740
  snprintf((H) + strlen(H), sizeof(H) - strlen(H), (T), (V))
1741
#endif  // CONFIG_INTERNAL_STATS
1742
1743
0
void av1_remove_primary_compressor(AV1_PRIMARY *ppi) {
1744
0
  if (!ppi) return;
1745
0
#if !CONFIG_REALTIME_ONLY
1746
0
  av1_tf_info_free(&ppi->tf_info);
1747
0
#endif  // !CONFIG_REALTIME_ONLY
1748
1749
0
  for (int i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) {
1750
0
    aom_free(ppi->level_params.level_info[i]);
1751
0
  }
1752
0
  av1_lookahead_destroy(ppi->lookahead);
1753
1754
0
  aom_free(ppi->tpl_sb_rdmult_scaling_factors);
1755
0
  ppi->tpl_sb_rdmult_scaling_factors = NULL;
1756
1757
0
  TplParams *const tpl_data = &ppi->tpl_data;
1758
0
  aom_free(tpl_data->txfm_stats_list);
1759
1760
0
  for (int frame = 0; frame < MAX_LAG_BUFFERS; ++frame) {
1761
0
    aom_free(tpl_data->tpl_stats_pool[frame]);
1762
0
    aom_free_frame_buffer(&tpl_data->tpl_rec_pool[frame]);
1763
0
    aom_free_frame_buffer(&tpl_data->prev_gop_arf_src);
1764
0
    aom_free_frame_buffer(&tpl_data->prev_gop_arf_tpl_recon);
1765
0
    tpl_data->prev_gop_arf_disp_order = -1;
1766
0
    tpl_data->tpl_stats_pool[frame] = NULL;
1767
0
  }
1768
1769
0
#if !CONFIG_REALTIME_ONLY
1770
0
  av1_tpl_dealloc(&tpl_data->tpl_mt_sync);
1771
0
#endif
1772
1773
0
  av1_terminate_workers(ppi);
1774
0
  free_thread_data(ppi);
1775
1776
0
  aom_free(ppi->p_mt_info.tile_thr_data);
1777
0
  ppi->p_mt_info.tile_thr_data = NULL;
1778
0
  aom_free(ppi->p_mt_info.workers);
1779
0
  ppi->p_mt_info.workers = NULL;
1780
0
  ppi->p_mt_info.num_workers = 0;
1781
1782
0
  aom_free(ppi);
1783
0
}
1784
1785
0
void av1_remove_compressor(AV1_COMP *cpi) {
1786
0
  if (!cpi) return;
1787
#if CONFIG_RATECTRL_LOG
1788
  if (cpi->oxcf.pass == 3) {
1789
    rc_log_show(&cpi->rc_log);
1790
  }
1791
#endif  // CONFIG_RATECTRL_LOG
1792
1793
0
  AV1_COMMON *cm = &cpi->common;
1794
0
  if (cm->current_frame.frame_number > 0) {
1795
#if CONFIG_SPEED_STATS
1796
    if (!is_stat_generation_stage(cpi)) {
1797
      fprintf(stdout, "tx_search_count = %d\n", cpi->tx_search_count);
1798
    }
1799
#endif  // CONFIG_SPEED_STATS
1800
1801
#if CONFIG_COLLECT_PARTITION_STATS == 2
1802
    if (!is_stat_generation_stage(cpi)) {
1803
      av1_print_fr_partition_timing_stats(&cpi->partition_stats,
1804
                                          "fr_part_timing_data.csv");
1805
    }
1806
#endif
1807
0
  }
1808
1809
#if CONFIG_AV1_TEMPORAL_DENOISING
1810
  av1_denoiser_free(&(cpi->denoiser));
1811
#endif
1812
1813
0
  if (cm->error) {
1814
    // Help detect use after free of the error detail string.
1815
0
    memset(cm->error->detail, 'A', sizeof(cm->error->detail) - 1);
1816
0
    cm->error->detail[sizeof(cm->error->detail) - 1] = '\0';
1817
0
    aom_free(cm->error);
1818
0
  }
1819
0
  aom_free(cpi->td.tctx);
1820
0
  MultiThreadInfo *const mt_info = &cpi->mt_info;
1821
0
#if CONFIG_MULTITHREAD
1822
0
  pthread_mutex_t *const enc_row_mt_mutex_ = mt_info->enc_row_mt.mutex_;
1823
0
  pthread_cond_t *const enc_row_mt_cond_ = mt_info->enc_row_mt.cond_;
1824
0
  pthread_mutex_t *const gm_mt_mutex_ = mt_info->gm_sync.mutex_;
1825
0
  pthread_mutex_t *const tpl_error_mutex_ = mt_info->tpl_row_mt.mutex_;
1826
0
  pthread_mutex_t *const pack_bs_mt_mutex_ = mt_info->pack_bs_sync.mutex_;
1827
0
  if (enc_row_mt_mutex_ != NULL) {
1828
0
    pthread_mutex_destroy(enc_row_mt_mutex_);
1829
0
    aom_free(enc_row_mt_mutex_);
1830
0
  }
1831
0
  if (enc_row_mt_cond_ != NULL) {
1832
0
    pthread_cond_destroy(enc_row_mt_cond_);
1833
0
    aom_free(enc_row_mt_cond_);
1834
0
  }
1835
0
  if (gm_mt_mutex_ != NULL) {
1836
0
    pthread_mutex_destroy(gm_mt_mutex_);
1837
0
    aom_free(gm_mt_mutex_);
1838
0
  }
1839
0
  if (tpl_error_mutex_ != NULL) {
1840
0
    pthread_mutex_destroy(tpl_error_mutex_);
1841
0
    aom_free(tpl_error_mutex_);
1842
0
  }
1843
0
  if (pack_bs_mt_mutex_ != NULL) {
1844
0
    pthread_mutex_destroy(pack_bs_mt_mutex_);
1845
0
    aom_free(pack_bs_mt_mutex_);
1846
0
  }
1847
0
#endif
1848
0
  av1_row_mt_mem_dealloc(cpi);
1849
1850
0
  if (mt_info->num_workers > 1) {
1851
0
    av1_row_mt_sync_mem_dealloc(&cpi->ppi->intra_row_mt_sync);
1852
0
    av1_loop_filter_dealloc(&mt_info->lf_row_sync);
1853
0
    av1_cdef_mt_dealloc(&mt_info->cdef_sync);
1854
0
#if !CONFIG_REALTIME_ONLY
1855
0
    av1_loop_restoration_dealloc(&mt_info->lr_row_sync);
1856
0
    av1_tf_mt_dealloc(&mt_info->tf_sync);
1857
0
#endif
1858
0
  }
1859
1860
#if CONFIG_THREE_PASS
1861
  av1_free_thirdpass_ctx(cpi->third_pass_ctx);
1862
1863
  av1_close_second_pass_log(cpi);
1864
#endif
1865
1866
0
  dealloc_compressor_data(cpi);
1867
1868
0
  av1_ext_part_delete(&cpi->ext_part_controller);
1869
1870
0
  av1_remove_common(cm);
1871
1872
0
  aom_free(cpi);
1873
1874
#ifdef OUTPUT_YUV_REC
1875
  fclose(yuv_rec_file);
1876
#endif
1877
1878
#ifdef OUTPUT_YUV_DENOISED
1879
  fclose(yuv_denoised_file);
1880
#endif
1881
0
}
1882
1883
0
static void generate_psnr_packet(AV1_COMP *cpi) {
1884
0
  struct aom_codec_cx_pkt pkt;
1885
0
  int i;
1886
0
  PSNR_STATS psnr;
1887
0
#if CONFIG_AV1_HIGHBITDEPTH
1888
0
  const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth;
1889
0
  const uint32_t bit_depth = cpi->td.mb.e_mbd.bd;
1890
0
  aom_calc_highbd_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr,
1891
0
                       bit_depth, in_bit_depth);
1892
#else
1893
  aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr);
1894
#endif
1895
1896
0
  for (i = 0; i < 4; ++i) {
1897
0
    pkt.data.psnr.samples[i] = psnr.samples[i];
1898
0
    pkt.data.psnr.sse[i] = psnr.sse[i];
1899
0
    pkt.data.psnr.psnr[i] = psnr.psnr[i];
1900
0
  }
1901
1902
0
#if CONFIG_AV1_HIGHBITDEPTH
1903
0
  if ((cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) &&
1904
0
      (in_bit_depth < bit_depth)) {
1905
0
    for (i = 0; i < 4; ++i) {
1906
0
      pkt.data.psnr.samples_hbd[i] = psnr.samples_hbd[i];
1907
0
      pkt.data.psnr.sse_hbd[i] = psnr.sse_hbd[i];
1908
0
      pkt.data.psnr.psnr_hbd[i] = psnr.psnr_hbd[i];
1909
0
    }
1910
0
  }
1911
0
#endif
1912
1913
0
  pkt.kind = AOM_CODEC_PSNR_PKT;
1914
0
  aom_codec_pkt_list_add(cpi->ppi->output_pkt_list, &pkt);
1915
0
}
1916
1917
0
int av1_use_as_reference(int *ext_ref_frame_flags, int ref_frame_flags) {
1918
0
  if (ref_frame_flags > ((1 << INTER_REFS_PER_FRAME) - 1)) return -1;
1919
1920
0
  *ext_ref_frame_flags = ref_frame_flags;
1921
0
  return 0;
1922
0
}
1923
1924
0
int av1_copy_reference_enc(AV1_COMP *cpi, int idx, YV12_BUFFER_CONFIG *sd) {
1925
0
  AV1_COMMON *const cm = &cpi->common;
1926
0
  const int num_planes = av1_num_planes(cm);
1927
0
  YV12_BUFFER_CONFIG *cfg = get_ref_frame(cm, idx);
1928
0
  if (cfg) {
1929
0
    aom_yv12_copy_frame(cfg, sd, num_planes);
1930
0
    return 0;
1931
0
  } else {
1932
0
    return -1;
1933
0
  }
1934
0
}
1935
1936
0
int av1_set_reference_enc(AV1_COMP *cpi, int idx, YV12_BUFFER_CONFIG *sd) {
1937
0
  AV1_COMMON *const cm = &cpi->common;
1938
0
  const int num_planes = av1_num_planes(cm);
1939
0
  YV12_BUFFER_CONFIG *cfg = get_ref_frame(cm, idx);
1940
0
  if (cfg) {
1941
0
    aom_yv12_copy_frame(sd, cfg, num_planes);
1942
0
    return 0;
1943
0
  } else {
1944
0
    return -1;
1945
0
  }
1946
0
}
1947
1948
#ifdef OUTPUT_YUV_REC
1949
static void aom_write_one_yuv_frame(AV1_COMMON *cm, YV12_BUFFER_CONFIG *s) {
1950
  uint8_t *src = s->y_buffer;
1951
  int h = cm->height;
1952
  if (yuv_rec_file == NULL) return;
1953
  if (s->flags & YV12_FLAG_HIGHBITDEPTH) {
1954
    uint16_t *src16 = CONVERT_TO_SHORTPTR(s->y_buffer);
1955
1956
    do {
1957
      fwrite(src16, s->y_width, 2, yuv_rec_file);
1958
      src16 += s->y_stride;
1959
    } while (--h);
1960
1961
    src16 = CONVERT_TO_SHORTPTR(s->u_buffer);
1962
    h = s->uv_height;
1963
1964
    do {
1965
      fwrite(src16, s->uv_width, 2, yuv_rec_file);
1966
      src16 += s->uv_stride;
1967
    } while (--h);
1968
1969
    src16 = CONVERT_TO_SHORTPTR(s->v_buffer);
1970
    h = s->uv_height;
1971
1972
    do {
1973
      fwrite(src16, s->uv_width, 2, yuv_rec_file);
1974
      src16 += s->uv_stride;
1975
    } while (--h);
1976
1977
    fflush(yuv_rec_file);
1978
    return;
1979
  }
1980
1981
  do {
1982
    fwrite(src, s->y_width, 1, yuv_rec_file);
1983
    src += s->y_stride;
1984
  } while (--h);
1985
1986
  src = s->u_buffer;
1987
  h = s->uv_height;
1988
1989
  do {
1990
    fwrite(src, s->uv_width, 1, yuv_rec_file);
1991
    src += s->uv_stride;
1992
  } while (--h);
1993
1994
  src = s->v_buffer;
1995
  h = s->uv_height;
1996
1997
  do {
1998
    fwrite(src, s->uv_width, 1, yuv_rec_file);
1999
    src += s->uv_stride;
2000
  } while (--h);
2001
2002
  fflush(yuv_rec_file);
2003
}
2004
#endif  // OUTPUT_YUV_REC
2005
2006
0
void av1_set_mv_search_params(AV1_COMP *cpi) {
2007
0
  const AV1_COMMON *const cm = &cpi->common;
2008
0
  MotionVectorSearchParams *const mv_search_params = &cpi->mv_search_params;
2009
0
  const int max_mv_def = AOMMAX(cm->width, cm->height);
2010
2011
  // Default based on max resolution.
2012
0
  mv_search_params->mv_step_param = av1_init_search_range(max_mv_def);
2013
2014
0
  if (cpi->sf.mv_sf.auto_mv_step_size) {
2015
0
    if (frame_is_intra_only(cm)) {
2016
      // Initialize max_mv_magnitude for use in the first INTER frame
2017
      // after a key/intra-only frame.
2018
0
      mv_search_params->max_mv_magnitude = max_mv_def;
2019
0
    } else {
2020
      // Use adaptive mv steps based on previous frame stats for show frames and
2021
      // internal arfs.
2022
0
      FRAME_UPDATE_TYPE cur_update_type =
2023
0
          cpi->ppi->gf_group.update_type[cpi->gf_frame_index];
2024
0
      int use_auto_mv_step =
2025
0
          (cm->show_frame || cur_update_type == INTNL_ARF_UPDATE) &&
2026
0
          mv_search_params->max_mv_magnitude != -1 &&
2027
0
          cpi->sf.mv_sf.auto_mv_step_size >= 2;
2028
0
      if (use_auto_mv_step) {
2029
        // Allow mv_steps to correspond to twice the max mv magnitude found
2030
        // in the previous frame, capped by the default max_mv_magnitude based
2031
        // on resolution.
2032
0
        mv_search_params->mv_step_param = av1_init_search_range(
2033
0
            AOMMIN(max_mv_def, 2 * mv_search_params->max_mv_magnitude));
2034
0
      }
2035
      // Reset max_mv_magnitude based on update flag.
2036
0
      if (cpi->do_frame_data_update) mv_search_params->max_mv_magnitude = -1;
2037
0
    }
2038
0
  }
2039
0
}
2040
2041
// Estimate if the source frame is screen content, based on the portion of
2042
// blocks that have few luma colors.
2043
0
static void estimate_screen_content(AV1_COMP *cpi, FeatureFlags *features) {
2044
0
  const AV1_COMMON *const cm = &cpi->common;
2045
0
  const MACROBLOCKD *const xd = &cpi->td.mb.e_mbd;
2046
0
  const uint8_t *src = cpi->unfiltered_source->y_buffer;
2047
0
  assert(src != NULL);
2048
0
  const int use_hbd = cpi->unfiltered_source->flags & YV12_FLAG_HIGHBITDEPTH;
2049
0
  const int stride = cpi->unfiltered_source->y_stride;
2050
0
  const int width = cpi->unfiltered_source->y_width;
2051
0
  const int height = cpi->unfiltered_source->y_height;
2052
0
  const int64_t area = (int64_t)width * height;
2053
0
  const int bd = cm->seq_params->bit_depth;
2054
0
  const int kBlockWidth = 16;
2055
0
  const int kBlockHeight = 16;
2056
0
  const int kBlockArea = kBlockWidth * kBlockHeight;
2057
  // These threshold values are selected experimentally.
2058
0
  const int kColorThresh = 4;
2059
0
  const unsigned int kVarThresh = 0;
2060
  // Counts of blocks with no more than kColorThresh colors.
2061
0
  int64_t counts_1 = 0;
2062
  // Counts of blocks with no more than kColorThresh colors and variance larger
2063
  // than kVarThresh.
2064
0
  int64_t counts_2 = 0;
2065
2066
0
  for (int r = 0; r + kBlockHeight <= height; r += kBlockHeight) {
2067
0
    for (int c = 0; c + kBlockWidth <= width; c += kBlockWidth) {
2068
0
      int count_buf[1 << 8];  // Maximum (1 << 8) bins for hbd path.
2069
0
      const uint8_t *const this_src = src + r * stride + c;
2070
0
      int n_colors;
2071
0
      if (use_hbd) {
2072
0
        av1_count_colors_highbd(this_src, stride, /*rows=*/kBlockHeight,
2073
0
                                /*cols=*/kBlockWidth, bd, NULL, count_buf,
2074
0
                                &n_colors, NULL);
2075
0
      } else {
2076
0
        av1_count_colors(this_src, stride, /*rows=*/kBlockHeight,
2077
0
                         /*cols=*/kBlockWidth, count_buf, &n_colors);
2078
0
      }
2079
0
      if (n_colors > 1 && n_colors <= kColorThresh) {
2080
0
        ++counts_1;
2081
0
        struct buf_2d buf;
2082
0
        buf.stride = stride;
2083
0
        buf.buf = (uint8_t *)this_src;
2084
0
        const unsigned int var = av1_get_perpixel_variance(
2085
0
            cpi, xd, &buf, BLOCK_16X16, AOM_PLANE_Y, use_hbd);
2086
0
        if (var > kVarThresh) ++counts_2;
2087
0
      }
2088
0
    }
2089
0
  }
2090
2091
  // The threshold values are selected experimentally.
2092
0
  features->allow_screen_content_tools = counts_1 * kBlockArea * 10 > area;
2093
  // IntraBC would force loop filters off, so we use more strict rules that also
2094
  // requires that the block has high variance.
2095
0
  features->allow_intrabc =
2096
0
      features->allow_screen_content_tools && counts_2 * kBlockArea * 12 > area;
2097
0
  cpi->use_screen_content_tools = features->allow_screen_content_tools;
2098
0
  cpi->is_screen_content_type =
2099
0
      features->allow_intrabc || (counts_1 * kBlockArea * 10 > area * 4 &&
2100
0
                                  counts_2 * kBlockArea * 30 > area);
2101
0
}
2102
2103
// Macro that helps debug the screen content mode 2 mechanism
2104
// #define OUTPUT_SCR_DET_MODE2_STATS
2105
2106
/*!\brief Helper function that finds the dominant value of a block.
2107
 *
2108
 * This function builds a histogram of all 256 possible (8 bit) values, and
2109
 * returns with the value with the greatest count (i.e. the dominant value).
2110
 */
2111
uint8_t av1_find_dominant_value(const uint8_t *src, int stride, int rows,
2112
0
                                int cols) {
2113
0
  uint32_t value_count[1 << 8] = { 0 };  // Maximum (1 << 8) value levels.
2114
0
  uint32_t dominant_value_count = 0;
2115
0
  uint8_t dominant_value = 0;
2116
2117
0
  for (int r = 0; r < rows; ++r) {
2118
0
    for (int c = 0; c < cols; ++c) {
2119
0
      const uint8_t value = src[r * (ptrdiff_t)stride + c];
2120
2121
0
      value_count[value]++;
2122
2123
0
      if (value_count[value] > dominant_value_count) {
2124
0
        dominant_value = value;
2125
0
        dominant_value_count = value_count[value];
2126
0
      }
2127
0
    }
2128
0
  }
2129
2130
0
  return dominant_value;
2131
0
}
2132
2133
/*!\brief Helper function that performs one round of image dilation on a block.
2134
 *
2135
 * This function finds the dominant value (i.e. the value that appears most
2136
 * often within a block), then performs a round of dilation by "extending" all
2137
 * occurrences of the dominant value outwards in all 8 directions (4 sides + 4
2138
 * corners).
2139
 *
2140
 * For a visual example, let:
2141
 *  - D: the dominant value
2142
 *  - [a-p]: different non-dominant values (usually anti-aliased pixels)
2143
 *  - .: the most common non-dominant value
2144
 *
2145
 * Before dilation:       After dilation:
2146
 * . . a b D c d . .     . . D D D D D . .
2147
 * . e f D D D g h .     D D D D D D D D D
2148
 * . D D D D D D D .     D D D D D D D D D
2149
 * . D D D D D D D .     D D D D D D D D D
2150
 * . i j D D D k l .     D D D D D D D D D
2151
 * . . m n D o p . .     . . D D D D D . .
2152
 */
2153
void av1_dilate_block(const uint8_t *src, int src_stride, uint8_t *dilated,
2154
0
                      int dilated_stride, int rows, int cols) {
2155
0
  uint8_t dominant_value = av1_find_dominant_value(src, src_stride, rows, cols);
2156
2157
0
  for (int r = 0; r < rows; ++r) {
2158
0
    for (int c = 0; c < cols; ++c) {
2159
0
      const uint8_t value = src[r * (ptrdiff_t)src_stride + c];
2160
2161
0
      dilated[r * (ptrdiff_t)dilated_stride + c] = value;
2162
0
    }
2163
0
  }
2164
2165
0
  for (int r = 0; r < rows; ++r) {
2166
0
    for (int c = 0; c < cols; ++c) {
2167
0
      const uint8_t value = src[r * (ptrdiff_t)src_stride + c];
2168
2169
0
      if (value == dominant_value) {
2170
        // Dilate up
2171
0
        if (r != 0) {
2172
0
          dilated[(r - 1) * (ptrdiff_t)dilated_stride + c] = value;
2173
0
        }
2174
        // Dilate down
2175
0
        if (r != rows - 1) {
2176
0
          dilated[(r + 1) * (ptrdiff_t)dilated_stride + c] = value;
2177
0
        }
2178
        // Dilate left
2179
0
        if (c != 0) {
2180
0
          dilated[r * (ptrdiff_t)dilated_stride + (c - 1)] = value;
2181
0
        }
2182
        // Dilate right
2183
0
        if (c != cols - 1) {
2184
0
          dilated[r * (ptrdiff_t)dilated_stride + (c + 1)] = value;
2185
0
        }
2186
        // Dilate upper-left corner
2187
0
        if (r != 0 && c != 0) {
2188
0
          dilated[(r - 1) * (ptrdiff_t)dilated_stride + (c - 1)] = value;
2189
0
        }
2190
        // Dilate upper-right corner
2191
0
        if (r != 0 && c != cols - 1) {
2192
0
          dilated[(r - 1) * (ptrdiff_t)dilated_stride + (c + 1)] = value;
2193
0
        }
2194
        // Dilate lower-left corner
2195
0
        if (r != rows - 1 && c != 0) {
2196
0
          dilated[(r + 1) * (ptrdiff_t)dilated_stride + (c - 1)] = value;
2197
0
        }
2198
        // Dilate lower-right corner
2199
0
        if (r != rows - 1 && c != cols - 1) {
2200
0
          dilated[(r + 1) * (ptrdiff_t)dilated_stride + (c + 1)] = value;
2201
0
        }
2202
0
      }
2203
0
    }
2204
0
  }
2205
0
}
2206
2207
/*!\brief Estimates if the source frame is a candidate to enable palette mode
2208
 * and intra block copy, with an accurate detection of anti-aliased text and
2209
 * graphics.
2210
 *
2211
 * Screen content detection is done by dividing frame's luma plane (Y) into
2212
 * small blocks, counting how many unique colors each block contains and
2213
 * their per-pixel variance, and classifying these blocks into three main
2214
 * categories:
2215
 * 1. Palettizable blocks, low variance (can use palette mode)
2216
 * 2. Palettizable blocks, high variance (can use palette mode and IntraBC)
2217
 * 3. Non palettizable, photo-like blocks (can neither use palette mode nor
2218
 *    IntraBC)
2219
 * Finally, this function decides whether the frame could benefit from
2220
 * enabling palette mode with or without IntraBC, based on the ratio of the
2221
 * three categories mentioned above.
2222
 */
2223
static void estimate_screen_content_antialiasing_aware(AV1_COMP *cpi,
2224
0
                                                       FeatureFlags *features) {
2225
0
  enum {
2226
0
    kBlockWidth = 16,
2227
0
    kBlockHeight = 16,
2228
0
    kBlockArea = kBlockWidth * kBlockHeight
2229
0
  };
2230
2231
0
  const bool fast_detection =
2232
0
      cpi->sf.hl_sf.screen_detection_mode2_fast_detection;
2233
0
  const AV1_COMMON *const cm = &cpi->common;
2234
0
  const MACROBLOCKD *const xd = &cpi->td.mb.e_mbd;
2235
0
  const uint8_t *src = cpi->unfiltered_source->y_buffer;
2236
0
  assert(src != NULL);
2237
0
  const int use_hbd = cpi->unfiltered_source->flags & YV12_FLAG_HIGHBITDEPTH;
2238
0
  const int stride = cpi->unfiltered_source->y_stride;
2239
0
  const int width = cpi->unfiltered_source->y_width;
2240
0
  const int height = cpi->unfiltered_source->y_height;
2241
0
  const int64_t area = (int64_t)width * height;
2242
0
  const int bd = cm->seq_params->bit_depth;
2243
  // Holds the down-converted block to 8 bit (if source is HBD)
2244
0
  uint8_t downconv_blk[kBlockArea];
2245
  // Holds the block after a round of dilation
2246
0
  uint8_t dilated_blk[kBlockArea];
2247
2248
  // These threshold values are selected experimentally
2249
  // Detects text and glyphs without anti-aliasing, and graphics with a 4-color
2250
  // palette
2251
0
  const int kSimpleColorThresh = 4;
2252
  // Detects potential text and glyphs with anti-aliasing, and graphics with a
2253
  // more extended color palette
2254
0
  const int kComplexInitialColorThresh = 40;
2255
  // Detects text and glyphs with anti-aliasing, and graphics with a more
2256
  // extended color palette
2257
0
  const int kComplexFinalColorThresh = 6;
2258
  // Threshold used to classify low-variance and high-variance blocks
2259
0
  const int kVarThresh = 5;
2260
  // Count of blocks that are candidates for using palette mode
2261
0
  int64_t count_palette = 0;
2262
  // Count of blocks that are candidates for using IntraBC
2263
0
  int64_t count_intrabc = 0;
2264
  // Count of "photo-like" blocks (i.e. can't use palette mode or IntraBC)
2265
0
  int64_t count_photo = 0;
2266
2267
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2268
  FILE *stats_file;
2269
  stats_file = fopen("scrdetm2.stt", "a");
2270
2271
  fprintf(stats_file, "\n");
2272
  fprintf(stats_file, "Screen detection mode 2 image map legend\n");
2273
  if (fast_detection) {
2274
    fprintf(stats_file, "Fast detection enabled\n");
2275
  }
2276
  fprintf(stats_file,
2277
          "-------------------------------------------------------\n");
2278
  fprintf(stats_file,
2279
          "S: simple block, high var    C: complex block, high var\n");
2280
  fprintf(stats_file,
2281
          "-: simple block, low var     =: complex block, low var \n");
2282
  fprintf(stats_file,
2283
          "x: photo-like block          .: non-palettizable block \n");
2284
  fprintf(stats_file,
2285
          "(whitespace): solid block                              \n");
2286
  fprintf(stats_file,
2287
          "-------------------------------------------------------\n");
2288
#endif
2289
2290
  // Skip every other block and weigh each block twice as much when performing
2291
  // fast detection
2292
0
  const int multiplier = fast_detection ? 2 : 1;
2293
2294
0
  for (int r = 0; r + kBlockHeight <= height; r += kBlockHeight) {
2295
    // Alternate skipping in a "checkerboard" pattern when performing fast
2296
    // detection
2297
0
    const int initial_col =
2298
0
        (fast_detection && (r / kBlockHeight) % 2) ? kBlockWidth : 0;
2299
2300
0
    for (int c = initial_col; c + kBlockWidth <= width;
2301
0
         c += kBlockWidth * multiplier) {
2302
0
      const uint8_t *blk_src = src + r * (ptrdiff_t)stride + c;
2303
0
      const uint8_t *blk = blk_src;
2304
0
      int blk_stride = stride;
2305
2306
      // Down-convert pixels to 8-bit domain if source is HBD
2307
0
      if (use_hbd) {
2308
0
        const uint16_t *blk_src_hbd = CONVERT_TO_SHORTPTR(blk_src);
2309
2310
0
        for (int blk_r = 0; blk_r < kBlockHeight; ++blk_r) {
2311
0
          for (int blk_c = 0; blk_c < kBlockWidth; ++blk_c) {
2312
0
            const int downconv_val =
2313
0
                (blk_src_hbd[blk_r * (ptrdiff_t)stride + blk_c]) >> (bd - 8);
2314
2315
            // Ensure down-converted value is 8-bit
2316
0
            assert(downconv_val < (1 << 8));
2317
0
            downconv_blk[blk_r * (ptrdiff_t)kBlockWidth + blk_c] = downconv_val;
2318
0
          }
2319
0
        }
2320
2321
        // Switch block source and stride to down-converted buffer and its width
2322
0
        blk = downconv_blk;
2323
0
        blk_stride = kBlockWidth;
2324
0
      }
2325
2326
      // First, find if the block could be palettized
2327
0
      int number_of_colors;
2328
0
      bool under_threshold = av1_count_colors_with_threshold(
2329
0
          blk, blk_stride, /*rows=*/kBlockHeight,
2330
0
          /*cols=*/kBlockWidth, kComplexInitialColorThresh, &number_of_colors);
2331
0
      if (number_of_colors > 1 && under_threshold) {
2332
0
        struct buf_2d buf;
2333
0
        buf.stride = stride;
2334
0
        buf.buf = (uint8_t *)blk_src;
2335
2336
0
        if (number_of_colors <= kSimpleColorThresh) {
2337
          // Simple block detected, add to block count with no further
2338
          // processing required
2339
0
          ++count_palette;
2340
          // Variance always comes from the source image with no down-conversion
2341
0
          int var = av1_get_perpixel_variance(cpi, xd, &buf, BLOCK_16X16,
2342
0
                                              AOM_PLANE_Y, use_hbd);
2343
2344
0
          if (var > kVarThresh) {
2345
0
            ++count_intrabc;
2346
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2347
            fprintf(stats_file, "S");
2348
          } else {
2349
            fprintf(stats_file, "-");
2350
#endif
2351
0
          }
2352
0
        } else {
2353
          // Complex block detected, try to find if it's palettizable
2354
          // Dilate block with dominant color, to exclude anti-aliased pixels
2355
          // from final palette count
2356
0
          av1_dilate_block(blk, blk_stride, dilated_blk, kBlockWidth,
2357
0
                           /*rows=*/kBlockHeight, /*cols=*/kBlockWidth);
2358
0
          under_threshold = av1_count_colors_with_threshold(
2359
0
              dilated_blk, kBlockWidth, /*rows=*/kBlockHeight,
2360
0
              /*cols=*/kBlockWidth, kComplexFinalColorThresh,
2361
0
              &number_of_colors);
2362
2363
0
          if (under_threshold) {
2364
            // Variance always comes from the source image with no
2365
            // down-conversion
2366
0
            int var = av1_get_perpixel_variance(cpi, xd, &buf, BLOCK_16X16,
2367
0
                                                AOM_PLANE_Y, use_hbd);
2368
2369
0
            if (var > kVarThresh) {
2370
0
              ++count_palette;
2371
0
              ++count_intrabc;
2372
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2373
              fprintf(stats_file, "C");
2374
            } else {
2375
              fprintf(stats_file, "=");
2376
#endif
2377
0
            }
2378
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2379
          } else {
2380
            fprintf(stats_file, ".");
2381
#endif
2382
0
          }
2383
0
        }
2384
0
      } else {
2385
0
        if (number_of_colors > kComplexInitialColorThresh) {
2386
0
          ++count_photo;
2387
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2388
          fprintf(stats_file, "x");
2389
        } else {
2390
          fprintf(stats_file, " ");  // Solid block (1 color)
2391
#endif
2392
0
        }
2393
0
      }
2394
0
    }
2395
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2396
    fprintf(stats_file, "\n");
2397
#endif
2398
0
  }
2399
2400
  // Normalize counts to account for the blocks that were skipped
2401
0
  if (fast_detection) {
2402
0
    count_photo *= multiplier;
2403
0
    count_palette *= multiplier;
2404
0
    count_intrabc *= multiplier;
2405
0
  }
2406
2407
  // The threshold values are selected experimentally.
2408
  // Penalize presence of photo-like blocks (1/16th the weight of a palettizable
2409
  // block)
2410
0
  features->allow_screen_content_tools =
2411
0
      ((count_palette - count_photo / 16) * kBlockArea * 10 > area);
2412
2413
  // IntraBC would force loop filters off, so we use more strict rules that also
2414
  // requires that the block has high variance.
2415
  // Penalize presence of photo-like blocks (1/16th the weight of a palettizable
2416
  // block)
2417
0
  features->allow_intrabc =
2418
0
      features->allow_screen_content_tools &&
2419
0
      ((count_intrabc - count_photo / 16) * kBlockArea * 12 > area);
2420
0
  cpi->use_screen_content_tools = features->allow_screen_content_tools;
2421
0
  cpi->is_screen_content_type =
2422
0
      features->allow_intrabc || (count_palette * kBlockArea * 15 > area * 4 &&
2423
0
                                  count_intrabc * kBlockArea * 30 > area);
2424
2425
#ifdef OUTPUT_SCR_DET_MODE2_STATS
2426
  fprintf(stats_file,
2427
          "block count palette: %" PRId64 ", count intrabc: %" PRId64
2428
          ", count photo: %" PRId64 ", total: %d\n",
2429
          count_palette, count_intrabc, count_photo,
2430
          (int)(ceil(width / kBlockWidth) * ceil(height / kBlockHeight)));
2431
  fprintf(stats_file, "sc palette value: %" PRId64 ", threshold %" PRId64 "\n",
2432
          (count_palette - count_photo / 16) * kBlockArea * 10, area);
2433
  fprintf(stats_file, "sc ibc value: %" PRId64 ", threshold %" PRId64 "\n",
2434
          (count_intrabc - count_photo / 16) * kBlockArea * 12, area);
2435
  fprintf(stats_file, "allow sct: %d, allow ibc: %d\n",
2436
          features->allow_screen_content_tools, features->allow_intrabc);
2437
#endif
2438
0
}
2439
2440
0
void av1_set_screen_content_options(AV1_COMP *cpi, FeatureFlags *features) {
2441
0
  const AV1_COMMON *const cm = &cpi->common;
2442
2443
0
  if (cm->seq_params->force_screen_content_tools != 2) {
2444
0
    features->allow_screen_content_tools = features->allow_intrabc =
2445
0
        cm->seq_params->force_screen_content_tools;
2446
0
    return;
2447
0
  }
2448
2449
0
  if (cpi->oxcf.tune_cfg.content == AOM_CONTENT_SCREEN) {
2450
0
    features->allow_screen_content_tools = 1;
2451
0
    features->allow_intrabc = cpi->oxcf.mode == REALTIME ? 0 : 1;
2452
0
    cpi->is_screen_content_type = 1;
2453
0
    cpi->use_screen_content_tools = 1;
2454
0
    return;
2455
0
  }
2456
2457
0
  if (cpi->oxcf.mode == REALTIME) {
2458
0
    features->allow_screen_content_tools = features->allow_intrabc = 0;
2459
0
    return;
2460
0
  }
2461
2462
  // Screen content tools are not evaluated in non-RD encoding mode unless
2463
  // content type is not set explicitly, i.e., when
2464
  // cpi->oxcf.tune_cfg.content != AOM_CONTENT_SCREEN, use_nonrd_pick_mode = 1
2465
  // and hybrid_intra_pickmode = 0. Hence, screen content detection is
2466
  // disabled.
2467
0
  if (cpi->sf.rt_sf.use_nonrd_pick_mode &&
2468
0
      !cpi->sf.rt_sf.hybrid_intra_pickmode) {
2469
0
    features->allow_screen_content_tools = features->allow_intrabc = 0;
2470
0
    return;
2471
0
  }
2472
2473
0
  if (cpi->oxcf.algo_cfg.screen_detection_mode ==
2474
0
      AOM_SCREEN_DETECTION_ANTIALIASING_AWARE) {
2475
0
    estimate_screen_content_antialiasing_aware(cpi, features);
2476
0
  } else {
2477
0
    estimate_screen_content(cpi, features);
2478
0
  }
2479
0
}
2480
2481
0
static void init_motion_estimation(AV1_COMP *cpi) {
2482
0
  AV1_COMMON *const cm = &cpi->common;
2483
0
  MotionVectorSearchParams *const mv_search_params = &cpi->mv_search_params;
2484
0
  const int aligned_width = (cm->width + 7) & ~7;
2485
0
  const int y_stride =
2486
0
      aom_calc_y_stride(aligned_width, cpi->oxcf.border_in_pixels);
2487
0
  const int y_stride_src = ((cpi->oxcf.frm_dim_cfg.width != cm->width ||
2488
0
                             cpi->oxcf.frm_dim_cfg.height != cm->height) ||
2489
0
                            av1_superres_scaled(cm))
2490
0
                               ? y_stride
2491
0
                               : cpi->ppi->lookahead->buf->img.y_stride;
2492
0
  int fpf_y_stride =
2493
0
      cm->cur_frame != NULL ? cm->cur_frame->buf.y_stride : y_stride;
2494
2495
  // Update if search_site_cfg is uninitialized or the current frame has a new
2496
  // stride
2497
0
  const int should_update =
2498
0
      !mv_search_params->search_site_cfg[SS_CFG_SRC][DIAMOND].stride ||
2499
0
      !mv_search_params->search_site_cfg[SS_CFG_LOOKAHEAD][DIAMOND].stride ||
2500
0
      (y_stride !=
2501
0
       mv_search_params->search_site_cfg[SS_CFG_SRC][DIAMOND].stride);
2502
2503
0
  if (!should_update) {
2504
0
    return;
2505
0
  }
2506
2507
  // Initialization of search_site_cfg for NUM_DISTINCT_SEARCH_METHODS.
2508
0
  for (SEARCH_METHODS i = DIAMOND; i < NUM_DISTINCT_SEARCH_METHODS; i++) {
2509
0
    const int level = ((i == NSTEP_8PT) || (i == CLAMPED_DIAMOND)) ? 1 : 0;
2510
0
    av1_init_motion_compensation[i](
2511
0
        &mv_search_params->search_site_cfg[SS_CFG_SRC][i], y_stride, level);
2512
0
    av1_init_motion_compensation[i](
2513
0
        &mv_search_params->search_site_cfg[SS_CFG_LOOKAHEAD][i], y_stride_src,
2514
0
        level);
2515
0
  }
2516
2517
  // First pass search site config initialization.
2518
0
  av1_init_motion_fpf(&mv_search_params->search_site_cfg[SS_CFG_FPF][DIAMOND],
2519
0
                      fpf_y_stride);
2520
0
  for (SEARCH_METHODS i = NSTEP; i < NUM_DISTINCT_SEARCH_METHODS; i++) {
2521
0
    memcpy(&mv_search_params->search_site_cfg[SS_CFG_FPF][i],
2522
0
           &mv_search_params->search_site_cfg[SS_CFG_FPF][DIAMOND],
2523
0
           sizeof(search_site_config));
2524
0
  }
2525
0
}
2526
2527
0
static void init_ref_frame_bufs(AV1_COMP *cpi) {
2528
0
  AV1_COMMON *const cm = &cpi->common;
2529
0
  int i;
2530
0
  if (cm->cur_frame) {
2531
0
    cm->cur_frame->ref_count--;
2532
0
    cm->cur_frame = NULL;
2533
0
  }
2534
0
  for (i = 0; i < REF_FRAMES; ++i) {
2535
0
    if (cm->ref_frame_map[i]) {
2536
0
      cm->ref_frame_map[i]->ref_count--;
2537
0
      cm->ref_frame_map[i] = NULL;
2538
0
    }
2539
0
  }
2540
0
#ifndef NDEBUG
2541
0
  BufferPool *const pool = cm->buffer_pool;
2542
0
  for (i = 0; i < pool->num_frame_bufs; ++i) {
2543
0
    assert(pool->frame_bufs[i].ref_count == 0);
2544
0
  }
2545
0
#endif
2546
0
}
2547
2548
// TODO(chengchen): consider renaming this function as it is necessary
2549
// for the encoder to setup critical parameters, and it does not
2550
// deal with initial width any longer.
2551
aom_codec_err_t av1_check_initial_width(AV1_COMP *cpi, int use_highbitdepth,
2552
0
                                        int subsampling_x, int subsampling_y) {
2553
0
  AV1_COMMON *const cm = &cpi->common;
2554
0
  SequenceHeader *const seq_params = cm->seq_params;
2555
2556
0
  if (!cpi->frame_size_related_setup_done ||
2557
0
      seq_params->use_highbitdepth != use_highbitdepth ||
2558
0
      seq_params->subsampling_x != subsampling_x ||
2559
0
      seq_params->subsampling_y != subsampling_y) {
2560
0
    seq_params->subsampling_x = subsampling_x;
2561
0
    seq_params->subsampling_y = subsampling_y;
2562
0
    seq_params->use_highbitdepth = use_highbitdepth;
2563
2564
0
    av1_set_speed_features_framesize_independent(cpi, cpi->oxcf.speed);
2565
0
    av1_set_speed_features_framesize_dependent(cpi, cpi->oxcf.speed);
2566
2567
0
    if (!is_stat_generation_stage(cpi)) {
2568
0
#if !CONFIG_REALTIME_ONLY
2569
0
      if (!av1_tf_info_alloc(&cpi->ppi->tf_info, cpi))
2570
0
        return AOM_CODEC_MEM_ERROR;
2571
0
#endif  // !CONFIG_REALTIME_ONLY
2572
0
    }
2573
0
    init_ref_frame_bufs(cpi);
2574
2575
0
    init_motion_estimation(cpi);  // TODO(agrange) This can be removed.
2576
2577
0
    cpi->initial_mbs = cm->mi_params.MBs;
2578
0
    cpi->frame_size_related_setup_done = true;
2579
0
  }
2580
0
  return AOM_CODEC_OK;
2581
0
}
2582
2583
#if CONFIG_AV1_TEMPORAL_DENOISING
2584
static void setup_denoiser_buffer(AV1_COMP *cpi) {
2585
  AV1_COMMON *const cm = &cpi->common;
2586
  if (cpi->oxcf.noise_sensitivity > 0 &&
2587
      !cpi->denoiser.frame_buffer_initialized) {
2588
    if (av1_denoiser_alloc(
2589
            cm, &cpi->svc, &cpi->denoiser, cpi->ppi->use_svc,
2590
            cpi->oxcf.noise_sensitivity, cm->width, cm->height,
2591
            cm->seq_params->subsampling_x, cm->seq_params->subsampling_y,
2592
            cm->seq_params->use_highbitdepth, AOM_BORDER_IN_PIXELS))
2593
      aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
2594
                         "Failed to allocate denoiser");
2595
  }
2596
}
2597
#endif
2598
2599
// Returns 1 if the assigned width or height was <= 0.
2600
0
static int set_size_literal(AV1_COMP *cpi, int width, int height) {
2601
0
  AV1_COMMON *cm = &cpi->common;
2602
0
  aom_codec_err_t err = av1_check_initial_width(
2603
0
      cpi, cm->seq_params->use_highbitdepth, cm->seq_params->subsampling_x,
2604
0
      cm->seq_params->subsampling_y);
2605
0
  if (err != AOM_CODEC_OK) {
2606
0
    aom_internal_error(cm->error, err, "av1_check_initial_width() failed");
2607
0
  }
2608
2609
0
  if (width <= 0 || height <= 0) return 1;
2610
2611
0
  cm->width = width;
2612
0
  cm->height = height;
2613
2614
#if CONFIG_AV1_TEMPORAL_DENOISING
2615
  setup_denoiser_buffer(cpi);
2616
#endif
2617
2618
0
  if (cm->width > cpi->data_alloc_width ||
2619
0
      cm->height > cpi->data_alloc_height) {
2620
0
    av1_free_context_buffers(cm);
2621
0
    av1_free_shared_coeff_buffer(&cpi->td.shared_coeff_buf);
2622
0
    av1_free_sms_tree(&cpi->td);
2623
0
    av1_free_pmc(cpi->td.firstpass_ctx, av1_num_planes(cm));
2624
0
    cpi->td.firstpass_ctx = NULL;
2625
0
    alloc_compressor_data(cpi);
2626
0
    realloc_segmentation_maps(cpi);
2627
0
    cpi->data_alloc_width = cm->width;
2628
0
    cpi->data_alloc_height = cm->height;
2629
0
    cpi->frame_size_related_setup_done = false;
2630
0
  }
2631
0
  alloc_mb_mode_info_buffers(cpi);
2632
0
  av1_update_frame_size(cpi);
2633
2634
0
  return 0;
2635
0
}
2636
2637
0
void av1_set_frame_size(AV1_COMP *cpi, int width, int height) {
2638
0
  AV1_COMMON *const cm = &cpi->common;
2639
0
  const SequenceHeader *const seq_params = cm->seq_params;
2640
0
  const int num_planes = av1_num_planes(cm);
2641
0
  MACROBLOCKD *const xd = &cpi->td.mb.e_mbd;
2642
0
  int ref_frame;
2643
2644
0
  if (width != cm->width || height != cm->height) {
2645
    // There has been a change in the encoded frame size
2646
0
    set_size_literal(cpi, width, height);
2647
    // Recalculate 'all_lossless' in case super-resolution was (un)selected.
2648
0
    cm->features.all_lossless =
2649
0
        cm->features.coded_lossless && !av1_superres_scaled(cm);
2650
2651
0
    av1_noise_estimate_init(&cpi->noise_estimate, cm->width, cm->height);
2652
#if CONFIG_AV1_TEMPORAL_DENOISING
2653
    // Reset the denoiser on the resized frame.
2654
    if (cpi->oxcf.noise_sensitivity > 0) {
2655
      av1_denoiser_free(&(cpi->denoiser));
2656
      setup_denoiser_buffer(cpi);
2657
    }
2658
#endif
2659
0
  }
2660
0
  if (is_stat_consumption_stage(cpi)) {
2661
0
    av1_set_target_rate(cpi, cm->width, cm->height);
2662
0
  }
2663
2664
0
  alloc_frame_mvs(cm, cm->cur_frame);
2665
2666
  // Allocate above context buffers
2667
0
  CommonContexts *const above_contexts = &cm->above_contexts;
2668
0
  if (above_contexts->num_planes < av1_num_planes(cm) ||
2669
0
      above_contexts->num_mi_cols < cm->mi_params.mi_cols ||
2670
0
      above_contexts->num_tile_rows < cm->tiles.rows) {
2671
0
    av1_free_above_context_buffers(above_contexts);
2672
0
    if (av1_alloc_above_context_buffers(above_contexts, cm->tiles.rows,
2673
0
                                        cm->mi_params.mi_cols,
2674
0
                                        av1_num_planes(cm)))
2675
0
      aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
2676
0
                         "Failed to allocate context buffers");
2677
0
  }
2678
2679
0
  AV1EncoderConfig *oxcf = &cpi->oxcf;
2680
0
  oxcf->border_in_pixels = av1_get_enc_border_size(
2681
0
      av1_is_resize_needed(oxcf), oxcf->kf_cfg.key_freq_max == 0,
2682
0
      cm->seq_params->sb_size);
2683
2684
  // Reset the frame pointers to the current frame size.
2685
0
  if (aom_realloc_frame_buffer(
2686
0
          &cm->cur_frame->buf, cm->width, cm->height, seq_params->subsampling_x,
2687
0
          seq_params->subsampling_y, seq_params->use_highbitdepth,
2688
0
          cpi->oxcf.border_in_pixels, cm->features.byte_alignment, NULL, NULL,
2689
0
          NULL, cpi->alloc_pyramid, 0))
2690
0
    aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
2691
0
                       "Failed to allocate frame buffer");
2692
2693
0
  if (!is_stat_generation_stage(cpi)) av1_init_cdef_worker(cpi);
2694
2695
0
#if !CONFIG_REALTIME_ONLY
2696
0
  if (is_restoration_used(cm)) {
2697
0
    for (int i = 0; i < num_planes; ++i)
2698
0
      cm->rst_info[i].frame_restoration_type = RESTORE_NONE;
2699
2700
0
    const bool is_sgr_enabled = !cpi->sf.lpf_sf.disable_sgr_filter;
2701
0
    av1_alloc_restoration_buffers(cm, is_sgr_enabled);
2702
    // Store the allocated restoration buffers in MT object.
2703
0
    if (cpi->ppi->p_mt_info.num_workers > 1) {
2704
0
      av1_init_lr_mt_buffers(cpi);
2705
0
    }
2706
0
  }
2707
0
#endif
2708
2709
0
  init_motion_estimation(cpi);
2710
2711
0
  int has_valid_ref_frame = 0;
2712
0
  for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
2713
0
    RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame);
2714
0
    if (buf != NULL) {
2715
0
      struct scale_factors *sf = get_ref_scale_factors(cm, ref_frame);
2716
0
      av1_setup_scale_factors_for_frame(sf, buf->buf.y_crop_width,
2717
0
                                        buf->buf.y_crop_height, cm->width,
2718
0
                                        cm->height);
2719
0
      has_valid_ref_frame |= av1_is_valid_scale(sf);
2720
0
      if (av1_is_scaled(sf)) aom_extend_frame_borders(&buf->buf, num_planes);
2721
0
    }
2722
0
  }
2723
  // For 1 pass CBR mode: we can skip this check for spatial enhancement
2724
  // layer if the target_bandwidth is zero, since it will be dropped.
2725
0
  const bool dropped_frame =
2726
0
      has_no_stats_stage(cpi) && cpi->oxcf.rc_cfg.mode == AOM_CBR &&
2727
0
      cpi->svc.spatial_layer_id > 0 && cpi->oxcf.rc_cfg.target_bandwidth == 0;
2728
0
  if (!frame_is_intra_only(cm) && !has_valid_ref_frame && !dropped_frame) {
2729
0
    aom_internal_error(
2730
0
        cm->error, AOM_CODEC_CORRUPT_FRAME,
2731
0
        "Can't find at least one reference frame with valid size");
2732
0
  }
2733
2734
0
  av1_setup_scale_factors_for_frame(&cm->sf_identity, cm->width, cm->height,
2735
0
                                    cm->width, cm->height);
2736
2737
0
  set_ref_ptrs(cm, xd, LAST_FRAME, LAST_FRAME);
2738
0
}
2739
2740
static inline int extend_borders_mt(const AV1_COMP *cpi,
2741
0
                                    MULTI_THREADED_MODULES stage, int plane) {
2742
0
  const AV1_COMMON *const cm = &cpi->common;
2743
0
  if (cpi->mt_info.num_mod_workers[stage] < 2) return 0;
2744
0
  switch (stage) {
2745
    // TODO(deepa.kg@ittiam.com): When cdef and loop-restoration are disabled,
2746
    // multi-thread frame border extension along with loop filter frame.
2747
    // As loop-filtering of a superblock row modifies the pixels of the
2748
    // above superblock row, border extension requires that loop filtering
2749
    // of the current and above superblock row is complete.
2750
0
    case MOD_LPF: return 0;
2751
0
    case MOD_CDEF:
2752
0
      return is_cdef_used(cm) && !cpi->ppi->rtc_ref.non_reference_frame &&
2753
0
             !is_restoration_used(cm) && !av1_superres_scaled(cm);
2754
0
    case MOD_LR:
2755
0
      return is_restoration_used(cm) &&
2756
0
             (cm->rst_info[plane].frame_restoration_type != RESTORE_NONE);
2757
0
    default: assert(0);
2758
0
  }
2759
0
  return 0;
2760
0
}
2761
2762
/*!\brief Select and apply cdef filters and switchable restoration filters
2763
 *
2764
 * \ingroup high_level_algo
2765
 */
2766
static void cdef_restoration_frame(AV1_COMP *cpi, AV1_COMMON *cm,
2767
                                   MACROBLOCKD *xd, int use_restoration,
2768
                                   int use_cdef,
2769
0
                                   unsigned int skip_apply_postproc_filters) {
2770
0
#if !CONFIG_REALTIME_ONLY
2771
0
  if (use_restoration)
2772
0
    av1_loop_restoration_save_boundary_lines(&cm->cur_frame->buf, cm, 0);
2773
#else
2774
  (void)use_restoration;
2775
#endif
2776
2777
0
  if (use_cdef) {
2778
#if CONFIG_COLLECT_COMPONENT_TIMING
2779
    start_timing(cpi, cdef_time);
2780
#endif
2781
0
    const int num_workers = cpi->mt_info.num_mod_workers[MOD_CDEF];
2782
    // Find CDEF parameters
2783
0
    av1_cdef_search(cpi);
2784
2785
    // Apply the filter
2786
0
    if ((skip_apply_postproc_filters & SKIP_APPLY_CDEF) == 0) {
2787
0
      assert(!cpi->ppi->rtc_ref.non_reference_frame);
2788
0
      if (num_workers > 1) {
2789
        // Extension of frame borders is multi-threaded along with cdef.
2790
0
        const int do_extend_border =
2791
0
            extend_borders_mt(cpi, MOD_CDEF, /* plane */ 0);
2792
0
        av1_cdef_frame_mt(cm, xd, cpi->mt_info.cdef_worker,
2793
0
                          cpi->mt_info.workers, &cpi->mt_info.cdef_sync,
2794
0
                          num_workers, av1_cdef_init_fb_row_mt,
2795
0
                          do_extend_border);
2796
0
      } else {
2797
0
        av1_cdef_frame(&cm->cur_frame->buf, cm, xd, av1_cdef_init_fb_row);
2798
0
      }
2799
0
    }
2800
#if CONFIG_COLLECT_COMPONENT_TIMING
2801
    end_timing(cpi, cdef_time);
2802
#endif
2803
0
  }
2804
2805
0
  const int use_superres = av1_superres_scaled(cm);
2806
0
  if (use_superres) {
2807
0
    if ((skip_apply_postproc_filters & SKIP_APPLY_SUPERRES) == 0) {
2808
0
      av1_superres_post_encode(cpi);
2809
0
    }
2810
0
  }
2811
2812
0
#if !CONFIG_REALTIME_ONLY
2813
#if CONFIG_COLLECT_COMPONENT_TIMING
2814
  start_timing(cpi, loop_restoration_time);
2815
#endif
2816
0
  if (use_restoration) {
2817
0
    MultiThreadInfo *const mt_info = &cpi->mt_info;
2818
0
    const int num_workers = mt_info->num_mod_workers[MOD_LR];
2819
0
    av1_loop_restoration_save_boundary_lines(&cm->cur_frame->buf, cm, 1);
2820
0
    av1_pick_filter_restoration(cpi->source, cpi);
2821
0
    if ((skip_apply_postproc_filters & SKIP_APPLY_RESTORATION) == 0 &&
2822
0
        (cm->rst_info[0].frame_restoration_type != RESTORE_NONE ||
2823
0
         cm->rst_info[1].frame_restoration_type != RESTORE_NONE ||
2824
0
         cm->rst_info[2].frame_restoration_type != RESTORE_NONE)) {
2825
0
      if (num_workers > 1) {
2826
        // Extension of frame borders is multi-threaded along with loop
2827
        // restoration filter.
2828
0
        const int do_extend_border = 1;
2829
0
        av1_loop_restoration_filter_frame_mt(
2830
0
            &cm->cur_frame->buf, cm, 0, mt_info->workers, num_workers,
2831
0
            &mt_info->lr_row_sync, &cpi->lr_ctxt, do_extend_border);
2832
0
      } else {
2833
0
        av1_loop_restoration_filter_frame(&cm->cur_frame->buf, cm, 0,
2834
0
                                          &cpi->lr_ctxt);
2835
0
      }
2836
0
    }
2837
0
  }
2838
#if CONFIG_COLLECT_COMPONENT_TIMING
2839
  end_timing(cpi, loop_restoration_time);
2840
#endif
2841
0
#endif  // !CONFIG_REALTIME_ONLY
2842
0
}
2843
2844
0
static void extend_frame_borders(AV1_COMP *cpi) {
2845
0
  const AV1_COMMON *const cm = &cpi->common;
2846
  // TODO(debargha): Fix mv search range on encoder side
2847
0
  for (int plane = 0; plane < av1_num_planes(cm); ++plane) {
2848
0
    const bool extend_border_done = extend_borders_mt(cpi, MOD_CDEF, plane) ||
2849
0
                                    extend_borders_mt(cpi, MOD_LR, plane);
2850
0
    if (!extend_border_done) {
2851
0
      const YV12_BUFFER_CONFIG *const ybf = &cm->cur_frame->buf;
2852
0
      aom_extend_frame_borders_plane_row(ybf, plane, 0,
2853
0
                                         ybf->crop_heights[plane > 0]);
2854
0
    }
2855
0
  }
2856
0
}
2857
2858
/*!\brief Select and apply deblocking filters, cdef filters, and restoration
2859
 * filters.
2860
 *
2861
 * \ingroup high_level_algo
2862
 */
2863
0
static void loopfilter_frame(AV1_COMP *cpi, AV1_COMMON *cm) {
2864
0
  MultiThreadInfo *const mt_info = &cpi->mt_info;
2865
0
  const int num_workers = mt_info->num_mod_workers[MOD_LPF];
2866
0
  const int num_planes = av1_num_planes(cm);
2867
0
  MACROBLOCKD *xd = &cpi->td.mb.e_mbd;
2868
0
  cpi->td.mb.rdmult = cpi->rd.RDMULT;
2869
2870
0
  assert(IMPLIES(is_lossless_requested(&cpi->oxcf.rc_cfg),
2871
0
                 cm->features.coded_lossless && cm->features.all_lossless));
2872
2873
0
  const int use_loopfilter =
2874
0
      is_loopfilter_used(cm) && !cpi->mt_info.pipeline_lpf_mt_with_enc;
2875
0
  const int use_cdef = is_cdef_used(cm);
2876
0
  const int use_superres = av1_superres_scaled(cm);
2877
0
  const int use_restoration = is_restoration_used(cm);
2878
2879
0
  const unsigned int skip_apply_postproc_filters =
2880
0
      derive_skip_apply_postproc_filters(cpi, use_loopfilter, use_cdef,
2881
0
                                         use_superres, use_restoration);
2882
2883
#if CONFIG_COLLECT_COMPONENT_TIMING
2884
  start_timing(cpi, loop_filter_time);
2885
#endif
2886
0
  if (use_loopfilter) {
2887
0
    av1_pick_filter_level(cpi->source, cpi, cpi->sf.lpf_sf.lpf_pick);
2888
0
    struct loopfilter *lf = &cm->lf;
2889
0
    if ((lf->filter_level[0] || lf->filter_level[1]) &&
2890
0
        (skip_apply_postproc_filters & SKIP_APPLY_LOOPFILTER) == 0) {
2891
0
      assert(!cpi->ppi->rtc_ref.non_reference_frame);
2892
      // lpf_opt_level = 1 : Enables dual/quad loop-filtering.
2893
      // lpf_opt_level is set to 1 if transform size search depth in inter
2894
      // blocks is limited to one as quad loop filtering assumes that all the
2895
      // transform blocks within a 16x8/8x16/16x16 prediction block are of the
2896
      // same size. lpf_opt_level = 2 : Filters both chroma planes together, in
2897
      // addition to enabling dual/quad loop-filtering. This is enabled when lpf
2898
      // pick method is LPF_PICK_FROM_Q as u and v plane filter levels are
2899
      // equal.
2900
0
      int lpf_opt_level = get_lpf_opt_level(&cpi->sf);
2901
0
      av1_loop_filter_frame_mt(&cm->cur_frame->buf, cm, xd, 0, num_planes, 0,
2902
0
                               mt_info->workers, num_workers,
2903
0
                               &mt_info->lf_row_sync, lpf_opt_level);
2904
0
    }
2905
0
  }
2906
2907
#if CONFIG_COLLECT_COMPONENT_TIMING
2908
  end_timing(cpi, loop_filter_time);
2909
#endif
2910
2911
0
  cdef_restoration_frame(cpi, cm, xd, use_restoration, use_cdef,
2912
0
                         skip_apply_postproc_filters);
2913
0
}
2914
2915
0
static void update_motion_stat(AV1_COMP *const cpi) {
2916
0
  AV1_COMMON *const cm = &cpi->common;
2917
0
  const CommonModeInfoParams *const mi_params = &cm->mi_params;
2918
0
  RATE_CONTROL *const rc = &cpi->rc;
2919
0
  SVC *const svc = &cpi->svc;
2920
0
  const int avg_cnt_zeromv =
2921
0
      100 * cpi->rc.cnt_zeromv / (mi_params->mi_rows * mi_params->mi_cols);
2922
0
  if (!cpi->ppi->use_svc ||
2923
0
      (cpi->ppi->use_svc &&
2924
0
       !cpi->svc.layer_context[cpi->svc.temporal_layer_id].is_key_frame &&
2925
0
       cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1)) {
2926
0
    rc->avg_frame_low_motion =
2927
0
        (rc->avg_frame_low_motion == 0)
2928
0
            ? avg_cnt_zeromv
2929
0
            : (3 * rc->avg_frame_low_motion + avg_cnt_zeromv) / 4;
2930
    // For SVC: set avg_frame_low_motion (only computed on top spatial layer)
2931
    // to all lower spatial layers.
2932
0
    if (cpi->ppi->use_svc &&
2933
0
        svc->spatial_layer_id == svc->number_spatial_layers - 1) {
2934
0
      for (int i = 0; i < svc->number_spatial_layers - 1; ++i) {
2935
0
        const int layer = LAYER_IDS_TO_IDX(i, svc->temporal_layer_id,
2936
0
                                           svc->number_temporal_layers);
2937
0
        LAYER_CONTEXT *const lc = &svc->layer_context[layer];
2938
0
        RATE_CONTROL *const lrc = &lc->rc;
2939
0
        lrc->avg_frame_low_motion = rc->avg_frame_low_motion;
2940
0
      }
2941
0
    }
2942
0
  }
2943
0
}
2944
2945
/*!\brief Encode a frame without the recode loop, usually used in one-pass
2946
 * encoding and realtime coding.
2947
 *
2948
 * \ingroup high_level_algo
2949
 *
2950
 * \param[in]    cpi             Top-level encoder structure
2951
 *
2952
 * \return Returns a value to indicate if the encoding is done successfully.
2953
 * \retval #AOM_CODEC_OK
2954
 * \retval #AOM_CODEC_ERROR
2955
 */
2956
0
static int encode_without_recode(AV1_COMP *cpi) {
2957
0
  AV1_COMMON *const cm = &cpi->common;
2958
0
  const QuantizationCfg *const q_cfg = &cpi->oxcf.q_cfg;
2959
0
  SVC *const svc = &cpi->svc;
2960
0
  const int resize_pending = is_frame_resize_pending(cpi);
2961
0
  int top_index = 0, bottom_index = 0, q = 0;
2962
0
  YV12_BUFFER_CONFIG *unscaled = cpi->unscaled_source;
2963
0
  InterpFilter filter_scaler =
2964
0
      cpi->ppi->use_svc ? svc->downsample_filter_type[svc->spatial_layer_id]
2965
0
                        : EIGHTTAP_SMOOTH;
2966
0
  int phase_scaler = cpi->ppi->use_svc
2967
0
                         ? svc->downsample_filter_phase[svc->spatial_layer_id]
2968
0
                         : 0;
2969
2970
0
  if (cpi->rc.postencode_drop && allow_postencode_drop_rtc(cpi))
2971
0
    av1_save_all_coding_context(cpi);
2972
2973
0
  set_size_independent_vars(cpi);
2974
0
  av1_setup_frame_size(cpi);
2975
0
  cm->prev_frame = get_primary_ref_frame_buf(cm);
2976
0
  av1_set_size_dependent_vars(cpi, &q, &bottom_index, &top_index);
2977
0
  av1_set_mv_search_params(cpi);
2978
2979
0
  const SequenceHeader *seq_params = cm->seq_params;
2980
0
  if ((cpi->svc.source_last_TL0.buffer_alloc_sz == 0 ||
2981
0
       cpi->svc.source_last_TL0.y_crop_width != cpi->oxcf.frm_dim_cfg.width ||
2982
0
       cpi->svc.source_last_TL0.y_crop_height != cpi->oxcf.frm_dim_cfg.height ||
2983
0
       cpi->svc.source_last_TL0.subsampling_x != seq_params->subsampling_x ||
2984
0
       cpi->svc.source_last_TL0.subsampling_y != seq_params->subsampling_y ||
2985
0
       cpi->svc.source_last_TL0.flags != cpi->source->flags) &&
2986
0
      (cpi->ppi->use_svc || cpi->oxcf.rc_cfg.drop_frames_water_mark > 0)) {
2987
0
    if (aom_alloc_frame_buffer(
2988
0
            &cpi->svc.source_last_TL0, cpi->oxcf.frm_dim_cfg.width,
2989
0
            cpi->oxcf.frm_dim_cfg.height, seq_params->subsampling_x,
2990
0
            seq_params->subsampling_y, seq_params->use_highbitdepth,
2991
0
            cpi->oxcf.border_in_pixels, cm->features.byte_alignment, false,
2992
0
            0)) {
2993
0
      aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
2994
0
                         "Failed to allocate buffer for source_last_TL0");
2995
0
    }
2996
0
  }
2997
2998
0
  if (!cpi->ppi->use_svc) {
2999
0
    phase_scaler = 8;
3000
    // 2:1 scaling.
3001
0
    if ((cm->width << 1) == unscaled->y_crop_width &&
3002
0
        (cm->height << 1) == unscaled->y_crop_height) {
3003
0
      filter_scaler = BILINEAR;
3004
      // For lower resolutions use eighttap_smooth.
3005
0
      if (cm->width * cm->height <= 320 * 180) filter_scaler = EIGHTTAP_SMOOTH;
3006
0
    } else if ((cm->width << 2) == unscaled->y_crop_width &&
3007
0
               (cm->height << 2) == unscaled->y_crop_height) {
3008
      // 4:1 scaling.
3009
0
      filter_scaler = EIGHTTAP_SMOOTH;
3010
0
    } else if ((cm->width << 2) == 3 * unscaled->y_crop_width &&
3011
0
               (cm->height << 2) == 3 * unscaled->y_crop_height) {
3012
      // 4:3 scaling.
3013
0
      filter_scaler = EIGHTTAP_REGULAR;
3014
0
    }
3015
0
  }
3016
3017
0
  allocate_gradient_info_for_hog(cpi);
3018
3019
0
  allocate_src_var_of_4x4_sub_block_buf(cpi);
3020
3021
0
  const SPEED_FEATURES *sf = &cpi->sf;
3022
0
  if (sf->part_sf.partition_search_type == VAR_BASED_PARTITION)
3023
0
    variance_partition_alloc(cpi);
3024
3025
0
  if (cm->current_frame.frame_type == KEY_FRAME ||
3026
0
      ((sf->inter_sf.extra_prune_warped && cpi->refresh_frame.golden_frame)))
3027
0
    copy_frame_prob_info(cpi);
3028
3029
#if CONFIG_COLLECT_COMPONENT_TIMING
3030
  printf("\n Encoding a frame: \n");
3031
#endif
3032
3033
#if CONFIG_TUNE_BUTTERAUGLI
3034
  if (cpi->oxcf.tune_cfg.tuning == AOM_TUNE_BUTTERAUGLI) {
3035
    av1_setup_butteraugli_rdmult(cpi);
3036
  }
3037
#endif
3038
3039
0
  cpi->source = av1_realloc_and_scale_if_required(
3040
0
      cm, unscaled, &cpi->scaled_source, filter_scaler, phase_scaler, true,
3041
0
      false, cpi->oxcf.border_in_pixels, cpi->alloc_pyramid);
3042
0
  if (frame_is_intra_only(cm) || resize_pending != 0) {
3043
0
    const int current_size =
3044
0
        (cm->mi_params.mi_rows * cm->mi_params.mi_cols) >> 2;
3045
0
    if (cpi->consec_zero_mv &&
3046
0
        (cpi->consec_zero_mv_alloc_size < current_size)) {
3047
0
      aom_free(cpi->consec_zero_mv);
3048
0
      cpi->consec_zero_mv_alloc_size = 0;
3049
0
      CHECK_MEM_ERROR(cm, cpi->consec_zero_mv,
3050
0
                      aom_malloc(current_size * sizeof(*cpi->consec_zero_mv)));
3051
0
      cpi->consec_zero_mv_alloc_size = current_size;
3052
0
    }
3053
0
    assert(cpi->consec_zero_mv != NULL);
3054
0
    memset(cpi->consec_zero_mv, 0, current_size * sizeof(*cpi->consec_zero_mv));
3055
0
  }
3056
3057
0
  if (cpi->scaled_last_source_available) {
3058
0
    cpi->last_source = &cpi->scaled_last_source;
3059
0
    cpi->scaled_last_source_available = 0;
3060
0
  } else if (cpi->unscaled_last_source != NULL) {
3061
0
    cpi->last_source = av1_realloc_and_scale_if_required(
3062
0
        cm, cpi->unscaled_last_source, &cpi->scaled_last_source, filter_scaler,
3063
0
        phase_scaler, true, false, cpi->oxcf.border_in_pixels,
3064
0
        cpi->alloc_pyramid);
3065
0
  }
3066
3067
0
  if (cpi->sf.rt_sf.use_temporal_noise_estimate) {
3068
0
    av1_update_noise_estimate(cpi);
3069
0
  }
3070
3071
#if CONFIG_AV1_TEMPORAL_DENOISING
3072
  if (cpi->oxcf.noise_sensitivity > 0 && cpi->ppi->use_svc)
3073
    av1_denoiser_reset_on_first_frame(cpi);
3074
#endif
3075
3076
  // For 1 spatial layer encoding: if the (non-LAST) reference has different
3077
  // resolution from the source then disable that reference. This is to avoid
3078
  // significant increase in encode time from scaling the references in
3079
  // av1_scale_references. Note GOLDEN is forced to update on the (first/tigger)
3080
  // resized frame and ALTREF will be refreshed ~4 frames later, so both
3081
  // references become available again after few frames.
3082
  // For superres: don't disable golden reference.
3083
0
  if (svc->number_spatial_layers == 1) {
3084
0
    if (!cpi->oxcf.superres_cfg.enable_superres) {
3085
0
      if (cpi->ref_frame_flags & av1_ref_frame_flag_list[GOLDEN_FRAME]) {
3086
0
        const YV12_BUFFER_CONFIG *const ref =
3087
0
            get_ref_frame_yv12_buf(cm, GOLDEN_FRAME);
3088
0
        if (ref == NULL || ref->y_crop_width != cm->width ||
3089
0
            ref->y_crop_height != cm->height) {
3090
0
          cpi->ref_frame_flags ^= AOM_GOLD_FLAG;
3091
0
        }
3092
0
      }
3093
0
    }
3094
0
    if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ALTREF_FRAME]) {
3095
0
      const YV12_BUFFER_CONFIG *const ref =
3096
0
          get_ref_frame_yv12_buf(cm, ALTREF_FRAME);
3097
0
      if (ref == NULL || ref->y_crop_width != cm->width ||
3098
0
          ref->y_crop_height != cm->height) {
3099
0
        cpi->ref_frame_flags ^= AOM_ALT_FLAG;
3100
0
      }
3101
0
    }
3102
0
  }
3103
3104
0
  int scale_references = 0;
3105
#if CONFIG_FPMT_TEST
3106
  scale_references =
3107
      cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE ? 1 : 0;
3108
#endif  // CONFIG_FPMT_TEST
3109
0
  if (scale_references ||
3110
0
      cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 0) {
3111
0
    if (!frame_is_intra_only(cm)) {
3112
0
      av1_scale_references(cpi, filter_scaler, phase_scaler, 1);
3113
0
    }
3114
0
  }
3115
3116
0
  av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel, q,
3117
0
                    q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq,
3118
0
                    cpi->oxcf.mode == ALLINTRA, cpi->oxcf.tune_cfg.tuning);
3119
0
  av1_set_speed_features_qindex_dependent(cpi, cpi->oxcf.speed);
3120
0
  av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
3121
0
                     cm->seq_params->bit_depth, cpi->oxcf.algo_cfg.sharpness);
3122
0
  av1_set_variance_partition_thresholds(cpi, q, 0);
3123
0
  av1_setup_frame(cpi);
3124
3125
  // Check if this high_source_sad (scene/slide change) frame should be
3126
  // encoded at high/max QP, and if so, set the q and adjust some rate
3127
  // control parameters.
3128
0
  if (cpi->sf.rt_sf.overshoot_detection_cbr == FAST_DETECTION_MAXQ &&
3129
0
      cpi->rc.high_source_sad) {
3130
0
    if (av1_encodedframe_overshoot_cbr(cpi, &q)) {
3131
0
      av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel, q,
3132
0
                        q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq,
3133
0
                        cpi->oxcf.mode == ALLINTRA, cpi->oxcf.tune_cfg.tuning);
3134
0
      av1_set_speed_features_qindex_dependent(cpi, cpi->oxcf.speed);
3135
0
      av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
3136
0
                         cm->seq_params->bit_depth,
3137
0
                         cpi->oxcf.algo_cfg.sharpness);
3138
0
      av1_set_variance_partition_thresholds(cpi, q, 0);
3139
0
      if (frame_is_intra_only(cm) || cm->features.error_resilient_mode ||
3140
0
          cm->features.primary_ref_frame == PRIMARY_REF_NONE)
3141
0
        av1_setup_frame(cpi);
3142
0
    }
3143
0
  }
3144
0
  av1_apply_active_map(cpi);
3145
0
  if (cpi->roi.enabled) {
3146
    // For now if roi map is used: don't setup cyclic refresh.
3147
0
    av1_apply_roi_map(cpi);
3148
0
  } else if (q_cfg->aq_mode == CYCLIC_REFRESH_AQ) {
3149
0
    av1_cyclic_refresh_setup(cpi);
3150
0
  }
3151
0
  if (cm->seg.enabled) {
3152
0
    if (!cm->seg.update_data && cm->prev_frame) {
3153
0
      segfeatures_copy(&cm->seg, &cm->prev_frame->seg);
3154
0
      cm->seg.enabled = cm->prev_frame->seg.enabled;
3155
0
    } else {
3156
0
      av1_calculate_segdata(&cm->seg);
3157
0
    }
3158
0
  } else {
3159
0
    memset(&cm->seg, 0, sizeof(cm->seg));
3160
0
  }
3161
0
  segfeatures_copy(&cm->cur_frame->seg, &cm->seg);
3162
0
  cm->cur_frame->seg.enabled = cm->seg.enabled;
3163
3164
  // This is for rtc temporal filtering case.
3165
0
  if (is_psnr_calc_enabled(cpi) && cpi->sf.rt_sf.use_rtc_tf) {
3166
0
    if (cpi->orig_source.buffer_alloc_sz == 0 ||
3167
0
        cpi->orig_source.y_crop_width != cpi->source->y_crop_width ||
3168
0
        cpi->orig_source.y_crop_height != cpi->source->y_crop_height ||
3169
0
        cpi->orig_source.subsampling_x != cpi->source->subsampling_x ||
3170
0
        cpi->orig_source.subsampling_y != cpi->source->subsampling_y ||
3171
0
        cpi->orig_source.flags != cpi->source->flags) {
3172
      // Allocate a source buffer to store the original source for psnr
3173
      // calculation.
3174
0
      const int use_highbitdepth =
3175
0
          (cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) != 0;
3176
0
      if (aom_alloc_frame_buffer(&cpi->orig_source, cpi->source->y_crop_width,
3177
0
                                 cpi->source->y_crop_height,
3178
0
                                 cpi->source->subsampling_x,
3179
0
                                 cpi->source->subsampling_y, use_highbitdepth,
3180
0
                                 cpi->oxcf.border_in_pixels,
3181
0
                                 cm->features.byte_alignment, false, 0))
3182
0
        aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
3183
0
                           "Failed to allocate cpi->orig_source buffer");
3184
0
    }
3185
3186
0
    aom_yv12_copy_y(cpi->source, &cpi->orig_source, 1);
3187
0
    aom_yv12_copy_u(cpi->source, &cpi->orig_source, 1);
3188
0
    aom_yv12_copy_v(cpi->source, &cpi->orig_source, 1);
3189
0
  }
3190
3191
#if CONFIG_COLLECT_COMPONENT_TIMING
3192
  start_timing(cpi, av1_encode_frame_time);
3193
#endif
3194
3195
  // Set the motion vector precision based on mv stats from the last coded
3196
  // frame.
3197
0
  if (!frame_is_intra_only(cm)) av1_pick_and_set_high_precision_mv(cpi, q);
3198
3199
0
  if (svc->temporal_layer_id == 0) {
3200
0
    cpi->rc.num_col_blscroll_last_tl0 = 0;
3201
0
    cpi->rc.num_row_blscroll_last_tl0 = 0;
3202
0
  }
3203
3204
  // transform / motion compensation build reconstruction frame
3205
0
  av1_encode_frame(cpi);
3206
3207
0
  if (!cpi->rc.rtc_external_ratectrl && !frame_is_intra_only(cm))
3208
0
    update_motion_stat(cpi);
3209
3210
  // Adjust the refresh of the golden (longer-term) reference based on QP
3211
  // selected for this frame. This is for CBR real-time mode, and only
3212
  // for single layer without usage of the set_ref_frame_config (so
3213
  // reference structure for 1 layer is set internally).
3214
0
  if (!frame_is_intra_only(cm) && cpi->oxcf.rc_cfg.mode == AOM_CBR &&
3215
0
      cpi->oxcf.mode == REALTIME && svc->number_spatial_layers == 1 &&
3216
0
      svc->number_temporal_layers == 1 && !cpi->rc.rtc_external_ratectrl &&
3217
0
      !cpi->ppi->rtc_ref.set_ref_frame_config &&
3218
0
      sf->rt_sf.gf_refresh_based_on_qp)
3219
0
    av1_adjust_gf_refresh_qp_one_pass_rt(cpi);
3220
3221
  // For non-svc: if scaling is required, copy scaled_source
3222
  // into scaled_last_source.
3223
0
  if (cm->current_frame.frame_number > 1 && !cpi->ppi->use_svc &&
3224
0
      cpi->scaled_source.y_buffer != NULL &&
3225
0
      cpi->scaled_last_source.y_buffer != NULL &&
3226
0
      cpi->scaled_source.y_crop_width == cpi->scaled_last_source.y_crop_width &&
3227
0
      cpi->scaled_source.y_crop_height ==
3228
0
          cpi->scaled_last_source.y_crop_height &&
3229
0
      (cm->width != cpi->unscaled_source->y_crop_width ||
3230
0
       cm->height != cpi->unscaled_source->y_crop_height)) {
3231
0
    cpi->scaled_last_source_available = 1;
3232
0
    aom_yv12_copy_y(&cpi->scaled_source, &cpi->scaled_last_source, 1);
3233
0
    aom_yv12_copy_u(&cpi->scaled_source, &cpi->scaled_last_source, 1);
3234
0
    aom_yv12_copy_v(&cpi->scaled_source, &cpi->scaled_last_source, 1);
3235
0
  }
3236
3237
#if CONFIG_COLLECT_COMPONENT_TIMING
3238
  end_timing(cpi, av1_encode_frame_time);
3239
#endif
3240
#if CONFIG_INTERNAL_STATS
3241
  ++cpi->frame_recode_hits;
3242
#endif
3243
3244
0
  return AOM_CODEC_OK;
3245
0
}
3246
3247
#if !CONFIG_REALTIME_ONLY
3248
3249
/*!\brief Recode loop for encoding one frame. the purpose of encoding one frame
3250
 * for multiple times can be approaching a target bitrate or adjusting the usage
3251
 * of global motions.
3252
 *
3253
 * \ingroup high_level_algo
3254
 *
3255
 * \param[in]    cpi             Top-level encoder structure
3256
 * \param[in]    size            Bitstream size
3257
 * \param[out]   dest            Bitstream output buffer
3258
 * \param[in]    dest_size       Bitstream output buffer size
3259
 *
3260
 * \return Returns a value to indicate if the encoding is done successfully.
3261
 * \retval #AOM_CODEC_OK
3262
 * \retval -1
3263
 * \retval #AOM_CODEC_ERROR
3264
 */
3265
static int encode_with_recode_loop(AV1_COMP *cpi, size_t *size, uint8_t *dest,
3266
0
                                   size_t dest_size) {
3267
0
  AV1_COMMON *const cm = &cpi->common;
3268
0
  RATE_CONTROL *const rc = &cpi->rc;
3269
0
  GlobalMotionInfo *const gm_info = &cpi->gm_info;
3270
0
  const AV1EncoderConfig *const oxcf = &cpi->oxcf;
3271
0
  const QuantizationCfg *const q_cfg = &oxcf->q_cfg;
3272
0
  const int allow_recode = (cpi->sf.hl_sf.recode_loop != DISALLOW_RECODE);
3273
  // Must allow recode if minimum compression ratio is set.
3274
0
  assert(IMPLIES(oxcf->rc_cfg.min_cr > 0, allow_recode));
3275
3276
0
  set_size_independent_vars(cpi);
3277
0
  if (is_stat_consumption_stage_twopass(cpi) &&
3278
0
      cpi->sf.interp_sf.adaptive_interp_filter_search)
3279
0
    cpi->interp_search_flags.interp_filter_search_mask =
3280
0
        av1_setup_interp_filter_search_mask(cpi);
3281
3282
0
  av1_setup_frame_size(cpi);
3283
3284
0
  if (av1_superres_in_recode_allowed(cpi) &&
3285
0
      cpi->superres_mode != AOM_SUPERRES_NONE &&
3286
0
      cm->superres_scale_denominator == SCALE_NUMERATOR) {
3287
    // Superres mode is currently enabled, but the denominator selected will
3288
    // disable superres. So no need to continue, as we will go through another
3289
    // recode loop for full-resolution after this anyway.
3290
0
    return -1;
3291
0
  }
3292
3293
0
  int top_index = 0, bottom_index = 0;
3294
0
  int q = 0, q_low = 0, q_high = 0;
3295
0
  av1_set_size_dependent_vars(cpi, &q, &bottom_index, &top_index);
3296
0
  q_low = bottom_index;
3297
0
  q_high = top_index;
3298
3299
0
  av1_set_mv_search_params(cpi);
3300
3301
0
  allocate_gradient_info_for_hog(cpi);
3302
3303
0
  allocate_src_var_of_4x4_sub_block_buf(cpi);
3304
3305
0
  if (cpi->sf.part_sf.partition_search_type == VAR_BASED_PARTITION)
3306
0
    variance_partition_alloc(cpi);
3307
3308
0
  if (cm->current_frame.frame_type == KEY_FRAME) copy_frame_prob_info(cpi);
3309
3310
#if CONFIG_COLLECT_COMPONENT_TIMING
3311
  printf("\n Encoding a frame: \n");
3312
#endif
3313
3314
0
#if !CONFIG_RD_COMMAND
3315
  // Determine whether to use screen content tools using two fast encoding.
3316
0
  if (!cpi->sf.hl_sf.disable_extra_sc_testing && !cpi->use_ducky_encode)
3317
0
    av1_determine_sc_tools_with_encoding(cpi, q);
3318
0
#endif  // !CONFIG_RD_COMMAND
3319
3320
#if CONFIG_TUNE_VMAF
3321
  if (oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_NEG_MAX_GAIN) {
3322
    av1_vmaf_neg_preprocessing(cpi, cpi->unscaled_source);
3323
  }
3324
#endif
3325
3326
#if CONFIG_TUNE_BUTTERAUGLI
3327
  cpi->butteraugli_info.recon_set = false;
3328
  int original_q = 0;
3329
#endif
3330
3331
0
  cpi->num_frame_recode = 0;
3332
3333
  // Loop variables
3334
0
  int loop = 0;
3335
0
  int loop_count = 0;
3336
0
  int overshoot_seen = 0;
3337
0
  int undershoot_seen = 0;
3338
0
  int low_cr_seen = 0;
3339
0
  int last_loop_allow_hp = 0;
3340
3341
0
  do {
3342
0
    loop = 0;
3343
0
    int do_mv_stats_collection = 1;
3344
3345
    // if frame was scaled calculate global_motion_search again if already
3346
    // done
3347
0
    if (loop_count > 0 && cpi->source && gm_info->search_done) {
3348
0
      if (cpi->source->y_crop_width != cm->width ||
3349
0
          cpi->source->y_crop_height != cm->height) {
3350
0
        gm_info->search_done = 0;
3351
0
      }
3352
0
    }
3353
0
    cpi->source = av1_realloc_and_scale_if_required(
3354
0
        cm, cpi->unscaled_source, &cpi->scaled_source, EIGHTTAP_REGULAR, 0,
3355
0
        false, false, cpi->oxcf.border_in_pixels, cpi->alloc_pyramid);
3356
3357
#if CONFIG_TUNE_BUTTERAUGLI
3358
    if (oxcf->tune_cfg.tuning == AOM_TUNE_BUTTERAUGLI) {
3359
      if (loop_count == 0) {
3360
        original_q = q;
3361
        // TODO(sdeng): different q here does not make big difference. Use a
3362
        // faster pass instead.
3363
        q = 96;
3364
        av1_setup_butteraugli_source(cpi);
3365
      } else {
3366
        q = original_q;
3367
      }
3368
    }
3369
#endif
3370
3371
0
    if (cpi->unscaled_last_source != NULL) {
3372
0
      cpi->last_source = av1_realloc_and_scale_if_required(
3373
0
          cm, cpi->unscaled_last_source, &cpi->scaled_last_source,
3374
0
          EIGHTTAP_REGULAR, 0, false, false, cpi->oxcf.border_in_pixels,
3375
0
          cpi->alloc_pyramid);
3376
0
    }
3377
3378
0
    int scale_references = 0;
3379
#if CONFIG_FPMT_TEST
3380
    scale_references =
3381
        cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE ? 1 : 0;
3382
#endif  // CONFIG_FPMT_TEST
3383
0
    if (scale_references ||
3384
0
        cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 0) {
3385
0
      if (!frame_is_intra_only(cm)) {
3386
0
        if (loop_count > 0) {
3387
0
          release_scaled_references(cpi);
3388
0
        }
3389
0
        av1_scale_references(cpi, EIGHTTAP_REGULAR, 0, 0);
3390
0
      }
3391
0
    }
3392
3393
#if CONFIG_TUNE_VMAF
3394
    if (oxcf->tune_cfg.tuning >= AOM_TUNE_VMAF_WITH_PREPROCESSING &&
3395
        oxcf->tune_cfg.tuning <= AOM_TUNE_VMAF_NEG_MAX_GAIN) {
3396
      cpi->vmaf_info.original_qindex = q;
3397
      q = av1_get_vmaf_base_qindex(cpi, q);
3398
    }
3399
#endif
3400
3401
#if CONFIG_RD_COMMAND
3402
    RD_COMMAND *rd_command = &cpi->rd_command;
3403
    RD_OPTION option = rd_command->option_ls[rd_command->frame_index];
3404
    if (option == RD_OPTION_SET_Q || option == RD_OPTION_SET_Q_RDMULT) {
3405
      q = rd_command->q_index_ls[rd_command->frame_index];
3406
    }
3407
#endif  // CONFIG_RD_COMMAND
3408
3409
#if CONFIG_BITRATE_ACCURACY
3410
#if CONFIG_THREE_PASS
3411
    if (oxcf->pass == AOM_RC_THIRD_PASS && cpi->vbr_rc_info.ready == 1) {
3412
      int frame_coding_idx =
3413
          av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index);
3414
      if (frame_coding_idx < cpi->vbr_rc_info.total_frame_count) {
3415
        q = cpi->vbr_rc_info.q_index_list[frame_coding_idx];
3416
      } else {
3417
        // TODO(angiebird): Investigate why sometimes there is an extra frame
3418
        // after the last GOP.
3419
        q = cpi->vbr_rc_info.base_q_index;
3420
      }
3421
    }
3422
#else
3423
    if (cpi->vbr_rc_info.q_index_list_ready) {
3424
      q = cpi->vbr_rc_info.q_index_list[cpi->gf_frame_index];
3425
    }
3426
#endif  // CONFIG_THREE_PASS
3427
#endif  // CONFIG_BITRATE_ACCURACY
3428
3429
#if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY
3430
    // TODO(angiebird): Move this into a function.
3431
    if (oxcf->pass == AOM_RC_THIRD_PASS) {
3432
      int frame_coding_idx =
3433
          av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index);
3434
      double qstep_ratio = cpi->vbr_rc_info.qstep_ratio_list[frame_coding_idx];
3435
      FRAME_UPDATE_TYPE update_type =
3436
          cpi->vbr_rc_info.update_type_list[frame_coding_idx];
3437
      rc_log_frame_encode_param(&cpi->rc_log, frame_coding_idx, qstep_ratio, q,
3438
                                update_type);
3439
    }
3440
#endif  // CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY
3441
3442
0
    if (cpi->use_ducky_encode) {
3443
0
      const DuckyEncodeFrameInfo *frame_info =
3444
0
          &cpi->ducky_encode_info.frame_info;
3445
0
      if (frame_info->qp_mode == DUCKY_ENCODE_FRAME_MODE_QINDEX) {
3446
0
        q = frame_info->q_index;
3447
0
        cm->delta_q_info.delta_q_present_flag = frame_info->delta_q_enabled;
3448
0
      }
3449
0
    }
3450
3451
0
    if (av1_encode_for_extrc(&cpi->ext_ratectrl)) {
3452
0
      aom_codec_err_t codec_status;
3453
0
      aom_rc_encodeframe_decision_t encode_frame_decision;
3454
0
      const int sb_rows = CEIL_POWER_OF_TWO(cm->mi_params.mi_rows,
3455
0
                                            cm->seq_params->mib_size_log2);
3456
0
      const int sb_cols = CEIL_POWER_OF_TWO(cm->mi_params.mi_cols,
3457
0
                                            cm->seq_params->mib_size_log2);
3458
      // This assumes frame sizes don't change when used with external RC.
3459
      // cpi->ext_ratectrl is zero'ed at init.
3460
0
      if (cpi->ext_ratectrl.sb_params_list == NULL) {
3461
0
        CHECK_MEM_ERROR(
3462
0
            cm, cpi->ext_ratectrl.sb_params_list,
3463
0
            (aom_sb_params *)aom_calloc(
3464
0
                sb_rows * sb_cols, sizeof(*cpi->ext_ratectrl.sb_params_list)));
3465
0
      }
3466
0
      encode_frame_decision.sb_params_list = cpi->ext_ratectrl.sb_params_list;
3467
0
      encode_frame_decision.use_delta_q = &cpi->ext_ratectrl.use_delta_q;
3468
0
      codec_status = av1_extrc_get_encodeframe_decision(
3469
0
          &cpi->ext_ratectrl, cpi->gf_frame_index, &encode_frame_decision);
3470
0
      if (codec_status != AOM_CODEC_OK) {
3471
0
        aom_internal_error(cm->error, codec_status,
3472
0
                           "av1_extrc_get_encodeframe_decision() failed");
3473
0
      }
3474
      // If the external model recommends a reserved value, we use the default
3475
      // q.
3476
0
      if (encode_frame_decision.q_index != AOM_DEFAULT_Q) {
3477
0
        q = encode_frame_decision.q_index;
3478
0
      }
3479
0
    }
3480
3481
0
    av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel, q,
3482
0
                      q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq,
3483
0
                      oxcf->mode == ALLINTRA, oxcf->tune_cfg.tuning);
3484
0
    av1_set_speed_features_qindex_dependent(cpi, oxcf->speed);
3485
0
    av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
3486
0
                       cm->seq_params->bit_depth, cpi->oxcf.algo_cfg.sharpness);
3487
3488
0
    av1_set_variance_partition_thresholds(cpi, q, 0);
3489
3490
0
    if (loop_count == 0) {
3491
0
      av1_setup_frame(cpi);
3492
0
    } else if (get_primary_ref_frame_buf(cm) == NULL) {
3493
      // Base q-index may have changed, so we need to assign proper default coef
3494
      // probs before every iteration.
3495
0
      av1_default_coef_probs(cm);
3496
0
      av1_setup_frame_contexts(cm);
3497
0
    }
3498
3499
0
    if (q_cfg->aq_mode == VARIANCE_AQ) {
3500
0
      av1_vaq_frame_setup(cpi);
3501
0
    } else if (q_cfg->aq_mode == COMPLEXITY_AQ) {
3502
0
      av1_setup_in_frame_q_adj(cpi);
3503
0
    }
3504
3505
0
    if (cm->seg.enabled) {
3506
0
      if (!cm->seg.update_data && cm->prev_frame) {
3507
0
        segfeatures_copy(&cm->seg, &cm->prev_frame->seg);
3508
0
        cm->seg.enabled = cm->prev_frame->seg.enabled;
3509
0
      } else {
3510
0
        av1_calculate_segdata(&cm->seg);
3511
0
      }
3512
0
    } else {
3513
0
      memset(&cm->seg, 0, sizeof(cm->seg));
3514
0
    }
3515
0
    segfeatures_copy(&cm->cur_frame->seg, &cm->seg);
3516
0
    cm->cur_frame->seg.enabled = cm->seg.enabled;
3517
3518
#if CONFIG_COLLECT_COMPONENT_TIMING
3519
    start_timing(cpi, av1_encode_frame_time);
3520
#endif
3521
    // Set the motion vector precision based on mv stats from the last coded
3522
    // frame.
3523
0
    if (!frame_is_intra_only(cm)) {
3524
0
      av1_pick_and_set_high_precision_mv(cpi, q);
3525
3526
      // If the precision has changed during different iteration of the loop,
3527
      // then we need to reset the global motion vectors
3528
0
      if (loop_count > 0 &&
3529
0
          cm->features.allow_high_precision_mv != last_loop_allow_hp) {
3530
0
        gm_info->search_done = 0;
3531
0
      }
3532
0
      last_loop_allow_hp = cm->features.allow_high_precision_mv;
3533
0
    }
3534
3535
    // transform / motion compensation build reconstruction frame
3536
0
    av1_encode_frame(cpi);
3537
3538
    // Disable mv_stats collection for parallel frames based on update flag.
3539
0
    if (!cpi->do_frame_data_update) do_mv_stats_collection = 0;
3540
3541
    // Reset the mv_stats in case we are interrupted by an intraframe or an
3542
    // overlay frame.
3543
0
    if (cpi->mv_stats.valid && do_mv_stats_collection) av1_zero(cpi->mv_stats);
3544
3545
    // Gather the mv_stats for the next frame
3546
0
    if (cpi->sf.hl_sf.high_precision_mv_usage == LAST_MV_DATA &&
3547
0
        av1_frame_allows_smart_mv(cpi) && do_mv_stats_collection) {
3548
0
      av1_collect_mv_stats(cpi, q);
3549
0
    }
3550
3551
#if CONFIG_COLLECT_COMPONENT_TIMING
3552
    end_timing(cpi, av1_encode_frame_time);
3553
#endif
3554
3555
#if CONFIG_BITRATE_ACCURACY || CONFIG_RD_COMMAND
3556
    const int do_dummy_pack = 1;
3557
#else   // CONFIG_BITRATE_ACCURACY
3558
    // Dummy pack of the bitstream using up to date stats to get an
3559
    // accurate estimate of output frame size to determine if we need
3560
    // to recode.
3561
0
    const int do_dummy_pack =
3562
0
        (cpi->sf.hl_sf.recode_loop >= ALLOW_RECODE_KFARFGF &&
3563
0
         oxcf->rc_cfg.mode != AOM_Q) ||
3564
0
        oxcf->rc_cfg.min_cr > 0;
3565
0
#endif  // CONFIG_BITRATE_ACCURACY
3566
0
    if (do_dummy_pack) {
3567
0
      av1_finalize_encoded_frame(cpi);
3568
0
      int largest_tile_id = 0;  // Output from bitstream: unused here
3569
0
      rc->coefficient_size = 0;
3570
0
      if (av1_pack_bitstream(cpi, dest, dest_size, size, &largest_tile_id) !=
3571
0
          AOM_CODEC_OK) {
3572
0
        return AOM_CODEC_ERROR;
3573
0
      }
3574
3575
      // bits used for this frame
3576
0
      rc->projected_frame_size = (int)(*size) << 3;
3577
#if CONFIG_RD_COMMAND
3578
      PSNR_STATS psnr;
3579
      aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr);
3580
      printf("q %d rdmult %d rate %d dist %" PRIu64 "\n", q, cpi->rd.RDMULT,
3581
             rc->projected_frame_size, psnr.sse[0]);
3582
      ++rd_command->frame_index;
3583
      if (rd_command->frame_index == rd_command->frame_count) {
3584
        return AOM_CODEC_ERROR;
3585
      }
3586
#endif  // CONFIG_RD_COMMAND
3587
3588
#if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY
3589
      if (oxcf->pass == AOM_RC_THIRD_PASS) {
3590
        int frame_coding_idx =
3591
            av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index);
3592
        rc_log_frame_entropy(&cpi->rc_log, frame_coding_idx,
3593
                             rc->projected_frame_size, rc->coefficient_size);
3594
      }
3595
#endif  // CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY
3596
0
    }
3597
3598
#if CONFIG_TUNE_VMAF
3599
    if (oxcf->tune_cfg.tuning >= AOM_TUNE_VMAF_WITH_PREPROCESSING &&
3600
        oxcf->tune_cfg.tuning <= AOM_TUNE_VMAF_NEG_MAX_GAIN) {
3601
      q = cpi->vmaf_info.original_qindex;
3602
    }
3603
#endif
3604
0
    if (allow_recode) {
3605
      // Update q and decide whether to do a recode loop
3606
0
      recode_loop_update_q(cpi, &loop, &q, &q_low, &q_high, top_index,
3607
0
                           bottom_index, &undershoot_seen, &overshoot_seen,
3608
0
                           &low_cr_seen, loop_count);
3609
0
    }
3610
3611
#if CONFIG_TUNE_BUTTERAUGLI
3612
    if (loop_count == 0 && oxcf->tune_cfg.tuning == AOM_TUNE_BUTTERAUGLI) {
3613
      loop = 1;
3614
      av1_setup_butteraugli_rdmult_and_restore_source(cpi, 0.4);
3615
    }
3616
#endif
3617
3618
0
    if (cpi->use_ducky_encode) {
3619
      // Ducky encode currently does not support recode loop.
3620
0
      loop = 0;
3621
0
    }
3622
3623
    // Do not recode if external rate control is used.
3624
0
    if (av1_encode_for_extrc(&cpi->ext_ratectrl)) {
3625
0
      loop = 0;
3626
0
    }
3627
#if CONFIG_BITRATE_ACCURACY || CONFIG_RD_COMMAND
3628
    loop = 0;  // turn off recode loop when CONFIG_BITRATE_ACCURACY is on
3629
#endif         // CONFIG_BITRATE_ACCURACY || CONFIG_RD_COMMAND
3630
3631
0
    if (loop) {
3632
0
      ++loop_count;
3633
0
      cpi->num_frame_recode =
3634
0
          (cpi->num_frame_recode < (NUM_RECODES_PER_FRAME - 1))
3635
0
              ? (cpi->num_frame_recode + 1)
3636
0
              : (NUM_RECODES_PER_FRAME - 1);
3637
#if CONFIG_INTERNAL_STATS
3638
      ++cpi->frame_recode_hits;
3639
#endif
3640
0
    }
3641
#if CONFIG_COLLECT_COMPONENT_TIMING
3642
    if (loop) printf("\n Recoding:");
3643
#endif
3644
0
  } while (loop);
3645
3646
0
  return AOM_CODEC_OK;
3647
0
}
3648
#endif  // !CONFIG_REALTIME_ONLY
3649
3650
// TODO(jingning, paulwilkins): Set up high grain level to test
3651
// hardware decoders. Need to adapt the actual noise variance
3652
// according to the difference between reconstructed frame and the
3653
// source signal.
3654
0
static void set_grain_syn_params(AV1_COMMON *cm) {
3655
0
  aom_film_grain_t *film_grain_params = &cm->film_grain_params;
3656
0
  film_grain_params->apply_grain = 1;
3657
0
  film_grain_params->update_parameters = 1;
3658
0
  film_grain_params->random_seed = rand() & 0xffff;
3659
3660
0
  film_grain_params->num_y_points = 1;
3661
0
  film_grain_params->scaling_points_y[0][0] = 128;
3662
0
  film_grain_params->scaling_points_y[0][1] = 100;
3663
3664
0
  if (!cm->seq_params->monochrome) {
3665
0
    film_grain_params->num_cb_points = 1;
3666
0
    film_grain_params->scaling_points_cb[0][0] = 128;
3667
0
    film_grain_params->scaling_points_cb[0][1] = 100;
3668
3669
0
    film_grain_params->num_cr_points = 1;
3670
0
    film_grain_params->scaling_points_cr[0][0] = 128;
3671
0
    film_grain_params->scaling_points_cr[0][1] = 100;
3672
0
  } else {
3673
0
    film_grain_params->num_cb_points = 0;
3674
0
    film_grain_params->num_cr_points = 0;
3675
0
  }
3676
3677
0
  film_grain_params->chroma_scaling_from_luma = 0;
3678
3679
0
  film_grain_params->scaling_shift = 1;
3680
0
  film_grain_params->ar_coeff_lag = 0;
3681
0
  film_grain_params->ar_coeff_shift = 1;
3682
0
  film_grain_params->overlap_flag = 1;
3683
0
  film_grain_params->grain_scale_shift = 0;
3684
0
}
3685
3686
/*!\brief Recode loop or a single loop for encoding one frame, followed by
3687
 * in-loop deblocking filters, CDEF filters, and restoration filters.
3688
 *
3689
 * \ingroup high_level_algo
3690
 * \callgraph
3691
 * \callergraph
3692
 *
3693
 * \param[in]    cpi             Top-level encoder structure
3694
 * \param[in]    size            Bitstream size
3695
 * \param[out]   dest            Bitstream output buffer
3696
 * \param[in]    dest_size       Bitstream output buffer size
3697
 * \param[in]    sse             Total distortion of the frame
3698
 * \param[in]    rate            Total rate of the frame
3699
 * \param[in]    largest_tile_id Tile id of the last tile
3700
 *
3701
 * \return Returns a value to indicate if the encoding is done successfully.
3702
 * \retval #AOM_CODEC_OK
3703
 * \retval #AOM_CODEC_ERROR
3704
 */
3705
static int encode_with_recode_loop_and_filter(AV1_COMP *cpi, size_t *size,
3706
                                              uint8_t *dest, size_t dest_size,
3707
                                              int64_t *sse, int64_t *rate,
3708
0
                                              int *largest_tile_id) {
3709
#if CONFIG_COLLECT_COMPONENT_TIMING
3710
  start_timing(cpi, encode_with_or_without_recode_time);
3711
#endif
3712
0
  for (int i = 0; i < NUM_RECODES_PER_FRAME; i++) {
3713
0
    cpi->do_update_frame_probs_txtype[i] = 0;
3714
0
    cpi->do_update_frame_probs_obmc[i] = 0;
3715
0
    cpi->do_update_frame_probs_warp[i] = 0;
3716
0
    cpi->do_update_frame_probs_interpfilter[i] = 0;
3717
0
  }
3718
3719
0
  cpi->do_update_vbr_bits_off_target_fast = 0;
3720
0
  int err;
3721
#if CONFIG_REALTIME_ONLY
3722
  err = encode_without_recode(cpi);
3723
#else
3724
0
  if (cpi->sf.hl_sf.recode_loop == DISALLOW_RECODE)
3725
0
    err = encode_without_recode(cpi);
3726
0
  else
3727
0
    err = encode_with_recode_loop(cpi, size, dest, dest_size);
3728
0
#endif
3729
#if CONFIG_COLLECT_COMPONENT_TIMING
3730
  end_timing(cpi, encode_with_or_without_recode_time);
3731
#endif
3732
0
  if (err != AOM_CODEC_OK) {
3733
0
    if (err == -1) {
3734
      // special case as described in encode_with_recode_loop().
3735
      // Encoding was skipped.
3736
0
      err = AOM_CODEC_OK;
3737
0
      if (sse != NULL) *sse = INT64_MAX;
3738
0
      if (rate != NULL) *rate = INT64_MAX;
3739
0
      *largest_tile_id = 0;
3740
0
    }
3741
0
    return err;
3742
0
  }
3743
3744
#ifdef OUTPUT_YUV_DENOISED
3745
  const AV1EncoderConfig *const oxcf = &cpi->oxcf;
3746
  if (oxcf->noise_sensitivity > 0 && denoise_svc(cpi)) {
3747
    aom_write_yuv_frame(yuv_denoised_file,
3748
                        &cpi->denoiser.running_avg_y[INTRA_FRAME]);
3749
  }
3750
#endif
3751
3752
0
  AV1_COMMON *const cm = &cpi->common;
3753
0
  SequenceHeader *const seq_params = cm->seq_params;
3754
3755
  // Special case code to reduce pulsing when key frames are forced at a
3756
  // fixed interval. Note the reconstruction error if it is the frame before
3757
  // the force key frame
3758
0
  if (cpi->ppi->p_rc.next_key_frame_forced && cpi->rc.frames_to_key == 1) {
3759
0
#if CONFIG_AV1_HIGHBITDEPTH
3760
0
    if (seq_params->use_highbitdepth) {
3761
0
      cpi->ambient_err = aom_highbd_get_y_sse(cpi->source, &cm->cur_frame->buf);
3762
0
    } else {
3763
0
      cpi->ambient_err = aom_get_y_sse(cpi->source, &cm->cur_frame->buf);
3764
0
    }
3765
#else
3766
    cpi->ambient_err = aom_get_y_sse(cpi->source, &cm->cur_frame->buf);
3767
#endif
3768
0
  }
3769
3770
0
  cm->cur_frame->buf.color_primaries = seq_params->color_primaries;
3771
0
  cm->cur_frame->buf.transfer_characteristics =
3772
0
      seq_params->transfer_characteristics;
3773
0
  cm->cur_frame->buf.matrix_coefficients = seq_params->matrix_coefficients;
3774
0
  cm->cur_frame->buf.monochrome = seq_params->monochrome;
3775
0
  cm->cur_frame->buf.chroma_sample_position =
3776
0
      seq_params->chroma_sample_position;
3777
0
  cm->cur_frame->buf.color_range = seq_params->color_range;
3778
0
  cm->cur_frame->buf.render_width = cm->render_width;
3779
0
  cm->cur_frame->buf.render_height = cm->render_height;
3780
3781
0
  if (!cpi->mt_info.pipeline_lpf_mt_with_enc)
3782
0
    set_postproc_filter_default_params(&cpi->common);
3783
3784
0
  if (!cm->features.allow_intrabc) {
3785
0
    loopfilter_frame(cpi, cm);
3786
0
  }
3787
3788
0
  if (cpi->oxcf.mode != ALLINTRA && !cpi->ppi->rtc_ref.non_reference_frame) {
3789
0
    extend_frame_borders(cpi);
3790
0
  }
3791
3792
#ifdef OUTPUT_YUV_REC
3793
  aom_write_one_yuv_frame(cm, &cm->cur_frame->buf);
3794
#endif
3795
3796
0
  if (cpi->oxcf.tune_cfg.content == AOM_CONTENT_FILM) {
3797
0
    set_grain_syn_params(cm);
3798
0
  }
3799
3800
0
  av1_finalize_encoded_frame(cpi);
3801
  // Build the bitstream
3802
#if CONFIG_COLLECT_COMPONENT_TIMING
3803
  start_timing(cpi, av1_pack_bitstream_final_time);
3804
#endif
3805
0
  cpi->rc.coefficient_size = 0;
3806
0
  if (av1_pack_bitstream(cpi, dest, dest_size, size, largest_tile_id) !=
3807
0
      AOM_CODEC_OK)
3808
0
    return AOM_CODEC_ERROR;
3809
#if CONFIG_COLLECT_COMPONENT_TIMING
3810
  end_timing(cpi, av1_pack_bitstream_final_time);
3811
#endif
3812
3813
0
  if (cpi->rc.postencode_drop && allow_postencode_drop_rtc(cpi) &&
3814
0
      av1_postencode_drop_cbr(cpi, size)) {
3815
0
    return AOM_CODEC_OK;
3816
0
  }
3817
3818
  // Compute sse and rate.
3819
0
  if (sse != NULL) {
3820
0
#if CONFIG_AV1_HIGHBITDEPTH
3821
0
    *sse = (seq_params->use_highbitdepth)
3822
0
               ? aom_highbd_get_y_sse(cpi->source, &cm->cur_frame->buf)
3823
0
               : aom_get_y_sse(cpi->source, &cm->cur_frame->buf);
3824
#else
3825
    *sse = aom_get_y_sse(cpi->source, &cm->cur_frame->buf);
3826
#endif
3827
0
  }
3828
0
  if (rate != NULL) {
3829
0
    const int64_t bits = (*size << 3);
3830
0
    *rate = (bits << 5);  // To match scale.
3831
0
  }
3832
3833
0
#if !CONFIG_REALTIME_ONLY
3834
0
  if (cpi->use_ducky_encode) {
3835
0
    PSNR_STATS psnr;
3836
0
    aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr);
3837
0
    DuckyEncodeFrameResult *frame_result = &cpi->ducky_encode_info.frame_result;
3838
0
    frame_result->global_order_idx = cm->cur_frame->display_order_hint;
3839
0
    frame_result->q_index = cm->quant_params.base_qindex;
3840
0
    frame_result->rdmult = cpi->rd.RDMULT;
3841
0
    frame_result->rate = (int)(*size) * 8;
3842
0
    frame_result->dist = psnr.sse[0];
3843
0
    frame_result->psnr = psnr.psnr[0];
3844
0
  }
3845
0
#endif  // !CONFIG_REALTIME_ONLY
3846
3847
0
  return AOM_CODEC_OK;
3848
0
}
3849
3850
static int encode_with_and_without_superres(AV1_COMP *cpi, size_t *size,
3851
                                            uint8_t *dest, size_t dest_size,
3852
0
                                            int *largest_tile_id) {
3853
0
  const AV1_COMMON *const cm = &cpi->common;
3854
0
  assert(cm->seq_params->enable_superres);
3855
0
  assert(av1_superres_in_recode_allowed(cpi));
3856
0
  aom_codec_err_t err = AOM_CODEC_OK;
3857
0
  av1_save_all_coding_context(cpi);
3858
3859
0
  int64_t sse1 = INT64_MAX;
3860
0
  int64_t rate1 = INT64_MAX;
3861
0
  int largest_tile_id1 = 0;
3862
0
  int64_t sse2 = INT64_MAX;
3863
0
  int64_t rate2 = INT64_MAX;
3864
0
  int largest_tile_id2;
3865
0
  double proj_rdcost1 = DBL_MAX;
3866
0
  const GF_GROUP *const gf_group = &cpi->ppi->gf_group;
3867
0
  const FRAME_UPDATE_TYPE update_type =
3868
0
      gf_group->update_type[cpi->gf_frame_index];
3869
0
  const aom_bit_depth_t bit_depth = cm->seq_params->bit_depth;
3870
3871
  // Encode with superres.
3872
0
  if (cpi->sf.hl_sf.superres_auto_search_type == SUPERRES_AUTO_ALL) {
3873
0
    SuperResCfg *const superres_cfg = &cpi->oxcf.superres_cfg;
3874
0
    int64_t superres_sses[SCALE_NUMERATOR];
3875
0
    int64_t superres_rates[SCALE_NUMERATOR];
3876
0
    int superres_largest_tile_ids[SCALE_NUMERATOR];
3877
    // Use superres for Key-frames and Alt-ref frames only.
3878
0
    if (update_type != OVERLAY_UPDATE && update_type != INTNL_OVERLAY_UPDATE) {
3879
0
      for (int denom = SCALE_NUMERATOR + 1; denom <= 2 * SCALE_NUMERATOR;
3880
0
           ++denom) {
3881
0
        superres_cfg->superres_scale_denominator = denom;
3882
0
        superres_cfg->superres_kf_scale_denominator = denom;
3883
0
        const int this_index = denom - (SCALE_NUMERATOR + 1);
3884
3885
0
        cpi->superres_mode = AOM_SUPERRES_AUTO;  // Super-res on for this loop.
3886
0
        err = encode_with_recode_loop_and_filter(
3887
0
            cpi, size, dest, dest_size, &superres_sses[this_index],
3888
0
            &superres_rates[this_index],
3889
0
            &superres_largest_tile_ids[this_index]);
3890
0
        cpi->superres_mode = AOM_SUPERRES_NONE;  // Reset to default (full-res).
3891
0
        if (err != AOM_CODEC_OK) return err;
3892
0
        restore_all_coding_context(cpi);
3893
0
      }
3894
      // Reset.
3895
0
      superres_cfg->superres_scale_denominator = SCALE_NUMERATOR;
3896
0
      superres_cfg->superres_kf_scale_denominator = SCALE_NUMERATOR;
3897
0
    } else {
3898
0
      for (int denom = SCALE_NUMERATOR + 1; denom <= 2 * SCALE_NUMERATOR;
3899
0
           ++denom) {
3900
0
        const int this_index = denom - (SCALE_NUMERATOR + 1);
3901
0
        superres_sses[this_index] = INT64_MAX;
3902
0
        superres_rates[this_index] = INT64_MAX;
3903
0
        superres_largest_tile_ids[this_index] = 0;
3904
0
      }
3905
0
    }
3906
    // Encode without superres.
3907
0
    assert(cpi->superres_mode == AOM_SUPERRES_NONE);
3908
0
    err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, &sse2,
3909
0
                                             &rate2, &largest_tile_id2);
3910
0
    if (err != AOM_CODEC_OK) return err;
3911
3912
    // Note: Both use common rdmult based on base qindex of fullres.
3913
0
    const int64_t rdmult = av1_compute_rd_mult_based_on_qindex(
3914
0
        bit_depth, update_type, cm->quant_params.base_qindex,
3915
0
        cpi->oxcf.tune_cfg.tuning, cpi->oxcf.mode);
3916
3917
    // Find the best rdcost among all superres denoms.
3918
0
    int best_denom = -1;
3919
0
    for (int denom = SCALE_NUMERATOR + 1; denom <= 2 * SCALE_NUMERATOR;
3920
0
         ++denom) {
3921
0
      const int this_index = denom - (SCALE_NUMERATOR + 1);
3922
0
      const int64_t this_sse = superres_sses[this_index];
3923
0
      const int64_t this_rate = superres_rates[this_index];
3924
0
      const int this_largest_tile_id = superres_largest_tile_ids[this_index];
3925
0
      const double this_rdcost = RDCOST_DBL_WITH_NATIVE_BD_DIST(
3926
0
          rdmult, this_rate, this_sse, bit_depth);
3927
0
      if (this_rdcost < proj_rdcost1) {
3928
0
        sse1 = this_sse;
3929
0
        rate1 = this_rate;
3930
0
        largest_tile_id1 = this_largest_tile_id;
3931
0
        proj_rdcost1 = this_rdcost;
3932
0
        best_denom = denom;
3933
0
      }
3934
0
    }
3935
0
    const double proj_rdcost2 =
3936
0
        RDCOST_DBL_WITH_NATIVE_BD_DIST(rdmult, rate2, sse2, bit_depth);
3937
    // Re-encode with superres if it's better.
3938
0
    if (proj_rdcost1 < proj_rdcost2) {
3939
0
      restore_all_coding_context(cpi);
3940
      // TODO(urvang): We should avoid rerunning the recode loop by saving
3941
      // previous output+state, or running encode only for the selected 'q' in
3942
      // previous step.
3943
      // Again, temporarily force the best denom.
3944
0
      superres_cfg->superres_scale_denominator = best_denom;
3945
0
      superres_cfg->superres_kf_scale_denominator = best_denom;
3946
0
      int64_t sse3 = INT64_MAX;
3947
0
      int64_t rate3 = INT64_MAX;
3948
0
      cpi->superres_mode =
3949
0
          AOM_SUPERRES_AUTO;  // Super-res on for this recode loop.
3950
0
      err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size,
3951
0
                                               &sse3, &rate3, largest_tile_id);
3952
0
      cpi->superres_mode = AOM_SUPERRES_NONE;  // Reset to default (full-res).
3953
0
      assert(sse1 == sse3);
3954
0
      assert(rate1 == rate3);
3955
0
      assert(largest_tile_id1 == *largest_tile_id);
3956
      // Reset.
3957
0
      superres_cfg->superres_scale_denominator = SCALE_NUMERATOR;
3958
0
      superres_cfg->superres_kf_scale_denominator = SCALE_NUMERATOR;
3959
0
    } else {
3960
0
      *largest_tile_id = largest_tile_id2;
3961
0
    }
3962
0
  } else {
3963
0
    assert(cpi->sf.hl_sf.superres_auto_search_type == SUPERRES_AUTO_DUAL);
3964
0
    cpi->superres_mode =
3965
0
        AOM_SUPERRES_AUTO;  // Super-res on for this recode loop.
3966
0
    err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, &sse1,
3967
0
                                             &rate1, &largest_tile_id1);
3968
0
    cpi->superres_mode = AOM_SUPERRES_NONE;  // Reset to default (full-res).
3969
0
    if (err != AOM_CODEC_OK) return err;
3970
0
    restore_all_coding_context(cpi);
3971
    // Encode without superres.
3972
0
    assert(cpi->superres_mode == AOM_SUPERRES_NONE);
3973
0
    err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, &sse2,
3974
0
                                             &rate2, &largest_tile_id2);
3975
0
    if (err != AOM_CODEC_OK) return err;
3976
3977
    // Note: Both use common rdmult based on base qindex of fullres.
3978
0
    const int64_t rdmult = av1_compute_rd_mult_based_on_qindex(
3979
0
        bit_depth, update_type, cm->quant_params.base_qindex,
3980
0
        cpi->oxcf.tune_cfg.tuning, cpi->oxcf.mode);
3981
0
    proj_rdcost1 =
3982
0
        RDCOST_DBL_WITH_NATIVE_BD_DIST(rdmult, rate1, sse1, bit_depth);
3983
0
    const double proj_rdcost2 =
3984
0
        RDCOST_DBL_WITH_NATIVE_BD_DIST(rdmult, rate2, sse2, bit_depth);
3985
    // Re-encode with superres if it's better.
3986
0
    if (proj_rdcost1 < proj_rdcost2) {
3987
0
      restore_all_coding_context(cpi);
3988
      // TODO(urvang): We should avoid rerunning the recode loop by saving
3989
      // previous output+state, or running encode only for the selected 'q' in
3990
      // previous step.
3991
0
      int64_t sse3 = INT64_MAX;
3992
0
      int64_t rate3 = INT64_MAX;
3993
0
      cpi->superres_mode =
3994
0
          AOM_SUPERRES_AUTO;  // Super-res on for this recode loop.
3995
0
      err = encode_with_recode_loop_and_filter(cpi, size, dest, dest_size,
3996
0
                                               &sse3, &rate3, largest_tile_id);
3997
0
      cpi->superres_mode = AOM_SUPERRES_NONE;  // Reset to default (full-res).
3998
0
      assert(sse1 == sse3);
3999
0
      assert(rate1 == rate3);
4000
0
      assert(largest_tile_id1 == *largest_tile_id);
4001
0
    } else {
4002
0
      *largest_tile_id = largest_tile_id2;
4003
0
    }
4004
0
  }
4005
4006
0
  return err;
4007
0
}
4008
4009
// Conditions to disable cdf_update mode in selective mode for real-time.
4010
// Handle case for layers, scene change, and resizing.
4011
0
static inline int selective_disable_cdf_rtc(const AV1_COMP *cpi) {
4012
0
  const AV1_COMMON *const cm = &cpi->common;
4013
0
  const RATE_CONTROL *const rc = &cpi->rc;
4014
  // For single layer.
4015
0
  if (cpi->svc.number_spatial_layers == 1 &&
4016
0
      cpi->svc.number_temporal_layers == 1) {
4017
    // Don't disable on intra_only, scene change (high_source_sad = 1),
4018
    // or resized frame. To avoid quality loss force enable at
4019
    // for ~30 frames after key or scene/slide change, and
4020
    // after 8 frames since last update if frame_source_sad > 0.
4021
0
    if (frame_is_intra_only(cm) || is_frame_resize_pending(cpi) ||
4022
0
        rc->high_source_sad || rc->frames_since_key < 30 ||
4023
0
        (cpi->oxcf.q_cfg.aq_mode == CYCLIC_REFRESH_AQ &&
4024
0
         cpi->cyclic_refresh->counter_encode_maxq_scene_change < 30) ||
4025
0
        (cpi->frames_since_last_update > 8 && cpi->rc.frame_source_sad > 0))
4026
0
      return 0;
4027
0
    else
4028
0
      return 1;
4029
0
  } else if (cpi->svc.number_temporal_layers > 1) {
4030
    // Disable only on top temporal enhancement layer for now.
4031
0
    return cpi->svc.temporal_layer_id == cpi->svc.number_temporal_layers - 1;
4032
0
  }
4033
0
  return 1;
4034
0
}
4035
4036
#if !CONFIG_REALTIME_ONLY
4037
static void subtract_stats(FIRSTPASS_STATS *section,
4038
0
                           const FIRSTPASS_STATS *frame) {
4039
0
  section->frame -= frame->frame;
4040
0
  section->weight -= frame->weight;
4041
0
  section->intra_error -= frame->intra_error;
4042
0
  section->frame_avg_wavelet_energy -= frame->frame_avg_wavelet_energy;
4043
0
  section->coded_error -= frame->coded_error;
4044
0
  section->sr_coded_error -= frame->sr_coded_error;
4045
0
  section->lt_coded_error -= frame->lt_coded_error;
4046
0
  section->pcnt_inter -= frame->pcnt_inter;
4047
0
  section->pcnt_motion -= frame->pcnt_motion;
4048
0
  section->pcnt_second_ref -= frame->pcnt_second_ref;
4049
0
  section->pcnt_neutral -= frame->pcnt_neutral;
4050
0
  section->intra_skip_pct -= frame->intra_skip_pct;
4051
0
  section->inactive_zone_rows -= frame->inactive_zone_rows;
4052
0
  section->inactive_zone_cols -= frame->inactive_zone_cols;
4053
0
  section->MVr -= frame->MVr;
4054
0
  section->mvr_abs -= frame->mvr_abs;
4055
0
  section->MVc -= frame->MVc;
4056
0
  section->mvc_abs -= frame->mvc_abs;
4057
0
  section->MVrv -= frame->MVrv;
4058
0
  section->MVcv -= frame->MVcv;
4059
0
  section->mv_in_out_count -= frame->mv_in_out_count;
4060
0
  section->new_mv_count -= frame->new_mv_count;
4061
0
  section->count -= frame->count;
4062
0
  section->duration -= frame->duration;
4063
0
}
4064
4065
0
static void calculate_frame_avg_haar_energy(AV1_COMP *cpi) {
4066
0
  TWO_PASS *const twopass = &cpi->ppi->twopass;
4067
0
  const FIRSTPASS_STATS *const total_stats =
4068
0
      twopass->stats_buf_ctx->total_stats;
4069
4070
0
  if (is_one_pass_rt_params(cpi) ||
4071
0
      (cpi->oxcf.q_cfg.deltaq_mode != DELTA_Q_PERCEPTUAL) ||
4072
0
      (is_fp_wavelet_energy_invalid(total_stats) == 0))
4073
0
    return;
4074
4075
0
  const int num_mbs = (cpi->oxcf.resize_cfg.resize_mode != RESIZE_NONE)
4076
0
                          ? cpi->initial_mbs
4077
0
                          : cpi->common.mi_params.MBs;
4078
0
  const YV12_BUFFER_CONFIG *const unfiltered_source = cpi->unfiltered_source;
4079
0
  const uint8_t *const src = unfiltered_source->y_buffer;
4080
0
  const int hbd = unfiltered_source->flags & YV12_FLAG_HIGHBITDEPTH;
4081
0
  const int stride = unfiltered_source->y_stride;
4082
0
  const BLOCK_SIZE fp_block_size =
4083
0
      get_fp_block_size(cpi->is_screen_content_type);
4084
0
  const int fp_block_size_width = block_size_wide[fp_block_size];
4085
0
  const int fp_block_size_height = block_size_high[fp_block_size];
4086
0
  const int num_unit_cols =
4087
0
      get_num_blocks(unfiltered_source->y_crop_width, fp_block_size_width);
4088
0
  const int num_unit_rows =
4089
0
      get_num_blocks(unfiltered_source->y_crop_height, fp_block_size_height);
4090
0
  const int num_8x8_cols = num_unit_cols * (fp_block_size_width / 8);
4091
0
  const int num_8x8_rows = num_unit_rows * (fp_block_size_height / 8);
4092
0
  int64_t frame_avg_wavelet_energy = av1_haar_ac_sad_mxn_uint8_input(
4093
0
      src, stride, hbd, num_8x8_rows, num_8x8_cols);
4094
4095
0
  cpi->twopass_frame.frame_avg_haar_energy =
4096
0
      log1p((double)frame_avg_wavelet_energy / num_mbs);
4097
0
}
4098
#endif
4099
4100
/*!\brief Run the final pass encoding for 1-pass/2-pass encoding mode, and pack
4101
 * the bitstream
4102
 *
4103
 * \ingroup high_level_algo
4104
 * \callgraph
4105
 * \callergraph
4106
 *
4107
 * \param[in]    cpi             Top-level encoder structure
4108
 * \param[in]    size            Bitstream size
4109
 * \param[out]   dest            Bitstream output buffer
4110
 * \param[in]    dest_size       Bitstream output buffer size
4111
 *
4112
 * \return Returns a value to indicate if the encoding is done successfully.
4113
 * \retval #AOM_CODEC_OK
4114
 * \retval #AOM_CODEC_ERROR
4115
 */
4116
static int encode_frame_to_data_rate(AV1_COMP *cpi, size_t *size, uint8_t *dest,
4117
0
                                     size_t dest_size) {
4118
0
  AV1_COMMON *const cm = &cpi->common;
4119
0
  SequenceHeader *const seq_params = cm->seq_params;
4120
0
  CurrentFrame *const current_frame = &cm->current_frame;
4121
0
  const AV1EncoderConfig *const oxcf = &cpi->oxcf;
4122
0
  struct segmentation *const seg = &cm->seg;
4123
0
  FeatureFlags *const features = &cm->features;
4124
0
  const TileConfig *const tile_cfg = &oxcf->tile_cfg;
4125
0
  assert(cpi->source != NULL);
4126
0
  cpi->td.mb.e_mbd.cur_buf = cpi->source;
4127
4128
#if CONFIG_COLLECT_COMPONENT_TIMING
4129
  start_timing(cpi, encode_frame_to_data_rate_time);
4130
#endif
4131
4132
0
#if !CONFIG_REALTIME_ONLY
4133
0
  calculate_frame_avg_haar_energy(cpi);
4134
0
#endif
4135
4136
  // frame type has been decided outside of this function call
4137
0
  cm->cur_frame->frame_type = current_frame->frame_type;
4138
4139
0
  cm->tiles.large_scale = tile_cfg->enable_large_scale_tile;
4140
0
  cm->tiles.single_tile_decoding = tile_cfg->enable_single_tile_decoding;
4141
4142
0
  features->allow_ref_frame_mvs &= frame_might_allow_ref_frame_mvs(cm);
4143
  // features->allow_ref_frame_mvs needs to be written into the frame header
4144
  // while cm->tiles.large_scale is 1, therefore, "cm->tiles.large_scale=1" case
4145
  // is separated from frame_might_allow_ref_frame_mvs().
4146
0
  features->allow_ref_frame_mvs &= !cm->tiles.large_scale;
4147
4148
0
  features->allow_warped_motion = oxcf->motion_mode_cfg.allow_warped_motion &&
4149
0
                                  frame_might_allow_warped_motion(cm);
4150
4151
0
  cpi->last_frame_type = current_frame->frame_type;
4152
4153
0
  if (frame_is_intra_only(cm)) {
4154
0
    cpi->frames_since_last_update = 0;
4155
0
  }
4156
4157
0
  if (frame_is_sframe(cm)) {
4158
0
    GF_GROUP *gf_group = &cpi->ppi->gf_group;
4159
    // S frame will wipe out any previously encoded altref so we cannot place
4160
    // an overlay frame
4161
0
    gf_group->update_type[gf_group->size] = GF_UPDATE;
4162
0
  }
4163
4164
0
  if (encode_show_existing_frame(cm)) {
4165
#if CONFIG_RATECTRL_LOG && CONFIG_THREE_PASS && CONFIG_BITRATE_ACCURACY
4166
    // TODO(angiebird): Move this into a function.
4167
    if (oxcf->pass == AOM_RC_THIRD_PASS) {
4168
      int frame_coding_idx =
4169
          av1_vbr_rc_frame_coding_idx(&cpi->vbr_rc_info, cpi->gf_frame_index);
4170
      rc_log_frame_encode_param(
4171
          &cpi->rc_log, frame_coding_idx, 1, 255,
4172
          cpi->ppi->gf_group.update_type[cpi->gf_frame_index]);
4173
    }
4174
#endif
4175
0
    av1_finalize_encoded_frame(cpi);
4176
    // Build the bitstream
4177
0
    int largest_tile_id = 0;  // Output from bitstream: unused here
4178
0
    cpi->rc.coefficient_size = 0;
4179
0
    if (av1_pack_bitstream(cpi, dest, dest_size, size, &largest_tile_id) !=
4180
0
        AOM_CODEC_OK)
4181
0
      return AOM_CODEC_ERROR;
4182
4183
0
    if (seq_params->frame_id_numbers_present_flag &&
4184
0
        current_frame->frame_type == KEY_FRAME) {
4185
      // Displaying a forward key-frame, so reset the ref buffer IDs
4186
0
      int display_frame_id = cm->ref_frame_id[cpi->existing_fb_idx_to_show];
4187
0
      for (int i = 0; i < REF_FRAMES; i++)
4188
0
        cm->ref_frame_id[i] = display_frame_id;
4189
0
    }
4190
4191
#if DUMP_RECON_FRAMES == 1
4192
    // NOTE(zoeliu): For debug - Output the filtered reconstructed video.
4193
    av1_dump_filtered_recon_frames(cpi);
4194
#endif  // DUMP_RECON_FRAMES
4195
4196
    // NOTE: Save the new show frame buffer index for --test-code=warn, i.e.,
4197
    //       for the purpose to verify no mismatch between encoder and decoder.
4198
0
    if (cm->show_frame) cpi->last_show_frame_buf = cm->cur_frame;
4199
4200
#if CONFIG_AV1_TEMPORAL_DENOISING
4201
    av1_denoiser_update_ref_frame(cpi);
4202
#endif
4203
4204
    // Since we allocate a spot for the OVERLAY frame in the gf group, we need
4205
    // to do post-encoding update accordingly.
4206
0
    av1_set_target_rate(cpi, cm->width, cm->height);
4207
4208
0
    if (is_psnr_calc_enabled(cpi)) {
4209
0
      cpi->source =
4210
0
          realloc_and_scale_source(cpi, cm->cur_frame->buf.y_crop_width,
4211
0
                                   cm->cur_frame->buf.y_crop_height);
4212
0
    }
4213
4214
0
#if !CONFIG_REALTIME_ONLY
4215
0
    if (cpi->use_ducky_encode) {
4216
0
      PSNR_STATS psnr;
4217
0
      aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr);
4218
0
      DuckyEncodeFrameResult *frame_result =
4219
0
          &cpi->ducky_encode_info.frame_result;
4220
0
      frame_result->global_order_idx = cm->cur_frame->display_order_hint;
4221
0
      frame_result->q_index = cm->quant_params.base_qindex;
4222
0
      frame_result->rdmult = cpi->rd.RDMULT;
4223
0
      frame_result->rate = (int)(*size) * 8;
4224
0
      frame_result->dist = psnr.sse[0];
4225
0
      frame_result->psnr = psnr.psnr[0];
4226
0
    }
4227
0
#endif  // !CONFIG_REALTIME_ONLY
4228
4229
0
    update_counters_for_show_frame(cpi);
4230
0
    return AOM_CODEC_OK;
4231
0
  }
4232
4233
  // Work out whether to force_integer_mv this frame
4234
0
  if (!is_stat_generation_stage(cpi) &&
4235
0
      cpi->common.features.allow_screen_content_tools &&
4236
0
      !frame_is_intra_only(cm) && !cpi->sf.rt_sf.use_nonrd_pick_mode) {
4237
0
    if (cpi->common.seq_params->force_integer_mv == 2) {
4238
      // Adaptive mode: see what previous frame encoded did
4239
0
      if (cpi->unscaled_last_source != NULL) {
4240
0
        features->cur_frame_force_integer_mv = av1_is_integer_mv(
4241
0
            cpi->source, cpi->unscaled_last_source, &cpi->force_intpel_info);
4242
0
      } else {
4243
0
        cpi->common.features.cur_frame_force_integer_mv = 0;
4244
0
      }
4245
0
    } else {
4246
0
      cpi->common.features.cur_frame_force_integer_mv =
4247
0
          cpi->common.seq_params->force_integer_mv;
4248
0
    }
4249
0
  } else {
4250
0
    cpi->common.features.cur_frame_force_integer_mv = 0;
4251
0
  }
4252
4253
  // This is used by av1_pack_bitstream. So this needs to be set in case of
4254
  // row-mt where the encoding code will use a temporary structure.
4255
0
  cpi->td.mb.e_mbd.cur_frame_force_integer_mv =
4256
0
      cpi->common.features.cur_frame_force_integer_mv;
4257
4258
  // Set default state for segment based loop filter update flags.
4259
0
  cm->lf.mode_ref_delta_update = 0;
4260
4261
  // Set various flags etc to special state if it is a key frame.
4262
0
  if (frame_is_intra_only(cm) || frame_is_sframe(cm)) {
4263
    // Reset the loop filter deltas and segmentation map.
4264
0
    av1_reset_segment_features(cm);
4265
4266
    // If segmentation is enabled force a map update for key frames.
4267
0
    if (seg->enabled) {
4268
0
      seg->update_map = 1;
4269
0
      seg->update_data = 1;
4270
0
    }
4271
0
  }
4272
0
  if (tile_cfg->mtu == 0) {
4273
0
    cpi->num_tg = tile_cfg->num_tile_groups;
4274
0
  } else {
4275
    // Use a default value for the purposes of weighting costs in probability
4276
    // updates
4277
0
    cpi->num_tg = DEFAULT_MAX_NUM_TG;
4278
0
  }
4279
4280
  // For 1 pass CBR mode: check if we are dropping this frame.
4281
0
  if (has_no_stats_stage(cpi) && oxcf->rc_cfg.mode == AOM_CBR) {
4282
    // Always drop for spatial enhancement layer if layer bandwidth is 0.
4283
    // Otherwise check for frame-dropping based on buffer level in
4284
    // av1_rc_drop_frame().
4285
0
    if ((cpi->svc.spatial_layer_id > 0 &&
4286
0
         cpi->oxcf.rc_cfg.target_bandwidth == 0) ||
4287
0
        av1_rc_drop_frame(cpi)) {
4288
0
      cpi->is_dropped_frame = true;
4289
0
    }
4290
0
    if (cpi->is_dropped_frame) {
4291
0
      av1_setup_frame_size(cpi);
4292
0
      av1_set_mv_search_params(cpi);
4293
0
      av1_rc_postencode_update_drop_frame(cpi);
4294
0
      release_scaled_references(cpi);
4295
0
      cpi->ppi->gf_group.is_frame_dropped[cpi->gf_frame_index] = true;
4296
      // A dropped frame might not be shown but it always takes a slot in the gf
4297
      // group. Therefore, even when it is not shown, we still need to update
4298
      // the relevant frame counters.
4299
0
      if (cm->show_frame) {
4300
0
        update_counters_for_show_frame(cpi);
4301
0
      }
4302
0
      return AOM_CODEC_OK;
4303
0
    }
4304
0
  }
4305
4306
0
  if (oxcf->tune_cfg.tuning == AOM_TUNE_SSIM ||
4307
0
      oxcf->tune_cfg.tuning == AOM_TUNE_IQ ||
4308
0
      oxcf->tune_cfg.tuning == AOM_TUNE_SSIMULACRA2) {
4309
0
    av1_set_mb_ssim_rdmult_scaling(cpi);
4310
0
  }
4311
#if CONFIG_SALIENCY_MAP
4312
  else if (oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_SALIENCY_MAP &&
4313
           !(cpi->source->flags & YV12_FLAG_HIGHBITDEPTH)) {
4314
    if (av1_set_saliency_map(cpi) == 0) {
4315
      return AOM_CODEC_MEM_ERROR;
4316
    }
4317
#if !CONFIG_REALTIME_ONLY
4318
    double motion_ratio = av1_setup_motion_ratio(cpi);
4319
#else
4320
    double motion_ratio = 1.0;
4321
#endif
4322
    if (av1_setup_sm_rdmult_scaling_factor(cpi, motion_ratio) == 0) {
4323
      return AOM_CODEC_MEM_ERROR;
4324
    }
4325
  }
4326
#endif
4327
#if CONFIG_TUNE_VMAF
4328
  else if (oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_WITHOUT_PREPROCESSING ||
4329
           oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_MAX_GAIN ||
4330
           oxcf->tune_cfg.tuning == AOM_TUNE_VMAF_NEG_MAX_GAIN) {
4331
    av1_set_mb_vmaf_rdmult_scaling(cpi);
4332
  }
4333
#endif
4334
4335
0
  if (cpi->oxcf.q_cfg.deltaq_mode == DELTA_Q_PERCEPTUAL_AI &&
4336
0
      cpi->sf.rt_sf.use_nonrd_pick_mode == 0) {
4337
0
    av1_init_mb_wiener_var_buffer(cpi);
4338
0
    av1_set_mb_wiener_variance(cpi);
4339
0
  }
4340
4341
0
  if (cpi->oxcf.q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED) {
4342
0
    av1_init_mb_ur_var_buffer(cpi);
4343
0
    av1_set_mb_ur_variance(cpi);
4344
0
  }
4345
4346
#if CONFIG_INTERNAL_STATS
4347
  memset(cpi->mode_chosen_counts, 0,
4348
         MAX_MODES * sizeof(*cpi->mode_chosen_counts));
4349
#endif
4350
4351
0
  if (seq_params->frame_id_numbers_present_flag) {
4352
    /* Non-normative definition of current_frame_id ("frame counter" with
4353
     * wraparound) */
4354
0
    if (cm->current_frame_id == -1) {
4355
0
      int lsb, msb;
4356
      /* quasi-random initialization of current_frame_id for a key frame */
4357
0
      if (cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) {
4358
0
        lsb = CONVERT_TO_SHORTPTR(cpi->source->y_buffer)[0] & 0xff;
4359
0
        msb = CONVERT_TO_SHORTPTR(cpi->source->y_buffer)[1] & 0xff;
4360
0
      } else {
4361
0
        lsb = cpi->source->y_buffer[0] & 0xff;
4362
0
        msb = cpi->source->y_buffer[1] & 0xff;
4363
0
      }
4364
0
      cm->current_frame_id =
4365
0
          ((msb << 8) + lsb) % (1 << seq_params->frame_id_length);
4366
4367
      // S_frame is meant for stitching different streams of different
4368
      // resolutions together, so current_frame_id must be the
4369
      // same across different streams of the same content current_frame_id
4370
      // should be the same and not random. 0x37 is a chosen number as start
4371
      // point
4372
0
      if (oxcf->kf_cfg.sframe_dist != 0) cm->current_frame_id = 0x37;
4373
0
    } else {
4374
0
      cm->current_frame_id =
4375
0
          (cm->current_frame_id + 1 + (1 << seq_params->frame_id_length)) %
4376
0
          (1 << seq_params->frame_id_length);
4377
0
    }
4378
0
  }
4379
4380
0
  switch (oxcf->algo_cfg.cdf_update_mode) {
4381
0
    case 0:  // No CDF update for any frames(4~6% compression loss).
4382
0
      features->disable_cdf_update = 1;
4383
0
      break;
4384
0
    case 1:  // Enable CDF update for all frames.
4385
0
      if (cpi->sf.rt_sf.disable_cdf_update_non_reference_frame &&
4386
0
          cpi->ppi->rtc_ref.non_reference_frame && cpi->rc.frames_since_key > 2)
4387
0
        features->disable_cdf_update = 1;
4388
0
      else if (cpi->sf.rt_sf.selective_cdf_update)
4389
0
        features->disable_cdf_update = selective_disable_cdf_rtc(cpi);
4390
0
      else
4391
0
        features->disable_cdf_update = 0;
4392
0
      break;
4393
0
    case 2:
4394
      // Strategically determine at which frames to do CDF update.
4395
      // Currently only enable CDF update for all-intra and no-show frames(1.5%
4396
      // compression loss) for good qualiy or allintra mode.
4397
0
      if (oxcf->mode == GOOD || oxcf->mode == ALLINTRA) {
4398
0
        features->disable_cdf_update =
4399
0
            (frame_is_intra_only(cm) || !cm->show_frame) ? 0 : 1;
4400
0
      } else {
4401
0
        features->disable_cdf_update = selective_disable_cdf_rtc(cpi);
4402
0
      }
4403
0
      break;
4404
0
  }
4405
4406
  // Disable cdf update for the INTNL_ARF_UPDATE frame with
4407
  // frame_parallel_level 1.
4408
0
  if (!cpi->do_frame_data_update &&
4409
0
      cpi->ppi->gf_group.update_type[cpi->gf_frame_index] == INTNL_ARF_UPDATE) {
4410
0
    assert(cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 1);
4411
0
    features->disable_cdf_update = 1;
4412
0
  }
4413
4414
0
#if !CONFIG_REALTIME_ONLY
4415
0
  if (cpi->oxcf.tool_cfg.enable_global_motion && !frame_is_intra_only(cm)) {
4416
    // Flush any stale global motion information, which may be left over
4417
    // from a previous frame
4418
0
    aom_invalidate_pyramid(cpi->source->y_pyramid);
4419
0
    av1_invalidate_corner_list(cpi->source->corners);
4420
0
  }
4421
0
#endif  // !CONFIG_REALTIME_ONLY
4422
4423
0
  int largest_tile_id = 0;
4424
0
  if (av1_superres_in_recode_allowed(cpi)) {
4425
0
    if (encode_with_and_without_superres(cpi, size, dest, dest_size,
4426
0
                                         &largest_tile_id) != AOM_CODEC_OK) {
4427
0
      return AOM_CODEC_ERROR;
4428
0
    }
4429
0
  } else {
4430
0
    const aom_superres_mode orig_superres_mode = cpi->superres_mode;  // save
4431
0
    cpi->superres_mode = cpi->oxcf.superres_cfg.superres_mode;
4432
0
    if (encode_with_recode_loop_and_filter(cpi, size, dest, dest_size, NULL,
4433
0
                                           NULL,
4434
0
                                           &largest_tile_id) != AOM_CODEC_OK) {
4435
0
      return AOM_CODEC_ERROR;
4436
0
    }
4437
0
    cpi->superres_mode = orig_superres_mode;  // restore
4438
0
  }
4439
4440
  // Update reference frame ids for reference frames this frame will overwrite
4441
0
  if (seq_params->frame_id_numbers_present_flag) {
4442
0
    for (int i = 0; i < REF_FRAMES; i++) {
4443
0
      if ((current_frame->refresh_frame_flags >> i) & 1) {
4444
0
        cm->ref_frame_id[i] = cm->current_frame_id;
4445
0
      }
4446
0
    }
4447
0
  }
4448
4449
0
  if (cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1)
4450
0
    cpi->svc.num_encoded_top_layer++;
4451
4452
#if DUMP_RECON_FRAMES == 1
4453
  // NOTE(zoeliu): For debug - Output the filtered reconstructed video.
4454
  av1_dump_filtered_recon_frames(cpi);
4455
#endif  // DUMP_RECON_FRAMES
4456
4457
0
  if (cm->seg.enabled) {
4458
0
    if (cm->seg.update_map == 0 && cm->last_frame_seg_map) {
4459
0
      memcpy(cm->cur_frame->seg_map, cm->last_frame_seg_map,
4460
0
             cm->cur_frame->mi_cols * cm->cur_frame->mi_rows *
4461
0
                 sizeof(*cm->cur_frame->seg_map));
4462
0
    }
4463
0
  }
4464
4465
0
  int release_scaled_refs = 0;
4466
#if CONFIG_FPMT_TEST
4467
  release_scaled_refs =
4468
      (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE) ? 1 : 0;
4469
#endif  // CONFIG_FPMT_TEST
4470
0
  if (release_scaled_refs ||
4471
0
      cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 0) {
4472
0
    if (frame_is_intra_only(cm) == 0) {
4473
0
      release_scaled_references(cpi);
4474
0
    }
4475
0
  }
4476
#if CONFIG_AV1_TEMPORAL_DENOISING
4477
  av1_denoiser_update_ref_frame(cpi);
4478
#endif
4479
4480
  // NOTE: Save the new show frame buffer index for --test-code=warn, i.e.,
4481
  //       for the purpose to verify no mismatch between encoder and decoder.
4482
0
  if (cm->show_frame) cpi->last_show_frame_buf = cm->cur_frame;
4483
4484
0
  if (features->refresh_frame_context == REFRESH_FRAME_CONTEXT_BACKWARD) {
4485
0
    *cm->fc = cpi->tile_data[largest_tile_id].tctx;
4486
0
    av1_reset_cdf_symbol_counters(cm->fc);
4487
0
  }
4488
0
  if (!cm->tiles.large_scale) {
4489
0
    cm->cur_frame->frame_context = *cm->fc;
4490
0
  }
4491
4492
0
  if (tile_cfg->enable_ext_tile_debug) {
4493
    // (yunqing) This test ensures the correctness of large scale tile coding.
4494
0
    if (cm->tiles.large_scale && is_stat_consumption_stage(cpi)) {
4495
0
      char fn[20] = "./fc";
4496
0
      fn[4] = current_frame->frame_number / 100 + '0';
4497
0
      fn[5] = (current_frame->frame_number % 100) / 10 + '0';
4498
0
      fn[6] = (current_frame->frame_number % 10) + '0';
4499
0
      fn[7] = '\0';
4500
0
      av1_print_frame_contexts(cm->fc, fn);
4501
0
    }
4502
0
  }
4503
4504
0
  cpi->last_frame_type = current_frame->frame_type;
4505
4506
0
  if (cm->features.disable_cdf_update) {
4507
0
    cpi->frames_since_last_update++;
4508
0
  } else {
4509
0
    cpi->frames_since_last_update = 1;
4510
0
  }
4511
4512
0
  if (cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1) {
4513
0
    cpi->svc.prev_number_spatial_layers = cpi->svc.number_spatial_layers;
4514
0
  }
4515
0
  cpi->svc.prev_number_temporal_layers = cpi->svc.number_temporal_layers;
4516
4517
  // Clear the one shot update flags for segmentation map and mode/ref loop
4518
  // filter deltas.
4519
0
  cm->seg.update_map = 0;
4520
0
  cm->seg.update_data = 0;
4521
0
  cm->lf.mode_ref_delta_update = 0;
4522
4523
0
  if (cm->show_frame) {
4524
0
    update_counters_for_show_frame(cpi);
4525
0
  }
4526
4527
#if CONFIG_COLLECT_COMPONENT_TIMING
4528
  end_timing(cpi, encode_frame_to_data_rate_time);
4529
#endif
4530
4531
0
  return AOM_CODEC_OK;
4532
0
}
4533
4534
int av1_encode(AV1_COMP *const cpi, uint8_t *const dest, size_t dest_size,
4535
               const EncodeFrameInput *const frame_input,
4536
               const EncodeFrameParams *const frame_params,
4537
0
               size_t *const frame_size) {
4538
0
  AV1_COMMON *const cm = &cpi->common;
4539
0
  CurrentFrame *const current_frame = &cm->current_frame;
4540
4541
0
  cpi->unscaled_source = frame_input->source;
4542
0
  cpi->source = frame_input->source;
4543
0
  cpi->unscaled_last_source = frame_input->last_source;
4544
4545
0
  current_frame->refresh_frame_flags = frame_params->refresh_frame_flags;
4546
0
  cm->features.error_resilient_mode = frame_params->error_resilient_mode;
4547
0
  cm->features.primary_ref_frame = frame_params->primary_ref_frame;
4548
0
  cm->current_frame.frame_type = frame_params->frame_type;
4549
0
  cm->show_frame = frame_params->show_frame;
4550
0
  cpi->ref_frame_flags = frame_params->ref_frame_flags;
4551
0
  cpi->speed = frame_params->speed;
4552
0
  cm->show_existing_frame = frame_params->show_existing_frame;
4553
0
  cpi->existing_fb_idx_to_show = frame_params->existing_fb_idx_to_show;
4554
4555
0
  memcpy(cm->remapped_ref_idx, frame_params->remapped_ref_idx,
4556
0
         REF_FRAMES * sizeof(*cm->remapped_ref_idx));
4557
4558
0
  memcpy(&cpi->refresh_frame, &frame_params->refresh_frame,
4559
0
         sizeof(cpi->refresh_frame));
4560
4561
0
  if (current_frame->frame_type == KEY_FRAME &&
4562
0
      cpi->ppi->gf_group.refbuf_state[cpi->gf_frame_index] == REFBUF_RESET) {
4563
0
    current_frame->frame_number = 0;
4564
0
  }
4565
4566
0
  current_frame->order_hint =
4567
0
      current_frame->frame_number + frame_params->order_offset;
4568
4569
0
  current_frame->display_order_hint = current_frame->order_hint;
4570
0
  current_frame->order_hint %=
4571
0
      (1 << (cm->seq_params->order_hint_info.order_hint_bits_minus_1 + 1));
4572
4573
0
  current_frame->pyramid_level = get_true_pyr_level(
4574
0
      cpi->ppi->gf_group.layer_depth[cpi->gf_frame_index],
4575
0
      current_frame->display_order_hint, cpi->ppi->gf_group.max_layer_depth);
4576
4577
0
#if !CONFIG_REALTIME_ONLY
4578
0
  const GF_GROUP *gf_group = &cpi->ppi->gf_group;
4579
  // Check if this is the last frame in the gop. If so, make a copy of the
4580
  // source for TPL.
4581
0
  if (cpi->oxcf.algo_cfg.enable_tpl_model &&
4582
0
      av1_tpl_stats_ready(&cpi->ppi->tpl_data, cpi->gf_frame_index) &&
4583
0
      gf_group->update_type[cpi->gf_frame_index] != OVERLAY_UPDATE &&
4584
0
      gf_group->update_type[cpi->gf_frame_index] != INTNL_OVERLAY_UPDATE) {
4585
0
    int is_last = 1;
4586
0
    for (int i = 0; i < gf_group->size; ++i) {
4587
0
      if (gf_group->display_idx[i] >
4588
0
          gf_group->display_idx[cpi->gf_frame_index]) {
4589
0
        is_last = 0;
4590
0
        break;
4591
0
      }
4592
0
    }
4593
0
    if (is_last) {
4594
0
      cpi->ppi->tpl_data.prev_gop_arf_disp_order = -1;
4595
0
      const AV1EncoderConfig *const oxcf = &cpi->oxcf;
4596
0
      int available = 1;
4597
0
      int ret = aom_realloc_frame_buffer(
4598
0
          &cpi->ppi->tpl_data.prev_gop_arf_src, oxcf->frm_dim_cfg.width,
4599
0
          oxcf->frm_dim_cfg.height, cm->seq_params->subsampling_x,
4600
0
          cm->seq_params->subsampling_y, cm->seq_params->use_highbitdepth,
4601
0
          cpi->oxcf.border_in_pixels, cm->features.byte_alignment, NULL, NULL,
4602
0
          NULL, cpi->alloc_pyramid, 0);
4603
0
      if (ret)
4604
0
        aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
4605
0
                           "Failed to allocate tpl prev_gop_arf_src buf.");
4606
4607
      // Currently it is not supported if source/reference is resized.
4608
0
      if (cpi->source->y_width == cpi->ppi->tpl_data.prev_gop_arf_src.y_width &&
4609
0
          cpi->source->y_height ==
4610
0
              cpi->ppi->tpl_data.prev_gop_arf_src.y_height) {
4611
        // Copy the content from source to this buffer for next gop.
4612
0
        aom_yv12_copy_frame(cpi->source, &cpi->ppi->tpl_data.prev_gop_arf_src,
4613
0
                            av1_num_planes(cm));
4614
0
      } else {
4615
0
        available = 0;
4616
0
      }
4617
4618
0
      ret = aom_realloc_frame_buffer(
4619
0
          &cpi->ppi->tpl_data.prev_gop_arf_tpl_recon, oxcf->frm_dim_cfg.width,
4620
0
          oxcf->frm_dim_cfg.height, cm->seq_params->subsampling_x,
4621
0
          cm->seq_params->subsampling_y, cm->seq_params->use_highbitdepth,
4622
0
          cpi->oxcf.border_in_pixels, cm->features.byte_alignment, NULL, NULL,
4623
0
          NULL, cpi->alloc_pyramid, 0);
4624
0
      if (ret)
4625
0
        aom_internal_error(
4626
0
            cm->error, AOM_CODEC_MEM_ERROR,
4627
0
            "Failed to allocate tpl prev_gop_arf_tpl_recon buf.");
4628
4629
0
      YV12_BUFFER_CONFIG *prev_gop_arf_tpl_recon_buf =
4630
0
          cpi->ppi->tpl_data.tpl_frame
4631
0
              ? cpi->ppi->tpl_data.tpl_frame[cpi->gf_frame_index].rec_picture
4632
0
              : NULL;
4633
4634
      // Currently it is not supported if source/reference is resized.
4635
0
      if (prev_gop_arf_tpl_recon_buf &&
4636
0
          prev_gop_arf_tpl_recon_buf->y_width ==
4637
0
              cpi->ppi->tpl_data.prev_gop_arf_tpl_recon.y_width &&
4638
0
          prev_gop_arf_tpl_recon_buf->y_height ==
4639
0
              cpi->ppi->tpl_data.prev_gop_arf_tpl_recon.y_height) {
4640
        // Copy the content from source to this buffer for next gop.
4641
0
        aom_yv12_copy_frame(prev_gop_arf_tpl_recon_buf,
4642
0
                            &cpi->ppi->tpl_data.prev_gop_arf_tpl_recon, 1);
4643
0
      } else {
4644
0
        available = 0;
4645
0
      }
4646
4647
0
      if (available) {
4648
0
        cpi->ppi->tpl_data.prev_gop_arf_disp_order =
4649
0
            current_frame->display_order_hint;
4650
0
      }
4651
0
    }
4652
0
  }
4653
0
#endif
4654
4655
0
  if (is_stat_generation_stage(cpi)) {
4656
0
#if !CONFIG_REALTIME_ONLY
4657
0
    if (cpi->oxcf.q_cfg.use_fixed_qp_offsets != 0)
4658
0
      av1_noop_first_pass_frame(cpi, frame_input->ts_duration);
4659
0
    else
4660
0
      av1_first_pass(cpi, frame_input->ts_duration);
4661
0
#endif
4662
0
  } else if (cpi->oxcf.pass == AOM_RC_ONE_PASS ||
4663
0
             cpi->oxcf.pass >= AOM_RC_SECOND_PASS) {
4664
0
    if (encode_frame_to_data_rate(cpi, frame_size, dest, dest_size) !=
4665
0
        AOM_CODEC_OK) {
4666
0
      return AOM_CODEC_ERROR;
4667
0
    }
4668
0
  } else {
4669
0
    return AOM_CODEC_ERROR;
4670
0
  }
4671
4672
0
  if (cpi->ext_ratectrl.ready &&
4673
0
      cpi->ext_ratectrl.funcs.update_encodeframe_result != NULL) {
4674
0
    aom_codec_err_t codec_status = av1_extrc_update_encodeframe_result(
4675
0
        &cpi->ext_ratectrl, (*frame_size) << 3, cm->quant_params.base_qindex);
4676
0
    if (codec_status != AOM_CODEC_OK) {
4677
0
      aom_internal_error(cm->error, codec_status,
4678
0
                         "av1_extrc_update_encodeframe_result() failed");
4679
0
    }
4680
0
  }
4681
4682
0
  return AOM_CODEC_OK;
4683
0
}
4684
4685
#if CONFIG_DENOISE && !CONFIG_REALTIME_ONLY
4686
static int apply_denoise_2d(AV1_COMP *cpi, const YV12_BUFFER_CONFIG *sd,
4687
                            int block_size, float noise_level,
4688
0
                            int64_t time_stamp, int64_t end_time) {
4689
0
  AV1_COMMON *const cm = &cpi->common;
4690
0
  if (!cpi->denoise_and_model) {
4691
0
    cpi->denoise_and_model = aom_denoise_and_model_alloc(
4692
0
        cm->seq_params->bit_depth, block_size, noise_level);
4693
0
    if (!cpi->denoise_and_model) {
4694
0
      aom_set_error(cm->error, AOM_CODEC_MEM_ERROR,
4695
0
                    "Error allocating denoise and model");
4696
0
      return -1;
4697
0
    }
4698
0
  }
4699
0
  if (!cpi->film_grain_table) {
4700
0
    cpi->film_grain_table = aom_malloc(sizeof(*cpi->film_grain_table));
4701
0
    if (!cpi->film_grain_table) {
4702
0
      aom_set_error(cm->error, AOM_CODEC_MEM_ERROR,
4703
0
                    "Error allocating grain table");
4704
0
      return -1;
4705
0
    }
4706
0
    memset(cpi->film_grain_table, 0, sizeof(*cpi->film_grain_table));
4707
0
  }
4708
0
  if (aom_denoise_and_model_run(cpi->denoise_and_model, sd,
4709
0
                                &cm->film_grain_params,
4710
0
                                cpi->oxcf.enable_dnl_denoising)) {
4711
0
    if (cm->film_grain_params.apply_grain) {
4712
0
      aom_film_grain_table_append(cpi->film_grain_table, time_stamp, end_time,
4713
0
                                  &cm->film_grain_params);
4714
0
    }
4715
0
  }
4716
0
  return 0;
4717
0
}
4718
#endif
4719
4720
int av1_receive_raw_frame(AV1_COMP *cpi, aom_enc_frame_flags_t frame_flags,
4721
                          const YV12_BUFFER_CONFIG *sd, int64_t time_stamp,
4722
0
                          int64_t end_time) {
4723
0
  AV1_COMMON *const cm = &cpi->common;
4724
0
  const SequenceHeader *const seq_params = cm->seq_params;
4725
0
  int res = 0;
4726
0
  const int subsampling_x = sd->subsampling_x;
4727
0
  const int subsampling_y = sd->subsampling_y;
4728
0
  const int use_highbitdepth = (sd->flags & YV12_FLAG_HIGHBITDEPTH) != 0;
4729
4730
  // Note: Regarding profile setting, the following checks are added to help
4731
  // choose a proper profile for the input video. The criterion is that all
4732
  // bitstreams must be designated as the lowest profile that match its content.
4733
  // E.G. A bitstream that contains 4:4:4 video must be designated as High
4734
  // Profile in the seq header, and likewise a bitstream that contains 4:2:2
4735
  // bitstream must be designated as Professional Profile in the sequence
4736
  // header.
4737
0
  if ((seq_params->profile == PROFILE_0) && !seq_params->monochrome &&
4738
0
      (subsampling_x != 1 || subsampling_y != 1)) {
4739
0
    aom_set_error(cm->error, AOM_CODEC_INVALID_PARAM,
4740
0
                  "Non-4:2:0 color format requires profile 1 or 2");
4741
0
    return -1;
4742
0
  }
4743
0
  if ((seq_params->profile == PROFILE_1) &&
4744
0
      !(subsampling_x == 0 && subsampling_y == 0)) {
4745
0
    aom_set_error(cm->error, AOM_CODEC_INVALID_PARAM,
4746
0
                  "Profile 1 requires 4:4:4 color format");
4747
0
    return -1;
4748
0
  }
4749
0
  if ((seq_params->profile == PROFILE_2) &&
4750
0
      (seq_params->bit_depth <= AOM_BITS_10) &&
4751
0
      !(subsampling_x == 1 && subsampling_y == 0)) {
4752
0
    aom_set_error(cm->error, AOM_CODEC_INVALID_PARAM,
4753
0
                  "Profile 2 bit-depth <= 10 requires 4:2:2 color format");
4754
0
    return -1;
4755
0
  }
4756
4757
#if CONFIG_TUNE_VMAF
4758
  if (!is_stat_generation_stage(cpi) &&
4759
      cpi->oxcf.tune_cfg.tuning == AOM_TUNE_VMAF_WITH_PREPROCESSING) {
4760
    av1_vmaf_frame_preprocessing(cpi, sd);
4761
  }
4762
  if (!is_stat_generation_stage(cpi) &&
4763
      cpi->oxcf.tune_cfg.tuning == AOM_TUNE_VMAF_MAX_GAIN) {
4764
    av1_vmaf_blk_preprocessing(cpi, sd);
4765
  }
4766
#endif
4767
4768
#if CONFIG_INTERNAL_STATS
4769
  struct aom_usec_timer timer;
4770
  aom_usec_timer_start(&timer);
4771
#endif
4772
4773
#if CONFIG_AV1_TEMPORAL_DENOISING
4774
  setup_denoiser_buffer(cpi);
4775
#endif
4776
4777
0
#if CONFIG_DENOISE
4778
  // even if denoise_noise_level is > 0, we don't need need to denoise on pass
4779
  // 1 of 2 if enable_dnl_denoising is disabled since the 2nd pass will be
4780
  // encoding the original (non-denoised) frame
4781
0
  if (cpi->oxcf.noise_level > 0 && !(cpi->oxcf.pass == AOM_RC_FIRST_PASS &&
4782
0
                                     !cpi->oxcf.enable_dnl_denoising)) {
4783
0
#if !CONFIG_REALTIME_ONLY
4784
    // Choose a synthetic noise level for still images for enhanced perceptual
4785
    // quality based on an estimated noise level in the source, but only if
4786
    // the noise level is set on the command line to > 0.
4787
0
    if (cpi->oxcf.mode == ALLINTRA) {
4788
      // No noise synthesis if source is very clean.
4789
      // Uses a low edge threshold to focus on smooth areas.
4790
      // Increase output noise setting a little compared to measured value.
4791
0
      double y_noise_level = 0.0;
4792
0
      av1_estimate_noise_level(sd, &y_noise_level, AOM_PLANE_Y, AOM_PLANE_Y,
4793
0
                               cm->seq_params->bit_depth, 16);
4794
0
      cpi->oxcf.noise_level = (float)(y_noise_level - 0.1);
4795
0
      cpi->oxcf.noise_level = (float)AOMMAX(0.0, cpi->oxcf.noise_level);
4796
0
      if (cpi->oxcf.noise_level > 0.0) {
4797
0
        cpi->oxcf.noise_level += (float)0.5;
4798
0
      }
4799
0
      cpi->oxcf.noise_level = (float)AOMMIN(5.0, cpi->oxcf.noise_level);
4800
0
    }
4801
4802
0
    if (apply_denoise_2d(cpi, sd, cpi->oxcf.noise_block_size,
4803
0
                         cpi->oxcf.noise_level, time_stamp, end_time) < 0)
4804
0
      res = -1;
4805
0
#endif  // !CONFIG_REALTIME_ONLY
4806
0
  }
4807
0
#endif  //  CONFIG_DENOISE
4808
4809
0
  if (av1_lookahead_push(cpi->ppi->lookahead, sd, time_stamp, end_time,
4810
0
                         use_highbitdepth, cpi->alloc_pyramid, frame_flags)) {
4811
0
    aom_set_error(cm->error, AOM_CODEC_ERROR, "av1_lookahead_push() failed");
4812
0
    res = -1;
4813
0
  }
4814
#if CONFIG_INTERNAL_STATS
4815
  aom_usec_timer_mark(&timer);
4816
  cpi->ppi->total_time_receive_data += aom_usec_timer_elapsed(&timer);
4817
#endif
4818
4819
0
  return res;
4820
0
}
4821
4822
#if CONFIG_ENTROPY_STATS
4823
void print_entropy_stats(AV1_PRIMARY *const ppi) {
4824
  if (!ppi->cpi) return;
4825
4826
  if (ppi->cpi->oxcf.pass != 1 &&
4827
      ppi->cpi->common.current_frame.frame_number > 0) {
4828
    fprintf(stderr, "Writing counts.stt\n");
4829
    FILE *f = fopen("counts.stt", "wb");
4830
    fwrite(&ppi->aggregate_fc, sizeof(ppi->aggregate_fc), 1, f);
4831
    fclose(f);
4832
  }
4833
}
4834
#endif  // CONFIG_ENTROPY_STATS
4835
4836
#if CONFIG_INTERNAL_STATS
4837
static void adjust_image_stat(double y, double u, double v, double all,
4838
                              ImageStat *s) {
4839
  s->stat[STAT_Y] += y;
4840
  s->stat[STAT_U] += u;
4841
  s->stat[STAT_V] += v;
4842
  s->stat[STAT_ALL] += all;
4843
  s->worst = AOMMIN(s->worst, all);
4844
}
4845
4846
static void compute_internal_stats(AV1_COMP *cpi, int frame_bytes) {
4847
  AV1_PRIMARY *const ppi = cpi->ppi;
4848
  AV1_COMMON *const cm = &cpi->common;
4849
  double samples = 0.0;
4850
  const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth;
4851
  const uint32_t bit_depth = cpi->td.mb.e_mbd.bd;
4852
4853
  if (cpi->ppi->use_svc &&
4854
      cpi->svc.spatial_layer_id < cpi->svc.number_spatial_layers - 1)
4855
    return;
4856
4857
#if CONFIG_INTER_STATS_ONLY
4858
  if (cm->current_frame.frame_type == KEY_FRAME) return;  // skip key frame
4859
#endif
4860
  cpi->bytes += frame_bytes;
4861
  if (cm->show_frame) {
4862
    const YV12_BUFFER_CONFIG *orig = cpi->source;
4863
    const YV12_BUFFER_CONFIG *recon = &cpi->common.cur_frame->buf;
4864
    double y, u, v, frame_all;
4865
4866
    ppi->count[0]++;
4867
    ppi->count[1]++;
4868
    if (cpi->ppi->b_calculate_psnr) {
4869
      PSNR_STATS psnr;
4870
      double weight[2] = { 0.0, 0.0 };
4871
      double frame_ssim2[2] = { 0.0, 0.0 };
4872
#if CONFIG_AV1_HIGHBITDEPTH
4873
      aom_calc_highbd_psnr(orig, recon, &psnr, bit_depth, in_bit_depth);
4874
#else
4875
      aom_calc_psnr(orig, recon, &psnr);
4876
#endif
4877
      adjust_image_stat(psnr.psnr[1], psnr.psnr[2], psnr.psnr[3], psnr.psnr[0],
4878
                        &(ppi->psnr[0]));
4879
      ppi->total_sq_error[0] += psnr.sse[0];
4880
      ppi->total_samples[0] += psnr.samples[0];
4881
      samples = psnr.samples[0];
4882
4883
      aom_calc_ssim(orig, recon, bit_depth, in_bit_depth,
4884
                    cm->seq_params->use_highbitdepth, weight, frame_ssim2);
4885
4886
      ppi->worst_ssim = AOMMIN(ppi->worst_ssim, frame_ssim2[0]);
4887
      ppi->summed_quality += frame_ssim2[0] * weight[0];
4888
      ppi->summed_weights += weight[0];
4889
4890
#if CONFIG_AV1_HIGHBITDEPTH
4891
      // Compute PSNR based on stream bit depth
4892
      if ((cpi->source->flags & YV12_FLAG_HIGHBITDEPTH) &&
4893
          (in_bit_depth < bit_depth)) {
4894
        adjust_image_stat(psnr.psnr_hbd[1], psnr.psnr_hbd[2], psnr.psnr_hbd[3],
4895
                          psnr.psnr_hbd[0], &ppi->psnr[1]);
4896
        ppi->total_sq_error[1] += psnr.sse_hbd[0];
4897
        ppi->total_samples[1] += psnr.samples_hbd[0];
4898
4899
        ppi->worst_ssim_hbd = AOMMIN(ppi->worst_ssim_hbd, frame_ssim2[1]);
4900
        ppi->summed_quality_hbd += frame_ssim2[1] * weight[1];
4901
        ppi->summed_weights_hbd += weight[1];
4902
      }
4903
#endif
4904
4905
#if 0
4906
      {
4907
        FILE *f = fopen("q_used.stt", "a");
4908
        double y2 = psnr.psnr[1];
4909
        double u2 = psnr.psnr[2];
4910
        double v2 = psnr.psnr[3];
4911
        double frame_psnr2 = psnr.psnr[0];
4912
        fprintf(f, "%5d : Y%f7.3:U%f7.3:V%f7.3:F%f7.3:S%7.3f\n",
4913
                cm->current_frame.frame_number, y2, u2, v2,
4914
                frame_psnr2, frame_ssim2);
4915
        fclose(f);
4916
      }
4917
#endif
4918
    }
4919
    if (ppi->b_calculate_blockiness) {
4920
      if (!cm->seq_params->use_highbitdepth) {
4921
        const double frame_blockiness =
4922
            av1_get_blockiness(orig->y_buffer, orig->y_stride, recon->y_buffer,
4923
                               recon->y_stride, orig->y_width, orig->y_height);
4924
        ppi->worst_blockiness = AOMMAX(ppi->worst_blockiness, frame_blockiness);
4925
        ppi->total_blockiness += frame_blockiness;
4926
      }
4927
4928
      if (ppi->b_calculate_consistency) {
4929
        if (!cm->seq_params->use_highbitdepth) {
4930
          const double this_inconsistency = aom_get_ssim_metrics(
4931
              orig->y_buffer, orig->y_stride, recon->y_buffer, recon->y_stride,
4932
              orig->y_width, orig->y_height, ppi->ssim_vars, &ppi->metrics, 1);
4933
4934
          const double peak = (double)((1 << in_bit_depth) - 1);
4935
          const double consistency =
4936
              aom_sse_to_psnr(samples, peak, ppi->total_inconsistency);
4937
          if (consistency > 0.0)
4938
            ppi->worst_consistency =
4939
                AOMMIN(ppi->worst_consistency, consistency);
4940
          ppi->total_inconsistency += this_inconsistency;
4941
        }
4942
      }
4943
    }
4944
4945
    frame_all =
4946
        aom_calc_fastssim(orig, recon, &y, &u, &v, bit_depth, in_bit_depth);
4947
    adjust_image_stat(y, u, v, frame_all, &ppi->fastssim);
4948
    frame_all = aom_psnrhvs(orig, recon, &y, &u, &v, bit_depth, in_bit_depth);
4949
    adjust_image_stat(y, u, v, frame_all, &ppi->psnrhvs);
4950
  }
4951
}
4952
4953
void print_internal_stats(AV1_PRIMARY *ppi) {
4954
  if (!ppi->cpi) return;
4955
  AV1_COMP *const cpi = ppi->cpi;
4956
4957
  if (ppi->cpi->oxcf.pass != 1 &&
4958
      ppi->cpi->common.current_frame.frame_number > 0) {
4959
    char headings[512] = { 0 };
4960
    char results[512] = { 0 };
4961
    FILE *f = fopen("opsnr.stt", "a");
4962
    double time_encoded =
4963
        (cpi->time_stamps.prev_ts_end - cpi->time_stamps.first_ts_start) /
4964
        10000000.000;
4965
    double total_encode_time =
4966
        (ppi->total_time_receive_data + ppi->total_time_compress_data) /
4967
        1000.000;
4968
    const double dr =
4969
        (double)ppi->total_bytes * (double)8 / (double)1000 / time_encoded;
4970
    const double peak =
4971
        (double)((1 << ppi->cpi->oxcf.input_cfg.input_bit_depth) - 1);
4972
    const double target_rate =
4973
        (double)ppi->cpi->oxcf.rc_cfg.target_bandwidth / 1000;
4974
    const double rate_err = ((100.0 * (dr - target_rate)) / target_rate);
4975
4976
    if (ppi->b_calculate_psnr) {
4977
      const double total_psnr = aom_sse_to_psnr(
4978
          (double)ppi->total_samples[0], peak, (double)ppi->total_sq_error[0]);
4979
      const double total_ssim =
4980
          100 * pow(ppi->summed_quality / ppi->summed_weights, 8.0);
4981
      snprintf(headings, sizeof(headings),
4982
               "Bitrate\tAVGPsnr\tGLBPsnr\tAVPsnrP\tGLPsnrP\t"
4983
               "AOMSSIM\tVPSSIMP\tFASTSIM\tPSNRHVS\t"
4984
               "WstPsnr\tWstSsim\tWstFast\tWstHVS\t"
4985
               "AVPsrnY\tAPsnrCb\tAPsnrCr");
4986
      snprintf(results, sizeof(results),
4987
               "%7.2f\t%7.3f\t%7.3f\t%7.3f\t%7.3f\t"
4988
               "%7.3f\t%7.3f\t%7.3f\t%7.3f\t"
4989
               "%7.3f\t%7.3f\t%7.3f\t%7.3f\t"
4990
               "%7.3f\t%7.3f\t%7.3f",
4991
               dr, ppi->psnr[0].stat[STAT_ALL] / ppi->count[0], total_psnr,
4992
               ppi->psnr[0].stat[STAT_ALL] / ppi->count[0], total_psnr,
4993
               total_ssim, total_ssim,
4994
               ppi->fastssim.stat[STAT_ALL] / ppi->count[0],
4995
               ppi->psnrhvs.stat[STAT_ALL] / ppi->count[0], ppi->psnr[0].worst,
4996
               ppi->worst_ssim, ppi->fastssim.worst, ppi->psnrhvs.worst,
4997
               ppi->psnr[0].stat[STAT_Y] / ppi->count[0],
4998
               ppi->psnr[0].stat[STAT_U] / ppi->count[0],
4999
               ppi->psnr[0].stat[STAT_V] / ppi->count[0]);
5000
5001
      if (ppi->b_calculate_blockiness) {
5002
        SNPRINT(headings, "\t  Block\tWstBlck");
5003
        SNPRINT2(results, "\t%7.3f", ppi->total_blockiness / ppi->count[0]);
5004
        SNPRINT2(results, "\t%7.3f", ppi->worst_blockiness);
5005
      }
5006
5007
      if (ppi->b_calculate_consistency) {
5008
        double consistency =
5009
            aom_sse_to_psnr((double)ppi->total_samples[0], peak,
5010
                            (double)ppi->total_inconsistency);
5011
5012
        SNPRINT(headings, "\tConsist\tWstCons");
5013
        SNPRINT2(results, "\t%7.3f", consistency);
5014
        SNPRINT2(results, "\t%7.3f", ppi->worst_consistency);
5015
      }
5016
5017
      SNPRINT(headings, "\t   Time\tRcErr\tAbsErr");
5018
      SNPRINT2(results, "\t%8.0f", total_encode_time);
5019
      SNPRINT2(results, " %7.2f", rate_err);
5020
      SNPRINT2(results, " %7.2f", fabs(rate_err));
5021
5022
      SNPRINT(headings, "\tAPsnr611");
5023
      SNPRINT2(results, " %7.3f",
5024
               (6 * ppi->psnr[0].stat[STAT_Y] + ppi->psnr[0].stat[STAT_U] +
5025
                ppi->psnr[0].stat[STAT_V]) /
5026
                   (ppi->count[0] * 8));
5027
5028
#if CONFIG_AV1_HIGHBITDEPTH
5029
      const uint32_t in_bit_depth = ppi->cpi->oxcf.input_cfg.input_bit_depth;
5030
      const uint32_t bit_depth = ppi->seq_params.bit_depth;
5031
      // Since cpi->source->flags is not available here, but total_samples[1]
5032
      // will be non-zero if cpi->source->flags & YV12_FLAG_HIGHBITDEPTH was
5033
      // true in compute_internal_stats
5034
      if ((ppi->total_samples[1] > 0) && (in_bit_depth < bit_depth)) {
5035
        const double peak_hbd = (double)((1 << bit_depth) - 1);
5036
        const double total_psnr_hbd =
5037
            aom_sse_to_psnr((double)ppi->total_samples[1], peak_hbd,
5038
                            (double)ppi->total_sq_error[1]);
5039
        const double total_ssim_hbd =
5040
            100 * pow(ppi->summed_quality_hbd / ppi->summed_weights_hbd, 8.0);
5041
        SNPRINT(headings,
5042
                "\t AVGPsnrH GLBPsnrH AVPsnrPH GLPsnrPH"
5043
                " AVPsnrYH APsnrCbH APsnrCrH WstPsnrH"
5044
                " AOMSSIMH VPSSIMPH WstSsimH");
5045
        SNPRINT2(results, "\t%7.3f",
5046
                 ppi->psnr[1].stat[STAT_ALL] / ppi->count[1]);
5047
        SNPRINT2(results, "  %7.3f", total_psnr_hbd);
5048
        SNPRINT2(results, "  %7.3f",
5049
                 ppi->psnr[1].stat[STAT_ALL] / ppi->count[1]);
5050
        SNPRINT2(results, "  %7.3f", total_psnr_hbd);
5051
        SNPRINT2(results, "  %7.3f", ppi->psnr[1].stat[STAT_Y] / ppi->count[1]);
5052
        SNPRINT2(results, "  %7.3f", ppi->psnr[1].stat[STAT_U] / ppi->count[1]);
5053
        SNPRINT2(results, "  %7.3f", ppi->psnr[1].stat[STAT_V] / ppi->count[1]);
5054
        SNPRINT2(results, "  %7.3f", ppi->psnr[1].worst);
5055
        SNPRINT2(results, "  %7.3f", total_ssim_hbd);
5056
        SNPRINT2(results, "  %7.3f", total_ssim_hbd);
5057
        SNPRINT2(results, "  %7.3f", ppi->worst_ssim_hbd);
5058
      }
5059
#endif
5060
      fprintf(f, "%s\n", headings);
5061
      fprintf(f, "%s\n", results);
5062
    }
5063
5064
    fclose(f);
5065
5066
    aom_free(ppi->ssim_vars);
5067
    ppi->ssim_vars = NULL;
5068
  }
5069
}
5070
#endif  // CONFIG_INTERNAL_STATS
5071
5072
0
static inline void update_keyframe_counters(AV1_COMP *cpi) {
5073
0
  if (cpi->common.show_frame && cpi->rc.frames_to_key) {
5074
0
#if !CONFIG_REALTIME_ONLY
5075
0
    FIRSTPASS_INFO *firstpass_info = &cpi->ppi->twopass.firstpass_info;
5076
0
    if (firstpass_info->past_stats_count > FIRSTPASS_INFO_STATS_PAST_MIN) {
5077
0
      av1_firstpass_info_move_cur_index_and_pop(firstpass_info);
5078
0
    } else {
5079
      // When there is not enough past stats, we move the current
5080
      // index without popping the past stats
5081
0
      av1_firstpass_info_move_cur_index(firstpass_info);
5082
0
    }
5083
0
#endif
5084
0
    if (cpi->svc.spatial_layer_id == cpi->svc.number_spatial_layers - 1) {
5085
0
      cpi->rc.frames_since_key++;
5086
0
      cpi->rc.frames_to_key--;
5087
0
      cpi->rc.frames_to_fwd_kf--;
5088
0
      cpi->rc.frames_since_scene_change++;
5089
0
    }
5090
0
  }
5091
0
}
5092
5093
0
static inline void update_frames_till_gf_update(AV1_COMP *cpi) {
5094
  // TODO(weitinglin): Updating this counter for is_frame_droppable
5095
  // is a work-around to handle the condition when a frame is drop.
5096
  // We should fix the cpi->common.show_frame flag
5097
  // instead of checking the other condition to update the counter properly.
5098
0
  if (cpi->common.show_frame ||
5099
0
      is_frame_droppable(&cpi->ppi->rtc_ref, &cpi->ext_flags.refresh_frame)) {
5100
    // Decrement count down till next gf
5101
0
    if (cpi->rc.frames_till_gf_update_due > 0)
5102
0
      cpi->rc.frames_till_gf_update_due--;
5103
0
  }
5104
0
}
5105
5106
0
static inline void update_gf_group_index(AV1_COMP *cpi) {
5107
  // Increment the gf group index ready for the next frame.
5108
0
  ++cpi->gf_frame_index;
5109
  // Reset gf_frame_index in case it reaches MAX_STATIC_GF_GROUP_LENGTH.
5110
0
  if (cpi->gf_frame_index == MAX_STATIC_GF_GROUP_LENGTH)
5111
0
    cpi->gf_frame_index = 0;
5112
0
}
5113
5114
static void update_fb_of_context_type(const AV1_COMP *const cpi,
5115
0
                                      int *const fb_of_context_type) {
5116
0
  const AV1_COMMON *const cm = &cpi->common;
5117
0
  const int current_frame_ref_type = get_current_frame_ref_type(cpi);
5118
5119
0
  if (frame_is_intra_only(cm) || cm->features.error_resilient_mode ||
5120
0
      cpi->ext_flags.use_primary_ref_none) {
5121
0
    for (int i = 0; i < REF_FRAMES; i++) {
5122
0
      fb_of_context_type[i] = -1;
5123
0
    }
5124
0
    fb_of_context_type[current_frame_ref_type] =
5125
0
        cm->show_frame ? get_ref_frame_map_idx(cm, GOLDEN_FRAME)
5126
0
                       : get_ref_frame_map_idx(cm, ALTREF_FRAME);
5127
0
  }
5128
5129
0
  if (!encode_show_existing_frame(cm)) {
5130
    // Refresh fb_of_context_type[]: see encoder.h for explanation
5131
0
    if (cm->current_frame.frame_type == KEY_FRAME) {
5132
      // All ref frames are refreshed, pick one that will live long enough
5133
0
      fb_of_context_type[current_frame_ref_type] = 0;
5134
0
    } else {
5135
      // If more than one frame is refreshed, it doesn't matter which one we
5136
      // pick so pick the first.  LST sometimes doesn't refresh any: this is ok
5137
5138
0
      for (int i = 0; i < REF_FRAMES; i++) {
5139
0
        if (cm->current_frame.refresh_frame_flags & (1 << i)) {
5140
0
          fb_of_context_type[current_frame_ref_type] = i;
5141
0
          break;
5142
0
        }
5143
0
      }
5144
0
    }
5145
0
  }
5146
0
}
5147
5148
0
static void update_rc_counts(AV1_COMP *cpi) {
5149
0
  update_keyframe_counters(cpi);
5150
0
  update_frames_till_gf_update(cpi);
5151
0
  update_gf_group_index(cpi);
5152
0
}
5153
5154
0
static void update_end_of_frame_stats(AV1_COMP *cpi) {
5155
0
  if (cpi->do_frame_data_update) {
5156
    // Store current frame loopfilter levels in ppi, if update flag is set.
5157
0
    if (!cpi->common.show_existing_frame) {
5158
0
      AV1_COMMON *const cm = &cpi->common;
5159
0
      struct loopfilter *const lf = &cm->lf;
5160
0
      cpi->ppi->filter_level[0] = lf->backup_filter_level[0];
5161
0
      cpi->ppi->filter_level[1] = lf->backup_filter_level[1];
5162
0
      cpi->ppi->filter_level_u = lf->backup_filter_level_u;
5163
0
      cpi->ppi->filter_level_v = lf->backup_filter_level_v;
5164
0
    }
5165
0
  }
5166
  // Store frame level mv_stats from cpi to ppi.
5167
0
  cpi->ppi->mv_stats = cpi->mv_stats;
5168
0
}
5169
5170
// Updates frame level stats related to global motion
5171
0
static inline void update_gm_stats(AV1_COMP *cpi) {
5172
0
  FRAME_UPDATE_TYPE update_type =
5173
0
      cpi->ppi->gf_group.update_type[cpi->gf_frame_index];
5174
0
  int i, is_gm_present = 0;
5175
5176
  // Check if the current frame has any valid global motion model across its
5177
  // reference frames
5178
0
  for (i = 0; i < REF_FRAMES; i++) {
5179
0
    if (cpi->common.global_motion[i].wmtype != IDENTITY) {
5180
0
      is_gm_present = 1;
5181
0
      break;
5182
0
    }
5183
0
  }
5184
0
  int update_actual_stats = 1;
5185
#if CONFIG_FPMT_TEST
5186
  update_actual_stats =
5187
      (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE) ? 0 : 1;
5188
  if (!update_actual_stats) {
5189
    if (cpi->ppi->temp_valid_gm_model_found[update_type] == INT32_MAX) {
5190
      cpi->ppi->temp_valid_gm_model_found[update_type] = is_gm_present;
5191
    } else {
5192
      cpi->ppi->temp_valid_gm_model_found[update_type] |= is_gm_present;
5193
    }
5194
    int show_existing_between_parallel_frames =
5195
        (cpi->ppi->gf_group.update_type[cpi->gf_frame_index] ==
5196
             INTNL_OVERLAY_UPDATE &&
5197
         cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index + 1] == 2);
5198
    if (cpi->do_frame_data_update == 1 &&
5199
        !show_existing_between_parallel_frames) {
5200
      for (i = 0; i < FRAME_UPDATE_TYPES; i++) {
5201
        cpi->ppi->valid_gm_model_found[i] =
5202
            cpi->ppi->temp_valid_gm_model_found[i];
5203
      }
5204
    }
5205
  }
5206
#endif
5207
0
  if (update_actual_stats) {
5208
0
    if (cpi->ppi->valid_gm_model_found[update_type] == INT32_MAX) {
5209
0
      cpi->ppi->valid_gm_model_found[update_type] = is_gm_present;
5210
0
    } else {
5211
0
      cpi->ppi->valid_gm_model_found[update_type] |= is_gm_present;
5212
0
    }
5213
0
  }
5214
0
}
5215
5216
void av1_post_encode_updates(AV1_COMP *const cpi,
5217
0
                             const AV1_COMP_DATA *const cpi_data) {
5218
0
  AV1_PRIMARY *const ppi = cpi->ppi;
5219
0
  AV1_COMMON *const cm = &cpi->common;
5220
5221
0
  if (ppi->b_freeze_internal_state) {
5222
    // Should not update encoder state, just necessary work to get the
5223
    // expected output and then return early.
5224
5225
    // Note *size = 0 indicates a dropped frame for which psnr is not calculated
5226
0
    if (ppi->b_calculate_psnr && cpi_data->frame_size > 0) {
5227
0
      if (cm->show_existing_frame ||
5228
0
          (!is_stat_generation_stage(cpi) && cm->show_frame)) {
5229
0
        generate_psnr_packet(cpi);
5230
0
      }
5231
0
    }
5232
5233
0
    if (cpi_data->pop_lookahead == 1) {
5234
0
      av1_lookahead_pop(cpi->ppi->lookahead, cpi_data->flush,
5235
0
                        cpi->compressor_stage);
5236
0
    }
5237
0
    return;
5238
0
  }
5239
5240
0
  update_gm_stats(cpi);
5241
5242
0
#if !CONFIG_REALTIME_ONLY
5243
  // Update the total stats remaining structure.
5244
0
  if (cpi->twopass_frame.this_frame != NULL &&
5245
0
      ppi->twopass.stats_buf_ctx->total_left_stats) {
5246
0
    subtract_stats(ppi->twopass.stats_buf_ctx->total_left_stats,
5247
0
                   cpi->twopass_frame.this_frame);
5248
0
  }
5249
0
#endif
5250
5251
#if CONFIG_OUTPUT_FRAME_SIZE
5252
  FILE *f = fopen("frame_sizes.csv", "a");
5253
  fprintf(f, "%d,", 8 * (int)cpi_data->frame_size);
5254
  fprintf(f, "%d\n", cm->quant_params.base_qindex);
5255
  fclose(f);
5256
#endif  // CONFIG_OUTPUT_FRAME_SIZE
5257
5258
0
  if (!is_stat_generation_stage(cpi) && !cpi->is_dropped_frame) {
5259
    // Before calling refresh_reference_frames(), copy ppi->ref_frame_map_copy
5260
    // to cm->ref_frame_map for frame_parallel_level 2 frame in a parallel
5261
    // encode set of lower layer frames.
5262
    // TODO(Remya): Move ref_frame_map from AV1_COMMON to AV1_PRIMARY to avoid
5263
    // copy.
5264
0
    if (ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 2 &&
5265
0
        ppi->gf_group.frame_parallel_level[cpi->gf_frame_index - 1] == 1 &&
5266
0
        ppi->gf_group.update_type[cpi->gf_frame_index - 1] ==
5267
0
            INTNL_ARF_UPDATE) {
5268
0
      memcpy(cm->ref_frame_map, ppi->ref_frame_map_copy,
5269
0
             sizeof(cm->ref_frame_map));
5270
0
    }
5271
0
    refresh_reference_frames(cpi);
5272
    // For frame_parallel_level 1 frame in a parallel encode set of lower layer
5273
    // frames, store the updated cm->ref_frame_map in ppi->ref_frame_map_copy.
5274
0
    if (ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] == 1 &&
5275
0
        ppi->gf_group.update_type[cpi->gf_frame_index] == INTNL_ARF_UPDATE) {
5276
0
      memcpy(ppi->ref_frame_map_copy, cm->ref_frame_map,
5277
0
             sizeof(cm->ref_frame_map));
5278
0
    }
5279
0
    av1_rc_postencode_update(cpi, cpi_data->frame_size);
5280
0
  }
5281
5282
0
  if (cpi_data->pop_lookahead == 1) {
5283
0
    av1_lookahead_pop(cpi->ppi->lookahead, cpi_data->flush,
5284
0
                      cpi->compressor_stage);
5285
0
  }
5286
0
  if (cpi->common.show_frame) {
5287
0
    cpi->ppi->ts_start_last_show_frame = cpi_data->ts_frame_start;
5288
0
    cpi->ppi->ts_end_last_show_frame = cpi_data->ts_frame_end;
5289
0
  }
5290
0
  if (ppi->level_params.keep_level_stats && !is_stat_generation_stage(cpi)) {
5291
    // Initialize level info. at the beginning of each sequence.
5292
0
    if (cm->current_frame.frame_type == KEY_FRAME &&
5293
0
        ppi->gf_group.refbuf_state[cpi->gf_frame_index] == REFBUF_RESET) {
5294
0
      av1_init_level_info(cpi);
5295
0
    }
5296
0
    av1_update_level_info(cpi, cpi_data->frame_size, cpi_data->ts_frame_start,
5297
0
                          cpi_data->ts_frame_end);
5298
0
  }
5299
5300
0
  if (!is_stat_generation_stage(cpi)) {
5301
0
#if !CONFIG_REALTIME_ONLY
5302
0
    if (!has_no_stats_stage(cpi)) av1_twopass_postencode_update(cpi);
5303
0
#endif
5304
0
    update_fb_of_context_type(cpi, ppi->fb_of_context_type);
5305
0
    update_rc_counts(cpi);
5306
0
    update_end_of_frame_stats(cpi);
5307
0
  }
5308
5309
#if CONFIG_THREE_PASS
5310
  if (cpi->oxcf.pass == AOM_RC_THIRD_PASS && cpi->third_pass_ctx) {
5311
    av1_pop_third_pass_info(cpi->third_pass_ctx);
5312
  }
5313
#endif
5314
5315
0
  if (ppi->rtc_ref.set_ref_frame_config && !cpi->is_dropped_frame) {
5316
0
    av1_svc_update_buffer_slot_refreshed(cpi);
5317
0
    av1_svc_set_reference_was_previous(cpi);
5318
0
  }
5319
5320
0
  if (ppi->use_svc) av1_save_layer_context(cpi);
5321
5322
  // Note *size = 0 indicates a dropped frame for which psnr is not calculated
5323
0
  if (ppi->b_calculate_psnr && cpi_data->frame_size > 0) {
5324
0
    if (cm->show_existing_frame ||
5325
0
        (!is_stat_generation_stage(cpi) && cm->show_frame)) {
5326
0
      generate_psnr_packet(cpi);
5327
0
    }
5328
0
  }
5329
5330
#if CONFIG_INTERNAL_STATS
5331
  if (!is_stat_generation_stage(cpi)) {
5332
    compute_internal_stats(cpi, (int)cpi_data->frame_size);
5333
  }
5334
#endif  // CONFIG_INTERNAL_STATS
5335
5336
#if CONFIG_THREE_PASS
5337
  // Write frame info. Subtract 1 from frame index since if was incremented in
5338
  // update_rc_counts.
5339
  av1_write_second_pass_per_frame_info(cpi, cpi->gf_frame_index - 1);
5340
#endif
5341
0
}
5342
5343
0
int av1_get_compressed_data(AV1_COMP *cpi, AV1_COMP_DATA *const cpi_data) {
5344
0
  const AV1EncoderConfig *const oxcf = &cpi->oxcf;
5345
0
  AV1_COMMON *const cm = &cpi->common;
5346
5347
  // The jmp_buf is valid only for the duration of the function that calls
5348
  // setjmp(). Therefore, this function must reset the 'setjmp' field to 0
5349
  // before it returns.
5350
0
  if (setjmp(cm->error->jmp)) {
5351
0
    cm->error->setjmp = 0;
5352
0
    return cm->error->error_code;
5353
0
  }
5354
0
  cm->error->setjmp = 1;
5355
5356
#if CONFIG_INTERNAL_STATS
5357
  cpi->frame_recode_hits = 0;
5358
  cpi->time_compress_data = 0;
5359
  cpi->bytes = 0;
5360
#endif
5361
#if CONFIG_ENTROPY_STATS
5362
  if (cpi->compressor_stage == ENCODE_STAGE) {
5363
    av1_zero(cpi->counts);
5364
  }
5365
#endif
5366
5367
#if CONFIG_BITSTREAM_DEBUG
5368
  assert(cpi->oxcf.max_threads <= 1 &&
5369
         "bitstream debug tool does not support multithreading");
5370
  bitstream_queue_record_write();
5371
5372
  if (cm->seq_params->order_hint_info.enable_order_hint) {
5373
    aom_bitstream_queue_set_frame_write(cm->current_frame.order_hint * 2 +
5374
                                        cm->show_frame);
5375
  } else {
5376
    // This is currently used in RTC encoding. cm->show_frame is always 1.
5377
    aom_bitstream_queue_set_frame_write(cm->current_frame.frame_number);
5378
  }
5379
#endif
5380
0
  if (cpi->ppi->use_svc) {
5381
0
    av1_one_pass_cbr_svc_start_layer(cpi);
5382
0
  }
5383
5384
0
  cpi->is_dropped_frame = false;
5385
0
  cm->showable_frame = 0;
5386
0
  cpi_data->frame_size = 0;
5387
#if CONFIG_INTERNAL_STATS
5388
  struct aom_usec_timer cmptimer;
5389
  aom_usec_timer_start(&cmptimer);
5390
#endif
5391
0
  av1_set_high_precision_mv(cpi, 1, 0);
5392
5393
  // Normal defaults
5394
0
  cm->features.refresh_frame_context =
5395
0
      oxcf->tool_cfg.frame_parallel_decoding_mode
5396
0
          ? REFRESH_FRAME_CONTEXT_DISABLED
5397
0
          : REFRESH_FRAME_CONTEXT_BACKWARD;
5398
0
  if (oxcf->tile_cfg.enable_large_scale_tile)
5399
0
    cm->features.refresh_frame_context = REFRESH_FRAME_CONTEXT_DISABLED;
5400
5401
0
  if (assign_cur_frame_new_fb(cm) == NULL) {
5402
0
    aom_internal_error(cpi->common.error, AOM_CODEC_ERROR,
5403
0
                       "Failed to allocate new cur_frame");
5404
0
  }
5405
5406
#if CONFIG_COLLECT_COMPONENT_TIMING
5407
  // Accumulate 2nd pass time in 2-pass case or 1 pass time in 1-pass case.
5408
  if (cpi->oxcf.pass == 2 || cpi->oxcf.pass == 0)
5409
    start_timing(cpi, av1_encode_strategy_time);
5410
#endif
5411
5412
0
  const int result = av1_encode_strategy(
5413
0
      cpi, &cpi_data->frame_size, cpi_data->cx_data, cpi_data->cx_data_sz,
5414
0
      &cpi_data->lib_flags, &cpi_data->ts_frame_start, &cpi_data->ts_frame_end,
5415
0
      cpi_data->timestamp_ratio, &cpi_data->pop_lookahead, cpi_data->flush);
5416
5417
#if CONFIG_COLLECT_COMPONENT_TIMING
5418
  if (cpi->oxcf.pass == 2 || cpi->oxcf.pass == 0)
5419
    end_timing(cpi, av1_encode_strategy_time);
5420
5421
  // Print out timing information.
5422
  // Note: Use "cpi->frame_component_time[0] > 100 us" to avoid showing of
5423
  // show_existing_frame and lag-in-frames.
5424
  if ((cpi->oxcf.pass == 2 || cpi->oxcf.pass == 0) &&
5425
      cpi->frame_component_time[0] > 100) {
5426
    int i;
5427
    uint64_t frame_total = 0, total = 0;
5428
    const GF_GROUP *const gf_group = &cpi->ppi->gf_group;
5429
    FRAME_UPDATE_TYPE frame_update_type =
5430
        get_frame_update_type(gf_group, cpi->gf_frame_index);
5431
5432
    fprintf(stderr,
5433
            "\n Frame number: %d, Frame type: %s, Show Frame: %d, Frame Update "
5434
            "Type: %d, Q: %d\n",
5435
            cm->current_frame.frame_number,
5436
            get_frame_type_enum(cm->current_frame.frame_type), cm->show_frame,
5437
            frame_update_type, cm->quant_params.base_qindex);
5438
    for (i = 0; i < kTimingComponents; i++) {
5439
      cpi->component_time[i] += cpi->frame_component_time[i];
5440
      // Use av1_encode_strategy_time (i = 0) as the total time.
5441
      if (i == 0) {
5442
        frame_total = cpi->frame_component_time[0];
5443
        total = cpi->component_time[0];
5444
      }
5445
      fprintf(stderr,
5446
              " %50s:  %15" PRId64 " us [%6.2f%%] (total: %15" PRId64
5447
              " us [%6.2f%%])\n",
5448
              get_component_name(i), cpi->frame_component_time[i],
5449
              (float)((float)cpi->frame_component_time[i] * 100.0 /
5450
                      (float)frame_total),
5451
              cpi->component_time[i],
5452
              (float)((float)cpi->component_time[i] * 100.0 / (float)total));
5453
      cpi->frame_component_time[i] = 0;
5454
    }
5455
  }
5456
#endif
5457
5458
  // Reset the flag to 0 afer encoding.
5459
0
  cpi->rc.use_external_qp_one_pass = 0;
5460
5461
0
  if (result == -1) {
5462
0
    cm->error->setjmp = 0;
5463
    // Returning -1 indicates no frame encoded; more input is required
5464
0
    return -1;
5465
0
  }
5466
0
  if (result != AOM_CODEC_OK) {
5467
0
    aom_internal_error(cpi->common.error, AOM_CODEC_ERROR,
5468
0
                       "Failed to encode frame");
5469
0
  }
5470
#if CONFIG_INTERNAL_STATS
5471
  aom_usec_timer_mark(&cmptimer);
5472
  cpi->time_compress_data += aom_usec_timer_elapsed(&cmptimer);
5473
#endif  // CONFIG_INTERNAL_STATS
5474
5475
#if CONFIG_SPEED_STATS
5476
  if (!is_stat_generation_stage(cpi) && !cm->show_existing_frame) {
5477
    cpi->tx_search_count += cpi->td.mb.txfm_search_info.tx_search_count;
5478
    cpi->td.mb.txfm_search_info.tx_search_count = 0;
5479
  }
5480
#endif  // CONFIG_SPEED_STATS
5481
5482
0
  cm->error->setjmp = 0;
5483
0
  return AOM_CODEC_OK;
5484
0
}
5485
5486
// Populates cpi->scaled_ref_buf corresponding to frames in a parallel encode
5487
// set. Also sets the bitmask 'ref_buffers_used_map'.
5488
0
static void scale_references_fpmt(AV1_COMP *cpi, int *ref_buffers_used_map) {
5489
0
  AV1_COMMON *cm = &cpi->common;
5490
0
  MV_REFERENCE_FRAME ref_frame;
5491
5492
0
  for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
5493
    // Need to convert from AOM_REFFRAME to index into ref_mask (subtract 1).
5494
0
    if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ref_frame]) {
5495
0
      const YV12_BUFFER_CONFIG *const ref =
5496
0
          get_ref_frame_yv12_buf(cm, ref_frame);
5497
5498
0
      if (ref == NULL) {
5499
0
        cpi->scaled_ref_buf[ref_frame - 1] = NULL;
5500
0
        continue;
5501
0
      }
5502
5503
      // FPMT does not support scaling yet.
5504
0
      assert(ref->y_crop_width == cm->width &&
5505
0
             ref->y_crop_height == cm->height);
5506
5507
0
      RefCntBuffer *buf = get_ref_frame_buf(cm, ref_frame);
5508
0
      cpi->scaled_ref_buf[ref_frame - 1] = buf;
5509
0
      for (int i = 0; i < cm->buffer_pool->num_frame_bufs; ++i) {
5510
0
        if (&cm->buffer_pool->frame_bufs[i] == buf) {
5511
0
          *ref_buffers_used_map |= (1 << i);
5512
0
        }
5513
0
      }
5514
0
    } else {
5515
0
      if (!has_no_stats_stage(cpi)) cpi->scaled_ref_buf[ref_frame - 1] = NULL;
5516
0
    }
5517
0
  }
5518
0
}
5519
5520
// Increments the ref_count of frame buffers referenced by cpi->scaled_ref_buf
5521
// corresponding to frames in a parallel encode set.
5522
static void increment_scaled_ref_counts_fpmt(BufferPool *buffer_pool,
5523
0
                                             int ref_buffers_used_map) {
5524
0
  for (int i = 0; i < buffer_pool->num_frame_bufs; ++i) {
5525
0
    if (ref_buffers_used_map & (1 << i)) {
5526
0
      ++buffer_pool->frame_bufs[i].ref_count;
5527
0
    }
5528
0
  }
5529
0
}
5530
5531
// Releases cpi->scaled_ref_buf corresponding to frames in a parallel encode
5532
// set.
5533
0
void av1_release_scaled_references_fpmt(AV1_COMP *cpi) {
5534
  // TODO(isbs): only refresh the necessary frames, rather than all of them
5535
0
  for (int i = 0; i < INTER_REFS_PER_FRAME; ++i) {
5536
0
    RefCntBuffer *const buf = cpi->scaled_ref_buf[i];
5537
0
    if (buf != NULL) {
5538
0
      cpi->scaled_ref_buf[i] = NULL;
5539
0
    }
5540
0
  }
5541
0
}
5542
5543
// Decrements the ref_count of frame buffers referenced by cpi->scaled_ref_buf
5544
// corresponding to frames in a parallel encode set.
5545
void av1_decrement_ref_counts_fpmt(BufferPool *buffer_pool,
5546
0
                                   int ref_buffers_used_map) {
5547
0
  for (int i = 0; i < buffer_pool->num_frame_bufs; ++i) {
5548
0
    if (ref_buffers_used_map & (1 << i)) {
5549
0
      --buffer_pool->frame_bufs[i].ref_count;
5550
0
    }
5551
0
  }
5552
0
}
5553
5554
// Initialize parallel frame contexts with screen content decisions.
5555
0
void av1_init_sc_decisions(AV1_PRIMARY *const ppi) {
5556
0
  AV1_COMP *const first_cpi = ppi->cpi;
5557
0
  for (int i = 1; i < ppi->num_fp_contexts; ++i) {
5558
0
    AV1_COMP *cur_cpi = ppi->parallel_cpi[i];
5559
0
    cur_cpi->common.features.allow_screen_content_tools =
5560
0
        first_cpi->common.features.allow_screen_content_tools;
5561
0
    cur_cpi->common.features.allow_intrabc =
5562
0
        first_cpi->common.features.allow_intrabc;
5563
0
    cur_cpi->use_screen_content_tools = first_cpi->use_screen_content_tools;
5564
0
    cur_cpi->is_screen_content_type = first_cpi->is_screen_content_type;
5565
0
  }
5566
0
}
5567
5568
AV1_COMP *av1_get_parallel_frame_enc_data(AV1_PRIMARY *const ppi,
5569
0
                                          AV1_COMP_DATA *const first_cpi_data) {
5570
0
  int cpi_idx = 0;
5571
5572
  // Loop over parallel_cpi to find the cpi that processed the current
5573
  // gf_frame_index ahead of time.
5574
0
  for (int i = 1; i < ppi->num_fp_contexts; i++) {
5575
0
    if (ppi->cpi->gf_frame_index == ppi->parallel_cpi[i]->gf_frame_index) {
5576
0
      cpi_idx = i;
5577
0
      break;
5578
0
    }
5579
0
  }
5580
5581
0
  assert(cpi_idx > 0);
5582
0
  assert(!ppi->parallel_cpi[cpi_idx]->common.show_existing_frame);
5583
5584
  // Release the previously-used frame-buffer.
5585
0
  if (ppi->cpi->common.cur_frame != NULL) {
5586
0
    --ppi->cpi->common.cur_frame->ref_count;
5587
0
    ppi->cpi->common.cur_frame = NULL;
5588
0
  }
5589
5590
  // Swap the appropriate parallel_cpi with the parallel_cpi[0].
5591
0
  ppi->cpi = ppi->parallel_cpi[cpi_idx];
5592
0
  ppi->parallel_cpi[cpi_idx] = ppi->parallel_cpi[0];
5593
0
  ppi->parallel_cpi[0] = ppi->cpi;
5594
5595
  // Copy appropriate parallel_frames_data to local data.
5596
0
  {
5597
0
    AV1_COMP_DATA *data = &ppi->parallel_frames_data[cpi_idx - 1];
5598
0
    assert(data->frame_size > 0);
5599
0
    if (data->frame_size > first_cpi_data->cx_data_sz) {
5600
0
      aom_internal_error(&ppi->error, AOM_CODEC_ERROR,
5601
0
                         "first_cpi_data->cx_data buffer full");
5602
0
    }
5603
5604
0
    first_cpi_data->lib_flags = data->lib_flags;
5605
0
    first_cpi_data->ts_frame_start = data->ts_frame_start;
5606
0
    first_cpi_data->ts_frame_end = data->ts_frame_end;
5607
0
    memcpy(first_cpi_data->cx_data, data->cx_data, data->frame_size);
5608
0
    first_cpi_data->frame_size = data->frame_size;
5609
0
    if (ppi->cpi->common.show_frame) {
5610
0
      first_cpi_data->pop_lookahead = 1;
5611
0
    }
5612
0
  }
5613
5614
0
  return ppi->cpi;
5615
0
}
5616
5617
// Initialises frames belonging to a parallel encode set.
5618
int av1_init_parallel_frame_context(const AV1_COMP_DATA *const first_cpi_data,
5619
                                    AV1_PRIMARY *const ppi,
5620
0
                                    int *ref_buffers_used_map) {
5621
0
  AV1_COMP *const first_cpi = ppi->cpi;
5622
0
  GF_GROUP *const gf_group = &ppi->gf_group;
5623
0
  int gf_index_start = first_cpi->gf_frame_index;
5624
0
  assert(gf_group->frame_parallel_level[gf_index_start] == 1);
5625
0
  int parallel_frame_count = 0;
5626
0
  int cur_frame_num = first_cpi->common.current_frame.frame_number;
5627
0
  int show_frame_count = first_cpi->frame_index_set.show_frame_count;
5628
0
  int frames_since_key = first_cpi->rc.frames_since_key;
5629
0
  int frames_to_key = first_cpi->rc.frames_to_key;
5630
0
  int frames_to_fwd_kf = first_cpi->rc.frames_to_fwd_kf;
5631
0
  int cur_frame_disp = cur_frame_num + gf_group->arf_src_offset[gf_index_start];
5632
0
  const FIRSTPASS_STATS *stats_in = first_cpi->twopass_frame.stats_in;
5633
5634
0
  assert(*ref_buffers_used_map == 0);
5635
5636
  // Release the previously used frame-buffer by a frame_parallel_level 1 frame.
5637
0
  if (first_cpi->common.cur_frame != NULL) {
5638
0
    --first_cpi->common.cur_frame->ref_count;
5639
0
    first_cpi->common.cur_frame = NULL;
5640
0
  }
5641
5642
0
  RefFrameMapPair ref_frame_map_pairs[REF_FRAMES];
5643
0
  RefFrameMapPair first_ref_frame_map_pairs[REF_FRAMES];
5644
0
  init_ref_map_pair(first_cpi, first_ref_frame_map_pairs);
5645
0
  memcpy(ref_frame_map_pairs, first_ref_frame_map_pairs,
5646
0
         sizeof(RefFrameMapPair) * REF_FRAMES);
5647
5648
  // Store the reference refresh index of frame_parallel_level 1 frame in a
5649
  // parallel encode set of lower layer frames.
5650
0
  if (gf_group->update_type[gf_index_start] == INTNL_ARF_UPDATE) {
5651
0
    first_cpi->ref_refresh_index = av1_calc_refresh_idx_for_intnl_arf(
5652
0
        first_cpi, ref_frame_map_pairs, gf_index_start);
5653
0
    assert(first_cpi->ref_refresh_index != INVALID_IDX &&
5654
0
           first_cpi->ref_refresh_index < REF_FRAMES);
5655
0
    first_cpi->refresh_idx_available = true;
5656
    // Update ref_frame_map_pairs.
5657
0
    ref_frame_map_pairs[first_cpi->ref_refresh_index].disp_order =
5658
0
        gf_group->display_idx[gf_index_start];
5659
0
    ref_frame_map_pairs[first_cpi->ref_refresh_index].pyr_level =
5660
0
        gf_group->layer_depth[gf_index_start];
5661
0
  }
5662
5663
  // Set do_frame_data_update flag as false for frame_parallel_level 1 frame.
5664
0
  first_cpi->do_frame_data_update = false;
5665
0
  if (gf_group->arf_src_offset[gf_index_start] == 0) {
5666
0
    first_cpi->time_stamps.prev_ts_start = ppi->ts_start_last_show_frame;
5667
0
    first_cpi->time_stamps.prev_ts_end = ppi->ts_end_last_show_frame;
5668
0
  }
5669
5670
0
  av1_get_ref_frames(first_ref_frame_map_pairs, cur_frame_disp, first_cpi,
5671
0
                     gf_index_start, 1, first_cpi->common.remapped_ref_idx);
5672
5673
0
  scale_references_fpmt(first_cpi, ref_buffers_used_map);
5674
0
  parallel_frame_count++;
5675
5676
  // Iterate through the GF_GROUP to find the remaining frame_parallel_level 2
5677
  // frames which are part of the current parallel encode set and initialize the
5678
  // required cpi elements.
5679
0
  for (int i = gf_index_start + 1; i < gf_group->size; i++) {
5680
    // Update frame counters if previous frame was show frame or show existing
5681
    // frame.
5682
0
    if (gf_group->arf_src_offset[i - 1] == 0) {
5683
0
      cur_frame_num++;
5684
0
      show_frame_count++;
5685
0
      if (frames_to_fwd_kf <= 0)
5686
0
        frames_to_fwd_kf = first_cpi->oxcf.kf_cfg.fwd_kf_dist;
5687
0
      if (frames_to_key) {
5688
0
        frames_since_key++;
5689
0
        frames_to_key--;
5690
0
        frames_to_fwd_kf--;
5691
0
      }
5692
0
      stats_in++;
5693
0
    }
5694
0
    cur_frame_disp = cur_frame_num + gf_group->arf_src_offset[i];
5695
0
    if (gf_group->frame_parallel_level[i] == 2) {
5696
0
      AV1_COMP *cur_cpi = ppi->parallel_cpi[parallel_frame_count];
5697
0
      AV1_COMP_DATA *cur_cpi_data =
5698
0
          &ppi->parallel_frames_data[parallel_frame_count - 1];
5699
0
      cur_cpi->gf_frame_index = i;
5700
0
      cur_cpi->framerate = first_cpi->framerate;
5701
0
      cur_cpi->common.current_frame.frame_number = cur_frame_num;
5702
0
      cur_cpi->common.current_frame.frame_type = gf_group->frame_type[i];
5703
0
      cur_cpi->frame_index_set.show_frame_count = show_frame_count;
5704
0
      cur_cpi->rc.frames_since_key = frames_since_key;
5705
0
      cur_cpi->rc.frames_to_key = frames_to_key;
5706
0
      cur_cpi->rc.frames_to_fwd_kf = frames_to_fwd_kf;
5707
0
      cur_cpi->rc.active_worst_quality = first_cpi->rc.active_worst_quality;
5708
0
      cur_cpi->rc.avg_frame_bandwidth = first_cpi->rc.avg_frame_bandwidth;
5709
0
      cur_cpi->rc.max_frame_bandwidth = first_cpi->rc.max_frame_bandwidth;
5710
0
      cur_cpi->rc.min_frame_bandwidth = first_cpi->rc.min_frame_bandwidth;
5711
0
      cur_cpi->rc.intervals_till_gf_calculate_due =
5712
0
          first_cpi->rc.intervals_till_gf_calculate_due;
5713
0
      cur_cpi->mv_search_params.max_mv_magnitude =
5714
0
          first_cpi->mv_search_params.max_mv_magnitude;
5715
0
      if (gf_group->update_type[cur_cpi->gf_frame_index] == INTNL_ARF_UPDATE) {
5716
0
        cur_cpi->common.lf.mode_ref_delta_enabled = 1;
5717
0
      }
5718
0
      cur_cpi->do_frame_data_update = false;
5719
      // Initialize prev_ts_start and prev_ts_end for show frame(s) and show
5720
      // existing frame(s).
5721
0
      if (gf_group->arf_src_offset[i] == 0) {
5722
        // Choose source of prev frame.
5723
0
        int src_index = gf_group->src_offset[i];
5724
0
        struct lookahead_entry *prev_source = av1_lookahead_peek(
5725
0
            ppi->lookahead, src_index - 1, cur_cpi->compressor_stage);
5726
        // Save timestamps of prev frame.
5727
0
        cur_cpi->time_stamps.prev_ts_start = prev_source->ts_start;
5728
0
        cur_cpi->time_stamps.prev_ts_end = prev_source->ts_end;
5729
0
      }
5730
0
      cur_cpi->time_stamps.first_ts_start =
5731
0
          first_cpi->time_stamps.first_ts_start;
5732
5733
0
      memcpy(cur_cpi->common.ref_frame_map, first_cpi->common.ref_frame_map,
5734
0
             sizeof(first_cpi->common.ref_frame_map));
5735
0
      cur_cpi_data->lib_flags = 0;
5736
0
      cur_cpi_data->timestamp_ratio = first_cpi_data->timestamp_ratio;
5737
0
      cur_cpi_data->flush = first_cpi_data->flush;
5738
0
      cur_cpi_data->frame_size = 0;
5739
0
      if (gf_group->update_type[gf_index_start] == INTNL_ARF_UPDATE) {
5740
        // If the first frame in a parallel encode set is INTNL_ARF_UPDATE
5741
        // frame, initialize lib_flags of frame_parallel_level 2 frame in the
5742
        // set with that of frame_parallel_level 1 frame.
5743
0
        cur_cpi_data->lib_flags = first_cpi_data->lib_flags;
5744
        // Store the reference refresh index of frame_parallel_level 2 frame in
5745
        // a parallel encode set of lower layer frames.
5746
0
        cur_cpi->ref_refresh_index =
5747
0
            av1_calc_refresh_idx_for_intnl_arf(cur_cpi, ref_frame_map_pairs, i);
5748
0
        cur_cpi->refresh_idx_available = true;
5749
        // Skip the reference frame which will be refreshed by
5750
        // frame_parallel_level 1 frame in a parallel encode set of lower layer
5751
        // frames.
5752
0
        cur_cpi->ref_idx_to_skip = first_cpi->ref_refresh_index;
5753
0
      } else {
5754
0
        cur_cpi->ref_idx_to_skip = INVALID_IDX;
5755
0
        cur_cpi->ref_refresh_index = INVALID_IDX;
5756
0
        cur_cpi->refresh_idx_available = false;
5757
0
      }
5758
0
      cur_cpi->twopass_frame.stats_in = stats_in;
5759
5760
0
      av1_get_ref_frames(first_ref_frame_map_pairs, cur_frame_disp, cur_cpi, i,
5761
0
                         1, cur_cpi->common.remapped_ref_idx);
5762
0
      scale_references_fpmt(cur_cpi, ref_buffers_used_map);
5763
0
      parallel_frame_count++;
5764
0
    }
5765
5766
    // Set do_frame_data_update to true for the last frame_parallel_level 2
5767
    // frame in the current parallel encode set.
5768
0
    if (i == (gf_group->size - 1) ||
5769
0
        (gf_group->frame_parallel_level[i + 1] == 0 &&
5770
0
         (gf_group->update_type[i + 1] == ARF_UPDATE ||
5771
0
          gf_group->update_type[i + 1] == INTNL_ARF_UPDATE)) ||
5772
0
        gf_group->frame_parallel_level[i + 1] == 1) {
5773
0
      ppi->parallel_cpi[parallel_frame_count - 1]->do_frame_data_update = true;
5774
0
      break;
5775
0
    }
5776
0
  }
5777
5778
0
  increment_scaled_ref_counts_fpmt(first_cpi->common.buffer_pool,
5779
0
                                   *ref_buffers_used_map);
5780
5781
  // Return the number of frames in the parallel encode set.
5782
0
  return parallel_frame_count;
5783
0
}
5784
5785
0
int av1_get_preview_raw_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *dest) {
5786
0
  AV1_COMMON *cm = &cpi->common;
5787
0
  if (!cm->show_frame) {
5788
0
    return -1;
5789
0
  } else {
5790
0
    int ret;
5791
0
    if (cm->cur_frame != NULL && !cpi->oxcf.algo_cfg.skip_postproc_filtering) {
5792
0
      *dest = cm->cur_frame->buf;
5793
0
      dest->y_width = cm->width;
5794
0
      dest->y_height = cm->height;
5795
0
      dest->uv_width = cm->width >> cm->seq_params->subsampling_x;
5796
0
      dest->uv_height = cm->height >> cm->seq_params->subsampling_y;
5797
0
      ret = 0;
5798
0
    } else {
5799
0
      ret = -1;
5800
0
    }
5801
0
    return ret;
5802
0
  }
5803
0
}
5804
5805
0
int av1_get_last_show_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *frame) {
5806
0
  if (cpi->last_show_frame_buf == NULL ||
5807
0
      cpi->oxcf.algo_cfg.skip_postproc_filtering)
5808
0
    return -1;
5809
5810
0
  *frame = cpi->last_show_frame_buf->buf;
5811
0
  return 0;
5812
0
}
5813
5814
aom_codec_err_t av1_copy_new_frame_enc(AV1_COMMON *cm,
5815
                                       YV12_BUFFER_CONFIG *new_frame,
5816
0
                                       YV12_BUFFER_CONFIG *sd) {
5817
0
  const int num_planes = av1_num_planes(cm);
5818
0
  if (!equal_dimensions_and_border(new_frame, sd))
5819
0
    aom_internal_error(cm->error, AOM_CODEC_ERROR,
5820
0
                       "Incorrect buffer dimensions");
5821
0
  else
5822
0
    aom_yv12_copy_frame(new_frame, sd, num_planes);
5823
5824
0
  return cm->error->error_code;
5825
0
}
5826
5827
int av1_set_internal_size(AV1EncoderConfig *const oxcf,
5828
                          ResizePendingParams *resize_pending_params,
5829
                          AOM_SCALING_MODE horiz_mode,
5830
0
                          AOM_SCALING_MODE vert_mode) {
5831
0
  int hr = 0, hs = 0, vr = 0, vs = 0;
5832
5833
  // Checks for invalid AOM_SCALING_MODE values.
5834
0
  if (horiz_mode > AOME_ONETHREE || vert_mode > AOME_ONETHREE) return -1;
5835
5836
0
  Scale2Ratio(horiz_mode, &hr, &hs);
5837
0
  Scale2Ratio(vert_mode, &vr, &vs);
5838
5839
  // always go to the next whole number
5840
0
  resize_pending_params->width = (hs - 1 + oxcf->frm_dim_cfg.width * hr) / hs;
5841
0
  resize_pending_params->height = (vs - 1 + oxcf->frm_dim_cfg.height * vr) / vs;
5842
5843
0
  if (horiz_mode != AOME_NORMAL || vert_mode != AOME_NORMAL) {
5844
0
    oxcf->resize_cfg.resize_mode = RESIZE_FIXED;
5845
0
    oxcf->algo_cfg.enable_tpl_model = 0;
5846
0
  }
5847
0
  return 0;
5848
0
}
5849
5850
0
int av1_get_quantizer(AV1_COMP *cpi) {
5851
0
  return cpi->common.quant_params.base_qindex;
5852
0
}
5853
5854
int av1_convert_sect5obus_to_annexb(uint8_t *buffer, size_t buffer_size,
5855
0
                                    size_t *frame_size) {
5856
0
  assert(*frame_size <= buffer_size);
5857
0
  size_t output_size = 0;
5858
0
  size_t remaining_size = *frame_size;
5859
0
  uint8_t *buff_ptr = buffer;
5860
5861
  // go through each OBUs
5862
0
  while (remaining_size > 0) {
5863
0
    uint8_t saved_obu_header[2];
5864
0
    uint64_t obu_payload_size;
5865
0
    size_t length_of_payload_size;
5866
0
    size_t length_of_obu_size;
5867
0
    const uint32_t obu_header_size = (buff_ptr[0] >> 2) & 0x1 ? 2 : 1;
5868
0
    size_t obu_bytes_read = obu_header_size;  // bytes read for current obu
5869
5870
    // save the obu header (1 or 2 bytes)
5871
0
    memcpy(saved_obu_header, buff_ptr, obu_header_size);
5872
    // clear the obu_has_size_field
5873
0
    saved_obu_header[0] &= ~0x2;
5874
5875
    // get the payload_size and length of payload_size
5876
0
    if (aom_uleb_decode(buff_ptr + obu_header_size,
5877
0
                        remaining_size - obu_header_size, &obu_payload_size,
5878
0
                        &length_of_payload_size) != 0) {
5879
0
      return AOM_CODEC_ERROR;
5880
0
    }
5881
0
    obu_bytes_read += length_of_payload_size;
5882
5883
    // calculate the length of size of the obu header plus payload
5884
0
    const uint64_t obu_size = obu_header_size + obu_payload_size;
5885
0
    length_of_obu_size = aom_uleb_size_in_bytes(obu_size);
5886
5887
0
    if (length_of_obu_size + obu_header_size >
5888
0
        buffer_size - output_size - (remaining_size - obu_bytes_read)) {
5889
0
      return AOM_CODEC_ERROR;
5890
0
    }
5891
    // move the rest of data to new location
5892
0
    memmove(buff_ptr + length_of_obu_size + obu_header_size,
5893
0
            buff_ptr + obu_bytes_read, remaining_size - obu_bytes_read);
5894
0
    obu_bytes_read += (size_t)obu_payload_size;
5895
5896
    // write the new obu size
5897
0
    size_t coded_obu_size;
5898
0
    if (aom_uleb_encode(obu_size, length_of_obu_size, buff_ptr,
5899
0
                        &coded_obu_size) != 0 ||
5900
0
        coded_obu_size != length_of_obu_size) {
5901
0
      return AOM_CODEC_ERROR;
5902
0
    }
5903
5904
    // write the saved (modified) obu_header following obu size
5905
0
    memcpy(buff_ptr + length_of_obu_size, saved_obu_header, obu_header_size);
5906
5907
0
    remaining_size -= obu_bytes_read;
5908
0
    buff_ptr += length_of_obu_size + (size_t)obu_size;
5909
0
    output_size += length_of_obu_size + (size_t)obu_size;
5910
0
  }
5911
5912
0
  *frame_size = output_size;
5913
0
  return AOM_CODEC_OK;
5914
0
}
5915
5916
static void rtc_set_updates_ref_frame_config(
5917
    ExtRefreshFrameFlagsInfo *const ext_refresh_frame_flags,
5918
0
    RTC_REF *const rtc_ref) {
5919
0
  ext_refresh_frame_flags->update_pending = 1;
5920
0
  ext_refresh_frame_flags->last_frame = rtc_ref->refresh[rtc_ref->ref_idx[0]];
5921
0
  ext_refresh_frame_flags->golden_frame = rtc_ref->refresh[rtc_ref->ref_idx[3]];
5922
0
  ext_refresh_frame_flags->bwd_ref_frame =
5923
0
      rtc_ref->refresh[rtc_ref->ref_idx[4]];
5924
0
  ext_refresh_frame_flags->alt2_ref_frame =
5925
0
      rtc_ref->refresh[rtc_ref->ref_idx[5]];
5926
0
  ext_refresh_frame_flags->alt_ref_frame =
5927
0
      rtc_ref->refresh[rtc_ref->ref_idx[6]];
5928
0
  rtc_ref->non_reference_frame = 1;
5929
0
  for (int i = 0; i < REF_FRAMES; i++) {
5930
0
    if (rtc_ref->refresh[i] == 1) {
5931
0
      rtc_ref->non_reference_frame = 0;
5932
0
      break;
5933
0
    }
5934
0
  }
5935
0
}
5936
5937
0
static int rtc_set_references_external_ref_frame_config(AV1_COMP *cpi) {
5938
  // LAST_FRAME (0), LAST2_FRAME(1), LAST3_FRAME(2), GOLDEN_FRAME(3),
5939
  // BWDREF_FRAME(4), ALTREF2_FRAME(5), ALTREF_FRAME(6).
5940
0
  int ref = AOM_REFFRAME_ALL;
5941
0
  for (int i = 0; i < INTER_REFS_PER_FRAME; i++) {
5942
0
    if (!cpi->ppi->rtc_ref.reference[i]) ref ^= (1 << i);
5943
0
  }
5944
0
  return ref;
5945
0
}
5946
5947
0
void av1_apply_encoding_flags(AV1_COMP *cpi, aom_enc_frame_flags_t flags) {
5948
  // TODO(yunqingwang): For what references to use, external encoding flags
5949
  // should be consistent with internal reference frame selection. Need to
5950
  // ensure that there is not conflict between the two. In AV1 encoder, the
5951
  // priority rank for 7 reference frames are: LAST, ALTREF, LAST2, LAST3,
5952
  // GOLDEN, BWDREF, ALTREF2.
5953
5954
0
  ExternalFlags *const ext_flags = &cpi->ext_flags;
5955
0
  ExtRefreshFrameFlagsInfo *const ext_refresh_frame_flags =
5956
0
      &ext_flags->refresh_frame;
5957
0
  ext_flags->ref_frame_flags = AOM_REFFRAME_ALL;
5958
0
  if (flags &
5959
0
      (AOM_EFLAG_NO_REF_LAST | AOM_EFLAG_NO_REF_LAST2 | AOM_EFLAG_NO_REF_LAST3 |
5960
0
       AOM_EFLAG_NO_REF_GF | AOM_EFLAG_NO_REF_ARF | AOM_EFLAG_NO_REF_BWD |
5961
0
       AOM_EFLAG_NO_REF_ARF2)) {
5962
0
    int ref = AOM_REFFRAME_ALL;
5963
5964
0
    if (flags & AOM_EFLAG_NO_REF_LAST) ref ^= AOM_LAST_FLAG;
5965
0
    if (flags & AOM_EFLAG_NO_REF_LAST2) ref ^= AOM_LAST2_FLAG;
5966
0
    if (flags & AOM_EFLAG_NO_REF_LAST3) ref ^= AOM_LAST3_FLAG;
5967
5968
0
    if (flags & AOM_EFLAG_NO_REF_GF) ref ^= AOM_GOLD_FLAG;
5969
5970
0
    if (flags & AOM_EFLAG_NO_REF_ARF) {
5971
0
      ref ^= AOM_ALT_FLAG;
5972
0
      ref ^= AOM_BWD_FLAG;
5973
0
      ref ^= AOM_ALT2_FLAG;
5974
0
    } else {
5975
0
      if (flags & AOM_EFLAG_NO_REF_BWD) ref ^= AOM_BWD_FLAG;
5976
0
      if (flags & AOM_EFLAG_NO_REF_ARF2) ref ^= AOM_ALT2_FLAG;
5977
0
    }
5978
5979
0
    av1_use_as_reference(&ext_flags->ref_frame_flags, ref);
5980
0
  } else {
5981
0
    if (cpi->ppi->rtc_ref.set_ref_frame_config) {
5982
0
      int ref = rtc_set_references_external_ref_frame_config(cpi);
5983
0
      av1_use_as_reference(&ext_flags->ref_frame_flags, ref);
5984
0
    }
5985
0
  }
5986
5987
0
  if (flags &
5988
0
      (AOM_EFLAG_NO_UPD_LAST | AOM_EFLAG_NO_UPD_GF | AOM_EFLAG_NO_UPD_ARF)) {
5989
0
    int upd = AOM_REFFRAME_ALL;
5990
5991
    // Refreshing LAST/LAST2/LAST3 is handled by 1 common flag.
5992
0
    if (flags & AOM_EFLAG_NO_UPD_LAST) upd ^= AOM_LAST_FLAG;
5993
5994
0
    if (flags & AOM_EFLAG_NO_UPD_GF) upd ^= AOM_GOLD_FLAG;
5995
5996
0
    if (flags & AOM_EFLAG_NO_UPD_ARF) {
5997
0
      upd ^= AOM_ALT_FLAG;
5998
0
      upd ^= AOM_BWD_FLAG;
5999
0
      upd ^= AOM_ALT2_FLAG;
6000
0
    }
6001
6002
0
    ext_refresh_frame_flags->last_frame = (upd & AOM_LAST_FLAG) != 0;
6003
0
    ext_refresh_frame_flags->golden_frame = (upd & AOM_GOLD_FLAG) != 0;
6004
0
    ext_refresh_frame_flags->alt_ref_frame = (upd & AOM_ALT_FLAG) != 0;
6005
0
    ext_refresh_frame_flags->bwd_ref_frame = (upd & AOM_BWD_FLAG) != 0;
6006
0
    ext_refresh_frame_flags->alt2_ref_frame = (upd & AOM_ALT2_FLAG) != 0;
6007
0
    ext_refresh_frame_flags->update_pending = 1;
6008
0
  } else {
6009
0
    if (cpi->ppi->rtc_ref.set_ref_frame_config)
6010
0
      rtc_set_updates_ref_frame_config(ext_refresh_frame_flags,
6011
0
                                       &cpi->ppi->rtc_ref);
6012
0
    else
6013
0
      ext_refresh_frame_flags->update_pending = 0;
6014
0
  }
6015
6016
0
  ext_flags->use_ref_frame_mvs = cpi->oxcf.tool_cfg.enable_ref_frame_mvs &
6017
0
                                 ((flags & AOM_EFLAG_NO_REF_FRAME_MVS) == 0);
6018
0
  ext_flags->use_error_resilient = cpi->oxcf.tool_cfg.error_resilient_mode |
6019
0
                                   ((flags & AOM_EFLAG_ERROR_RESILIENT) != 0);
6020
0
  ext_flags->use_s_frame =
6021
0
      cpi->oxcf.kf_cfg.enable_sframe | ((flags & AOM_EFLAG_SET_S_FRAME) != 0);
6022
0
  ext_flags->use_primary_ref_none =
6023
0
      (flags & AOM_EFLAG_SET_PRIMARY_REF_NONE) != 0;
6024
6025
0
  if (flags & AOM_EFLAG_NO_UPD_ENTROPY) {
6026
0
    update_entropy(&ext_flags->refresh_frame_context,
6027
0
                   &ext_flags->refresh_frame_context_pending, 0);
6028
0
  }
6029
0
}
6030
6031
0
aom_fixed_buf_t *av1_get_global_headers(AV1_PRIMARY *ppi) {
6032
0
  if (!ppi) return NULL;
6033
6034
0
  uint8_t header_buf[512] = { 0 };
6035
0
  const uint32_t sequence_header_size = av1_write_sequence_header_obu(
6036
0
      &ppi->seq_params, &header_buf[0], sizeof(header_buf));
6037
0
  assert(sequence_header_size <= sizeof(header_buf));
6038
0
  if (sequence_header_size == 0) return NULL;
6039
6040
0
  const size_t obu_header_size = 1;
6041
0
  const size_t size_field_size = aom_uleb_size_in_bytes(sequence_header_size);
6042
0
  const size_t payload_offset = obu_header_size + size_field_size;
6043
6044
0
  if (payload_offset + sequence_header_size > sizeof(header_buf)) return NULL;
6045
0
  memmove(&header_buf[payload_offset], &header_buf[0], sequence_header_size);
6046
6047
0
  if (av1_write_obu_header(&ppi->level_params, &ppi->cpi->frame_header_count,
6048
0
                           OBU_SEQUENCE_HEADER,
6049
0
                           ppi->seq_params.has_nonzero_operating_point_idc,
6050
0
                           /*is_layer_specific_obu=*/false, 0,
6051
0
                           &header_buf[0]) != obu_header_size) {
6052
0
    return NULL;
6053
0
  }
6054
6055
0
  size_t coded_size_field_size = 0;
6056
0
  if (aom_uleb_encode(sequence_header_size, size_field_size,
6057
0
                      &header_buf[obu_header_size],
6058
0
                      &coded_size_field_size) != 0) {
6059
0
    return NULL;
6060
0
  }
6061
0
  assert(coded_size_field_size == size_field_size);
6062
6063
0
  aom_fixed_buf_t *global_headers =
6064
0
      (aom_fixed_buf_t *)malloc(sizeof(*global_headers));
6065
0
  if (!global_headers) return NULL;
6066
6067
0
  const size_t global_header_buf_size =
6068
0
      obu_header_size + size_field_size + sequence_header_size;
6069
6070
0
  global_headers->buf = malloc(global_header_buf_size);
6071
0
  if (!global_headers->buf) {
6072
0
    free(global_headers);
6073
0
    return NULL;
6074
0
  }
6075
6076
0
  memcpy(global_headers->buf, &header_buf[0], global_header_buf_size);
6077
0
  global_headers->sz = global_header_buf_size;
6078
0
  return global_headers;
6079
0
}