Coverage Report

Created: 2025-06-22 08:04

/src/aom/av1/encoder/encoder_utils.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright (c) 2020, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#include <string.h>
13
14
#include "aom/aomcx.h"
15
16
#include "av1/common/av1_common_int.h"
17
#include "av1/encoder/bitstream.h"
18
#include "av1/encoder/encodeframe.h"
19
#include "av1/encoder/encoder.h"
20
#include "av1/encoder/encoder_alloc.h"
21
#include "av1/encoder/encodetxb.h"
22
#include "av1/encoder/encoder_utils.h"
23
#include "av1/encoder/grain_test_vectors.h"
24
#include "av1/encoder/mv_prec.h"
25
#include "av1/encoder/rc_utils.h"
26
#include "av1/encoder/rdopt.h"
27
#include "av1/encoder/segmentation.h"
28
#include "av1/encoder/superres_scale.h"
29
#include "av1/encoder/tpl_model.h"
30
#include "av1/encoder/var_based_part.h"
31
32
#if CONFIG_TUNE_VMAF
33
#include "av1/encoder/tune_vmaf.h"
34
#endif
35
36
0
#define MIN_BOOST_COMBINE_FACTOR 4.0
37
0
#define MAX_BOOST_COMBINE_FACTOR 12.0
38
39
const int default_tx_type_probs[FRAME_UPDATE_TYPES][TX_SIZES_ALL][TX_TYPES] = {
40
  { { 221, 189, 214, 292, 0, 0, 0, 0, 0, 2, 38, 68, 0, 0, 0, 0 },
41
    { 262, 203, 216, 239, 0, 0, 0, 0, 0, 1, 37, 66, 0, 0, 0, 0 },
42
    { 315, 231, 239, 226, 0, 0, 0, 0, 0, 13, 0, 0, 0, 0, 0, 0 },
43
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
44
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
45
    { 222, 188, 214, 287, 0, 0, 0, 0, 0, 2, 50, 61, 0, 0, 0, 0 },
46
    { 256, 182, 205, 282, 0, 0, 0, 0, 0, 2, 21, 76, 0, 0, 0, 0 },
47
    { 281, 214, 217, 222, 0, 0, 0, 0, 0, 1, 48, 41, 0, 0, 0, 0 },
48
    { 263, 194, 225, 225, 0, 0, 0, 0, 0, 2, 15, 100, 0, 0, 0, 0 },
49
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
50
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
51
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
52
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
53
    { 170, 192, 242, 293, 0, 0, 0, 0, 0, 1, 68, 58, 0, 0, 0, 0 },
54
    { 199, 210, 213, 291, 0, 0, 0, 0, 0, 1, 14, 96, 0, 0, 0, 0 },
55
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
56
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
57
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
58
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
59
  { { 106, 69, 107, 278, 9, 15, 20, 45, 49, 23, 23, 88, 36, 74, 25, 57 },
60
    { 105, 72, 81, 98, 45, 49, 47, 50, 56, 72, 30, 81, 33, 95, 27, 83 },
61
    { 211, 105, 109, 120, 57, 62, 43, 49, 52, 58, 42, 116, 0, 0, 0, 0 },
62
    { 1008, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, 0, 0, 0, 0 },
63
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
64
    { 131, 57, 98, 172, 19, 40, 37, 64, 69, 22, 41, 52, 51, 77, 35, 59 },
65
    { 176, 83, 93, 202, 22, 24, 28, 47, 50, 16, 12, 93, 26, 76, 17, 59 },
66
    { 136, 72, 89, 95, 46, 59, 47, 56, 61, 68, 35, 51, 32, 82, 26, 69 },
67
    { 122, 80, 87, 105, 49, 47, 46, 46, 57, 52, 13, 90, 19, 103, 15, 93 },
68
    { 1009, 0, 0, 0, 0, 0, 0, 0, 0, 15, 0, 0, 0, 0, 0, 0 },
69
    { 1011, 0, 0, 0, 0, 0, 0, 0, 0, 13, 0, 0, 0, 0, 0, 0 },
70
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
71
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
72
    { 202, 20, 84, 114, 14, 60, 41, 79, 99, 21, 41, 15, 50, 84, 34, 66 },
73
    { 196, 44, 23, 72, 30, 22, 28, 57, 67, 13, 4, 165, 15, 148, 9, 131 },
74
    { 882, 0, 0, 0, 0, 0, 0, 0, 0, 142, 0, 0, 0, 0, 0, 0 },
75
    { 840, 0, 0, 0, 0, 0, 0, 0, 0, 184, 0, 0, 0, 0, 0, 0 },
76
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
77
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
78
  { { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
79
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
80
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
81
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
82
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
83
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
84
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
85
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
86
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
87
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
88
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
89
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
90
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
91
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
92
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
93
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
94
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
95
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
96
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 } },
97
  { { 213, 110, 141, 269, 12, 16, 15, 19, 21, 11, 38, 68, 22, 29, 16, 24 },
98
    { 216, 119, 128, 143, 38, 41, 26, 30, 31, 30, 42, 70, 23, 36, 19, 32 },
99
    { 367, 149, 154, 154, 38, 35, 17, 21, 21, 10, 22, 36, 0, 0, 0, 0 },
100
    { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
101
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
102
    { 219, 96, 127, 191, 21, 40, 25, 32, 34, 18, 45, 45, 33, 39, 26, 33 },
103
    { 296, 99, 122, 198, 23, 21, 19, 24, 25, 13, 20, 64, 23, 32, 18, 27 },
104
    { 275, 128, 142, 143, 35, 48, 23, 30, 29, 18, 42, 36, 18, 23, 14, 20 },
105
    { 239, 132, 166, 175, 36, 27, 19, 21, 24, 14, 13, 85, 9, 31, 8, 25 },
106
    { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
107
    { 1022, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0 },
108
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
109
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
110
    { 309, 25, 79, 59, 25, 80, 34, 53, 61, 25, 49, 23, 43, 64, 36, 59 },
111
    { 270, 57, 40, 54, 50, 42, 41, 53, 56, 28, 17, 81, 45, 86, 34, 70 },
112
    { 1005, 0, 0, 0, 0, 0, 0, 0, 0, 19, 0, 0, 0, 0, 0, 0 },
113
    { 992, 0, 0, 0, 0, 0, 0, 0, 0, 32, 0, 0, 0, 0, 0, 0 },
114
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
115
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
116
  { { 133, 63, 55, 83, 57, 87, 58, 72, 68, 16, 24, 35, 29, 105, 25, 114 },
117
    { 131, 75, 74, 60, 71, 77, 65, 66, 73, 33, 21, 79, 20, 83, 18, 78 },
118
    { 276, 95, 82, 58, 86, 93, 63, 60, 64, 17, 38, 92, 0, 0, 0, 0 },
119
    { 1006, 0, 0, 0, 0, 0, 0, 0, 0, 18, 0, 0, 0, 0, 0, 0 },
120
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
121
    { 147, 49, 75, 78, 50, 97, 60, 67, 76, 17, 42, 35, 31, 93, 27, 80 },
122
    { 157, 49, 58, 75, 61, 52, 56, 67, 69, 12, 15, 79, 24, 119, 11, 120 },
123
    { 178, 69, 83, 77, 69, 85, 72, 77, 77, 20, 35, 40, 25, 48, 23, 46 },
124
    { 174, 55, 64, 57, 73, 68, 62, 61, 75, 15, 12, 90, 17, 99, 16, 86 },
125
    { 1008, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, 0, 0, 0, 0 },
126
    { 1018, 0, 0, 0, 0, 0, 0, 0, 0, 6, 0, 0, 0, 0, 0, 0 },
127
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
128
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
129
    { 266, 31, 63, 64, 21, 52, 39, 54, 63, 30, 52, 31, 48, 89, 46, 75 },
130
    { 272, 26, 32, 44, 29, 31, 32, 53, 51, 13, 13, 88, 22, 153, 16, 149 },
131
    { 923, 0, 0, 0, 0, 0, 0, 0, 0, 101, 0, 0, 0, 0, 0, 0 },
132
    { 969, 0, 0, 0, 0, 0, 0, 0, 0, 55, 0, 0, 0, 0, 0, 0 },
133
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
134
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
135
  { { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
136
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
137
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
138
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
139
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
140
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
141
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
142
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
143
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
144
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
145
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
146
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
147
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
148
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
149
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
150
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
151
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
152
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 },
153
    { 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64 } },
154
  { { 158, 92, 125, 298, 12, 15, 20, 29, 31, 12, 29, 67, 34, 44, 23, 35 },
155
    { 147, 94, 103, 123, 45, 48, 38, 41, 46, 48, 37, 78, 33, 63, 27, 53 },
156
    { 268, 126, 125, 136, 54, 53, 31, 38, 38, 33, 35, 87, 0, 0, 0, 0 },
157
    { 1018, 0, 0, 0, 0, 0, 0, 0, 0, 6, 0, 0, 0, 0, 0, 0 },
158
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
159
    { 159, 72, 103, 194, 20, 35, 37, 50, 56, 21, 39, 40, 51, 61, 38, 48 },
160
    { 259, 86, 95, 188, 32, 20, 25, 34, 37, 13, 12, 85, 25, 53, 17, 43 },
161
    { 189, 99, 113, 123, 45, 59, 37, 46, 48, 44, 39, 41, 31, 47, 26, 37 },
162
    { 175, 110, 113, 128, 58, 38, 33, 33, 43, 29, 13, 100, 14, 68, 12, 57 },
163
    { 1017, 0, 0, 0, 0, 0, 0, 0, 0, 7, 0, 0, 0, 0, 0, 0 },
164
    { 1019, 0, 0, 0, 0, 0, 0, 0, 0, 5, 0, 0, 0, 0, 0, 0 },
165
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
166
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
167
    { 208, 22, 84, 101, 21, 59, 44, 70, 90, 25, 59, 13, 64, 67, 49, 48 },
168
    { 277, 52, 32, 63, 43, 26, 33, 48, 54, 11, 6, 130, 18, 119, 11, 101 },
169
    { 963, 0, 0, 0, 0, 0, 0, 0, 0, 61, 0, 0, 0, 0, 0, 0 },
170
    { 979, 0, 0, 0, 0, 0, 0, 0, 0, 45, 0, 0, 0, 0, 0, 0 },
171
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
172
    { 1024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } }
173
};
174
175
const int default_obmc_probs[FRAME_UPDATE_TYPES][BLOCK_SIZES_ALL] = {
176
  { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
177
  { 0,  0,  0,  106, 90, 90, 97, 67, 59, 70, 28,
178
    30, 38, 16, 16,  16, 0,  0,  44, 50, 26, 25 },
179
  { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
180
  { 0,  0,  0,  98, 93, 97, 68, 82, 85, 33, 30,
181
    33, 16, 16, 16, 16, 0,  0,  43, 37, 26, 16 },
182
  { 0,  0,  0,  91, 80, 76, 78, 55, 49, 24, 16,
183
    16, 16, 16, 16, 16, 0,  0,  29, 45, 16, 38 },
184
  { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
185
  { 0,  0,  0,  103, 89, 89, 89, 62, 63, 76, 34,
186
    35, 32, 19, 16,  16, 0,  0,  49, 55, 29, 19 }
187
};
188
189
const int default_warped_probs[FRAME_UPDATE_TYPES] = { 64, 64, 64, 64,
190
                                                       64, 64, 64 };
191
192
// TODO(yunqing): the default probs can be trained later from better
193
// performance.
194
const int default_switchable_interp_probs[FRAME_UPDATE_TYPES]
195
                                         [SWITCHABLE_FILTER_CONTEXTS]
196
                                         [SWITCHABLE_FILTERS] = {
197
                                           { { 512, 512, 512 },
198
                                             { 512, 512, 512 },
199
                                             { 512, 512, 512 },
200
                                             { 512, 512, 512 },
201
                                             { 512, 512, 512 },
202
                                             { 512, 512, 512 },
203
                                             { 512, 512, 512 },
204
                                             { 512, 512, 512 },
205
                                             { 512, 512, 512 },
206
                                             { 512, 512, 512 },
207
                                             { 512, 512, 512 },
208
                                             { 512, 512, 512 },
209
                                             { 512, 512, 512 },
210
                                             { 512, 512, 512 },
211
                                             { 512, 512, 512 },
212
                                             { 512, 512, 512 } },
213
                                           { { 512, 512, 512 },
214
                                             { 512, 512, 512 },
215
                                             { 512, 512, 512 },
216
                                             { 512, 512, 512 },
217
                                             { 512, 512, 512 },
218
                                             { 512, 512, 512 },
219
                                             { 512, 512, 512 },
220
                                             { 512, 512, 512 },
221
                                             { 512, 512, 512 },
222
                                             { 512, 512, 512 },
223
                                             { 512, 512, 512 },
224
                                             { 512, 512, 512 },
225
                                             { 512, 512, 512 },
226
                                             { 512, 512, 512 },
227
                                             { 512, 512, 512 },
228
                                             { 512, 512, 512 } },
229
                                           { { 512, 512, 512 },
230
                                             { 512, 512, 512 },
231
                                             { 512, 512, 512 },
232
                                             { 512, 512, 512 },
233
                                             { 512, 512, 512 },
234
                                             { 512, 512, 512 },
235
                                             { 512, 512, 512 },
236
                                             { 512, 512, 512 },
237
                                             { 512, 512, 512 },
238
                                             { 512, 512, 512 },
239
                                             { 512, 512, 512 },
240
                                             { 512, 512, 512 },
241
                                             { 512, 512, 512 },
242
                                             { 512, 512, 512 },
243
                                             { 512, 512, 512 },
244
                                             { 512, 512, 512 } },
245
                                           { { 512, 512, 512 },
246
                                             { 512, 512, 512 },
247
                                             { 512, 512, 512 },
248
                                             { 512, 512, 512 },
249
                                             { 512, 512, 512 },
250
                                             { 512, 512, 512 },
251
                                             { 512, 512, 512 },
252
                                             { 512, 512, 512 },
253
                                             { 512, 512, 512 },
254
                                             { 512, 512, 512 },
255
                                             { 512, 512, 512 },
256
                                             { 512, 512, 512 },
257
                                             { 512, 512, 512 },
258
                                             { 512, 512, 512 },
259
                                             { 512, 512, 512 },
260
                                             { 512, 512, 512 } },
261
                                           { { 512, 512, 512 },
262
                                             { 512, 512, 512 },
263
                                             { 512, 512, 512 },
264
                                             { 512, 512, 512 },
265
                                             { 512, 512, 512 },
266
                                             { 512, 512, 512 },
267
                                             { 512, 512, 512 },
268
                                             { 512, 512, 512 },
269
                                             { 512, 512, 512 },
270
                                             { 512, 512, 512 },
271
                                             { 512, 512, 512 },
272
                                             { 512, 512, 512 },
273
                                             { 512, 512, 512 },
274
                                             { 512, 512, 512 },
275
                                             { 512, 512, 512 },
276
                                             { 512, 512, 512 } },
277
                                           { { 512, 512, 512 },
278
                                             { 512, 512, 512 },
279
                                             { 512, 512, 512 },
280
                                             { 512, 512, 512 },
281
                                             { 512, 512, 512 },
282
                                             { 512, 512, 512 },
283
                                             { 512, 512, 512 },
284
                                             { 512, 512, 512 },
285
                                             { 512, 512, 512 },
286
                                             { 512, 512, 512 },
287
                                             { 512, 512, 512 },
288
                                             { 512, 512, 512 },
289
                                             { 512, 512, 512 },
290
                                             { 512, 512, 512 },
291
                                             { 512, 512, 512 },
292
                                             { 512, 512, 512 } },
293
                                           { { 512, 512, 512 },
294
                                             { 512, 512, 512 },
295
                                             { 512, 512, 512 },
296
                                             { 512, 512, 512 },
297
                                             { 512, 512, 512 },
298
                                             { 512, 512, 512 },
299
                                             { 512, 512, 512 },
300
                                             { 512, 512, 512 },
301
                                             { 512, 512, 512 },
302
                                             { 512, 512, 512 },
303
                                             { 512, 512, 512 },
304
                                             { 512, 512, 512 },
305
                                             { 512, 512, 512 },
306
                                             { 512, 512, 512 },
307
                                             { 512, 512, 512 },
308
                                             { 512, 512, 512 } }
309
                                         };
310
311
0
static void configure_static_seg_features(AV1_COMP *cpi) {
312
0
  AV1_COMMON *const cm = &cpi->common;
313
0
  const RATE_CONTROL *const rc = &cpi->rc;
314
0
  struct segmentation *const seg = &cm->seg;
315
316
0
  double avg_q;
317
#if CONFIG_FPMT_TEST
318
  avg_q = ((cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] > 0) &&
319
           (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE))
320
              ? cpi->ppi->p_rc.temp_avg_q
321
              : cpi->ppi->p_rc.avg_q;
322
#else
323
0
  avg_q = cpi->ppi->p_rc.avg_q;
324
0
#endif
325
326
0
  int high_q = (int)(avg_q > 48.0);
327
0
  int qi_delta;
328
329
  // Disable and clear down for KF
330
0
  if (cm->current_frame.frame_type == KEY_FRAME) {
331
    // Clear down the global segmentation map
332
0
    memset(cpi->enc_seg.map, 0, cm->mi_params.mi_rows * cm->mi_params.mi_cols);
333
0
    seg->update_map = 0;
334
0
    seg->update_data = 0;
335
336
    // Disable segmentation
337
0
    av1_disable_segmentation(seg);
338
339
    // Clear down the segment features.
340
0
    av1_clearall_segfeatures(seg);
341
0
  } else if (cpi->refresh_frame.alt_ref_frame) {
342
    // If this is an alt ref frame
343
    // Clear down the global segmentation map
344
0
    memset(cpi->enc_seg.map, 0, cm->mi_params.mi_rows * cm->mi_params.mi_cols);
345
0
    seg->update_map = 0;
346
0
    seg->update_data = 0;
347
348
    // Disable segmentation and individual segment features by default
349
0
    av1_disable_segmentation(seg);
350
0
    av1_clearall_segfeatures(seg);
351
352
    // If segmentation was enabled set those features needed for the
353
    // arf itself.
354
0
    if (seg->enabled) {
355
0
      seg->update_map = 1;
356
0
      seg->update_data = 1;
357
358
0
      qi_delta = av1_compute_qdelta(rc, avg_q, avg_q * 0.875,
359
0
                                    cm->seq_params->bit_depth);
360
0
      av1_set_segdata(seg, 1, SEG_LVL_ALT_Q, qi_delta - 2);
361
0
      av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_Y_H, -2);
362
0
      av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_Y_V, -2);
363
0
      av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_U, -2);
364
0
      av1_set_segdata(seg, 1, SEG_LVL_ALT_LF_V, -2);
365
366
0
      av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_Y_H);
367
0
      av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_Y_V);
368
0
      av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_U);
369
0
      av1_enable_segfeature(seg, 1, SEG_LVL_ALT_LF_V);
370
371
0
      av1_enable_segfeature(seg, 1, SEG_LVL_ALT_Q);
372
0
    }
373
0
  } else if (seg->enabled) {
374
    // All other frames if segmentation has been enabled
375
376
    // First normal frame in a valid gf or alt ref group
377
0
    if (rc->frames_since_golden == 0) {
378
      // Set up segment features for normal frames in an arf group
379
      // Disable segmentation and clear down features if alt ref
380
      // is not active for this group
381
382
0
      av1_disable_segmentation(seg);
383
384
0
      memset(cpi->enc_seg.map, 0,
385
0
             cm->mi_params.mi_rows * cm->mi_params.mi_cols);
386
387
0
      seg->update_map = 0;
388
0
      seg->update_data = 0;
389
390
0
      av1_clearall_segfeatures(seg);
391
0
    } else if (rc->is_src_frame_alt_ref) {
392
      // Special case where we are coding over the top of a previous
393
      // alt ref frame.
394
      // Segment coding disabled for compred testing
395
396
      // Enable ref frame features for segment 0 as well
397
0
      av1_enable_segfeature(seg, 0, SEG_LVL_REF_FRAME);
398
0
      av1_enable_segfeature(seg, 1, SEG_LVL_REF_FRAME);
399
400
      // All mbs should use ALTREF_FRAME
401
0
      av1_clear_segdata(seg, 0, SEG_LVL_REF_FRAME);
402
0
      av1_set_segdata(seg, 0, SEG_LVL_REF_FRAME, ALTREF_FRAME);
403
0
      av1_clear_segdata(seg, 1, SEG_LVL_REF_FRAME);
404
0
      av1_set_segdata(seg, 1, SEG_LVL_REF_FRAME, ALTREF_FRAME);
405
406
      // Skip all MBs if high Q (0,0 mv and skip coeffs)
407
0
      if (high_q) {
408
0
        av1_enable_segfeature(seg, 0, SEG_LVL_SKIP);
409
0
        av1_enable_segfeature(seg, 1, SEG_LVL_SKIP);
410
0
      }
411
      // Enable data update
412
0
      seg->update_data = 1;
413
0
    } else {
414
      // All other frames.
415
416
      // No updates.. leave things as they are.
417
0
      seg->update_map = 0;
418
0
      seg->update_data = 0;
419
0
    }
420
0
  }
421
0
}
422
423
0
void av1_apply_active_map(AV1_COMP *cpi) {
424
0
  struct segmentation *const seg = &cpi->common.seg;
425
0
  unsigned char *const seg_map = cpi->enc_seg.map;
426
0
  const unsigned char *const active_map = cpi->active_map.map;
427
428
0
  assert(AM_SEGMENT_ID_ACTIVE == CR_SEGMENT_ID_BASE);
429
430
  // Disable the active_maps on intra_only frames or if the
431
  // input map for the current frame has no inactive blocks.
432
0
  if (frame_is_intra_only(&cpi->common) ||
433
0
      cpi->rc.percent_blocks_inactive == 0) {
434
0
    cpi->active_map.enabled = 0;
435
0
    cpi->active_map.update = 1;
436
0
  }
437
438
0
  if (cpi->active_map.update) {
439
0
    if (cpi->active_map.enabled) {
440
0
      const int num_mis =
441
0
          cpi->common.mi_params.mi_rows * cpi->common.mi_params.mi_cols;
442
0
      memcpy(seg_map, active_map, sizeof(active_map[0]) * num_mis);
443
0
      av1_enable_segmentation(seg);
444
0
      av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_SKIP);
445
0
      av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H);
446
0
      av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V);
447
0
      av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U);
448
0
      av1_enable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V);
449
450
0
      av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H,
451
0
                      -MAX_LOOP_FILTER);
452
0
      av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V,
453
0
                      -MAX_LOOP_FILTER);
454
0
      av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U,
455
0
                      -MAX_LOOP_FILTER);
456
0
      av1_set_segdata(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V,
457
0
                      -MAX_LOOP_FILTER);
458
0
    } else {
459
0
      av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_SKIP);
460
0
      av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_H);
461
0
      av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_Y_V);
462
0
      av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_U);
463
0
      av1_disable_segfeature(seg, AM_SEGMENT_ID_INACTIVE, SEG_LVL_ALT_LF_V);
464
0
      if (seg->enabled) {
465
0
        seg->update_data = 1;
466
0
        seg->update_map = 1;
467
0
      }
468
0
    }
469
0
    cpi->active_map.update = 0;
470
0
  }
471
0
}
472
473
#if !CONFIG_REALTIME_ONLY
474
0
static void process_tpl_stats_frame(AV1_COMP *cpi) {
475
0
  const GF_GROUP *const gf_group = &cpi->ppi->gf_group;
476
0
  AV1_COMMON *const cm = &cpi->common;
477
478
0
  assert(IMPLIES(gf_group->size > 0, cpi->gf_frame_index < gf_group->size));
479
480
0
  const int tpl_idx = cpi->gf_frame_index;
481
0
  TplParams *const tpl_data = &cpi->ppi->tpl_data;
482
0
  TplDepFrame *tpl_frame = &tpl_data->tpl_frame[tpl_idx];
483
0
  TplDepStats *tpl_stats = tpl_frame->tpl_stats_ptr;
484
485
0
  if (tpl_frame->is_valid) {
486
0
    int tpl_stride = tpl_frame->stride;
487
0
    double intra_cost_base = 0;
488
0
    double mc_dep_cost_base = 0;
489
0
    double cbcmp_base = 1;
490
0
    const int step = 1 << tpl_data->tpl_stats_block_mis_log2;
491
0
    const int row_step = step;
492
0
    const int col_step_sr =
493
0
        coded_to_superres_mi(step, cm->superres_scale_denominator);
494
0
    const int mi_cols_sr = av1_pixels_to_mi(cm->superres_upscaled_width);
495
496
0
    for (int row = 0; row < cm->mi_params.mi_rows; row += row_step) {
497
0
      for (int col = 0; col < mi_cols_sr; col += col_step_sr) {
498
0
        TplDepStats *this_stats = &tpl_stats[av1_tpl_ptr_pos(
499
0
            row, col, tpl_stride, tpl_data->tpl_stats_block_mis_log2)];
500
0
        double cbcmp = (double)(this_stats->srcrf_dist);
501
0
        int64_t mc_dep_delta =
502
0
            RDCOST(tpl_frame->base_rdmult, this_stats->mc_dep_rate,
503
0
                   this_stats->mc_dep_dist);
504
0
        double dist_scaled = (double)(this_stats->recrf_dist << RDDIV_BITS);
505
0
        intra_cost_base += log(dist_scaled) * cbcmp;
506
0
        mc_dep_cost_base += log(dist_scaled + mc_dep_delta) * cbcmp;
507
0
        cbcmp_base += cbcmp;
508
0
      }
509
0
    }
510
511
0
    if (mc_dep_cost_base == 0) {
512
0
      tpl_frame->is_valid = 0;
513
0
    } else {
514
0
      cpi->rd.r0 = exp((intra_cost_base - mc_dep_cost_base) / cbcmp_base);
515
0
      if (is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
516
0
        if (cpi->ppi->lap_enabled) {
517
0
          double min_boost_factor = sqrt(cpi->ppi->p_rc.baseline_gf_interval);
518
0
          const int gfu_boost = get_gfu_boost_from_r0_lap(
519
0
              min_boost_factor, MAX_GFUBOOST_FACTOR, cpi->rd.r0,
520
0
              cpi->ppi->p_rc.num_stats_required_for_gfu_boost);
521
          // printf("old boost %d new boost %d\n", cpi->rc.gfu_boost,
522
          //        gfu_boost);
523
0
          cpi->ppi->p_rc.gfu_boost = combine_prior_with_tpl_boost(
524
0
              min_boost_factor, MAX_BOOST_COMBINE_FACTOR,
525
0
              cpi->ppi->p_rc.gfu_boost, gfu_boost,
526
0
              cpi->ppi->p_rc.num_stats_used_for_gfu_boost);
527
0
        } else {
528
          // TPL may only look at a subset of frame in the gf group when the
529
          // speed feature 'reduce_num_frames' is on, which affects the r0
530
          // calcuation. Thus, to compensate for TPL not using all frames a
531
          // factor to adjust r0 is used.
532
0
          const int gfu_boost =
533
0
              (int)(200.0 * cpi->ppi->tpl_data.r0_adjust_factor / cpi->rd.r0);
534
0
          cpi->ppi->p_rc.gfu_boost = combine_prior_with_tpl_boost(
535
0
              MIN_BOOST_COMBINE_FACTOR, MAX_BOOST_COMBINE_FACTOR,
536
0
              cpi->ppi->p_rc.gfu_boost, gfu_boost, cpi->rc.frames_to_key);
537
0
        }
538
0
      }
539
0
    }
540
0
  }
541
0
}
542
#endif  // !CONFIG_REALTIME_ONLY
543
544
void av1_set_size_dependent_vars(AV1_COMP *cpi, int *q, int *bottom_index,
545
0
                                 int *top_index) {
546
0
  AV1_COMMON *const cm = &cpi->common;
547
548
  // Setup variables that depend on the dimensions of the frame.
549
0
  av1_set_speed_features_framesize_dependent(cpi, cpi->speed);
550
551
0
#if !CONFIG_REALTIME_ONLY
552
0
  GF_GROUP *gf_group = &cpi->ppi->gf_group;
553
0
  if (cpi->oxcf.algo_cfg.enable_tpl_model &&
554
0
      av1_tpl_stats_ready(&cpi->ppi->tpl_data, cpi->gf_frame_index)) {
555
0
    process_tpl_stats_frame(cpi);
556
0
    av1_tpl_rdmult_setup(cpi);
557
0
  }
558
0
#endif
559
560
  // Decide q and q bounds.
561
0
  *q = av1_rc_pick_q_and_bounds(cpi, cm->width, cm->height, cpi->gf_frame_index,
562
0
                                bottom_index, top_index);
563
564
0
  if (cpi->oxcf.rc_cfg.mode == AOM_CBR && cpi->rc.force_max_q) {
565
0
    *q = cpi->rc.worst_quality;
566
0
    cpi->rc.force_max_q = 0;
567
0
  }
568
569
0
#if !CONFIG_REALTIME_ONLY
570
0
  if (cpi->oxcf.rc_cfg.mode == AOM_Q &&
571
0
      cpi->ppi->tpl_data.tpl_frame[cpi->gf_frame_index].is_valid &&
572
0
      !is_lossless_requested(&cpi->oxcf.rc_cfg)) {
573
0
    const RateControlCfg *const rc_cfg = &cpi->oxcf.rc_cfg;
574
0
    const int tpl_q = av1_tpl_get_q_index(
575
0
        &cpi->ppi->tpl_data, cpi->gf_frame_index, cpi->rc.active_worst_quality,
576
0
        cm->seq_params->bit_depth);
577
0
    *q = clamp(tpl_q, rc_cfg->best_allowed_q, rc_cfg->worst_allowed_q);
578
0
    *top_index = *bottom_index = *q;
579
0
    if (gf_group->update_type[cpi->gf_frame_index] == ARF_UPDATE)
580
0
      cpi->ppi->p_rc.arf_q = *q;
581
0
  }
582
583
0
  if (cpi->oxcf.q_cfg.use_fixed_qp_offsets && cpi->oxcf.rc_cfg.mode == AOM_Q) {
584
0
    if (is_frame_tpl_eligible(gf_group, cpi->gf_frame_index)) {
585
0
      const double qratio_grad =
586
0
          cpi->ppi->p_rc.baseline_gf_interval > 20 ? 0.2 : 0.3;
587
0
      const double qstep_ratio =
588
0
          0.2 +
589
0
          (1.0 - (double)cpi->rc.active_worst_quality / MAXQ) * qratio_grad;
590
0
      *q = av1_get_q_index_from_qstep_ratio(
591
0
          cpi->rc.active_worst_quality, qstep_ratio, cm->seq_params->bit_depth);
592
0
      *top_index = *bottom_index = *q;
593
0
      if (gf_group->update_type[cpi->gf_frame_index] == ARF_UPDATE ||
594
0
          gf_group->update_type[cpi->gf_frame_index] == KF_UPDATE ||
595
0
          gf_group->update_type[cpi->gf_frame_index] == GF_UPDATE)
596
0
        cpi->ppi->p_rc.arf_q = *q;
597
0
    } else if (gf_group->layer_depth[cpi->gf_frame_index] <
598
0
               gf_group->max_layer_depth) {
599
0
      int this_height = gf_group->layer_depth[cpi->gf_frame_index];
600
0
      int arf_q = cpi->ppi->p_rc.arf_q;
601
0
      while (this_height > 1) {
602
0
        arf_q = (arf_q + cpi->oxcf.rc_cfg.cq_level + 1) / 2;
603
0
        --this_height;
604
0
      }
605
0
      *top_index = *bottom_index = *q = arf_q;
606
0
    }
607
0
  }
608
0
#endif
609
610
  // Configure experimental use of segmentation for enhanced coding of
611
  // static regions if indicated.
612
  // Only allowed in the second pass of a two pass encode, as it requires
613
  // lagged coding, and if the relevant speed feature flag is set.
614
0
  if (is_stat_consumption_stage_twopass(cpi) &&
615
0
      cpi->sf.hl_sf.static_segmentation)
616
0
    configure_static_seg_features(cpi);
617
0
}
618
619
#if !CONFIG_REALTIME_ONLY
620
0
static void reset_film_grain_chroma_params(aom_film_grain_t *pars) {
621
0
  pars->num_cr_points = 0;
622
0
  pars->cr_mult = 0;
623
0
  pars->cr_luma_mult = 0;
624
0
  memset(pars->scaling_points_cr, 0, sizeof(pars->scaling_points_cr));
625
0
  memset(pars->ar_coeffs_cr, 0, sizeof(pars->ar_coeffs_cr));
626
0
  pars->num_cb_points = 0;
627
0
  pars->cb_mult = 0;
628
0
  pars->cb_luma_mult = 0;
629
0
  pars->chroma_scaling_from_luma = 0;
630
0
  memset(pars->scaling_points_cb, 0, sizeof(pars->scaling_points_cb));
631
0
  memset(pars->ar_coeffs_cb, 0, sizeof(pars->ar_coeffs_cb));
632
0
}
633
634
void av1_update_film_grain_parameters_seq(struct AV1_PRIMARY *ppi,
635
0
                                          const AV1EncoderConfig *oxcf) {
636
0
  SequenceHeader *const seq_params = &ppi->seq_params;
637
0
  const TuneCfg *const tune_cfg = &oxcf->tune_cfg;
638
639
0
  if (tune_cfg->film_grain_test_vector || tune_cfg->film_grain_table_filename ||
640
0
      tune_cfg->content == AOM_CONTENT_FILM) {
641
0
    seq_params->film_grain_params_present = 1;
642
0
  } else {
643
0
#if CONFIG_DENOISE
644
0
    seq_params->film_grain_params_present = (oxcf->noise_level > 0);
645
#else
646
    seq_params->film_grain_params_present = 0;
647
#endif
648
0
  }
649
0
}
650
651
void av1_update_film_grain_parameters(struct AV1_COMP *cpi,
652
0
                                      const AV1EncoderConfig *oxcf) {
653
0
  AV1_COMMON *const cm = &cpi->common;
654
0
  const TuneCfg *const tune_cfg = &oxcf->tune_cfg;
655
656
0
  if (cpi->film_grain_table) {
657
0
    aom_film_grain_table_free(cpi->film_grain_table);
658
0
    aom_free(cpi->film_grain_table);
659
0
    cpi->film_grain_table = NULL;
660
0
  }
661
662
0
  if (tune_cfg->film_grain_test_vector) {
663
0
    if (cm->current_frame.frame_type == KEY_FRAME) {
664
0
      memcpy(&cm->film_grain_params,
665
0
             film_grain_test_vectors + tune_cfg->film_grain_test_vector - 1,
666
0
             sizeof(cm->film_grain_params));
667
0
      if (oxcf->tool_cfg.enable_monochrome)
668
0
        reset_film_grain_chroma_params(&cm->film_grain_params);
669
0
      cm->film_grain_params.bit_depth = cm->seq_params->bit_depth;
670
0
      if (cm->seq_params->color_range == AOM_CR_FULL_RANGE) {
671
0
        cm->film_grain_params.clip_to_restricted_range = 0;
672
0
      }
673
0
    }
674
0
  } else if (tune_cfg->film_grain_table_filename) {
675
0
    CHECK_MEM_ERROR(cm, cpi->film_grain_table,
676
0
                    aom_calloc(1, sizeof(*cpi->film_grain_table)));
677
678
0
    aom_film_grain_table_read(cpi->film_grain_table,
679
0
                              tune_cfg->film_grain_table_filename, cm->error);
680
0
  } else if (tune_cfg->content == AOM_CONTENT_FILM) {
681
0
    cm->film_grain_params.bit_depth = cm->seq_params->bit_depth;
682
0
    if (oxcf->tool_cfg.enable_monochrome)
683
0
      reset_film_grain_chroma_params(&cm->film_grain_params);
684
0
    if (cm->seq_params->color_range == AOM_CR_FULL_RANGE)
685
0
      cm->film_grain_params.clip_to_restricted_range = 0;
686
0
  } else {
687
0
    memset(&cm->film_grain_params, 0, sizeof(cm->film_grain_params));
688
0
  }
689
0
}
690
#endif  // !CONFIG_REALTIME_ONLY
691
692
void av1_scale_references(AV1_COMP *cpi, const InterpFilter filter,
693
0
                          const int phase, const int use_optimized_scaler) {
694
0
  AV1_COMMON *cm = &cpi->common;
695
0
  const int num_planes = av1_num_planes(cm);
696
0
  MV_REFERENCE_FRAME ref_frame;
697
698
0
  for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
699
    // Need to convert from AOM_REFFRAME to index into ref_mask (subtract 1).
700
0
    if (cpi->ref_frame_flags & av1_ref_frame_flag_list[ref_frame]) {
701
0
      BufferPool *const pool = cm->buffer_pool;
702
0
      const YV12_BUFFER_CONFIG *const ref =
703
0
          get_ref_frame_yv12_buf(cm, ref_frame);
704
705
0
      if (ref == NULL) {
706
0
        cpi->scaled_ref_buf[ref_frame - 1] = NULL;
707
0
        continue;
708
0
      }
709
710
      // For RTC-SVC: if force_zero_mode_spatial_ref is enabled, check if the
711
      // motion search can be skipped for the references: last, golden, altref.
712
      // If so, we can skip scaling that reference.
713
0
      if (cpi->ppi->use_svc && cpi->svc.force_zero_mode_spatial_ref &&
714
0
          cpi->ppi->rtc_ref.set_ref_frame_config) {
715
0
        if (ref_frame == LAST_FRAME && cpi->svc.skip_mvsearch_last) continue;
716
0
        if (ref_frame == GOLDEN_FRAME && cpi->svc.skip_mvsearch_gf) continue;
717
0
        if (ref_frame == ALTREF_FRAME && cpi->svc.skip_mvsearch_altref)
718
0
          continue;
719
0
      }
720
      // For RTC with superres on: golden reference only needs to be scaled
721
      // if it was refreshed in previous frame.
722
0
      if (is_one_pass_rt_params(cpi) &&
723
0
          cpi->oxcf.superres_cfg.enable_superres && ref_frame == GOLDEN_FRAME &&
724
0
          cpi->rc.frame_num_last_gf_refresh <
725
0
              (int)cm->current_frame.frame_number - 1) {
726
0
        continue;
727
0
      }
728
729
0
      if (ref->y_crop_width != cm->width || ref->y_crop_height != cm->height) {
730
        // Replace the reference buffer with a copy having a thicker border,
731
        // if the reference buffer is higher resolution than the current
732
        // frame, and the border is thin.
733
0
        if ((ref->y_crop_width > cm->width ||
734
0
             ref->y_crop_height > cm->height) &&
735
0
            ref->border < AOM_BORDER_IN_PIXELS) {
736
0
          RefCntBuffer *ref_fb = get_ref_frame_buf(cm, ref_frame);
737
0
          if (aom_yv12_realloc_with_new_border(
738
0
                  &ref_fb->buf, AOM_BORDER_IN_PIXELS,
739
0
                  cm->features.byte_alignment, cpi->alloc_pyramid,
740
0
                  num_planes) != 0) {
741
0
            aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
742
0
                               "Failed to allocate frame buffer");
743
0
          }
744
0
        }
745
0
        int force_scaling = 0;
746
0
        RefCntBuffer *new_fb = cpi->scaled_ref_buf[ref_frame - 1];
747
0
        if (new_fb == NULL) {
748
0
          const int new_fb_idx = get_free_fb(cm);
749
0
          if (new_fb_idx == INVALID_IDX) {
750
0
            aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
751
0
                               "Unable to find free frame buffer");
752
0
          }
753
0
          force_scaling = 1;
754
0
          new_fb = &pool->frame_bufs[new_fb_idx];
755
0
        }
756
757
0
        if (force_scaling || new_fb->buf.y_crop_width != cm->width ||
758
0
            new_fb->buf.y_crop_height != cm->height) {
759
0
          if (aom_realloc_frame_buffer(
760
0
                  &new_fb->buf, cm->width, cm->height,
761
0
                  cm->seq_params->subsampling_x, cm->seq_params->subsampling_y,
762
0
                  cm->seq_params->use_highbitdepth, AOM_BORDER_IN_PIXELS,
763
0
                  cm->features.byte_alignment, NULL, NULL, NULL, false, 0)) {
764
0
            if (force_scaling) {
765
              // Release the reference acquired in the get_free_fb() call above.
766
0
              --new_fb->ref_count;
767
0
            }
768
0
            aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
769
0
                               "Failed to allocate frame buffer");
770
0
          }
771
0
          bool has_optimized_scaler = av1_has_optimized_scaler(
772
0
              ref->y_crop_width, ref->y_crop_height, new_fb->buf.y_crop_width,
773
0
              new_fb->buf.y_crop_height);
774
0
          if (num_planes > 1) {
775
0
            has_optimized_scaler =
776
0
                has_optimized_scaler &&
777
0
                av1_has_optimized_scaler(
778
0
                    ref->uv_crop_width, ref->uv_crop_height,
779
0
                    new_fb->buf.uv_crop_width, new_fb->buf.uv_crop_height);
780
0
          }
781
0
#if CONFIG_AV1_HIGHBITDEPTH
782
0
          if (use_optimized_scaler && has_optimized_scaler &&
783
0
              cm->seq_params->bit_depth == AOM_BITS_8) {
784
0
            av1_resize_and_extend_frame(ref, &new_fb->buf, filter, phase,
785
0
                                        num_planes);
786
0
          } else if (!av1_resize_and_extend_frame_nonnormative(
787
0
                         ref, &new_fb->buf, (int)cm->seq_params->bit_depth,
788
0
                         num_planes)) {
789
0
            aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
790
0
                               "Failed to allocate buffer during resize");
791
0
          }
792
#else
793
          if (use_optimized_scaler && has_optimized_scaler) {
794
            av1_resize_and_extend_frame(ref, &new_fb->buf, filter, phase,
795
                                        num_planes);
796
          } else if (!av1_resize_and_extend_frame_nonnormative(
797
                         ref, &new_fb->buf, (int)cm->seq_params->bit_depth,
798
                         num_planes)) {
799
            aom_internal_error(cm->error, AOM_CODEC_MEM_ERROR,
800
                               "Failed to allocate buffer during resize");
801
          }
802
#endif
803
0
          cpi->scaled_ref_buf[ref_frame - 1] = new_fb;
804
0
          alloc_frame_mvs(cm, new_fb);
805
0
        }
806
0
      } else {
807
0
        RefCntBuffer *buf = get_ref_frame_buf(cm, ref_frame);
808
0
        buf->buf.y_crop_width = ref->y_crop_width;
809
0
        buf->buf.y_crop_height = ref->y_crop_height;
810
0
        cpi->scaled_ref_buf[ref_frame - 1] = buf;
811
0
        ++buf->ref_count;
812
0
      }
813
0
    } else {
814
0
      if (!has_no_stats_stage(cpi)) cpi->scaled_ref_buf[ref_frame - 1] = NULL;
815
0
    }
816
0
  }
817
0
}
818
819
BLOCK_SIZE av1_select_sb_size(const AV1EncoderConfig *const oxcf, int width,
820
0
                              int height, int number_spatial_layers) {
821
0
  if (oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_64X64) {
822
0
    return BLOCK_64X64;
823
0
  }
824
0
  if (oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_128X128) {
825
0
    return BLOCK_128X128;
826
0
  }
827
#if CONFIG_TFLITE
828
  if (oxcf->q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED) return BLOCK_64X64;
829
#endif
830
  // Force 64x64 superblock size to increase resolution in perceptual
831
  // AQ and user rating based modes.
832
0
  if (oxcf->mode == ALLINTRA &&
833
0
      (oxcf->q_cfg.deltaq_mode == DELTA_Q_PERCEPTUAL_AI ||
834
0
       oxcf->q_cfg.deltaq_mode == DELTA_Q_USER_RATING_BASED)) {
835
0
    return BLOCK_64X64;
836
0
  }
837
  // Variance Boost only supports 64x64 superblocks.
838
0
  if (oxcf->q_cfg.deltaq_mode == DELTA_Q_VARIANCE_BOOST) {
839
0
    return BLOCK_64X64;
840
0
  }
841
0
  assert(oxcf->tool_cfg.superblock_size == AOM_SUPERBLOCK_SIZE_DYNAMIC);
842
843
0
  if (number_spatial_layers > 1 ||
844
0
      oxcf->resize_cfg.resize_mode != RESIZE_NONE) {
845
    // Use the configured size (top resolution) for spatial layers or
846
    // on resize.
847
0
    return AOMMIN(oxcf->frm_dim_cfg.width, oxcf->frm_dim_cfg.height) > 720
848
0
               ? BLOCK_128X128
849
0
               : BLOCK_64X64;
850
0
  } else if (oxcf->mode == REALTIME) {
851
0
    if (oxcf->tune_cfg.content == AOM_CONTENT_SCREEN) {
852
0
      const TileConfig *const tile_cfg = &oxcf->tile_cfg;
853
0
      const int num_tiles =
854
0
          (1 << tile_cfg->tile_columns) * (1 << tile_cfg->tile_rows);
855
      // For multi-thread encode: if the number of (128x128) superblocks
856
      // per tile is low use 64X64 superblock.
857
0
      if (oxcf->row_mt == 1 && oxcf->max_threads >= 4 &&
858
0
          oxcf->max_threads >= num_tiles && AOMMIN(width, height) >= 720 &&
859
0
          (width * height) / (128 * 128 * num_tiles) < 40)
860
0
        return BLOCK_64X64;
861
0
      else
862
0
        return AOMMIN(width, height) >= 720 ? BLOCK_128X128 : BLOCK_64X64;
863
0
    } else {
864
0
      return AOMMIN(width, height) > 720 ? BLOCK_128X128 : BLOCK_64X64;
865
0
    }
866
0
  }
867
868
  // TODO(any): Possibly could improve this with a heuristic.
869
  // When superres / resize is on, 'cm->width / height' can change between
870
  // calls, so we don't apply this heuristic there.
871
  // Things break if superblock size changes between the first pass and second
872
  // pass encoding, which is why this heuristic is not configured as a
873
  // speed-feature.
874
0
  if (oxcf->superres_cfg.superres_mode == AOM_SUPERRES_NONE &&
875
0
      oxcf->resize_cfg.resize_mode == RESIZE_NONE) {
876
0
    int is_480p_or_lesser = AOMMIN(width, height) <= 480;
877
0
    if (oxcf->speed >= 1 && is_480p_or_lesser) return BLOCK_64X64;
878
879
    // For 1080p and lower resolutions, choose SB size adaptively based on
880
    // resolution and speed level for multi-thread encode.
881
0
    int is_1080p_or_lesser = AOMMIN(width, height) <= 1080;
882
0
    if (!is_480p_or_lesser && is_1080p_or_lesser && oxcf->mode == GOOD &&
883
0
        oxcf->row_mt == 1 && oxcf->max_threads > 1 && oxcf->speed >= 5)
884
0
      return BLOCK_64X64;
885
886
    // For allintra encode, since the maximum partition size is set to 32X32 for
887
    // speed>=6, superblock size is set to 64X64 instead of 128X128. This
888
    // improves the multithread performance due to reduction in top right delay
889
    // and thread sync wastage. Currently, this setting is selectively enabled
890
    // only for speed>=9 and resolutions less than 4k since cost update
891
    // frequency is set to INTERNAL_COST_UPD_OFF in these cases.
892
0
    const int is_4k_or_larger = AOMMIN(width, height) >= 2160;
893
0
    if (oxcf->mode == ALLINTRA && oxcf->speed >= 9 && !is_4k_or_larger)
894
0
      return BLOCK_64X64;
895
0
  }
896
0
  return BLOCK_128X128;
897
0
}
898
899
0
void av1_setup_frame(AV1_COMP *cpi) {
900
0
  AV1_COMMON *const cm = &cpi->common;
901
  // Set up entropy context depending on frame type. The decoder mandates
902
  // the use of the default context, index 0, for keyframes and inter
903
  // frames where the error_resilient_mode or intra_only flag is set. For
904
  // other inter-frames the encoder currently uses only two contexts;
905
  // context 1 for ALTREF frames and context 0 for the others.
906
907
0
  if (frame_is_intra_only(cm) || cm->features.error_resilient_mode ||
908
0
      cpi->ext_flags.use_primary_ref_none) {
909
0
    av1_setup_past_independence(cm);
910
0
  }
911
912
0
  if ((cm->current_frame.frame_type == KEY_FRAME && cm->show_frame) ||
913
0
      frame_is_sframe(cm)) {
914
0
    if (!cpi->ppi->seq_params_locked) {
915
0
      set_sb_size(cm->seq_params,
916
0
                  av1_select_sb_size(&cpi->oxcf, cm->width, cm->height,
917
0
                                     cpi->ppi->number_spatial_layers));
918
0
    }
919
0
  } else {
920
0
    const RefCntBuffer *const primary_ref_buf = get_primary_ref_frame_buf(cm);
921
0
    if (primary_ref_buf == NULL) {
922
0
      av1_setup_past_independence(cm);
923
0
      cm->seg.update_map = 1;
924
0
      cm->seg.update_data = 1;
925
0
    } else {
926
0
      *cm->fc = primary_ref_buf->frame_context;
927
0
    }
928
0
  }
929
930
0
  av1_zero(cm->cur_frame->interp_filter_selected);
931
0
  cm->prev_frame = get_primary_ref_frame_buf(cm);
932
0
  cpi->vaq_refresh = 0;
933
0
}
934
935
#if !CONFIG_REALTIME_ONLY
936
static int get_interp_filter_selected(const AV1_COMMON *const cm,
937
                                      MV_REFERENCE_FRAME ref,
938
0
                                      InterpFilter ifilter) {
939
0
  const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref);
940
0
  if (buf == NULL) return 0;
941
0
  return buf->interp_filter_selected[ifilter];
942
0
}
943
944
0
uint16_t av1_setup_interp_filter_search_mask(AV1_COMP *cpi) {
945
0
  const AV1_COMMON *const cm = &cpi->common;
946
0
  int ref_total[REF_FRAMES] = { 0 };
947
0
  uint16_t mask = ALLOW_ALL_INTERP_FILT_MASK;
948
949
0
  if (cpi->last_frame_type == KEY_FRAME || cpi->refresh_frame.alt_ref_frame)
950
0
    return mask;
951
952
0
  for (MV_REFERENCE_FRAME ref = LAST_FRAME; ref <= ALTREF_FRAME; ++ref) {
953
0
    for (InterpFilter ifilter = EIGHTTAP_REGULAR; ifilter <= MULTITAP_SHARP;
954
0
         ++ifilter) {
955
0
      ref_total[ref] += get_interp_filter_selected(cm, ref, ifilter);
956
0
    }
957
0
  }
958
0
  int ref_total_total = (ref_total[LAST2_FRAME] + ref_total[LAST3_FRAME] +
959
0
                         ref_total[GOLDEN_FRAME] + ref_total[BWDREF_FRAME] +
960
0
                         ref_total[ALTREF2_FRAME] + ref_total[ALTREF_FRAME]);
961
962
0
  for (InterpFilter ifilter = EIGHTTAP_REGULAR; ifilter <= MULTITAP_SHARP;
963
0
       ++ifilter) {
964
0
    int last_score = get_interp_filter_selected(cm, LAST_FRAME, ifilter) * 30;
965
0
    if (ref_total[LAST_FRAME] && last_score <= ref_total[LAST_FRAME]) {
966
0
      int filter_score =
967
0
          get_interp_filter_selected(cm, LAST2_FRAME, ifilter) * 20 +
968
0
          get_interp_filter_selected(cm, LAST3_FRAME, ifilter) * 20 +
969
0
          get_interp_filter_selected(cm, GOLDEN_FRAME, ifilter) * 20 +
970
0
          get_interp_filter_selected(cm, BWDREF_FRAME, ifilter) * 10 +
971
0
          get_interp_filter_selected(cm, ALTREF2_FRAME, ifilter) * 10 +
972
0
          get_interp_filter_selected(cm, ALTREF_FRAME, ifilter) * 10;
973
0
      if (filter_score < ref_total_total) {
974
0
        DUAL_FILTER_TYPE filt_type = ifilter + SWITCHABLE_FILTERS * ifilter;
975
0
        reset_interp_filter_allowed_mask(&mask, filt_type);
976
0
      }
977
0
    }
978
0
  }
979
0
  return mask;
980
0
}
981
982
0
#define STRICT_PSNR_DIFF_THRESH 0.9
983
// Encode key frame with/without screen content tools to determine whether
984
// screen content tools should be enabled for this key frame group or not.
985
// The first encoding is without screen content tools.
986
// The second encoding is with screen content tools.
987
// We compare the psnr and frame size to make the decision.
988
static void screen_content_tools_determination(
989
    AV1_COMP *cpi, const int allow_screen_content_tools_orig_decision,
990
    const int allow_intrabc_orig_decision,
991
    const int use_screen_content_tools_orig_decision,
992
    const int is_screen_content_type_orig_decision, const int pass,
993
0
    int *projected_size_pass, PSNR_STATS *psnr) {
994
0
  AV1_COMMON *const cm = &cpi->common;
995
0
  FeatureFlags *const features = &cm->features;
996
997
#if CONFIG_FPMT_TEST
998
  projected_size_pass[pass] =
999
      ((cpi->ppi->gf_group.frame_parallel_level[cpi->gf_frame_index] > 0) &&
1000
       (cpi->ppi->fpmt_unit_test_cfg == PARALLEL_SIMULATION_ENCODE))
1001
          ? cpi->ppi->p_rc.temp_projected_frame_size
1002
          : cpi->rc.projected_frame_size;
1003
#else
1004
0
  projected_size_pass[pass] = cpi->rc.projected_frame_size;
1005
0
#endif
1006
1007
0
#if CONFIG_AV1_HIGHBITDEPTH
1008
0
  const uint32_t in_bit_depth = cpi->oxcf.input_cfg.input_bit_depth;
1009
0
  const uint32_t bit_depth = cpi->td.mb.e_mbd.bd;
1010
0
  aom_calc_highbd_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr[pass],
1011
0
                       bit_depth, in_bit_depth);
1012
#else
1013
  aom_calc_psnr(cpi->source, &cpi->common.cur_frame->buf, &psnr[pass]);
1014
#endif
1015
0
  if (pass != 1) return;
1016
1017
0
  const double psnr_diff = psnr[1].psnr[0] - psnr[0].psnr[0];
1018
  // Calculate % of palette mode to be chosen in a frame from mode decision.
1019
0
  const double palette_ratio =
1020
0
      (double)cpi->palette_pixel_num / (double)(cm->height * cm->width);
1021
0
  const int psnr_diff_is_large = (psnr_diff > STRICT_PSNR_DIFF_THRESH);
1022
0
  const int ratio_is_large =
1023
0
      ((palette_ratio >= 0.0001) && ((psnr_diff / palette_ratio) > 4));
1024
0
  const int is_sc_encoding_much_better = (psnr_diff_is_large || ratio_is_large);
1025
0
  if (is_sc_encoding_much_better) {
1026
    // Use screen content tools, if we get coding gain.
1027
0
    features->allow_screen_content_tools = 1;
1028
0
    features->allow_intrabc = cpi->intrabc_used;
1029
0
    cpi->use_screen_content_tools = 1;
1030
0
    cpi->is_screen_content_type = 1;
1031
0
  } else {
1032
    // Use original screen content decision.
1033
0
    features->allow_screen_content_tools =
1034
0
        allow_screen_content_tools_orig_decision;
1035
0
    features->allow_intrabc = allow_intrabc_orig_decision;
1036
0
    cpi->use_screen_content_tools = use_screen_content_tools_orig_decision;
1037
0
    cpi->is_screen_content_type = is_screen_content_type_orig_decision;
1038
0
  }
1039
0
}
1040
1041
// Set some encoding parameters to make the encoding process fast.
1042
// A fixed block partition size, and a large q is used.
1043
static void set_encoding_params_for_screen_content(AV1_COMP *cpi,
1044
0
                                                   const int pass) {
1045
0
  AV1_COMMON *const cm = &cpi->common;
1046
0
  if (pass == 0) {
1047
    // In the first pass, encode without screen content tools.
1048
    // Use a high q, and a fixed block size for fast encoding.
1049
0
    cm->features.allow_screen_content_tools = 0;
1050
0
    cm->features.allow_intrabc = 0;
1051
0
    cpi->use_screen_content_tools = 0;
1052
0
    cpi->sf.part_sf.partition_search_type = FIXED_PARTITION;
1053
0
    cpi->sf.part_sf.fixed_partition_size = BLOCK_32X32;
1054
0
    return;
1055
0
  }
1056
0
  assert(pass == 1);
1057
  // In the second pass, encode with screen content tools.
1058
  // Use a high q, and a fixed block size for fast encoding.
1059
0
  cm->features.allow_screen_content_tools = 1;
1060
  // TODO(chengchen): turn intrabc on could lead to data race issue.
1061
  // cm->allow_intrabc = 1;
1062
0
  cpi->use_screen_content_tools = 1;
1063
0
  cpi->sf.part_sf.partition_search_type = FIXED_PARTITION;
1064
0
  cpi->sf.part_sf.fixed_partition_size = BLOCK_32X32;
1065
0
}
1066
1067
// Determines whether to use screen content tools for the key frame group.
1068
// This function modifies "cm->features.allow_screen_content_tools",
1069
// "cm->features.allow_intrabc" and "cpi->use_screen_content_tools".
1070
0
void av1_determine_sc_tools_with_encoding(AV1_COMP *cpi, const int q_orig) {
1071
0
  AV1_COMMON *const cm = &cpi->common;
1072
0
  const AV1EncoderConfig *const oxcf = &cpi->oxcf;
1073
0
  const QuantizationCfg *const q_cfg = &oxcf->q_cfg;
1074
  // Variables to help determine if we should allow screen content tools.
1075
0
  int projected_size_pass[3] = { 0 };
1076
0
  PSNR_STATS psnr[3];
1077
0
  const int is_key_frame = cm->current_frame.frame_type == KEY_FRAME;
1078
0
  const int allow_screen_content_tools_orig_decision =
1079
0
      cm->features.allow_screen_content_tools;
1080
0
  const int allow_intrabc_orig_decision = cm->features.allow_intrabc;
1081
0
  const int use_screen_content_tools_orig_decision =
1082
0
      cpi->use_screen_content_tools;
1083
0
  const int is_screen_content_type_orig_decision = cpi->is_screen_content_type;
1084
  // Turn off the encoding trial for forward key frame and superres.
1085
0
  if (cpi->sf.rt_sf.use_nonrd_pick_mode || oxcf->kf_cfg.fwd_kf_enabled ||
1086
0
      cpi->superres_mode != AOM_SUPERRES_NONE || oxcf->mode == REALTIME ||
1087
0
      use_screen_content_tools_orig_decision || !is_key_frame) {
1088
0
    return;
1089
0
  }
1090
1091
  // TODO(chengchen): multiple encoding for the lossless mode is time consuming.
1092
  // Find a better way to determine whether screen content tools should be used
1093
  // for lossless coding.
1094
  // Use a high q and a fixed partition to do quick encoding.
1095
0
  const int q_for_screen_content_quick_run =
1096
0
      is_lossless_requested(&oxcf->rc_cfg) ? q_orig : AOMMAX(q_orig, 244);
1097
0
  const int partition_search_type_orig = cpi->sf.part_sf.partition_search_type;
1098
0
  const BLOCK_SIZE fixed_partition_block_size_orig =
1099
0
      cpi->sf.part_sf.fixed_partition_size;
1100
1101
  // Setup necessary params for encoding, including frame source, etc.
1102
1103
0
  cpi->source = av1_realloc_and_scale_if_required(
1104
0
      cm, cpi->unscaled_source, &cpi->scaled_source, cm->features.interp_filter,
1105
0
      0, false, false, cpi->oxcf.border_in_pixels, cpi->alloc_pyramid);
1106
0
  if (cpi->unscaled_last_source != NULL) {
1107
0
    cpi->last_source = av1_realloc_and_scale_if_required(
1108
0
        cm, cpi->unscaled_last_source, &cpi->scaled_last_source,
1109
0
        cm->features.interp_filter, 0, false, false, cpi->oxcf.border_in_pixels,
1110
0
        cpi->alloc_pyramid);
1111
0
  }
1112
1113
0
  av1_setup_frame(cpi);
1114
1115
0
  if (cm->seg.enabled) {
1116
0
    if (!cm->seg.update_data && cm->prev_frame) {
1117
0
      segfeatures_copy(&cm->seg, &cm->prev_frame->seg);
1118
0
      cm->seg.enabled = cm->prev_frame->seg.enabled;
1119
0
    } else {
1120
0
      av1_calculate_segdata(&cm->seg);
1121
0
    }
1122
0
  } else {
1123
0
    memset(&cm->seg, 0, sizeof(cm->seg));
1124
0
  }
1125
0
  segfeatures_copy(&cm->cur_frame->seg, &cm->seg);
1126
0
  cm->cur_frame->seg.enabled = cm->seg.enabled;
1127
1128
  // The two encoding passes aim to help determine whether to use screen
1129
  // content tools, with a high q and fixed partition.
1130
0
  for (int pass = 0; pass < 2; ++pass) {
1131
0
    set_encoding_params_for_screen_content(cpi, pass);
1132
0
    av1_set_quantizer(cm, q_cfg->qm_minlevel, q_cfg->qm_maxlevel,
1133
0
                      q_for_screen_content_quick_run,
1134
0
                      q_cfg->enable_chroma_deltaq, q_cfg->enable_hdr_deltaq,
1135
0
                      oxcf->mode == ALLINTRA, oxcf->tune_cfg.tuning);
1136
0
    av1_set_speed_features_qindex_dependent(cpi, oxcf->speed);
1137
0
    av1_init_quantizer(&cpi->enc_quant_dequant_params, &cm->quant_params,
1138
0
                       cm->seq_params->bit_depth);
1139
1140
0
    av1_set_variance_partition_thresholds(cpi, q_for_screen_content_quick_run,
1141
0
                                          0);
1142
    // transform / motion compensation build reconstruction frame
1143
0
    av1_encode_frame(cpi);
1144
    // Screen content decision
1145
0
    screen_content_tools_determination(
1146
0
        cpi, allow_screen_content_tools_orig_decision,
1147
0
        allow_intrabc_orig_decision, use_screen_content_tools_orig_decision,
1148
0
        is_screen_content_type_orig_decision, pass, projected_size_pass, psnr);
1149
0
  }
1150
1151
  // Set partition speed feature back.
1152
0
  cpi->sf.part_sf.partition_search_type = partition_search_type_orig;
1153
0
  cpi->sf.part_sf.fixed_partition_size = fixed_partition_block_size_orig;
1154
1155
  // Free token related info if screen content coding tools are not enabled.
1156
0
  if (!cm->features.allow_screen_content_tools)
1157
0
    free_token_info(&cpi->token_info);
1158
0
}
1159
#endif  // CONFIG_REALTIME_ONLY
1160
1161
static void fix_interp_filter(InterpFilter *const interp_filter,
1162
0
                              const FRAME_COUNTS *const counts) {
1163
0
  if (*interp_filter == SWITCHABLE) {
1164
    // Check to see if only one of the filters is actually used
1165
0
    int count[SWITCHABLE_FILTERS] = { 0 };
1166
0
    int num_filters_used = 0;
1167
0
    for (int i = 0; i < SWITCHABLE_FILTERS; ++i) {
1168
0
      for (int j = 0; j < SWITCHABLE_FILTER_CONTEXTS; ++j)
1169
0
        count[i] += counts->switchable_interp[j][i];
1170
0
      num_filters_used += (count[i] > 0);
1171
0
    }
1172
0
    if (num_filters_used == 1) {
1173
      // Only one filter is used. So set the filter at frame level
1174
0
      for (int i = 0; i < SWITCHABLE_FILTERS; ++i) {
1175
0
        if (count[i]) {
1176
0
          *interp_filter = i;
1177
0
          break;
1178
0
        }
1179
0
      }
1180
0
    }
1181
0
  }
1182
0
}
1183
1184
0
void av1_finalize_encoded_frame(AV1_COMP *const cpi) {
1185
0
  AV1_COMMON *const cm = &cpi->common;
1186
0
  CurrentFrame *const current_frame = &cm->current_frame;
1187
1188
0
  if (!cm->seq_params->reduced_still_picture_hdr &&
1189
0
      encode_show_existing_frame(cm)) {
1190
0
    RefCntBuffer *const frame_to_show =
1191
0
        cm->ref_frame_map[cpi->existing_fb_idx_to_show];
1192
1193
0
    if (frame_to_show == NULL) {
1194
0
      aom_internal_error(cm->error, AOM_CODEC_UNSUP_BITSTREAM,
1195
0
                         "Buffer does not contain a reconstructed frame");
1196
0
    }
1197
0
    assert(frame_to_show->ref_count > 0);
1198
0
    assign_frame_buffer_p(&cm->cur_frame, frame_to_show);
1199
0
  }
1200
1201
0
  if (!encode_show_existing_frame(cm) &&
1202
0
      cm->seq_params->film_grain_params_present &&
1203
0
      (cm->show_frame || cm->showable_frame)) {
1204
    // Copy the current frame's film grain params to the its corresponding
1205
    // RefCntBuffer slot.
1206
0
    cm->cur_frame->film_grain_params = cm->film_grain_params;
1207
1208
    // We must update the parameters if this is not an INTER_FRAME
1209
0
    if (current_frame->frame_type != INTER_FRAME)
1210
0
      cm->cur_frame->film_grain_params.update_parameters = 1;
1211
1212
    // Iterate the random seed for the next frame.
1213
0
    cm->film_grain_params.random_seed += 3381;
1214
0
    if (cm->film_grain_params.random_seed == 0)
1215
0
      cm->film_grain_params.random_seed = 7391;
1216
0
  }
1217
1218
  // Initialise all tiles' contexts from the global frame context
1219
0
  for (int tile_col = 0; tile_col < cm->tiles.cols; tile_col++) {
1220
0
    for (int tile_row = 0; tile_row < cm->tiles.rows; tile_row++) {
1221
0
      const int tile_idx = tile_row * cm->tiles.cols + tile_col;
1222
0
      cpi->tile_data[tile_idx].tctx = *cm->fc;
1223
0
    }
1224
0
  }
1225
1226
0
  if (!frame_is_intra_only(cm))
1227
0
    fix_interp_filter(&cm->features.interp_filter, cpi->td.counts);
1228
0
}
1229
1230
int av1_is_integer_mv(const YV12_BUFFER_CONFIG *cur_picture,
1231
                      const YV12_BUFFER_CONFIG *last_picture,
1232
0
                      ForceIntegerMVInfo *const force_intpel_info) {
1233
  // check use hash ME
1234
0
  int k;
1235
1236
0
  const int block_size = FORCE_INT_MV_DECISION_BLOCK_SIZE;
1237
0
  const double threshold_current = 0.8;
1238
0
  const double threshold_average = 0.95;
1239
0
  const int max_history_size = 32;
1240
0
  int T = 0;  // total block
1241
0
  int C = 0;  // match with collocated block
1242
0
  int S = 0;  // smooth region but not match with collocated block
1243
1244
0
  const int pic_width = cur_picture->y_width;
1245
0
  const int pic_height = cur_picture->y_height;
1246
0
  for (int i = 0; i + block_size <= pic_height; i += block_size) {
1247
0
    for (int j = 0; j + block_size <= pic_width; j += block_size) {
1248
0
      const int x_pos = j;
1249
0
      const int y_pos = i;
1250
0
      int match = 1;
1251
0
      T++;
1252
1253
      // check whether collocated block match with current
1254
0
      uint8_t *p_cur = cur_picture->y_buffer;
1255
0
      uint8_t *p_ref = last_picture->y_buffer;
1256
0
      int stride_cur = cur_picture->y_stride;
1257
0
      int stride_ref = last_picture->y_stride;
1258
0
      p_cur += (y_pos * stride_cur + x_pos);
1259
0
      p_ref += (y_pos * stride_ref + x_pos);
1260
1261
0
      if (cur_picture->flags & YV12_FLAG_HIGHBITDEPTH) {
1262
0
        uint16_t *p16_cur = CONVERT_TO_SHORTPTR(p_cur);
1263
0
        uint16_t *p16_ref = CONVERT_TO_SHORTPTR(p_ref);
1264
0
        for (int tmpY = 0; tmpY < block_size && match; tmpY++) {
1265
0
          for (int tmpX = 0; tmpX < block_size && match; tmpX++) {
1266
0
            if (p16_cur[tmpX] != p16_ref[tmpX]) {
1267
0
              match = 0;
1268
0
            }
1269
0
          }
1270
0
          p16_cur += stride_cur;
1271
0
          p16_ref += stride_ref;
1272
0
        }
1273
0
      } else {
1274
0
        for (int tmpY = 0; tmpY < block_size && match; tmpY++) {
1275
0
          for (int tmpX = 0; tmpX < block_size && match; tmpX++) {
1276
0
            if (p_cur[tmpX] != p_ref[tmpX]) {
1277
0
              match = 0;
1278
0
            }
1279
0
          }
1280
0
          p_cur += stride_cur;
1281
0
          p_ref += stride_ref;
1282
0
        }
1283
0
      }
1284
1285
0
      if (match) {
1286
0
        C++;
1287
0
        continue;
1288
0
      }
1289
1290
0
      if (av1_hash_is_horizontal_perfect(cur_picture, block_size, x_pos,
1291
0
                                         y_pos) ||
1292
0
          av1_hash_is_vertical_perfect(cur_picture, block_size, x_pos, y_pos)) {
1293
0
        S++;
1294
0
        continue;
1295
0
      }
1296
0
    }
1297
0
  }
1298
1299
0
  assert(T > 0);
1300
0
  double cs_rate = ((double)(C + S)) / ((double)(T));
1301
1302
0
  force_intpel_info->cs_rate_array[force_intpel_info->rate_index] = cs_rate;
1303
1304
0
  force_intpel_info->rate_index =
1305
0
      (force_intpel_info->rate_index + 1) % max_history_size;
1306
0
  force_intpel_info->rate_size++;
1307
0
  force_intpel_info->rate_size =
1308
0
      AOMMIN(force_intpel_info->rate_size, max_history_size);
1309
1310
0
  if (cs_rate < threshold_current) {
1311
0
    return 0;
1312
0
  }
1313
1314
0
  if (C == T) {
1315
0
    return 1;
1316
0
  }
1317
1318
0
  double cs_average = 0.0;
1319
1320
0
  for (k = 0; k < force_intpel_info->rate_size; k++) {
1321
0
    cs_average += force_intpel_info->cs_rate_array[k];
1322
0
  }
1323
0
  cs_average /= force_intpel_info->rate_size;
1324
1325
0
  if (cs_average < threshold_average) {
1326
0
    return 0;
1327
0
  }
1328
1329
0
  if ((T - C - S) < 0) {
1330
0
    return 1;
1331
0
  }
1332
1333
0
  if (cs_average > 1.01) {
1334
0
    return 1;
1335
0
  }
1336
1337
0
  return 0;
1338
0
}
1339
1340
0
void av1_set_mb_ssim_rdmult_scaling(AV1_COMP *cpi) {
1341
0
  const CommonModeInfoParams *const mi_params = &cpi->common.mi_params;
1342
0
  const MACROBLOCKD *const xd = &cpi->td.mb.e_mbd;
1343
0
  uint8_t *y_buffer = cpi->source->y_buffer;
1344
0
  const int y_stride = cpi->source->y_stride;
1345
0
  const int block_size = BLOCK_16X16;
1346
1347
0
  const int num_mi_w = mi_size_wide[block_size];
1348
0
  const int num_mi_h = mi_size_high[block_size];
1349
0
  const int num_cols = (mi_params->mi_cols + num_mi_w - 1) / num_mi_w;
1350
0
  const int num_rows = (mi_params->mi_rows + num_mi_h - 1) / num_mi_h;
1351
0
  double log_sum = 0.0;
1352
1353
  // Loop through each 16x16 block.
1354
0
  for (int row = 0; row < num_rows; ++row) {
1355
0
    for (int col = 0; col < num_cols; ++col) {
1356
0
      double var = 0.0, num_of_var = 0.0;
1357
0
      const int index = row * num_cols + col;
1358
1359
      // Loop through each 8x8 block.
1360
0
      for (int mi_row = row * num_mi_h;
1361
0
           mi_row < mi_params->mi_rows && mi_row < (row + 1) * num_mi_h;
1362
0
           mi_row += 2) {
1363
0
        for (int mi_col = col * num_mi_w;
1364
0
             mi_col < mi_params->mi_cols && mi_col < (col + 1) * num_mi_w;
1365
0
             mi_col += 2) {
1366
0
          struct buf_2d buf;
1367
0
          const int row_offset_y = mi_row << 2;
1368
0
          const int col_offset_y = mi_col << 2;
1369
1370
0
          buf.buf = y_buffer + row_offset_y * y_stride + col_offset_y;
1371
0
          buf.stride = y_stride;
1372
1373
0
          var += av1_get_perpixel_variance_facade(cpi, xd, &buf, BLOCK_8X8,
1374
0
                                                  AOM_PLANE_Y);
1375
0
          num_of_var += 1.0;
1376
0
        }
1377
0
      }
1378
0
      var = var / num_of_var;
1379
1380
      // Curve fitting with an exponential model on all 16x16 blocks from the
1381
      // midres dataset.
1382
0
      var = 67.035434 * (1 - exp(-0.0021489 * var)) + 17.492222;
1383
1384
      // As per the above computation, var will be in the range of
1385
      // [17.492222, 84.527656], assuming the data type is of infinite
1386
      // precision. The following assert conservatively checks if var is in the
1387
      // range of [17.0, 85.0] to avoid any issues due to the precision of the
1388
      // relevant data type.
1389
0
      assert(var > 17.0 && var < 85.0);
1390
0
      cpi->ssim_rdmult_scaling_factors[index] = var;
1391
0
      log_sum += log(var);
1392
0
    }
1393
0
  }
1394
1395
  // As log_sum holds the geometric mean, it will be in the range
1396
  // [17.492222, 84.527656]. Hence, in the below loop, the value of
1397
  // cpi->ssim_rdmult_scaling_factors[index] would be in the range
1398
  // [0.2069, 4.8323].
1399
0
  log_sum = exp(log_sum / (double)(num_rows * num_cols));
1400
1401
0
  for (int row = 0; row < num_rows; ++row) {
1402
0
    for (int col = 0; col < num_cols; ++col) {
1403
0
      const int index = row * num_cols + col;
1404
0
      cpi->ssim_rdmult_scaling_factors[index] /= log_sum;
1405
0
    }
1406
0
  }
1407
0
}
1408
1409
// Coding context that only needs to be saved when recode loop includes
1410
// filtering (deblocking, CDEF, superres post-encode upscale and/or loop
1411
// restoraton).
1412
0
static void save_extra_coding_context(AV1_COMP *cpi) {
1413
0
  CODING_CONTEXT *const cc = &cpi->coding_context;
1414
0
  AV1_COMMON *cm = &cpi->common;
1415
1416
0
  cc->lf = cm->lf;
1417
0
  cc->cdef_info = cm->cdef_info;
1418
0
  cc->rc = cpi->rc;
1419
0
  cc->mv_stats = cpi->ppi->mv_stats;
1420
0
}
1421
1422
0
void av1_save_all_coding_context(AV1_COMP *cpi) {
1423
0
  save_extra_coding_context(cpi);
1424
0
  if (!frame_is_intra_only(&cpi->common)) release_scaled_references(cpi);
1425
0
}
1426
1427
#if DUMP_RECON_FRAMES == 1
1428
1429
// NOTE(zoeliu): For debug - Output the filtered reconstructed video.
1430
void av1_dump_filtered_recon_frames(AV1_COMP *cpi) {
1431
  AV1_COMMON *const cm = &cpi->common;
1432
  const CurrentFrame *const current_frame = &cm->current_frame;
1433
  const YV12_BUFFER_CONFIG *recon_buf = &cm->cur_frame->buf;
1434
1435
  if (recon_buf == NULL) {
1436
    printf("Frame %d is not ready.\n", current_frame->frame_number);
1437
    return;
1438
  }
1439
1440
  static const int flag_list[REF_FRAMES] = { 0,
1441
                                             AOM_LAST_FLAG,
1442
                                             AOM_LAST2_FLAG,
1443
                                             AOM_LAST3_FLAG,
1444
                                             AOM_GOLD_FLAG,
1445
                                             AOM_BWD_FLAG,
1446
                                             AOM_ALT2_FLAG,
1447
                                             AOM_ALT_FLAG };
1448
  printf(
1449
      "\n***Frame=%d (frame_offset=%d, show_frame=%d, "
1450
      "show_existing_frame=%d) "
1451
      "[LAST LAST2 LAST3 GOLDEN BWD ALT2 ALT]=[",
1452
      current_frame->frame_number, current_frame->order_hint, cm->show_frame,
1453
      cm->show_existing_frame);
1454
  for (int ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
1455
    const RefCntBuffer *const buf = get_ref_frame_buf(cm, ref_frame);
1456
    const int ref_offset = buf != NULL ? (int)buf->order_hint : -1;
1457
    printf(" %d(%c)", ref_offset,
1458
           (cpi->ref_frame_flags & flag_list[ref_frame]) ? 'Y' : 'N');
1459
  }
1460
  printf(" ]\n");
1461
1462
  if (!cm->show_frame) {
1463
    printf("Frame %d is a no show frame, so no image dump.\n",
1464
           current_frame->frame_number);
1465
    return;
1466
  }
1467
1468
  int h;
1469
  char file_name[256] = "/tmp/enc_filtered_recon.yuv";
1470
  FILE *f_recon = NULL;
1471
1472
  if (current_frame->frame_number == 0) {
1473
    if ((f_recon = fopen(file_name, "wb")) == NULL) {
1474
      printf("Unable to open file %s to write.\n", file_name);
1475
      return;
1476
    }
1477
  } else {
1478
    if ((f_recon = fopen(file_name, "ab")) == NULL) {
1479
      printf("Unable to open file %s to append.\n", file_name);
1480
      return;
1481
    }
1482
  }
1483
  printf(
1484
      "\nFrame=%5d, encode_update_type[%5d]=%1d, frame_offset=%d, "
1485
      "show_frame=%d, show_existing_frame=%d, source_alt_ref_active=%d, "
1486
      "refresh_alt_ref_frame=%d, "
1487
      "y_stride=%4d, uv_stride=%4d, cm->width=%4d, cm->height=%4d\n\n",
1488
      current_frame->frame_number, cpi->gf_frame_index,
1489
      cpi->ppi->gf_group.update_type[cpi->gf_frame_index],
1490
      current_frame->order_hint, cm->show_frame, cm->show_existing_frame,
1491
      cpi->rc.source_alt_ref_active, cpi->refresh_frame.alt_ref_frame,
1492
      recon_buf->y_stride, recon_buf->uv_stride, cm->width, cm->height);
1493
#if 0
1494
  int ref_frame;
1495
  printf("get_ref_frame_map_idx: [");
1496
  for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame)
1497
    printf(" %d", get_ref_frame_map_idx(cm, ref_frame));
1498
  printf(" ]\n");
1499
#endif  // 0
1500
1501
  // --- Y ---
1502
  for (h = 0; h < cm->height; ++h) {
1503
    fwrite(&recon_buf->y_buffer[h * recon_buf->y_stride], 1, cm->width,
1504
           f_recon);
1505
  }
1506
  // --- U ---
1507
  for (h = 0; h < (cm->height >> 1); ++h) {
1508
    fwrite(&recon_buf->u_buffer[h * recon_buf->uv_stride], 1, (cm->width >> 1),
1509
           f_recon);
1510
  }
1511
  // --- V ---
1512
  for (h = 0; h < (cm->height >> 1); ++h) {
1513
    fwrite(&recon_buf->v_buffer[h * recon_buf->uv_stride], 1, (cm->width >> 1),
1514
           f_recon);
1515
  }
1516
1517
  fclose(f_recon);
1518
}
1519
#endif  // DUMP_RECON_FRAMES