/src/aom/av1/common/cdef.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | * Copyright (c) 2016, Alliance for Open Media. All rights reserved. |
3 | | * |
4 | | * This source code is subject to the terms of the BSD 2 Clause License and |
5 | | * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
6 | | * was not distributed with this source code in the LICENSE file, you can |
7 | | * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
8 | | * Media Patent License 1.0 was not distributed with this source code in the |
9 | | * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
10 | | */ |
11 | | |
12 | | #include <assert.h> |
13 | | #include <stddef.h> |
14 | | #include <string.h> |
15 | | |
16 | | #include "config/aom_scale_rtcd.h" |
17 | | |
18 | | #include "aom/aom_integer.h" |
19 | | #include "aom_util/aom_pthread.h" |
20 | | #include "av1/common/av1_common_int.h" |
21 | | #include "av1/common/cdef.h" |
22 | | #include "av1/common/cdef_block.h" |
23 | | #include "av1/common/common.h" |
24 | | #include "av1/common/common_data.h" |
25 | | #include "av1/common/enums.h" |
26 | | #include "av1/common/reconinter.h" |
27 | | #include "av1/common/thread_common.h" |
28 | | /* Returns 1 when every mode-info entry under the BLOCK_8X8 footprint at (mi_row, mi_col) has skip_txfm set, else 0. */ |
29 | | static int is_8x8_block_skip(MB_MODE_INFO **grid, int mi_row, int mi_col, |
30 | 2.27M | int mi_stride) { |
31 | 2.27M | MB_MODE_INFO **mbmi = grid + mi_row * mi_stride + mi_col; |
32 | 5.15M | for (int r = 0; r < mi_size_high[BLOCK_8X8]; ++r, mbmi += mi_stride) { |
33 | 9.47M | for (int c = 0; c < mi_size_wide[BLOCK_8X8]; ++c) { |
34 | 6.60M | if (!mbmi[c]->skip_txfm) return 0; |
35 | 6.60M | } |
36 | 3.71M | } |
37 | | |
38 | 1.43M | return 1; |
39 | 2.27M | } |
40 | | /* Records in dlist the (by, bx) index of each non-skip 8x8 block of the area at (mi_row, mi_col); returns the number recorded. */ |
41 | | int av1_cdef_compute_sb_list(const CommonModeInfoParams *const mi_params, |
42 | | int mi_row, int mi_col, cdef_list *dlist, |
43 | 62.4k | BLOCK_SIZE bs) { |
44 | 62.4k | MB_MODE_INFO **grid = mi_params->mi_grid_base; |
45 | 62.4k | int maxc = mi_params->mi_cols - mi_col; |
46 | 62.4k | int maxr = mi_params->mi_rows - mi_row; |
47 | | /* Clamp the scan to what remains of the frame and to MI_SIZE_128X128 or MI_SIZE_64X64 mi units per dimension, depending on bs. */ |
48 | 62.5k | if (bs == BLOCK_128X128 || bs == BLOCK_128X64) |
49 | 0 | maxc = AOMMIN(maxc, MI_SIZE_128X128); |
50 | 62.4k | else |
51 | 62.4k | maxc = AOMMIN(maxc, MI_SIZE_64X64); |
52 | 62.4k | if (bs == BLOCK_128X128 || bs == BLOCK_64X128) |
53 | 0 | maxr = AOMMIN(maxr, MI_SIZE_128X128); |
54 | 62.4k | else |
55 | 62.4k | maxr = AOMMIN(maxr, MI_SIZE_64X64); |
56 | | /* r and c advance two mi units per 8x8 block; shifting by one turns them into 8x8-block indices for dlist. */ |
57 | 62.4k | const int r_step = 2; // mi_size_high[BLOCK_8X8] |
58 | 62.4k | const int c_step = 2; // mi_size_wide[BLOCK_8X8] |
59 | 62.4k | const int r_shift = 1; |
60 | 62.4k | const int c_shift = 1; |
61 | 62.4k | int count = 0; |
62 | 477k | for (int r = 0; r < maxr; r += r_step) { |
63 | 2.69M | for (int c = 0; c < maxc; c += c_step) { |
64 | 2.27M | if (!is_8x8_block_skip(grid, mi_row + r, mi_col + c, |
65 | 2.27M | mi_params->mi_stride)) { |
66 | 845k | dlist[count].by = r >> r_shift; |
67 | 845k | dlist[count].bx = c >> c_shift; |
68 | 845k | count++; |
69 | 845k | } |
70 | 2.27M | } |
71 | 415k | } |
72 | 62.4k | return count; |
73 | 62.4k | } |
74 | | /* Copies a width x height rectangle of 8-bit samples from src (row stride sstride) into 16-bit dst (row stride dstride). */ |
75 | | void cdef_copy_rect8_8bit_to_16bit_c(uint16_t *dst, int dstride, |
76 | | const uint8_t *src, int sstride, int width, |
77 | 59.4k | int height) { |
78 | 1.22M | for (int i = 0; i < height; i++) { |
79 | 53.8M | for (int j = 0; j < width; j++) { |
80 | 52.7M | dst[i * dstride + j] = src[i * sstride + j]; |
81 | 52.7M | } |
82 | 1.16M | } |
83 | 59.4k | } |
84 | | /* 16-bit source variant, compiled only with CONFIG_AV1_HIGHBITDEPTH: copies a width x height rectangle from src to dst. */ |
85 | | #if CONFIG_AV1_HIGHBITDEPTH |
86 | | void cdef_copy_rect8_16bit_to_16bit_c(uint16_t *dst, int dstride, |
87 | | const uint16_t *src, int sstride, |
88 | 137k | int width, int height) { |
89 | 2.26M | for (int i = 0; i < height; i++) { |
90 | 64.6M | for (int j = 0; j < width; j++) { |
91 | 62.5M | dst[i * dstride + j] = src[i * sstride + j]; |
92 | 62.5M | } |
93 | 2.12M | } |
94 | 137k | } |
95 | | #endif // CONFIG_AV1_HIGHBITDEPTH |
96 | | /* Advances 8-bit src to row src_voffset, column src_hoffset (row offset computed in ptrdiff_t) and forwards to cdef_copy_rect8_8bit_to_16bit with hsize, vsize. */ |
97 | | void av1_cdef_copy_sb8_16_lowbd(uint16_t *const dst, int dstride, |
98 | | const uint8_t *src, int src_voffset, |
99 | | int src_hoffset, int sstride, int vsize, |
100 | 60.4k | int hsize) { |
101 | 60.4k | const uint8_t *base = &src[src_voffset * (ptrdiff_t)sstride + src_hoffset]; |
102 | 60.4k | cdef_copy_rect8_8bit_to_16bit(dst, dstride, base, sstride, hsize, vsize); |
103 | 60.4k | } |
104 | | /* High-bitdepth variant: src is converted with CONVERT_TO_SHORTPTR before the (src_voffset, src_hoffset) offset is applied, then forwarded to cdef_copy_rect8_16bit_to_16bit. */ |
105 | | #if CONFIG_AV1_HIGHBITDEPTH |
106 | | void av1_cdef_copy_sb8_16_highbd(uint16_t *const dst, int dstride, |
107 | | const uint8_t *src, int src_voffset, |
108 | | int src_hoffset, int sstride, int vsize, |
109 | 138k | int hsize) { |
110 | 138k | const uint16_t *base = |
111 | 138k | &CONVERT_TO_SHORTPTR(src)[src_voffset * (ptrdiff_t)sstride + src_hoffset]; |
112 | 138k | cdef_copy_rect8_16bit_to_16bit(dst, dstride, base, sstride, hsize, vsize); |
113 | 138k | } |
114 | | #endif // CONFIG_AV1_HIGHBITDEPTH |
115 | | /* Uses the highbd copy when CONFIG_AV1_HIGHBITDEPTH is enabled and cm->seq_params->use_highbitdepth is set; otherwise the lowbd copy (cm is then unused without highbd support). */ |
116 | | void av1_cdef_copy_sb8_16(const AV1_COMMON *const cm, uint16_t *const dst, |
117 | | int dstride, const uint8_t *src, int src_voffset, |
118 | 198k | int src_hoffset, int sstride, int vsize, int hsize) { |
119 | 198k | #if CONFIG_AV1_HIGHBITDEPTH |
120 | 198k | if (cm->seq_params->use_highbitdepth) { |
121 | 137k | av1_cdef_copy_sb8_16_highbd(dst, dstride, src, src_voffset, src_hoffset, |
122 | 137k | sstride, vsize, hsize); |
123 | 137k | return; |
124 | 137k | } |
125 | | #else |
126 | | (void)cm; |
127 | | #endif // CONFIG_AV1_HIGHBITDEPTH |
128 | 60.2k | av1_cdef_copy_sb8_16_lowbd(dst, dstride, src, src_voffset, src_hoffset, |
129 | 60.2k | sstride, vsize, hsize); |
130 | 60.2k | } |
131 | | /* Copies v rows of h 16-bit samples from src (row stride sstride) to dst (row stride dstride). */ |
132 | | static inline void copy_rect(uint16_t *dst, int dstride, const uint16_t *src, |
133 | 277k | int sstride, int v, int h) { |
134 | 6.99M | for (int i = 0; i < v; i++) { |
135 | 63.5M | for (int j = 0; j < h; j++) { |
136 | 56.8M | dst[i * dstride + j] = src[i * sstride + j]; |
137 | 56.8M | } |
138 | 6.71M | } |
139 | 277k | } |
140 | | |
141 | | // Prepares the intermediate input buffer (fb_info->src) for one CDEF filter block. |
142 | | // Inputs: |
143 | | // cm: Pointer to common structure (mi_params and seq_params are read). |
144 | | // fb_info: Pointer to the CDEF block-level parameter structure. |
145 | | // colbuf: Per-plane column buffers; read when cdef_left is set, then rewritten. |
146 | | // cdef_left: Nonzero if the block to the left was filtered. |
147 | | // fbc, fbr: Column and row index of the filter block. |
148 | | // plane: Plane index Y/CB/CR. |
149 | | // Returns: |
150 | | // Nothing; fb_info->src and colbuf[plane] are written. |
151 | | static void cdef_prepare_fb(const AV1_COMMON *const cm, CdefBlockInfo *fb_info, |
152 | | uint16_t **const colbuf, const int cdef_left, |
153 | 68.7k | int fbc, int fbr, int plane) { |
154 | 68.7k | const CommonModeInfoParams *const mi_params = &cm->mi_params; |
155 | 68.7k | uint16_t *src = fb_info->src; |
156 | 68.7k | const int luma_stride = |
157 | 68.7k | ALIGN_POWER_OF_TWO(mi_params->mi_cols << MI_SIZE_LOG2, 4); |
158 | 68.7k | const int nvfb = (mi_params->mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
159 | 68.7k | const int nhfb = (mi_params->mi_cols + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
160 | 68.7k | int cstart = 0; |
161 | 68.7k | if (!cdef_left) cstart = -CDEF_HBORDER; |
162 | 68.7k | int rend, cend; |
163 | 68.7k | const int nhb = |
164 | 68.7k | AOMMIN(MI_SIZE_64X64, mi_params->mi_cols - MI_SIZE_64X64 * fbc); |
165 | 68.7k | const int nvb = |
166 | 68.7k | AOMMIN(MI_SIZE_64X64, mi_params->mi_rows - MI_SIZE_64X64 * fbr); |
167 | 68.7k | const int hsize = nhb << fb_info->mi_wide_l2; |
168 | 68.7k | const int vsize = nvb << fb_info->mi_high_l2; |
169 | 68.7k | const uint16_t *top_linebuf = fb_info->top_linebuf[plane]; |
170 | 68.7k | const uint16_t *bot_linebuf = fb_info->bot_linebuf[plane]; |
171 | 68.7k | const int bot_offset = (vsize + CDEF_VBORDER) * CDEF_BSTRIDE; |
172 | 68.7k | const int stride = |
173 | 68.7k | luma_stride >> (plane == AOM_PLANE_Y ? 0 : cm->seq_params->subsampling_x); |
174 | | /* The copied width extends CDEF_HBORDER past the block only when this is not the last filter block column. */ |
175 | 68.7k | if (fbc == nhfb - 1) |
176 | 50.8k | cend = hsize; |
177 | 17.8k | else |
178 | 17.8k | cend = hsize + CDEF_HBORDER; |
179 | | /* Likewise rend extends CDEF_VBORDER past the block only when this is not the last filter block row. */ |
180 | 68.7k | if (fbr == nvfb - 1) |
181 | 21.1k | rend = vsize; |
182 | 47.6k | else |
183 | 47.6k | rend = vsize + CDEF_VBORDER; |
184 | | |
185 | | /* Copy in the pixels we need from the current superblock for |
186 | | deringing.*/ |
187 | 68.7k | av1_cdef_copy_sb8_16( |
188 | 68.7k | cm, &src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER + cstart], |
189 | 68.7k | CDEF_BSTRIDE, fb_info->dst, fb_info->roffset, fb_info->coffset + cstart, |
190 | 68.7k | fb_info->dst_stride, vsize, cend - cstart); |
191 | | |
192 | | /* Copy in the pixels we need for the current superblock from the bottom buffer, or fill with CDEF_VERY_LARGE where the branches below do not copy. */ |
193 | 68.7k | if (fbr < nvfb - 1) { |
194 | 47.7k | copy_rect(&src[bot_offset + CDEF_HBORDER], CDEF_BSTRIDE, |
195 | 47.7k | &bot_linebuf[fb_info->coffset], stride, CDEF_VBORDER, hsize); |
196 | 47.7k | } else { |
197 | 20.9k | fill_rect(&src[bot_offset + CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER, |
198 | 20.9k | hsize, CDEF_VERY_LARGE); |
199 | 20.9k | } |
200 | 68.7k | if (fbr < nvfb - 1 && fbc > 0) { |
201 | 10.6k | copy_rect(&src[bot_offset], CDEF_BSTRIDE, |
202 | 10.6k | &bot_linebuf[fb_info->coffset - CDEF_HBORDER], stride, |
203 | 10.6k | CDEF_VBORDER, CDEF_HBORDER); |
204 | 58.0k | } else { |
205 | 58.0k | fill_rect(&src[bot_offset], CDEF_BSTRIDE, CDEF_VBORDER, CDEF_HBORDER, |
206 | 58.0k | CDEF_VERY_LARGE); |
207 | 58.0k | } |
208 | 68.7k | if (fbr < nvfb - 1 && fbc < nhfb - 1) { |
209 | 10.6k | copy_rect(&src[bot_offset + hsize + CDEF_HBORDER], CDEF_BSTRIDE, |
210 | 10.6k | &bot_linebuf[fb_info->coffset + hsize], stride, CDEF_VBORDER, |
211 | 10.6k | CDEF_HBORDER); |
212 | 58.1k | } else { |
213 | 58.1k | fill_rect(&src[bot_offset + hsize + CDEF_HBORDER], CDEF_BSTRIDE, |
214 | 58.1k | CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE); |
215 | 58.1k | } |
216 | | |
217 | | /* Copy in the pixels we need for the current superblock from the top buffer, or fill with CDEF_VERY_LARGE where the branches below do not copy. */ |
218 | 68.7k | if (fbr > 0) { |
219 | 51.0k | copy_rect(&src[CDEF_HBORDER], CDEF_BSTRIDE, &top_linebuf[fb_info->coffset], |
220 | 51.0k | stride, CDEF_VBORDER, hsize); |
221 | 51.0k | } else { |
222 | 17.6k | fill_rect(&src[CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER, hsize, |
223 | 17.6k | CDEF_VERY_LARGE); |
224 | 17.6k | } |
225 | 68.7k | if (fbr > 0 && fbc > 0) { |
226 | 13.4k | copy_rect(src, CDEF_BSTRIDE, &top_linebuf[fb_info->coffset - CDEF_HBORDER], |
227 | 13.4k | stride, CDEF_VBORDER, CDEF_HBORDER); |
228 | 55.3k | } else { |
229 | 55.3k | fill_rect(src, CDEF_BSTRIDE, CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE); |
230 | 55.3k | } |
231 | 68.7k | if (fbr > 0 && fbc < nhfb - 1) { |
232 | 13.3k | copy_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, |
233 | 13.3k | &top_linebuf[fb_info->coffset + hsize], stride, CDEF_VBORDER, |
234 | 13.3k | CDEF_HBORDER); |
235 | 55.4k | } else { |
236 | 55.4k | fill_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER, |
237 | 55.4k | CDEF_HBORDER, CDEF_VERY_LARGE); |
238 | 55.4k | } |
239 | 68.7k | if (cdef_left) { |
240 | | /* If we deringed the superblock on the left then we need to copy in |
241 | | saved pixels. */ |
242 | 64.4k | copy_rect(src, CDEF_BSTRIDE, colbuf[plane], CDEF_HBORDER, |
243 | 64.4k | rend + CDEF_VBORDER, CDEF_HBORDER); |
244 | 64.4k | } |
245 | | /* Saving pixels in case we need to dering the superblock on the |
246 | | right. */ |
247 | 68.7k | copy_rect(colbuf[plane], CDEF_HBORDER, src + hsize, CDEF_BSTRIDE, |
248 | 68.7k | rend + CDEF_VBORDER, CDEF_HBORDER); |
249 | | /* Border columns at a left or right frame boundary are overwritten with CDEF_VERY_LARGE over the full buffer height. */ |
250 | 68.7k | if (fb_info->frame_boundary[LEFT]) { |
251 | 50.8k | fill_rect(src, CDEF_BSTRIDE, vsize + 2 * CDEF_VBORDER, CDEF_HBORDER, |
252 | 50.8k | CDEF_VERY_LARGE); |
253 | 50.8k | } |
254 | 68.7k | if (fb_info->frame_boundary[RIGHT]) { |
255 | 50.9k | fill_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, |
256 | 50.9k | vsize + 2 * CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE); |
257 | 50.9k | } |
258 | 68.7k | } |
259 | | /* Calls av1_cdef_filter_fb on the prepared buffer. With use_highbitdepth the destination goes in the second argument (via CONVERT_TO_SHORTPTR) and the first is NULL; otherwise the reverse. */ |
260 | | static inline void cdef_filter_fb(CdefBlockInfo *const fb_info, int plane, |
261 | 68.9k | uint8_t use_highbitdepth) { |
262 | 68.9k | ptrdiff_t offset = |
263 | 68.9k | (ptrdiff_t)fb_info->dst_stride * fb_info->roffset + fb_info->coffset; |
264 | 68.9k | if (use_highbitdepth) { |
265 | 40.7k | av1_cdef_filter_fb( |
266 | 40.7k | NULL, CONVERT_TO_SHORTPTR(fb_info->dst + offset), fb_info->dst_stride, |
267 | 40.7k | &fb_info->src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER], |
268 | 40.7k | fb_info->xdec, fb_info->ydec, fb_info->dir, NULL, fb_info->var, plane, |
269 | 40.7k | fb_info->dlist, fb_info->cdef_count, fb_info->level, |
270 | 40.7k | fb_info->sec_strength, fb_info->damping, fb_info->coeff_shift); |
271 | 40.7k | } else { |
272 | 28.1k | av1_cdef_filter_fb( |
273 | 28.1k | fb_info->dst + offset, NULL, fb_info->dst_stride, |
274 | 28.1k | &fb_info->src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER], |
275 | 28.1k | fb_info->xdec, fb_info->ydec, fb_info->dir, NULL, fb_info->var, plane, |
276 | 28.1k | fb_info->dlist, fb_info->cdef_count, fb_info->level, |
277 | 28.1k | fb_info->sec_strength, fb_info->damping, fb_info->coeff_shift); |
278 | 28.1k | } |
279 | 68.9k | } |
280 | | |
281 | | // Initializes the per-plane fields of fb_info for filter block (fbc, fbr): strengths, dst buffer, subsampling and row/column offsets. |
282 | | static inline void cdef_init_fb_col(const MACROBLOCKD *const xd, |
283 | | CdefBlockInfo *const fb_info, int *level, |
284 | | int *sec_strength, int fbc, int fbr, |
285 | 68.5k | int plane) { |
286 | 68.5k | const PLANE_TYPE plane_type = get_plane_type(plane); |
287 | 68.5k | fb_info->level = level[plane_type]; |
288 | 68.5k | fb_info->sec_strength = sec_strength[plane_type]; |
289 | 68.5k | fb_info->dst = xd->plane[plane].dst.buf; |
290 | 68.5k | fb_info->dst_stride = xd->plane[plane].dst.stride; |
291 | | |
292 | 68.5k | fb_info->xdec = xd->plane[plane].subsampling_x; |
293 | 68.5k | fb_info->ydec = xd->plane[plane].subsampling_y; |
294 | 68.5k | fb_info->mi_wide_l2 = MI_SIZE_LOG2 - xd->plane[plane].subsampling_x; |
295 | 68.5k | fb_info->mi_high_l2 = MI_SIZE_LOG2 - xd->plane[plane].subsampling_y; |
296 | 68.5k | fb_info->roffset = MI_SIZE_64X64 * fbr << fb_info->mi_high_l2; |
297 | 68.5k | fb_info->coffset = MI_SIZE_64X64 * fbc << fb_info->mi_wide_l2; |
298 | 68.5k | } |
299 | | /* Filters filter block (fbc, fbr) for every plane that has a nonzero strength and updates cdef_left[] for the next column; zeroes cdef_left[] when nothing is filtered. */ |
300 | | static void cdef_fb_col(const AV1_COMMON *const cm, const MACROBLOCKD *const xd, |
301 | | CdefBlockInfo *const fb_info, uint16_t **const colbuf, |
302 | 63.2k | int *cdef_left, int fbc, int fbr) { |
303 | 63.2k | const CommonModeInfoParams *const mi_params = &cm->mi_params; |
304 | 63.2k | const int mbmi_cdef_strength = |
305 | 63.2k | mi_params |
306 | 63.2k | ->mi_grid_base[MI_SIZE_64X64 * fbr * mi_params->mi_stride + |
307 | 63.2k | MI_SIZE_64X64 * fbc] |
308 | 63.2k | ->cdef_strength; |
309 | 63.2k | const int num_planes = av1_num_planes(cm); |
310 | 63.2k | int is_zero_level[PLANE_TYPES] = { 1, 1 }; |
311 | 63.2k | int level[PLANE_TYPES] = { 0 }; |
312 | 63.2k | int sec_strength[PLANE_TYPES] = { 0 }; |
313 | 63.2k | const CdefInfo *const cdef_info = &cm->cdef_info; |
314 | | /* NOTE(review): mbmi_cdef_strength above already dereferenced this grid entry, so the NULL test below comes too late to guard that read. */ |
315 | 63.2k | if (mi_params->mi_grid_base[MI_SIZE_64X64 * fbr * mi_params->mi_stride + |
316 | 63.2k | MI_SIZE_64X64 * fbc] == NULL || |
317 | 63.2k | mbmi_cdef_strength == -1) { |
318 | 0 | av1_zero_array(cdef_left, num_planes); |
319 | 0 | return; |
320 | 0 | } |
321 | | |
322 | | // Compute level and secondary strength for planes (a secondary strength of 3 is bumped to 4) |
323 | 63.2k | level[PLANE_TYPE_Y] = |
324 | 63.2k | cdef_info->cdef_strengths[mbmi_cdef_strength] / CDEF_SEC_STRENGTHS; |
325 | 63.2k | sec_strength[PLANE_TYPE_Y] = |
326 | 63.2k | cdef_info->cdef_strengths[mbmi_cdef_strength] % CDEF_SEC_STRENGTHS; |
327 | 63.2k | sec_strength[PLANE_TYPE_Y] += sec_strength[PLANE_TYPE_Y] == 3; |
328 | 63.2k | is_zero_level[PLANE_TYPE_Y] = |
329 | 63.2k | (level[PLANE_TYPE_Y] == 0) && (sec_strength[PLANE_TYPE_Y] == 0); |
330 | | |
331 | 63.2k | if (num_planes > 1) { |
332 | 51.1k | level[PLANE_TYPE_UV] = |
333 | 51.1k | cdef_info->cdef_uv_strengths[mbmi_cdef_strength] / CDEF_SEC_STRENGTHS; |
334 | 51.1k | sec_strength[PLANE_TYPE_UV] = |
335 | 51.1k | cdef_info->cdef_uv_strengths[mbmi_cdef_strength] % CDEF_SEC_STRENGTHS; |
336 | 51.1k | sec_strength[PLANE_TYPE_UV] += sec_strength[PLANE_TYPE_UV] == 3; |
337 | 51.1k | is_zero_level[PLANE_TYPE_UV] = |
338 | 51.1k | (level[PLANE_TYPE_UV] == 0) && (sec_strength[PLANE_TYPE_UV] == 0); |
339 | 51.1k | } |
340 | | |
341 | 63.2k | if (is_zero_level[PLANE_TYPE_Y] && is_zero_level[PLANE_TYPE_UV]) { |
342 | 1.18k | av1_zero_array(cdef_left, num_planes); |
343 | 1.18k | return; |
344 | 1.18k | } |
345 | | /* Build the list of non-skip 8x8 blocks; an empty list means there is nothing to filter in this filter block. */ |
346 | 62.0k | fb_info->cdef_count = av1_cdef_compute_sb_list(mi_params, fbr * MI_SIZE_64X64, |
347 | 62.0k | fbc * MI_SIZE_64X64, |
348 | 62.0k | fb_info->dlist, BLOCK_64X64); |
349 | 62.0k | if (!fb_info->cdef_count) { |
350 | 32.9k | av1_zero_array(cdef_left, num_planes); |
351 | 32.9k | return; |
352 | 32.9k | } |
353 | | |
354 | 101k | for (int plane = 0; plane < num_planes; plane++) { |
355 | | // Do not skip cdef filtering for luma plane as filter direction is |
356 | | // computed based on luma. |
357 | 72.3k | if (plane && is_zero_level[get_plane_type(plane)]) { |
358 | 3.86k | cdef_left[plane] = 0; |
359 | 3.86k | continue; |
360 | 3.86k | } |
361 | 68.5k | cdef_init_fb_col(xd, fb_info, level, sec_strength, fbc, fbr, plane); |
362 | 68.5k | cdef_prepare_fb(cm, fb_info, colbuf, cdef_left[plane], fbc, fbr, plane); |
363 | 68.5k | cdef_filter_fb(fb_info, plane, cm->seq_params->use_highbitdepth); |
364 | 68.5k | cdef_left[plane] = 1; |
365 | 68.5k | } |
366 | 29.1k | } |
367 | | |
368 | | // Initializes the row-level fields of fb_info for filter block row fbr and fills the per-plane top/bottom line buffers. cdef_sync is unused here. |
369 | | void av1_cdef_init_fb_row(const AV1_COMMON *const cm, |
370 | | const MACROBLOCKD *const xd, |
371 | | CdefBlockInfo *const fb_info, |
372 | | uint16_t **const linebuf, uint16_t *const src, |
373 | 525 | struct AV1CdefSyncData *const cdef_sync, int fbr) { |
374 | 525 | (void)cdef_sync; |
375 | 525 | const int num_planes = av1_num_planes(cm); |
376 | 525 | const int nvfb = (cm->mi_params.mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
377 | 525 | const int luma_stride = |
378 | 525 | ALIGN_POWER_OF_TWO(cm->mi_params.mi_cols << MI_SIZE_LOG2, 4); |
379 | 525 | const bool ping_pong = fbr & 1; |
380 | | // For the current filter block, its top-left corner mi structure (mi_tl) |
381 | | // is first accessed to check whether the top and left boundaries are |
382 | | // frame boundaries. Then bottom-left and top-right mi structures are |
383 | | // accessed to check whether the bottom and right boundaries |
384 | | // (respectively) are frame boundaries. |
385 | | // NOTE(review): the code below uses fbr / mi_rows arithmetic, not mi lookups; this text may be stale. |
386 | | // Note that we can't just check the bottom-right mi structure - e.g. if |
387 | | // we're at the right-hand edge of the frame but not the bottom, then |
388 | | // the bottom-right mi is NULL but the bottom-left is not. |
389 | 525 | fb_info->frame_boundary[TOP] = (MI_SIZE_64X64 * fbr == 0) ? 1 : 0; |
390 | 525 | if (fbr != nvfb - 1) |
391 | 265 | fb_info->frame_boundary[BOTTOM] = |
392 | 265 | (MI_SIZE_64X64 * (fbr + 1) == cm->mi_params.mi_rows) ? 1 : 0; |
393 | 260 | else |
394 | 260 | fb_info->frame_boundary[BOTTOM] = 1; |
395 | | |
396 | 525 | fb_info->src = src; |
397 | 525 | fb_info->damping = cm->cdef_info.cdef_damping; |
398 | 525 | fb_info->coeff_shift = AOMMAX(cm->seq_params->bit_depth - 8, 0); |
399 | 525 | av1_zero(fb_info->dir); |
400 | 525 | av1_zero(fb_info->var); |
401 | | /* Per plane: unless this is the last row, save the CDEF_VBORDER rows just above and just below the start of filter block row fbr + 1. */ |
402 | 2.04k | for (int plane = 0; plane < num_planes; plane++) { |
403 | 1.52k | const int mi_high_l2 = MI_SIZE_LOG2 - xd->plane[plane].subsampling_y; |
404 | 1.52k | const int offset = MI_SIZE_64X64 * (fbr + 1) << mi_high_l2; |
405 | 1.52k | const int stride = luma_stride >> xd->plane[plane].subsampling_x; |
406 | | // Ping-pong buffers are maintained for the top linebuf |
407 | | // to avoid the linebuf being overwritten by the consecutive row. |
408 | 1.52k | uint16_t *const top_linebuf = |
409 | 1.52k | &linebuf[plane][ping_pong * CDEF_VBORDER * stride]; |
410 | 1.52k | fb_info->bot_linebuf[plane] = &linebuf[plane][(CDEF_VBORDER << 1) * stride]; |
411 | | |
412 | 1.52k | if (fbr != nvfb - 1) // top line buffer copy |
413 | 795 | av1_cdef_copy_sb8_16(cm, top_linebuf, stride, xd->plane[plane].dst.buf, |
414 | 795 | offset - CDEF_VBORDER, 0, |
415 | 795 | xd->plane[plane].dst.stride, CDEF_VBORDER, stride); |
416 | 1.52k | fb_info->top_linebuf[plane] = |
417 | 1.52k | &linebuf[plane][(!ping_pong) * CDEF_VBORDER * stride]; |
418 | | |
419 | 1.52k | if (fbr != nvfb - 1) // bottom line buffer copy |
420 | 795 | av1_cdef_copy_sb8_16(cm, fb_info->bot_linebuf[plane], stride, |
421 | 795 | xd->plane[plane].dst.buf, offset, 0, |
422 | 795 | xd->plane[plane].dst.stride, CDEF_VBORDER, stride); |
423 | 1.52k | } |
424 | 525 | } |
425 | | /* Filters filter block row fbr: initializes row state through cdef_init_fb_row_fn, then runs cdef_fb_col on each filter block column from left to right. */ |
426 | | void av1_cdef_fb_row(const AV1_COMMON *const cm, MACROBLOCKD *xd, |
427 | | uint16_t **const linebuf, uint16_t **const colbuf, |
428 | | uint16_t *const src, int fbr, |
429 | | cdef_init_fb_row_t cdef_init_fb_row_fn, |
430 | | struct AV1CdefSyncData *const cdef_sync, |
431 | 33.4k | struct aom_internal_error_info *error_info) { |
432 | | // TODO(aomedia:3276): Pass error_info to the low-level functions as required |
433 | | // in future to handle error propagation. |
434 | 33.4k | (void)error_info; |
435 | 33.4k | CdefBlockInfo fb_info; |
436 | 33.4k | int cdef_left[MAX_MB_PLANE] = { 1, 1, 1 }; |
437 | 33.4k | const int nhfb = (cm->mi_params.mi_cols + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
438 | | |
439 | 33.4k | cdef_init_fb_row_fn(cm, xd, &fb_info, linebuf, src, cdef_sync, fbr); |
440 | 33.4k | #if CONFIG_MULTITHREAD |
441 | 33.4k | if (cdef_sync && cm->cdef_info.allocated_num_workers > 1) { |
442 | 32.9k | pthread_mutex_lock(cdef_sync->mutex_); |
443 | 32.9k | const bool cdef_mt_exit = cdef_sync->cdef_mt_exit; |
444 | 32.9k | pthread_mutex_unlock(cdef_sync->mutex_); |
445 | | // Exit in case any worker has encountered an error. |
446 | 32.9k | if (cdef_mt_exit) return; |
447 | 32.9k | } |
448 | 33.4k | #endif |
449 | 96.6k | for (int fbc = 0; fbc < nhfb; fbc++) { |
450 | 63.1k | fb_info.frame_boundary[LEFT] = (MI_SIZE_64X64 * fbc == 0) ? 1 : 0; |
451 | 63.1k | if (fbc != nhfb - 1) |
452 | 30.5k | fb_info.frame_boundary[RIGHT] = |
453 | 30.5k | (MI_SIZE_64X64 * (fbc + 1) == cm->mi_params.mi_cols) ? 1 : 0; |
454 | 32.5k | else |
455 | 32.5k | fb_info.frame_boundary[RIGHT] = 1; |
456 | 63.1k | cdef_fb_col(cm, xd, &fb_info, colbuf, &cdef_left[0], fbc, fbr); |
457 | 63.1k | } |
458 | 33.4k | } |
459 | | |
460 | | // Performs CDEF on the input frame, one filter block row at a time. |
461 | | // Inputs: |
462 | | // frame: Pointer to input frame buffer; set up as the dst planes of xd. |
463 | | // cm: Pointer to common structure. |
464 | | // xd: Pointer to common current coding block structure. |
465 | | // cdef_init_fb_row_fn: Row-initialization callback forwarded to av1_cdef_fb_row. |
466 | | // Returns: nothing. |
467 | | void av1_cdef_frame(YV12_BUFFER_CONFIG *frame, AV1_COMMON *const cm, |
468 | 260 | MACROBLOCKD *xd, cdef_init_fb_row_t cdef_init_fb_row_fn) { |
469 | 260 | const int num_planes = av1_num_planes(cm); |
470 | 260 | const int nvfb = (cm->mi_params.mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
471 | | |
472 | 260 | av1_setup_dst_planes(xd->plane, cm->seq_params->sb_size, frame, 0, 0, 0, |
473 | 260 | num_planes); |
474 | | |
475 | 785 | for (int fbr = 0; fbr < nvfb; fbr++) |
476 | 525 | av1_cdef_fb_row(cm, xd, cm->cdef_info.linebuf, cm->cdef_info.colbuf, |
477 | 525 | cm->cdef_info.srcbuf, fbr, cdef_init_fb_row_fn, NULL, |
478 | 525 | xd->error_info); |
479 | 260 | } |