Coverage Report

Created: 2025-06-22 08:04

/src/aom/av1/common/cdef.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#include <assert.h>
13
#include <stddef.h>
14
#include <string.h>
15
16
#include "config/aom_scale_rtcd.h"
17
18
#include "aom/aom_integer.h"
19
#include "aom_util/aom_pthread.h"
20
#include "av1/common/av1_common_int.h"
21
#include "av1/common/cdef.h"
22
#include "av1/common/cdef_block.h"
23
#include "av1/common/common.h"
24
#include "av1/common/common_data.h"
25
#include "av1/common/enums.h"
26
#include "av1/common/reconinter.h"
27
#include "av1/common/thread_common.h"
28
29
// Returns 1 when every mode-info entry covered by the 8x8 block whose
// top-left entry sits at (mi_row, mi_col) has skip_txfm set, and 0 as soon as
// one entry without skip_txfm is found.
static int is_8x8_block_skip(MB_MODE_INFO **grid, int mi_row, int mi_col,
                             int mi_stride) {
  const int rows = mi_size_high[BLOCK_8X8];
  const int cols = mi_size_wide[BLOCK_8X8];
  MB_MODE_INFO **const first = grid + mi_row * mi_stride + mi_col;

  for (int r = 0; r < rows; ++r) {
    MB_MODE_INFO **const row = first + r * mi_stride;
    for (int c = 0; c < cols; ++c) {
      if (row[c]->skip_txfm == 0) return 0;
    }
  }
  return 1;
}
40
41
int av1_cdef_compute_sb_list(const CommonModeInfoParams *const mi_params,
42
                             int mi_row, int mi_col, cdef_list *dlist,
43
62.4k
                             BLOCK_SIZE bs) {
44
62.4k
  MB_MODE_INFO **grid = mi_params->mi_grid_base;
45
62.4k
  int maxc = mi_params->mi_cols - mi_col;
46
62.4k
  int maxr = mi_params->mi_rows - mi_row;
47
48
62.5k
  if (bs == BLOCK_128X128 || bs == BLOCK_128X64)
49
0
    maxc = AOMMIN(maxc, MI_SIZE_128X128);
50
62.4k
  else
51
62.4k
    maxc = AOMMIN(maxc, MI_SIZE_64X64);
52
62.4k
  if (bs == BLOCK_128X128 || bs == BLOCK_64X128)
53
0
    maxr = AOMMIN(maxr, MI_SIZE_128X128);
54
62.4k
  else
55
62.4k
    maxr = AOMMIN(maxr, MI_SIZE_64X64);
56
57
62.4k
  const int r_step = 2;  // mi_size_high[BLOCK_8X8]
58
62.4k
  const int c_step = 2;  // mi_size_wide[BLOCK_8X8]
59
62.4k
  const int r_shift = 1;
60
62.4k
  const int c_shift = 1;
61
62.4k
  int count = 0;
62
477k
  for (int r = 0; r < maxr; r += r_step) {
63
2.69M
    for (int c = 0; c < maxc; c += c_step) {
64
2.27M
      if (!is_8x8_block_skip(grid, mi_row + r, mi_col + c,
65
2.27M
                             mi_params->mi_stride)) {
66
845k
        dlist[count].by = r >> r_shift;
67
845k
        dlist[count].bx = c >> c_shift;
68
845k
        count++;
69
845k
      }
70
2.27M
    }
71
415k
  }
72
62.4k
  return count;
73
62.4k
}
74
75
// Copies a width x height rectangle of 8-bit samples into a 16-bit buffer,
// widening each sample. dstride and sstride are the row pitches of dst and
// src, counted in elements.
void cdef_copy_rect8_8bit_to_16bit_c(uint16_t *dst, int dstride,
                                     const uint8_t *src, int sstride, int width,
                                     int height) {
  for (int row = 0; row < height; ++row) {
    uint16_t *const out = dst + row * dstride;
    const uint8_t *const in = src + row * sstride;
    for (int col = 0; col < width; ++col) {
      out[col] = in[col];
    }
  }
}
84
85
#if CONFIG_AV1_HIGHBITDEPTH
86
// Copies a width x height rectangle of 16-bit samples from src to dst.
// dstride and sstride are the row pitches of dst and src, counted in
// elements.
void cdef_copy_rect8_16bit_to_16bit_c(uint16_t *dst, int dstride,
                                      const uint16_t *src, int sstride,
                                      int width, int height) {
  for (int row = 0; row < height; ++row) {
    uint16_t *const out = dst + row * dstride;
    const uint16_t *const in = src + row * sstride;
    for (int col = 0; col < width; ++col) {
      out[col] = in[col];
    }
  }
}
95
#endif  // CONFIG_AV1_HIGHBITDEPTH
96
97
// Copies an hsize x vsize rectangle of 8-bit samples into the 16-bit buffer
// dst. The rectangle starts src_voffset rows and src_hoffset columns into
// src; the row offset is computed in ptrdiff_t.
void av1_cdef_copy_sb8_16_lowbd(uint16_t *const dst, int dstride,
                                const uint8_t *src, int src_voffset,
                                int src_hoffset, int sstride, int vsize,
                                int hsize) {
  const ptrdiff_t start = src_voffset * (ptrdiff_t)sstride + src_hoffset;
  cdef_copy_rect8_8bit_to_16bit(dst, dstride, src + start, sstride, hsize,
                                vsize);
}
104
105
#if CONFIG_AV1_HIGHBITDEPTH
106
// High bit-depth counterpart of av1_cdef_copy_sb8_16_lowbd: src is converted
// with CONVERT_TO_SHORTPTR and an hsize x vsize rectangle of 16-bit samples
// starting at (src_voffset, src_hoffset) is copied into dst.
void av1_cdef_copy_sb8_16_highbd(uint16_t *const dst, int dstride,
                                 const uint8_t *src, int src_voffset,
                                 int src_hoffset, int sstride, int vsize,
                                 int hsize) {
  const uint16_t *const src16 = CONVERT_TO_SHORTPTR(src);
  const ptrdiff_t start = src_voffset * (ptrdiff_t)sstride + src_hoffset;
  cdef_copy_rect8_16bit_to_16bit(dst, dstride, src16 + start, sstride, hsize,
                                 vsize);
}
114
#endif  // CONFIG_AV1_HIGHBITDEPTH
115
116
// Copies an hsize x vsize rectangle of the frame buffer src into the 16-bit
// buffer dst. When high bit-depth support is compiled in and the sequence
// uses it, the high bit-depth copy is used; otherwise the 8-bit copy is used.
void av1_cdef_copy_sb8_16(const AV1_COMMON *const cm, uint16_t *const dst,
                          int dstride, const uint8_t *src, int src_voffset,
                          int src_hoffset, int sstride, int vsize, int hsize) {
#if CONFIG_AV1_HIGHBITDEPTH
  if (cm->seq_params->use_highbitdepth) {
    av1_cdef_copy_sb8_16_highbd(dst, dstride, src, src_voffset, src_hoffset,
                                sstride, vsize, hsize);
  } else {
    av1_cdef_copy_sb8_16_lowbd(dst, dstride, src, src_voffset, src_hoffset,
                               sstride, vsize, hsize);
  }
#else
  (void)cm;
  av1_cdef_copy_sb8_16_lowbd(dst, dstride, src, src_voffset, src_hoffset,
                             sstride, vsize, hsize);
#endif  // CONFIG_AV1_HIGHBITDEPTH
}
131
132
// Copies a rectangle of v rows by h columns of 16-bit samples from src to
// dst. dstride and sstride are the row pitches in elements.
static inline void copy_rect(uint16_t *dst, int dstride, const uint16_t *src,
                             int sstride, int v, int h) {
  for (int row = 0; row < v; ++row) {
    uint16_t *const out = dst + row * dstride;
    const uint16_t *const in = src + row * sstride;
    for (int col = 0; col < h; ++col) {
      out[col] = in[col];
    }
  }
}
140
141
// Prepares intermediate input buffer for CDEF.
142
// Inputs:
143
//   cm: Pointer to common structure.
144
//   fb_info: Pointer to the CDEF block-level parameter structure.
145
//   colbuf: Left column buffer for CDEF.
146
//   cdef_left: Left block is filtered or not.
147
//   fbc, fbr: col and row index of a block.
148
//   plane: plane index Y/CB/CR.
149
// Returns:
150
//   Nothing will be returned.
151
static void cdef_prepare_fb(const AV1_COMMON *const cm, CdefBlockInfo *fb_info,
152
                            uint16_t **const colbuf, const int cdef_left,
153
68.7k
                            int fbc, int fbr, int plane) {
154
68.7k
  const CommonModeInfoParams *const mi_params = &cm->mi_params;
155
68.7k
  uint16_t *src = fb_info->src;
156
68.7k
  const int luma_stride =
157
68.7k
      ALIGN_POWER_OF_TWO(mi_params->mi_cols << MI_SIZE_LOG2, 4);
158
68.7k
  const int nvfb = (mi_params->mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64;
159
68.7k
  const int nhfb = (mi_params->mi_cols + MI_SIZE_64X64 - 1) / MI_SIZE_64X64;
160
68.7k
  int cstart = 0;
161
68.7k
  if (!cdef_left) cstart = -CDEF_HBORDER;
162
68.7k
  int rend, cend;
163
68.7k
  const int nhb =
164
68.7k
      AOMMIN(MI_SIZE_64X64, mi_params->mi_cols - MI_SIZE_64X64 * fbc);
165
68.7k
  const int nvb =
166
68.7k
      AOMMIN(MI_SIZE_64X64, mi_params->mi_rows - MI_SIZE_64X64 * fbr);
167
68.7k
  const int hsize = nhb << fb_info->mi_wide_l2;
168
68.7k
  const int vsize = nvb << fb_info->mi_high_l2;
169
68.7k
  const uint16_t *top_linebuf = fb_info->top_linebuf[plane];
170
68.7k
  const uint16_t *bot_linebuf = fb_info->bot_linebuf[plane];
171
68.7k
  const int bot_offset = (vsize + CDEF_VBORDER) * CDEF_BSTRIDE;
172
68.7k
  const int stride =
173
68.7k
      luma_stride >> (plane == AOM_PLANE_Y ? 0 : cm->seq_params->subsampling_x);
174
175
68.7k
  if (fbc == nhfb - 1)
176
50.8k
    cend = hsize;
177
17.8k
  else
178
17.8k
    cend = hsize + CDEF_HBORDER;
179
180
68.7k
  if (fbr == nvfb - 1)
181
21.1k
    rend = vsize;
182
47.6k
  else
183
47.6k
    rend = vsize + CDEF_VBORDER;
184
185
  /* Copy in the pixels we need from the current superblock for
186
  deringing.*/
187
68.7k
  av1_cdef_copy_sb8_16(
188
68.7k
      cm, &src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER + cstart],
189
68.7k
      CDEF_BSTRIDE, fb_info->dst, fb_info->roffset, fb_info->coffset + cstart,
190
68.7k
      fb_info->dst_stride, vsize, cend - cstart);
191
192
  /* Copy in the pixels we need for the current superblock from bottom buffer.*/
193
68.7k
  if (fbr < nvfb - 1) {
194
47.7k
    copy_rect(&src[bot_offset + CDEF_HBORDER], CDEF_BSTRIDE,
195
47.7k
              &bot_linebuf[fb_info->coffset], stride, CDEF_VBORDER, hsize);
196
47.7k
  } else {
197
20.9k
    fill_rect(&src[bot_offset + CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER,
198
20.9k
              hsize, CDEF_VERY_LARGE);
199
20.9k
  }
200
68.7k
  if (fbr < nvfb - 1 && fbc > 0) {
201
10.6k
    copy_rect(&src[bot_offset], CDEF_BSTRIDE,
202
10.6k
              &bot_linebuf[fb_info->coffset - CDEF_HBORDER], stride,
203
10.6k
              CDEF_VBORDER, CDEF_HBORDER);
204
58.0k
  } else {
205
58.0k
    fill_rect(&src[bot_offset], CDEF_BSTRIDE, CDEF_VBORDER, CDEF_HBORDER,
206
58.0k
              CDEF_VERY_LARGE);
207
58.0k
  }
208
68.7k
  if (fbr < nvfb - 1 && fbc < nhfb - 1) {
209
10.6k
    copy_rect(&src[bot_offset + hsize + CDEF_HBORDER], CDEF_BSTRIDE,
210
10.6k
              &bot_linebuf[fb_info->coffset + hsize], stride, CDEF_VBORDER,
211
10.6k
              CDEF_HBORDER);
212
58.1k
  } else {
213
58.1k
    fill_rect(&src[bot_offset + hsize + CDEF_HBORDER], CDEF_BSTRIDE,
214
58.1k
              CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE);
215
58.1k
  }
216
217
  /* Copy in the pixels we need from the current superblock from top buffer.*/
218
68.7k
  if (fbr > 0) {
219
51.0k
    copy_rect(&src[CDEF_HBORDER], CDEF_BSTRIDE, &top_linebuf[fb_info->coffset],
220
51.0k
              stride, CDEF_VBORDER, hsize);
221
51.0k
  } else {
222
17.6k
    fill_rect(&src[CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER, hsize,
223
17.6k
              CDEF_VERY_LARGE);
224
17.6k
  }
225
68.7k
  if (fbr > 0 && fbc > 0) {
226
13.4k
    copy_rect(src, CDEF_BSTRIDE, &top_linebuf[fb_info->coffset - CDEF_HBORDER],
227
13.4k
              stride, CDEF_VBORDER, CDEF_HBORDER);
228
55.3k
  } else {
229
55.3k
    fill_rect(src, CDEF_BSTRIDE, CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE);
230
55.3k
  }
231
68.7k
  if (fbr > 0 && fbc < nhfb - 1) {
232
13.3k
    copy_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE,
233
13.3k
              &top_linebuf[fb_info->coffset + hsize], stride, CDEF_VBORDER,
234
13.3k
              CDEF_HBORDER);
235
55.4k
  } else {
236
55.4k
    fill_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER,
237
55.4k
              CDEF_HBORDER, CDEF_VERY_LARGE);
238
55.4k
  }
239
68.7k
  if (cdef_left) {
240
    /* If we deringed the superblock on the left then we need to copy in
241
    saved pixels. */
242
64.4k
    copy_rect(src, CDEF_BSTRIDE, colbuf[plane], CDEF_HBORDER,
243
64.4k
              rend + CDEF_VBORDER, CDEF_HBORDER);
244
64.4k
  }
245
  /* Saving pixels in case we need to dering the superblock on the
246
  right. */
247
68.7k
  copy_rect(colbuf[plane], CDEF_HBORDER, src + hsize, CDEF_BSTRIDE,
248
68.7k
            rend + CDEF_VBORDER, CDEF_HBORDER);
249
250
68.7k
  if (fb_info->frame_boundary[LEFT]) {
251
50.8k
    fill_rect(src, CDEF_BSTRIDE, vsize + 2 * CDEF_VBORDER, CDEF_HBORDER,
252
50.8k
              CDEF_VERY_LARGE);
253
50.8k
  }
254
68.7k
  if (fb_info->frame_boundary[RIGHT]) {
255
50.9k
    fill_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE,
256
50.9k
              vsize + 2 * CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE);
257
50.9k
  }
258
68.7k
}
259
260
// Runs av1_cdef_filter_fb on the prepared buffer of one filter block and
// plane. The output location is fb_info->dst advanced to the block's
// (roffset, coffset); it is passed as the 16-bit destination when
// use_highbitdepth is nonzero and as the 8-bit destination otherwise, with
// the other destination argument set to NULL.
static inline void cdef_filter_fb(CdefBlockInfo *const fb_info, int plane,
                                  uint8_t use_highbitdepth) {
  const ptrdiff_t offset =
      (ptrdiff_t)fb_info->dst_stride * fb_info->roffset + fb_info->coffset;
  uint8_t *dst8 = NULL;
  uint16_t *dst16 = NULL;
  if (use_highbitdepth) {
    dst16 = CONVERT_TO_SHORTPTR(fb_info->dst + offset);
  } else {
    dst8 = fb_info->dst + offset;
  }

  av1_cdef_filter_fb(
      dst8, dst16, fb_info->dst_stride,
      &fb_info->src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER], fb_info->xdec,
      fb_info->ydec, fb_info->dir, NULL, fb_info->var, plane, fb_info->dlist,
      fb_info->cdef_count, fb_info->level, fb_info->sec_strength,
      fb_info->damping, fb_info->coeff_shift);
}
280
281
// Initializes block-level parameters for CDEF.
282
static inline void cdef_init_fb_col(const MACROBLOCKD *const xd,
283
                                    CdefBlockInfo *const fb_info, int *level,
284
                                    int *sec_strength, int fbc, int fbr,
285
68.5k
                                    int plane) {
286
68.5k
  const PLANE_TYPE plane_type = get_plane_type(plane);
287
68.5k
  fb_info->level = level[plane_type];
288
68.5k
  fb_info->sec_strength = sec_strength[plane_type];
289
68.5k
  fb_info->dst = xd->plane[plane].dst.buf;
290
68.5k
  fb_info->dst_stride = xd->plane[plane].dst.stride;
291
292
68.5k
  fb_info->xdec = xd->plane[plane].subsampling_x;
293
68.5k
  fb_info->ydec = xd->plane[plane].subsampling_y;
294
68.5k
  fb_info->mi_wide_l2 = MI_SIZE_LOG2 - xd->plane[plane].subsampling_x;
295
68.5k
  fb_info->mi_high_l2 = MI_SIZE_LOG2 - xd->plane[plane].subsampling_y;
296
68.5k
  fb_info->roffset = MI_SIZE_64X64 * fbr << fb_info->mi_high_l2;
297
68.5k
  fb_info->coffset = MI_SIZE_64X64 * fbc << fb_info->mi_wide_l2;
298
68.5k
}
299
300
static void cdef_fb_col(const AV1_COMMON *const cm, const MACROBLOCKD *const xd,
301
                        CdefBlockInfo *const fb_info, uint16_t **const colbuf,
302
63.2k
                        int *cdef_left, int fbc, int fbr) {
303
63.2k
  const CommonModeInfoParams *const mi_params = &cm->mi_params;
304
63.2k
  const int mbmi_cdef_strength =
305
63.2k
      mi_params
306
63.2k
          ->mi_grid_base[MI_SIZE_64X64 * fbr * mi_params->mi_stride +
307
63.2k
                         MI_SIZE_64X64 * fbc]
308
63.2k
          ->cdef_strength;
309
63.2k
  const int num_planes = av1_num_planes(cm);
310
63.2k
  int is_zero_level[PLANE_TYPES] = { 1, 1 };
311
63.2k
  int level[PLANE_TYPES] = { 0 };
312
63.2k
  int sec_strength[PLANE_TYPES] = { 0 };
313
63.2k
  const CdefInfo *const cdef_info = &cm->cdef_info;
314
315
63.2k
  if (mi_params->mi_grid_base[MI_SIZE_64X64 * fbr * mi_params->mi_stride +
316
63.2k
                              MI_SIZE_64X64 * fbc] == NULL ||
317
63.2k
      mbmi_cdef_strength == -1) {
318
0
    av1_zero_array(cdef_left, num_planes);
319
0
    return;
320
0
  }
321
322
  // Compute level and secondary strength for planes
323
63.2k
  level[PLANE_TYPE_Y] =
324
63.2k
      cdef_info->cdef_strengths[mbmi_cdef_strength] / CDEF_SEC_STRENGTHS;
325
63.2k
  sec_strength[PLANE_TYPE_Y] =
326
63.2k
      cdef_info->cdef_strengths[mbmi_cdef_strength] % CDEF_SEC_STRENGTHS;
327
63.2k
  sec_strength[PLANE_TYPE_Y] += sec_strength[PLANE_TYPE_Y] == 3;
328
63.2k
  is_zero_level[PLANE_TYPE_Y] =
329
63.2k
      (level[PLANE_TYPE_Y] == 0) && (sec_strength[PLANE_TYPE_Y] == 0);
330
331
63.2k
  if (num_planes > 1) {
332
51.1k
    level[PLANE_TYPE_UV] =
333
51.1k
        cdef_info->cdef_uv_strengths[mbmi_cdef_strength] / CDEF_SEC_STRENGTHS;
334
51.1k
    sec_strength[PLANE_TYPE_UV] =
335
51.1k
        cdef_info->cdef_uv_strengths[mbmi_cdef_strength] % CDEF_SEC_STRENGTHS;
336
51.1k
    sec_strength[PLANE_TYPE_UV] += sec_strength[PLANE_TYPE_UV] == 3;
337
51.1k
    is_zero_level[PLANE_TYPE_UV] =
338
51.1k
        (level[PLANE_TYPE_UV] == 0) && (sec_strength[PLANE_TYPE_UV] == 0);
339
51.1k
  }
340
341
63.2k
  if (is_zero_level[PLANE_TYPE_Y] && is_zero_level[PLANE_TYPE_UV]) {
342
1.18k
    av1_zero_array(cdef_left, num_planes);
343
1.18k
    return;
344
1.18k
  }
345
346
62.0k
  fb_info->cdef_count = av1_cdef_compute_sb_list(mi_params, fbr * MI_SIZE_64X64,
347
62.0k
                                                 fbc * MI_SIZE_64X64,
348
62.0k
                                                 fb_info->dlist, BLOCK_64X64);
349
62.0k
  if (!fb_info->cdef_count) {
350
32.9k
    av1_zero_array(cdef_left, num_planes);
351
32.9k
    return;
352
32.9k
  }
353
354
101k
  for (int plane = 0; plane < num_planes; plane++) {
355
    // Do not skip cdef filtering for luma plane as filter direction is
356
    // computed based on luma.
357
72.3k
    if (plane && is_zero_level[get_plane_type(plane)]) {
358
3.86k
      cdef_left[plane] = 0;
359
3.86k
      continue;
360
3.86k
    }
361
68.5k
    cdef_init_fb_col(xd, fb_info, level, sec_strength, fbc, fbr, plane);
362
68.5k
    cdef_prepare_fb(cm, fb_info, colbuf, cdef_left[plane], fbc, fbr, plane);
363
68.5k
    cdef_filter_fb(fb_info, plane, cm->seq_params->use_highbitdepth);
364
68.5k
    cdef_left[plane] = 1;
365
68.5k
  }
366
29.1k
}
367
368
// Initializes row-level parameters for CDEF frame.
369
void av1_cdef_init_fb_row(const AV1_COMMON *const cm,
370
                          const MACROBLOCKD *const xd,
371
                          CdefBlockInfo *const fb_info,
372
                          uint16_t **const linebuf, uint16_t *const src,
373
525
                          struct AV1CdefSyncData *const cdef_sync, int fbr) {
374
525
  (void)cdef_sync;
375
525
  const int num_planes = av1_num_planes(cm);
376
525
  const int nvfb = (cm->mi_params.mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64;
377
525
  const int luma_stride =
378
525
      ALIGN_POWER_OF_TWO(cm->mi_params.mi_cols << MI_SIZE_LOG2, 4);
379
525
  const bool ping_pong = fbr & 1;
380
  // for the current filter block, it's top left corner mi structure (mi_tl)
381
  // is first accessed to check whether the top and left boundaries are
382
  // frame boundaries. Then bottom-left and top-right mi structures are
383
  // accessed to check whether the bottom and right boundaries
384
  // (respectively) are frame boundaries.
385
  //
386
  // Note that we can't just check the bottom-right mi structure - eg. if
387
  // we're at the right-hand edge of the frame but not the bottom, then
388
  // the bottom-right mi is NULL but the bottom-left is not.
389
525
  fb_info->frame_boundary[TOP] = (MI_SIZE_64X64 * fbr == 0) ? 1 : 0;
390
525
  if (fbr != nvfb - 1)
391
265
    fb_info->frame_boundary[BOTTOM] =
392
265
        (MI_SIZE_64X64 * (fbr + 1) == cm->mi_params.mi_rows) ? 1 : 0;
393
260
  else
394
260
    fb_info->frame_boundary[BOTTOM] = 1;
395
396
525
  fb_info->src = src;
397
525
  fb_info->damping = cm->cdef_info.cdef_damping;
398
525
  fb_info->coeff_shift = AOMMAX(cm->seq_params->bit_depth - 8, 0);
399
525
  av1_zero(fb_info->dir);
400
525
  av1_zero(fb_info->var);
401
402
2.04k
  for (int plane = 0; plane < num_planes; plane++) {
403
1.52k
    const int mi_high_l2 = MI_SIZE_LOG2 - xd->plane[plane].subsampling_y;
404
1.52k
    const int offset = MI_SIZE_64X64 * (fbr + 1) << mi_high_l2;
405
1.52k
    const int stride = luma_stride >> xd->plane[plane].subsampling_x;
406
    // here ping-pong buffers are maintained for top linebuf
407
    // to avoid linebuf over-write by consecutive row.
408
1.52k
    uint16_t *const top_linebuf =
409
1.52k
        &linebuf[plane][ping_pong * CDEF_VBORDER * stride];
410
1.52k
    fb_info->bot_linebuf[plane] = &linebuf[plane][(CDEF_VBORDER << 1) * stride];
411
412
1.52k
    if (fbr != nvfb - 1)  // top line buffer copy
413
795
      av1_cdef_copy_sb8_16(cm, top_linebuf, stride, xd->plane[plane].dst.buf,
414
795
                           offset - CDEF_VBORDER, 0,
415
795
                           xd->plane[plane].dst.stride, CDEF_VBORDER, stride);
416
1.52k
    fb_info->top_linebuf[plane] =
417
1.52k
        &linebuf[plane][(!ping_pong) * CDEF_VBORDER * stride];
418
419
1.52k
    if (fbr != nvfb - 1)  // bottom line buffer copy
420
795
      av1_cdef_copy_sb8_16(cm, fb_info->bot_linebuf[plane], stride,
421
795
                           xd->plane[plane].dst.buf, offset, 0,
422
795
                           xd->plane[plane].dst.stride, CDEF_VBORDER, stride);
423
1.52k
  }
424
525
}
425
426
void av1_cdef_fb_row(const AV1_COMMON *const cm, MACROBLOCKD *xd,
427
                     uint16_t **const linebuf, uint16_t **const colbuf,
428
                     uint16_t *const src, int fbr,
429
                     cdef_init_fb_row_t cdef_init_fb_row_fn,
430
                     struct AV1CdefSyncData *const cdef_sync,
431
33.4k
                     struct aom_internal_error_info *error_info) {
432
  // TODO(aomedia:3276): Pass error_info to the low-level functions as required
433
  // in future to handle error propagation.
434
33.4k
  (void)error_info;
435
33.4k
  CdefBlockInfo fb_info;
436
33.4k
  int cdef_left[MAX_MB_PLANE] = { 1, 1, 1 };
437
33.4k
  const int nhfb = (cm->mi_params.mi_cols + MI_SIZE_64X64 - 1) / MI_SIZE_64X64;
438
439
33.4k
  cdef_init_fb_row_fn(cm, xd, &fb_info, linebuf, src, cdef_sync, fbr);
440
33.4k
#if CONFIG_MULTITHREAD
441
33.4k
  if (cdef_sync && cm->cdef_info.allocated_num_workers > 1) {
442
32.9k
    pthread_mutex_lock(cdef_sync->mutex_);
443
32.9k
    const bool cdef_mt_exit = cdef_sync->cdef_mt_exit;
444
32.9k
    pthread_mutex_unlock(cdef_sync->mutex_);
445
    // Exit in case any worker has encountered an error.
446
32.9k
    if (cdef_mt_exit) return;
447
32.9k
  }
448
33.4k
#endif
449
96.6k
  for (int fbc = 0; fbc < nhfb; fbc++) {
450
63.1k
    fb_info.frame_boundary[LEFT] = (MI_SIZE_64X64 * fbc == 0) ? 1 : 0;
451
63.1k
    if (fbc != nhfb - 1)
452
30.5k
      fb_info.frame_boundary[RIGHT] =
453
30.5k
          (MI_SIZE_64X64 * (fbc + 1) == cm->mi_params.mi_cols) ? 1 : 0;
454
32.5k
    else
455
32.5k
      fb_info.frame_boundary[RIGHT] = 1;
456
63.1k
    cdef_fb_col(cm, xd, &fb_info, colbuf, &cdef_left[0], fbc, fbr);
457
63.1k
  }
458
33.4k
}
459
460
// Perform CDEF on input frame.
461
// Inputs:
462
//   frame: Pointer to input frame buffer.
463
//   cm: Pointer to common structure.
464
//   xd: Pointer to common current coding block structure.
465
// Returns:
466
//   Nothing will be returned.
467
void av1_cdef_frame(YV12_BUFFER_CONFIG *frame, AV1_COMMON *const cm,
468
260
                    MACROBLOCKD *xd, cdef_init_fb_row_t cdef_init_fb_row_fn) {
469
260
  const int num_planes = av1_num_planes(cm);
470
260
  const int nvfb = (cm->mi_params.mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64;
471
472
260
  av1_setup_dst_planes(xd->plane, cm->seq_params->sb_size, frame, 0, 0, 0,
473
260
                       num_planes);
474
475
785
  for (int fbr = 0; fbr < nvfb; fbr++)
476
525
    av1_cdef_fb_row(cm, xd, cm->cdef_info.linebuf, cm->cdef_info.colbuf,
477
525
                    cm->cdef_info.srcbuf, fbr, cdef_init_fb_row_fn, NULL,
478
525
                    xd->error_info);
479
260
}