Coverage Report

Created: 2026-06-15 06:22

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/work/dav1d/src/filmgrain_tmpl.c
Line
Count
Source
1
/*
2
 * Copyright © 2018, Niklas Haas
3
 * Copyright © 2018, VideoLAN and dav1d authors
4
 * Copyright © 2018, Two Orioles, LLC
5
 * All rights reserved.
6
 *
7
 * Redistribution and use in source and binary forms, with or without
8
 * modification, are permitted provided that the following conditions are met:
9
 *
10
 * 1. Redistributions of source code must retain the above copyright notice, this
11
 *    list of conditions and the following disclaimer.
12
 *
13
 * 2. Redistributions in binary form must reproduce the above copyright notice,
14
 *    this list of conditions and the following disclaimer in the documentation
15
 *    and/or other materials provided with the distribution.
16
 *
17
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
18
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
19
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
20
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
21
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
22
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
23
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
24
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
26
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
 */
28
29
#include "common/attributes.h"
30
#include "common/intops.h"
31
32
#include "src/filmgrain.h"
33
#include "src/tables.h"
34
35
291
#define SUB_GRAIN_WIDTH 44
36
178
#define SUB_GRAIN_HEIGHT 38
37
38
12.8M
static inline int get_random_number(const int bits, unsigned *const state) {
39
12.8M
    const int r = *state;
40
12.8M
    unsigned bit = ((r >> 0) ^ (r >> 1) ^ (r >> 3) ^ (r >> 12)) & 1;
41
12.8M
    *state = (r >> 1) | (bit << 15);
42
43
12.8M
    return (*state >> (16 - bits)) & ((1 << bits) - 1);
44
12.8M
}
45
46
38.0M
static inline int round2(const int x, const uint64_t shift) {
47
38.0M
    return (x + ((1 << shift) >> 1)) >> shift;
48
38.0M
}
49
50
static void generate_grain_y_c(entry buf[][GRAIN_WIDTH],
51
                               const Dav1dFilmGrainData *const data
52
                               HIGHBD_DECL_SUFFIX)
53
1.00k
{
54
1.00k
    const int bitdepth_min_8 = bitdepth_from_max(bitdepth_max) - 8;
55
1.00k
    unsigned seed = data->seed;
56
1.00k
    const int shift = 4 - bitdepth_min_8 + data->grain_scale_shift;
57
1.00k
    const int grain_ctr = 128 << bitdepth_min_8;
58
1.00k
    const int grain_min = -grain_ctr, grain_max = grain_ctr - 1;
59
60
74.0k
    for (int y = 0; y < GRAIN_HEIGHT; y++) {
61
6.05M
        for (int x = 0; x < GRAIN_WIDTH; x++) {
62
5.98M
            const int value = get_random_number(11, &seed);
63
5.98M
            buf[y][x] = round2(dav1d_gaussian_sequence[ value ], shift);
64
5.98M
        }
65
73.0k
    }
66
67
1.00k
    const int ar_pad = 3;
68
1.00k
    const int ar_lag = data->ar_coeff_lag;
69
70
71.0k
    for (int y = ar_pad; y < GRAIN_HEIGHT; y++) {
71
5.39M
        for (int x = ar_pad; x < GRAIN_WIDTH - ar_pad; x++) {
72
5.32M
            const int8_t *coeff = data->ar_coeffs_y;
73
5.32M
            int sum = 0;
74
16.5M
            for (int dy = -ar_lag; dy <= 0; dy++) {
75
46.5M
                for (int dx = -ar_lag; dx <= ar_lag; dx++) {
76
40.6M
                    if (!dx && !dy)
77
5.32M
                        break;
78
35.3M
                    sum += *(coeff++) * buf[y + dy][x + dx];
79
35.3M
                }
80
11.2M
            }
81
82
5.32M
            const int grain = buf[y][x] + round2(sum, data->ar_coeff_shift);
83
5.32M
            buf[y][x] = iclip(grain, grain_min, grain_max);
84
5.32M
        }
85
70.0k
    }
86
1.00k
}
87
88
static NOINLINE void
89
generate_grain_uv_c(entry buf[][GRAIN_WIDTH],
90
                    const entry buf_y[][GRAIN_WIDTH],
91
                    const Dav1dFilmGrainData *const data, const intptr_t uv,
92
                    const int subx, const int suby HIGHBD_DECL_SUFFIX)
93
1.32k
{
94
1.32k
    const int bitdepth_min_8 = bitdepth_from_max(bitdepth_max) - 8;
95
1.32k
    unsigned seed = data->seed ^ (uv ? 0x49d8 : 0xb524);
96
1.32k
    const int shift = 4 - bitdepth_min_8 + data->grain_scale_shift;
97
1.32k
    const int grain_ctr = 128 << bitdepth_min_8;
98
1.32k
    const int grain_min = -grain_ctr, grain_max = grain_ctr - 1;
99
100
1.32k
    const int chromaW = subx ? SUB_GRAIN_WIDTH  : GRAIN_WIDTH;
101
1.32k
    const int chromaH = suby ? SUB_GRAIN_HEIGHT : GRAIN_HEIGHT;
102
103
91.8k
    for (int y = 0; y < chromaH; y++) {
104
6.94M
        for (int x = 0; x < chromaW; x++) {
105
6.85M
            const int value = get_random_number(11, &seed);
106
6.85M
            buf[y][x] = round2(dav1d_gaussian_sequence[ value ], shift);
107
6.85M
        }
108
90.4k
    }
109
110
1.32k
    const int ar_pad = 3;
111
1.32k
    const int ar_lag = data->ar_coeff_lag;
112
113
87.8k
    for (int y = ar_pad; y < chromaH; y++) {
114
6.12M
        for (int x = ar_pad; x < chromaW - ar_pad; x++) {
115
6.03M
            const int8_t *coeff = data->ar_coeffs_uv[uv];
116
6.03M
            int sum = 0;
117
18.6M
            for (int dy = -ar_lag; dy <= 0; dy++) {
118
50.1M
                for (int dx = -ar_lag; dx <= ar_lag; dx++) {
119
                    // For the final (current) pixel, we need to add in the
120
                    // contribution from the luma grain texture
121
43.5M
                    if (!dx && !dy) {
122
6.03M
                        if (!data->num_y_points)
123
1.64M
                            break;
124
4.38M
                        int luma = 0;
125
4.38M
                        const int lumaX = ((x - ar_pad) << subx) + ar_pad;
126
4.38M
                        const int lumaY = ((y - ar_pad) << suby) + ar_pad;
127
8.93M
                        for (int i = 0; i <= suby; i++) {
128
9.58M
                            for (int j = 0; j <= subx; j++) {
129
5.04M
                                luma += buf_y[lumaY + i][lumaX + j];
130
5.04M
                            }
131
4.54M
                        }
132
4.38M
                        luma = round2(luma, subx + suby);
133
4.38M
                        sum += luma * (*coeff);
134
4.38M
                        break;
135
6.03M
                    }
136
137
37.5M
                    sum += *(coeff++) * buf[y + dy][x + dx];
138
37.5M
                }
139
12.6M
            }
140
141
6.03M
            const int grain = buf[y][x] + round2(sum, data->ar_coeff_shift);
142
6.03M
            buf[y][x] = iclip(grain, grain_min, grain_max);
143
6.03M
        }
144
86.5k
    }
145
1.32k
}
146
147
#define gnuv_ss_fn(nm, ss_x, ss_y) \
148
1.32k
static decl_generate_grain_uv_fn(generate_grain_uv_##nm##_c) { \
149
1.32k
    generate_grain_uv_c(buf, buf_y, data, uv, ss_x, ss_y HIGHBD_TAIL_SUFFIX); \
150
1.32k
}
filmgrain_tmpl.c:generate_grain_uv_420_c
Line
Count
Source
148
178
static decl_generate_grain_uv_fn(generate_grain_uv_##nm##_c) { \
149
178
    generate_grain_uv_c(buf, buf_y, data, uv, ss_x, ss_y HIGHBD_TAIL_SUFFIX); \
150
178
}
filmgrain_tmpl.c:generate_grain_uv_422_c
Line
Count
Source
148
113
static decl_generate_grain_uv_fn(generate_grain_uv_##nm##_c) { \
149
113
    generate_grain_uv_c(buf, buf_y, data, uv, ss_x, ss_y HIGHBD_TAIL_SUFFIX); \
150
113
}
filmgrain_tmpl.c:generate_grain_uv_444_c
Line
Count
Source
148
1.03k
static decl_generate_grain_uv_fn(generate_grain_uv_##nm##_c) { \
149
1.03k
    generate_grain_uv_c(buf, buf_y, data, uv, ss_x, ss_y HIGHBD_TAIL_SUFFIX); \
150
1.03k
}
151
152
gnuv_ss_fn(420, 1, 1);
153
gnuv_ss_fn(422, 1, 0);
154
gnuv_ss_fn(444, 0, 0);
155
156
// samples from the correct block of a grain LUT, while taking into account the
157
// offsets provided by the offsets cache
158
static inline entry sample_lut(const entry grain_lut[][GRAIN_WIDTH],
159
                               const int offsets[2][2], const int subx, const int suby,
160
                               const int bx, const int by, const int x, const int y)
161
9.60M
{
162
9.60M
    const int randval = offsets[bx][by];
163
9.60M
    const int offx = 3 + (2 >> subx) * (3 + (randval >> 4));
164
9.60M
    const int offy = 3 + (2 >> suby) * (3 + (randval & 0xF));
165
9.60M
    return grain_lut[offy + y + (FG_BLOCK_SIZE >> suby) * by]
166
9.60M
                    [offx + x + (FG_BLOCK_SIZE >> subx) * bx];
167
9.60M
}
168
169
static void fgy_32x32xn_c(pixel *const dst_row, const pixel *const src_row,
170
                          const ptrdiff_t stride,
171
                          const Dav1dFilmGrainData *const data, const size_t pw,
172
                          const uint8_t scaling[SCALING_SIZE],
173
                          const entry grain_lut[][GRAIN_WIDTH],
174
                          const int bh, const int row_num HIGHBD_DECL_SUFFIX)
175
4.82k
{
176
4.82k
    const int rows = 1 + (data->overlap_flag && row_num > 0);
177
4.82k
    const int bitdepth_min_8 = bitdepth_from_max(bitdepth_max) - 8;
178
4.82k
    const int grain_ctr = 128 << bitdepth_min_8;
179
4.82k
    const int grain_min = -grain_ctr, grain_max = grain_ctr - 1;
180
181
4.82k
    int min_value, max_value;
182
4.82k
    if (data->clip_to_restricted_range) {
183
2.35k
        min_value = 16 << bitdepth_min_8;
184
2.35k
        max_value = 235 << bitdepth_min_8;
185
2.46k
    } else {
186
2.46k
        min_value = 0;
187
2.46k
        max_value = BITDEPTH_MAX;
188
2.46k
    }
189
190
    // seed[0] contains the current row, seed[1] contains the previous
191
4.82k
    unsigned seed[2];
192
12.0k
    for (int i = 0; i < rows; i++) {
193
7.26k
        seed[i] = data->seed;
194
7.26k
        seed[i] ^= (((row_num - i) * 37  + 178) & 0xFF) << 8;
195
7.26k
        seed[i] ^= (((row_num - i) * 173 + 105) & 0xFF);
196
7.26k
    }
197
198
4.82k
    assert(stride % (FG_BLOCK_SIZE * sizeof(pixel)) == 0);
199
200
4.82k
    int offsets[2 /* col offset */][2 /* row offset */];
201
202
    // process this row in FG_BLOCK_SIZE^2 blocks
203
15.3k
    for (unsigned bx = 0; bx < pw; bx += FG_BLOCK_SIZE) {
204
10.5k
        const int bw = imin(FG_BLOCK_SIZE, (int) pw - bx);
205
206
10.5k
        if (data->overlap_flag && bx) {
207
            // shift previous offsets left
208
12.3k
            for (int i = 0; i < rows; i++)
209
7.65k
                offsets[1][i] = offsets[0][i];
210
4.65k
        }
211
212
        // update current offsets
213
26.3k
        for (int i = 0; i < rows; i++)
214
15.7k
            offsets[0][i] = get_random_number(8, &seed[i]);
215
216
        // x/y block offsets to compensate for overlapped regions
217
10.5k
        const int ystart = data->overlap_flag && row_num ? imin(2, bh) : 0;
218
10.5k
        const int xstart = data->overlap_flag && bx      ? imin(2, bw) : 0;
219
220
10.5k
        static const int w[2][2] = { { 27, 17 }, { 17, 27 } };
221
222
10.5k
#define add_noise_y(x, y, grain)                                                  \
223
3.43M
        const pixel *const src = src_row + (y) * PXSTRIDE(stride) + (x) + bx;     \
224
3.43M
        pixel *const dst = dst_row + (y) * PXSTRIDE(stride) + (x) + bx;           \
225
3.43M
        const int noise = round2(scaling[ *src ] * (grain), data->scaling_shift); \
226
3.43M
        *dst = iclip(*src + noise, min_value, max_value);
227
228
233k
        for (int y = ystart; y < bh; y++) {
229
            // Non-overlapped image region (straightforward)
230
3.27M
            for (int x = xstart; x < bw; x++) {
231
3.04M
                int grain = sample_lut(grain_lut, offsets, 0, 0, 0, 0, x, y);
232
3.04M
                add_noise_y(x, y, grain);
233
3.04M
            }
234
235
            // Special case for overlapped column
236
415k
            for (int x = 0; x < xstart; x++) {
237
191k
                int grain = sample_lut(grain_lut, offsets, 0, 0, 0, 0, x, y);
238
191k
                int old   = sample_lut(grain_lut, offsets, 0, 0, 1, 0, x, y);
239
191k
                grain = round2(old * w[x][0] + grain * w[x][1], 5);
240
191k
                grain = iclip(grain, grain_min, grain_max);
241
191k
                add_noise_y(x, y, grain);
242
191k
            }
243
223k
        }
244
245
21.0k
        for (int y = 0; y < ystart; y++) {
246
            // Special case for overlapped row (sans corner)
247
192k
            for (int x = xstart; x < bw; x++) {
248
181k
                int grain = sample_lut(grain_lut, offsets, 0, 0, 0, 0, x, y);
249
181k
                int old   = sample_lut(grain_lut, offsets, 0, 0, 0, 1, x, y);
250
181k
                grain = round2(old * w[y][0] + grain * w[y][1], 5);
251
181k
                grain = iclip(grain, grain_min, grain_max);
252
181k
                add_noise_y(x, y, grain);
253
181k
            }
254
255
            // Special case for doubly-overlapped corner
256
21.4k
            for (int x = 0; x < xstart; x++) {
257
                // Blend the top pixel with the top left block
258
11.0k
                int top = sample_lut(grain_lut, offsets, 0, 0, 0, 1, x, y);
259
11.0k
                int old = sample_lut(grain_lut, offsets, 0, 0, 1, 1, x, y);
260
11.0k
                top = round2(old * w[x][0] + top * w[x][1], 5);
261
11.0k
                top = iclip(top, grain_min, grain_max);
262
263
                // Blend the current pixel with the left block
264
11.0k
                int grain = sample_lut(grain_lut, offsets, 0, 0, 0, 0, x, y);
265
11.0k
                old = sample_lut(grain_lut, offsets, 0, 0, 1, 0, x, y);
266
11.0k
                grain = round2(old * w[x][0] + grain * w[x][1], 5);
267
11.0k
                grain = iclip(grain, grain_min, grain_max);
268
269
                // Mix the row rows together and apply grain
270
11.0k
                grain = round2(top * w[y][0] + grain * w[y][1], 5);
271
11.0k
                grain = iclip(grain, grain_min, grain_max);
272
11.0k
                add_noise_y(x, y, grain);
273
11.0k
            }
274
10.4k
        }
275
10.5k
    }
276
4.82k
}
277
278
static NOINLINE void
279
fguv_32x32xn_c(pixel *const dst_row, const pixel *const src_row,
280
               const ptrdiff_t stride, const Dav1dFilmGrainData *const data,
281
               const size_t pw, const uint8_t scaling[SCALING_SIZE],
282
               const entry grain_lut[][GRAIN_WIDTH], const int bh,
283
               const int row_num, const pixel *const luma_row,
284
               const ptrdiff_t luma_stride, const int uv, const int is_id,
285
               const int sx, const int sy HIGHBD_DECL_SUFFIX)
286
7.18k
{
287
7.18k
    const int rows = 1 + (data->overlap_flag && row_num > 0);
288
7.18k
    const int bitdepth_min_8 = bitdepth_from_max(bitdepth_max) - 8;
289
7.18k
    const int grain_ctr = 128 << bitdepth_min_8;
290
7.18k
    const int grain_min = -grain_ctr, grain_max = grain_ctr - 1;
291
292
7.18k
    int min_value, max_value;
293
7.18k
    if (data->clip_to_restricted_range) {
294
4.28k
        min_value = 16 << bitdepth_min_8;
295
4.28k
        max_value = (is_id ? 235 : 240) << bitdepth_min_8;
296
4.28k
    } else {
297
2.89k
        min_value = 0;
298
2.89k
        max_value = BITDEPTH_MAX;
299
2.89k
    }
300
301
    // seed[0] contains the current row, seed[1] contains the previous
302
7.18k
    unsigned seed[2];
303
18.6k
    for (int i = 0; i < rows; i++) {
304
11.4k
        seed[i] = data->seed;
305
11.4k
        seed[i] ^= (((row_num - i) * 37  + 178) & 0xFF) << 8;
306
11.4k
        seed[i] ^= (((row_num - i) * 173 + 105) & 0xFF);
307
11.4k
    }
308
309
7.18k
    assert(stride % (FG_BLOCK_SIZE * sizeof(pixel)) == 0);
310
311
7.18k
    int offsets[2 /* col offset */][2 /* row offset */];
312
313
    // process this row in FG_BLOCK_SIZE^2 blocks (subsampled)
314
23.9k
    for (unsigned bx = 0; bx < pw; bx += FG_BLOCK_SIZE >> sx) {
315
16.7k
        const int bw = imin(FG_BLOCK_SIZE >> sx, (int)(pw - bx));
316
16.7k
        if (data->overlap_flag && bx) {
317
            // shift previous offsets left
318
21.8k
            for (int i = 0; i < rows; i++)
319
13.3k
                offsets[1][i] = offsets[0][i];
320
8.51k
        }
321
322
        // update current offsets
323
42.3k
        for (int i = 0; i < rows; i++)
324
25.5k
            offsets[0][i] = get_random_number(8, &seed[i]);
325
326
        // x/y block offsets to compensate for overlapped regions
327
16.7k
        const int ystart = data->overlap_flag && row_num ? imin(2 >> sy, bh) : 0;
328
16.7k
        const int xstart = data->overlap_flag && bx      ? imin(2 >> sx, bw) : 0;
329
330
16.7k
        static const int w[2 /* sub */][2 /* off */][2] = {
331
16.7k
            { { 27, 17 }, { 17, 27 } },
332
16.7k
            { { 23, 22 } },
333
16.7k
        };
334
335
16.7k
#define add_noise_uv(x, y, grain)                                                    \
336
6.52M
            const int lx = (bx + x) << sx;                                           \
337
6.52M
            const int ly = y << sy;                                                  \
338
6.52M
            const pixel *const luma = luma_row + ly * PXSTRIDE(luma_stride) + lx;    \
339
6.52M
            pixel avg = luma[0];                                                     \
340
6.52M
            if (sx)                                                                  \
341
6.52M
                avg = (avg + luma[1] + 1) >> 1;                                      \
342
6.52M
            const pixel *const src = src_row + (y) * PXSTRIDE(stride) + (bx + (x));  \
343
6.52M
            pixel *const dst = dst_row + (y) * PXSTRIDE(stride) + (bx + (x));        \
344
6.52M
            int val = avg;                                                           \
345
6.52M
            if (!data->chroma_scaling_from_luma) {                                   \
346
2.67M
                const int combined = avg * data->uv_luma_mult[uv] +                  \
347
2.67M
                               *src * data->uv_mult[uv];                             \
348
2.67M
                val = iclip_pixel( (combined >> 6) +                                 \
349
2.67M
                                   (data->uv_offset[uv] * (1 << bitdepth_min_8)) );  \
350
2.67M
            }                                                                        \
351
6.52M
            const int noise = round2(scaling[ val ] * (grain), data->scaling_shift); \
352
6.52M
            *dst = iclip(*src + noise, min_value, max_value);
353
354
376k
        for (int y = ystart; y < bh; y++) {
355
            // Non-overlapped image region (straightforward)
356
6.19M
            for (int x = xstart; x < bw; x++) {
357
5.83M
                int grain = sample_lut(grain_lut, offsets, sx, sy, 0, 0, x, y);
358
5.83M
                add_noise_uv(x, y, grain);
359
5.83M
            }
360
361
            // Special case for overlapped column
362
743k
            for (int x = 0; x < xstart; x++) {
363
384k
                int grain = sample_lut(grain_lut, offsets, sx, sy, 0, 0, x, y);
364
384k
                int old   = sample_lut(grain_lut, offsets, sx, sy, 1, 0, x, y);
365
384k
                grain = round2(old * w[sx][x][0] + grain * w[sx][x][1], 5);
366
384k
                grain = iclip(grain, grain_min, grain_max);
367
384k
                add_noise_uv(x, y, grain);
368
384k
            }
369
359k
        }
370
371
32.8k
        for (int y = 0; y < ystart; y++) {
372
            // Special case for overlapped row (sans corner)
373
306k
            for (int x = xstart; x < bw; x++) {
374
290k
                int grain = sample_lut(grain_lut, offsets, sx, sy, 0, 0, x, y);
375
290k
                int old   = sample_lut(grain_lut, offsets, sx, sy, 0, 1, x, y);
376
290k
                grain = round2(old * w[sy][y][0] + grain * w[sy][y][1], 5);
377
290k
                grain = iclip(grain, grain_min, grain_max);
378
290k
                add_noise_uv(x, y, grain);
379
290k
            }
380
381
            // Special case for doubly-overlapped corner
382
33.5k
            for (int x = 0; x < xstart; x++) {
383
                // Blend the top pixel with the top left block
384
17.5k
                int top = sample_lut(grain_lut, offsets, sx, sy, 0, 1, x, y);
385
17.5k
                int old = sample_lut(grain_lut, offsets, sx, sy, 1, 1, x, y);
386
17.5k
                top = round2(old * w[sx][x][0] + top * w[sx][x][1], 5);
387
17.5k
                top = iclip(top, grain_min, grain_max);
388
389
                // Blend the current pixel with the left block
390
17.5k
                int grain = sample_lut(grain_lut, offsets, sx, sy, 0, 0, x, y);
391
17.5k
                old = sample_lut(grain_lut, offsets, sx, sy, 1, 0, x, y);
392
17.5k
                grain = round2(old * w[sx][x][0] + grain * w[sx][x][1], 5);
393
17.5k
                grain = iclip(grain, grain_min, grain_max);
394
395
                // Mix the row rows together and apply to image
396
17.5k
                grain = round2(top * w[sy][y][0] + grain * w[sy][y][1], 5);
397
17.5k
                grain = iclip(grain, grain_min, grain_max);
398
17.5k
                add_noise_uv(x, y, grain);
399
17.5k
            }
400
16.0k
        }
401
16.7k
    }
402
7.18k
}
403
404
#define fguv_ss_fn(nm, ss_x, ss_y) \
405
7.21k
static decl_fguv_32x32xn_fn(fguv_32x32xn_##nm##_c) { \
406
7.21k
    fguv_32x32xn_c(dst_row, src_row, stride, data, pw, scaling, grain_lut, bh, \
407
7.21k
                   row_num, luma_row, luma_stride, uv_pl, is_id, ss_x, ss_y \
408
7.21k
                   HIGHBD_TAIL_SUFFIX); \
409
7.21k
}
filmgrain_tmpl.c:fguv_32x32xn_420_c
Line
Count
Source
405
1.88k
static decl_fguv_32x32xn_fn(fguv_32x32xn_##nm##_c) { \
406
1.88k
    fguv_32x32xn_c(dst_row, src_row, stride, data, pw, scaling, grain_lut, bh, \
407
1.88k
                   row_num, luma_row, luma_stride, uv_pl, is_id, ss_x, ss_y \
408
1.88k
                   HIGHBD_TAIL_SUFFIX); \
409
1.88k
}
filmgrain_tmpl.c:fguv_32x32xn_422_c
Line
Count
Source
405
153
static decl_fguv_32x32xn_fn(fguv_32x32xn_##nm##_c) { \
406
153
    fguv_32x32xn_c(dst_row, src_row, stride, data, pw, scaling, grain_lut, bh, \
407
153
                   row_num, luma_row, luma_stride, uv_pl, is_id, ss_x, ss_y \
408
153
                   HIGHBD_TAIL_SUFFIX); \
409
153
}
filmgrain_tmpl.c:fguv_32x32xn_444_c
Line
Count
Source
405
5.17k
static decl_fguv_32x32xn_fn(fguv_32x32xn_##nm##_c) { \
406
5.17k
    fguv_32x32xn_c(dst_row, src_row, stride, data, pw, scaling, grain_lut, bh, \
407
5.17k
                   row_num, luma_row, luma_stride, uv_pl, is_id, ss_x, ss_y \
408
5.17k
                   HIGHBD_TAIL_SUFFIX); \
409
5.17k
}
410
411
fguv_ss_fn(420, 1, 1);
412
fguv_ss_fn(422, 1, 0);
413
fguv_ss_fn(444, 0, 0);
414
415
#if HAVE_ASM
416
#if ARCH_AARCH64 || ARCH_ARM
417
#include "src/arm/filmgrain.h"
418
#elif ARCH_X86
419
#include "src/x86/filmgrain.h"
420
#endif
421
#endif
422
423
18.4k
COLD void bitfn(dav1d_film_grain_dsp_init)(Dav1dFilmGrainDSPContext *const c) {
424
18.4k
    c->generate_grain_y = generate_grain_y_c;
425
18.4k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I420 - 1] = generate_grain_uv_420_c;
426
18.4k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I422 - 1] = generate_grain_uv_422_c;
427
18.4k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I444 - 1] = generate_grain_uv_444_c;
428
429
18.4k
    c->fgy_32x32xn = fgy_32x32xn_c;
430
18.4k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I420 - 1] = fguv_32x32xn_420_c;
431
18.4k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I422 - 1] = fguv_32x32xn_422_c;
432
18.4k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I444 - 1] = fguv_32x32xn_444_c;
433
434
#if HAVE_ASM
435
#if ARCH_AARCH64 || ARCH_ARM
436
    film_grain_dsp_init_arm(c);
437
#elif ARCH_X86
438
    film_grain_dsp_init_x86(c);
439
#endif
440
#endif
441
18.4k
}
dav1d_film_grain_dsp_init_8bpc
Line
Count
Source
423
8.44k
COLD void bitfn(dav1d_film_grain_dsp_init)(Dav1dFilmGrainDSPContext *const c) {
424
8.44k
    c->generate_grain_y = generate_grain_y_c;
425
8.44k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I420 - 1] = generate_grain_uv_420_c;
426
8.44k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I422 - 1] = generate_grain_uv_422_c;
427
8.44k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I444 - 1] = generate_grain_uv_444_c;
428
429
8.44k
    c->fgy_32x32xn = fgy_32x32xn_c;
430
8.44k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I420 - 1] = fguv_32x32xn_420_c;
431
8.44k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I422 - 1] = fguv_32x32xn_422_c;
432
8.44k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I444 - 1] = fguv_32x32xn_444_c;
433
434
#if HAVE_ASM
435
#if ARCH_AARCH64 || ARCH_ARM
436
    film_grain_dsp_init_arm(c);
437
#elif ARCH_X86
438
    film_grain_dsp_init_x86(c);
439
#endif
440
#endif
441
8.44k
}
dav1d_film_grain_dsp_init_16bpc
Line
Count
Source
423
9.97k
COLD void bitfn(dav1d_film_grain_dsp_init)(Dav1dFilmGrainDSPContext *const c) {
424
9.97k
    c->generate_grain_y = generate_grain_y_c;
425
9.97k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I420 - 1] = generate_grain_uv_420_c;
426
9.97k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I422 - 1] = generate_grain_uv_422_c;
427
9.97k
    c->generate_grain_uv[DAV1D_PIXEL_LAYOUT_I444 - 1] = generate_grain_uv_444_c;
428
429
9.97k
    c->fgy_32x32xn = fgy_32x32xn_c;
430
9.97k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I420 - 1] = fguv_32x32xn_420_c;
431
9.97k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I422 - 1] = fguv_32x32xn_422_c;
432
9.97k
    c->fguv_32x32xn[DAV1D_PIXEL_LAYOUT_I444 - 1] = fguv_32x32xn_444_c;
433
434
#if HAVE_ASM
435
#if ARCH_AARCH64 || ARCH_ARM
436
    film_grain_dsp_init_arm(c);
437
#elif ARCH_X86
438
    film_grain_dsp_init_x86(c);
439
#endif
440
#endif
441
9.97k
}