Coverage Report

Created: 2026-06-16 07:20

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/dav1d/src/fg_apply_tmpl.c
Line
Count
Source
1
/*
2
 * Copyright © 2018, Niklas Haas
3
 * Copyright © 2018, VideoLAN and dav1d authors
4
 * Copyright © 2018, Two Orioles, LLC
5
 * All rights reserved.
6
 *
7
 * Redistribution and use in source and binary forms, with or without
8
 * modification, are permitted provided that the following conditions are met:
9
 *
10
 * 1. Redistributions of source code must retain the above copyright notice, this
11
 *    list of conditions and the following disclaimer.
12
 *
13
 * 2. Redistributions in binary form must reproduce the above copyright notice,
14
 *    this list of conditions and the following disclaimer in the documentation
15
 *    and/or other materials provided with the distribution.
16
 *
17
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
18
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
19
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
20
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
21
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
22
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
23
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
24
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
26
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
 */
28
29
#include "config.h"
30
31
#include <stdint.h>
32
33
#include "dav1d/common.h"
34
#include "dav1d/picture.h"
35
36
#include "common/intops.h"
37
#include "common/bitdepth.h"
38
39
#include "src/fg_apply.h"
40
41
static void generate_scaling(const int bitdepth,
42
                             const uint8_t points[][2], const int num,
43
                             uint8_t scaling[SCALING_SIZE])
44
1.40k
{
45
1.40k
#if BITDEPTH == 8
46
1.40k
    const int shift_x = 0;
47
1.40k
    const int scaling_size = SCALING_SIZE;
48
#else
49
    assert(bitdepth > 8);
50
    const int shift_x = bitdepth - 8;
51
    const int scaling_size = 1 << bitdepth;
52
#endif
53
54
1.40k
    if (num == 0) {
55
85
        memset(scaling, 0, scaling_size);
56
85
        return;
57
85
    }
58
59
    // Fill up the preceding entries with the initial value
60
1.32k
    memset(scaling, points[0][1], points[0][0] << shift_x);
61
62
    // Linearly interpolate the values in the middle
63
1.88k
    for (int i = 0; i < num - 1; i++) {
64
558
        const int bx = points[i][0];
65
558
        const int by = points[i][1];
66
558
        const int ex = points[i+1][0];
67
558
        const int ey = points[i+1][1];
68
558
        const int dx = ex - bx;
69
558
        const int dy = ey - by;
70
558
        assert(dx > 0);
71
558
        const int delta = dy * ((0x10000 + (dx >> 1)) / dx);
72
40.5k
        for (int x = 0, d = 0x8000; x < dx; x++) {
73
40.0k
            scaling[(bx + x) << shift_x] = by + (d >> 16);
74
40.0k
            d += delta;
75
40.0k
        }
76
558
    }
77
78
    // Fill up the remaining entries with the final value
79
1.32k
    const int n = points[num - 1][0] << shift_x;
80
1.32k
    memset(&scaling[n], points[num - 1][1], scaling_size - n);
81
82
#if BITDEPTH != 8
83
    const int pad = 1 << shift_x, rnd = pad >> 1;
84
    for (int i = 0; i < num - 1; i++) {
85
        const int bx = points[i][0] << shift_x;
86
        const int ex = points[i+1][0] << shift_x;
87
        const int dx = ex - bx;
88
        for (int x = 0; x < dx; x += pad) {
89
            const int range = scaling[bx + x + pad] - scaling[bx + x];
90
            for (int n = 1, r = rnd; n < pad; n++) {
91
                r += range;
92
                scaling[bx + x + n] = scaling[bx + x] + (r >> shift_x);
93
            }
94
        }
95
    }
96
#endif
97
1.32k
}
98
99
#ifndef UNIT_TEST
100
void bitfn(dav1d_prep_grain)(const Dav1dFilmGrainDSPContext *const dsp,
101
                             Dav1dPicture *const out,
102
                             const Dav1dPicture *const in,
103
                             uint8_t scaling[3][SCALING_SIZE],
104
                             entry grain_lut[3][GRAIN_HEIGHT+1][GRAIN_WIDTH])
105
2.30k
{
106
2.30k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
107
#if BITDEPTH != 8
108
    const int bitdepth_max = (1 << out->p.bpc) - 1;
109
#endif
110
111
    // Generate grain LUTs as needed
112
2.30k
    dsp->generate_grain_y(grain_lut[0], data HIGHBD_TAIL_SUFFIX); // always needed
113
2.30k
    if (data->num_uv_points[0] || data->chroma_scaling_from_luma)
114
1.99k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[1], grain_lut[0],
115
1.99k
                                                 data, 0 HIGHBD_TAIL_SUFFIX);
116
2.30k
    if (data->num_uv_points[1] || data->chroma_scaling_from_luma)
117
2.03k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[2], grain_lut[0],
118
2.03k
                                                 data, 1 HIGHBD_TAIL_SUFFIX);
119
120
    // Generate scaling LUTs as needed
121
2.30k
    if (data->num_y_points || data->chroma_scaling_from_luma)
122
2.26k
        generate_scaling(in->p.bpc, data->y_points, data->num_y_points, scaling[0]);
123
2.30k
    if (data->num_uv_points[0])
124
328
        generate_scaling(in->p.bpc, data->uv_points[0], data->num_uv_points[0], scaling[1]);
125
2.30k
    if (data->num_uv_points[1])
126
360
        generate_scaling(in->p.bpc, data->uv_points[1], data->num_uv_points[1], scaling[2]);
127
128
    // Copy over the non-modified planes
129
2.30k
    assert(out->stride[0] == in->stride[0]);
130
2.30k
    if (!data->num_y_points) {
131
208
        const ptrdiff_t stride = out->stride[0];
132
208
        const ptrdiff_t sz = out->p.h * stride;
133
208
        if (sz < 0)
134
0
            memcpy((uint8_t*) out->data[0] + sz - stride,
135
0
                   (uint8_t*) in->data[0] + sz - stride, -sz);
136
208
        else
137
208
            memcpy(out->data[0], in->data[0], sz);
138
208
    }
139
140
2.30k
    if (in->p.layout != DAV1D_PIXEL_LAYOUT_I400 && !data->chroma_scaling_from_luma) {
141
499
        assert(out->stride[1] == in->stride[1]);
142
499
        const int ss_ver = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
143
499
        const ptrdiff_t stride = out->stride[1];
144
499
        const ptrdiff_t sz = ((out->p.h + ss_ver) >> ss_ver) * stride;
145
499
        if (sz < 0) {
146
0
            if (!data->num_uv_points[0])
147
0
                memcpy((uint8_t*) out->data[1] + sz - stride,
148
0
                       (uint8_t*) in->data[1] + sz - stride, -sz);
149
0
            if (!data->num_uv_points[1])
150
0
                memcpy((uint8_t*) out->data[2] + sz - stride,
151
0
                       (uint8_t*) in->data[2] + sz - stride, -sz);
152
499
        } else {
153
499
            if (!data->num_uv_points[0])
154
171
                memcpy(out->data[1], in->data[1], sz);
155
499
            if (!data->num_uv_points[1])
156
139
                memcpy(out->data[2], in->data[2], sz);
157
499
        }
158
499
    }
159
2.30k
}
dav1d_prep_grain_8bpc
Line
Count
Source
105
1.14k
{
106
1.14k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
107
#if BITDEPTH != 8
108
    const int bitdepth_max = (1 << out->p.bpc) - 1;
109
#endif
110
111
    // Generate grain LUTs as needed
112
1.14k
    dsp->generate_grain_y(grain_lut[0], data HIGHBD_TAIL_SUFFIX); // always needed
113
1.14k
    if (data->num_uv_points[0] || data->chroma_scaling_from_luma)
114
957
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[1], grain_lut[0],
115
957
                                                 data, 0 HIGHBD_TAIL_SUFFIX);
116
1.14k
    if (data->num_uv_points[1] || data->chroma_scaling_from_luma)
117
989
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[2], grain_lut[0],
118
989
                                                 data, 1 HIGHBD_TAIL_SUFFIX);
119
120
    // Generate scaling LUTs as needed
121
1.14k
    if (data->num_y_points || data->chroma_scaling_from_luma)
122
1.10k
        generate_scaling(in->p.bpc, data->y_points, data->num_y_points, scaling[0]);
123
1.14k
    if (data->num_uv_points[0])
124
134
        generate_scaling(in->p.bpc, data->uv_points[0], data->num_uv_points[0], scaling[1]);
125
1.14k
    if (data->num_uv_points[1])
126
166
        generate_scaling(in->p.bpc, data->uv_points[1], data->num_uv_points[1], scaling[2]);
127
128
    // Copy over the non-modified planes
129
1.14k
    assert(out->stride[0] == in->stride[0]);
130
1.14k
    if (!data->num_y_points) {
131
118
        const ptrdiff_t stride = out->stride[0];
132
118
        const ptrdiff_t sz = out->p.h * stride;
133
118
        if (sz < 0)
134
0
            memcpy((uint8_t*) out->data[0] + sz - stride,
135
0
                   (uint8_t*) in->data[0] + sz - stride, -sz);
136
118
        else
137
118
            memcpy(out->data[0], in->data[0], sz);
138
118
    }
139
140
1.14k
    if (in->p.layout != DAV1D_PIXEL_LAYOUT_I400 && !data->chroma_scaling_from_luma) {
141
267
        assert(out->stride[1] == in->stride[1]);
142
267
        const int ss_ver = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
143
267
        const ptrdiff_t stride = out->stride[1];
144
267
        const ptrdiff_t sz = ((out->p.h + ss_ver) >> ss_ver) * stride;
145
267
        if (sz < 0) {
146
0
            if (!data->num_uv_points[0])
147
0
                memcpy((uint8_t*) out->data[1] + sz - stride,
148
0
                       (uint8_t*) in->data[1] + sz - stride, -sz);
149
0
            if (!data->num_uv_points[1])
150
0
                memcpy((uint8_t*) out->data[2] + sz - stride,
151
0
                       (uint8_t*) in->data[2] + sz - stride, -sz);
152
267
        } else {
153
267
            if (!data->num_uv_points[0])
154
133
                memcpy(out->data[1], in->data[1], sz);
155
267
            if (!data->num_uv_points[1])
156
101
                memcpy(out->data[2], in->data[2], sz);
157
267
        }
158
267
    }
159
1.14k
}
dav1d_prep_grain_16bpc
Line
Count
Source
105
1.16k
{
106
1.16k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
107
1.16k
#if BITDEPTH != 8
108
1.16k
    const int bitdepth_max = (1 << out->p.bpc) - 1;
109
1.16k
#endif
110
111
    // Generate grain LUTs as needed
112
1.16k
    dsp->generate_grain_y(grain_lut[0], data HIGHBD_TAIL_SUFFIX); // always needed
113
1.16k
    if (data->num_uv_points[0] || data->chroma_scaling_from_luma)
114
1.04k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[1], grain_lut[0],
115
1.04k
                                                 data, 0 HIGHBD_TAIL_SUFFIX);
116
1.16k
    if (data->num_uv_points[1] || data->chroma_scaling_from_luma)
117
1.04k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[2], grain_lut[0],
118
1.04k
                                                 data, 1 HIGHBD_TAIL_SUFFIX);
119
120
    // Generate scaling LUTs as needed
121
1.16k
    if (data->num_y_points || data->chroma_scaling_from_luma)
122
1.15k
        generate_scaling(in->p.bpc, data->y_points, data->num_y_points, scaling[0]);
123
1.16k
    if (data->num_uv_points[0])
124
194
        generate_scaling(in->p.bpc, data->uv_points[0], data->num_uv_points[0], scaling[1]);
125
1.16k
    if (data->num_uv_points[1])
126
194
        generate_scaling(in->p.bpc, data->uv_points[1], data->num_uv_points[1], scaling[2]);
127
128
    // Copy over the non-modified planes
129
1.16k
    assert(out->stride[0] == in->stride[0]);
130
1.16k
    if (!data->num_y_points) {
131
90
        const ptrdiff_t stride = out->stride[0];
132
90
        const ptrdiff_t sz = out->p.h * stride;
133
90
        if (sz < 0)
134
0
            memcpy((uint8_t*) out->data[0] + sz - stride,
135
0
                   (uint8_t*) in->data[0] + sz - stride, -sz);
136
90
        else
137
90
            memcpy(out->data[0], in->data[0], sz);
138
90
    }
139
140
1.16k
    if (in->p.layout != DAV1D_PIXEL_LAYOUT_I400 && !data->chroma_scaling_from_luma) {
141
232
        assert(out->stride[1] == in->stride[1]);
142
232
        const int ss_ver = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
143
232
        const ptrdiff_t stride = out->stride[1];
144
232
        const ptrdiff_t sz = ((out->p.h + ss_ver) >> ss_ver) * stride;
145
232
        if (sz < 0) {
146
0
            if (!data->num_uv_points[0])
147
0
                memcpy((uint8_t*) out->data[1] + sz - stride,
148
0
                       (uint8_t*) in->data[1] + sz - stride, -sz);
149
0
            if (!data->num_uv_points[1])
150
0
                memcpy((uint8_t*) out->data[2] + sz - stride,
151
0
                       (uint8_t*) in->data[2] + sz - stride, -sz);
152
232
        } else {
153
232
            if (!data->num_uv_points[0])
154
38
                memcpy(out->data[1], in->data[1], sz);
155
232
            if (!data->num_uv_points[1])
156
38
                memcpy(out->data[2], in->data[2], sz);
157
232
        }
158
232
    }
159
1.16k
}
160
161
void bitfn(dav1d_apply_grain_row)(const Dav1dFilmGrainDSPContext *const dsp,
162
                                  Dav1dPicture *const out,
163
                                  const Dav1dPicture *const in,
164
                                  const uint8_t scaling[3][SCALING_SIZE],
165
                                  const entry grain_lut[3][GRAIN_HEIGHT+1][GRAIN_WIDTH],
166
                                  const int row)
167
28.6k
{
168
    // Synthesize grain for the affected planes
169
28.6k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
170
28.6k
    const int ss_y = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
171
28.6k
    const int ss_x = in->p.layout != DAV1D_PIXEL_LAYOUT_I444;
172
28.6k
    const int cpw = (out->p.w + ss_x) >> ss_x;
173
28.6k
    const int is_id = out->seq_hdr->mtrx == DAV1D_MC_IDENTITY;
174
28.6k
    pixel *const luma_src =
175
28.6k
        ((pixel *) in->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(in->stride[0]);
176
#if BITDEPTH != 8
177
    const int bitdepth_max = (1 << out->p.bpc) - 1;
178
#endif
179
180
28.6k
    if (data->num_y_points) {
181
25.0k
        const int bh = imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE);
182
25.0k
        dsp->fgy_32x32xn(((pixel *) out->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[0]),
183
25.0k
                         luma_src, out->stride[0], data,
184
25.0k
                         out->p.w, scaling[0], grain_lut[0], bh, row HIGHBD_TAIL_SUFFIX);
185
25.0k
    }
186
187
28.6k
    if (!data->num_uv_points[0] && !data->num_uv_points[1] &&
188
26.5k
        !data->chroma_scaling_from_luma)
189
6.03k
    {
190
6.03k
        return;
191
6.03k
    }
192
193
22.6k
    const int bh = (imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE) + ss_y) >> ss_y;
194
195
    // extend padding pixels
196
22.6k
    if (out->p.w & ss_x) {
197
4.07k
        pixel *ptr = luma_src;
198
63.3k
        for (int y = 0; y < bh; y++) {
199
59.3k
            ptr[out->p.w] = ptr[out->p.w - 1];
200
59.3k
            ptr += PXSTRIDE(in->stride[0]) << ss_y;
201
59.3k
        }
202
4.07k
    }
203
204
22.6k
    const ptrdiff_t uv_off = row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[1]) >> ss_y;
205
22.6k
    if (data->chroma_scaling_from_luma) {
206
61.1k
        for (int pl = 0; pl < 2; pl++)
207
40.6k
            dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
208
40.6k
                                                ((const pixel *) in->data[1 + pl]) + uv_off,
209
40.6k
                                                in->stride[1], data, cpw,
210
40.6k
                                                scaling[0], grain_lut[1 + pl],
211
40.6k
                                                bh, row, luma_src, in->stride[0],
212
40.6k
                                                pl, is_id HIGHBD_TAIL_SUFFIX);
213
20.5k
    } else {
214
5.83k
        for (int pl = 0; pl < 2; pl++)
215
3.71k
            if (data->num_uv_points[pl])
216
3.59k
                dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
217
3.59k
                                                    ((const pixel *) in->data[1 + pl]) + uv_off,
218
3.59k
                                                    in->stride[1], data, cpw,
219
3.59k
                                                    scaling[1 + pl], grain_lut[1 + pl],
220
3.59k
                                                    bh, row, luma_src, in->stride[0],
221
3.59k
                                                    pl, is_id HIGHBD_TAIL_SUFFIX);
222
2.12k
    }
223
22.6k
}
dav1d_apply_grain_row_8bpc
Line
Count
Source
167
13.9k
{
168
    // Synthesize grain for the affected planes
169
13.9k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
170
13.9k
    const int ss_y = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
171
13.9k
    const int ss_x = in->p.layout != DAV1D_PIXEL_LAYOUT_I444;
172
13.9k
    const int cpw = (out->p.w + ss_x) >> ss_x;
173
13.9k
    const int is_id = out->seq_hdr->mtrx == DAV1D_MC_IDENTITY;
174
13.9k
    pixel *const luma_src =
175
13.9k
        ((pixel *) in->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(in->stride[0]);
176
#if BITDEPTH != 8
177
    const int bitdepth_max = (1 << out->p.bpc) - 1;
178
#endif
179
180
13.9k
    if (data->num_y_points) {
181
11.1k
        const int bh = imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE);
182
11.1k
        dsp->fgy_32x32xn(((pixel *) out->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[0]),
183
11.1k
                         luma_src, out->stride[0], data,
184
11.1k
                         out->p.w, scaling[0], grain_lut[0], bh, row HIGHBD_TAIL_SUFFIX);
185
11.1k
    }
186
187
13.9k
    if (!data->num_uv_points[0] && !data->num_uv_points[1] &&
188
13.2k
        !data->chroma_scaling_from_luma)
189
1.27k
    {
190
1.27k
        return;
191
1.27k
    }
192
193
12.6k
    const int bh = (imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE) + ss_y) >> ss_y;
194
195
    // extend padding pixels
196
12.6k
    if (out->p.w & ss_x) {
197
1.76k
        pixel *ptr = luma_src;
198
27.4k
        for (int y = 0; y < bh; y++) {
199
25.7k
            ptr[out->p.w] = ptr[out->p.w - 1];
200
25.7k
            ptr += PXSTRIDE(in->stride[0]) << ss_y;
201
25.7k
        }
202
1.76k
    }
203
204
12.6k
    const ptrdiff_t uv_off = row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[1]) >> ss_y;
205
12.6k
    if (data->chroma_scaling_from_luma) {
206
35.6k
        for (int pl = 0; pl < 2; pl++)
207
23.6k
            dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
208
23.6k
                                                ((const pixel *) in->data[1 + pl]) + uv_off,
209
23.6k
                                                in->stride[1], data, cpw,
210
23.6k
                                                scaling[0], grain_lut[1 + pl],
211
23.6k
                                                bh, row, luma_src, in->stride[0],
212
23.6k
                                                pl, is_id HIGHBD_TAIL_SUFFIX);
213
11.9k
    } else {
214
1.73k
        for (int pl = 0; pl < 2; pl++)
215
1.05k
            if (data->num_uv_points[pl])
216
997
                dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
217
997
                                                    ((const pixel *) in->data[1 + pl]) + uv_off,
218
997
                                                    in->stride[1], data, cpw,
219
997
                                                    scaling[1 + pl], grain_lut[1 + pl],
220
997
                                                    bh, row, luma_src, in->stride[0],
221
997
                                                    pl, is_id HIGHBD_TAIL_SUFFIX);
222
679
    }
223
12.6k
}
dav1d_apply_grain_row_16bpc
Line
Count
Source
167
14.7k
{
168
    // Synthesize grain for the affected planes
169
14.7k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
170
14.7k
    const int ss_y = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
171
14.7k
    const int ss_x = in->p.layout != DAV1D_PIXEL_LAYOUT_I444;
172
14.7k
    const int cpw = (out->p.w + ss_x) >> ss_x;
173
14.7k
    const int is_id = out->seq_hdr->mtrx == DAV1D_MC_IDENTITY;
174
14.7k
    pixel *const luma_src =
175
14.7k
        ((pixel *) in->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(in->stride[0]);
176
14.7k
#if BITDEPTH != 8
177
14.7k
    const int bitdepth_max = (1 << out->p.bpc) - 1;
178
14.7k
#endif
179
180
14.7k
    if (data->num_y_points) {
181
13.8k
        const int bh = imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE);
182
13.8k
        dsp->fgy_32x32xn(((pixel *) out->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[0]),
183
13.8k
                         luma_src, out->stride[0], data,
184
13.8k
                         out->p.w, scaling[0], grain_lut[0], bh, row HIGHBD_TAIL_SUFFIX);
185
13.8k
    }
186
187
14.7k
    if (!data->num_uv_points[0] && !data->num_uv_points[1] &&
188
13.2k
        !data->chroma_scaling_from_luma)
189
4.76k
    {
190
4.76k
        return;
191
4.76k
    }
192
193
9.98k
    const int bh = (imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE) + ss_y) >> ss_y;
194
195
    // extend padding pixels
196
9.98k
    if (out->p.w & ss_x) {
197
2.30k
        pixel *ptr = luma_src;
198
35.9k
        for (int y = 0; y < bh; y++) {
199
33.6k
            ptr[out->p.w] = ptr[out->p.w - 1];
200
33.6k
            ptr += PXSTRIDE(in->stride[0]) << ss_y;
201
33.6k
        }
202
2.30k
    }
203
204
9.98k
    const ptrdiff_t uv_off = row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[1]) >> ss_y;
205
9.98k
    if (data->chroma_scaling_from_luma) {
206
25.5k
        for (int pl = 0; pl < 2; pl++)
207
16.9k
            dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
208
16.9k
                                                ((const pixel *) in->data[1 + pl]) + uv_off,
209
16.9k
                                                in->stride[1], data, cpw,
210
16.9k
                                                scaling[0], grain_lut[1 + pl],
211
16.9k
                                                bh, row, luma_src, in->stride[0],
212
16.9k
                                                pl, is_id HIGHBD_TAIL_SUFFIX);
213
8.53k
    } else {
214
4.10k
        for (int pl = 0; pl < 2; pl++)
215
2.66k
            if (data->num_uv_points[pl])
216
2.59k
                dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
217
2.59k
                                                    ((const pixel *) in->data[1 + pl]) + uv_off,
218
2.59k
                                                    in->stride[1], data, cpw,
219
2.59k
                                                    scaling[1 + pl], grain_lut[1 + pl],
220
2.59k
                                                    bh, row, luma_src, in->stride[0],
221
2.59k
                                                    pl, is_id HIGHBD_TAIL_SUFFIX);
222
1.44k
    }
223
9.98k
}
224
225
void bitfn(dav1d_apply_grain)(const Dav1dFilmGrainDSPContext *const dsp,
226
                              Dav1dPicture *const out,
227
                              const Dav1dPicture *const in)
228
0
{
229
0
    ALIGN_STK_16(entry, grain_lut, 3,[GRAIN_HEIGHT + 1][GRAIN_WIDTH]);
230
#if ARCH_X86_64 && BITDEPTH == 8
231
0
    ALIGN_STK_64(uint8_t, scaling, 3,[SCALING_SIZE]);
232
#else
233
    uint8_t scaling[3][SCALING_SIZE];
234
#endif
235
0
    const int rows = (out->p.h + FG_BLOCK_SIZE - 1) / FG_BLOCK_SIZE;
236
237
0
    bitfn(dav1d_prep_grain)(dsp, out, in, scaling, grain_lut);
238
0
    for (int row = 0; row < rows; row++)
239
0
        bitfn(dav1d_apply_grain_row)(dsp, out, in, scaling, grain_lut, row);
240
0
}
Unexecuted instantiation: dav1d_apply_grain_8bpc
Unexecuted instantiation: dav1d_apply_grain_16bpc
241
#endif