Coverage Report

Created: 2026-06-15 06:25

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/work/dav1d/src/fg_apply_tmpl.c
Line
Count
Source
1
/*
2
 * Copyright © 2018, Niklas Haas
3
 * Copyright © 2018, VideoLAN and dav1d authors
4
 * Copyright © 2018, Two Orioles, LLC
5
 * All rights reserved.
6
 *
7
 * Redistribution and use in source and binary forms, with or without
8
 * modification, are permitted provided that the following conditions are met:
9
 *
10
 * 1. Redistributions of source code must retain the above copyright notice, this
11
 *    list of conditions and the following disclaimer.
12
 *
13
 * 2. Redistributions in binary form must reproduce the above copyright notice,
14
 *    this list of conditions and the following disclaimer in the documentation
15
 *    and/or other materials provided with the distribution.
16
 *
17
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
18
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
19
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
20
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
21
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
22
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
23
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
24
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
26
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27
 */
28
29
#include "config.h"
30
31
#include <stdint.h>
32
33
#include "dav1d/common.h"
34
#include "dav1d/picture.h"
35
36
#include "common/intops.h"
37
#include "common/bitdepth.h"
38
39
#include "src/fg_apply.h"
40
41
static void generate_scaling(const int bitdepth,
42
                             const uint8_t points[][2], const int num,
43
                             uint8_t scaling[SCALING_SIZE])
44
2.77k
{
45
2.77k
#if BITDEPTH == 8
46
2.77k
    const int shift_x = 0;
47
2.77k
    const int scaling_size = SCALING_SIZE;
48
#else
49
    assert(bitdepth > 8);
50
    const int shift_x = bitdepth - 8;
51
    const int scaling_size = 1 << bitdepth;
52
#endif
53
54
2.77k
    if (num == 0) {
55
213
        memset(scaling, 0, scaling_size);
56
213
        return;
57
213
    }
58
59
    // Fill up the preceding entries with the initial value
60
2.55k
    memset(scaling, points[0][1], points[0][0] << shift_x);
61
62
    // Linearly interpolate the values in the middle
63
3.74k
    for (int i = 0; i < num - 1; i++) {
64
1.18k
        const int bx = points[i][0];
65
1.18k
        const int by = points[i][1];
66
1.18k
        const int ex = points[i+1][0];
67
1.18k
        const int ey = points[i+1][1];
68
1.18k
        const int dx = ex - bx;
69
1.18k
        const int dy = ey - by;
70
1.18k
        assert(dx > 0);
71
1.18k
        const int delta = dy * ((0x10000 + (dx >> 1)) / dx);
72
94.8k
        for (int x = 0, d = 0x8000; x < dx; x++) {
73
93.6k
            scaling[(bx + x) << shift_x] = by + (d >> 16);
74
93.6k
            d += delta;
75
93.6k
        }
76
1.18k
    }
77
78
    // Fill up the remaining entries with the final value
79
2.55k
    const int n = points[num - 1][0] << shift_x;
80
2.55k
    memset(&scaling[n], points[num - 1][1], scaling_size - n);
81
82
#if BITDEPTH != 8
83
    const int pad = 1 << shift_x, rnd = pad >> 1;
84
    for (int i = 0; i < num - 1; i++) {
85
        const int bx = points[i][0] << shift_x;
86
        const int ex = points[i+1][0] << shift_x;
87
        const int dx = ex - bx;
88
        for (int x = 0; x < dx; x += pad) {
89
            const int range = scaling[bx + x + pad] - scaling[bx + x];
90
            for (int n = 1, r = rnd; n < pad; n++) {
91
                r += range;
92
                scaling[bx + x + n] = scaling[bx + x] + (r >> shift_x);
93
            }
94
        }
95
    }
96
#endif
97
2.55k
}
98
99
#ifndef UNIT_TEST
100
void bitfn(dav1d_prep_grain)(const Dav1dFilmGrainDSPContext *const dsp,
101
                             Dav1dPicture *const out,
102
                             const Dav1dPicture *const in,
103
                             uint8_t scaling[3][SCALING_SIZE],
104
                             entry grain_lut[3][GRAIN_HEIGHT+1][GRAIN_WIDTH])
105
4.57k
{
106
4.57k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
107
#if BITDEPTH != 8
108
    const int bitdepth_max = (1 << out->p.bpc) - 1;
109
#endif
110
111
    // Generate grain LUTs as needed
112
4.57k
    dsp->generate_grain_y(grain_lut[0], data HIGHBD_TAIL_SUFFIX); // always needed
113
4.57k
    if (data->num_uv_points[0] || data->chroma_scaling_from_luma)
114
3.29k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[1], grain_lut[0],
115
3.29k
                                                 data, 0 HIGHBD_TAIL_SUFFIX);
116
4.57k
    if (data->num_uv_points[1] || data->chroma_scaling_from_luma)
117
3.29k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[2], grain_lut[0],
118
3.29k
                                                 data, 1 HIGHBD_TAIL_SUFFIX);
119
120
    // Generate scaling LUTs as needed
121
4.57k
    if (data->num_y_points || data->chroma_scaling_from_luma)
122
3.92k
        generate_scaling(in->p.bpc, data->y_points, data->num_y_points, scaling[0]);
123
4.57k
    if (data->num_uv_points[0])
124
965
        generate_scaling(in->p.bpc, data->uv_points[0], data->num_uv_points[0], scaling[1]);
125
4.57k
    if (data->num_uv_points[1])
126
971
        generate_scaling(in->p.bpc, data->uv_points[1], data->num_uv_points[1], scaling[2]);
127
128
    // Copy over the non-modified planes
129
4.57k
    assert(out->stride[0] == in->stride[0]);
130
4.57k
    if (!data->num_y_points) {
131
1.38k
        const ptrdiff_t stride = out->stride[0];
132
1.38k
        const ptrdiff_t sz = out->p.h * stride;
133
1.38k
        if (sz < 0)
134
0
            memcpy((uint8_t*) out->data[0] + sz - stride,
135
0
                   (uint8_t*) in->data[0] + sz - stride, -sz);
136
1.38k
        else
137
1.38k
            memcpy(out->data[0], in->data[0], sz);
138
1.38k
    }
139
140
4.57k
    if (in->p.layout != DAV1D_PIXEL_LAYOUT_I400 && !data->chroma_scaling_from_luma) {
141
1.83k
        assert(out->stride[1] == in->stride[1]);
142
1.83k
        const int ss_ver = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
143
1.83k
        const ptrdiff_t stride = out->stride[1];
144
1.83k
        const ptrdiff_t sz = ((out->p.h + ss_ver) >> ss_ver) * stride;
145
1.83k
        if (sz < 0) {
146
0
            if (!data->num_uv_points[0])
147
0
                memcpy((uint8_t*) out->data[1] + sz - stride,
148
0
                       (uint8_t*) in->data[1] + sz - stride, -sz);
149
0
            if (!data->num_uv_points[1])
150
0
                memcpy((uint8_t*) out->data[2] + sz - stride,
151
0
                       (uint8_t*) in->data[2] + sz - stride, -sz);
152
1.83k
        } else {
153
1.83k
            if (!data->num_uv_points[0])
154
872
                memcpy(out->data[1], in->data[1], sz);
155
1.83k
            if (!data->num_uv_points[1])
156
866
                memcpy(out->data[2], in->data[2], sz);
157
1.83k
        }
158
1.83k
    }
159
4.57k
}
dav1d_prep_grain_8bpc
Line
Count
Source
105
2.19k
{
106
2.19k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
107
#if BITDEPTH != 8
108
    const int bitdepth_max = (1 << out->p.bpc) - 1;
109
#endif
110
111
    // Generate grain LUTs as needed
112
2.19k
    dsp->generate_grain_y(grain_lut[0], data HIGHBD_TAIL_SUFFIX); // always needed
113
2.19k
    if (data->num_uv_points[0] || data->chroma_scaling_from_luma)
114
1.49k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[1], grain_lut[0],
115
1.49k
                                                 data, 0 HIGHBD_TAIL_SUFFIX);
116
2.19k
    if (data->num_uv_points[1] || data->chroma_scaling_from_luma)
117
1.65k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[2], grain_lut[0],
118
1.65k
                                                 data, 1 HIGHBD_TAIL_SUFFIX);
119
120
    // Generate scaling LUTs as needed
121
2.19k
    if (data->num_y_points || data->chroma_scaling_from_luma)
122
1.80k
        generate_scaling(in->p.bpc, data->y_points, data->num_y_points, scaling[0]);
123
2.19k
    if (data->num_uv_points[0])
124
402
        generate_scaling(in->p.bpc, data->uv_points[0], data->num_uv_points[0], scaling[1]);
125
2.19k
    if (data->num_uv_points[1])
126
564
        generate_scaling(in->p.bpc, data->uv_points[1], data->num_uv_points[1], scaling[2]);
127
128
    // Copy over the non-modified planes
129
2.19k
    assert(out->stride[0] == in->stride[0]);
130
2.19k
    if (!data->num_y_points) {
131
604
        const ptrdiff_t stride = out->stride[0];
132
604
        const ptrdiff_t sz = out->p.h * stride;
133
604
        if (sz < 0)
134
0
            memcpy((uint8_t*) out->data[0] + sz - stride,
135
0
                   (uint8_t*) in->data[0] + sz - stride, -sz);
136
604
        else
137
604
            memcpy(out->data[0], in->data[0], sz);
138
604
    }
139
140
2.19k
    if (in->p.layout != DAV1D_PIXEL_LAYOUT_I400 && !data->chroma_scaling_from_luma) {
141
900
        assert(out->stride[1] == in->stride[1]);
142
900
        const int ss_ver = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
143
900
        const ptrdiff_t stride = out->stride[1];
144
900
        const ptrdiff_t sz = ((out->p.h + ss_ver) >> ss_ver) * stride;
145
900
        if (sz < 0) {
146
0
            if (!data->num_uv_points[0])
147
0
                memcpy((uint8_t*) out->data[1] + sz - stride,
148
0
                       (uint8_t*) in->data[1] + sz - stride, -sz);
149
0
            if (!data->num_uv_points[1])
150
0
                memcpy((uint8_t*) out->data[2] + sz - stride,
151
0
                       (uint8_t*) in->data[2] + sz - stride, -sz);
152
900
        } else {
153
900
            if (!data->num_uv_points[0])
154
498
                memcpy(out->data[1], in->data[1], sz);
155
900
            if (!data->num_uv_points[1])
156
336
                memcpy(out->data[2], in->data[2], sz);
157
900
        }
158
900
    }
159
2.19k
}
dav1d_prep_grain_16bpc
Line
Count
Source
105
2.37k
{
106
2.37k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
107
2.37k
#if BITDEPTH != 8
108
2.37k
    const int bitdepth_max = (1 << out->p.bpc) - 1;
109
2.37k
#endif
110
111
    // Generate grain LUTs as needed
112
2.37k
    dsp->generate_grain_y(grain_lut[0], data HIGHBD_TAIL_SUFFIX); // always needed
113
2.37k
    if (data->num_uv_points[0] || data->chroma_scaling_from_luma)
114
1.79k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[1], grain_lut[0],
115
1.79k
                                                 data, 0 HIGHBD_TAIL_SUFFIX);
116
2.37k
    if (data->num_uv_points[1] || data->chroma_scaling_from_luma)
117
1.63k
        dsp->generate_grain_uv[in->p.layout - 1](grain_lut[2], grain_lut[0],
118
1.63k
                                                 data, 1 HIGHBD_TAIL_SUFFIX);
119
120
    // Generate scaling LUTs as needed
121
2.37k
    if (data->num_y_points || data->chroma_scaling_from_luma)
122
2.12k
        generate_scaling(in->p.bpc, data->y_points, data->num_y_points, scaling[0]);
123
2.37k
    if (data->num_uv_points[0])
124
563
        generate_scaling(in->p.bpc, data->uv_points[0], data->num_uv_points[0], scaling[1]);
125
2.37k
    if (data->num_uv_points[1])
126
407
        generate_scaling(in->p.bpc, data->uv_points[1], data->num_uv_points[1], scaling[2]);
127
128
    // Copy over the non-modified planes
129
2.37k
    assert(out->stride[0] == in->stride[0]);
130
2.37k
    if (!data->num_y_points) {
131
781
        const ptrdiff_t stride = out->stride[0];
132
781
        const ptrdiff_t sz = out->p.h * stride;
133
781
        if (sz < 0)
134
0
            memcpy((uint8_t*) out->data[0] + sz - stride,
135
0
                   (uint8_t*) in->data[0] + sz - stride, -sz);
136
781
        else
137
781
            memcpy(out->data[0], in->data[0], sz);
138
781
    }
139
140
2.37k
    if (in->p.layout != DAV1D_PIXEL_LAYOUT_I400 && !data->chroma_scaling_from_luma) {
141
937
        assert(out->stride[1] == in->stride[1]);
142
937
        const int ss_ver = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
143
937
        const ptrdiff_t stride = out->stride[1];
144
937
        const ptrdiff_t sz = ((out->p.h + ss_ver) >> ss_ver) * stride;
145
937
        if (sz < 0) {
146
0
            if (!data->num_uv_points[0])
147
0
                memcpy((uint8_t*) out->data[1] + sz - stride,
148
0
                       (uint8_t*) in->data[1] + sz - stride, -sz);
149
0
            if (!data->num_uv_points[1])
150
0
                memcpy((uint8_t*) out->data[2] + sz - stride,
151
0
                       (uint8_t*) in->data[2] + sz - stride, -sz);
152
937
        } else {
153
937
            if (!data->num_uv_points[0])
154
374
                memcpy(out->data[1], in->data[1], sz);
155
937
            if (!data->num_uv_points[1])
156
530
                memcpy(out->data[2], in->data[2], sz);
157
937
        }
158
937
    }
159
2.37k
}
160
161
void bitfn(dav1d_apply_grain_row)(const Dav1dFilmGrainDSPContext *const dsp,
162
                                  Dav1dPicture *const out,
163
                                  const Dav1dPicture *const in,
164
                                  const uint8_t scaling[3][SCALING_SIZE],
165
                                  const entry grain_lut[3][GRAIN_HEIGHT+1][GRAIN_WIDTH],
166
                                  const int row)
167
45.0k
{
168
    // Synthesize grain for the affected planes
169
45.0k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
170
45.0k
    const int ss_y = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
171
45.0k
    const int ss_x = in->p.layout != DAV1D_PIXEL_LAYOUT_I444;
172
45.0k
    const int cpw = (out->p.w + ss_x) >> ss_x;
173
45.0k
    const int is_id = out->seq_hdr->mtrx == DAV1D_MC_IDENTITY;
174
45.0k
    pixel *const luma_src =
175
45.0k
        ((pixel *) in->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(in->stride[0]);
176
#if BITDEPTH != 8
177
    const int bitdepth_max = (1 << out->p.bpc) - 1;
178
#endif
179
180
45.0k
    if (data->num_y_points) {
181
32.7k
        const int bh = imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE);
182
32.7k
        dsp->fgy_32x32xn(((pixel *) out->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[0]),
183
32.7k
                         luma_src, out->stride[0], data,
184
32.7k
                         out->p.w, scaling[0], grain_lut[0], bh, row HIGHBD_TAIL_SUFFIX);
185
32.7k
    }
186
187
45.0k
    if (!data->num_uv_points[0] && !data->num_uv_points[1] &&
188
33.6k
        !data->chroma_scaling_from_luma)
189
10.9k
    {
190
10.9k
        return;
191
10.9k
    }
192
193
34.1k
    const int bh = (imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE) + ss_y) >> ss_y;
194
195
    // extend padding pixels
196
34.1k
    if (out->p.w & ss_x) {
197
4.72k
        pixel *ptr = luma_src;
198
72.0k
        for (int y = 0; y < bh; y++) {
199
67.3k
            ptr[out->p.w] = ptr[out->p.w - 1];
200
67.3k
            ptr += PXSTRIDE(in->stride[0]) << ss_y;
201
67.3k
        }
202
4.72k
    }
203
204
34.1k
    const ptrdiff_t uv_off = row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[1]) >> ss_y;
205
34.1k
    if (data->chroma_scaling_from_luma) {
206
67.5k
        for (int pl = 0; pl < 2; pl++)
207
44.8k
            dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
208
44.8k
                                                ((const pixel *) in->data[1 + pl]) + uv_off,
209
44.8k
                                                in->stride[1], data, cpw,
210
44.8k
                                                scaling[0], grain_lut[1 + pl],
211
44.8k
                                                bh, row, luma_src, in->stride[0],
212
44.8k
                                                pl, is_id HIGHBD_TAIL_SUFFIX);
213
22.7k
    } else {
214
32.9k
        for (int pl = 0; pl < 2; pl++)
215
21.5k
            if (data->num_uv_points[pl])
216
13.6k
                dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
217
13.6k
                                                    ((const pixel *) in->data[1 + pl]) + uv_off,
218
13.6k
                                                    in->stride[1], data, cpw,
219
13.6k
                                                    scaling[1 + pl], grain_lut[1 + pl],
220
13.6k
                                                    bh, row, luma_src, in->stride[0],
221
13.6k
                                                    pl, is_id HIGHBD_TAIL_SUFFIX);
222
11.4k
    }
223
34.1k
}
dav1d_apply_grain_row_8bpc
Line
Count
Source
167
24.7k
{
168
    // Synthesize grain for the affected planes
169
24.7k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
170
24.7k
    const int ss_y = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
171
24.7k
    const int ss_x = in->p.layout != DAV1D_PIXEL_LAYOUT_I444;
172
24.7k
    const int cpw = (out->p.w + ss_x) >> ss_x;
173
24.7k
    const int is_id = out->seq_hdr->mtrx == DAV1D_MC_IDENTITY;
174
24.7k
    pixel *const luma_src =
175
24.7k
        ((pixel *) in->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(in->stride[0]);
176
#if BITDEPTH != 8
177
    const int bitdepth_max = (1 << out->p.bpc) - 1;
178
#endif
179
180
24.7k
    if (data->num_y_points) {
181
18.0k
        const int bh = imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE);
182
18.0k
        dsp->fgy_32x32xn(((pixel *) out->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[0]),
183
18.0k
                         luma_src, out->stride[0], data,
184
18.0k
                         out->p.w, scaling[0], grain_lut[0], bh, row HIGHBD_TAIL_SUFFIX);
185
18.0k
    }
186
187
24.7k
    if (!data->num_uv_points[0] && !data->num_uv_points[1] &&
188
18.5k
        !data->chroma_scaling_from_luma)
189
4.84k
    {
190
4.84k
        return;
191
4.84k
    }
192
193
19.9k
    const int bh = (imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE) + ss_y) >> ss_y;
194
195
    // extend padding pixels
196
19.9k
    if (out->p.w & ss_x) {
197
3.62k
        pixel *ptr = luma_src;
198
57.1k
        for (int y = 0; y < bh; y++) {
199
53.5k
            ptr[out->p.w] = ptr[out->p.w - 1];
200
53.5k
            ptr += PXSTRIDE(in->stride[0]) << ss_y;
201
53.5k
        }
202
3.62k
    }
203
204
19.9k
    const ptrdiff_t uv_off = row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[1]) >> ss_y;
205
19.9k
    if (data->chroma_scaling_from_luma) {
206
40.7k
        for (int pl = 0; pl < 2; pl++)
207
27.1k
            dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
208
27.1k
                                                ((const pixel *) in->data[1 + pl]) + uv_off,
209
27.1k
                                                in->stride[1], data, cpw,
210
27.1k
                                                scaling[0], grain_lut[1 + pl],
211
27.1k
                                                bh, row, luma_src, in->stride[0],
212
27.1k
                                                pl, is_id HIGHBD_TAIL_SUFFIX);
213
13.6k
    } else {
214
18.2k
        for (int pl = 0; pl < 2; pl++)
215
12.0k
            if (data->num_uv_points[pl])
216
8.05k
                dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
217
8.05k
                                                    ((const pixel *) in->data[1 + pl]) + uv_off,
218
8.05k
                                                    in->stride[1], data, cpw,
219
8.05k
                                                    scaling[1 + pl], grain_lut[1 + pl],
220
8.05k
                                                    bh, row, luma_src, in->stride[0],
221
8.05k
                                                    pl, is_id HIGHBD_TAIL_SUFFIX);
222
6.24k
    }
223
19.9k
}
dav1d_apply_grain_row_16bpc
Line
Count
Source
167
20.3k
{
168
    // Synthesize grain for the affected planes
169
20.3k
    const Dav1dFilmGrainData *const data = &out->frame_hdr->film_grain.data;
170
20.3k
    const int ss_y = in->p.layout == DAV1D_PIXEL_LAYOUT_I420;
171
20.3k
    const int ss_x = in->p.layout != DAV1D_PIXEL_LAYOUT_I444;
172
20.3k
    const int cpw = (out->p.w + ss_x) >> ss_x;
173
20.3k
    const int is_id = out->seq_hdr->mtrx == DAV1D_MC_IDENTITY;
174
20.3k
    pixel *const luma_src =
175
20.3k
        ((pixel *) in->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(in->stride[0]);
176
20.3k
#if BITDEPTH != 8
177
20.3k
    const int bitdepth_max = (1 << out->p.bpc) - 1;
178
20.3k
#endif
179
180
20.3k
    if (data->num_y_points) {
181
14.7k
        const int bh = imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE);
182
14.7k
        dsp->fgy_32x32xn(((pixel *) out->data[0]) + row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[0]),
183
14.7k
                         luma_src, out->stride[0], data,
184
14.7k
                         out->p.w, scaling[0], grain_lut[0], bh, row HIGHBD_TAIL_SUFFIX);
185
14.7k
    }
186
187
20.3k
    if (!data->num_uv_points[0] && !data->num_uv_points[1] &&
188
15.1k
        !data->chroma_scaling_from_luma)
189
6.09k
    {
190
6.09k
        return;
191
6.09k
    }
192
193
14.2k
    const int bh = (imin(out->p.h - row * FG_BLOCK_SIZE, FG_BLOCK_SIZE) + ss_y) >> ss_y;
194
195
    // extend padding pixels
196
14.2k
    if (out->p.w & ss_x) {
197
1.09k
        pixel *ptr = luma_src;
198
14.9k
        for (int y = 0; y < bh; y++) {
199
13.8k
            ptr[out->p.w] = ptr[out->p.w - 1];
200
13.8k
            ptr += PXSTRIDE(in->stride[0]) << ss_y;
201
13.8k
        }
202
1.09k
    }
203
204
14.2k
    const ptrdiff_t uv_off = row * FG_BLOCK_SIZE * PXSTRIDE(out->stride[1]) >> ss_y;
205
14.2k
    if (data->chroma_scaling_from_luma) {
206
26.7k
        for (int pl = 0; pl < 2; pl++)
207
17.7k
            dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
208
17.7k
                                                ((const pixel *) in->data[1 + pl]) + uv_off,
209
17.7k
                                                in->stride[1], data, cpw,
210
17.7k
                                                scaling[0], grain_lut[1 + pl],
211
17.7k
                                                bh, row, luma_src, in->stride[0],
212
17.7k
                                                pl, is_id HIGHBD_TAIL_SUFFIX);
213
9.05k
    } else {
214
14.6k
        for (int pl = 0; pl < 2; pl++)
215
9.49k
            if (data->num_uv_points[pl])
216
5.63k
                dsp->fguv_32x32xn[in->p.layout - 1](((pixel *) out->data[1 + pl]) + uv_off,
217
5.63k
                                                    ((const pixel *) in->data[1 + pl]) + uv_off,
218
5.63k
                                                    in->stride[1], data, cpw,
219
5.63k
                                                    scaling[1 + pl], grain_lut[1 + pl],
220
5.63k
                                                    bh, row, luma_src, in->stride[0],
221
5.63k
                                                    pl, is_id HIGHBD_TAIL_SUFFIX);
222
5.19k
    }
223
14.2k
}
224
225
void bitfn(dav1d_apply_grain)(const Dav1dFilmGrainDSPContext *const dsp,
226
                              Dav1dPicture *const out,
227
                              const Dav1dPicture *const in)
228
0
{
229
0
    ALIGN_STK_16(entry, grain_lut, 3,[GRAIN_HEIGHT + 1][GRAIN_WIDTH]);
230
#if ARCH_X86_64 && BITDEPTH == 8
231
0
    ALIGN_STK_64(uint8_t, scaling, 3,[SCALING_SIZE]);
232
#else
233
    uint8_t scaling[3][SCALING_SIZE];
234
#endif
235
0
    const int rows = (out->p.h + FG_BLOCK_SIZE - 1) / FG_BLOCK_SIZE;
236
237
0
    bitfn(dav1d_prep_grain)(dsp, out, in, scaling, grain_lut);
238
0
    for (int row = 0; row < rows; row++)
239
0
        bitfn(dav1d_apply_grain_row)(dsp, out, in, scaling, grain_lut, row);
240
0
}
Unexecuted instantiation: dav1d_apply_grain_8bpc
Unexecuted instantiation: dav1d_apply_grain_16bpc
241
#endif