Coverage Report

Created: 2026-06-10 07:00

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/work/dav1d/src/mc_tmpl.c
Line
Count
Source
1
/*
2
 * Copyright © 2018, VideoLAN and dav1d authors
3
 * Copyright © 2018, Two Orioles, LLC
4
 * All rights reserved.
5
 *
6
 * Redistribution and use in source and binary forms, with or without
7
 * modification, are permitted provided that the following conditions are met:
8
 *
9
 * 1. Redistributions of source code must retain the above copyright notice, this
10
 *    list of conditions and the following disclaimer.
11
 *
12
 * 2. Redistributions in binary form must reproduce the above copyright notice,
13
 *    this list of conditions and the following disclaimer in the documentation
14
 *    and/or other materials provided with the distribution.
15
 *
16
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
20
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26
 */
27
28
#include "config.h"
29
30
#include <stdlib.h>
31
#include <string.h>
32
33
#include "common/attributes.h"
34
#include "common/intops.h"
35
36
#include "src/mc.h"
37
#include "src/tables.h"
38
39
#if BITDEPTH == 8
40
1.51M
#define get_intermediate_bits(bitdepth_max) 4
41
// Output in interval [-5132, 9212], fits in int16_t as is
42
146M
#define PREP_BIAS 0
43
#else
44
// 4 for 10 bits/component, 2 for 12 bits/component
45
#define get_intermediate_bits(bitdepth_max) (14 - bitdepth_from_max(bitdepth_max))
46
// Output in interval [-20588, 36956] (10-bit), [-20602, 36983] (12-bit)
47
// Subtract a bias to ensure the output fits in int16_t
48
#define PREP_BIAS 8192
49
#endif
50
51
static NOINLINE void
52
put_c(pixel *dst, const ptrdiff_t dst_stride,
53
      const pixel *src, const ptrdiff_t src_stride, const int w, int h)
54
471k
{
55
8.29M
    do {
56
8.29M
        pixel_copy(dst, src, w);
57
58
8.29M
        dst += dst_stride;
59
8.29M
        src += src_stride;
60
8.29M
    } while (--h);
61
471k
}
62
63
static NOINLINE void
64
prep_c(int16_t *tmp, const pixel *src, const ptrdiff_t src_stride,
65
       const int w, int h HIGHBD_DECL_SUFFIX)
66
56.6k
{
67
56.6k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
68
1.71M
    do {
69
69.5M
        for (int x = 0; x < w; x++)
70
67.8M
            tmp[x] = (src[x] << intermediate_bits) - PREP_BIAS;
71
72
1.71M
        tmp += w;
73
1.71M
        src += src_stride;
74
1.71M
    } while (--h);
75
56.6k
}
76
77
#define FILTER_8TAP(src, x, F, stride) \
78
189M
    (F[0] * src[x + -3 * stride] + \
79
189M
     F[1] * src[x + -2 * stride] + \
80
189M
     F[2] * src[x + -1 * stride] + \
81
189M
     F[3] * src[x + +0 * stride] + \
82
189M
     F[4] * src[x + +1 * stride] + \
83
189M
     F[5] * src[x + +2 * stride] + \
84
189M
     F[6] * src[x + +3 * stride] + \
85
189M
     F[7] * src[x + +4 * stride])
86
87
#define FILTER_8TAP2(src, x, F) \
88
124M
    (F[0] * src[0][x] + \
89
124M
     F[1] * src[1][x] + \
90
124M
     F[2] * src[2][x] + \
91
124M
     F[3] * src[3][x] + \
92
124M
     F[4] * src[4][x] + \
93
124M
     F[5] * src[5][x] + \
94
124M
     F[6] * src[6][x] + \
95
124M
     F[7] * src[7][x])
96
97
#define DAV1D_FILTER_8TAP_RND(src, x, F, stride, sh) \
98
168M
    ((FILTER_8TAP(src, x, F, stride) + ((1 << (sh)) >> 1)) >> (sh))
99
100
#define DAV1D_FILTER_8TAP_RND2(src, x, F, stride, rnd, sh) \
101
20.3M
    ((FILTER_8TAP(src, x, F, stride) + (rnd)) >> (sh))
102
103
#define DAV1D_FILTER_8TAP_RND3(src, x, F, sh) \
104
124M
    ((FILTER_8TAP2(src, x, F) + ((1 << (sh)) >> 1)) >> (sh))
105
106
#define DAV1D_FILTER_8TAP_CLIP(src, x, F, stride, sh) \
107
32.1M
    iclip_pixel(DAV1D_FILTER_8TAP_RND(src, x, F, stride, sh))
108
109
#define DAV1D_FILTER_8TAP_CLIP2(src, x, F, stride, rnd, sh) \
110
20.3M
    iclip_pixel(DAV1D_FILTER_8TAP_RND2(src, x, F, stride, rnd, sh))
111
112
#define DAV1D_FILTER_8TAP_CLIP3(src, x, F, sh) \
113
87.9M
    iclip_pixel(DAV1D_FILTER_8TAP_RND3(src, x, F, sh))
114
115
#define GET_H_FILTER(mx) \
116
80.6M
    const int8_t *const fh = !(mx) ? NULL : w > 4 ? \
117
72.5M
        dav1d_mc_subpel_filters[filter_type & 3][(mx) - 1] : \
118
72.5M
        dav1d_mc_subpel_filters[3 + (filter_type & 1)][(mx) - 1]
119
120
#define GET_V_FILTER(my) \
121
4.28M
    const int8_t *const fv = !(my) ? NULL : h > 4 ? \
122
3.44M
        dav1d_mc_subpel_filters[filter_type >> 2][(my) - 1] : \
123
3.44M
        dav1d_mc_subpel_filters[3 + ((filter_type >> 2) & 1)][(my) - 1]
124
125
#define GET_FILTERS() \
126
448k
    GET_H_FILTER(mx); \
127
448k
    GET_V_FILTER(my)
128
129
static NOINLINE void
130
put_8tap_c(pixel *dst, ptrdiff_t dst_stride,
131
           const pixel *src, ptrdiff_t src_stride,
132
           const int w, int h, const int mx, const int my,
133
           const int filter_type HIGHBD_DECL_SUFFIX)
134
363k
{
135
363k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
136
363k
    const int intermediate_rnd = 32 + ((1 << (6 - intermediate_bits)) >> 1);
137
138
363k
    GET_FILTERS();
139
363k
    dst_stride = PXSTRIDE(dst_stride);
140
363k
    src_stride = PXSTRIDE(src_stride);
141
142
363k
    if (fh) {
143
124k
        if (fv) {
144
66.2k
            int tmp_h = h + 7;
145
66.2k
            int16_t mid[128 * 135], *mid_ptr = mid;
146
147
66.2k
            src -= src_stride * 3;
148
1.32M
            do {
149
35.5M
                for (int x = 0; x < w; x++)
150
34.1M
                    mid_ptr[x] = DAV1D_FILTER_8TAP_RND(src, x, fh, 1,
151
1.32M
                                                       6 - intermediate_bits);
152
153
1.32M
                mid_ptr += 128;
154
1.32M
                src += src_stride;
155
1.32M
            } while (--tmp_h);
156
157
66.2k
            mid_ptr = mid + 128 * 3;
158
802k
            do {
159
22.5M
                for (int x = 0; x < w; x++)
160
21.7M
                    dst[x] = DAV1D_FILTER_8TAP_CLIP(mid_ptr, x, fv, 128,
161
802k
                                                    6 + intermediate_bits);
162
163
802k
                mid_ptr += 128;
164
802k
                dst += dst_stride;
165
802k
            } while (--h);
166
66.2k
        } else {
167
712k
            do {
168
21.0M
                for (int x = 0; x < w; x++) {
169
20.3M
                    dst[x] = DAV1D_FILTER_8TAP_CLIP2(src, x, fh, 1,
170
20.3M
                                                     intermediate_rnd, 6);
171
20.3M
                }
172
173
712k
                dst += dst_stride;
174
712k
                src += src_stride;
175
712k
            } while (--h);
176
58.3k
        }
177
239k
    } else if (fv) {
178
400k
        do {
179
10.8M
            for (int x = 0; x < w; x++)
180
10.4M
                dst[x] = DAV1D_FILTER_8TAP_CLIP(src, x, fv, src_stride, 6);
181
182
400k
            dst += dst_stride;
183
400k
            src += src_stride;
184
400k
        } while (--h);
185
34.6k
    } else
186
204k
        put_c(dst, dst_stride, src, src_stride, w, h);
187
363k
}
188
189
static NOINLINE void
190
put_8tap_scaled_c(pixel *dst, const ptrdiff_t dst_stride,
191
                  const pixel *src, ptrdiff_t src_stride,
192
                  const int w, int h, const int mx, int my,
193
                  const int dx, const int dy, const int filter_type
194
                  HIGHBD_DECL_SUFFIX)
195
143k
{
196
143k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
197
143k
    const int intermediate_rnd = (1 << intermediate_bits) >> 1;
198
143k
    int16_t mid[128 * 8];
199
143k
    int16_t *mid_ptrs[8];
200
143k
    int in_y = -8;
201
143k
    src_stride = PXSTRIDE(src_stride);
202
203
1.28M
    for (int i = 0; i < 8; i++)
204
1.14M
        mid_ptrs[i] = &mid[128 * i];
205
206
143k
    src -= src_stride * 3;
207
208
2.77M
    for (int y = 0; y < h; y++) {
209
2.62M
        int x;
210
2.62M
        int src_y = my >> 10;
211
2.62M
        GET_V_FILTER((my & 0x3ff) >> 6);
212
213
4.75M
        while (in_y < src_y) {
214
2.12M
            int imx = mx, ioff = 0;
215
2.12M
            int16_t *mid_ptr = mid_ptrs[0];
216
217
16.9M
            for (int i = 0; i < 7; i++)
218
14.8M
                mid_ptrs[i] = mid_ptrs[i + 1];
219
2.12M
            mid_ptrs[7] = mid_ptr;
220
221
59.2M
            for (x = 0; x < w; x++) {
222
57.1M
                GET_H_FILTER(imx >> 6);
223
57.1M
                mid_ptr[x] = fh ? DAV1D_FILTER_8TAP_RND(src, ioff, fh, 1,
224
57.1M
                                                        6 - intermediate_bits) :
225
57.1M
                                  src[ioff] << intermediate_bits;
226
57.1M
                imx += dx;
227
57.1M
                ioff += imx >> 10;
228
57.1M
                imx &= 0x3ff;
229
57.1M
            }
230
231
2.12M
            src += src_stride;
232
2.12M
            in_y++;
233
2.12M
        }
234
235
101M
        for (x = 0; x < w; x++)
236
98.4M
            dst[x] = fv ? DAV1D_FILTER_8TAP_CLIP3(mid_ptrs, x, fv,
237
98.4M
                                                  6 + intermediate_bits) :
238
98.4M
                          iclip_pixel((mid_ptrs[3][x] + intermediate_rnd) >>
239
10.5M
                                              intermediate_bits);
240
241
2.62M
        my += dy;
242
2.62M
        dst += PXSTRIDE(dst_stride);
243
2.62M
    }
244
143k
}
245
246
static NOINLINE void
247
prep_8tap_c(int16_t *tmp, const pixel *src, ptrdiff_t src_stride,
248
            const int w, int h, const int mx, const int my,
249
            const int filter_type HIGHBD_DECL_SUFFIX)
250
84.9k
{
251
84.9k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
252
84.9k
    GET_FILTERS();
253
84.9k
    src_stride = PXSTRIDE(src_stride);
254
255
84.9k
    if (fh) {
256
26.7k
        if (fv) {
257
16.3k
            int tmp_h = h + 7;
258
16.3k
            int16_t mid[128 * 135], *mid_ptr = mid;
259
260
16.3k
            src -= src_stride * 3;
261
381k
            do {
262
9.04M
                for (int x = 0; x < w; x++)
263
8.66M
                    mid_ptr[x] = DAV1D_FILTER_8TAP_RND(src, x, fh, 1,
264
381k
                                                       6 - intermediate_bits);
265
266
381k
                mid_ptr += 128;
267
381k
                src += src_stride;
268
381k
            } while (--tmp_h);
269
270
16.3k
            mid_ptr = mid + 128 * 3;
271
267k
            do {
272
7.39M
                for (int x = 0; x < w; x++) {
273
7.13M
                    int t = DAV1D_FILTER_8TAP_RND(mid_ptr, x, fv, 128, 6) -
274
7.13M
                                  PREP_BIAS;
275
7.13M
                    assert(t >= INT16_MIN && t <= INT16_MAX);
276
7.13M
                    tmp[x] = t;
277
7.13M
                }
278
279
267k
                mid_ptr += 128;
280
267k
                tmp += w;
281
267k
            } while (--h);
282
16.3k
        } else {
283
229k
            do {
284
8.53M
                for (int x = 0; x < w; x++)
285
8.30M
                    tmp[x] = DAV1D_FILTER_8TAP_RND(src, x, fh, 1,
286
8.30M
                                                   6 - intermediate_bits) -
287
8.30M
                             PREP_BIAS;
288
289
229k
                tmp += w;
290
229k
                src += src_stride;
291
229k
            } while (--h);
292
10.4k
        }
293
58.1k
    } else if (fv) {
294
186k
        do {
295
5.79M
            for (int x = 0; x < w; x++)
296
5.60M
                tmp[x] = DAV1D_FILTER_8TAP_RND(src, x, fv, src_stride,
297
5.60M
                                               6 - intermediate_bits) -
298
5.60M
                         PREP_BIAS;
299
300
186k
            tmp += w;
301
186k
            src += src_stride;
302
186k
        } while (--h);
303
9.45k
    } else
304
48.7k
        prep_c(tmp, src, src_stride, w, h HIGHBD_TAIL_SUFFIX);
305
84.9k
}
306
307
static NOINLINE void
308
prep_8tap_scaled_c(int16_t *tmp, const pixel *src, ptrdiff_t src_stride,
309
                   const int w, int h, const int mx, int my,
310
                   const int dx, const int dy, const int filter_type
311
                   HIGHBD_DECL_SUFFIX)
312
47.6k
{
313
47.6k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
314
47.6k
    int16_t mid[128 * 8];
315
47.6k
    int16_t *mid_ptrs[8];
316
47.6k
    int in_y = -8;
317
47.6k
    src_stride = PXSTRIDE(src_stride);
318
319
428k
    for (int i = 0; i < 8; i++)
320
381k
        mid_ptrs[i] = &mid[128 * i];
321
322
47.6k
    src -= src_stride * 3;
323
324
1.25M
    for (int y = 0; y < h; y++) {
325
1.21M
        int x;
326
1.21M
        int src_y = my >> 10;
327
1.21M
        GET_V_FILTER((my & 0x3ff) >> 6);
328
329
2.04M
        while (in_y < src_y) {
330
831k
            int imx = mx, ioff = 0;
331
831k
            int16_t *mid_ptr = mid_ptrs[0];
332
333
6.65M
            for (int i = 0; i < 7; i++)
334
5.82M
                mid_ptrs[i] = mid_ptrs[i + 1];
335
831k
            mid_ptrs[7] = mid_ptr;
336
337
23.8M
            for (x = 0; x < w; x++) {
338
23.0M
                GET_H_FILTER(imx >> 6);
339
23.0M
                mid_ptr[x] = fh ? DAV1D_FILTER_8TAP_RND(src, ioff, fh, 1,
340
23.0M
                                                        6 - intermediate_bits) :
341
23.0M
                                  src[ioff] << intermediate_bits;
342
23.0M
                imx += dx;
343
23.0M
                ioff += imx >> 10;
344
23.0M
                imx &= 0x3ff;
345
23.0M
            }
346
347
831k
            src += src_stride;
348
831k
            in_y++;
349
831k
        }
350
351
43.3M
        for (x = 0; x < w; x++)
352
42.1M
            tmp[x] = (fv ? DAV1D_FILTER_8TAP_RND3(mid_ptrs, x, fv, 6)
353
42.1M
                         : mid_ptrs[3][x]) - PREP_BIAS;
354
355
1.21M
        my += dy;
356
1.21M
        tmp += w;
357
1.21M
    }
358
47.6k
}
359
360
#define filter_fns(type, type_h, type_v) \
361
static void put_8tap_##type##_c(pixel *const dst, \
362
                                const ptrdiff_t dst_stride, \
363
                                const pixel *const src, \
364
                                const ptrdiff_t src_stride, \
365
                                const int w, const int h, \
366
                                const int mx, const int my \
367
363k
                                HIGHBD_DECL_SUFFIX) \
368
363k
{ \
369
363k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
363k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
363k
} \
mc_tmpl.c:put_8tap_regular_c
Line
Count
Source
367
280k
                                HIGHBD_DECL_SUFFIX) \
368
280k
{ \
369
280k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
280k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
280k
} \
mc_tmpl.c:put_8tap_regular_smooth_c
Line
Count
Source
367
9.63k
                                HIGHBD_DECL_SUFFIX) \
368
9.63k
{ \
369
9.63k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
9.63k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
9.63k
} \
mc_tmpl.c:put_8tap_regular_sharp_c
Line
Count
Source
367
1.63k
                                HIGHBD_DECL_SUFFIX) \
368
1.63k
{ \
369
1.63k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
1.63k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
1.63k
} \
mc_tmpl.c:put_8tap_sharp_regular_c
Line
Count
Source
367
1.18k
                                HIGHBD_DECL_SUFFIX) \
368
1.18k
{ \
369
1.18k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
1.18k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
1.18k
} \
mc_tmpl.c:put_8tap_sharp_smooth_c
Line
Count
Source
367
851
                                HIGHBD_DECL_SUFFIX) \
368
851
{ \
369
851
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
851
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
851
} \
mc_tmpl.c:put_8tap_sharp_c
Line
Count
Source
367
15.6k
                                HIGHBD_DECL_SUFFIX) \
368
15.6k
{ \
369
15.6k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
15.6k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
15.6k
} \
mc_tmpl.c:put_8tap_smooth_regular_c
Line
Count
Source
367
6.70k
                                HIGHBD_DECL_SUFFIX) \
368
6.70k
{ \
369
6.70k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
6.70k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
6.70k
} \
mc_tmpl.c:put_8tap_smooth_c
Line
Count
Source
367
46.8k
                                HIGHBD_DECL_SUFFIX) \
368
46.8k
{ \
369
46.8k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
46.8k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
46.8k
} \
mc_tmpl.c:put_8tap_smooth_sharp_c
Line
Count
Source
367
1.00k
                                HIGHBD_DECL_SUFFIX) \
368
1.00k
{ \
369
1.00k
    put_8tap_c(dst, dst_stride, src, src_stride, w, h, mx, my, \
370
1.00k
               type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
371
1.00k
} \
372
static void put_8tap_##type##_scaled_c(pixel *const dst, \
373
                                       const ptrdiff_t dst_stride, \
374
                                       const pixel *const src, \
375
                                       const ptrdiff_t src_stride, \
376
                                       const int w, const int h, \
377
                                       const int mx, const int my, \
378
                                       const int dx, const int dy \
379
143k
                                       HIGHBD_DECL_SUFFIX) \
380
143k
{ \
381
143k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
143k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
143k
} \
mc_tmpl.c:put_8tap_regular_scaled_c
Line
Count
Source
379
82.0k
                                       HIGHBD_DECL_SUFFIX) \
380
82.0k
{ \
381
82.0k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
82.0k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
82.0k
} \
mc_tmpl.c:put_8tap_regular_smooth_scaled_c
Line
Count
Source
379
3.37k
                                       HIGHBD_DECL_SUFFIX) \
380
3.37k
{ \
381
3.37k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
3.37k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
3.37k
} \
mc_tmpl.c:put_8tap_regular_sharp_scaled_c
Line
Count
Source
379
935
                                       HIGHBD_DECL_SUFFIX) \
380
935
{ \
381
935
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
935
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
935
} \
mc_tmpl.c:put_8tap_sharp_regular_scaled_c
Line
Count
Source
379
1.15k
                                       HIGHBD_DECL_SUFFIX) \
380
1.15k
{ \
381
1.15k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
1.15k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
1.15k
} \
mc_tmpl.c:put_8tap_sharp_smooth_scaled_c
Line
Count
Source
379
785
                                       HIGHBD_DECL_SUFFIX) \
380
785
{ \
381
785
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
785
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
785
} \
mc_tmpl.c:put_8tap_sharp_scaled_c
Line
Count
Source
379
16.9k
                                       HIGHBD_DECL_SUFFIX) \
380
16.9k
{ \
381
16.9k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
16.9k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
16.9k
} \
mc_tmpl.c:put_8tap_smooth_regular_scaled_c
Line
Count
Source
379
3.64k
                                       HIGHBD_DECL_SUFFIX) \
380
3.64k
{ \
381
3.64k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
3.64k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
3.64k
} \
mc_tmpl.c:put_8tap_smooth_scaled_c
Line
Count
Source
379
33.5k
                                       HIGHBD_DECL_SUFFIX) \
380
33.5k
{ \
381
33.5k
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
33.5k
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
33.5k
} \
mc_tmpl.c:put_8tap_smooth_sharp_scaled_c
Line
Count
Source
379
867
                                       HIGHBD_DECL_SUFFIX) \
380
867
{ \
381
867
    put_8tap_scaled_c(dst, dst_stride, src, src_stride, w, h, mx, my, dx, dy, \
382
867
                      type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
383
867
} \
384
static void prep_8tap_##type##_c(int16_t *const tmp, \
385
                                 const pixel *const src, \
386
                                 const ptrdiff_t src_stride, \
387
                                 const int w, const int h, \
388
                                 const int mx, const int my \
389
84.9k
                                 HIGHBD_DECL_SUFFIX) \
390
84.9k
{ \
391
84.9k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
84.9k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
84.9k
} \
mc_tmpl.c:prep_8tap_regular_c
Line
Count
Source
389
40.9k
                                 HIGHBD_DECL_SUFFIX) \
390
40.9k
{ \
391
40.9k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
40.9k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
40.9k
} \
mc_tmpl.c:prep_8tap_regular_smooth_c
Line
Count
Source
389
1.24k
                                 HIGHBD_DECL_SUFFIX) \
390
1.24k
{ \
391
1.24k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
1.24k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
1.24k
} \
mc_tmpl.c:prep_8tap_regular_sharp_c
Line
Count
Source
389
2.18k
                                 HIGHBD_DECL_SUFFIX) \
390
2.18k
{ \
391
2.18k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
2.18k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
2.18k
} \
mc_tmpl.c:prep_8tap_sharp_regular_c
Line
Count
Source
389
3.31k
                                 HIGHBD_DECL_SUFFIX) \
390
3.31k
{ \
391
3.31k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
3.31k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
3.31k
} \
mc_tmpl.c:prep_8tap_sharp_smooth_c
Line
Count
Source
389
1.80k
                                 HIGHBD_DECL_SUFFIX) \
390
1.80k
{ \
391
1.80k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
1.80k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
1.80k
} \
mc_tmpl.c:prep_8tap_sharp_c
Line
Count
Source
389
8.87k
                                 HIGHBD_DECL_SUFFIX) \
390
8.87k
{ \
391
8.87k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
8.87k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
8.87k
} \
mc_tmpl.c:prep_8tap_smooth_regular_c
Line
Count
Source
389
1.97k
                                 HIGHBD_DECL_SUFFIX) \
390
1.97k
{ \
391
1.97k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
1.97k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
1.97k
} \
mc_tmpl.c:prep_8tap_smooth_c
Line
Count
Source
389
23.1k
                                 HIGHBD_DECL_SUFFIX) \
390
23.1k
{ \
391
23.1k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
23.1k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
23.1k
} \
mc_tmpl.c:prep_8tap_smooth_sharp_c
Line
Count
Source
389
1.42k
                                 HIGHBD_DECL_SUFFIX) \
390
1.42k
{ \
391
1.42k
    prep_8tap_c(tmp, src, src_stride, w, h, mx, my, \
392
1.42k
                type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
393
1.42k
} \
394
static void prep_8tap_##type##_scaled_c(int16_t *const tmp, \
395
                                        const pixel *const src, \
396
                                        const ptrdiff_t src_stride, \
397
                                        const int w, const int h, \
398
                                        const int mx, const int my, \
399
                                        const int dx, const int dy \
400
47.6k
                                        HIGHBD_DECL_SUFFIX) \
401
47.6k
{ \
402
47.6k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
47.6k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
47.6k
}
mc_tmpl.c:prep_8tap_regular_scaled_c
Line
Count
Source
400
19.8k
                                        HIGHBD_DECL_SUFFIX) \
401
19.8k
{ \
402
19.8k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
19.8k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
19.8k
}
mc_tmpl.c:prep_8tap_regular_smooth_scaled_c
Line
Count
Source
400
797
                                        HIGHBD_DECL_SUFFIX) \
401
797
{ \
402
797
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
797
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
797
}
mc_tmpl.c:prep_8tap_regular_sharp_scaled_c
Line
Count
Source
400
3.54k
                                        HIGHBD_DECL_SUFFIX) \
401
3.54k
{ \
402
3.54k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
3.54k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
3.54k
}
mc_tmpl.c:prep_8tap_sharp_regular_scaled_c
Line
Count
Source
400
2.65k
                                        HIGHBD_DECL_SUFFIX) \
401
2.65k
{ \
402
2.65k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
2.65k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
2.65k
}
mc_tmpl.c:prep_8tap_sharp_smooth_scaled_c
Line
Count
Source
400
1.38k
                                        HIGHBD_DECL_SUFFIX) \
401
1.38k
{ \
402
1.38k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
1.38k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
1.38k
}
mc_tmpl.c:prep_8tap_sharp_scaled_c
Line
Count
Source
400
4.46k
                                        HIGHBD_DECL_SUFFIX) \
401
4.46k
{ \
402
4.46k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
4.46k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
4.46k
}
mc_tmpl.c:prep_8tap_smooth_regular_scaled_c
Line
Count
Source
400
1.42k
                                        HIGHBD_DECL_SUFFIX) \
401
1.42k
{ \
402
1.42k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
1.42k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
1.42k
}
mc_tmpl.c:prep_8tap_smooth_scaled_c
Line
Count
Source
400
12.4k
                                        HIGHBD_DECL_SUFFIX) \
401
12.4k
{ \
402
12.4k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
12.4k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
12.4k
}
mc_tmpl.c:prep_8tap_smooth_sharp_scaled_c
Line
Count
Source
400
1.08k
                                        HIGHBD_DECL_SUFFIX) \
401
1.08k
{ \
402
1.08k
    prep_8tap_scaled_c(tmp, src, src_stride, w, h, mx, my, dx, dy, \
403
1.08k
                       type_h | (type_v << 2) HIGHBD_TAIL_SUFFIX); \
404
1.08k
}
405
406
filter_fns(regular,        DAV1D_FILTER_8TAP_REGULAR, DAV1D_FILTER_8TAP_REGULAR)
407
filter_fns(regular_sharp,  DAV1D_FILTER_8TAP_REGULAR, DAV1D_FILTER_8TAP_SHARP)
408
filter_fns(regular_smooth, DAV1D_FILTER_8TAP_REGULAR, DAV1D_FILTER_8TAP_SMOOTH)
409
filter_fns(smooth,         DAV1D_FILTER_8TAP_SMOOTH,  DAV1D_FILTER_8TAP_SMOOTH)
410
filter_fns(smooth_regular, DAV1D_FILTER_8TAP_SMOOTH,  DAV1D_FILTER_8TAP_REGULAR)
411
filter_fns(smooth_sharp,   DAV1D_FILTER_8TAP_SMOOTH,  DAV1D_FILTER_8TAP_SHARP)
412
filter_fns(sharp,          DAV1D_FILTER_8TAP_SHARP,   DAV1D_FILTER_8TAP_SHARP)
413
filter_fns(sharp_regular,  DAV1D_FILTER_8TAP_SHARP,   DAV1D_FILTER_8TAP_REGULAR)
414
filter_fns(sharp_smooth,   DAV1D_FILTER_8TAP_SHARP,   DAV1D_FILTER_8TAP_SMOOTH)
415
416
#define FILTER_BILIN(src, x, mxy, stride) \
417
48.8M
    (16 * src[x] + ((mxy) * (src[x + stride] - src[x])))
418
419
#define FILTER_BILIN_RND(src, x, mxy, stride, sh) \
420
48.8M
    ((FILTER_BILIN(src, x, mxy, stride) + ((1 << (sh)) >> 1)) >> (sh))
421
422
#define FILTER_BILIN_CLIP(src, x, mxy, stride, sh) \
423
5.63M
    iclip_pixel(FILTER_BILIN_RND(src, x, mxy, stride, sh))
424
425
#define FILTER_BILIN2(src1, src2, x, mxy) \
426
24.5M
    (16 * src1[x] + ((mxy) * (src2[x] - src1[x])))
427
428
#define FILTER_BILIN_RND2(src1, src2, x, mxy, sh) \
429
24.5M
    ((FILTER_BILIN2(src1, src2, x, mxy) + ((1 << (sh)) >> 1)) >> (sh))
430
431
#define FILTER_BILIN_CLIP2(src1, src2, x, mxy, sh) \
432
20.9M
    iclip_pixel(FILTER_BILIN_RND2(src1, src2, x, mxy, sh))
433
434
static void put_bilin_c(pixel *dst, ptrdiff_t dst_stride,
435
                        const pixel *src, ptrdiff_t src_stride,
436
                        const int w, int h, const int mx, const int my
437
                        HIGHBD_DECL_SUFFIX)
438
331k
{
439
331k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
440
331k
    const int intermediate_rnd = (1 << intermediate_bits) >> 1;
441
331k
    dst_stride = PXSTRIDE(dst_stride);
442
331k
    src_stride = PXSTRIDE(src_stride);
443
444
331k
    if (mx) {
445
44.4k
        if (my) {
446
22.8k
            int16_t mid[128 * 129], *mid_ptr = mid;
447
22.8k
            int tmp_h = h + 1;
448
449
201k
            do {
450
3.05M
                for (int x = 0; x < w; x++)
451
2.85M
                    mid_ptr[x] = FILTER_BILIN_RND(src, x, mx, 1,
452
201k
                                                  4 - intermediate_bits);
453
454
201k
                mid_ptr += 128;
455
201k
                src += src_stride;
456
201k
            } while (--tmp_h);
457
458
22.8k
            mid_ptr = mid;
459
178k
            do {
460
2.84M
                for (int x = 0; x < w; x++)
461
2.67M
                    dst[x] = FILTER_BILIN_CLIP(mid_ptr, x, my, 128,
462
178k
                                               4 + intermediate_bits);
463
464
178k
                mid_ptr += 128;
465
178k
                dst += dst_stride;
466
178k
            } while (--h);
467
22.8k
        } else {
468
289k
            do {
469
10.1M
                for (int x = 0; x < w; x++) {
470
9.87M
                    const int px = FILTER_BILIN_RND(src, x, mx, 1,
471
9.87M
                                                    4 - intermediate_bits);
472
9.87M
                    dst[x] = iclip_pixel((px + intermediate_rnd) >> intermediate_bits);
473
9.87M
                }
474
475
289k
                dst += dst_stride;
476
289k
                src += src_stride;
477
289k
            } while (--h);
478
21.6k
        }
479
286k
    } else if (my) {
480
163k
        do {
481
3.12M
            for (int x = 0; x < w; x++)
482
2.96M
                dst[x] = FILTER_BILIN_CLIP(src, x, my, src_stride, 4);
483
484
163k
            dst += dst_stride;
485
163k
            src += src_stride;
486
163k
        } while (--h);
487
19.5k
    } else
488
267k
        put_c(dst, dst_stride, src, src_stride, w, h);
489
331k
}
490
491
static void put_bilin_scaled_c(pixel *dst, ptrdiff_t dst_stride,
492
                               const pixel *src, ptrdiff_t src_stride,
493
                               const int w, int h, const int mx, int my,
494
                               const int dx, const int dy
495
                               HIGHBD_DECL_SUFFIX)
496
64.4k
{
497
64.4k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
498
64.4k
    int16_t mid[128 * 2];
499
64.4k
    int in_y = -2;
500
501
859k
    do {
502
859k
        int x;
503
859k
        int y = my >> 10;
504
859k
        int16_t *mid1 = &mid[(y & 1) * 128];
505
859k
        int16_t *mid2 = &mid[((y + 1) & 1) * 128];
506
859k
        int dmy = my & 0x3ff;
507
508
1.53M
        while (in_y < y) {
509
679k
            int imx = mx, ioff = 0;
510
679k
            int16_t *mid_ptr = &mid[(in_y & 1) * 128];
511
512
17.2M
            for (x = 0; x < w; x++) {
513
16.5M
                mid_ptr[x] = FILTER_BILIN_RND(src, ioff, imx >> 6, 1,
514
16.5M
                                              4 - intermediate_bits);
515
16.5M
                imx += dx;
516
16.5M
                ioff += imx >> 10;
517
16.5M
                imx &= 0x3ff;
518
16.5M
            }
519
520
679k
            src += PXSTRIDE(src_stride);
521
679k
            in_y++;
522
679k
        }
523
524
21.7M
        for (x = 0; x < w; x++)
525
20.9M
            dst[x] = FILTER_BILIN_CLIP2(mid1, mid2, x, dmy >> 6,
526
859k
                                       4 + intermediate_bits);
527
528
859k
        my += dy;
529
859k
        dst += PXSTRIDE(dst_stride);
530
859k
    } while (--h);
531
64.4k
}
532
533
static void prep_bilin_c(int16_t *tmp,
534
                         const pixel *src, ptrdiff_t src_stride,
535
                         const int w, int h, const int mx, const int my
536
                         HIGHBD_DECL_SUFFIX)
537
25.5k
{
538
25.5k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
539
25.5k
    src_stride = PXSTRIDE(src_stride);
540
541
25.5k
    if (mx) {
542
13.6k
        if (my) {
543
9.46k
            int16_t mid[128 * 129], *mid_ptr = mid;
544
9.46k
            int tmp_h = h + 1;
545
546
130k
            do {
547
3.59M
                for (int x = 0; x < w; x++)
548
3.45M
                    mid_ptr[x] = FILTER_BILIN_RND(src, x, mx, 1,
549
130k
                                                  4 - intermediate_bits);
550
551
130k
                mid_ptr += 128;
552
130k
                src += src_stride;
553
130k
            } while (--tmp_h);
554
555
9.46k
            mid_ptr = mid;
556
121k
            do {
557
3.44M
                for (int x = 0; x < w; x++)
558
3.32M
                    tmp[x] = FILTER_BILIN_RND(mid_ptr, x, my, 128, 4) -
559
3.32M
                             PREP_BIAS;
560
561
121k
                mid_ptr += 128;
562
121k
                tmp += w;
563
121k
            } while (--h);
564
9.46k
        } else {
565
75.8k
            do {
566
2.70M
                for (int x = 0; x < w; x++)
567
2.62M
                    tmp[x] = FILTER_BILIN_RND(src, x, mx, 1,
568
2.62M
                                              4 - intermediate_bits) -
569
2.62M
                             PREP_BIAS;
570
571
75.8k
                tmp += w;
572
75.8k
                src += src_stride;
573
75.8k
            } while (--h);
574
4.20k
        }
575
13.6k
    } else if (my) {
576
64.4k
        do {
577
2.24M
            for (int x = 0; x < w; x++)
578
2.17M
                tmp[x] = FILTER_BILIN_RND(src, x, my, src_stride,
579
2.17M
                                          4 - intermediate_bits) - PREP_BIAS;
580
581
64.4k
            tmp += w;
582
64.4k
            src += src_stride;
583
64.4k
        } while (--h);
584
3.98k
    } else
585
7.88k
        prep_c(tmp, src, src_stride, w, h HIGHBD_TAIL_SUFFIX);
586
25.5k
}
587
588
static void prep_bilin_scaled_c(int16_t *tmp,
589
                                const pixel *src, ptrdiff_t src_stride,
590
                                const int w, int h, const int mx, int my,
591
                                const int dx, const int dy HIGHBD_DECL_SUFFIX)
592
5.91k
{
593
5.91k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
594
5.91k
    int16_t mid[128 * 2];
595
5.91k
    int in_y = -2;
596
597
111k
    do {
598
111k
        int x;
599
111k
        int y = my >> 10;
600
111k
        int16_t *mid1 = &mid[(y & 1) * 128];
601
111k
        int16_t *mid2 = &mid[((y + 1) & 1) * 128];
602
111k
        int dmy = my & 0x3ff;
603
604
175k
        while (in_y < y) {
605
63.2k
            int imx = mx, ioff = 0;
606
63.2k
            int16_t *mid_ptr = &mid[(in_y & 1) * 128];
607
608
2.38M
            for (x = 0; x < w; x++) {
609
2.32M
                mid_ptr[x] = FILTER_BILIN_RND(src, ioff, imx >> 6, 1,
610
2.32M
                                              4 - intermediate_bits);
611
2.32M
                imx += dx;
612
2.32M
                ioff += imx >> 10;
613
2.32M
                imx &= 0x3ff;
614
2.32M
            }
615
616
63.2k
            src += PXSTRIDE(src_stride);
617
63.2k
            in_y++;
618
63.2k
        }
619
620
3.76M
        for (x = 0; x < w; x++)
621
3.65M
            tmp[x] = FILTER_BILIN_RND2(mid1, mid2, x, dmy >> 6, 4) - PREP_BIAS;
622
623
111k
        my += dy;
624
111k
        tmp += w;
625
111k
    } while (--h);
626
5.91k
}
627
628
static void avg_c(pixel *dst, const ptrdiff_t dst_stride,
629
                  const int16_t *tmp1, const int16_t *tmp2, const int w, int h
630
                  HIGHBD_DECL_SUFFIX)
631
61.7k
{
632
61.7k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
633
61.7k
    const int sh = intermediate_bits + 1;
634
61.7k
    const int rnd = (1 << intermediate_bits) + PREP_BIAS * 2;
635
1.31M
    do {
636
45.3M
        for (int x = 0; x < w; x++)
637
44.0M
            dst[x] = iclip_pixel((tmp1[x] + tmp2[x] + rnd) >> sh);
638
639
1.31M
        tmp1 += w;
640
1.31M
        tmp2 += w;
641
1.31M
        dst += PXSTRIDE(dst_stride);
642
1.31M
    } while (--h);
643
61.7k
}
644
645
static void w_avg_c(pixel *dst, const ptrdiff_t dst_stride,
646
                    const int16_t *tmp1, const int16_t *tmp2, const int w, int h,
647
                    const int weight HIGHBD_DECL_SUFFIX)
648
8.40k
{
649
8.40k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
650
8.40k
    const int sh = intermediate_bits + 4;
651
8.40k
    const int rnd = (8 << intermediate_bits) + PREP_BIAS * 16;
652
220k
    do {
653
9.02M
        for (int x = 0; x < w; x++)
654
8.80M
            dst[x] = iclip_pixel((tmp1[x] * weight +
655
8.80M
                                  tmp2[x] * (16 - weight) + rnd) >> sh);
656
657
220k
        tmp1 += w;
658
220k
        tmp2 += w;
659
220k
        dst += PXSTRIDE(dst_stride);
660
220k
    } while (--h);
661
8.40k
}
662
663
static void mask_c(pixel *dst, const ptrdiff_t dst_stride,
664
                   const int16_t *tmp1, const int16_t *tmp2, const int w, int h,
665
                   const uint8_t *mask HIGHBD_DECL_SUFFIX)
666
11.4k
{
667
11.4k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
668
11.4k
    const int sh = intermediate_bits + 6;
669
11.4k
    const int rnd = (32 << intermediate_bits) + PREP_BIAS * 64;
670
259k
    do {
671
8.06M
        for (int x = 0; x < w; x++)
672
7.80M
            dst[x] = iclip_pixel((tmp1[x] * mask[x] +
673
7.80M
                                  tmp2[x] * (64 - mask[x]) + rnd) >> sh);
674
675
259k
        tmp1 += w;
676
259k
        tmp2 += w;
677
259k
        mask += w;
678
259k
        dst += PXSTRIDE(dst_stride);
679
259k
    } while (--h);
680
11.4k
}
681
682
12.2M
#define blend_px(a, b, m) (((a * (64 - m) + b * m) + 32) >> 6)
683
static void blend_c(pixel *dst, const ptrdiff_t dst_stride, const pixel *tmp,
684
                    const int w, int h, const uint8_t *mask)
685
13.9k
{
686
152k
    do {
687
1.94M
        for (int x = 0; x < w; x++) {
688
1.79M
            dst[x] = blend_px(dst[x], tmp[x], mask[x]);
689
1.79M
        }
690
152k
        dst += PXSTRIDE(dst_stride);
691
152k
        tmp += w;
692
152k
        mask += w;
693
152k
    } while (--h);
694
13.9k
}
695
696
static void blend_v_c(pixel *dst, const ptrdiff_t dst_stride, const pixel *tmp,
697
                      const int w, int h)
698
65.2k
{
699
65.2k
    const uint8_t *const mask = &dav1d_obmc_masks[w];
700
877k
    do {
701
6.92M
        for (int x = 0; x < (w * 3) >> 2; x++) {
702
6.04M
            dst[x] = blend_px(dst[x], tmp[x], mask[x]);
703
6.04M
        }
704
877k
        dst += PXSTRIDE(dst_stride);
705
877k
        tmp += w;
706
877k
    } while (--h);
707
65.2k
}
708
709
static void blend_h_c(pixel *dst, const ptrdiff_t dst_stride, const pixel *tmp,
710
                      const int w, int h)
711
62.1k
{
712
62.1k
    const uint8_t *mask = &dav1d_obmc_masks[h];
713
62.1k
    h = (h * 3) >> 2;
714
297k
    do {
715
297k
        const int m = *mask++;
716
4.67M
        for (int x = 0; x < w; x++) {
717
4.37M
            dst[x] = blend_px(dst[x], tmp[x], m);
718
4.37M
        }
719
297k
        dst += PXSTRIDE(dst_stride);
720
297k
        tmp += w;
721
297k
    } while (--h);
722
62.1k
}
723
724
static void w_mask_c(pixel *dst, const ptrdiff_t dst_stride,
725
                     const int16_t *tmp1, const int16_t *tmp2, const int w, int h,
726
                     uint8_t *mask, const int sign,
727
                     const int ss_hor, const int ss_ver HIGHBD_DECL_SUFFIX)
728
4.96k
{
729
    // store mask at 2x2 resolution, i.e. store 2x1 sum for even rows,
730
    // and then load this intermediate to calculate final value for odd rows
731
4.96k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
732
4.96k
    const int bitdepth = bitdepth_from_max(bitdepth_max);
733
4.96k
    const int sh = intermediate_bits + 6;
734
4.96k
    const int rnd = (32 << intermediate_bits) + PREP_BIAS * 64;
735
4.96k
    const int mask_sh = bitdepth + intermediate_bits - 4;
736
4.96k
    const int mask_rnd = 1 << (mask_sh - 5);
737
223k
    do {
738
7.02M
        for (int x = 0; x < w; x++) {
739
6.80M
            const int tmpdiff = tmp1[x] - tmp2[x];
740
6.80M
            const int m = imin(38 + ((abs(tmpdiff) + mask_rnd) >> mask_sh), 64);
741
6.80M
            dst[x] = iclip_pixel((tmpdiff * m + tmp2[x] * 64 + rnd) >> sh);
742
743
6.80M
            if (ss_hor) {
744
2.03M
                x++;
745
746
2.03M
                const int tmpdiff = tmp1[x] - tmp2[x];
747
2.03M
                const int n = imin(38 + ((abs(tmpdiff) + mask_rnd) >> mask_sh), 64);
748
2.03M
                dst[x] = iclip_pixel((tmpdiff * n + tmp2[x] * 64 + rnd) >> sh);
749
750
2.03M
                if (h & ss_ver) {
751
1.04M
                    mask[x >> 1] = (m + n + mask[x >> 1] + 2 - sign) >> 2;
752
1.04M
                } else if (ss_ver) {
753
1.04M
                    mask[x >> 1] = m + n;
754
18.4E
                } else {
755
18.4E
                    mask[x >> 1] = (m + n + 1 - sign) >> 1;
756
18.4E
                }
757
4.76M
            } else {
758
4.76M
                mask[x] = m;
759
4.76M
            }
760
6.80M
        }
761
762
223k
        tmp1 += w;
763
223k
        tmp2 += w;
764
223k
        dst += PXSTRIDE(dst_stride);
765
223k
        if (!ss_ver || (h & 1)) mask += w >> ss_hor;
766
223k
    } while (--h);
767
4.96k
}
768
769
#define w_mask_fns(ssn, ss_hor, ss_ver) \
770
static void w_mask_##ssn##_c(pixel *const dst, const ptrdiff_t dst_stride, \
771
                             const int16_t *const tmp1, const int16_t *const tmp2, \
772
                             const int w, const int h, uint8_t *mask, \
773
4.96k
                             const int sign HIGHBD_DECL_SUFFIX) \
774
4.96k
{ \
775
4.96k
    w_mask_c(dst, dst_stride, tmp1, tmp2, w, h, mask, sign, ss_hor, ss_ver \
776
4.96k
             HIGHBD_TAIL_SUFFIX); \
777
4.96k
}
mc_tmpl.c:w_mask_444_c
Line
Count
Source
773
2.84k
                             const int sign HIGHBD_DECL_SUFFIX) \
774
2.84k
{ \
775
2.84k
    w_mask_c(dst, dst_stride, tmp1, tmp2, w, h, mask, sign, ss_hor, ss_ver \
776
2.84k
             HIGHBD_TAIL_SUFFIX); \
777
2.84k
}
mc_tmpl.c:w_mask_422_c
Line
Count
Source
773
212
                             const int sign HIGHBD_DECL_SUFFIX) \
774
212
{ \
775
212
    w_mask_c(dst, dst_stride, tmp1, tmp2, w, h, mask, sign, ss_hor, ss_ver \
776
212
             HIGHBD_TAIL_SUFFIX); \
777
212
}
mc_tmpl.c:w_mask_420_c
Line
Count
Source
773
1.90k
                             const int sign HIGHBD_DECL_SUFFIX) \
774
1.90k
{ \
775
1.90k
    w_mask_c(dst, dst_stride, tmp1, tmp2, w, h, mask, sign, ss_hor, ss_ver \
776
1.90k
             HIGHBD_TAIL_SUFFIX); \
777
1.90k
}
778
779
w_mask_fns(444, 0, 0);
780
w_mask_fns(422, 1, 0);
781
w_mask_fns(420, 1, 1);
782
783
#undef w_mask_fns
784
785
#define FILTER_WARP_RND(src, x, F, stride, sh) \
786
55.2M
    ((F[0] * src[x - 3 * stride] + \
787
55.2M
      F[1] * src[x - 2 * stride] + \
788
55.2M
      F[2] * src[x - 1 * stride] + \
789
55.2M
      F[3] * src[x + 0 * stride] + \
790
55.2M
      F[4] * src[x + 1 * stride] + \
791
55.2M
      F[5] * src[x + 2 * stride] + \
792
55.2M
      F[6] * src[x + 3 * stride] + \
793
55.2M
      F[7] * src[x + 4 * stride] + \
794
55.2M
      ((1 << (sh)) >> 1)) >> (sh))
795
796
#define FILTER_WARP_CLIP(src, x, F, stride, sh) \
797
15.6M
    iclip_pixel(FILTER_WARP_RND(src, x, F, stride, sh))
798
799
static void warp_affine_8x8_c(pixel *dst, const ptrdiff_t dst_stride,
800
                              const pixel *src, const ptrdiff_t src_stride,
801
                              const int16_t *const abcd, int mx, int my
802
                              HIGHBD_DECL_SUFFIX)
803
257k
{
804
257k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
805
257k
    int16_t mid[15 * 8], *mid_ptr = mid;
806
807
257k
    src -= 3 * PXSTRIDE(src_stride);
808
4.05M
    for (int y = 0; y < 15; y++, mx += abcd[1]) {
809
34.0M
        for (int x = 0, tmx = mx; x < 8; x++, tmx += abcd[0]) {
810
30.2M
            const int8_t *const filter =
811
30.2M
                dav1d_mc_warp_filter[64 + ((tmx + 512) >> 10)];
812
813
30.2M
            mid_ptr[x] = FILTER_WARP_RND(src, x, filter, 1,
814
30.2M
                                         7 - intermediate_bits);
815
30.2M
        }
816
3.80M
        src += PXSTRIDE(src_stride);
817
3.80M
        mid_ptr += 8;
818
3.80M
    }
819
820
257k
    mid_ptr = &mid[3 * 8];
821
2.21M
    for (int y = 0; y < 8; y++, my += abcd[3]) {
822
17.5M
        for (int x = 0, tmy = my; x < 8; x++, tmy += abcd[2]) {
823
15.6M
            const int8_t *const filter =
824
15.6M
                dav1d_mc_warp_filter[64 + ((tmy + 512) >> 10)];
825
826
15.6M
            dst[x] = FILTER_WARP_CLIP(mid_ptr, x, filter, 8,
827
15.6M
                                      7 + intermediate_bits);
828
15.6M
        }
829
1.95M
        mid_ptr += 8;
830
1.95M
        dst += PXSTRIDE(dst_stride);
831
1.95M
    }
832
257k
}
833
834
static void warp_affine_8x8t_c(int16_t *tmp, const ptrdiff_t tmp_stride,
835
                               const pixel *src, const ptrdiff_t src_stride,
836
                               const int16_t *const abcd, int mx, int my
837
                               HIGHBD_DECL_SUFFIX)
838
51.2k
{
839
51.2k
    const int intermediate_bits = get_intermediate_bits(bitdepth_max);
840
51.2k
    int16_t mid[15 * 8], *mid_ptr = mid;
841
842
51.2k
    src -= 3 * PXSTRIDE(src_stride);
843
819k
    for (int y = 0; y < 15; y++, mx += abcd[1]) {
844
6.91M
        for (int x = 0, tmx = mx; x < 8; x++, tmx += abcd[0]) {
845
6.14M
            const int8_t *const filter =
846
6.14M
                dav1d_mc_warp_filter[64 + ((tmx + 512) >> 10)];
847
848
6.14M
            mid_ptr[x] = FILTER_WARP_RND(src, x, filter, 1,
849
6.14M
                                         7 - intermediate_bits);
850
6.14M
        }
851
768k
        src += PXSTRIDE(src_stride);
852
768k
        mid_ptr += 8;
853
768k
    }
854
855
51.2k
    mid_ptr = &mid[3 * 8];
856
461k
    for (int y = 0; y < 8; y++, my += abcd[3]) {
857
3.68M
        for (int x = 0, tmy = my; x < 8; x++, tmy += abcd[2]) {
858
3.27M
            const int8_t *const filter =
859
3.27M
                dav1d_mc_warp_filter[64 + ((tmy + 512) >> 10)];
860
861
3.27M
            tmp[x] = FILTER_WARP_RND(mid_ptr, x, filter, 8, 7) - PREP_BIAS;
862
3.27M
        }
863
409k
        mid_ptr += 8;
864
409k
        tmp += tmp_stride;
865
409k
    }
866
51.2k
}
867
868
static void emu_edge_c(const intptr_t bw, const intptr_t bh,
869
                       const intptr_t iw, const intptr_t ih,
870
                       const intptr_t x, const intptr_t y,
871
                       pixel *dst, const ptrdiff_t dst_stride,
872
                       const pixel *ref, const ptrdiff_t ref_stride)
873
822k
{
874
    // find offset in reference of visible block to copy
875
822k
    ref += iclip((int) y, 0, (int) ih - 1) * PXSTRIDE(ref_stride) +
876
822k
           iclip((int) x, 0, (int) iw - 1);
877
878
    // number of pixels to extend (left, right, top, bottom)
879
822k
    const int left_ext = iclip((int) -x, 0, (int) bw - 1);
880
822k
    const int right_ext = iclip((int) (x + bw - iw), 0, (int) bw - 1);
881
822k
    assert(left_ext + right_ext < bw);
882
822k
    const int top_ext = iclip((int) -y, 0, (int) bh - 1);
883
822k
    const int bottom_ext = iclip((int) (y + bh - ih), 0, (int) bh - 1);
884
822k
    assert(top_ext + bottom_ext < bh);
885
886
    // copy visible portion first
887
822k
    pixel *blk = dst + top_ext * PXSTRIDE(dst_stride);
888
822k
    const int center_w = (int) (bw - left_ext - right_ext);
889
822k
    const int center_h = (int) (bh - top_ext - bottom_ext);
890
10.6M
    for (int y = 0; y < center_h; y++) {
891
9.85M
        pixel_copy(blk + left_ext, ref, center_w);
892
        // extend left edge for this line
893
9.85M
        if (left_ext)
894
2.35M
            pixel_set(blk, blk[left_ext], left_ext);
895
        // extend right edge for this line
896
9.85M
        if (right_ext)
897
6.90M
            pixel_set(blk + left_ext + center_w, blk[left_ext + center_w - 1],
898
6.90M
                      right_ext);
899
9.85M
        ref += PXSTRIDE(ref_stride);
900
9.85M
        blk += PXSTRIDE(dst_stride);
901
9.85M
    }
902
903
    // copy top
904
822k
    blk = dst + top_ext * PXSTRIDE(dst_stride);
905
1.86M
    for (int y = 0; y < top_ext; y++) {
906
1.04M
        pixel_copy(dst, blk, bw);
907
1.04M
        dst += PXSTRIDE(dst_stride);
908
1.04M
    }
909
910
    // copy bottom
911
822k
    dst += center_h * PXSTRIDE(dst_stride);
912
6.00M
    for (int y = 0; y < bottom_ext; y++) {
913
5.17M
        pixel_copy(dst, &dst[-PXSTRIDE(dst_stride)], bw);
914
5.17M
        dst += PXSTRIDE(dst_stride);
915
5.17M
    }
916
822k
}
917
918
static void resize_c(pixel *dst, const ptrdiff_t dst_stride,
919
                     const pixel *src, const ptrdiff_t src_stride,
920
                     const int dst_w, int h, const int src_w,
921
                     const int dx, const int mx0 HIGHBD_DECL_SUFFIX)
922
153k
{
923
5.67M
    do {
924
5.67M
        int mx = mx0, src_x = -1;
925
784M
        for (int x = 0; x < dst_w; x++) {
926
779M
            const int8_t *const F = dav1d_resize_filter[mx >> 8];
927
779M
            dst[x] = iclip_pixel((-(F[0] * src[iclip(src_x - 3, 0, src_w - 1)] +
928
779M
                                    F[1] * src[iclip(src_x - 2, 0, src_w - 1)] +
929
779M
                                    F[2] * src[iclip(src_x - 1, 0, src_w - 1)] +
930
779M
                                    F[3] * src[iclip(src_x + 0, 0, src_w - 1)] +
931
779M
                                    F[4] * src[iclip(src_x + 1, 0, src_w - 1)] +
932
779M
                                    F[5] * src[iclip(src_x + 2, 0, src_w - 1)] +
933
779M
                                    F[6] * src[iclip(src_x + 3, 0, src_w - 1)] +
934
779M
                                    F[7] * src[iclip(src_x + 4, 0, src_w - 1)]) +
935
779M
                                  64) >> 7);
936
779M
            mx += dx;
937
779M
            src_x += mx >> 14;
938
779M
            mx &= 0x3fff;
939
779M
        }
940
941
5.67M
        dst += PXSTRIDE(dst_stride);
942
5.67M
        src += PXSTRIDE(src_stride);
943
5.67M
    } while (--h);
944
153k
}
945
946
#if HAVE_ASM
947
#if ARCH_AARCH64 || ARCH_ARM
948
#include "src/arm/mc.h"
949
#elif ARCH_LOONGARCH64
950
#include "src/loongarch/mc.h"
951
#elif ARCH_PPC64LE
952
#include "src/ppc/mc.h"
953
#elif ARCH_RISCV
954
#include "src/riscv/mc.h"
955
#elif ARCH_X86
956
#include "src/x86/mc.h"
957
#endif
958
#endif
959
960
68.7k
COLD void bitfn(dav1d_mc_dsp_init)(Dav1dMCDSPContext *const c) {
961
687k
#define init_mc_fns(type, name) do { \
962
687k
    c->mc        [type] = put_##name##_c; \
963
687k
    c->mc_scaled [type] = put_##name##_scaled_c; \
964
687k
    c->mct       [type] = prep_##name##_c; \
965
687k
    c->mct_scaled[type] = prep_##name##_scaled_c; \
966
687k
} while (0)
967
968
68.7k
    init_mc_fns(FILTER_2D_8TAP_REGULAR,        8tap_regular);
969
68.7k
    init_mc_fns(FILTER_2D_8TAP_REGULAR_SMOOTH, 8tap_regular_smooth);
970
68.7k
    init_mc_fns(FILTER_2D_8TAP_REGULAR_SHARP,  8tap_regular_sharp);
971
68.7k
    init_mc_fns(FILTER_2D_8TAP_SHARP_REGULAR,  8tap_sharp_regular);
972
68.7k
    init_mc_fns(FILTER_2D_8TAP_SHARP_SMOOTH,   8tap_sharp_smooth);
973
68.7k
    init_mc_fns(FILTER_2D_8TAP_SHARP,          8tap_sharp);
974
68.7k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH_REGULAR, 8tap_smooth_regular);
975
68.7k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH,         8tap_smooth);
976
68.7k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH_SHARP,   8tap_smooth_sharp);
977
68.7k
    init_mc_fns(FILTER_2D_BILINEAR,            bilin);
978
979
68.7k
    c->avg      = avg_c;
980
68.7k
    c->w_avg    = w_avg_c;
981
68.7k
    c->mask     = mask_c;
982
68.7k
    c->blend    = blend_c;
983
68.7k
    c->blend_v  = blend_v_c;
984
68.7k
    c->blend_h  = blend_h_c;
985
68.7k
    c->w_mask[0] = w_mask_444_c;
986
68.7k
    c->w_mask[1] = w_mask_422_c;
987
68.7k
    c->w_mask[2] = w_mask_420_c;
988
68.7k
    c->warp8x8  = warp_affine_8x8_c;
989
68.7k
    c->warp8x8t = warp_affine_8x8t_c;
990
68.7k
    c->emu_edge = emu_edge_c;
991
68.7k
    c->resize   = resize_c;
992
993
#if HAVE_ASM
994
#if ARCH_AARCH64 || ARCH_ARM
995
    mc_dsp_init_arm(c);
996
#elif ARCH_LOONGARCH64
997
    mc_dsp_init_loongarch(c);
998
#elif ARCH_PPC64LE
999
    mc_dsp_init_ppc(c);
1000
#elif ARCH_RISCV
1001
    mc_dsp_init_riscv(c);
1002
#elif ARCH_X86
1003
    mc_dsp_init_x86(c);
1004
#endif
1005
#endif
1006
68.7k
}
dav1d_mc_dsp_init_8bpc
Line
Count
Source
960
30.8k
COLD void bitfn(dav1d_mc_dsp_init)(Dav1dMCDSPContext *const c) {
961
30.8k
#define init_mc_fns(type, name) do { \
962
30.8k
    c->mc        [type] = put_##name##_c; \
963
30.8k
    c->mc_scaled [type] = put_##name##_scaled_c; \
964
30.8k
    c->mct       [type] = prep_##name##_c; \
965
30.8k
    c->mct_scaled[type] = prep_##name##_scaled_c; \
966
30.8k
} while (0)
967
968
30.8k
    init_mc_fns(FILTER_2D_8TAP_REGULAR,        8tap_regular);
969
30.8k
    init_mc_fns(FILTER_2D_8TAP_REGULAR_SMOOTH, 8tap_regular_smooth);
970
30.8k
    init_mc_fns(FILTER_2D_8TAP_REGULAR_SHARP,  8tap_regular_sharp);
971
30.8k
    init_mc_fns(FILTER_2D_8TAP_SHARP_REGULAR,  8tap_sharp_regular);
972
30.8k
    init_mc_fns(FILTER_2D_8TAP_SHARP_SMOOTH,   8tap_sharp_smooth);
973
30.8k
    init_mc_fns(FILTER_2D_8TAP_SHARP,          8tap_sharp);
974
30.8k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH_REGULAR, 8tap_smooth_regular);
975
30.8k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH,         8tap_smooth);
976
30.8k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH_SHARP,   8tap_smooth_sharp);
977
30.8k
    init_mc_fns(FILTER_2D_BILINEAR,            bilin);
978
979
30.8k
    c->avg      = avg_c;
980
30.8k
    c->w_avg    = w_avg_c;
981
30.8k
    c->mask     = mask_c;
982
30.8k
    c->blend    = blend_c;
983
30.8k
    c->blend_v  = blend_v_c;
984
30.8k
    c->blend_h  = blend_h_c;
985
30.8k
    c->w_mask[0] = w_mask_444_c;
986
30.8k
    c->w_mask[1] = w_mask_422_c;
987
30.8k
    c->w_mask[2] = w_mask_420_c;
988
30.8k
    c->warp8x8  = warp_affine_8x8_c;
989
30.8k
    c->warp8x8t = warp_affine_8x8t_c;
990
30.8k
    c->emu_edge = emu_edge_c;
991
30.8k
    c->resize   = resize_c;
992
993
#if HAVE_ASM
994
#if ARCH_AARCH64 || ARCH_ARM
995
    mc_dsp_init_arm(c);
996
#elif ARCH_LOONGARCH64
997
    mc_dsp_init_loongarch(c);
998
#elif ARCH_PPC64LE
999
    mc_dsp_init_ppc(c);
1000
#elif ARCH_RISCV
1001
    mc_dsp_init_riscv(c);
1002
#elif ARCH_X86
1003
    mc_dsp_init_x86(c);
1004
#endif
1005
#endif
1006
30.8k
}
dav1d_mc_dsp_init_16bpc
Line
Count
Source
960
37.9k
COLD void bitfn(dav1d_mc_dsp_init)(Dav1dMCDSPContext *const c) {
961
37.9k
#define init_mc_fns(type, name) do { \
962
37.9k
    c->mc        [type] = put_##name##_c; \
963
37.9k
    c->mc_scaled [type] = put_##name##_scaled_c; \
964
37.9k
    c->mct       [type] = prep_##name##_c; \
965
37.9k
    c->mct_scaled[type] = prep_##name##_scaled_c; \
966
37.9k
} while (0)
967
968
37.9k
    init_mc_fns(FILTER_2D_8TAP_REGULAR,        8tap_regular);
969
37.9k
    init_mc_fns(FILTER_2D_8TAP_REGULAR_SMOOTH, 8tap_regular_smooth);
970
37.9k
    init_mc_fns(FILTER_2D_8TAP_REGULAR_SHARP,  8tap_regular_sharp);
971
37.9k
    init_mc_fns(FILTER_2D_8TAP_SHARP_REGULAR,  8tap_sharp_regular);
972
37.9k
    init_mc_fns(FILTER_2D_8TAP_SHARP_SMOOTH,   8tap_sharp_smooth);
973
37.9k
    init_mc_fns(FILTER_2D_8TAP_SHARP,          8tap_sharp);
974
37.9k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH_REGULAR, 8tap_smooth_regular);
975
37.9k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH,         8tap_smooth);
976
37.9k
    init_mc_fns(FILTER_2D_8TAP_SMOOTH_SHARP,   8tap_smooth_sharp);
977
37.9k
    init_mc_fns(FILTER_2D_BILINEAR,            bilin);
978
979
37.9k
    c->avg      = avg_c;
980
37.9k
    c->w_avg    = w_avg_c;
981
37.9k
    c->mask     = mask_c;
982
37.9k
    c->blend    = blend_c;
983
37.9k
    c->blend_v  = blend_v_c;
984
37.9k
    c->blend_h  = blend_h_c;
985
37.9k
    c->w_mask[0] = w_mask_444_c;
986
37.9k
    c->w_mask[1] = w_mask_422_c;
987
37.9k
    c->w_mask[2] = w_mask_420_c;
988
37.9k
    c->warp8x8  = warp_affine_8x8_c;
989
37.9k
    c->warp8x8t = warp_affine_8x8t_c;
990
37.9k
    c->emu_edge = emu_edge_c;
991
37.9k
    c->resize   = resize_c;
992
993
#if HAVE_ASM
994
#if ARCH_AARCH64 || ARCH_ARM
995
    mc_dsp_init_arm(c);
996
#elif ARCH_LOONGARCH64
997
    mc_dsp_init_loongarch(c);
998
#elif ARCH_PPC64LE
999
    mc_dsp_init_ppc(c);
1000
#elif ARCH_RISCV
1001
    mc_dsp_init_riscv(c);
1002
#elif ARCH_X86
1003
    mc_dsp_init_x86(c);
1004
#endif
1005
#endif
1006
37.9k
}