Coverage Report

Created: 2026-02-14 06:59

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/ffmpeg/libavcodec/h264pred.c
Line
Count
Source
1
/*
2
 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder
3
 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
4
 *
5
 * This file is part of FFmpeg.
6
 *
7
 * FFmpeg is free software; you can redistribute it and/or
8
 * modify it under the terms of the GNU Lesser General Public
9
 * License as published by the Free Software Foundation; either
10
 * version 2.1 of the License, or (at your option) any later version.
11
 *
12
 * FFmpeg is distributed in the hope that it will be useful,
13
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15
 * Lesser General Public License for more details.
16
 *
17
 * You should have received a copy of the GNU Lesser General Public
18
 * License along with FFmpeg; if not, write to the Free Software
19
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20
 */
21
22
/**
23
 * @file
24
 * H.264 / AVC / MPEG-4 part10 prediction functions.
25
 * @author Michael Niedermayer <michaelni@gmx.at>
26
 */
27
28
#include "config.h"
29
#include "libavutil/attributes.h"
30
#include "libavutil/avassert.h"
31
#include "libavutil/intreadwrite.h"
32
#include "codec_id.h"
33
#include "h264pred.h"
34
#include "mathops.h"
35
36
#define BIT_DEPTH 8
37
#include "h264pred_template.c"
38
#undef BIT_DEPTH
39
40
10.0M
#define BIT_DEPTH 9
41
#include "h264pred_template.c"
42
#undef BIT_DEPTH
43
44
30.0M
#define BIT_DEPTH 10
45
#include "h264pred_template.c"
46
#undef BIT_DEPTH
47
48
6.22M
#define BIT_DEPTH 12
49
#include "h264pred_template.c"
50
#undef BIT_DEPTH
51
52
8.85M
#define BIT_DEPTH 14
53
#include "h264pred_template.c"
54
#undef BIT_DEPTH
55
56
/**
 * Fill a 4x4 block with the constant byte 0x7F (127).
 *
 * Each of the four rows is written as one 32-bit word through AV_WN32A.
 *
 * @param src      first pixel of the block to fill
 * @param topright unused
 * @param _stride  distance between the starts of two consecutive rows
 */
static void pred4x4_127_dc_c(uint8_t *src, const uint8_t *topright,
                             ptrdiff_t _stride)
{
    const uint32_t fill = 0x7F7F7F7FU;
    int stride = _stride;
    int row;

    for (row = 0; row < 4; row++)
        AV_WN32A(src + row * stride, fill);
}
67
68
/**
 * Fill a 4x4 block with the constant byte 0x81 (129).
 *
 * Each of the four rows is written as one 32-bit word through AV_WN32A.
 *
 * @param src      first pixel of the block to fill
 * @param topright unused
 * @param _stride  distance between the starts of two consecutive rows
 */
static void pred4x4_129_dc_c(uint8_t *src, const uint8_t *topright,
                             ptrdiff_t _stride)
{
    const uint32_t fill = 0x81818181U;
    int stride = _stride;
    int row;

    for (row = 0; row < 4; row++)
        AV_WN32A(src + row * stride, fill);
}
79
80
static void pred4x4_vertical_vp8_c(uint8_t *src, const uint8_t *topright,
81
                                   ptrdiff_t stride)
82
125k
{
83
125k
    const unsigned lt = src[-1-1*stride];
84
125k
    LOAD_TOP_EDGE
85
125k
    LOAD_TOP_RIGHT_EDGE
86
125k
    uint32_t v = PACK_4U8((lt + 2*t0 + t1 + 2) >> 2,
87
125k
                          (t0 + 2*t1 + t2 + 2) >> 2,
88
125k
                          (t1 + 2*t2 + t3 + 2) >> 2,
89
125k
                          (t2 + 2*t3 + t4 + 2) >> 2);
90
91
125k
    AV_WN32A(src+0*stride, v);
92
125k
    AV_WN32A(src+1*stride, v);
93
125k
    AV_WN32A(src+2*stride, v);
94
125k
    AV_WN32A(src+3*stride, v);
95
125k
}
96
97
static void pred4x4_horizontal_vp8_c(uint8_t *src, const uint8_t *topright,
98
                                     ptrdiff_t stride)
99
110k
{
100
110k
    const unsigned lt = src[-1-1*stride];
101
110k
    LOAD_LEFT_EDGE
102
103
110k
    AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
104
110k
    AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
105
110k
    AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
106
110k
    AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
107
110k
}
108
109
static void pred4x4_down_left_svq3_c(uint8_t *src, const uint8_t *topright,
110
                                     ptrdiff_t stride)
111
674
{
112
674
    LOAD_TOP_EDGE
113
674
    LOAD_LEFT_EDGE
114
115
674
    src[0+0*stride]=(l1 + t1)>>1;
116
674
    src[1+0*stride]=
117
674
    src[0+1*stride]=(l2 + t2)>>1;
118
674
    src[2+0*stride]=
119
674
    src[1+1*stride]=
120
674
    src[0+2*stride]=
121
674
    src[3+0*stride]=
122
674
    src[2+1*stride]=
123
674
    src[1+2*stride]=
124
674
    src[0+3*stride]=
125
674
    src[3+1*stride]=
126
674
    src[2+2*stride]=
127
674
    src[1+3*stride]=
128
674
    src[3+2*stride]=
129
674
    src[2+3*stride]=
130
674
    src[3+3*stride]=(l3 + t3)>>1;
131
674
}
132
133
static void pred4x4_down_left_rv40_c(uint8_t *src, const uint8_t *topright,
134
                                     ptrdiff_t stride)
135
1.16M
{
136
1.16M
    LOAD_TOP_EDGE
137
1.16M
    LOAD_TOP_RIGHT_EDGE
138
1.16M
    LOAD_LEFT_EDGE
139
1.16M
    LOAD_DOWN_LEFT_EDGE
140
141
1.16M
    src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
142
1.16M
    src[1+0*stride]=
143
1.16M
    src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
144
1.16M
    src[2+0*stride]=
145
1.16M
    src[1+1*stride]=
146
1.16M
    src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
147
1.16M
    src[3+0*stride]=
148
1.16M
    src[2+1*stride]=
149
1.16M
    src[1+2*stride]=
150
1.16M
    src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
151
1.16M
    src[3+1*stride]=
152
1.16M
    src[2+2*stride]=
153
1.16M
    src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
154
1.16M
    src[3+2*stride]=
155
1.16M
    src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
156
1.16M
    src[3+3*stride]=(t6 + t7 + 1 + l6 + l7 + 1)>>2;
157
1.16M
}
158
159
static void pred4x4_down_left_rv40_nodown_c(uint8_t *src,
160
                                            const uint8_t *topright,
161
                                            ptrdiff_t stride)
162
4.21M
{
163
4.21M
    LOAD_TOP_EDGE
164
4.21M
    LOAD_TOP_RIGHT_EDGE
165
4.21M
    LOAD_LEFT_EDGE
166
167
4.21M
    src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
168
4.21M
    src[1+0*stride]=
169
4.21M
    src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
170
4.21M
    src[2+0*stride]=
171
4.21M
    src[1+1*stride]=
172
4.21M
    src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + 3*l3 + 2)>>3;
173
4.21M
    src[3+0*stride]=
174
4.21M
    src[2+1*stride]=
175
4.21M
    src[1+2*stride]=
176
4.21M
    src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3*4 + 2)>>3;
177
4.21M
    src[3+1*stride]=
178
4.21M
    src[2+2*stride]=
179
4.21M
    src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l3*4 + 2)>>3;
180
4.21M
    src[3+2*stride]=
181
4.21M
    src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l3*4 + 2)>>3;
182
4.21M
    src[3+3*stride]=(t6 + t7 + 1 + 2*l3 + 1)>>2;
183
4.21M
}
184
185
static void pred4x4_vertical_left_rv40(uint8_t *src, const uint8_t *topright,
186
                                       ptrdiff_t stride,
187
                                       const int l0, const int l1, const int l2,
188
                                       const int l3, const int l4)
189
5.00M
{
190
5.00M
    LOAD_TOP_EDGE
191
5.00M
    LOAD_TOP_RIGHT_EDGE
192
193
5.00M
    src[0+0*stride]=(2*t0 + 2*t1 + l1 + 2*l2 + l3 + 4)>>3;
194
5.00M
    src[1+0*stride]=
195
5.00M
    src[0+2*stride]=(t1 + t2 + 1)>>1;
196
5.00M
    src[2+0*stride]=
197
5.00M
    src[1+2*stride]=(t2 + t3 + 1)>>1;
198
5.00M
    src[3+0*stride]=
199
5.00M
    src[2+2*stride]=(t3 + t4+ 1)>>1;
200
5.00M
    src[3+2*stride]=(t4 + t5+ 1)>>1;
201
5.00M
    src[0+1*stride]=(t0 + 2*t1 + t2 + l2 + 2*l3 + l4 + 4)>>3;
202
5.00M
    src[1+1*stride]=
203
5.00M
    src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
204
5.00M
    src[2+1*stride]=
205
5.00M
    src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
206
5.00M
    src[3+1*stride]=
207
5.00M
    src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
208
5.00M
    src[3+3*stride]=(t4 + 2*t5 + t6 + 2)>>2;
209
5.00M
}
210
211
static void pred4x4_vertical_left_rv40_c(uint8_t *src, const uint8_t *topright,
212
                                         ptrdiff_t stride)
213
963k
{
214
963k
    LOAD_LEFT_EDGE
215
963k
    LOAD_DOWN_LEFT_EDGE
216
217
963k
    pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l4);
218
963k
}
219
220
static void pred4x4_vertical_left_rv40_nodown_c(uint8_t *src,
221
                                                const uint8_t *topright,
222
                                                ptrdiff_t stride)
223
4.03M
{
224
4.03M
    LOAD_LEFT_EDGE
225
226
4.03M
    pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l3);
227
4.03M
}
228
229
static void pred4x4_vertical_left_vp8_c(uint8_t *src, const uint8_t *topright,
230
                                        ptrdiff_t stride)
231
66.1k
{
232
66.1k
    LOAD_TOP_EDGE
233
66.1k
    LOAD_TOP_RIGHT_EDGE
234
235
66.1k
    src[0+0*stride]=(t0 + t1 + 1)>>1;
236
66.1k
    src[1+0*stride]=
237
66.1k
    src[0+2*stride]=(t1 + t2 + 1)>>1;
238
66.1k
    src[2+0*stride]=
239
66.1k
    src[1+2*stride]=(t2 + t3 + 1)>>1;
240
66.1k
    src[3+0*stride]=
241
66.1k
    src[2+2*stride]=(t3 + t4 + 1)>>1;
242
66.1k
    src[0+1*stride]=(t0 + 2*t1 + t2 + 2)>>2;
243
66.1k
    src[1+1*stride]=
244
66.1k
    src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
245
66.1k
    src[2+1*stride]=
246
66.1k
    src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
247
66.1k
    src[3+1*stride]=
248
66.1k
    src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
249
66.1k
    src[3+2*stride]=(t4 + 2*t5 + t6 + 2)>>2;
250
66.1k
    src[3+3*stride]=(t5 + 2*t6 + t7 + 2)>>2;
251
66.1k
}
252
253
static void pred4x4_horizontal_up_rv40_c(uint8_t *src, const uint8_t *topright,
254
                                         ptrdiff_t stride)
255
777k
{
256
777k
    LOAD_LEFT_EDGE
257
777k
    LOAD_DOWN_LEFT_EDGE
258
777k
    LOAD_TOP_EDGE
259
777k
    LOAD_TOP_RIGHT_EDGE
260
261
777k
    src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
262
777k
    src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
263
777k
    src[2+0*stride]=
264
777k
    src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
265
777k
    src[3+0*stride]=
266
777k
    src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
267
777k
    src[2+1*stride]=
268
777k
    src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
269
777k
    src[3+1*stride]=
270
777k
    src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
271
777k
    src[3+2*stride]=
272
777k
    src[1+3*stride]=(l3 + 2*l4 + l5 + 2)>>2;
273
777k
    src[0+3*stride]=
274
777k
    src[2+2*stride]=(t6 + t7 + l3 + l4 + 2)>>2;
275
777k
    src[2+3*stride]=(l4 + l5 + 1)>>1;
276
777k
    src[3+3*stride]=(l4 + 2*l5 + l6 + 2)>>2;
277
777k
}
278
279
static void pred4x4_horizontal_up_rv40_nodown_c(uint8_t *src,
280
                                                const uint8_t *topright,
281
                                                ptrdiff_t stride)
282
3.71M
{
283
3.71M
    LOAD_LEFT_EDGE
284
3.71M
    LOAD_TOP_EDGE
285
3.71M
    LOAD_TOP_RIGHT_EDGE
286
287
3.71M
    src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
288
3.71M
    src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
289
3.71M
    src[2+0*stride]=
290
3.71M
    src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
291
3.71M
    src[3+0*stride]=
292
3.71M
    src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
293
3.71M
    src[2+1*stride]=
294
3.71M
    src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
295
3.71M
    src[3+1*stride]=
296
3.71M
    src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
297
3.71M
    src[3+2*stride]=
298
3.71M
    src[1+3*stride]=l3;
299
3.71M
    src[0+3*stride]=
300
3.71M
    src[2+2*stride]=(t6 + t7 + 2*l3 + 2)>>2;
301
3.71M
    src[2+3*stride]=
302
3.71M
    src[3+3*stride]=l3;
303
3.71M
}
304
305
static void pred4x4_tm_vp8_c(uint8_t *src, const uint8_t *topright,
306
                             ptrdiff_t stride)
307
314k
{
308
314k
    const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP - src[-1-stride];
309
314k
    uint8_t *top = src-stride;
310
314k
    int y;
311
312
1.57M
    for (y = 0; y < 4; y++) {
313
1.25M
        const uint8_t *cm_in = cm + src[-1];
314
1.25M
        src[0] = cm_in[top[0]];
315
1.25M
        src[1] = cm_in[top[1]];
316
1.25M
        src[2] = cm_in[top[2]];
317
1.25M
        src[3] = cm_in[top[3]];
318
1.25M
        src += stride;
319
1.25M
    }
320
314k
}
321
322
/**
 * 16x16 plane prediction entry point installed for SVQ3.
 *
 * Forwards to pred16x16_plane_compat_8_c() with the two trailing
 * arguments set to (1, 0).
 * NOTE(review): those arguments presumably select the SVQ3 and RV40
 * behaviour respectively; confirm against the template.
 *
 * @param src    first pixel of the block to predict
 * @param stride distance between the starts of two consecutive rows
 */
static void pred16x16_plane_svq3_c(uint8_t *src, ptrdiff_t stride)
{
    pred16x16_plane_compat_8_c(src, stride,
                               1, 0);
}
326
327
/**
 * 16x16 plane prediction entry point installed for RV40.
 *
 * Forwards to pred16x16_plane_compat_8_c() with the two trailing
 * arguments set to (0, 1).
 * NOTE(review): those arguments presumably select the SVQ3 and RV40
 * behaviour respectively; confirm against the template.
 *
 * @param src    first pixel of the block to predict
 * @param stride distance between the starts of two consecutive rows
 */
static void pred16x16_plane_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    pred16x16_plane_compat_8_c(src, stride,
                               0, 1);
}
331
332
static void pred16x16_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
333
46.8k
{
334
46.8k
    const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP - src[-1-stride];
335
46.8k
    uint8_t *top = src-stride;
336
46.8k
    int y;
337
338
796k
    for (y = 0; y < 16; y++) {
339
749k
        const uint8_t *cm_in = cm + src[-1];
340
749k
        src[0]  = cm_in[top[0]];
341
749k
        src[1]  = cm_in[top[1]];
342
749k
        src[2]  = cm_in[top[2]];
343
749k
        src[3]  = cm_in[top[3]];
344
749k
        src[4]  = cm_in[top[4]];
345
749k
        src[5]  = cm_in[top[5]];
346
749k
        src[6]  = cm_in[top[6]];
347
749k
        src[7]  = cm_in[top[7]];
348
749k
        src[8]  = cm_in[top[8]];
349
749k
        src[9]  = cm_in[top[9]];
350
749k
        src[10] = cm_in[top[10]];
351
749k
        src[11] = cm_in[top[11]];
352
749k
        src[12] = cm_in[top[12]];
353
749k
        src[13] = cm_in[top[13]];
354
749k
        src[14] = cm_in[top[14]];
355
749k
        src[15] = cm_in[top[15]];
356
749k
        src += stride;
357
749k
    }
358
46.8k
}
359
360
/**
 * RV40 8x8 DC prediction from the left edge only.
 *
 * Averages the eight pixels in the column immediately left of the block
 * (rounded to nearest) and fills the whole 8x8 block with that value.
 *
 * The block is written byte by byte, not through a casted uint32_t
 * pointer: this produces the same bytes while avoiding the strict-aliasing
 * violation and the alignment assumption of the casted store.
 *
 * @param src    first pixel of the block to predict; src[-1 + y*stride]
 *               must be readable for y = 0..7
 * @param stride distance between the starts of two consecutive rows
 */
static void pred8x8_left_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    unsigned sum = 0;
    uint8_t dc;
    int x, y;

    for (y = 0; y < 8; y++)
        sum += src[-1 + y * stride];
    /* sum <= 8 * 255, so the rounded average always fits in one byte. */
    dc = (sum + 4) >> 3;

    for (y = 0; y < 8; y++)
        for (x = 0; x < 8; x++)
            src[x + y * stride] = dc;
}
375
376
/**
 * RV40 8x8 DC prediction from the top edge only.
 *
 * Averages the eight pixels in the row immediately above the block
 * (rounded to nearest) and fills the whole 8x8 block with that value.
 *
 * The block is written byte by byte, not through a casted uint32_t
 * pointer: this produces the same bytes while avoiding the strict-aliasing
 * violation and the alignment assumption of the casted store.
 *
 * @param src    first pixel of the block to predict; src[x - stride]
 *               must be readable for x = 0..7
 * @param stride distance between the starts of two consecutive rows
 */
static void pred8x8_top_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    unsigned sum = 0;
    uint8_t dc;
    int x, y;

    for (x = 0; x < 8; x++)
        sum += src[x - stride];
    /* sum <= 8 * 255, so the rounded average always fits in one byte. */
    dc = (sum + 4) >> 3;

    for (y = 0; y < 8; y++)
        for (x = 0; x < 8; x++)
            src[x + y * stride] = dc;
}
391
392
/**
 * RV40 8x8 DC prediction from both the left and the top edge.
 *
 * Averages the eight pixels left of the block together with the eight
 * pixels above it (sixteen samples, rounded to nearest) and fills the
 * whole 8x8 block with that value.
 *
 * The block is written byte by byte, not through a casted uint32_t
 * pointer: this produces the same bytes while avoiding the strict-aliasing
 * violation and the alignment assumption of the casted store.
 *
 * @param src    first pixel of the block to predict; src[-1 + y*stride]
 *               and src[x - stride] must be readable for x, y = 0..7
 * @param stride distance between the starts of two consecutive rows
 */
static void pred8x8_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    unsigned sum = 0;
    uint8_t dc;
    int i, x, y;

    for (i = 0; i < 8; i++)
        sum += src[-1 + i * stride] + src[i - stride];
    /* sum <= 16 * 255, so the rounded average always fits in one byte. */
    dc = (sum + 8) >> 4;

    for (y = 0; y < 8; y++)
        for (x = 0; x < 8; x++)
            src[x + y * stride] = dc;
}
413
414
static void pred8x8_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
415
89.5k
{
416
89.5k
    const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP - src[-1-stride];
417
89.5k
    uint8_t *top = src-stride;
418
89.5k
    int y;
419
420
806k
    for (y = 0; y < 8; y++) {
421
716k
        const uint8_t *cm_in = cm + src[-1];
422
716k
        src[0] = cm_in[top[0]];
423
716k
        src[1] = cm_in[top[1]];
424
716k
        src[2] = cm_in[top[2]];
425
716k
        src[3] = cm_in[top[3]];
426
716k
        src[4] = cm_in[top[4]];
427
716k
        src[5] = cm_in[top[5]];
428
716k
        src[6] = cm_in[top[6]];
429
716k
        src[7] = cm_in[top[7]];
430
716k
        src += stride;
431
716k
    }
432
89.5k
}
433
434
/**
435
 * Set the intra prediction function pointers.
436
 */
437
av_cold void ff_h264_pred_init(H264PredContext *h, int codec_id,
438
                               const int bit_depth,
439
                               int chroma_format_idc)
440
423k
{
441
423k
#undef FUNC
442
423k
#undef FUNCC
443
1.58M
#define FUNC(a, depth) a ## _ ## depth
444
423k
#define FUNCC(a, depth) a ## _ ## depth ## _c
445
423k
#define FUNCD(a) a ## _c
446
447
423k
#define H264_PRED(depth) \
448
423k
    h->pred4x4[VERT_PRED           ] = FUNCC(pred4x4_vertical,        depth);\
449
423k
    h->pred4x4[HOR_PRED            ] = FUNCC(pred4x4_horizontal,      depth);\
450
423k
    h->pred4x4[DC_PRED             ] = FUNCC(pred4x4_dc,              depth);\
451
423k
    h->pred4x4[DIAG_DOWN_LEFT_PRED ] = FUNCC(pred4x4_down_left,       depth);\
452
423k
    h->pred4x4[DIAG_DOWN_RIGHT_PRED] = FUNCC(pred4x4_down_right,      depth);\
453
423k
    h->pred4x4[VERT_RIGHT_PRED     ] = FUNCC(pred4x4_vertical_right,  depth);\
454
423k
    h->pred4x4[HOR_DOWN_PRED       ] = FUNCC(pred4x4_horizontal_down, depth);\
455
423k
    h->pred4x4[VERT_LEFT_PRED      ] = FUNCC(pred4x4_vertical_left,   depth);\
456
423k
    h->pred4x4[HOR_UP_PRED         ] = FUNCC(pred4x4_horizontal_up,   depth);\
457
423k
    h->pred4x4[LEFT_DC_PRED        ] = FUNCC(pred4x4_left_dc,         depth);\
458
423k
    h->pred4x4[TOP_DC_PRED         ] = FUNCC(pred4x4_top_dc,          depth);\
459
423k
    if (depth > 8 || codec_id != AV_CODEC_ID_VP8)\
460
423k
        h->pred4x4[DC_128_PRED     ] = FUNCC(pred4x4_128_dc,          depth);\
461
423k
\
462
423k
    h->pred8x8l[VERT_PRED           ]= FUNCC(pred8x8l_vertical            , depth);\
463
423k
    h->pred8x8l[HOR_PRED            ]= FUNCC(pred8x8l_horizontal          , depth);\
464
423k
    h->pred8x8l[DC_PRED             ]= FUNCC(pred8x8l_dc                  , depth);\
465
423k
    h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left           , depth);\
466
423k
    h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right          , depth);\
467
423k
    h->pred8x8l[VERT_RIGHT_PRED     ]= FUNCC(pred8x8l_vertical_right      , depth);\
468
423k
    h->pred8x8l[HOR_DOWN_PRED       ]= FUNCC(pred8x8l_horizontal_down     , depth);\
469
423k
    h->pred8x8l[VERT_LEFT_PRED      ]= FUNCC(pred8x8l_vertical_left       , depth);\
470
423k
    h->pred8x8l[HOR_UP_PRED         ]= FUNCC(pred8x8l_horizontal_up       , depth);\
471
423k
    h->pred8x8l[LEFT_DC_PRED        ]= FUNCC(pred8x8l_left_dc             , depth);\
472
423k
    h->pred8x8l[TOP_DC_PRED         ]= FUNCC(pred8x8l_top_dc              , depth);\
473
423k
    h->pred8x8l[DC_128_PRED         ]= FUNCC(pred8x8l_128_dc              , depth);\
474
423k
\
475
423k
    if (chroma_format_idc <= 1) {\
476
258k
        h->pred8x8[VERT_PRED8x8   ]= FUNCC(pred8x8_vertical               , depth);\
477
258k
        h->pred8x8[HOR_PRED8x8    ]= FUNCC(pred8x8_horizontal             , depth);\
478
258k
        h->pred8x8[PLANE_PRED8x8] = FUNCC(pred8x8_plane,       depth);\
479
258k
    } else {\
480
164k
        h->pred8x8[VERT_PRED8x8   ]= FUNCC(pred8x16_vertical              , depth);\
481
164k
        h->pred8x8[HOR_PRED8x8    ]= FUNCC(pred8x16_horizontal            , depth);\
482
164k
        h->pred8x8[PLANE_PRED8x8] = FUNCC(pred8x16_plane,      depth);\
483
164k
    }\
484
423k
    if (depth > 8 || (codec_id != AV_CODEC_ID_RV40 && \
485
162k
                      codec_id != AV_CODEC_ID_VP7  && \
486
395k
                      codec_id != AV_CODEC_ID_VP8)) { \
487
395k
        if (chroma_format_idc <= 1) {\
488
230k
            h->pred8x8[DC_PRED8x8     ]= FUNCC(pred8x8_dc                     , depth);\
489
230k
            h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc                , depth);\
490
230k
            h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc                 , depth);\
491
230k
            h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
492
230k
            h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
493
230k
            h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
494
230k
            h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
495
230k
        } else {\
496
164k
            h->pred8x8[DC_PRED8x8     ]= FUNCC(pred8x16_dc                    , depth);\
497
164k
            h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc               , depth);\
498
164k
            h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc                , depth);\
499
164k
            h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l0t, depth);\
500
164k
            h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0lt, depth);\
501
164k
            h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l00, depth);\
502
164k
            h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0l0, depth);\
503
164k
        }\
504
395k
    }else{\
505
28.0k
        h->pred8x8[DC_PRED8x8     ]= FUNCD(pred8x8_dc_rv40);\
506
28.0k
        h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
507
28.0k
        h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
508
28.0k
    }\
509
423k
    if (chroma_format_idc <= 1) {\
510
258k
        h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc                 , depth);\
511
258k
    } else {\
512
164k
        h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc                , depth);\
513
164k
    }\
514
423k
\
515
423k
    h->pred16x16[DC_PRED8x8     ]= FUNCC(pred16x16_dc                     , depth);\
516
423k
    h->pred16x16[VERT_PRED8x8   ]= FUNCC(pred16x16_vertical               , depth);\
517
423k
    h->pred16x16[HOR_PRED8x8    ]= FUNCC(pred16x16_horizontal             , depth);\
518
423k
    h->pred16x16[PLANE_PRED8x8  ]= FUNCC(pred16x16_plane                  , depth);\
519
423k
    h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc                , depth);\
520
423k
    h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc                 , depth);\
521
423k
    h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc                 , depth);\
522
423k
\
523
    /* special lossless h/v prediction for H.264 */ \
524
423k
    h->pred4x4_add  [VERT_PRED   ]= FUNCC(pred4x4_vertical_add            , depth);\
525
423k
    h->pred4x4_add  [ HOR_PRED   ]= FUNCC(pred4x4_horizontal_add          , depth);\
526
423k
    h->pred8x8l_add [VERT_PRED   ]= FUNCC(pred8x8l_vertical_add           , depth);\
527
423k
    h->pred8x8l_add [ HOR_PRED   ]= FUNCC(pred8x8l_horizontal_add         , depth);\
528
423k
    h->pred8x8l_filter_add [VERT_PRED   ]= FUNCC(pred8x8l_vertical_filter_add           , depth);\
529
423k
    h->pred8x8l_filter_add [ HOR_PRED   ]= FUNCC(pred8x8l_horizontal_filter_add         , depth);\
530
423k
    if (chroma_format_idc <= 1) {\
531
258k
        h->pred8x8_add[VERT_PRED8x8] = FUNCC(pred8x8_vertical_add,    depth);\
532
258k
        h->pred8x8_add[ HOR_PRED8x8] = FUNCC(pred8x8_horizontal_add,  depth);\
533
258k
    } else {\
534
164k
        h->pred8x8_add  [VERT_PRED8x8]= FUNCC(pred8x16_vertical_add            , depth);\
535
164k
        h->pred8x8_add  [ HOR_PRED8x8]= FUNCC(pred8x16_horizontal_add          , depth);\
536
164k
    }\
537
423k
    h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add          , depth);\
538
423k
    h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add        , depth);\
539
423k
540
423k
    switch (bit_depth) {
541
63.1k
        case 9:
542
63.1k
            H264_PRED(9)
543
63.1k
            break;
544
33.3k
        case 10:
545
33.3k
            H264_PRED(10)
546
33.3k
            break;
547
100k
        case 12:
548
100k
            H264_PRED(12)
549
100k
            break;
550
63.3k
        case 14:
551
63.3k
            H264_PRED(14)
552
63.3k
            break;
553
162k
        default:
554
162k
            av_assert0(bit_depth<=8);
555
162k
            H264_PRED(8)
556
162k
            switch (codec_id) {
557
2.60k
            case AV_CODEC_ID_SVQ3:
558
2.60k
                h->pred4x4[DIAG_DOWN_LEFT_PRED] = FUNCD(pred4x4_down_left_svq3);
559
2.60k
                h->pred16x16[PLANE_PRED8x8    ] = FUNCD(pred16x16_plane_svq3);
560
2.60k
                break;
561
9.88k
            case AV_CODEC_ID_RV40:
562
9.88k
                h->pred4x4[DIAG_DOWN_LEFT_PRED] = FUNCD(pred4x4_down_left_rv40);
563
9.88k
                h->pred4x4[VERT_LEFT_PRED     ] = FUNCD(pred4x4_vertical_left_rv40);
564
9.88k
                h->pred4x4[HOR_UP_PRED        ] = FUNCD(pred4x4_horizontal_up_rv40);
565
9.88k
                h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN] = FUNCD(pred4x4_down_left_rv40_nodown);
566
9.88k
                h->pred4x4[HOR_UP_PRED_RV40_NODOWN] = FUNCD(pred4x4_horizontal_up_rv40_nodown);
567
9.88k
                h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN] = FUNCD(pred4x4_vertical_left_rv40_nodown);
568
9.88k
                h->pred16x16[PLANE_PRED8x8    ] = FUNCD(pred16x16_plane_rv40);
569
9.88k
                break;
570
7.32k
            case AV_CODEC_ID_VP7:
571
18.2k
            case AV_CODEC_ID_VP8:
572
18.2k
                h->pred4x4[VERT_PRED       ] = FUNCD(pred4x4_vertical_vp8);
573
18.2k
                h->pred4x4[HOR_PRED        ] = FUNCD(pred4x4_horizontal_vp8);
574
18.2k
                h->pred4x4[VERT_LEFT_PRED  ] = FUNCD(pred4x4_vertical_left_vp8);
575
18.2k
                h->pred4x4[TM_VP8_PRED     ] = FUNCD(pred4x4_tm_vp8);
576
18.2k
                h->pred4x4[VERT_VP8_PRED   ] = FUNCC(pred4x4_vertical, 8);
577
18.2k
                h->pred4x4[DC_127_PRED     ] = FUNCD(pred4x4_127_dc);
578
18.2k
                h->pred4x4[DC_129_PRED     ] = FUNCD(pred4x4_129_dc);
579
18.2k
                h->pred4x4[HOR_VP8_PRED    ] = FUNCC(pred4x4_horizontal, 8);
580
18.2k
                h->pred8x8[PLANE_PRED8x8   ] = FUNCD(pred8x8_tm_vp8);
581
18.2k
                h->pred8x8[DC_127_PRED8x8  ] = FUNCC(pred8x8_127_dc, 8);
582
18.2k
                h->pred8x8[DC_129_PRED8x8  ] = FUNCC(pred8x8_129_dc, 8);
583
18.2k
                h->pred16x16[PLANE_PRED8x8 ] = FUNCD(pred16x16_tm_vp8);
584
18.2k
                h->pred16x16[DC_127_PRED8x8] = FUNCC(pred16x16_127_dc, 8);
585
18.2k
                h->pred16x16[DC_129_PRED8x8] = FUNCC(pred16x16_129_dc, 8);
586
18.2k
                break;
587
162k
            }
588
162k
            break;
589
423k
    }
590
591
#if ARCH_AARCH64
592
    ff_h264_pred_init_aarch64(h, codec_id, bit_depth, chroma_format_idc);
593
#elif ARCH_ARM
594
    ff_h264_pred_init_arm(h, codec_id, bit_depth, chroma_format_idc);
595
#elif ARCH_X86 && HAVE_X86ASM
596
    ff_h264_pred_init_x86(h, codec_id, bit_depth, chroma_format_idc);
597
#elif ARCH_MIPS
598
    ff_h264_pred_init_mips(h, codec_id, bit_depth, chroma_format_idc);
599
#elif ARCH_LOONGARCH
600
    ff_h264_pred_init_loongarch(h, codec_id, bit_depth, chroma_format_idc);
601
#endif
602
423k
}