Coverage Report

Created: 2026-01-25 07:18

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/ffmpeg/libswscale/rgb2rgb_template.c
Line
Count
Source
1
/*
2
 * software RGB to RGB converter
3
 * pluralize by software PAL8 to RGB converter
4
 *              software YUV to YUV converter
5
 *              software YUV to RGB converter
6
 * Written by Nick Kurshev.
7
 * palette & YUV & runtime CPU stuff by Michael (michaelni@gmx.at)
8
 * lot of big-endian byte order fixes by Alex Beregszaszi
9
 *
10
 * This file is part of FFmpeg.
11
 *
12
 * FFmpeg is free software; you can redistribute it and/or
13
 * modify it under the terms of the GNU Lesser General Public
14
 * License as published by the Free Software Foundation; either
15
 * version 2.1 of the License, or (at your option) any later version.
16
 *
17
 * FFmpeg is distributed in the hope that it will be useful,
18
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
20
 * Lesser General Public License for more details.
21
 *
22
 * You should have received a copy of the GNU Lesser General Public
23
 * License along with FFmpeg; if not, write to the Free Software
24
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
25
 */
26
27
#include <stddef.h>
28
29
#include "libavutil/attributes.h"
30
31
static inline void rgb24tobgr32_c(const uint8_t *src, uint8_t *dst,
32
                                  int src_size)
33
0
{
34
0
    uint8_t *dest      = dst;
35
0
    const uint8_t *s   = src;
36
0
    const uint8_t *end = s + src_size;
37
38
0
    while (s < end) {
39
#if HAVE_BIGENDIAN
40
        /* RGB24 (= R, G, B) -> RGB32 (= A, B, G, R) */
41
        *dest++  = 255;
42
        *dest++  = s[2];
43
        *dest++  = s[1];
44
        *dest++  = s[0];
45
        s       += 3;
46
#else
47
0
        *dest++  = *s++;
48
0
        *dest++  = *s++;
49
0
        *dest++  = *s++;
50
0
        *dest++  = 255;
51
0
#endif
52
0
    }
53
0
}
54
55
static inline void rgb32tobgr24_c(const uint8_t *src, uint8_t *dst,
56
                                  int src_size)
57
0
{
58
0
    uint8_t *dest      = dst;
59
0
    const uint8_t *s   = src;
60
0
    const uint8_t *end = s + src_size;
61
62
0
    while (s < end) {
63
#if HAVE_BIGENDIAN
64
        /* RGB32 (= A, B, G, R) -> RGB24 (= R, G, B) */
65
        s++;
66
        dest[2]  = *s++;
67
        dest[1]  = *s++;
68
        dest[0]  = *s++;
69
        dest    += 3;
70
#else
71
0
        *dest++  = *s++;
72
0
        *dest++  = *s++;
73
0
        *dest++  = *s++;
74
0
        s++;
75
0
#endif
76
0
    }
77
0
}
78
79
/*
80
 * original by Strepto/Astral
81
 * ported to gcc & bugfixed: A'rpi
82
 * MMXEXT, 3DNOW optimization by Nick Kurshev
83
 * 32-bit C version, and and&add trick by Michael Niedermayer
84
 */
85
static inline void rgb15to16_c(const uint8_t *src, uint8_t *dst, int src_size)
86
0
{
87
0
    register uint8_t *d         = dst;
88
0
    register const uint8_t *s   = src;
89
0
    register const uint8_t *end = s + src_size;
90
0
    const uint8_t *mm_end       = end - 3;
91
92
0
    while (s < mm_end) {
93
0
        register unsigned x = *((const uint32_t *)s);
94
0
        *((uint32_t *)d)    = (x & 0x7FFF7FFF) + (x & 0x7FE07FE0);
95
0
        d += 4;
96
0
        s += 4;
97
0
    }
98
0
    if (s < end) {
99
0
        register unsigned short x = *((const uint16_t *)s);
100
0
        *((uint16_t *)d)          = (x & 0x7FFF) + (x & 0x7FE0);
101
0
    }
102
0
}
103
104
static inline void rgb16to15_c(const uint8_t *src, uint8_t *dst, int src_size)
105
0
{
106
0
    register uint8_t *d         = dst;
107
0
    register const uint8_t *s   = src;
108
0
    register const uint8_t *end = s + src_size;
109
0
    const uint8_t *mm_end       = end - 3;
110
111
0
    while (s < mm_end) {
112
0
        register uint32_t x  = *((const uint32_t *)s);
113
0
        *((uint32_t *)d)     = ((x >> 1) & 0x7FE07FE0) | (x & 0x001F001F);
114
0
        s                   += 4;
115
0
        d                   += 4;
116
0
    }
117
0
    if (s < end) {
118
0
        register uint16_t x = *((const uint16_t *)s);
119
0
        *((uint16_t *)d)    = ((x >> 1) & 0x7FE0) | (x & 0x001F);
120
0
    }
121
0
}
122
123
static inline void rgb32to16_c(const uint8_t *src, uint8_t *dst, int src_size)
124
0
{
125
0
    uint16_t *d        = (uint16_t *)dst;
126
0
    const uint8_t *s   = src;
127
0
    const uint8_t *end = s + src_size;
128
129
0
    while (s < end) {
130
0
        register int rgb  = *(const uint32_t *)s;
131
0
        s                += 4;
132
0
        *d++              = ((rgb & 0xFF)     >> 3) +
133
0
                            ((rgb & 0xFC00)   >> 5) +
134
0
                            ((rgb & 0xF80000) >> 8);
135
0
    }
136
0
}
137
138
static inline void rgb32tobgr16_c(const uint8_t *src, uint8_t *dst,
139
                                  int src_size)
140
0
{
141
0
    uint16_t *d        = (uint16_t *)dst;
142
0
    const uint8_t *s   = src;
143
0
    const uint8_t *end = s + src_size;
144
145
0
    while (s < end) {
146
0
        register int rgb  = *(const uint32_t *)s;
147
0
        s                += 4;
148
0
        *d++              = ((rgb & 0xF8)     << 8) +
149
0
                            ((rgb & 0xFC00)   >> 5) +
150
0
                            ((rgb & 0xF80000) >> 19);
151
0
    }
152
0
}
153
154
static inline void rgb32to15_c(const uint8_t *src, uint8_t *dst, int src_size)
155
0
{
156
0
    uint16_t *d        = (uint16_t *)dst;
157
0
    const uint8_t *s   = src;
158
0
    const uint8_t *end = s + src_size;
159
160
0
    while (s < end) {
161
0
        register int rgb  = *(const uint32_t *)s;
162
0
        s                += 4;
163
0
        *d++              = ((rgb & 0xFF)     >> 3) +
164
0
                            ((rgb & 0xF800)   >> 6) +
165
0
                            ((rgb & 0xF80000) >> 9);
166
0
    }
167
0
}
168
169
static inline void rgb32tobgr15_c(const uint8_t *src, uint8_t *dst,
170
                                  int src_size)
171
0
{
172
0
    uint16_t *d        = (uint16_t *)dst;
173
0
    const uint8_t *s   = src;
174
0
    const uint8_t *end = s + src_size;
175
176
0
    while (s < end) {
177
0
        register int rgb  = *(const uint32_t *)s;
178
0
        s                += 4;
179
0
        *d++              = ((rgb & 0xF8)     <<  7) +
180
0
                            ((rgb & 0xF800)   >>  6) +
181
0
                            ((rgb & 0xF80000) >> 19);
182
0
    }
183
0
}
184
185
static inline void rgb24tobgr16_c(const uint8_t *src, uint8_t *dst,
186
                                  int src_size)
187
0
{
188
0
    uint16_t *d        = (uint16_t *)dst;
189
0
    const uint8_t *s   = src;
190
0
    const uint8_t *end = s + src_size;
191
192
0
    while (s < end) {
193
0
        const int b = *s++;
194
0
        const int g = *s++;
195
0
        const int r = *s++;
196
0
        *d++        = (b >> 3) | ((g & 0xFC) << 3) | ((r & 0xF8) << 8);
197
0
    }
198
0
}
199
200
static inline void rgb24to16_c(const uint8_t *src, uint8_t *dst, int src_size)
201
0
{
202
0
    uint16_t *d        = (uint16_t *)dst;
203
0
    const uint8_t *s   = src;
204
0
    const uint8_t *end = s + src_size;
205
206
0
    while (s < end) {
207
0
        const int r = *s++;
208
0
        const int g = *s++;
209
0
        const int b = *s++;
210
0
        *d++        = (b >> 3) | ((g & 0xFC) << 3) | ((r & 0xF8) << 8);
211
0
    }
212
0
}
213
214
static inline void rgb24tobgr15_c(const uint8_t *src, uint8_t *dst,
215
                                  int src_size)
216
0
{
217
0
    uint16_t *d        = (uint16_t *)dst;
218
0
    const uint8_t *s   = src;
219
0
    const uint8_t *end = s + src_size;
220
221
0
    while (s < end) {
222
0
        const int b = *s++;
223
0
        const int g = *s++;
224
0
        const int r = *s++;
225
0
        *d++        = (b >> 3) | ((g & 0xF8) << 2) | ((r & 0xF8) << 7);
226
0
    }
227
0
}
228
229
static inline void rgb24to15_c(const uint8_t *src, uint8_t *dst, int src_size)
230
0
{
231
0
    uint16_t *d        = (uint16_t *)dst;
232
0
    const uint8_t *s   = src;
233
0
    const uint8_t *end = s + src_size;
234
235
0
    while (s < end) {
236
0
        const int r = *s++;
237
0
        const int g = *s++;
238
0
        const int b = *s++;
239
0
        *d++        = (b >> 3) | ((g & 0xF8) << 2) | ((r & 0xF8) << 7);
240
0
    }
241
0
}
242
243
static inline void rgb15tobgr24_c(const uint8_t *src, uint8_t *dst,
244
                                  int src_size)
245
0
{
246
0
    uint8_t *d          = dst;
247
0
    const uint16_t *s   = (const uint16_t *)src;
248
0
    const uint16_t *end = s + src_size / 2;
249
250
0
    while (s < end) {
251
0
        register uint16_t bgr = *s++;
252
0
        *d++ = ((bgr&0x001F)<<3) | ((bgr&0x001F)>> 2);
253
0
        *d++ = ((bgr&0x03E0)>>2) | ((bgr&0x03E0)>> 7);
254
0
        *d++ = ((bgr&0x7C00)>>7) | ((bgr&0x7C00)>>12);
255
0
    }
256
0
}
257
258
static inline void rgb16tobgr24_c(const uint8_t *src, uint8_t *dst,
259
                                  int src_size)
260
0
{
261
0
    uint8_t *d          = (uint8_t *)dst;
262
0
    const uint16_t *s   = (const uint16_t *)src;
263
0
    const uint16_t *end = s + src_size / 2;
264
265
0
    while (s < end) {
266
0
        register uint16_t bgr = *s++;
267
0
        *d++ = ((bgr&0x001F)<<3) | ((bgr&0x001F)>> 2);
268
0
        *d++ = ((bgr&0x07E0)>>3) | ((bgr&0x07E0)>> 9);
269
0
        *d++ = ((bgr&0xF800)>>8) | ((bgr&0xF800)>>13);
270
0
    }
271
0
}
272
273
static inline void rgb15to32_c(const uint8_t *src, uint8_t *dst, int src_size)
274
0
{
275
0
    uint8_t *d          = dst;
276
0
    const uint16_t *s   = (const uint16_t *)src;
277
0
    const uint16_t *end = s + src_size / 2;
278
279
0
    while (s < end) {
280
0
        register uint16_t bgr = *s++;
281
#if HAVE_BIGENDIAN
282
        *d++ = 255;
283
        *d++ = ((bgr&0x7C00)>>7) | ((bgr&0x7C00)>>12);
284
        *d++ = ((bgr&0x03E0)>>2) | ((bgr&0x03E0)>> 7);
285
        *d++ = ((bgr&0x001F)<<3) | ((bgr&0x001F)>> 2);
286
#else
287
0
        *d++ = ((bgr&0x001F)<<3) | ((bgr&0x001F)>> 2);
288
0
        *d++ = ((bgr&0x03E0)>>2) | ((bgr&0x03E0)>> 7);
289
0
        *d++ = ((bgr&0x7C00)>>7) | ((bgr&0x7C00)>>12);
290
0
        *d++ = 255;
291
0
#endif
292
0
    }
293
0
}
294
295
static inline void rgb16to32_c(const uint8_t *src, uint8_t *dst, int src_size)
296
0
{
297
0
    uint8_t *d          = dst;
298
0
    const uint16_t *s   = (const uint16_t *)src;
299
0
    const uint16_t *end = s + src_size / 2;
300
301
0
    while (s < end) {
302
0
        register uint16_t bgr = *s++;
303
#if HAVE_BIGENDIAN
304
        *d++ = 255;
305
        *d++ = ((bgr&0xF800)>>8) | ((bgr&0xF800)>>13);
306
        *d++ = ((bgr&0x07E0)>>3) | ((bgr&0x07E0)>> 9);
307
        *d++ = ((bgr&0x001F)<<3) | ((bgr&0x001F)>> 2);
308
#else
309
0
        *d++ = ((bgr&0x001F)<<3) | ((bgr&0x001F)>> 2);
310
0
        *d++ = ((bgr&0x07E0)>>3) | ((bgr&0x07E0)>> 9);
311
0
        *d++ = ((bgr&0xF800)>>8) | ((bgr&0xF800)>>13);
312
0
        *d++ = 255;
313
0
#endif
314
0
    }
315
0
}
316
317
static inline void shuffle_bytes_2103_c(const uint8_t *src, uint8_t *dst,
318
                                        int src_size)
319
0
{
320
0
    int idx          = 15  - src_size;
321
0
    const uint8_t *s = src - idx;
322
0
    uint8_t *d       = dst - idx;
323
324
0
    for (; idx < 15; idx += 4) {
325
0
        register unsigned v   = *(const uint32_t *)&s[idx], g = v & 0xff00ff00;
326
0
        v                    &= 0xff00ff;
327
0
        *(uint32_t *)&d[idx]  = (v >> 16) + g + (v << 16);
328
0
    }
329
0
}
330
331
static inline void shuffle_bytes_0321_c(const uint8_t *src, uint8_t *dst,
332
                                        int src_size)
333
0
{
334
0
    int idx          = 15  - src_size;
335
0
    const uint8_t *s = src - idx;
336
0
    uint8_t *d       = dst - idx;
337
338
0
    for (; idx < 15; idx += 4) {
339
0
        register unsigned v   = *(const uint32_t *)&s[idx], g = v & 0x00ff00ff;
340
0
        v                    &= 0xff00ff00;
341
0
        *(uint32_t *)&d[idx]  = (v >> 16) + g + (v << 16);
342
0
    }
343
0
}
344
345
#define DEFINE_SHUFFLE_BYTES(name, a, b, c, d)                          \
346
static void shuffle_bytes_##name (const uint8_t *src,                   \
347
0
                                        uint8_t *dst, int src_size)     \
348
0
{                                                                       \
349
0
    int i;                                                              \
350
0
                                                                        \
351
0
    for (i = 0; i < src_size; i += 4) {                                 \
352
0
        dst[i + 0] = src[i + a];                                        \
353
0
        dst[i + 1] = src[i + b];                                        \
354
0
        dst[i + 2] = src[i + c];                                        \
355
0
        dst[i + 3] = src[i + d];                                        \
356
0
    }                                                                   \
357
0
}
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_1230_c
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_3012_c
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_3210_c
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_3102_c
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_2013_c
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_2130_c
Unexecuted instantiation: rgb2rgb.c:shuffle_bytes_1203_c
358
359
DEFINE_SHUFFLE_BYTES(1230_c, 1, 2, 3, 0)
360
DEFINE_SHUFFLE_BYTES(3012_c, 3, 0, 1, 2)
361
DEFINE_SHUFFLE_BYTES(3210_c, 3, 2, 1, 0)
362
DEFINE_SHUFFLE_BYTES(3102_c, 3, 1, 0, 2)
363
DEFINE_SHUFFLE_BYTES(2013_c, 2, 0, 1, 3)
364
DEFINE_SHUFFLE_BYTES(2130_c, 2, 1, 3, 0)
365
DEFINE_SHUFFLE_BYTES(1203_c, 1, 2, 0, 3)
366
367
static inline void rgb24tobgr24_c(const uint8_t *src, uint8_t *dst, int src_size)
368
0
{
369
0
    unsigned i;
370
371
0
    for (i = 0; i < src_size; i += 3) {
372
0
        register uint8_t x = src[i + 2];
373
0
        dst[i + 1]         = src[i + 1];
374
0
        dst[i + 2]         = src[i + 0];
375
0
        dst[i + 0]         = x;
376
0
    }
377
0
}
378
379
static inline void yuvPlanartoyuy2_c(const uint8_t *ysrc, const uint8_t *usrc,
380
                                     const uint8_t *vsrc, uint8_t *dst,
381
                                     int width, int height,
382
                                     int lumStride, int chromStride,
383
                                     int dstStride, int vertLumPerChroma)
384
0
{
385
0
    int y, i;
386
0
    const int chromWidth = width >> 1;
387
388
0
    for (y = 0; y < height; y++) {
389
0
#if HAVE_FAST_64BIT
390
0
        uint64_t *ldst = (uint64_t *)dst;
391
0
        const uint8_t *yc = ysrc, *uc = usrc, *vc = vsrc;
392
0
        for (i = 0; i < chromWidth; i += 2) {
393
0
            uint64_t k = yc[0] + (uc[0] << 8) +
394
0
                         (yc[1] << 16) + ((unsigned) vc[0] << 24);
395
0
            uint64_t l = yc[2] + (uc[1] << 8) +
396
0
                         (yc[3] << 16) + ((unsigned) vc[1] << 24);
397
0
            *ldst++ = k + (l << 32);
398
0
            yc     += 4;
399
0
            uc     += 2;
400
0
            vc     += 2;
401
0
        }
402
403
#else
404
        int *idst = (int32_t *)dst;
405
        const uint8_t *yc = ysrc, *uc = usrc, *vc = vsrc;
406
407
        for (i = 0; i < chromWidth; i++) {
408
#if HAVE_BIGENDIAN
409
            *idst++ = (yc[0] << 24) + (uc[0] << 16) +
410
                      (yc[1] <<  8) + (vc[0] <<  0);
411
#else
412
            *idst++ = yc[0] + (uc[0] << 8) +
413
                      (yc[1] << 16) + (vc[0] << 24);
414
#endif
415
            yc += 2;
416
            uc++;
417
            vc++;
418
        }
419
#endif
420
0
        if ((y & (vertLumPerChroma - 1)) == vertLumPerChroma - 1) {
421
0
            usrc += chromStride;
422
0
            vsrc += chromStride;
423
0
        }
424
0
        ysrc += lumStride;
425
0
        dst  += dstStride;
426
0
    }
427
0
}
428
429
/**
430
 * Height should be a multiple of 2 and width should be a multiple of 16.
431
 * (If this is a problem for anyone then tell me, and I will fix it.)
432
 */
433
static inline void yv12toyuy2_c(const uint8_t *ysrc, const uint8_t *usrc,
434
                                const uint8_t *vsrc, uint8_t *dst,
435
                                int width, int height, int lumStride,
436
                                int chromStride, int dstStride)
437
0
{
438
    //FIXME interpolate chroma
439
0
    yuvPlanartoyuy2_c(ysrc, usrc, vsrc, dst, width, height, lumStride,
440
0
                      chromStride, dstStride, 2);
441
0
}
442
443
static inline void yuvPlanartouyvy_c(const uint8_t *ysrc, const uint8_t *usrc,
444
                                     const uint8_t *vsrc, uint8_t *dst,
445
                                     int width, int height,
446
                                     int lumStride, int chromStride,
447
                                     int dstStride, int vertLumPerChroma)
448
0
{
449
0
    int y, i;
450
0
    const int chromWidth = width >> 1;
451
452
0
    for (y = 0; y < height; y++) {
453
0
#if HAVE_FAST_64BIT
454
0
        uint64_t *ldst = (uint64_t *)dst;
455
0
        const uint8_t *yc = ysrc, *uc = usrc, *vc = vsrc;
456
0
        for (i = 0; i < chromWidth; i += 2) {
457
0
            uint64_t k = uc[0] + (yc[0] << 8) +
458
0
                         (vc[0] << 16) + ((unsigned) yc[1] << 24);
459
0
            uint64_t l = uc[1] + (yc[2] << 8) +
460
0
                         (vc[1] << 16) + ((unsigned) yc[3] << 24);
461
0
            *ldst++ = k + (l << 32);
462
0
            yc     += 4;
463
0
            uc     += 2;
464
0
            vc     += 2;
465
0
        }
466
467
#else
468
        int *idst = (int32_t *)dst;
469
        const uint8_t *yc = ysrc, *uc = usrc, *vc = vsrc;
470
471
        for (i = 0; i < chromWidth; i++) {
472
#if HAVE_BIGENDIAN
473
            *idst++ = (uc[0] << 24) + (yc[0] << 16) +
474
                      (vc[0] <<  8) + (yc[1] <<  0);
475
#else
476
            *idst++ = uc[0] + (yc[0] << 8) +
477
                      (vc[0] << 16) + (yc[1] << 24);
478
#endif
479
            yc += 2;
480
            uc++;
481
            vc++;
482
        }
483
#endif
484
0
        if ((y & (vertLumPerChroma - 1)) == vertLumPerChroma - 1) {
485
0
            usrc += chromStride;
486
0
            vsrc += chromStride;
487
0
        }
488
0
        ysrc += lumStride;
489
0
        dst  += dstStride;
490
0
    }
491
0
}
492
493
/**
494
 * Height should be a multiple of 2 and width should be a multiple of 16
495
 * (If this is a problem for anyone then tell me, and I will fix it.)
496
 */
497
static inline void yv12touyvy_c(const uint8_t *ysrc, const uint8_t *usrc,
498
                                const uint8_t *vsrc, uint8_t *dst,
499
                                int width, int height, int lumStride,
500
                                int chromStride, int dstStride)
501
0
{
502
    //FIXME interpolate chroma
503
0
    yuvPlanartouyvy_c(ysrc, usrc, vsrc, dst, width, height, lumStride,
504
0
                      chromStride, dstStride, 2);
505
0
}
506
507
/**
508
 * Width should be a multiple of 16.
509
 */
510
static inline void yuv422ptouyvy_c(const uint8_t *ysrc, const uint8_t *usrc,
511
                                   const uint8_t *vsrc, uint8_t *dst,
512
                                   int width, int height, int lumStride,
513
                                   int chromStride, int dstStride)
514
0
{
515
0
    yuvPlanartouyvy_c(ysrc, usrc, vsrc, dst, width, height, lumStride,
516
0
                      chromStride, dstStride, 1);
517
0
}
518
519
/**
520
 * Width should be a multiple of 16.
521
 */
522
static inline void yuv422ptoyuy2_c(const uint8_t *ysrc, const uint8_t *usrc,
523
                                   const uint8_t *vsrc, uint8_t *dst,
524
                                   int width, int height, int lumStride,
525
                                   int chromStride, int dstStride)
526
0
{
527
0
    yuvPlanartoyuy2_c(ysrc, usrc, vsrc, dst, width, height, lumStride,
528
0
                      chromStride, dstStride, 1);
529
0
}
530
531
/**
532
 * Height should be a multiple of 2 and width should be a multiple of 16.
533
 * (If this is a problem for anyone then tell me, and I will fix it.)
534
 */
535
static inline void yuy2toyv12_c(const uint8_t *src, uint8_t *ydst,
536
                                uint8_t *udst, uint8_t *vdst,
537
                                int width, int height, int lumStride,
538
                                int chromStride, int srcStride)
539
0
{
540
0
    int y;
541
0
    const int chromWidth = width >> 1;
542
543
0
    for (y = 0; y < height; y += 2) {
544
0
        int i;
545
0
        for (i = 0; i < chromWidth; i++) {
546
0
            ydst[2 * i + 0] = src[4 * i + 0];
547
0
            udst[i]         = src[4 * i + 1];
548
0
            ydst[2 * i + 1] = src[4 * i + 2];
549
0
            vdst[i]         = src[4 * i + 3];
550
0
        }
551
0
        ydst += lumStride;
552
0
        src  += srcStride;
553
554
0
        for (i = 0; i < chromWidth; i++) {
555
0
            ydst[2 * i + 0] = src[4 * i + 0];
556
0
            ydst[2 * i + 1] = src[4 * i + 2];
557
0
        }
558
0
        udst += chromStride;
559
0
        vdst += chromStride;
560
0
        ydst += lumStride;
561
0
        src  += srcStride;
562
0
    }
563
0
}
564
565
static inline void planar2x_c(const uint8_t *src, uint8_t *dst, int srcWidth,
566
                              int srcHeight, int srcStride, int dstStride)
567
0
{
568
0
    int x, y;
569
570
0
    dst[0] = src[0];
571
572
    // first line
573
0
    for (x = 0; x < srcWidth - 1; x++) {
574
0
        dst[2 * x + 1] = (3 * src[x] + src[x + 1]) >> 2;
575
0
        dst[2 * x + 2] = (src[x] + 3 * src[x + 1]) >> 2;
576
0
    }
577
0
    dst[2 * srcWidth - 1] = src[srcWidth - 1];
578
579
0
    dst += dstStride;
580
581
0
    for (y = 1; y < srcHeight; y++) {
582
0
        const int mmxSize = 1;
583
584
0
        dst[0]         = (src[0] * 3 + src[srcStride]) >> 2;
585
0
        dst[dstStride] = (src[0] + 3 * src[srcStride]) >> 2;
586
587
0
        for (x = mmxSize - 1; x < srcWidth - 1; x++) {
588
0
            dst[2 * x + 1]             = (src[x + 0] * 3 + src[x + srcStride + 1]) >> 2;
589
0
            dst[2 * x + dstStride + 2] = (src[x + 0] + 3 * src[x + srcStride + 1]) >> 2;
590
0
            dst[2 * x + dstStride + 1] = (src[x + 1] + 3 * src[x + srcStride])     >> 2;
591
0
            dst[2 * x + 2]             = (src[x + 1] * 3 + src[x + srcStride])     >> 2;
592
0
        }
593
0
        dst[srcWidth * 2 - 1]             = (src[srcWidth - 1] * 3 + src[srcWidth - 1 + srcStride]) >> 2;
594
0
        dst[srcWidth * 2 - 1 + dstStride] = (src[srcWidth - 1] + 3 * src[srcWidth - 1 + srcStride]) >> 2;
595
596
0
        dst += dstStride * 2;
597
0
        src += srcStride;
598
0
    }
599
600
    // last line
601
0
    dst[0] = src[0];
602
603
0
    for (x = 0; x < srcWidth - 1; x++) {
604
0
        dst[2 * x + 1] = (src[x] * 3 + src[x + 1]) >> 2;
605
0
        dst[2 * x + 2] = (src[x] + 3 * src[x + 1]) >> 2;
606
0
    }
607
0
    dst[2 * srcWidth - 1] = src[srcWidth - 1];
608
0
}
609
610
/**
611
 * Height should be a multiple of 2 and width should be a multiple of 16.
612
 * (If this is a problem for anyone then tell me, and I will fix it.)
613
 * Chrominance data is only taken from every second line, others are ignored.
614
 * FIXME: Write HQ version.
615
 */
616
static inline void uyvytoyv12_c(const uint8_t *src, uint8_t *ydst,
617
                                uint8_t *udst, uint8_t *vdst,
618
                                int width, int height, int lumStride,
619
                                int chromStride, int srcStride)
620
0
{
621
0
    int y;
622
0
    const int chromWidth = width >> 1;
623
0
624
0
    for (y = 0; y < height; y += 2) {
625
0
        int i;
626
0
        for (i = 0; i < chromWidth; i++) {
627
0
            udst[i]         = src[4 * i + 0];
628
0
            ydst[2 * i + 0] = src[4 * i + 1];
629
0
            vdst[i]         = src[4 * i + 2];
630
0
            ydst[2 * i + 1] = src[4 * i + 3];
631
0
        }
632
0
        ydst += lumStride;
633
0
        src  += srcStride;
634
0
635
0
        for (i = 0; i < chromWidth; i++) {
636
0
            ydst[2 * i + 0] = src[4 * i + 1];
637
0
            ydst[2 * i + 1] = src[4 * i + 3];
638
0
        }
639
0
        udst += chromStride;
640
0
        vdst += chromStride;
641
0
        ydst += lumStride;
642
0
        src  += srcStride;
643
0
    }
644
0
}
645
646
/**
647
 * width should be a multiple of 2.
648
 * (If this is a problem for anyone then tell me, and I will fix it.)
649
 */
650
void ff_rgb24toyv12_c(const uint8_t *src, uint8_t *ydst, uint8_t *udst,
651
                   uint8_t *vdst, int width, int height, int lumStride,
652
                   int chromStride, int srcStride, const int32_t *rgb2yuv)
653
0
{
654
0
    int32_t ry = rgb2yuv[RY_IDX], gy = rgb2yuv[GY_IDX], by = rgb2yuv[BY_IDX];
655
0
    int32_t ru = rgb2yuv[RU_IDX], gu = rgb2yuv[GU_IDX], bu = rgb2yuv[BU_IDX];
656
0
    int32_t rv = rgb2yuv[RV_IDX], gv = rgb2yuv[GV_IDX], bv = rgb2yuv[BV_IDX];
657
0
    int y;
658
0
    const int chromWidth = width >> 1;
659
0
    const uint8_t *src1 = src;
660
0
    const uint8_t *src2 = src1 + srcStride;
661
0
    uint8_t *ydst1 = ydst;
662
0
    uint8_t *ydst2 = ydst + lumStride;
663
664
0
    for (y = 0; y < height; y += 2) {
665
0
        int i;
666
0
        if (y + 1 == height) {
667
0
            ydst2 = ydst1;
668
0
            src2  = src1;
669
0
        }
670
671
0
        for (i = 0; i < chromWidth; i++) {
672
0
            unsigned int b11 = src1[6 * i + 0];
673
0
            unsigned int g11 = src1[6 * i + 1];
674
0
            unsigned int r11 = src1[6 * i + 2];
675
0
            unsigned int b12 = src1[6 * i + 3];
676
0
            unsigned int g12 = src1[6 * i + 4];
677
0
            unsigned int r12 = src1[6 * i + 5];
678
0
            unsigned int b21 = src2[6 * i + 0];
679
0
            unsigned int g21 = src2[6 * i + 1];
680
0
            unsigned int r21 = src2[6 * i + 2];
681
0
            unsigned int b22 = src2[6 * i + 3];
682
0
            unsigned int g22 = src2[6 * i + 4];
683
0
            unsigned int r22 = src2[6 * i + 5];
684
685
0
            unsigned int Y11 = ((ry * r11 + gy * g11 + by * b11) >> RGB2YUV_SHIFT) + 16;
686
0
            unsigned int Y12 = ((ry * r12 + gy * g12 + by * b12) >> RGB2YUV_SHIFT) + 16;
687
0
            unsigned int Y21 = ((ry * r21 + gy * g21 + by * b21) >> RGB2YUV_SHIFT) + 16;
688
0
            unsigned int Y22 = ((ry * r22 + gy * g22 + by * b22) >> RGB2YUV_SHIFT) + 16;
689
690
0
            unsigned int bx = (b11 + b12 + b21 + b22) >> 2;
691
0
            unsigned int gx = (g11 + g12 + g21 + g22) >> 2;
692
0
            unsigned int rx = (r11 + r12 + r21 + r22) >> 2;
693
694
0
            unsigned int U  = ((ru * rx + gu * gx + bu * bx) >> RGB2YUV_SHIFT) + 128;
695
0
            unsigned int V  = ((rv * rx + gv * gx + bv * bx) >> RGB2YUV_SHIFT) + 128;
696
697
0
            ydst1[2 * i + 0] = Y11;
698
0
            ydst1[2 * i + 1] = Y12;
699
0
            ydst2[2 * i + 0] = Y21;
700
0
            ydst2[2 * i + 1] = Y22;
701
0
            udst[i]          = U;
702
0
            vdst[i]          = V;
703
0
        }
704
0
        src1  += srcStride * 2;
705
0
        src2  += srcStride * 2;
706
0
        ydst1 += lumStride * 2;
707
0
        ydst2 += lumStride * 2;
708
0
        udst  += chromStride;
709
0
        vdst  += chromStride;
710
0
    }
711
0
}
712
713
static void interleaveBytes_c(const uint8_t *src1, const uint8_t *src2,
714
                              uint8_t *dest, int width, int height,
715
                              int src1Stride, int src2Stride, int dstStride)
716
0
{
717
0
    int h;
718
719
0
    for (h = 0; h < height; h++) {
720
0
        int w;
721
0
        for (w = 0; w < width; w++) {
722
0
            dest[2 * w + 0] = src1[w];
723
0
            dest[2 * w + 1] = src2[w];
724
0
        }
725
0
        dest += dstStride;
726
0
        src1 += src1Stride;
727
0
        src2 += src2Stride;
728
0
    }
729
0
}
730
731
static void deinterleaveBytes_c(const uint8_t *src, uint8_t *dst1, uint8_t *dst2,
732
                                int width, int height, int srcStride,
733
                                int dst1Stride, int dst2Stride)
734
0
{
735
0
    int h;
736
737
0
    for (h = 0; h < height; h++) {
738
0
        int w;
739
0
        for (w = 0; w < width; w++) {
740
0
            dst1[w] = src[2 * w + 0];
741
0
            dst2[w] = src[2 * w + 1];
742
0
        }
743
0
        src  += srcStride;
744
0
        dst1 += dst1Stride;
745
0
        dst2 += dst2Stride;
746
0
    }
747
0
}
748
749
static inline void vu9_to_vu12_c(const uint8_t *src1, const uint8_t *src2,
750
                                 uint8_t *dst1, uint8_t *dst2,
751
                                 int width, int height,
752
                                 int srcStride1, int srcStride2,
753
                                 int dstStride1, int dstStride2)
754
0
{
755
0
    int x, y;
756
0
    int w = width  / 2;
757
0
    int h = height / 2;
758
759
0
    for (y = 0; y < h; y++) {
760
0
        const uint8_t *s1 = src1 + srcStride1 * (y >> 1);
761
0
        uint8_t *d        = dst1 + dstStride1 *  y;
762
0
        for (x = 0; x < w; x++)
763
0
            d[2 * x] = d[2 * x + 1] = s1[x];
764
0
    }
765
0
    for (y = 0; y < h; y++) {
766
0
        const uint8_t *s2 = src2 + srcStride2 * (y >> 1);
767
0
        uint8_t *d        = dst2 + dstStride2 *  y;
768
0
        for (x = 0; x < w; x++)
769
0
            d[2 * x] = d[2 * x + 1] = s2[x];
770
0
    }
771
0
}
772
773
static inline void yvu9_to_yuy2_c(const uint8_t *src1, const uint8_t *src2,
774
                                  const uint8_t *src3, uint8_t *dst,
775
                                  int width, int height,
776
                                  int srcStride1, int srcStride2,
777
                                  int srcStride3, int dstStride)
778
0
{
779
0
    int x, y;
780
0
    int w = width / 2;
781
0
    int h = height;
782
783
0
    for (y = 0; y < h; y++) {
784
0
        const uint8_t *yp = src1 + srcStride1 *  y;
785
0
        const uint8_t *up = src2 + srcStride2 * (y >> 2);
786
0
        const uint8_t *vp = src3 + srcStride3 * (y >> 2);
787
0
        uint8_t *d        = dst  + dstStride  *  y;
788
0
        for (x = 0; x < w; x++) {
789
0
            const int x2 = x << 2;
790
0
            d[8 * x + 0] = yp[x2];
791
0
            d[8 * x + 1] = up[x];
792
0
            d[8 * x + 2] = yp[x2 + 1];
793
0
            d[8 * x + 3] = vp[x];
794
0
            d[8 * x + 4] = yp[x2 + 2];
795
0
            d[8 * x + 5] = up[x];
796
0
            d[8 * x + 6] = yp[x2 + 3];
797
0
            d[8 * x + 7] = vp[x];
798
0
        }
799
0
    }
800
0
}
801
802
static void extract_even_c(const uint8_t *src, uint8_t *dst, int count)
803
0
{
804
0
    dst   +=  count;
805
0
    src   +=  count * 2;
806
0
    count  = -count;
807
0
    while (count < 0) {
808
0
        dst[count] = src[2 * count];
809
0
        count++;
810
0
    }
811
0
}
812
813
static void extract_even2_c(const uint8_t *src, uint8_t *dst0, uint8_t *dst1,
814
                            int count)
815
0
{
816
0
    dst0  +=  count;
817
0
    dst1  +=  count;
818
0
    src   +=  count * 4;
819
0
    count  = -count;
820
0
    while (count < 0) {
821
0
        dst0[count] = src[4 * count + 0];
822
0
        dst1[count] = src[4 * count + 2];
823
0
        count++;
824
0
    }
825
0
}
826
827
static void extract_even2avg_c(const uint8_t *src0, const uint8_t *src1,
828
                               uint8_t *dst0, uint8_t *dst1, int count)
829
0
{
830
0
    dst0  +=  count;
831
0
    dst1  +=  count;
832
0
    src0  +=  count * 4;
833
0
    src1  +=  count * 4;
834
0
    count  = -count;
835
0
    while (count < 0) {
836
0
        dst0[count] = (src0[4 * count + 0] + src1[4 * count + 0]) >> 1;
837
0
        dst1[count] = (src0[4 * count + 2] + src1[4 * count + 2]) >> 1;
838
0
        count++;
839
0
    }
840
0
}
841
842
static void extract_odd2_c(const uint8_t *src, uint8_t *dst0, uint8_t *dst1,
843
                           int count)
844
0
{
845
0
    dst0  +=  count;
846
0
    dst1  +=  count;
847
0
    src   +=  count * 4;
848
0
    count  = -count;
849
0
    src++;
850
0
    while (count < 0) {
851
0
        dst0[count] = src[4 * count + 0];
852
0
        dst1[count] = src[4 * count + 2];
853
0
        count++;
854
0
    }
855
0
}
856
857
static void extract_odd2avg_c(const uint8_t *src0, const uint8_t *src1,
858
                              uint8_t *dst0, uint8_t *dst1, int count)
859
0
{
860
0
    dst0  +=  count;
861
0
    dst1  +=  count;
862
0
    src0  +=  count * 4;
863
0
    src1  +=  count * 4;
864
0
    count  = -count;
865
0
    src0++;
866
0
    src1++;
867
0
    while (count < 0) {
868
0
        dst0[count] = (src0[4 * count + 0] + src1[4 * count + 0]) >> 1;
869
0
        dst1[count] = (src0[4 * count + 2] + src1[4 * count + 2]) >> 1;
870
0
        count++;
871
0
    }
872
0
}
873
874
static void yuyvtoyuv420_c(uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
875
                           const uint8_t *src, int width, int height,
876
                           int lumStride, int chromStride, int srcStride)
877
0
{
878
0
    int y;
879
0
    const int chromWidth = AV_CEIL_RSHIFT(width, 1);
880
881
0
    for (y = 0; y < height; y++) {
882
0
        extract_even_c(src, ydst, width);
883
0
        if (y & 1) {
884
0
            extract_odd2avg_c(src - srcStride, src, udst, vdst, chromWidth);
885
0
            udst += chromStride;
886
0
            vdst += chromStride;
887
0
        }
888
889
0
        src  += srcStride;
890
0
        ydst += lumStride;
891
0
    }
892
0
}
893
894
static void yuyvtoyuv422_c(uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
895
                           const uint8_t *src, int width, int height,
896
                           int lumStride, int chromStride, int srcStride)
897
0
{
898
0
    int y;
899
0
    const int chromWidth = AV_CEIL_RSHIFT(width, 1);
900
901
0
    for (y = 0; y < height; y++) {
902
0
        extract_even_c(src, ydst, width);
903
0
        extract_odd2_c(src, udst, vdst, chromWidth);
904
905
0
        src  += srcStride;
906
0
        ydst += lumStride;
907
0
        udst += chromStride;
908
0
        vdst += chromStride;
909
0
    }
910
0
}
911
912
static void uyvytoyuv420_c(uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
913
                           const uint8_t *src, int width, int height,
914
                           int lumStride, int chromStride, int srcStride)
915
0
{
916
0
    int y;
917
0
    const int chromWidth = AV_CEIL_RSHIFT(width, 1);
918
919
0
    for (y = 0; y < height; y++) {
920
0
        extract_even_c(src + 1, ydst, width);
921
0
        if (y & 1) {
922
0
            extract_even2avg_c(src - srcStride, src, udst, vdst, chromWidth);
923
0
            udst += chromStride;
924
0
            vdst += chromStride;
925
0
        }
926
927
0
        src  += srcStride;
928
0
        ydst += lumStride;
929
0
    }
930
0
}
931
932
static void uyvytoyuv422_c(uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
933
                           const uint8_t *src, int width, int height,
934
                           int lumStride, int chromStride, int srcStride)
935
0
{
936
0
    int y;
937
0
    const int chromWidth = AV_CEIL_RSHIFT(width, 1);
938
939
0
    for (y = 0; y < height; y++) {
940
0
        extract_even_c(src + 1, ydst, width);
941
0
        extract_even2_c(src, udst, vdst, chromWidth);
942
943
0
        src  += srcStride;
944
0
        ydst += lumStride;
945
0
        udst += chromStride;
946
0
        vdst += chromStride;
947
0
    }
948
0
}
949
950
static av_cold void rgb2rgb_init_c(void)
951
0
{
952
0
    rgb15to16          = rgb15to16_c;
953
0
    rgb15tobgr24       = rgb15tobgr24_c;
954
0
    rgb15to32          = rgb15to32_c;
955
0
    rgb16tobgr24       = rgb16tobgr24_c;
956
0
    rgb16to32          = rgb16to32_c;
957
0
    rgb16to15          = rgb16to15_c;
958
0
    rgb24tobgr16       = rgb24tobgr16_c;
959
0
    rgb24tobgr15       = rgb24tobgr15_c;
960
0
    rgb24tobgr32       = rgb24tobgr32_c;
961
0
    rgb32to16          = rgb32to16_c;
962
0
    rgb32to15          = rgb32to15_c;
963
0
    rgb32tobgr24       = rgb32tobgr24_c;
964
0
    rgb24to15          = rgb24to15_c;
965
0
    rgb24to16          = rgb24to16_c;
966
0
    rgb24tobgr24       = rgb24tobgr24_c;
967
#if HAVE_BIGENDIAN
968
    shuffle_bytes_0321 = shuffle_bytes_2103_c;
969
    shuffle_bytes_2103 = shuffle_bytes_0321_c;
970
#else
971
0
    shuffle_bytes_0321 = shuffle_bytes_0321_c;
972
0
    shuffle_bytes_2103 = shuffle_bytes_2103_c;
973
0
#endif
974
0
    shuffle_bytes_1230 = shuffle_bytes_1230_c;
975
0
    shuffle_bytes_3012 = shuffle_bytes_3012_c;
976
0
    shuffle_bytes_3210 = shuffle_bytes_3210_c;
977
0
    shuffle_bytes_3102 = shuffle_bytes_3102_c;
978
0
    shuffle_bytes_2013 = shuffle_bytes_2013_c;
979
0
    shuffle_bytes_2130 = shuffle_bytes_2130_c;
980
0
    shuffle_bytes_1203 = shuffle_bytes_1203_c;
981
0
    rgb32tobgr16       = rgb32tobgr16_c;
982
0
    rgb32tobgr15       = rgb32tobgr15_c;
983
0
    yv12toyuy2         = yv12toyuy2_c;
984
0
    yv12touyvy         = yv12touyvy_c;
985
0
    yuv422ptoyuy2      = yuv422ptoyuy2_c;
986
0
    yuv422ptouyvy      = yuv422ptouyvy_c;
987
0
    yuy2toyv12         = yuy2toyv12_c;
988
0
    planar2x           = planar2x_c;
989
0
    ff_rgb24toyv12     = ff_rgb24toyv12_c;
990
0
    interleaveBytes    = interleaveBytes_c;
991
0
    deinterleaveBytes  = deinterleaveBytes_c;
992
0
    vu9_to_vu12        = vu9_to_vu12_c;
993
0
    yvu9_to_yuy2       = yvu9_to_yuy2_c;
994
995
0
    uyvytoyuv420       = uyvytoyuv420_c;
996
0
    uyvytoyuv422       = uyvytoyuv422_c;
997
0
    yuyvtoyuv420       = yuyvtoyuv420_c;
998
0
    yuyvtoyuv422       = yuyvtoyuv422_c;
999
0
}