/src/ffmpeg/libavcodec/qpeldsp.c
Line | Count | Source |
1 | | /* |
2 | | * quarterpel DSP functions |
3 | | * Copyright (c) 2000, 2001 Fabrice Bellard |
4 | | * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at> |
5 | | * |
6 | | * This file is part of FFmpeg. |
7 | | * |
8 | | * FFmpeg is free software; you can redistribute it and/or |
9 | | * modify it under the terms of the GNU Lesser General Public |
10 | | * License as published by the Free Software Foundation; either |
11 | | * version 2.1 of the License, or (at your option) any later version. |
12 | | * |
13 | | * FFmpeg is distributed in the hope that it will be useful, |
14 | | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
15 | | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
16 | | * Lesser General Public License for more details. |
17 | | * |
18 | | * You should have received a copy of the GNU Lesser General Public |
19 | | * License along with FFmpeg; if not, write to the Free Software |
20 | | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
21 | | */ |
22 | | |
23 | | /** |
24 | | * @file |
25 | | * quarterpel DSP functions |
26 | | */ |
27 | | |
28 | | #include <stddef.h> |
29 | | #include <stdint.h> |
30 | | |
31 | | #include "config.h" |
32 | | #include "config_components.h" |
33 | | #include "libavutil/attributes.h" |
34 | | #include "copy_block.h" |
35 | | #include "qpeldsp.h" |
36 | | #include "diracdsp.h" |
37 | | |
38 | | #define BIT_DEPTH 8 |
39 | | #include "hpel_template.c" |
40 | | #include "pel_template.c" |
41 | | #include "qpel_template.c" |
42 | | |
43 | | #define QPEL_MC(r, OPNAME, RND, OP) \ |
44 | | static void OPNAME ## mpeg4_qpel8_h_lowpass(uint8_t *dst, const uint8_t *src, \ |
45 | | int dstStride, int srcStride, \ |
46 | 229k | int h) \ |
47 | 229k | { \ |
48 | 229k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ |
49 | 229k | int i; \ |
50 | 229k | \ |
51 | 2.22M | for (i = 0; i < h; i++) { \ |
52 | 1.99M | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ |
53 | 1.99M | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ |
54 | 1.99M | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ |
55 | 1.99M | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ |
56 | 1.99M | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ |
57 | 1.99M | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[8])); \ |
58 | 1.99M | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[8]) * 3 - (src[3] + src[7])); \ |
59 | 1.99M | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[8]) * 6 + (src[5] + src[7]) * 3 - (src[4] + src[6])); \ |
60 | 1.99M | dst += dstStride; \ |
61 | 1.99M | src += srcStride; \ |
62 | 1.99M | } \ |
63 | 229k | } \ qpeldsp.c:put_mpeg4_qpel8_h_lowpass Line | Count | Source | 46 | 188k | int h) \ | 47 | 188k | { \ | 48 | 188k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 49 | 188k | int i; \ | 50 | 188k | \ | 51 | 1.82M | for (i = 0; i < h; i++) { \ | 52 | 1.63M | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ | 53 | 1.63M | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ | 54 | 1.63M | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ | 55 | 1.63M | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ | 56 | 1.63M | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ | 57 | 1.63M | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[8])); \ | 58 | 1.63M | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[8]) * 3 - (src[3] + src[7])); \ | 59 | 1.63M | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[8]) * 6 + (src[5] + src[7]) * 3 - (src[4] + src[6])); \ | 60 | 1.63M | dst += dstStride; \ | 61 | 1.63M | src += srcStride; \ | 62 | 1.63M | } \ | 63 | 188k | } \ |
qpeldsp.c:put_no_rnd_mpeg4_qpel8_h_lowpass Line | Count | Source | 46 | 34.7k | int h) \ | 47 | 34.7k | { \ | 48 | 34.7k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 49 | 34.7k | int i; \ | 50 | 34.7k | \ | 51 | 337k | for (i = 0; i < h; i++) { \ | 52 | 303k | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ | 53 | 303k | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ | 54 | 303k | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ | 55 | 303k | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ | 56 | 303k | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ | 57 | 303k | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[8])); \ | 58 | 303k | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[8]) * 3 - (src[3] + src[7])); \ | 59 | 303k | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[8]) * 6 + (src[5] + src[7]) * 3 - (src[4] + src[6])); \ | 60 | 303k | dst += dstStride; \ | 61 | 303k | src += srcStride; \ | 62 | 303k | } \ | 63 | 34.7k | } \ |
qpeldsp.c:avg_mpeg4_qpel8_h_lowpass Line | Count | Source | 46 | 6.53k | int h) \ | 47 | 6.53k | { \ | 48 | 6.53k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 49 | 6.53k | int i; \ | 50 | 6.53k | \ | 51 | 58.8k | for (i = 0; i < h; i++) { \ | 52 | 52.3k | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ | 53 | 52.3k | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ | 54 | 52.3k | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ | 55 | 52.3k | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ | 56 | 52.3k | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ | 57 | 52.3k | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[8])); \ | 58 | 52.3k | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[8]) * 3 - (src[3] + src[7])); \ | 59 | 52.3k | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[8]) * 6 + (src[5] + src[7]) * 3 - (src[4] + src[6])); \ | 60 | 52.3k | dst += dstStride; \ | 61 | 52.3k | src += srcStride; \ | 62 | 52.3k | } \ | 63 | 6.53k | } \ |
|
64 | | \ |
65 | | static void OPNAME ## mpeg4_qpel8_v_lowpass(uint8_t *dst, const uint8_t *src, \ |
66 | 271k | int dstStride, int srcStride) \ |
67 | 271k | { \ |
68 | 271k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ |
69 | 271k | const int w = 8; \ |
70 | 271k | int i; \ |
71 | 271k | \ |
72 | 2.44M | for (i = 0; i < w; i++) { \ |
73 | 2.16M | const int src0 = src[0 * srcStride]; \ |
74 | 2.16M | const int src1 = src[1 * srcStride]; \ |
75 | 2.16M | const int src2 = src[2 * srcStride]; \ |
76 | 2.16M | const int src3 = src[3 * srcStride]; \ |
77 | 2.16M | const int src4 = src[4 * srcStride]; \ |
78 | 2.16M | const int src5 = src[5 * srcStride]; \ |
79 | 2.16M | const int src6 = src[6 * srcStride]; \ |
80 | 2.16M | const int src7 = src[7 * srcStride]; \ |
81 | 2.16M | const int src8 = src[8 * srcStride]; \ |
82 | 2.16M | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ |
83 | 2.16M | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ |
84 | 2.16M | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ |
85 | 2.16M | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ |
86 | 2.16M | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ |
87 | 2.16M | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src8)); \ |
88 | 2.16M | OP(dst[6 * dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src8) * 3 - (src3 + src7)); \ |
89 | 2.16M | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src8) * 6 + (src5 + src7) * 3 - (src4 + src6)); \ |
90 | 2.16M | dst++; \ |
91 | 2.16M | src++; \ |
92 | 2.16M | } \ |
93 | 271k | } \ qpeldsp.c:put_mpeg4_qpel8_v_lowpass Line | Count | Source | 66 | 208k | int dstStride, int srcStride) \ | 67 | 208k | { \ | 68 | 208k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 69 | 208k | const int w = 8; \ | 70 | 208k | int i; \ | 71 | 208k | \ | 72 | 1.87M | for (i = 0; i < w; i++) { \ | 73 | 1.66M | const int src0 = src[0 * srcStride]; \ | 74 | 1.66M | const int src1 = src[1 * srcStride]; \ | 75 | 1.66M | const int src2 = src[2 * srcStride]; \ | 76 | 1.66M | const int src3 = src[3 * srcStride]; \ | 77 | 1.66M | const int src4 = src[4 * srcStride]; \ | 78 | 1.66M | const int src5 = src[5 * srcStride]; \ | 79 | 1.66M | const int src6 = src[6 * srcStride]; \ | 80 | 1.66M | const int src7 = src[7 * srcStride]; \ | 81 | 1.66M | const int src8 = src[8 * srcStride]; \ | 82 | 1.66M | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ | 83 | 1.66M | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ | 84 | 1.66M | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ | 85 | 1.66M | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ | 86 | 1.66M | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ | 87 | 1.66M | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src8)); \ | 88 | 1.66M | OP(dst[6 * dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src8) * 3 - (src3 + src7)); \ | 89 | 1.66M | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src8) * 6 + (src5 + src7) * 3 - (src4 + src6)); \ | 90 | 1.66M | dst++; \ | 91 | 1.66M | src++; \ | 92 | 1.66M | } \ | 93 | 208k | } \ |
qpeldsp.c:put_no_rnd_mpeg4_qpel8_v_lowpass Line | Count | Source | 66 | 42.7k | int dstStride, int srcStride) \ | 67 | 42.7k | { \ | 68 | 42.7k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 69 | 42.7k | const int w = 8; \ | 70 | 42.7k | int i; \ | 71 | 42.7k | \ | 72 | 385k | for (i = 0; i < w; i++) { \ | 73 | 342k | const int src0 = src[0 * srcStride]; \ | 74 | 342k | const int src1 = src[1 * srcStride]; \ | 75 | 342k | const int src2 = src[2 * srcStride]; \ | 76 | 342k | const int src3 = src[3 * srcStride]; \ | 77 | 342k | const int src4 = src[4 * srcStride]; \ | 78 | 342k | const int src5 = src[5 * srcStride]; \ | 79 | 342k | const int src6 = src[6 * srcStride]; \ | 80 | 342k | const int src7 = src[7 * srcStride]; \ | 81 | 342k | const int src8 = src[8 * srcStride]; \ | 82 | 342k | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ | 83 | 342k | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ | 84 | 342k | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ | 85 | 342k | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ | 86 | 342k | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ | 87 | 342k | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src8)); \ | 88 | 342k | OP(dst[6 * dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src8) * 3 - (src3 + src7)); \ | 89 | 342k | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src8) * 6 + (src5 + src7) * 3 - (src4 + src6)); \ | 90 | 342k | dst++; \ | 91 | 342k | src++; \ | 92 | 342k | } \ | 93 | 42.7k | } \ |
qpeldsp.c:avg_mpeg4_qpel8_v_lowpass Line | Count | Source | 66 | 19.7k | int dstStride, int srcStride) \ | 67 | 19.7k | { \ | 68 | 19.7k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 69 | 19.7k | const int w = 8; \ | 70 | 19.7k | int i; \ | 71 | 19.7k | \ | 72 | 178k | for (i = 0; i < w; i++) { \ | 73 | 158k | const int src0 = src[0 * srcStride]; \ | 74 | 158k | const int src1 = src[1 * srcStride]; \ | 75 | 158k | const int src2 = src[2 * srcStride]; \ | 76 | 158k | const int src3 = src[3 * srcStride]; \ | 77 | 158k | const int src4 = src[4 * srcStride]; \ | 78 | 158k | const int src5 = src[5 * srcStride]; \ | 79 | 158k | const int src6 = src[6 * srcStride]; \ | 80 | 158k | const int src7 = src[7 * srcStride]; \ | 81 | 158k | const int src8 = src[8 * srcStride]; \ | 82 | 158k | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ | 83 | 158k | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ | 84 | 158k | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ | 85 | 158k | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ | 86 | 158k | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ | 87 | 158k | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src8)); \ | 88 | 158k | OP(dst[6 * dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src8) * 3 - (src3 + src7)); \ | 89 | 158k | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src8) * 6 + (src5 + src7) * 3 - (src4 + src6)); \ | 90 | 158k | dst++; \ | 91 | 158k | src++; \ | 92 | 158k | } \ | 93 | 19.7k | } \ |
|
94 | | \ |
95 | | static void OPNAME ## mpeg4_qpel16_h_lowpass(uint8_t *dst, \ |
96 | | const uint8_t *src, \ |
97 | | int dstStride, int srcStride, \ |
98 | 2.87M | int h) \ |
99 | 2.87M | { \ |
100 | 2.87M | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ |
101 | 2.87M | int i; \ |
102 | 2.87M | \ |
103 | 50.9M | for (i = 0; i < h; i++) { \ |
104 | 48.1M | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ |
105 | 48.1M | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ |
106 | 48.1M | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ |
107 | 48.1M | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ |
108 | 48.1M | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ |
109 | 48.1M | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[9])); \ |
110 | 48.1M | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[9]) * 3 - (src[3] + src[10])); \ |
111 | 48.1M | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[9]) * 6 + (src[5] + src[10]) * 3 - (src[4] + src[11])); \ |
112 | 48.1M | OP(dst[8], (src[8] + src[9]) * 20 - (src[7] + src[10]) * 6 + (src[6] + src[11]) * 3 - (src[5] + src[12])); \ |
113 | 48.1M | OP(dst[9], (src[9] + src[10]) * 20 - (src[8] + src[11]) * 6 + (src[7] + src[12]) * 3 - (src[6] + src[13])); \ |
114 | 48.1M | OP(dst[10], (src[10] + src[11]) * 20 - (src[9] + src[12]) * 6 + (src[8] + src[13]) * 3 - (src[7] + src[14])); \ |
115 | 48.1M | OP(dst[11], (src[11] + src[12]) * 20 - (src[10] + src[13]) * 6 + (src[9] + src[14]) * 3 - (src[8] + src[15])); \ |
116 | 48.1M | OP(dst[12], (src[12] + src[13]) * 20 - (src[11] + src[14]) * 6 + (src[10] + src[15]) * 3 - (src[9] + src[16])); \ |
117 | 48.1M | OP(dst[13], (src[13] + src[14]) * 20 - (src[12] + src[15]) * 6 + (src[11] + src[16]) * 3 - (src[10] + src[16])); \ |
118 | 48.1M | OP(dst[14], (src[14] + src[15]) * 20 - (src[13] + src[16]) * 6 + (src[12] + src[16]) * 3 - (src[11] + src[15])); \ |
119 | 48.1M | OP(dst[15], (src[15] + src[16]) * 20 - (src[14] + src[16]) * 6 + (src[13] + src[15]) * 3 - (src[12] + src[14])); \ |
120 | 48.1M | dst += dstStride; \ |
121 | 48.1M | src += srcStride; \ |
122 | 48.1M | } \ |
123 | 2.87M | } \ qpeldsp.c:put_mpeg4_qpel16_h_lowpass Line | Count | Source | 98 | 2.64M | int h) \ | 99 | 2.64M | { \ | 100 | 2.64M | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 101 | 2.64M | int i; \ | 102 | 2.64M | \ | 103 | 46.7M | for (i = 0; i < h; i++) { \ | 104 | 44.1M | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ | 105 | 44.1M | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ | 106 | 44.1M | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ | 107 | 44.1M | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ | 108 | 44.1M | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ | 109 | 44.1M | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[9])); \ | 110 | 44.1M | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[9]) * 3 - (src[3] + src[10])); \ | 111 | 44.1M | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[9]) * 6 + (src[5] + src[10]) * 3 - (src[4] + src[11])); \ | 112 | 44.1M | OP(dst[8], (src[8] + src[9]) * 20 - (src[7] + src[10]) * 6 + (src[6] + src[11]) * 3 - (src[5] + src[12])); \ | 113 | 44.1M | OP(dst[9], (src[9] + src[10]) * 20 - (src[8] + src[11]) * 6 + (src[7] + src[12]) * 3 - (src[6] + src[13])); \ | 114 | 44.1M | OP(dst[10], (src[10] + src[11]) * 20 - (src[9] + src[12]) * 6 + (src[8] + src[13]) * 3 - (src[7] + src[14])); \ | 115 | 44.1M | OP(dst[11], (src[11] + src[12]) * 20 - (src[10] + src[13]) * 6 + (src[9] + src[14]) * 3 - (src[8] + src[15])); \ | 116 | 44.1M | OP(dst[12], (src[12] + src[13]) * 20 - (src[11] + src[14]) * 6 + (src[10] + src[15]) * 3 - (src[9] + src[16])); \ | 117 | 44.1M | OP(dst[13], (src[13] + src[14]) * 20 - (src[12] + src[15]) * 6 + (src[11] + src[16]) * 3 - 
(src[10] + src[16])); \ | 118 | 44.1M | OP(dst[14], (src[14] + src[15]) * 20 - (src[13] + src[16]) * 6 + (src[12] + src[16]) * 3 - (src[11] + src[15])); \ | 119 | 44.1M | OP(dst[15], (src[15] + src[16]) * 20 - (src[14] + src[16]) * 6 + (src[13] + src[15]) * 3 - (src[12] + src[14])); \ | 120 | 44.1M | dst += dstStride; \ | 121 | 44.1M | src += srcStride; \ | 122 | 44.1M | } \ | 123 | 2.64M | } \ |
qpeldsp.c:put_no_rnd_mpeg4_qpel16_h_lowpass Line | Count | Source | 98 | 232k | int h) \ | 99 | 232k | { \ | 100 | 232k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 101 | 232k | int i; \ | 102 | 232k | \ | 103 | 4.13M | for (i = 0; i < h; i++) { \ | 104 | 3.89M | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ | 105 | 3.89M | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ | 106 | 3.89M | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ | 107 | 3.89M | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ | 108 | 3.89M | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ | 109 | 3.89M | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[9])); \ | 110 | 3.89M | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[9]) * 3 - (src[3] + src[10])); \ | 111 | 3.89M | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[9]) * 6 + (src[5] + src[10]) * 3 - (src[4] + src[11])); \ | 112 | 3.89M | OP(dst[8], (src[8] + src[9]) * 20 - (src[7] + src[10]) * 6 + (src[6] + src[11]) * 3 - (src[5] + src[12])); \ | 113 | 3.89M | OP(dst[9], (src[9] + src[10]) * 20 - (src[8] + src[11]) * 6 + (src[7] + src[12]) * 3 - (src[6] + src[13])); \ | 114 | 3.89M | OP(dst[10], (src[10] + src[11]) * 20 - (src[9] + src[12]) * 6 + (src[8] + src[13]) * 3 - (src[7] + src[14])); \ | 115 | 3.89M | OP(dst[11], (src[11] + src[12]) * 20 - (src[10] + src[13]) * 6 + (src[9] + src[14]) * 3 - (src[8] + src[15])); \ | 116 | 3.89M | OP(dst[12], (src[12] + src[13]) * 20 - (src[11] + src[14]) * 6 + (src[10] + src[15]) * 3 - (src[9] + src[16])); \ | 117 | 3.89M | OP(dst[13], (src[13] + src[14]) * 20 - (src[12] + src[15]) * 6 + (src[11] + src[16]) * 3 - (src[10] + 
src[16])); \ | 118 | 3.89M | OP(dst[14], (src[14] + src[15]) * 20 - (src[13] + src[16]) * 6 + (src[12] + src[16]) * 3 - (src[11] + src[15])); \ | 119 | 3.89M | OP(dst[15], (src[15] + src[16]) * 20 - (src[14] + src[16]) * 6 + (src[13] + src[15]) * 3 - (src[12] + src[14])); \ | 120 | 3.89M | dst += dstStride; \ | 121 | 3.89M | src += srcStride; \ | 122 | 3.89M | } \ | 123 | 232k | } \ |
qpeldsp.c:avg_mpeg4_qpel16_h_lowpass Line | Count | Source | 98 | 3.88k | int h) \ | 99 | 3.88k | { \ | 100 | 3.88k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 101 | 3.88k | int i; \ | 102 | 3.88k | \ | 103 | 66.1k | for (i = 0; i < h; i++) { \ | 104 | 62.2k | OP(dst[0], (src[0] + src[1]) * 20 - (src[0] + src[2]) * 6 + (src[1] + src[3]) * 3 - (src[2] + src[4])); \ | 105 | 62.2k | OP(dst[1], (src[1] + src[2]) * 20 - (src[0] + src[3]) * 6 + (src[0] + src[4]) * 3 - (src[1] + src[5])); \ | 106 | 62.2k | OP(dst[2], (src[2] + src[3]) * 20 - (src[1] + src[4]) * 6 + (src[0] + src[5]) * 3 - (src[0] + src[6])); \ | 107 | 62.2k | OP(dst[3], (src[3] + src[4]) * 20 - (src[2] + src[5]) * 6 + (src[1] + src[6]) * 3 - (src[0] + src[7])); \ | 108 | 62.2k | OP(dst[4], (src[4] + src[5]) * 20 - (src[3] + src[6]) * 6 + (src[2] + src[7]) * 3 - (src[1] + src[8])); \ | 109 | 62.2k | OP(dst[5], (src[5] + src[6]) * 20 - (src[4] + src[7]) * 6 + (src[3] + src[8]) * 3 - (src[2] + src[9])); \ | 110 | 62.2k | OP(dst[6], (src[6] + src[7]) * 20 - (src[5] + src[8]) * 6 + (src[4] + src[9]) * 3 - (src[3] + src[10])); \ | 111 | 62.2k | OP(dst[7], (src[7] + src[8]) * 20 - (src[6] + src[9]) * 6 + (src[5] + src[10]) * 3 - (src[4] + src[11])); \ | 112 | 62.2k | OP(dst[8], (src[8] + src[9]) * 20 - (src[7] + src[10]) * 6 + (src[6] + src[11]) * 3 - (src[5] + src[12])); \ | 113 | 62.2k | OP(dst[9], (src[9] + src[10]) * 20 - (src[8] + src[11]) * 6 + (src[7] + src[12]) * 3 - (src[6] + src[13])); \ | 114 | 62.2k | OP(dst[10], (src[10] + src[11]) * 20 - (src[9] + src[12]) * 6 + (src[8] + src[13]) * 3 - (src[7] + src[14])); \ | 115 | 62.2k | OP(dst[11], (src[11] + src[12]) * 20 - (src[10] + src[13]) * 6 + (src[9] + src[14]) * 3 - (src[8] + src[15])); \ | 116 | 62.2k | OP(dst[12], (src[12] + src[13]) * 20 - (src[11] + src[14]) * 6 + (src[10] + src[15]) * 3 - (src[9] + src[16])); \ | 117 | 62.2k | OP(dst[13], (src[13] + src[14]) * 20 - (src[12] + src[15]) * 6 + (src[11] + src[16]) * 3 - (src[10] + 
src[16])); \ | 118 | 62.2k | OP(dst[14], (src[14] + src[15]) * 20 - (src[13] + src[16]) * 6 + (src[12] + src[16]) * 3 - (src[11] + src[15])); \ | 119 | 62.2k | OP(dst[15], (src[15] + src[16]) * 20 - (src[14] + src[16]) * 6 + (src[13] + src[15]) * 3 - (src[12] + src[14])); \ | 120 | 62.2k | dst += dstStride; \ | 121 | 62.2k | src += srcStride; \ | 122 | 62.2k | } \ | 123 | 3.88k | } \ |
|
124 | | \ |
125 | | static void OPNAME ## mpeg4_qpel16_v_lowpass(uint8_t *dst, \ |
126 | | const uint8_t *src, \ |
127 | 2.85M | int dstStride, int srcStride) \ |
128 | 2.85M | { \ |
129 | 2.85M | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ |
130 | 2.85M | const int w = 16; \ |
131 | 2.85M | int i; \ |
132 | 2.85M | \ |
133 | 48.5M | for (i = 0; i < w; i++) { \ |
134 | 45.6M | const int src0 = src[0 * srcStride]; \ |
135 | 45.6M | const int src1 = src[1 * srcStride]; \ |
136 | 45.6M | const int src2 = src[2 * srcStride]; \ |
137 | 45.6M | const int src3 = src[3 * srcStride]; \ |
138 | 45.6M | const int src4 = src[4 * srcStride]; \ |
139 | 45.6M | const int src5 = src[5 * srcStride]; \ |
140 | 45.6M | const int src6 = src[6 * srcStride]; \ |
141 | 45.6M | const int src7 = src[7 * srcStride]; \ |
142 | 45.6M | const int src8 = src[8 * srcStride]; \ |
143 | 45.6M | const int src9 = src[9 * srcStride]; \ |
144 | 45.6M | const int src10 = src[10 * srcStride]; \ |
145 | 45.6M | const int src11 = src[11 * srcStride]; \ |
146 | 45.6M | const int src12 = src[12 * srcStride]; \ |
147 | 45.6M | const int src13 = src[13 * srcStride]; \ |
148 | 45.6M | const int src14 = src[14 * srcStride]; \ |
149 | 45.6M | const int src15 = src[15 * srcStride]; \ |
150 | 45.6M | const int src16 = src[16 * srcStride]; \ |
151 | 45.6M | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ |
152 | 45.6M | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ |
153 | 45.6M | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ |
154 | 45.6M | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ |
155 | 45.6M | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ |
156 | 45.6M | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src9)); \ |
157 | 45.6M | OP(dst[6 * dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src9) * 3 - (src3 + src10)); \ |
158 | 45.6M | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src9) * 6 + (src5 + src10) * 3 - (src4 + src11)); \ |
159 | 45.6M | OP(dst[8 * dstStride], (src8 + src9) * 20 - (src7 + src10) * 6 + (src6 + src11) * 3 - (src5 + src12)); \ |
160 | 45.6M | OP(dst[9 * dstStride], (src9 + src10) * 20 - (src8 + src11) * 6 + (src7 + src12) * 3 - (src6 + src13)); \ |
161 | 45.6M | OP(dst[10 * dstStride], (src10 + src11) * 20 - (src9 + src12) * 6 + (src8 + src13) * 3 - (src7 + src14)); \ |
162 | 45.6M | OP(dst[11 * dstStride], (src11 + src12) * 20 - (src10 + src13) * 6 + (src9 + src14) * 3 - (src8 + src15)); \ |
163 | 45.6M | OP(dst[12 * dstStride], (src12 + src13) * 20 - (src11 + src14) * 6 + (src10 + src15) * 3 - (src9 + src16)); \ |
164 | 45.6M | OP(dst[13 * dstStride], (src13 + src14) * 20 - (src12 + src15) * 6 + (src11 + src16) * 3 - (src10 + src16)); \ |
165 | 45.6M | OP(dst[14 * dstStride], (src14 + src15) * 20 - (src13 + src16) * 6 + (src12 + src16) * 3 - (src11 + src15)); \ |
166 | 45.6M | OP(dst[15 * dstStride], (src15 + src16) * 20 - (src14 + src16) * 6 + (src13 + src15) * 3 - (src12 + src14)); \ |
167 | 45.6M | dst++; \ |
168 | 45.6M | src++; \ |
169 | 45.6M | } \ |
170 | 2.85M | } \ qpeldsp.c:put_mpeg4_qpel16_v_lowpass Line | Count | Source | 127 | 2.58M | int dstStride, int srcStride) \ | 128 | 2.58M | { \ | 129 | 2.58M | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 130 | 2.58M | const int w = 16; \ | 131 | 2.58M | int i; \ | 132 | 2.58M | \ | 133 | 43.9M | for (i = 0; i < w; i++) { \ | 134 | 41.3M | const int src0 = src[0 * srcStride]; \ | 135 | 41.3M | const int src1 = src[1 * srcStride]; \ | 136 | 41.3M | const int src2 = src[2 * srcStride]; \ | 137 | 41.3M | const int src3 = src[3 * srcStride]; \ | 138 | 41.3M | const int src4 = src[4 * srcStride]; \ | 139 | 41.3M | const int src5 = src[5 * srcStride]; \ | 140 | 41.3M | const int src6 = src[6 * srcStride]; \ | 141 | 41.3M | const int src7 = src[7 * srcStride]; \ | 142 | 41.3M | const int src8 = src[8 * srcStride]; \ | 143 | 41.3M | const int src9 = src[9 * srcStride]; \ | 144 | 41.3M | const int src10 = src[10 * srcStride]; \ | 145 | 41.3M | const int src11 = src[11 * srcStride]; \ | 146 | 41.3M | const int src12 = src[12 * srcStride]; \ | 147 | 41.3M | const int src13 = src[13 * srcStride]; \ | 148 | 41.3M | const int src14 = src[14 * srcStride]; \ | 149 | 41.3M | const int src15 = src[15 * srcStride]; \ | 150 | 41.3M | const int src16 = src[16 * srcStride]; \ | 151 | 41.3M | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ | 152 | 41.3M | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ | 153 | 41.3M | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ | 154 | 41.3M | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ | 155 | 41.3M | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ | 156 | 41.3M | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src9)); \ | 157 | 
41.3M | OP(dst[6 * dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src9) * 3 - (src3 + src10)); \ | 158 | 41.3M | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src9) * 6 + (src5 + src10) * 3 - (src4 + src11)); \ | 159 | 41.3M | OP(dst[8 * dstStride], (src8 + src9) * 20 - (src7 + src10) * 6 + (src6 + src11) * 3 - (src5 + src12)); \ | 160 | 41.3M | OP(dst[9 * dstStride], (src9 + src10) * 20 - (src8 + src11) * 6 + (src7 + src12) * 3 - (src6 + src13)); \ | 161 | 41.3M | OP(dst[10 * dstStride], (src10 + src11) * 20 - (src9 + src12) * 6 + (src8 + src13) * 3 - (src7 + src14)); \ | 162 | 41.3M | OP(dst[11 * dstStride], (src11 + src12) * 20 - (src10 + src13) * 6 + (src9 + src14) * 3 - (src8 + src15)); \ | 163 | 41.3M | OP(dst[12 * dstStride], (src12 + src13) * 20 - (src11 + src14) * 6 + (src10 + src15) * 3 - (src9 + src16)); \ | 164 | 41.3M | OP(dst[13 * dstStride], (src13 + src14) * 20 - (src12 + src15) * 6 + (src11 + src16) * 3 - (src10 + src16)); \ | 165 | 41.3M | OP(dst[14 * dstStride], (src14 + src15) * 20 - (src13 + src16) * 6 + (src12 + src16) * 3 - (src11 + src15)); \ | 166 | 41.3M | OP(dst[15 * dstStride], (src15 + src16) * 20 - (src14 + src16) * 6 + (src13 + src15) * 3 - (src12 + src14)); \ | 167 | 41.3M | dst++; \ | 168 | 41.3M | src++; \ | 169 | 41.3M | } \ | 170 | 2.58M | } \ |
qpeldsp.c:put_no_rnd_mpeg4_qpel16_v_lowpass Line | Count | Source | 127 | 259k | int dstStride, int srcStride) \ | 128 | 259k | { \ | 129 | 259k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 130 | 259k | const int w = 16; \ | 131 | 259k | int i; \ | 132 | 259k | \ | 133 | 4.41M | for (i = 0; i < w; i++) { \ | 134 | 4.15M | const int src0 = src[0 * srcStride]; \ | 135 | 4.15M | const int src1 = src[1 * srcStride]; \ | 136 | 4.15M | const int src2 = src[2 * srcStride]; \ | 137 | 4.15M | const int src3 = src[3 * srcStride]; \ | 138 | 4.15M | const int src4 = src[4 * srcStride]; \ | 139 | 4.15M | const int src5 = src[5 * srcStride]; \ | 140 | 4.15M | const int src6 = src[6 * srcStride]; \ | 141 | 4.15M | const int src7 = src[7 * srcStride]; \ | 142 | 4.15M | const int src8 = src[8 * srcStride]; \ | 143 | 4.15M | const int src9 = src[9 * srcStride]; \ | 144 | 4.15M | const int src10 = src[10 * srcStride]; \ | 145 | 4.15M | const int src11 = src[11 * srcStride]; \ | 146 | 4.15M | const int src12 = src[12 * srcStride]; \ | 147 | 4.15M | const int src13 = src[13 * srcStride]; \ | 148 | 4.15M | const int src14 = src[14 * srcStride]; \ | 149 | 4.15M | const int src15 = src[15 * srcStride]; \ | 150 | 4.15M | const int src16 = src[16 * srcStride]; \ | 151 | 4.15M | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ | 152 | 4.15M | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ | 153 | 4.15M | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ | 154 | 4.15M | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ | 155 | 4.15M | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ | 156 | 4.15M | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src9)); \ | 157 | 4.15M | OP(dst[6 
* dstStride], (src6 + src7) * 20 - (src5 + src8) * 6 + (src4 + src9) * 3 - (src3 + src10)); \ | 158 | 4.15M | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src9) * 6 + (src5 + src10) * 3 - (src4 + src11)); \ | 159 | 4.15M | OP(dst[8 * dstStride], (src8 + src9) * 20 - (src7 + src10) * 6 + (src6 + src11) * 3 - (src5 + src12)); \ | 160 | 4.15M | OP(dst[9 * dstStride], (src9 + src10) * 20 - (src8 + src11) * 6 + (src7 + src12) * 3 - (src6 + src13)); \ | 161 | 4.15M | OP(dst[10 * dstStride], (src10 + src11) * 20 - (src9 + src12) * 6 + (src8 + src13) * 3 - (src7 + src14)); \ | 162 | 4.15M | OP(dst[11 * dstStride], (src11 + src12) * 20 - (src10 + src13) * 6 + (src9 + src14) * 3 - (src8 + src15)); \ | 163 | 4.15M | OP(dst[12 * dstStride], (src12 + src13) * 20 - (src11 + src14) * 6 + (src10 + src15) * 3 - (src9 + src16)); \ | 164 | 4.15M | OP(dst[13 * dstStride], (src13 + src14) * 20 - (src12 + src15) * 6 + (src11 + src16) * 3 - (src10 + src16)); \ | 165 | 4.15M | OP(dst[14 * dstStride], (src14 + src15) * 20 - (src13 + src16) * 6 + (src12 + src16) * 3 - (src11 + src15)); \ | 166 | 4.15M | OP(dst[15 * dstStride], (src15 + src16) * 20 - (src14 + src16) * 6 + (src13 + src15) * 3 - (src12 + src14)); \ | 167 | 4.15M | dst++; \ | 168 | 4.15M | src++; \ | 169 | 4.15M | } \ | 170 | 259k | } \ |
qpeldsp.c:avg_mpeg4_qpel16_v_lowpass Line | Count | Source | 127 | 9.97k | int dstStride, int srcStride) \ | 128 | 9.97k | { \ | 129 | 9.97k | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; \ | 130 | 9.97k | const int w = 16; \ | 131 | 9.97k | int i; \ | 132 | 9.97k | \ | 133 | 169k | for (i = 0; i < w; i++) { \ | 134 | 159k | const int src0 = src[0 * srcStride]; \ | 135 | 159k | const int src1 = src[1 * srcStride]; \ | 136 | 159k | const int src2 = src[2 * srcStride]; \ | 137 | 159k | const int src3 = src[3 * srcStride]; \ | 138 | 159k | const int src4 = src[4 * srcStride]; \ | 139 | 159k | const int src5 = src[5 * srcStride]; \ | 140 | 159k | const int src6 = src[6 * srcStride]; \ | 141 | 159k | const int src7 = src[7 * srcStride]; \ | 142 | 159k | const int src8 = src[8 * srcStride]; \ | 143 | 159k | const int src9 = src[9 * srcStride]; \ | 144 | 159k | const int src10 = src[10 * srcStride]; \ | 145 | 159k | const int src11 = src[11 * srcStride]; \ | 146 | 159k | const int src12 = src[12 * srcStride]; \ | 147 | 159k | const int src13 = src[13 * srcStride]; \ | 148 | 159k | const int src14 = src[14 * srcStride]; \ | 149 | 159k | const int src15 = src[15 * srcStride]; \ | 150 | 159k | const int src16 = src[16 * srcStride]; \ | 151 | 159k | OP(dst[0 * dstStride], (src0 + src1) * 20 - (src0 + src2) * 6 + (src1 + src3) * 3 - (src2 + src4)); \ | 152 | 159k | OP(dst[1 * dstStride], (src1 + src2) * 20 - (src0 + src3) * 6 + (src0 + src4) * 3 - (src1 + src5)); \ | 153 | 159k | OP(dst[2 * dstStride], (src2 + src3) * 20 - (src1 + src4) * 6 + (src0 + src5) * 3 - (src0 + src6)); \ | 154 | 159k | OP(dst[3 * dstStride], (src3 + src4) * 20 - (src2 + src5) * 6 + (src1 + src6) * 3 - (src0 + src7)); \ | 155 | 159k | OP(dst[4 * dstStride], (src4 + src5) * 20 - (src3 + src6) * 6 + (src2 + src7) * 3 - (src1 + src8)); \ | 156 | 159k | OP(dst[5 * dstStride], (src5 + src6) * 20 - (src4 + src7) * 6 + (src3 + src8) * 3 - (src2 + src9)); \ | 157 | 159k | OP(dst[6 * dstStride], (src6 + 
src7) * 20 - (src5 + src8) * 6 + (src4 + src9) * 3 - (src3 + src10)); \ | 158 | 159k | OP(dst[7 * dstStride], (src7 + src8) * 20 - (src6 + src9) * 6 + (src5 + src10) * 3 - (src4 + src11)); \ | 159 | 159k | OP(dst[8 * dstStride], (src8 + src9) * 20 - (src7 + src10) * 6 + (src6 + src11) * 3 - (src5 + src12)); \ | 160 | 159k | OP(dst[9 * dstStride], (src9 + src10) * 20 - (src8 + src11) * 6 + (src7 + src12) * 3 - (src6 + src13)); \ | 161 | 159k | OP(dst[10 * dstStride], (src10 + src11) * 20 - (src9 + src12) * 6 + (src8 + src13) * 3 - (src7 + src14)); \ | 162 | 159k | OP(dst[11 * dstStride], (src11 + src12) * 20 - (src10 + src13) * 6 + (src9 + src14) * 3 - (src8 + src15)); \ | 163 | 159k | OP(dst[12 * dstStride], (src12 + src13) * 20 - (src11 + src14) * 6 + (src10 + src15) * 3 - (src9 + src16)); \ | 164 | 159k | OP(dst[13 * dstStride], (src13 + src14) * 20 - (src12 + src15) * 6 + (src11 + src16) * 3 - (src10 + src16)); \ | 165 | 159k | OP(dst[14 * dstStride], (src14 + src15) * 20 - (src13 + src16) * 6 + (src12 + src16) * 3 - (src11 + src15)); \ | 166 | 159k | OP(dst[15 * dstStride], (src15 + src16) * 20 - (src14 + src16) * 6 + (src13 + src15) * 3 - (src12 + src14)); \ | 167 | 159k | dst++; \ | 168 | 159k | src++; \ | 169 | 159k | } \ | 170 | 9.97k | } \ |
|
171 | | \ |
172 | | static void OPNAME ## qpel8_mc10_c(uint8_t *dst, const uint8_t *src, \ |
173 | 28.1k | ptrdiff_t stride) \ |
174 | 28.1k | { \ |
175 | 28.1k | uint8_t half[64]; \ |
176 | 28.1k | \ |
177 | 28.1k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ |
178 | 28.1k | OPNAME ## pixels8_l2_8(dst, src, half, stride, stride, 8, 8); \ |
179 | 28.1k | } \ qpeldsp.c:put_qpel8_mc10_c Line | Count | Source | 173 | 17.5k | ptrdiff_t stride) \ | 174 | 17.5k | { \ | 175 | 17.5k | uint8_t half[64]; \ | 176 | 17.5k | \ | 177 | 17.5k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ | 178 | 17.5k | OPNAME ## pixels8_l2_8(dst, src, half, stride, stride, 8, 8); \ | 179 | 17.5k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc10_c Line | Count | Source | 173 | 3.20k | ptrdiff_t stride) \ | 174 | 3.20k | { \ | 175 | 3.20k | uint8_t half[64]; \ | 176 | 3.20k | \ | 177 | 3.20k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ | 178 | 3.20k | OPNAME ## pixels8_l2_8(dst, src, half, stride, stride, 8, 8); \ | 179 | 3.20k | } \ |
qpeldsp.c:avg_qpel8_mc10_c Line | Count | Source | 173 | 7.38k | ptrdiff_t stride) \ | 174 | 7.38k | { \ | 175 | 7.38k | uint8_t half[64]; \ | 176 | 7.38k | \ | 177 | 7.38k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ | 178 | 7.38k | OPNAME ## pixels8_l2_8(dst, src, half, stride, stride, 8, 8); \ | 179 | 7.38k | } \ |
|
180 | | \ |
181 | | static void OPNAME ## qpel8_mc20_c(uint8_t *dst, const uint8_t *src, \ |
182 | 18.1k | ptrdiff_t stride) \ |
183 | 18.1k | { \ |
184 | 18.1k | OPNAME ## mpeg4_qpel8_h_lowpass(dst, src, stride, stride, 8); \ |
185 | 18.1k | } \ qpeldsp.c:put_qpel8_mc20_c Line | Count | Source | 182 | 8.73k | ptrdiff_t stride) \ | 183 | 8.73k | { \ | 184 | 8.73k | OPNAME ## mpeg4_qpel8_h_lowpass(dst, src, stride, stride, 8); \ | 185 | 8.73k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc20_c Line | Count | Source | 182 | 2.88k | ptrdiff_t stride) \ | 183 | 2.88k | { \ | 184 | 2.88k | OPNAME ## mpeg4_qpel8_h_lowpass(dst, src, stride, stride, 8); \ | 185 | 2.88k | } \ |
qpeldsp.c:avg_qpel8_mc20_c Line | Count | Source | 182 | 6.53k | ptrdiff_t stride) \ | 183 | 6.53k | { \ | 184 | 6.53k | OPNAME ## mpeg4_qpel8_h_lowpass(dst, src, stride, stride, 8); \ | 185 | 6.53k | } \ |
|
186 | | \ |
187 | | static void OPNAME ## qpel8_mc30_c(uint8_t *dst, const uint8_t *src, \ |
188 | 28.5k | ptrdiff_t stride) \ |
189 | 28.5k | { \ |
190 | 28.5k | uint8_t half[64]; \ |
191 | 28.5k | \ |
192 | 28.5k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ |
193 | 28.5k | OPNAME ## pixels8_l2_8(dst, src + 1, half, stride, stride, 8, 8); \ |
194 | 28.5k | } \ qpeldsp.c:put_qpel8_mc30_c Line | Count | Source | 188 | 16.5k | ptrdiff_t stride) \ | 189 | 16.5k | { \ | 190 | 16.5k | uint8_t half[64]; \ | 191 | 16.5k | \ | 192 | 16.5k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ | 193 | 16.5k | OPNAME ## pixels8_l2_8(dst, src + 1, half, stride, stride, 8, 8); \ | 194 | 16.5k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc30_c Line | Count | Source | 188 | 3.25k | ptrdiff_t stride) \ | 189 | 3.25k | { \ | 190 | 3.25k | uint8_t half[64]; \ | 191 | 3.25k | \ | 192 | 3.25k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ | 193 | 3.25k | OPNAME ## pixels8_l2_8(dst, src + 1, half, stride, stride, 8, 8); \ | 194 | 3.25k | } \ |
qpeldsp.c:avg_qpel8_mc30_c Line | Count | Source | 188 | 8.76k | ptrdiff_t stride) \ | 189 | 8.76k | { \ | 190 | 8.76k | uint8_t half[64]; \ | 191 | 8.76k | \ | 192 | 8.76k | put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8); \ | 193 | 8.76k | OPNAME ## pixels8_l2_8(dst, src + 1, half, stride, stride, 8, 8); \ | 194 | 8.76k | } \ |
|
195 | | \ |
196 | | static void OPNAME ## qpel8_mc01_c(uint8_t *dst, const uint8_t *src, \ |
197 | 18.9k | ptrdiff_t stride) \ |
198 | 18.9k | { \ |
199 | 18.9k | uint8_t full[16 * 9]; \ |
200 | 18.9k | uint8_t half[64]; \ |
201 | 18.9k | \ |
202 | 18.9k | copy_block8(full, src, 16, stride, 9); \ |
203 | 18.9k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ |
204 | 18.9k | OPNAME ## pixels8_l2_8(dst, full, half, stride, 16, 8, 8); \ |
205 | 18.9k | } \ qpeldsp.c:put_qpel8_mc01_c Line | Count | Source | 197 | 9.07k | ptrdiff_t stride) \ | 198 | 9.07k | { \ | 199 | 9.07k | uint8_t full[16 * 9]; \ | 200 | 9.07k | uint8_t half[64]; \ | 201 | 9.07k | \ | 202 | 9.07k | copy_block8(full, src, 16, stride, 9); \ | 203 | 9.07k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ | 204 | 9.07k | OPNAME ## pixels8_l2_8(dst, full, half, stride, 16, 8, 8); \ | 205 | 9.07k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc01_c Line | Count | Source | 197 | 3.04k | ptrdiff_t stride) \ | 198 | 3.04k | { \ | 199 | 3.04k | uint8_t full[16 * 9]; \ | 200 | 3.04k | uint8_t half[64]; \ | 201 | 3.04k | \ | 202 | 3.04k | copy_block8(full, src, 16, stride, 9); \ | 203 | 3.04k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ | 204 | 3.04k | OPNAME ## pixels8_l2_8(dst, full, half, stride, 16, 8, 8); \ | 205 | 3.04k | } \ |
qpeldsp.c:avg_qpel8_mc01_c Line | Count | Source | 197 | 6.84k | ptrdiff_t stride) \ | 198 | 6.84k | { \ | 199 | 6.84k | uint8_t full[16 * 9]; \ | 200 | 6.84k | uint8_t half[64]; \ | 201 | 6.84k | \ | 202 | 6.84k | copy_block8(full, src, 16, stride, 9); \ | 203 | 6.84k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ | 204 | 6.84k | OPNAME ## pixels8_l2_8(dst, full, half, stride, 16, 8, 8); \ | 205 | 6.84k | } \ |
|
206 | | \ |
207 | | static void OPNAME ## qpel8_mc02_c(uint8_t *dst, const uint8_t *src, \ |
208 | 18.7k | ptrdiff_t stride) \ |
209 | 18.7k | { \ |
210 | 18.7k | uint8_t full[16 * 9]; \ |
211 | 18.7k | \ |
212 | 18.7k | copy_block8(full, src, 16, stride, 9); \ |
213 | 18.7k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, full, stride, 16); \ |
214 | 18.7k | } \ qpeldsp.c:put_qpel8_mc02_c Line | Count | Source | 208 | 8.42k | ptrdiff_t stride) \ | 209 | 8.42k | { \ | 210 | 8.42k | uint8_t full[16 * 9]; \ | 211 | 8.42k | \ | 212 | 8.42k | copy_block8(full, src, 16, stride, 9); \ | 213 | 8.42k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, full, stride, 16); \ | 214 | 8.42k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc02_c Line | Count | Source | 208 | 2.36k | ptrdiff_t stride) \ | 209 | 2.36k | { \ | 210 | 2.36k | uint8_t full[16 * 9]; \ | 211 | 2.36k | \ | 212 | 2.36k | copy_block8(full, src, 16, stride, 9); \ | 213 | 2.36k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, full, stride, 16); \ | 214 | 2.36k | } \ |
qpeldsp.c:avg_qpel8_mc02_c Line | Count | Source | 208 | 7.97k | ptrdiff_t stride) \ | 209 | 7.97k | { \ | 210 | 7.97k | uint8_t full[16 * 9]; \ | 211 | 7.97k | \ | 212 | 7.97k | copy_block8(full, src, 16, stride, 9); \ | 213 | 7.97k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, full, stride, 16); \ | 214 | 7.97k | } \ |
|
215 | | \ |
216 | | static void OPNAME ## qpel8_mc03_c(uint8_t *dst, const uint8_t *src, \ |
217 | 21.1k | ptrdiff_t stride) \ |
218 | 21.1k | { \ |
219 | 21.1k | uint8_t full[16 * 9]; \ |
220 | 21.1k | uint8_t half[64]; \ |
221 | 21.1k | \ |
222 | 21.1k | copy_block8(full, src, 16, stride, 9); \ |
223 | 21.1k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ |
224 | 21.1k | OPNAME ## pixels8_l2_8(dst, full + 16, half, stride, 16, 8, 8); \ |
225 | 21.1k | } \ qpeldsp.c:put_qpel8_mc03_c Line | Count | Source | 217 | 10.3k | ptrdiff_t stride) \ | 218 | 10.3k | { \ | 219 | 10.3k | uint8_t full[16 * 9]; \ | 220 | 10.3k | uint8_t half[64]; \ | 221 | 10.3k | \ | 222 | 10.3k | copy_block8(full, src, 16, stride, 9); \ | 223 | 10.3k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ | 224 | 10.3k | OPNAME ## pixels8_l2_8(dst, full + 16, half, stride, 16, 8, 8); \ | 225 | 10.3k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc03_c Line | Count | Source | 217 | 2.92k | ptrdiff_t stride) \ | 218 | 2.92k | { \ | 219 | 2.92k | uint8_t full[16 * 9]; \ | 220 | 2.92k | uint8_t half[64]; \ | 221 | 2.92k | \ | 222 | 2.92k | copy_block8(full, src, 16, stride, 9); \ | 223 | 2.92k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ | 224 | 2.92k | OPNAME ## pixels8_l2_8(dst, full + 16, half, stride, 16, 8, 8); \ | 225 | 2.92k | } \ |
qpeldsp.c:avg_qpel8_mc03_c Line | Count | Source | 217 | 7.95k | ptrdiff_t stride) \ | 218 | 7.95k | { \ | 219 | 7.95k | uint8_t full[16 * 9]; \ | 220 | 7.95k | uint8_t half[64]; \ | 221 | 7.95k | \ | 222 | 7.95k | copy_block8(full, src, 16, stride, 9); \ | 223 | 7.95k | put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16); \ | 224 | 7.95k | OPNAME ## pixels8_l2_8(dst, full + 16, half, stride, 16, 8, 8); \ | 225 | 7.95k | } \ |
|
226 | | \ |
227 | | void ff_ ## OPNAME ## qpel8_mc11_old_c(uint8_t *dst, const uint8_t *src, \ |
228 | 9.47k | ptrdiff_t stride) \ |
229 | 9.47k | { \ |
230 | 9.47k | uint8_t full[16 * 9]; \ |
231 | 9.47k | uint8_t halfH[72]; \ |
232 | 9.47k | uint8_t halfV[64]; \ |
233 | 9.47k | uint8_t halfHV[64]; \ |
234 | 9.47k | \ |
235 | 9.47k | copy_block9(full, src, 16, stride, 9); \ |
236 | 9.47k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
237 | 9.47k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ |
238 | 9.47k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
239 | 9.47k | OPNAME ## pixels8_l4_8(dst, full, halfH, halfV, halfHV, \ |
240 | 9.47k | stride, 16, 8, 8, 8, 8); \ |
241 | 9.47k | } \ Line | Count | Source | 228 | 2.33k | ptrdiff_t stride) \ | 229 | 2.33k | { \ | 230 | 2.33k | uint8_t full[16 * 9]; \ | 231 | 2.33k | uint8_t halfH[72]; \ | 232 | 2.33k | uint8_t halfV[64]; \ | 233 | 2.33k | uint8_t halfHV[64]; \ | 234 | 2.33k | \ | 235 | 2.33k | copy_block9(full, src, 16, stride, 9); \ | 236 | 2.33k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 237 | 2.33k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 238 | 2.33k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 239 | 2.33k | OPNAME ## pixels8_l4_8(dst, full, halfH, halfV, halfHV, \ | 240 | 2.33k | stride, 16, 8, 8, 8, 8); \ | 241 | 2.33k | } \ |
ff_put_no_rnd_qpel8_mc11_old_c Line | Count | Source | 228 | 1.53k | ptrdiff_t stride) \ | 229 | 1.53k | { \ | 230 | 1.53k | uint8_t full[16 * 9]; \ | 231 | 1.53k | uint8_t halfH[72]; \ | 232 | 1.53k | uint8_t halfV[64]; \ | 233 | 1.53k | uint8_t halfHV[64]; \ | 234 | 1.53k | \ | 235 | 1.53k | copy_block9(full, src, 16, stride, 9); \ | 236 | 1.53k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 237 | 1.53k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 238 | 1.53k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 239 | 1.53k | OPNAME ## pixels8_l4_8(dst, full, halfH, halfV, halfHV, \ | 240 | 1.53k | stride, 16, 8, 8, 8, 8); \ | 241 | 1.53k | } \ |
Line | Count | Source | 228 | 5.60k | ptrdiff_t stride) \ | 229 | 5.60k | { \ | 230 | 5.60k | uint8_t full[16 * 9]; \ | 231 | 5.60k | uint8_t halfH[72]; \ | 232 | 5.60k | uint8_t halfV[64]; \ | 233 | 5.60k | uint8_t halfHV[64]; \ | 234 | 5.60k | \ | 235 | 5.60k | copy_block9(full, src, 16, stride, 9); \ | 236 | 5.60k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 237 | 5.60k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 238 | 5.60k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 239 | 5.60k | OPNAME ## pixels8_l4_8(dst, full, halfH, halfV, halfHV, \ | 240 | 5.60k | stride, 16, 8, 8, 8, 8); \ | 241 | 5.60k | } \ |
|
242 | | \ |
243 | | static void OPNAME ## qpel8_mc11_c(uint8_t *dst, const uint8_t *src, \ |
244 | 9.74k | ptrdiff_t stride) \ |
245 | 9.74k | { \ |
246 | 9.74k | uint8_t full[16 * 9]; \ |
247 | 9.74k | uint8_t halfH[72]; \ |
248 | 9.74k | uint8_t halfHV[64]; \ |
249 | 9.74k | \ |
250 | 9.74k | copy_block9(full, src, 16, stride, 9); \ |
251 | 9.74k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
252 | 9.74k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ |
253 | 9.74k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
254 | 9.74k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ |
255 | 9.74k | } \ qpeldsp.c:put_qpel8_mc11_c Line | Count | Source | 244 | 4.24k | ptrdiff_t stride) \ | 245 | 4.24k | { \ | 246 | 4.24k | uint8_t full[16 * 9]; \ | 247 | 4.24k | uint8_t halfH[72]; \ | 248 | 4.24k | uint8_t halfHV[64]; \ | 249 | 4.24k | \ | 250 | 4.24k | copy_block9(full, src, 16, stride, 9); \ | 251 | 4.24k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 252 | 4.24k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 253 | 4.24k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 254 | 4.24k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 255 | 4.24k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc11_c Line | Count | Source | 244 | 1.45k | ptrdiff_t stride) \ | 245 | 1.45k | { \ | 246 | 1.45k | uint8_t full[16 * 9]; \ | 247 | 1.45k | uint8_t halfH[72]; \ | 248 | 1.45k | uint8_t halfHV[64]; \ | 249 | 1.45k | \ | 250 | 1.45k | copy_block9(full, src, 16, stride, 9); \ | 251 | 1.45k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 252 | 1.45k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 253 | 1.45k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 254 | 1.45k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 255 | 1.45k | } \ |
qpeldsp.c:avg_qpel8_mc11_c Line | Count | Source | 244 | 4.03k | ptrdiff_t stride) \ | 245 | 4.03k | { \ | 246 | 4.03k | uint8_t full[16 * 9]; \ | 247 | 4.03k | uint8_t halfH[72]; \ | 248 | 4.03k | uint8_t halfHV[64]; \ | 249 | 4.03k | \ | 250 | 4.03k | copy_block9(full, src, 16, stride, 9); \ | 251 | 4.03k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 252 | 4.03k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 253 | 4.03k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 254 | 4.03k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 255 | 4.03k | } \ |
|
256 | | \ |
257 | | void ff_ ## OPNAME ## qpel8_mc31_old_c(uint8_t *dst, const uint8_t *src, \ |
258 | 10.8k | ptrdiff_t stride) \ |
259 | 10.8k | { \ |
260 | 10.8k | uint8_t full[16 * 9]; \ |
261 | 10.8k | uint8_t halfH[72]; \ |
262 | 10.8k | uint8_t halfV[64]; \ |
263 | 10.8k | uint8_t halfHV[64]; \ |
264 | 10.8k | \ |
265 | 10.8k | copy_block9(full, src, 16, stride, 9); \ |
266 | 10.8k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
267 | 10.8k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ |
268 | 10.8k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
269 | 10.8k | OPNAME ## pixels8_l4_8(dst, full + 1, halfH, halfV, halfHV, \ |
270 | 10.8k | stride, 16, 8, 8, 8, 8); \ |
271 | 10.8k | } \ Line | Count | Source | 258 | 3.74k | ptrdiff_t stride) \ | 259 | 3.74k | { \ | 260 | 3.74k | uint8_t full[16 * 9]; \ | 261 | 3.74k | uint8_t halfH[72]; \ | 262 | 3.74k | uint8_t halfV[64]; \ | 263 | 3.74k | uint8_t halfHV[64]; \ | 264 | 3.74k | \ | 265 | 3.74k | copy_block9(full, src, 16, stride, 9); \ | 266 | 3.74k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 267 | 3.74k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 268 | 3.74k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 269 | 3.74k | OPNAME ## pixels8_l4_8(dst, full + 1, halfH, halfV, halfHV, \ | 270 | 3.74k | stride, 16, 8, 8, 8, 8); \ | 271 | 3.74k | } \ |
ff_put_no_rnd_qpel8_mc31_old_c Line | Count | Source | 258 | 2.12k | ptrdiff_t stride) \ | 259 | 2.12k | { \ | 260 | 2.12k | uint8_t full[16 * 9]; \ | 261 | 2.12k | uint8_t halfH[72]; \ | 262 | 2.12k | uint8_t halfV[64]; \ | 263 | 2.12k | uint8_t halfHV[64]; \ | 264 | 2.12k | \ | 265 | 2.12k | copy_block9(full, src, 16, stride, 9); \ | 266 | 2.12k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 267 | 2.12k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 268 | 2.12k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 269 | 2.12k | OPNAME ## pixels8_l4_8(dst, full + 1, halfH, halfV, halfHV, \ | 270 | 2.12k | stride, 16, 8, 8, 8, 8); \ | 271 | 2.12k | } \ |
Line | Count | Source | 258 | 4.96k | ptrdiff_t stride) \ | 259 | 4.96k | { \ | 260 | 4.96k | uint8_t full[16 * 9]; \ | 261 | 4.96k | uint8_t halfH[72]; \ | 262 | 4.96k | uint8_t halfV[64]; \ | 263 | 4.96k | uint8_t halfHV[64]; \ | 264 | 4.96k | \ | 265 | 4.96k | copy_block9(full, src, 16, stride, 9); \ | 266 | 4.96k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 267 | 4.96k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 268 | 4.96k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 269 | 4.96k | OPNAME ## pixels8_l4_8(dst, full + 1, halfH, halfV, halfHV, \ | 270 | 4.96k | stride, 16, 8, 8, 8, 8); \ | 271 | 4.96k | } \ |
|
272 | | \ |
273 | | static void OPNAME ## qpel8_mc31_c(uint8_t *dst, const uint8_t *src, \ |
274 | 10.6k | ptrdiff_t stride) \ |
275 | 10.6k | { \ |
276 | 10.6k | uint8_t full[16 * 9]; \ |
277 | 10.6k | uint8_t halfH[72]; \ |
278 | 10.6k | uint8_t halfHV[64]; \ |
279 | 10.6k | \ |
280 | 10.6k | copy_block9(full, src, 16, stride, 9); \ |
281 | 10.6k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
282 | 10.6k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ |
283 | 10.6k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
284 | 10.6k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ |
285 | 10.6k | } \ qpeldsp.c:put_qpel8_mc31_c Line | Count | Source | 274 | 4.46k | ptrdiff_t stride) \ | 275 | 4.46k | { \ | 276 | 4.46k | uint8_t full[16 * 9]; \ | 277 | 4.46k | uint8_t halfH[72]; \ | 278 | 4.46k | uint8_t halfHV[64]; \ | 279 | 4.46k | \ | 280 | 4.46k | copy_block9(full, src, 16, stride, 9); \ | 281 | 4.46k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 282 | 4.46k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 283 | 4.46k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 284 | 4.46k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 285 | 4.46k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc31_c Line | Count | Source | 274 | 1.81k | ptrdiff_t stride) \ | 275 | 1.81k | { \ | 276 | 1.81k | uint8_t full[16 * 9]; \ | 277 | 1.81k | uint8_t halfH[72]; \ | 278 | 1.81k | uint8_t halfHV[64]; \ | 279 | 1.81k | \ | 280 | 1.81k | copy_block9(full, src, 16, stride, 9); \ | 281 | 1.81k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 282 | 1.81k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 283 | 1.81k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 284 | 1.81k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 285 | 1.81k | } \ |
qpeldsp.c:avg_qpel8_mc31_c Line | Count | Source | 274 | 4.39k | ptrdiff_t stride) \ | 275 | 4.39k | { \ | 276 | 4.39k | uint8_t full[16 * 9]; \ | 277 | 4.39k | uint8_t halfH[72]; \ | 278 | 4.39k | uint8_t halfHV[64]; \ | 279 | 4.39k | \ | 280 | 4.39k | copy_block9(full, src, 16, stride, 9); \ | 281 | 4.39k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 282 | 4.39k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 283 | 4.39k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 284 | 4.39k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 285 | 4.39k | } \ |
|
286 | | \ |
287 | | void ff_ ## OPNAME ## qpel8_mc13_old_c(uint8_t *dst, const uint8_t *src, \ |
288 | 7.24k | ptrdiff_t stride) \ |
289 | 7.24k | { \ |
290 | 7.24k | uint8_t full[16 * 9]; \ |
291 | 7.24k | uint8_t halfH[72]; \ |
292 | 7.24k | uint8_t halfV[64]; \ |
293 | 7.24k | uint8_t halfHV[64]; \ |
294 | 7.24k | \ |
295 | 7.24k | copy_block9(full, src, 16, stride, 9); \ |
296 | 7.24k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
297 | 7.24k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ |
298 | 7.24k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
299 | 7.24k | OPNAME ## pixels8_l4_8(dst, full + 16, halfH + 8, halfV, halfHV, \ |
300 | 7.24k | stride, 16, 8, 8, 8, 8); \ |
301 | 7.24k | } \ Line | Count | Source | 288 | 3.83k | ptrdiff_t stride) \ | 289 | 3.83k | { \ | 290 | 3.83k | uint8_t full[16 * 9]; \ | 291 | 3.83k | uint8_t halfH[72]; \ | 292 | 3.83k | uint8_t halfV[64]; \ | 293 | 3.83k | uint8_t halfHV[64]; \ | 294 | 3.83k | \ | 295 | 3.83k | copy_block9(full, src, 16, stride, 9); \ | 296 | 3.83k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 297 | 3.83k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 298 | 3.83k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 299 | 3.83k | OPNAME ## pixels8_l4_8(dst, full + 16, halfH + 8, halfV, halfHV, \ | 300 | 3.83k | stride, 16, 8, 8, 8, 8); \ | 301 | 3.83k | } \ |
ff_put_no_rnd_qpel8_mc13_old_c Line | Count | Source | 288 | 1.10k | ptrdiff_t stride) \ | 289 | 1.10k | { \ | 290 | 1.10k | uint8_t full[16 * 9]; \ | 291 | 1.10k | uint8_t halfH[72]; \ | 292 | 1.10k | uint8_t halfV[64]; \ | 293 | 1.10k | uint8_t halfHV[64]; \ | 294 | 1.10k | \ | 295 | 1.10k | copy_block9(full, src, 16, stride, 9); \ | 296 | 1.10k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 297 | 1.10k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 298 | 1.10k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 299 | 1.10k | OPNAME ## pixels8_l4_8(dst, full + 16, halfH + 8, halfV, halfHV, \ | 300 | 1.10k | stride, 16, 8, 8, 8, 8); \ | 301 | 1.10k | } \ |
Line | Count | Source | 288 | 2.30k | ptrdiff_t stride) \ | 289 | 2.30k | { \ | 290 | 2.30k | uint8_t full[16 * 9]; \ | 291 | 2.30k | uint8_t halfH[72]; \ | 292 | 2.30k | uint8_t halfV[64]; \ | 293 | 2.30k | uint8_t halfHV[64]; \ | 294 | 2.30k | \ | 295 | 2.30k | copy_block9(full, src, 16, stride, 9); \ | 296 | 2.30k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 297 | 2.30k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 298 | 2.30k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 299 | 2.30k | OPNAME ## pixels8_l4_8(dst, full + 16, halfH + 8, halfV, halfHV, \ | 300 | 2.30k | stride, 16, 8, 8, 8, 8); \ | 301 | 2.30k | } \ |
|
302 | | \ |
303 | | static void OPNAME ## qpel8_mc13_c(uint8_t *dst, const uint8_t *src, \ |
304 | 10.9k | ptrdiff_t stride) \ |
305 | 10.9k | { \ |
306 | 10.9k | uint8_t full[16 * 9]; \ |
307 | 10.9k | uint8_t halfH[72]; \ |
308 | 10.9k | uint8_t halfHV[64]; \ |
309 | 10.9k | \ |
310 | 10.9k | copy_block9(full, src, 16, stride, 9); \ |
311 | 10.9k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
312 | 10.9k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ |
313 | 10.9k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
314 | 10.9k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ |
315 | 10.9k | } \ qpeldsp.c:put_qpel8_mc13_c Line | Count | Source | 304 | 5.81k | ptrdiff_t stride) \ | 305 | 5.81k | { \ | 306 | 5.81k | uint8_t full[16 * 9]; \ | 307 | 5.81k | uint8_t halfH[72]; \ | 308 | 5.81k | uint8_t halfHV[64]; \ | 309 | 5.81k | \ | 310 | 5.81k | copy_block9(full, src, 16, stride, 9); \ | 311 | 5.81k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 312 | 5.81k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 313 | 5.81k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 314 | 5.81k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 315 | 5.81k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc13_c Line | Count | Source | 304 | 1.70k | ptrdiff_t stride) \ | 305 | 1.70k | { \ | 306 | 1.70k | uint8_t full[16 * 9]; \ | 307 | 1.70k | uint8_t halfH[72]; \ | 308 | 1.70k | uint8_t halfHV[64]; \ | 309 | 1.70k | \ | 310 | 1.70k | copy_block9(full, src, 16, stride, 9); \ | 311 | 1.70k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 312 | 1.70k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 313 | 1.70k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 314 | 1.70k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 315 | 1.70k | } \ |
qpeldsp.c:avg_qpel8_mc13_c Line | Count | Source | 304 | 3.39k | ptrdiff_t stride) \ | 305 | 3.39k | { \ | 306 | 3.39k | uint8_t full[16 * 9]; \ | 307 | 3.39k | uint8_t halfH[72]; \ | 308 | 3.39k | uint8_t halfHV[64]; \ | 309 | 3.39k | \ | 310 | 3.39k | copy_block9(full, src, 16, stride, 9); \ | 311 | 3.39k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 312 | 3.39k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 313 | 3.39k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 314 | 3.39k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 315 | 3.39k | } \ |
|
316 | | \ |
317 | | void ff_ ## OPNAME ## qpel8_mc33_old_c(uint8_t *dst, const uint8_t *src, \ |
318 | 7.89k | ptrdiff_t stride) \ |
319 | 7.89k | { \ |
320 | 7.89k | uint8_t full[16 * 9]; \ |
321 | 7.89k | uint8_t halfH[72]; \ |
322 | 7.89k | uint8_t halfV[64]; \ |
323 | 7.89k | uint8_t halfHV[64]; \ |
324 | 7.89k | \ |
325 | 7.89k | copy_block9(full, src, 16, stride, 9); \ |
326 | 7.89k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
327 | 7.89k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ |
328 | 7.89k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
329 | 7.89k | OPNAME ## pixels8_l4_8(dst, full + 17, halfH + 8, halfV, halfHV, \ |
330 | 7.89k | stride, 16, 8, 8, 8, 8); \ |
331 | 7.89k | } \ Line | Count | Source | 318 | 4.28k | ptrdiff_t stride) \ | 319 | 4.28k | { \ | 320 | 4.28k | uint8_t full[16 * 9]; \ | 321 | 4.28k | uint8_t halfH[72]; \ | 322 | 4.28k | uint8_t halfV[64]; \ | 323 | 4.28k | uint8_t halfHV[64]; \ | 324 | 4.28k | \ | 325 | 4.28k | copy_block9(full, src, 16, stride, 9); \ | 326 | 4.28k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 327 | 4.28k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 328 | 4.28k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 329 | 4.28k | OPNAME ## pixels8_l4_8(dst, full + 17, halfH + 8, halfV, halfHV, \ | 330 | 4.28k | stride, 16, 8, 8, 8, 8); \ | 331 | 4.28k | } \ |
ff_put_no_rnd_qpel8_mc33_old_c Line | Count | Source | 318 | 1.45k | ptrdiff_t stride) \ | 319 | 1.45k | { \ | 320 | 1.45k | uint8_t full[16 * 9]; \ | 321 | 1.45k | uint8_t halfH[72]; \ | 322 | 1.45k | uint8_t halfV[64]; \ | 323 | 1.45k | uint8_t halfHV[64]; \ | 324 | 1.45k | \ | 325 | 1.45k | copy_block9(full, src, 16, stride, 9); \ | 326 | 1.45k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 327 | 1.45k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 328 | 1.45k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 329 | 1.45k | OPNAME ## pixels8_l4_8(dst, full + 17, halfH + 8, halfV, halfHV, \ | 330 | 1.45k | stride, 16, 8, 8, 8, 8); \ | 331 | 1.45k | } \ |
Line | Count | Source | 318 | 2.15k | ptrdiff_t stride) \ | 319 | 2.15k | { \ | 320 | 2.15k | uint8_t full[16 * 9]; \ | 321 | 2.15k | uint8_t halfH[72]; \ | 322 | 2.15k | uint8_t halfV[64]; \ | 323 | 2.15k | uint8_t halfHV[64]; \ | 324 | 2.15k | \ | 325 | 2.15k | copy_block9(full, src, 16, stride, 9); \ | 326 | 2.15k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 327 | 2.15k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 328 | 2.15k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 329 | 2.15k | OPNAME ## pixels8_l4_8(dst, full + 17, halfH + 8, halfV, halfHV, \ | 330 | 2.15k | stride, 16, 8, 8, 8, 8); \ | 331 | 2.15k | } \ |
|
332 | | \ |
333 | | static void OPNAME ## qpel8_mc33_c(uint8_t *dst, const uint8_t *src, \ |
334 | 11.7k | ptrdiff_t stride) \ |
335 | 11.7k | { \ |
336 | 11.7k | uint8_t full[16 * 9]; \ |
337 | 11.7k | uint8_t halfH[72]; \ |
338 | 11.7k | uint8_t halfHV[64]; \ |
339 | 11.7k | \ |
340 | 11.7k | copy_block9(full, src, 16, stride, 9); \ |
341 | 11.7k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
342 | 11.7k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ |
343 | 11.7k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
344 | 11.7k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ |
345 | 11.7k | } \ qpeldsp.c:put_qpel8_mc33_c Line | Count | Source | 334 | 5.41k | ptrdiff_t stride) \ | 335 | 5.41k | { \ | 336 | 5.41k | uint8_t full[16 * 9]; \ | 337 | 5.41k | uint8_t halfH[72]; \ | 338 | 5.41k | uint8_t halfHV[64]; \ | 339 | 5.41k | \ | 340 | 5.41k | copy_block9(full, src, 16, stride, 9); \ | 341 | 5.41k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 342 | 5.41k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 343 | 5.41k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 344 | 5.41k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 345 | 5.41k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc33_c Line | Count | Source | 334 | 2.75k | ptrdiff_t stride) \ | 335 | 2.75k | { \ | 336 | 2.75k | uint8_t full[16 * 9]; \ | 337 | 2.75k | uint8_t halfH[72]; \ | 338 | 2.75k | uint8_t halfHV[64]; \ | 339 | 2.75k | \ | 340 | 2.75k | copy_block9(full, src, 16, stride, 9); \ | 341 | 2.75k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 342 | 2.75k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 343 | 2.75k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 344 | 2.75k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 345 | 2.75k | } \ |
qpeldsp.c:avg_qpel8_mc33_c Line | Count | Source | 334 | 3.58k | ptrdiff_t stride) \ | 335 | 3.58k | { \ | 336 | 3.58k | uint8_t full[16 * 9]; \ | 337 | 3.58k | uint8_t halfH[72]; \ | 338 | 3.58k | uint8_t halfHV[64]; \ | 339 | 3.58k | \ | 340 | 3.58k | copy_block9(full, src, 16, stride, 9); \ | 341 | 3.58k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 342 | 3.58k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 343 | 3.58k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 344 | 3.58k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 345 | 3.58k | } \ |
|
346 | | \ |
347 | | static void OPNAME ## qpel8_mc21_c(uint8_t *dst, const uint8_t *src, \ |
348 | 14.0k | ptrdiff_t stride) \ |
349 | 14.0k | { \ |
350 | 14.0k | uint8_t halfH[72]; \ |
351 | 14.0k | uint8_t halfHV[64]; \ |
352 | 14.0k | \ |
353 | 14.0k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ |
354 | 14.0k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
355 | 14.0k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ |
356 | 14.0k | } \ qpeldsp.c:put_qpel8_mc21_c Line | Count | Source | 348 | 6.45k | ptrdiff_t stride) \ | 349 | 6.45k | { \ | 350 | 6.45k | uint8_t halfH[72]; \ | 351 | 6.45k | uint8_t halfHV[64]; \ | 352 | 6.45k | \ | 353 | 6.45k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 354 | 6.45k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 355 | 6.45k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 356 | 6.45k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc21_c Line | Count | Source | 348 | 2.27k | ptrdiff_t stride) \ | 349 | 2.27k | { \ | 350 | 2.27k | uint8_t halfH[72]; \ | 351 | 2.27k | uint8_t halfHV[64]; \ | 352 | 2.27k | \ | 353 | 2.27k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 354 | 2.27k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 355 | 2.27k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 356 | 2.27k | } \ |
qpeldsp.c:avg_qpel8_mc21_c Line | Count | Source | 348 | 5.29k | ptrdiff_t stride) \ | 349 | 5.29k | { \ | 350 | 5.29k | uint8_t halfH[72]; \ | 351 | 5.29k | uint8_t halfHV[64]; \ | 352 | 5.29k | \ | 353 | 5.29k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 354 | 5.29k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 355 | 5.29k | OPNAME ## pixels8_l2_8(dst, halfH, halfHV, stride, 8, 8, 8); \ | 356 | 5.29k | } \ |
|
357 | | \ |
358 | | static void OPNAME ## qpel8_mc23_c(uint8_t *dst, const uint8_t *src, \ |
359 | 12.9k | ptrdiff_t stride) \ |
360 | 12.9k | { \ |
361 | 12.9k | uint8_t halfH[72]; \ |
362 | 12.9k | uint8_t halfHV[64]; \ |
363 | 12.9k | \ |
364 | 12.9k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ |
365 | 12.9k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
366 | 12.9k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ |
367 | 12.9k | } \ qpeldsp.c:put_qpel8_mc23_c Line | Count | Source | 359 | 5.21k | ptrdiff_t stride) \ | 360 | 5.21k | { \ | 361 | 5.21k | uint8_t halfH[72]; \ | 362 | 5.21k | uint8_t halfHV[64]; \ | 363 | 5.21k | \ | 364 | 5.21k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 365 | 5.21k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 366 | 5.21k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 367 | 5.21k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc23_c Line | Count | Source | 359 | 2.15k | ptrdiff_t stride) \ | 360 | 2.15k | { \ | 361 | 2.15k | uint8_t halfH[72]; \ | 362 | 2.15k | uint8_t halfHV[64]; \ | 363 | 2.15k | \ | 364 | 2.15k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 365 | 2.15k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 366 | 2.15k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 367 | 2.15k | } \ |
qpeldsp.c:avg_qpel8_mc23_c Line | Count | Source | 359 | 5.53k | ptrdiff_t stride) \ | 360 | 5.53k | { \ | 361 | 5.53k | uint8_t halfH[72]; \ | 362 | 5.53k | uint8_t halfHV[64]; \ | 363 | 5.53k | \ | 364 | 5.53k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 365 | 5.53k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 366 | 5.53k | OPNAME ## pixels8_l2_8(dst, halfH + 8, halfHV, stride, 8, 8, 8); \ | 367 | 5.53k | } \ |
|
368 | | \ |
369 | | void ff_ ## OPNAME ## qpel8_mc12_old_c(uint8_t *dst, const uint8_t *src, \ |
370 | 9.09k | ptrdiff_t stride) \ |
371 | 9.09k | { \ |
372 | 9.09k | uint8_t full[16 * 9]; \ |
373 | 9.09k | uint8_t halfH[72]; \ |
374 | 9.09k | uint8_t halfV[64]; \ |
375 | 9.09k | uint8_t halfHV[64]; \ |
376 | 9.09k | \ |
377 | 9.09k | copy_block9(full, src, 16, stride, 9); \ |
378 | 9.09k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
379 | 9.09k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ |
380 | 9.09k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
381 | 9.09k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ |
382 | 9.09k | } \ Line | Count | Source | 370 | 2.88k | ptrdiff_t stride) \ | 371 | 2.88k | { \ | 372 | 2.88k | uint8_t full[16 * 9]; \ | 373 | 2.88k | uint8_t halfH[72]; \ | 374 | 2.88k | uint8_t halfV[64]; \ | 375 | 2.88k | uint8_t halfHV[64]; \ | 376 | 2.88k | \ | 377 | 2.88k | copy_block9(full, src, 16, stride, 9); \ | 378 | 2.88k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 379 | 2.88k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 380 | 2.88k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 381 | 2.88k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ | 382 | 2.88k | } \ |
ff_put_no_rnd_qpel8_mc12_old_c Line | Count | Source | 370 | 1.28k | ptrdiff_t stride) \ | 371 | 1.28k | { \ | 372 | 1.28k | uint8_t full[16 * 9]; \ | 373 | 1.28k | uint8_t halfH[72]; \ | 374 | 1.28k | uint8_t halfV[64]; \ | 375 | 1.28k | uint8_t halfHV[64]; \ | 376 | 1.28k | \ | 377 | 1.28k | copy_block9(full, src, 16, stride, 9); \ | 378 | 1.28k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 379 | 1.28k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 380 | 1.28k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 381 | 1.28k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ | 382 | 1.28k | } \ |
Line | Count | Source | 370 | 4.92k | ptrdiff_t stride) \ | 371 | 4.92k | { \ | 372 | 4.92k | uint8_t full[16 * 9]; \ | 373 | 4.92k | uint8_t halfH[72]; \ | 374 | 4.92k | uint8_t halfV[64]; \ | 375 | 4.92k | uint8_t halfHV[64]; \ | 376 | 4.92k | \ | 377 | 4.92k | copy_block9(full, src, 16, stride, 9); \ | 378 | 4.92k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 379 | 4.92k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16); \ | 380 | 4.92k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 381 | 4.92k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ | 382 | 4.92k | } \ |
|
383 | | \ |
384 | | static void OPNAME ## qpel8_mc12_c(uint8_t *dst, const uint8_t *src, \ |
385 | 6.85k | ptrdiff_t stride) \ |
386 | 6.85k | { \ |
387 | 6.85k | uint8_t full[16 * 9]; \ |
388 | 6.85k | uint8_t halfH[72]; \ |
389 | 6.85k | \ |
390 | 6.85k | copy_block9(full, src, 16, stride, 9); \ |
391 | 6.85k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
392 | 6.85k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ |
393 | 6.85k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ |
394 | 6.85k | } \ qpeldsp.c:put_qpel8_mc12_c Line | Count | Source | 385 | 2.58k | ptrdiff_t stride) \ | 386 | 2.58k | { \ | 387 | 2.58k | uint8_t full[16 * 9]; \ | 388 | 2.58k | uint8_t halfH[72]; \ | 389 | 2.58k | \ | 390 | 2.58k | copy_block9(full, src, 16, stride, 9); \ | 391 | 2.58k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 392 | 2.58k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 393 | 2.58k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 394 | 2.58k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc12_c Line | Count | Source | 385 | 977 | ptrdiff_t stride) \ | 386 | 977 | { \ | 387 | 977 | uint8_t full[16 * 9]; \ | 388 | 977 | uint8_t halfH[72]; \ | 389 | 977 | \ | 390 | 977 | copy_block9(full, src, 16, stride, 9); \ | 391 | 977 | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 392 | 977 | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 393 | 977 | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 394 | 977 | } \ |
qpeldsp.c:avg_qpel8_mc12_c Line | Count | Source | 385 | 3.29k | ptrdiff_t stride) \ | 386 | 3.29k | { \ | 387 | 3.29k | uint8_t full[16 * 9]; \ | 388 | 3.29k | uint8_t halfH[72]; \ | 389 | 3.29k | \ | 390 | 3.29k | copy_block9(full, src, 16, stride, 9); \ | 391 | 3.29k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 392 | 3.29k | put ## RND ## pixels8_l2_8(halfH, halfH, full, 8, 8, 16, 9); \ | 393 | 3.29k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 394 | 3.29k | } \ |
|
395 | | \ |
396 | | void ff_ ## OPNAME ## qpel8_mc32_old_c(uint8_t *dst, const uint8_t *src, \ |
397 | 12.7k | ptrdiff_t stride) \ |
398 | 12.7k | { \ |
399 | 12.7k | uint8_t full[16 * 9]; \ |
400 | 12.7k | uint8_t halfH[72]; \ |
401 | 12.7k | uint8_t halfV[64]; \ |
402 | 12.7k | uint8_t halfHV[64]; \ |
403 | 12.7k | \ |
404 | 12.7k | copy_block9(full, src, 16, stride, 9); \ |
405 | 12.7k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
406 | 12.7k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ |
407 | 12.7k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ |
408 | 12.7k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ |
409 | 12.7k | } \ Line | Count | Source | 397 | 2.49k | ptrdiff_t stride) \ | 398 | 2.49k | { \ | 399 | 2.49k | uint8_t full[16 * 9]; \ | 400 | 2.49k | uint8_t halfH[72]; \ | 401 | 2.49k | uint8_t halfV[64]; \ | 402 | 2.49k | uint8_t halfHV[64]; \ | 403 | 2.49k | \ | 404 | 2.49k | copy_block9(full, src, 16, stride, 9); \ | 405 | 2.49k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 406 | 2.49k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 407 | 2.49k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 408 | 2.49k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ | 409 | 2.49k | } \ |
ff_put_no_rnd_qpel8_mc32_old_c Line | Count | Source | 397 | 1.57k | ptrdiff_t stride) \ | 398 | 1.57k | { \ | 399 | 1.57k | uint8_t full[16 * 9]; \ | 400 | 1.57k | uint8_t halfH[72]; \ | 401 | 1.57k | uint8_t halfV[64]; \ | 402 | 1.57k | uint8_t halfHV[64]; \ | 403 | 1.57k | \ | 404 | 1.57k | copy_block9(full, src, 16, stride, 9); \ | 405 | 1.57k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 406 | 1.57k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 407 | 1.57k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 408 | 1.57k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ | 409 | 1.57k | } \ |
Line | Count | Source | 397 | 8.65k | ptrdiff_t stride) \ | 398 | 8.65k | { \ | 399 | 8.65k | uint8_t full[16 * 9]; \ | 400 | 8.65k | uint8_t halfH[72]; \ | 401 | 8.65k | uint8_t halfV[64]; \ | 402 | 8.65k | uint8_t halfHV[64]; \ | 403 | 8.65k | \ | 404 | 8.65k | copy_block9(full, src, 16, stride, 9); \ | 405 | 8.65k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 406 | 8.65k | put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full + 1, 8, 16); \ | 407 | 8.65k | put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8); \ | 408 | 8.65k | OPNAME ## pixels8_l2_8(dst, halfV, halfHV, stride, 8, 8, 8); \ | 409 | 8.65k | } \ |
|
410 | | \ |
411 | | static void OPNAME ## qpel8_mc32_c(uint8_t *dst, const uint8_t *src, \ |
412 | 6.65k | ptrdiff_t stride) \ |
413 | 6.65k | { \ |
414 | 6.65k | uint8_t full[16 * 9]; \ |
415 | 6.65k | uint8_t halfH[72]; \ |
416 | 6.65k | \ |
417 | 6.65k | copy_block9(full, src, 16, stride, 9); \ |
418 | 6.65k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ |
419 | 6.65k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ |
420 | 6.65k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ |
421 | 6.65k | } \ qpeldsp.c:put_qpel8_mc32_c Line | Count | Source | 412 | 2.66k | ptrdiff_t stride) \ | 413 | 2.66k | { \ | 414 | 2.66k | uint8_t full[16 * 9]; \ | 415 | 2.66k | uint8_t halfH[72]; \ | 416 | 2.66k | \ | 417 | 2.66k | copy_block9(full, src, 16, stride, 9); \ | 418 | 2.66k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 419 | 2.66k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 420 | 2.66k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 421 | 2.66k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc32_c Line | Count | Source | 412 | 1.23k | ptrdiff_t stride) \ | 413 | 1.23k | { \ | 414 | 1.23k | uint8_t full[16 * 9]; \ | 415 | 1.23k | uint8_t halfH[72]; \ | 416 | 1.23k | \ | 417 | 1.23k | copy_block9(full, src, 16, stride, 9); \ | 418 | 1.23k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 419 | 1.23k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 420 | 1.23k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 421 | 1.23k | } \ |
qpeldsp.c:avg_qpel8_mc32_c Line | Count | Source | 412 | 2.75k | ptrdiff_t stride) \ | 413 | 2.75k | { \ | 414 | 2.75k | uint8_t full[16 * 9]; \ | 415 | 2.75k | uint8_t halfH[72]; \ | 416 | 2.75k | \ | 417 | 2.75k | copy_block9(full, src, 16, stride, 9); \ | 418 | 2.75k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9); \ | 419 | 2.75k | put ## RND ## pixels8_l2_8(halfH, halfH, full + 1, 8, 8, 16, 9); \ | 420 | 2.75k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 421 | 2.75k | } \ |
|
422 | | \ |
423 | | static void OPNAME ## qpel8_mc22_c(uint8_t *dst, const uint8_t *src, \ |
424 | 14.2k | ptrdiff_t stride) \ |
425 | 14.2k | { \ |
426 | 14.2k | uint8_t halfH[72]; \ |
427 | 14.2k | \ |
428 | 14.2k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ |
429 | 14.2k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ |
430 | 14.2k | } \ qpeldsp.c:put_qpel8_mc22_c Line | Count | Source | 424 | 6.51k | ptrdiff_t stride) \ | 425 | 6.51k | { \ | 426 | 6.51k | uint8_t halfH[72]; \ | 427 | 6.51k | \ | 428 | 6.51k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 429 | 6.51k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 430 | 6.51k | } \ |
qpeldsp.c:put_no_rnd_qpel8_mc22_c Line | Count | Source | 424 | 1.91k | ptrdiff_t stride) \ | 425 | 1.91k | { \ | 426 | 1.91k | uint8_t halfH[72]; \ | 427 | 1.91k | \ | 428 | 1.91k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 429 | 1.91k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 430 | 1.91k | } \ |
qpeldsp.c:avg_qpel8_mc22_c Line | Count | Source | 424 | 5.78k | ptrdiff_t stride) \ | 425 | 5.78k | { \ | 426 | 5.78k | uint8_t halfH[72]; \ | 427 | 5.78k | \ | 428 | 5.78k | put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9); \ | 429 | 5.78k | OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8); \ | 430 | 5.78k | } \ |
|
431 | | \ |
432 | | static void OPNAME ## qpel16_mc10_c(uint8_t *dst, const uint8_t *src, \ |
433 | 281k | ptrdiff_t stride) \ |
434 | 281k | { \ |
435 | 281k | uint8_t half[256]; \ |
436 | 281k | \ |
437 | 281k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ |
438 | 281k | OPNAME ## pixels16_l2_8(dst, src, half, stride, stride, 16, 16); \ |
439 | 281k | } \ qpeldsp.c:put_qpel16_mc10_c Line | Count | Source | 433 | 263k | ptrdiff_t stride) \ | 434 | 263k | { \ | 435 | 263k | uint8_t half[256]; \ | 436 | 263k | \ | 437 | 263k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ | 438 | 263k | OPNAME ## pixels16_l2_8(dst, src, half, stride, stride, 16, 16); \ | 439 | 263k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc10_c Line | Count | Source | 433 | 12.1k | ptrdiff_t stride) \ | 434 | 12.1k | { \ | 435 | 12.1k | uint8_t half[256]; \ | 436 | 12.1k | \ | 437 | 12.1k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ | 438 | 12.1k | OPNAME ## pixels16_l2_8(dst, src, half, stride, stride, 16, 16); \ | 439 | 12.1k | } \ |
qpeldsp.c:avg_qpel16_mc10_c Line | Count | Source | 433 | 5.33k | ptrdiff_t stride) \ | 434 | 5.33k | { \ | 435 | 5.33k | uint8_t half[256]; \ | 436 | 5.33k | \ | 437 | 5.33k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ | 438 | 5.33k | OPNAME ## pixels16_l2_8(dst, src, half, stride, stride, 16, 16); \ | 439 | 5.33k | } \ |
|
440 | | \ |
441 | | static void OPNAME ## qpel16_mc20_c(uint8_t *dst, const uint8_t *src, \ |
442 | 262k | ptrdiff_t stride) \ |
443 | 262k | { \ |
444 | 262k | OPNAME ## mpeg4_qpel16_h_lowpass(dst, src, stride, stride, 16); \ |
445 | 262k | } \ qpeldsp.c:put_qpel16_mc20_c Line | Count | Source | 442 | 244k | ptrdiff_t stride) \ | 443 | 244k | { \ | 444 | 244k | OPNAME ## mpeg4_qpel16_h_lowpass(dst, src, stride, stride, 16); \ | 445 | 244k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc20_c Line | Count | Source | 442 | 14.1k | ptrdiff_t stride) \ | 443 | 14.1k | { \ | 444 | 14.1k | OPNAME ## mpeg4_qpel16_h_lowpass(dst, src, stride, stride, 16); \ | 445 | 14.1k | } \ |
qpeldsp.c:avg_qpel16_mc20_c Line | Count | Source | 442 | 3.88k | ptrdiff_t stride) \ | 443 | 3.88k | { \ | 444 | 3.88k | OPNAME ## mpeg4_qpel16_h_lowpass(dst, src, stride, stride, 16); \ | 445 | 3.88k | } \ |
|
446 | | \ |
447 | | static void OPNAME ## qpel16_mc30_c(uint8_t *dst, const uint8_t *src, \ |
448 | 287k | ptrdiff_t stride) \ |
449 | 287k | { \ |
450 | 287k | uint8_t half[256]; \ |
451 | 287k | \ |
452 | 287k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ |
453 | 287k | OPNAME ## pixels16_l2_8(dst, src + 1, half, stride, stride, 16, 16); \ |
454 | 287k | } \ qpeldsp.c:put_qpel16_mc30_c Line | Count | Source | 448 | 257k | ptrdiff_t stride) \ | 449 | 257k | { \ | 450 | 257k | uint8_t half[256]; \ | 451 | 257k | \ | 452 | 257k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ | 453 | 257k | OPNAME ## pixels16_l2_8(dst, src + 1, half, stride, stride, 16, 16); \ | 454 | 257k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc30_c Line | Count | Source | 448 | 25.3k | ptrdiff_t stride) \ | 449 | 25.3k | { \ | 450 | 25.3k | uint8_t half[256]; \ | 451 | 25.3k | \ | 452 | 25.3k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ | 453 | 25.3k | OPNAME ## pixels16_l2_8(dst, src + 1, half, stride, stride, 16, 16); \ | 454 | 25.3k | } \ |
qpeldsp.c:avg_qpel16_mc30_c Line | Count | Source | 448 | 4.91k | ptrdiff_t stride) \ | 449 | 4.91k | { \ | 450 | 4.91k | uint8_t half[256]; \ | 451 | 4.91k | \ | 452 | 4.91k | put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16); \ | 453 | 4.91k | OPNAME ## pixels16_l2_8(dst, src + 1, half, stride, stride, 16, 16); \ | 454 | 4.91k | } \ |
|
455 | | \ |
456 | | static void OPNAME ## qpel16_mc01_c(uint8_t *dst, const uint8_t *src, \ |
457 | 229k | ptrdiff_t stride) \ |
458 | 229k | { \ |
459 | 229k | uint8_t full[24 * 17]; \ |
460 | 229k | uint8_t half[256]; \ |
461 | 229k | \ |
462 | 229k | copy_block16(full, src, 24, stride, 17); \ |
463 | 229k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ |
464 | 229k | OPNAME ## pixels16_l2_8(dst, full, half, stride, 24, 16, 16); \ |
465 | 229k | } \ qpeldsp.c:put_qpel16_mc01_c Line | Count | Source | 457 | 217k | ptrdiff_t stride) \ | 458 | 217k | { \ | 459 | 217k | uint8_t full[24 * 17]; \ | 460 | 217k | uint8_t half[256]; \ | 461 | 217k | \ | 462 | 217k | copy_block16(full, src, 24, stride, 17); \ | 463 | 217k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ | 464 | 217k | OPNAME ## pixels16_l2_8(dst, full, half, stride, 24, 16, 16); \ | 465 | 217k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc01_c Line | Count | Source | 457 | 7.56k | ptrdiff_t stride) \ | 458 | 7.56k | { \ | 459 | 7.56k | uint8_t full[24 * 17]; \ | 460 | 7.56k | uint8_t half[256]; \ | 461 | 7.56k | \ | 462 | 7.56k | copy_block16(full, src, 24, stride, 17); \ | 463 | 7.56k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ | 464 | 7.56k | OPNAME ## pixels16_l2_8(dst, full, half, stride, 24, 16, 16); \ | 465 | 7.56k | } \ |
qpeldsp.c:avg_qpel16_mc01_c Line | Count | Source | 457 | 4.11k | ptrdiff_t stride) \ | 458 | 4.11k | { \ | 459 | 4.11k | uint8_t full[24 * 17]; \ | 460 | 4.11k | uint8_t half[256]; \ | 461 | 4.11k | \ | 462 | 4.11k | copy_block16(full, src, 24, stride, 17); \ | 463 | 4.11k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ | 464 | 4.11k | OPNAME ## pixels16_l2_8(dst, full, half, stride, 24, 16, 16); \ | 465 | 4.11k | } \ |
|
466 | | \ |
467 | | static void OPNAME ## qpel16_mc02_c(uint8_t *dst, const uint8_t *src, \ |
468 | 254k | ptrdiff_t stride) \ |
469 | 254k | { \ |
470 | 254k | uint8_t full[24 * 17]; \ |
471 | 254k | \ |
472 | 254k | copy_block16(full, src, 24, stride, 17); \ |
473 | 254k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, full, stride, 24); \ |
474 | 254k | } \ qpeldsp.c:put_qpel16_mc02_c Line | Count | Source | 468 | 236k | ptrdiff_t stride) \ | 469 | 236k | { \ | 470 | 236k | uint8_t full[24 * 17]; \ | 471 | 236k | \ | 472 | 236k | copy_block16(full, src, 24, stride, 17); \ | 473 | 236k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, full, stride, 24); \ | 474 | 236k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc02_c Line | Count | Source | 468 | 14.3k | ptrdiff_t stride) \ | 469 | 14.3k | { \ | 470 | 14.3k | uint8_t full[24 * 17]; \ | 471 | 14.3k | \ | 472 | 14.3k | copy_block16(full, src, 24, stride, 17); \ | 473 | 14.3k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, full, stride, 24); \ | 474 | 14.3k | } \ |
qpeldsp.c:avg_qpel16_mc02_c Line | Count | Source | 468 | 3.55k | ptrdiff_t stride) \ | 469 | 3.55k | { \ | 470 | 3.55k | uint8_t full[24 * 17]; \ | 471 | 3.55k | \ | 472 | 3.55k | copy_block16(full, src, 24, stride, 17); \ | 473 | 3.55k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, full, stride, 24); \ | 474 | 3.55k | } \ |
|
475 | | \ |
476 | | static void OPNAME ## qpel16_mc03_c(uint8_t *dst, const uint8_t *src, \ |
477 | 244k | ptrdiff_t stride) \ |
478 | 244k | { \ |
479 | 244k | uint8_t full[24 * 17]; \ |
480 | 244k | uint8_t half[256]; \ |
481 | 244k | \ |
482 | 244k | copy_block16(full, src, 24, stride, 17); \ |
483 | 244k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ |
484 | 244k | OPNAME ## pixels16_l2_8(dst, full + 24, half, stride, 24, 16, 16); \ |
485 | 244k | } \ qpeldsp.c:put_qpel16_mc03_c Line | Count | Source | 477 | 207k | ptrdiff_t stride) \ | 478 | 207k | { \ | 479 | 207k | uint8_t full[24 * 17]; \ | 480 | 207k | uint8_t half[256]; \ | 481 | 207k | \ | 482 | 207k | copy_block16(full, src, 24, stride, 17); \ | 483 | 207k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ | 484 | 207k | OPNAME ## pixels16_l2_8(dst, full + 24, half, stride, 24, 16, 16); \ | 485 | 207k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc03_c Line | Count | Source | 477 | 32.6k | ptrdiff_t stride) \ | 478 | 32.6k | { \ | 479 | 32.6k | uint8_t full[24 * 17]; \ | 480 | 32.6k | uint8_t half[256]; \ | 481 | 32.6k | \ | 482 | 32.6k | copy_block16(full, src, 24, stride, 17); \ | 483 | 32.6k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ | 484 | 32.6k | OPNAME ## pixels16_l2_8(dst, full + 24, half, stride, 24, 16, 16); \ | 485 | 32.6k | } \ |
qpeldsp.c:avg_qpel16_mc03_c Line | Count | Source | 477 | 4.76k | ptrdiff_t stride) \ | 478 | 4.76k | { \ | 479 | 4.76k | uint8_t full[24 * 17]; \ | 480 | 4.76k | uint8_t half[256]; \ | 481 | 4.76k | \ | 482 | 4.76k | copy_block16(full, src, 24, stride, 17); \ | 483 | 4.76k | put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24); \ | 484 | 4.76k | OPNAME ## pixels16_l2_8(dst, full + 24, half, stride, 24, 16, 16); \ | 485 | 4.76k | } \ |
|
486 | | \ |
487 | | void ff_ ## OPNAME ## qpel16_mc11_old_c(uint8_t *dst, const uint8_t *src, \ |
488 | 9.32k | ptrdiff_t stride) \ |
489 | 9.32k | { \ |
490 | 9.32k | uint8_t full[24 * 17]; \ |
491 | 9.32k | uint8_t halfH[272]; \ |
492 | 9.32k | uint8_t halfV[256]; \ |
493 | 9.32k | uint8_t halfHV[256]; \ |
494 | 9.32k | \ |
495 | 9.32k | copy_block17(full, src, 24, stride, 17); \ |
496 | 9.32k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
497 | 9.32k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ |
498 | 9.32k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
499 | 9.32k | OPNAME ## pixels16_l4_8(dst, full, halfH, halfV, halfHV, \ |
500 | 9.32k | stride, 24, 16, 16, 16, 16); \ |
501 | 9.32k | } \ Line | Count | Source | 488 | 3.68k | ptrdiff_t stride) \ | 489 | 3.68k | { \ | 490 | 3.68k | uint8_t full[24 * 17]; \ | 491 | 3.68k | uint8_t halfH[272]; \ | 492 | 3.68k | uint8_t halfV[256]; \ | 493 | 3.68k | uint8_t halfHV[256]; \ | 494 | 3.68k | \ | 495 | 3.68k | copy_block17(full, src, 24, stride, 17); \ | 496 | 3.68k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 497 | 3.68k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 498 | 3.68k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 499 | 3.68k | OPNAME ## pixels16_l4_8(dst, full, halfH, halfV, halfHV, \ | 500 | 3.68k | stride, 24, 16, 16, 16, 16); \ | 501 | 3.68k | } \ |
ff_put_no_rnd_qpel16_mc11_old_c Line | Count | Source | 488 | 3.13k | ptrdiff_t stride) \ | 489 | 3.13k | { \ | 490 | 3.13k | uint8_t full[24 * 17]; \ | 491 | 3.13k | uint8_t halfH[272]; \ | 492 | 3.13k | uint8_t halfV[256]; \ | 493 | 3.13k | uint8_t halfHV[256]; \ | 494 | 3.13k | \ | 495 | 3.13k | copy_block17(full, src, 24, stride, 17); \ | 496 | 3.13k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 497 | 3.13k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 498 | 3.13k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 499 | 3.13k | OPNAME ## pixels16_l4_8(dst, full, halfH, halfV, halfHV, \ | 500 | 3.13k | stride, 24, 16, 16, 16, 16); \ | 501 | 3.13k | } \ |
Line | Count | Source | 488 | 2.50k | ptrdiff_t stride) \ | 489 | 2.50k | { \ | 490 | 2.50k | uint8_t full[24 * 17]; \ | 491 | 2.50k | uint8_t halfH[272]; \ | 492 | 2.50k | uint8_t halfV[256]; \ | 493 | 2.50k | uint8_t halfHV[256]; \ | 494 | 2.50k | \ | 495 | 2.50k | copy_block17(full, src, 24, stride, 17); \ | 496 | 2.50k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 497 | 2.50k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 498 | 2.50k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 499 | 2.50k | OPNAME ## pixels16_l4_8(dst, full, halfH, halfV, halfHV, \ | 500 | 2.50k | stride, 24, 16, 16, 16, 16); \ | 501 | 2.50k | } \ |
|
502 | | \ |
503 | | static void OPNAME ## qpel16_mc11_c(uint8_t *dst, const uint8_t *src, \ |
504 | 181k | ptrdiff_t stride) \ |
505 | 181k | { \ |
506 | 181k | uint8_t full[24 * 17]; \ |
507 | 181k | uint8_t halfH[272]; \ |
508 | 181k | uint8_t halfHV[256]; \ |
509 | 181k | \ |
510 | 181k | copy_block17(full, src, 24, stride, 17); \ |
511 | 181k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
512 | 181k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ |
513 | 181k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
514 | 181k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ |
515 | 181k | } \ qpeldsp.c:put_qpel16_mc11_c Line | Count | Source | 504 | 172k | ptrdiff_t stride) \ | 505 | 172k | { \ | 506 | 172k | uint8_t full[24 * 17]; \ | 507 | 172k | uint8_t halfH[272]; \ | 508 | 172k | uint8_t halfHV[256]; \ | 509 | 172k | \ | 510 | 172k | copy_block17(full, src, 24, stride, 17); \ | 511 | 172k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 512 | 172k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 513 | 172k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 514 | 172k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 515 | 172k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc11_c Line | Count | Source | 504 | 6.28k | ptrdiff_t stride) \ | 505 | 6.28k | { \ | 506 | 6.28k | uint8_t full[24 * 17]; \ | 507 | 6.28k | uint8_t halfH[272]; \ | 508 | 6.28k | uint8_t halfHV[256]; \ | 509 | 6.28k | \ | 510 | 6.28k | copy_block17(full, src, 24, stride, 17); \ | 511 | 6.28k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 512 | 6.28k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 513 | 6.28k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 514 | 6.28k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 515 | 6.28k | } \ |
qpeldsp.c:avg_qpel16_mc11_c Line | Count | Source | 504 | 2.82k | ptrdiff_t stride) \ | 505 | 2.82k | { \ | 506 | 2.82k | uint8_t full[24 * 17]; \ | 507 | 2.82k | uint8_t halfH[272]; \ | 508 | 2.82k | uint8_t halfHV[256]; \ | 509 | 2.82k | \ | 510 | 2.82k | copy_block17(full, src, 24, stride, 17); \ | 511 | 2.82k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 512 | 2.82k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 513 | 2.82k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 514 | 2.82k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 515 | 2.82k | } \ |
|
516 | | \ |
517 | | void ff_ ## OPNAME ## qpel16_mc31_old_c(uint8_t *dst, const uint8_t *src, \ |
518 | 18.4k | ptrdiff_t stride) \ |
519 | 18.4k | { \ |
520 | 18.4k | uint8_t full[24 * 17]; \ |
521 | 18.4k | uint8_t halfH[272]; \ |
522 | 18.4k | uint8_t halfV[256]; \ |
523 | 18.4k | uint8_t halfHV[256]; \ |
524 | 18.4k | \ |
525 | 18.4k | copy_block17(full, src, 24, stride, 17); \ |
526 | 18.4k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
527 | 18.4k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ |
528 | 18.4k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
529 | 18.4k | OPNAME ## pixels16_l4_8(dst, full + 1, halfH, halfV, halfHV, \ |
530 | 18.4k | stride, 24, 16, 16, 16, 16); \ |
531 | 18.4k | } \ Line | Count | Source | 518 | 10.6k | ptrdiff_t stride) \ | 519 | 10.6k | { \ | 520 | 10.6k | uint8_t full[24 * 17]; \ | 521 | 10.6k | uint8_t halfH[272]; \ | 522 | 10.6k | uint8_t halfV[256]; \ | 523 | 10.6k | uint8_t halfHV[256]; \ | 524 | 10.6k | \ | 525 | 10.6k | copy_block17(full, src, 24, stride, 17); \ | 526 | 10.6k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 527 | 10.6k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 528 | 10.6k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 529 | 10.6k | OPNAME ## pixels16_l4_8(dst, full + 1, halfH, halfV, halfHV, \ | 530 | 10.6k | stride, 24, 16, 16, 16, 16); \ | 531 | 10.6k | } \ |
ff_put_no_rnd_qpel16_mc31_old_c Line | Count | Source | 518 | 5.29k | ptrdiff_t stride) \ | 519 | 5.29k | { \ | 520 | 5.29k | uint8_t full[24 * 17]; \ | 521 | 5.29k | uint8_t halfH[272]; \ | 522 | 5.29k | uint8_t halfV[256]; \ | 523 | 5.29k | uint8_t halfHV[256]; \ | 524 | 5.29k | \ | 525 | 5.29k | copy_block17(full, src, 24, stride, 17); \ | 526 | 5.29k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 527 | 5.29k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 528 | 5.29k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 529 | 5.29k | OPNAME ## pixels16_l4_8(dst, full + 1, halfH, halfV, halfHV, \ | 530 | 5.29k | stride, 24, 16, 16, 16, 16); \ | 531 | 5.29k | } \ |
Line | Count | Source | 518 | 2.51k | ptrdiff_t stride) \ | 519 | 2.51k | { \ | 520 | 2.51k | uint8_t full[24 * 17]; \ | 521 | 2.51k | uint8_t halfH[272]; \ | 522 | 2.51k | uint8_t halfV[256]; \ | 523 | 2.51k | uint8_t halfHV[256]; \ | 524 | 2.51k | \ | 525 | 2.51k | copy_block17(full, src, 24, stride, 17); \ | 526 | 2.51k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 527 | 2.51k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 528 | 2.51k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 529 | 2.51k | OPNAME ## pixels16_l4_8(dst, full + 1, halfH, halfV, halfHV, \ | 530 | 2.51k | stride, 24, 16, 16, 16, 16); \ | 531 | 2.51k | } \ |
|
532 | | \ |
533 | | static void OPNAME ## qpel16_mc31_c(uint8_t *dst, const uint8_t *src, \ |
534 | 196k | ptrdiff_t stride) \ |
535 | 196k | { \ |
536 | 196k | uint8_t full[24 * 17]; \ |
537 | 196k | uint8_t halfH[272]; \ |
538 | 196k | uint8_t halfHV[256]; \ |
539 | 196k | \ |
540 | 196k | copy_block17(full, src, 24, stride, 17); \ |
541 | 196k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
542 | 196k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ |
543 | 196k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
544 | 196k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ |
545 | 196k | } \ qpeldsp.c:put_qpel16_mc31_c Line | Count | Source | 534 | 179k | ptrdiff_t stride) \ | 535 | 179k | { \ | 536 | 179k | uint8_t full[24 * 17]; \ | 537 | 179k | uint8_t halfH[272]; \ | 538 | 179k | uint8_t halfHV[256]; \ | 539 | 179k | \ | 540 | 179k | copy_block17(full, src, 24, stride, 17); \ | 541 | 179k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 542 | 179k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 543 | 179k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 544 | 179k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 545 | 179k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc31_c Line | Count | Source | 534 | 13.6k | ptrdiff_t stride) \ | 535 | 13.6k | { \ | 536 | 13.6k | uint8_t full[24 * 17]; \ | 537 | 13.6k | uint8_t halfH[272]; \ | 538 | 13.6k | uint8_t halfHV[256]; \ | 539 | 13.6k | \ | 540 | 13.6k | copy_block17(full, src, 24, stride, 17); \ | 541 | 13.6k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 542 | 13.6k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 543 | 13.6k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 544 | 13.6k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 545 | 13.6k | } \ |
qpeldsp.c:avg_qpel16_mc31_c Line | Count | Source | 534 | 2.77k | ptrdiff_t stride) \ | 535 | 2.77k | { \ | 536 | 2.77k | uint8_t full[24 * 17]; \ | 537 | 2.77k | uint8_t halfH[272]; \ | 538 | 2.77k | uint8_t halfHV[256]; \ | 539 | 2.77k | \ | 540 | 2.77k | copy_block17(full, src, 24, stride, 17); \ | 541 | 2.77k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 542 | 2.77k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 543 | 2.77k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 544 | 2.77k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 545 | 2.77k | } \ |
|
546 | | \ |
547 | | void ff_ ## OPNAME ## qpel16_mc13_old_c(uint8_t *dst, const uint8_t *src, \ |
548 | 13.0k | ptrdiff_t stride) \ |
549 | 13.0k | { \ |
550 | 13.0k | uint8_t full[24 * 17]; \ |
551 | 13.0k | uint8_t halfH[272]; \ |
552 | 13.0k | uint8_t halfV[256]; \ |
553 | 13.0k | uint8_t halfHV[256]; \ |
554 | 13.0k | \ |
555 | 13.0k | copy_block17(full, src, 24, stride, 17); \ |
556 | 13.0k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
557 | 13.0k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ |
558 | 13.0k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
559 | 13.0k | OPNAME ## pixels16_l4_8(dst, full + 24, halfH + 16, halfV, halfHV, \ |
560 | 13.0k | stride, 24, 16, 16, 16, 16); \ |
561 | 13.0k | } \ Line | Count | Source | 548 | 9.26k | ptrdiff_t stride) \ | 549 | 9.26k | { \ | 550 | 9.26k | uint8_t full[24 * 17]; \ | 551 | 9.26k | uint8_t halfH[272]; \ | 552 | 9.26k | uint8_t halfV[256]; \ | 553 | 9.26k | uint8_t halfHV[256]; \ | 554 | 9.26k | \ | 555 | 9.26k | copy_block17(full, src, 24, stride, 17); \ | 556 | 9.26k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 557 | 9.26k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 558 | 9.26k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 559 | 9.26k | OPNAME ## pixels16_l4_8(dst, full + 24, halfH + 16, halfV, halfHV, \ | 560 | 9.26k | stride, 24, 16, 16, 16, 16); \ | 561 | 9.26k | } \ |
ff_put_no_rnd_qpel16_mc13_old_c Line | Count | Source | 548 | 2.05k | ptrdiff_t stride) \ | 549 | 2.05k | { \ | 550 | 2.05k | uint8_t full[24 * 17]; \ | 551 | 2.05k | uint8_t halfH[272]; \ | 552 | 2.05k | uint8_t halfV[256]; \ | 553 | 2.05k | uint8_t halfHV[256]; \ | 554 | 2.05k | \ | 555 | 2.05k | copy_block17(full, src, 24, stride, 17); \ | 556 | 2.05k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 557 | 2.05k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 558 | 2.05k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 559 | 2.05k | OPNAME ## pixels16_l4_8(dst, full + 24, halfH + 16, halfV, halfHV, \ | 560 | 2.05k | stride, 24, 16, 16, 16, 16); \ | 561 | 2.05k | } \ |
Line | Count | Source | 548 | 1.75k | ptrdiff_t stride) \ | 549 | 1.75k | { \ | 550 | 1.75k | uint8_t full[24 * 17]; \ | 551 | 1.75k | uint8_t halfH[272]; \ | 552 | 1.75k | uint8_t halfV[256]; \ | 553 | 1.75k | uint8_t halfHV[256]; \ | 554 | 1.75k | \ | 555 | 1.75k | copy_block17(full, src, 24, stride, 17); \ | 556 | 1.75k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 557 | 1.75k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 558 | 1.75k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 559 | 1.75k | OPNAME ## pixels16_l4_8(dst, full + 24, halfH + 16, halfV, halfHV, \ | 560 | 1.75k | stride, 24, 16, 16, 16, 16); \ | 561 | 1.75k | } \ |
|
562 | | \ |
563 | | static void OPNAME ## qpel16_mc13_c(uint8_t *dst, const uint8_t *src, \ |
564 | 206k | ptrdiff_t stride) \ |
565 | 206k | { \ |
566 | 206k | uint8_t full[24 * 17]; \ |
567 | 206k | uint8_t halfH[272]; \ |
568 | 206k | uint8_t halfHV[256]; \ |
569 | 206k | \ |
570 | 206k | copy_block17(full, src, 24, stride, 17); \ |
571 | 206k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
572 | 206k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ |
573 | 206k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
574 | 206k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ |
575 | 206k | } \ qpeldsp.c:put_qpel16_mc13_c Line | Count | Source | 564 | 185k | ptrdiff_t stride) \ | 565 | 185k | { \ | 566 | 185k | uint8_t full[24 * 17]; \ | 567 | 185k | uint8_t halfH[272]; \ | 568 | 185k | uint8_t halfHV[256]; \ | 569 | 185k | \ | 570 | 185k | copy_block17(full, src, 24, stride, 17); \ | 571 | 185k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 572 | 185k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 573 | 185k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 574 | 185k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 575 | 185k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc13_c Line | Count | Source | 564 | 16.8k | ptrdiff_t stride) \ | 565 | 16.8k | { \ | 566 | 16.8k | uint8_t full[24 * 17]; \ | 567 | 16.8k | uint8_t halfH[272]; \ | 568 | 16.8k | uint8_t halfHV[256]; \ | 569 | 16.8k | \ | 570 | 16.8k | copy_block17(full, src, 24, stride, 17); \ | 571 | 16.8k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 572 | 16.8k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 573 | 16.8k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 574 | 16.8k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 575 | 16.8k | } \ |
qpeldsp.c:avg_qpel16_mc13_c Line | Count | Source | 564 | 3.73k | ptrdiff_t stride) \ | 565 | 3.73k | { \ | 566 | 3.73k | uint8_t full[24 * 17]; \ | 567 | 3.73k | uint8_t halfH[272]; \ | 568 | 3.73k | uint8_t halfHV[256]; \ | 569 | 3.73k | \ | 570 | 3.73k | copy_block17(full, src, 24, stride, 17); \ | 571 | 3.73k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 572 | 3.73k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 573 | 3.73k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 574 | 3.73k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 575 | 3.73k | } \ |
|
576 | | \ |
577 | | void ff_ ## OPNAME ## qpel16_mc33_old_c(uint8_t *dst, const uint8_t *src, \ |
578 | 14.3k | ptrdiff_t stride) \ |
579 | 14.3k | { \ |
580 | 14.3k | uint8_t full[24 * 17]; \ |
581 | 14.3k | uint8_t halfH[272]; \ |
582 | 14.3k | uint8_t halfV[256]; \ |
583 | 14.3k | uint8_t halfHV[256]; \ |
584 | 14.3k | \ |
585 | 14.3k | copy_block17(full, src, 24, stride, 17); \ |
586 | 14.3k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
587 | 14.3k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ |
588 | 14.3k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
589 | 14.3k | OPNAME ## pixels16_l4_8(dst, full + 25, halfH + 16, halfV, halfHV, \ |
590 | 14.3k | stride, 24, 16, 16, 16, 16); \ |
591 | 14.3k | } \ Line | Count | Source | 578 | 7.09k | ptrdiff_t stride) \ | 579 | 7.09k | { \ | 580 | 7.09k | uint8_t full[24 * 17]; \ | 581 | 7.09k | uint8_t halfH[272]; \ | 582 | 7.09k | uint8_t halfV[256]; \ | 583 | 7.09k | uint8_t halfHV[256]; \ | 584 | 7.09k | \ | 585 | 7.09k | copy_block17(full, src, 24, stride, 17); \ | 586 | 7.09k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 587 | 7.09k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 588 | 7.09k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 589 | 7.09k | OPNAME ## pixels16_l4_8(dst, full + 25, halfH + 16, halfV, halfHV, \ | 590 | 7.09k | stride, 24, 16, 16, 16, 16); \ | 591 | 7.09k | } \ |
ff_put_no_rnd_qpel16_mc33_old_c Line | Count | Source | 578 | 5.94k | ptrdiff_t stride) \ | 579 | 5.94k | { \ | 580 | 5.94k | uint8_t full[24 * 17]; \ | 581 | 5.94k | uint8_t halfH[272]; \ | 582 | 5.94k | uint8_t halfV[256]; \ | 583 | 5.94k | uint8_t halfHV[256]; \ | 584 | 5.94k | \ | 585 | 5.94k | copy_block17(full, src, 24, stride, 17); \ | 586 | 5.94k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 587 | 5.94k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 588 | 5.94k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 589 | 5.94k | OPNAME ## pixels16_l4_8(dst, full + 25, halfH + 16, halfV, halfHV, \ | 590 | 5.94k | stride, 24, 16, 16, 16, 16); \ | 591 | 5.94k | } \ |
Line | Count | Source | 578 | 1.33k | ptrdiff_t stride) \ | 579 | 1.33k | { \ | 580 | 1.33k | uint8_t full[24 * 17]; \ | 581 | 1.33k | uint8_t halfH[272]; \ | 582 | 1.33k | uint8_t halfV[256]; \ | 583 | 1.33k | uint8_t halfHV[256]; \ | 584 | 1.33k | \ | 585 | 1.33k | copy_block17(full, src, 24, stride, 17); \ | 586 | 1.33k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 587 | 1.33k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 588 | 1.33k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 589 | 1.33k | OPNAME ## pixels16_l4_8(dst, full + 25, halfH + 16, halfV, halfHV, \ | 590 | 1.33k | stride, 24, 16, 16, 16, 16); \ | 591 | 1.33k | } \ |
|
592 | | \ |
593 | | static void OPNAME ## qpel16_mc33_c(uint8_t *dst, const uint8_t *src, \ |
594 | 297k | ptrdiff_t stride) \ |
595 | 297k | { \ |
596 | 297k | uint8_t full[24 * 17]; \ |
597 | 297k | uint8_t halfH[272]; \ |
598 | 297k | uint8_t halfHV[256]; \ |
599 | 297k | \ |
600 | 297k | copy_block17(full, src, 24, stride, 17); \ |
601 | 297k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
602 | 297k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ |
603 | 297k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
604 | 297k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ |
605 | 297k | } \ qpeldsp.c:put_qpel16_mc33_c Line | Count | Source | 594 | 259k | ptrdiff_t stride) \ | 595 | 259k | { \ | 596 | 259k | uint8_t full[24 * 17]; \ | 597 | 259k | uint8_t halfH[272]; \ | 598 | 259k | uint8_t halfHV[256]; \ | 599 | 259k | \ | 600 | 259k | copy_block17(full, src, 24, stride, 17); \ | 601 | 259k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 602 | 259k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 603 | 259k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 604 | 259k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 605 | 259k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc33_c Line | Count | Source | 594 | 33.0k | ptrdiff_t stride) \ | 595 | 33.0k | { \ | 596 | 33.0k | uint8_t full[24 * 17]; \ | 597 | 33.0k | uint8_t halfH[272]; \ | 598 | 33.0k | uint8_t halfHV[256]; \ | 599 | 33.0k | \ | 600 | 33.0k | copy_block17(full, src, 24, stride, 17); \ | 601 | 33.0k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 602 | 33.0k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 603 | 33.0k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 604 | 33.0k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 605 | 33.0k | } \ |
qpeldsp.c:avg_qpel16_mc33_c Line | Count | Source | 594 | 4.37k | ptrdiff_t stride) \ | 595 | 4.37k | { \ | 596 | 4.37k | uint8_t full[24 * 17]; \ | 597 | 4.37k | uint8_t halfH[272]; \ | 598 | 4.37k | uint8_t halfHV[256]; \ | 599 | 4.37k | \ | 600 | 4.37k | copy_block17(full, src, 24, stride, 17); \ | 601 | 4.37k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 602 | 4.37k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 603 | 4.37k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 604 | 4.37k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 605 | 4.37k | } \ |
|
606 | | \ |
607 | | static void OPNAME ## qpel16_mc21_c(uint8_t *dst, const uint8_t *src, \ |
608 | 205k | ptrdiff_t stride) \ |
609 | 205k | { \ |
610 | 205k | uint8_t halfH[272]; \ |
611 | 205k | uint8_t halfHV[256]; \ |
612 | 205k | \ |
613 | 205k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ |
614 | 205k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
615 | 205k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ |
616 | 205k | } \ qpeldsp.c:put_qpel16_mc21_c Line | Count | Source | 608 | 193k | ptrdiff_t stride) \ | 609 | 193k | { \ | 610 | 193k | uint8_t halfH[272]; \ | 611 | 193k | uint8_t halfHV[256]; \ | 612 | 193k | \ | 613 | 193k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 614 | 193k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 615 | 193k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 616 | 193k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc21_c Line | Count | Source | 608 | 8.84k | ptrdiff_t stride) \ | 609 | 8.84k | { \ | 610 | 8.84k | uint8_t halfH[272]; \ | 611 | 8.84k | uint8_t halfHV[256]; \ | 612 | 8.84k | \ | 613 | 8.84k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 614 | 8.84k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 615 | 8.84k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 616 | 8.84k | } \ |
qpeldsp.c:avg_qpel16_mc21_c Line | Count | Source | 608 | 3.15k | ptrdiff_t stride) \ | 609 | 3.15k | { \ | 610 | 3.15k | uint8_t halfH[272]; \ | 611 | 3.15k | uint8_t halfHV[256]; \ | 612 | 3.15k | \ | 613 | 3.15k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 614 | 3.15k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 615 | 3.15k | OPNAME ## pixels16_l2_8(dst, halfH, halfHV, stride, 16, 16, 16); \ | 616 | 3.15k | } \ |
|
617 | | \ |
618 | | static void OPNAME ## qpel16_mc23_c(uint8_t *dst, const uint8_t *src, \ |
619 | 261k | ptrdiff_t stride) \ |
620 | 261k | { \ |
621 | 261k | uint8_t halfH[272]; \ |
622 | 261k | uint8_t halfHV[256]; \ |
623 | 261k | \ |
624 | 261k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ |
625 | 261k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
626 | 261k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ |
627 | 261k | } \ qpeldsp.c:put_qpel16_mc23_c Line | Count | Source | 619 | 222k | ptrdiff_t stride) \ | 620 | 222k | { \ | 621 | 222k | uint8_t halfH[272]; \ | 622 | 222k | uint8_t halfHV[256]; \ | 623 | 222k | \ | 624 | 222k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 625 | 222k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 626 | 222k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 627 | 222k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc23_c Line | Count | Source | 619 | 33.9k | ptrdiff_t stride) \ | 620 | 33.9k | { \ | 621 | 33.9k | uint8_t halfH[272]; \ | 622 | 33.9k | uint8_t halfHV[256]; \ | 623 | 33.9k | \ | 624 | 33.9k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 625 | 33.9k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 626 | 33.9k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 627 | 33.9k | } \ |
qpeldsp.c:avg_qpel16_mc23_c Line | Count | Source | 619 | 4.92k | ptrdiff_t stride) \ | 620 | 4.92k | { \ | 621 | 4.92k | uint8_t halfH[272]; \ | 622 | 4.92k | uint8_t halfHV[256]; \ | 623 | 4.92k | \ | 624 | 4.92k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 625 | 4.92k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 626 | 4.92k | OPNAME ## pixels16_l2_8(dst, halfH + 16, halfHV, stride, 16, 16, 16); \ | 627 | 4.92k | } \ |
|
628 | | \ |
629 | | void ff_ ## OPNAME ## qpel16_mc12_old_c(uint8_t *dst, const uint8_t *src, \ |
630 | 8.37k | ptrdiff_t stride) \ |
631 | 8.37k | { \ |
632 | 8.37k | uint8_t full[24 * 17]; \ |
633 | 8.37k | uint8_t halfH[272]; \ |
634 | 8.37k | uint8_t halfV[256]; \ |
635 | 8.37k | uint8_t halfHV[256]; \ |
636 | 8.37k | \ |
637 | 8.37k | copy_block17(full, src, 24, stride, 17); \ |
638 | 8.37k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
639 | 8.37k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ |
640 | 8.37k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
641 | 8.37k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ |
642 | 8.37k | } \ Line | Count | Source | 630 | 4.12k | ptrdiff_t stride) \ | 631 | 4.12k | { \ | 632 | 4.12k | uint8_t full[24 * 17]; \ | 633 | 4.12k | uint8_t halfH[272]; \ | 634 | 4.12k | uint8_t halfV[256]; \ | 635 | 4.12k | uint8_t halfHV[256]; \ | 636 | 4.12k | \ | 637 | 4.12k | copy_block17(full, src, 24, stride, 17); \ | 638 | 4.12k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 639 | 4.12k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 640 | 4.12k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 641 | 4.12k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ | 642 | 4.12k | } \ |
ff_put_no_rnd_qpel16_mc12_old_c Line | Count | Source | 630 | 2.15k | ptrdiff_t stride) \ | 631 | 2.15k | { \ | 632 | 2.15k | uint8_t full[24 * 17]; \ | 633 | 2.15k | uint8_t halfH[272]; \ | 634 | 2.15k | uint8_t halfV[256]; \ | 635 | 2.15k | uint8_t halfHV[256]; \ | 636 | 2.15k | \ | 637 | 2.15k | copy_block17(full, src, 24, stride, 17); \ | 638 | 2.15k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 639 | 2.15k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 640 | 2.15k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 641 | 2.15k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ | 642 | 2.15k | } \ |
Line | Count | Source | 630 | 2.09k | ptrdiff_t stride) \ | 631 | 2.09k | { \ | 632 | 2.09k | uint8_t full[24 * 17]; \ | 633 | 2.09k | uint8_t halfH[272]; \ | 634 | 2.09k | uint8_t halfV[256]; \ | 635 | 2.09k | uint8_t halfHV[256]; \ | 636 | 2.09k | \ | 637 | 2.09k | copy_block17(full, src, 24, stride, 17); \ | 638 | 2.09k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 639 | 2.09k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24); \ | 640 | 2.09k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 641 | 2.09k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ | 642 | 2.09k | } \ |
|
643 | | \ |
644 | | static void OPNAME ## qpel16_mc12_c(uint8_t *dst, const uint8_t *src, \ |
645 | 171k | ptrdiff_t stride) \ |
646 | 171k | { \ |
647 | 171k | uint8_t full[24 * 17]; \ |
648 | 171k | uint8_t halfH[272]; \ |
649 | 171k | \ |
650 | 171k | copy_block17(full, src, 24, stride, 17); \ |
651 | 171k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
652 | 171k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ |
653 | 171k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ |
654 | 171k | } \ qpeldsp.c:put_qpel16_mc12_c Line | Count | Source | 645 | 158k | ptrdiff_t stride) \ | 646 | 158k | { \ | 647 | 158k | uint8_t full[24 * 17]; \ | 648 | 158k | uint8_t halfH[272]; \ | 649 | 158k | \ | 650 | 158k | copy_block17(full, src, 24, stride, 17); \ | 651 | 158k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 652 | 158k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 653 | 158k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 654 | 158k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc12_c Line | Count | Source | 645 | 10.1k | ptrdiff_t stride) \ | 646 | 10.1k | { \ | 647 | 10.1k | uint8_t full[24 * 17]; \ | 648 | 10.1k | uint8_t halfH[272]; \ | 649 | 10.1k | \ | 650 | 10.1k | copy_block17(full, src, 24, stride, 17); \ | 651 | 10.1k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 652 | 10.1k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 653 | 10.1k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 654 | 10.1k | } \ |
qpeldsp.c:avg_qpel16_mc12_c Line | Count | Source | 645 | 2.16k | ptrdiff_t stride) \ | 646 | 2.16k | { \ | 647 | 2.16k | uint8_t full[24 * 17]; \ | 648 | 2.16k | uint8_t halfH[272]; \ | 649 | 2.16k | \ | 650 | 2.16k | copy_block17(full, src, 24, stride, 17); \ | 651 | 2.16k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 652 | 2.16k | put ## RND ## pixels16_l2_8(halfH, halfH, full, 16, 16, 24, 17); \ | 653 | 2.16k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 654 | 2.16k | } \ |
|
655 | | \ |
656 | | void ff_ ## OPNAME ## qpel16_mc32_old_c(uint8_t *dst, const uint8_t *src, \ |
657 | 14.6k | ptrdiff_t stride) \ |
658 | 14.6k | { \ |
659 | 14.6k | uint8_t full[24 * 17]; \ |
660 | 14.6k | uint8_t halfH[272]; \ |
661 | 14.6k | uint8_t halfV[256]; \ |
662 | 14.6k | uint8_t halfHV[256]; \ |
663 | 14.6k | \ |
664 | 14.6k | copy_block17(full, src, 24, stride, 17); \ |
665 | 14.6k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
666 | 14.6k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ |
667 | 14.6k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ |
668 | 14.6k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ |
669 | 14.6k | } \ Line | Count | Source | 657 | 5.26k | ptrdiff_t stride) \ | 658 | 5.26k | { \ | 659 | 5.26k | uint8_t full[24 * 17]; \ | 660 | 5.26k | uint8_t halfH[272]; \ | 661 | 5.26k | uint8_t halfV[256]; \ | 662 | 5.26k | uint8_t halfHV[256]; \ | 663 | 5.26k | \ | 664 | 5.26k | copy_block17(full, src, 24, stride, 17); \ | 665 | 5.26k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 666 | 5.26k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 667 | 5.26k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 668 | 5.26k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ | 669 | 5.26k | } \ |
ff_put_no_rnd_qpel16_mc32_old_c Line | Count | Source | 657 | 5.56k | ptrdiff_t stride) \ | 658 | 5.56k | { \ | 659 | 5.56k | uint8_t full[24 * 17]; \ | 660 | 5.56k | uint8_t halfH[272]; \ | 661 | 5.56k | uint8_t halfV[256]; \ | 662 | 5.56k | uint8_t halfHV[256]; \ | 663 | 5.56k | \ | 664 | 5.56k | copy_block17(full, src, 24, stride, 17); \ | 665 | 5.56k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 666 | 5.56k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 667 | 5.56k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 668 | 5.56k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ | 669 | 5.56k | } \ |
Line | Count | Source | 657 | 3.83k | ptrdiff_t stride) \ | 658 | 3.83k | { \ | 659 | 3.83k | uint8_t full[24 * 17]; \ | 660 | 3.83k | uint8_t halfH[272]; \ | 661 | 3.83k | uint8_t halfV[256]; \ | 662 | 3.83k | uint8_t halfHV[256]; \ | 663 | 3.83k | \ | 664 | 3.83k | copy_block17(full, src, 24, stride, 17); \ | 665 | 3.83k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 666 | 3.83k | put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full + 1, 16, 24); \ | 667 | 3.83k | put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16); \ | 668 | 3.83k | OPNAME ## pixels16_l2_8(dst, halfV, halfHV, stride, 16, 16, 16); \ | 669 | 3.83k | } \ |
|
670 | | \ |
671 | | static void OPNAME ## qpel16_mc32_c(uint8_t *dst, const uint8_t *src, \ |
672 | 241k | ptrdiff_t stride) \ |
673 | 241k | { \ |
674 | 241k | uint8_t full[24 * 17]; \ |
675 | 241k | uint8_t halfH[272]; \ |
676 | 241k | \ |
677 | 241k | copy_block17(full, src, 24, stride, 17); \ |
678 | 241k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ |
679 | 241k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ |
680 | 241k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ |
681 | 241k | } \ qpeldsp.c:put_qpel16_mc32_c Line | Count | Source | 672 | 218k | ptrdiff_t stride) \ | 673 | 218k | { \ | 674 | 218k | uint8_t full[24 * 17]; \ | 675 | 218k | uint8_t halfH[272]; \ | 676 | 218k | \ | 677 | 218k | copy_block17(full, src, 24, stride, 17); \ | 678 | 218k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 679 | 218k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 680 | 218k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 681 | 218k | } \ |
qpeldsp.c:put_no_rnd_qpel16_mc32_c Line | Count | Source | 672 | 21.2k | ptrdiff_t stride) \ | 673 | 21.2k | { \ | 674 | 21.2k | uint8_t full[24 * 17]; \ | 675 | 21.2k | uint8_t halfH[272]; \ | 676 | 21.2k | \ | 677 | 21.2k | copy_block17(full, src, 24, stride, 17); \ | 678 | 21.2k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 679 | 21.2k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 680 | 21.2k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 681 | 21.2k | } \ |
qpeldsp.c:avg_qpel16_mc32_c Line | Count | Source | 672 | 1.72k | ptrdiff_t stride) \ | 673 | 1.72k | { \ | 674 | 1.72k | uint8_t full[24 * 17]; \ | 675 | 1.72k | uint8_t halfH[272]; \ | 676 | 1.72k | \ | 677 | 1.72k | copy_block17(full, src, 24, stride, 17); \ | 678 | 1.72k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17); \ | 679 | 1.72k | put ## RND ## pixels16_l2_8(halfH, halfH, full + 1, 16, 16, 24, 17); \ | 680 | 1.72k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 681 | 1.72k | } \ |
|
682 | | \ |
683 | | static void OPNAME ## qpel16_mc22_c(uint8_t *dst, const uint8_t *src, \ |
684 | 206k | ptrdiff_t stride) \ |
685 | 206k | { \ |
686 | 206k | uint8_t halfH[272]; \ |
687 | 206k | \ |
688 | 206k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ |
689 | 206k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ |
690 | 206k | } qpeldsp.c:put_qpel16_mc22_c Line | Count | Source | 684 | 191k | ptrdiff_t stride) \ | 685 | 191k | { \ | 686 | 191k | uint8_t halfH[272]; \ | 687 | 191k | \ | 688 | 191k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 689 | 191k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 690 | 191k | } |
qpeldsp.c:put_no_rnd_qpel16_mc22_c Line | Count | Source | 684 | 12.5k | ptrdiff_t stride) \ | 685 | 12.5k | { \ | 686 | 12.5k | uint8_t halfH[272]; \ | 687 | 12.5k | \ | 688 | 12.5k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 689 | 12.5k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 690 | 12.5k | } |
qpeldsp.c:avg_qpel16_mc22_c Line | Count | Source | 684 | 2.52k | ptrdiff_t stride) \ | 685 | 2.52k | { \ | 686 | 2.52k | uint8_t halfH[272]; \ | 687 | 2.52k | \ | 688 | 2.52k | put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17); \ | 689 | 2.52k | OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16); \ | 690 | 2.52k | } |
|
691 | | |
/*
 * Store operators passed to QPEL_MC as its OP argument. In each of them `b`
 * is biased, shifted right by 5 (i.e. divided by 32) and used as an index
 * into the lookup table `cm`; the result is written to the lvalue `a`.
 * `cm` is not a file-scope name: it has to be a local of the function the
 * operator is expanded in (e.g. the mpeg4_qpel8_h_lowpass function at the top
 * of QPEL_MC declares it as ff_crop_tab + MAX_NEG_CROP).
 */
/* op_avg: bias 16 (round to nearest), then average with the value already
 * stored in `a`, rounding that average up (+1 before >> 1). */
692 | 5.23M | #define op_avg(a, b) a = (((a) + cm[((b) + 16) >> 5] + 1) >> 1)
/* op_put: bias 16 (round to nearest) and overwrite `a`. */
693 | 1.39G | #define op_put(a, b) a = cm[((b) + 16) >> 5]
/* op_put_no_rnd: like op_put but with a bias of 15, so an exact half rounds
 * down instead of up. */
694 | 133M | #define op_put_no_rnd(a, b) a = cm[((b) + 15) >> 5]
695 | |
/*
 * Expand the QPEL_MC function family three times. OPNAME is the name prefix of
 * the generated functions, RND is pasted into the names of the intermediate
 * helpers (`put ## RND ## ...`): `_` selects the put_ helpers, `_no_rnd_` the
 * put_no_rnd_ helpers. The avg_ family therefore uses the rounding put_
 * helpers for its intermediate steps and op_avg only for its own stores.
 * NOTE(review): the use of the first argument (0/1/0) is not visible in this
 * part of the file — check the macro body before relying on it.
 */
696 | 1.39G | QPEL_MC(0, put_, _, op_put)
697 | 133M | QPEL_MC(1, put_no_rnd_, _no_rnd_, op_put_no_rnd)
698 | 5.23M | QPEL_MC(0, avg_, _, op_avg)
699 | |
/* The operators are only needed for the expansions above; drop them so the
 * short names do not leak into the rest of the file. */
700 | | #undef op_avg
701 | | #undef op_put
702 | | #undef op_put_no_rnd
703 | | |
/*
 * Externally visible wrapper with the three-argument (dst, src, stride)
 * signature: forwards to put_pixels8_8_c() with its last argument fixed at 8.
 * NOTE(review): put_pixels8_8_c is defined outside this view (presumably in
 * one of the included *_template.c files); the fixed 8 is presumably the
 * number of rows, giving an 8x8 block copy — confirm against the helper.
 */
704 | | void ff_put_pixels8x8_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
705 | 52.4M | {
706 | 52.4M | put_pixels8_8_c(dst, src, stride, 8);
707 | 52.4M | }
708 | | |
/*
 * Externally visible wrapper with the three-argument (dst, src, stride)
 * signature: forwards to avg_pixels8_8_c() with its last argument fixed at 8.
 * NOTE(review): avg_pixels8_8_c is defined outside this view; by its name it
 * presumably averages src into the existing dst contents over 8 rows —
 * confirm against the helper.
 */
709 | | void ff_avg_pixels8x8_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
710 | 5.82M | {
711 | 5.82M | avg_pixels8_8_c(dst, src, stride, 8);
712 | 5.82M | }
713 | | |
/*
 * Externally visible wrapper with the three-argument (dst, src, stride)
 * signature: forwards to put_pixels16_8_c() with its last argument fixed at
 * 16.
 * NOTE(review): put_pixels16_8_c is defined outside this view; the fixed 16
 * is presumably the number of rows, giving a 16x16 block copy — confirm
 * against the helper.
 */
714 | | void ff_put_pixels16x16_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
715 | 189M | {
716 | 189M | put_pixels16_8_c(dst, src, stride, 16);
717 | 189M | }
718 | | |
/**
 * Fixed-size 16x16 entry point for the "avg" operation.
 *
 * Forwards dst, src and stride unchanged to avg_pixels16_8_c() and pins its
 * last argument (the height) to 16.
 */
void ff_avg_pixels16x16_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
{
    avg_pixels16_8_c(dst, src, stride, 16);
}
723 | | |
/*
 * The mc00 table slots have no dedicated implementation: they are aliases
 * for the fixed-size put/avg wrappers defined in this file. The no_rnd
 * family reuses the ordinary put wrappers for this slot.
 */
#define put_qpel8_mc00_c         ff_put_pixels8x8_c
#define put_qpel16_mc00_c        ff_put_pixels16x16_c
#define put_no_rnd_qpel8_mc00_c  ff_put_pixels8x8_c
#define put_no_rnd_qpel16_mc00_c ff_put_pixels16x16_c
#define avg_qpel8_mc00_c         ff_avg_pixels8x8_c
#define avg_qpel16_mc00_c        ff_avg_pixels16x16_c
730 | | |
/**
 * Non-static wrapper around put_pixels8_l2_8().
 *
 * Every argument (destination, the two sources, their three strides and the
 * height) is passed through unchanged.
 */
void ff_put_pixels8_l2_8(uint8_t *dst,
                         const uint8_t *src1, const uint8_t *src2,
                         int dst_stride, int src_stride1, int src_stride2,
                         int h)
{
    put_pixels8_l2_8(dst, src1, src2, dst_stride, src_stride1, src_stride2, h);
}
738 | | |
#if CONFIG_DIRAC_DECODER
/*
 * Generate the Dirac pixel functions for one operation (OPNAME is
 * instantiated below with put and with avg).
 *
 * For each of the widths 8, 16 and 32 three variants are emitted:
 *   - plain: forwards src[0] to OPNAME_pixels<W>_8_c();
 *   - _l2:   forwards src[0] and src[1] to OPNAME_pixels<W>_l2_8();
 *   - _l4:   forwards src[0] .. src[3] to OPNAME_pixels<W>_l4_8().
 * The 32-wide variants are built from two 16-wide calls, the second one with
 * dst and every source pointer advanced by 16.
 * The same stride value is passed for the destination and for all sources.
 */
#define DIRAC_MC(OPNAME)                                                       \
void ff_ ## OPNAME ## _dirac_pixels8_c(uint8_t *dst, const uint8_t *src[5],    \
                                       int stride, int h)                      \
{                                                                              \
    OPNAME ## _pixels8_8_c(dst, src[0], stride, h);                            \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels16_c(uint8_t *dst, const uint8_t *src[5],   \
                                        int stride, int h)                     \
{                                                                              \
    OPNAME ## _pixels16_8_c(dst, src[0], stride, h);                           \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels32_c(uint8_t *dst, const uint8_t *src[5],   \
                                        int stride, int h)                     \
{                                                                              \
    OPNAME ## _pixels16_8_c(dst,      src[0],      stride, h);                 \
    OPNAME ## _pixels16_8_c(dst + 16, src[0] + 16, stride, h);                 \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels8_l2_c(uint8_t *dst, const uint8_t *src[5], \
                                          int stride, int h)                   \
{                                                                              \
    OPNAME ## _pixels8_l2_8(dst, src[0], src[1],                               \
                            stride, stride, stride, h);                        \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels16_l2_c(uint8_t *dst, const uint8_t *src[5], \
                                           int stride, int h)                  \
{                                                                              \
    OPNAME ## _pixels16_l2_8(dst, src[0], src[1],                              \
                             stride, stride, stride, h);                       \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels32_l2_c(uint8_t *dst, const uint8_t *src[5], \
                                           int stride, int h)                  \
{                                                                              \
    OPNAME ## _pixels16_l2_8(dst,      src[0],      src[1],                    \
                             stride, stride, stride, h);                       \
    OPNAME ## _pixels16_l2_8(dst + 16, src[0] + 16, src[1] + 16,               \
                             stride, stride, stride, h);                       \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels8_l4_c(uint8_t *dst, const uint8_t *src[5], \
                                          int stride, int h)                   \
{                                                                              \
    OPNAME ## _pixels8_l4_8(dst, src[0], src[1], src[2], src[3],               \
                            stride, stride, stride, stride, stride, h);        \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels16_l4_c(uint8_t *dst, const uint8_t *src[5], \
                                           int stride, int h)                  \
{                                                                              \
    OPNAME ## _pixels16_l4_8(dst, src[0], src[1], src[2], src[3],              \
                             stride, stride, stride, stride, stride, h);       \
}                                                                              \
void ff_ ## OPNAME ## _dirac_pixels32_l4_c(uint8_t *dst, const uint8_t *src[5], \
                                           int stride, int h)                  \
{                                                                              \
    OPNAME ## _pixels16_l4_8(dst,      src[0],      src[1],                    \
                             src[2],      src[3],                              \
                             stride, stride, stride, stride, stride, h);       \
    OPNAME ## _pixels16_l4_8(dst + 16, src[0] + 16, src[1] + 16,               \
                             src[2] + 16, src[3] + 16,                         \
                             stride, stride, stride, stride, stride, h);       \
}

DIRAC_MC(put)
DIRAC_MC(avg)
#endif
783 | | |
784 | | av_cold void ff_qpeldsp_init(QpelDSPContext *c) |
785 | 44.2k | { |
786 | 44.2k | #define dspfunc(PFX, IDX, NUM) \ |
787 | 265k | c->PFX ## _pixels_tab[IDX][0] = PFX ## NUM ## _mc00_c; \ |
788 | 265k | c->PFX ## _pixels_tab[IDX][1] = PFX ## NUM ## _mc10_c; \ |
789 | 265k | c->PFX ## _pixels_tab[IDX][2] = PFX ## NUM ## _mc20_c; \ |
790 | 265k | c->PFX ## _pixels_tab[IDX][3] = PFX ## NUM ## _mc30_c; \ |
791 | 265k | c->PFX ## _pixels_tab[IDX][4] = PFX ## NUM ## _mc01_c; \ |
792 | 265k | c->PFX ## _pixels_tab[IDX][5] = PFX ## NUM ## _mc11_c; \ |
793 | 265k | c->PFX ## _pixels_tab[IDX][6] = PFX ## NUM ## _mc21_c; \ |
794 | 265k | c->PFX ## _pixels_tab[IDX][7] = PFX ## NUM ## _mc31_c; \ |
795 | 265k | c->PFX ## _pixels_tab[IDX][8] = PFX ## NUM ## _mc02_c; \ |
796 | 265k | c->PFX ## _pixels_tab[IDX][9] = PFX ## NUM ## _mc12_c; \ |
797 | 265k | c->PFX ## _pixels_tab[IDX][10] = PFX ## NUM ## _mc22_c; \ |
798 | 265k | c->PFX ## _pixels_tab[IDX][11] = PFX ## NUM ## _mc32_c; \ |
799 | 265k | c->PFX ## _pixels_tab[IDX][12] = PFX ## NUM ## _mc03_c; \ |
800 | 265k | c->PFX ## _pixels_tab[IDX][13] = PFX ## NUM ## _mc13_c; \ |
801 | 265k | c->PFX ## _pixels_tab[IDX][14] = PFX ## NUM ## _mc23_c; \ |
802 | 265k | c->PFX ## _pixels_tab[IDX][15] = PFX ## NUM ## _mc33_c |
803 | | |
804 | 44.2k | dspfunc(put_qpel, 0, 16); |
805 | 44.2k | dspfunc(put_qpel, 1, 8); |
806 | | |
807 | 44.2k | dspfunc(put_no_rnd_qpel, 0, 16); |
808 | 44.2k | dspfunc(put_no_rnd_qpel, 1, 8); |
809 | | |
810 | 44.2k | dspfunc(avg_qpel, 0, 16); |
811 | 44.2k | dspfunc(avg_qpel, 1, 8); |
812 | | |
813 | | #if ARCH_X86 && HAVE_X86ASM |
814 | | ff_qpeldsp_init_x86(c); |
815 | | #elif ARCH_MIPS |
816 | | ff_qpeldsp_init_mips(c); |
817 | | #endif |
818 | 44.2k | } |