/src/opus/celt/x86/x86cpu.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* Copyright (c) 2014, Cisco Systems, INC |
2 | | Written by XiangMingZhu WeiZhou MinPeng YanWang |
3 | | |
4 | | Redistribution and use in source and binary forms, with or without |
5 | | modification, are permitted provided that the following conditions |
6 | | are met: |
7 | | |
8 | | - Redistributions of source code must retain the above copyright |
9 | | notice, this list of conditions and the following disclaimer. |
10 | | |
11 | | - Redistributions in binary form must reproduce the above copyright |
12 | | notice, this list of conditions and the following disclaimer in the |
13 | | documentation and/or other materials provided with the distribution. |
14 | | |
15 | | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
16 | | ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
17 | | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
18 | | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER |
19 | | OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
20 | | EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
21 | | PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
22 | | PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
23 | | LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
24 | | NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
25 | | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
26 | | */ |
27 | | |
28 | | #ifdef HAVE_CONFIG_H |
29 | | #include "config.h" |
30 | | #endif |
31 | | |
32 | | #include "cpu_support.h" |
33 | | #include "macros.h" |
34 | | #include "main.h" |
35 | | #include "pitch.h" |
36 | | #include "x86cpu.h" |
37 | | |
38 | | #if defined(OPUS_HAVE_RTCD) && \ |
39 | | ((defined(OPUS_X86_MAY_HAVE_SSE) && !defined(OPUS_X86_PRESUME_SSE)) || \ |
40 | | (defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(OPUS_X86_PRESUME_SSE2)) || \ |
41 | | (defined(OPUS_X86_MAY_HAVE_SSE4_1) && !defined(OPUS_X86_PRESUME_SSE4_1)) || \ |
42 | | (defined(OPUS_X86_MAY_HAVE_AVX2) && !defined(OPUS_X86_PRESUME_AVX2))) |
43 | | |
44 | | #if defined(_MSC_VER) |
45 | | |
46 | | #include <intrin.h> |
47 | | static _inline void cpuid(unsigned int CPUInfo[4], unsigned int InfoType) |
48 | | { |
49 | | __cpuid((int*)CPUInfo, InfoType); |
50 | | } |
51 | | |
52 | | #else |
53 | | |
54 | | #if defined(CPU_INFO_BY_C) |
55 | | #include <cpuid.h> |
56 | | #endif |
57 | | |
58 | | static void cpuid(unsigned int CPUInfo[4], unsigned int InfoType) |
59 | 0 | { |
60 | 0 | #if defined(CPU_INFO_BY_ASM) |
61 | | #if defined(__i386__) && defined(__PIC__) |
62 | | /* %ebx is PIC register in 32-bit, so mustn't clobber it. */ |
63 | | __asm__ __volatile__ ( |
64 | | "xchg %%ebx, %1\n" |
65 | | "cpuid\n" |
66 | | "xchg %%ebx, %1\n": |
67 | | "=a" (CPUInfo[0]), |
68 | | "=r" (CPUInfo[1]), |
69 | | "=c" (CPUInfo[2]), |
70 | | "=d" (CPUInfo[3]) : |
71 | | /* We clear ECX to avoid a valgrind false-positive prior to v3.17.0. */ |
72 | | "0" (InfoType), "2" (0) |
73 | | ); |
74 | | #else |
75 | 0 | __asm__ __volatile__ ( |
76 | 0 | "cpuid": |
77 | 0 | "=a" (CPUInfo[0]), |
78 | 0 | "=b" (CPUInfo[1]), |
79 | 0 | "=c" (CPUInfo[2]), |
80 | 0 | "=d" (CPUInfo[3]) : |
81 | | /* We clear ECX to avoid a valgrind false-positive prior to v3.17.0. */ |
82 | 0 | "0" (InfoType), "2" (0) |
83 | 0 | ); |
84 | 0 | #endif |
85 | | #elif defined(CPU_INFO_BY_C) |
86 | | /* We use __get_cpuid_count to clear ECX to avoid a valgrind false-positive |
87 | | prior to v3.17.0.*/ |
88 | | if (!__get_cpuid_count(InfoType, 0, &(CPUInfo[0]), &(CPUInfo[1]), &(CPUInfo[2]), &(CPUInfo[3]))) { |
89 | | /* Our function cannot fail, but __get_cpuid{_count} can. |
90 | | Returning all zeroes will effectively disable all SIMD, which is |
91 | | what we want on CPUs that don't support CPUID. */ |
92 | | CPUInfo[3] = CPUInfo[2] = CPUInfo[1] = CPUInfo[0] = 0; |
93 | | } |
94 | | #else |
95 | | # error "Configured to use x86 RTCD, but no CPU detection method available. " \ |
96 | | "Reconfigure with --disable-rtcd (or send patches)." |
97 | | #endif |
98 | 0 | } |
99 | | |
100 | | #endif |
101 | | |
102 | | typedef struct CPU_Feature{ |
103 | | /* SIMD: 128-bit */ |
104 | | int HW_SSE; |
105 | | int HW_SSE2; |
106 | | int HW_SSE41; |
107 | | /* SIMD: 256-bit */ |
108 | | int HW_AVX2; |
109 | | } CPU_Feature; |
110 | | |
111 | | static void opus_cpu_feature_check(CPU_Feature *cpu_feature) |
112 | 0 | { |
113 | 0 | unsigned int info[4]; |
114 | 0 | unsigned int nIds = 0; |
115 | |
|
116 | 0 | cpuid(info, 0); |
117 | 0 | nIds = info[0]; |
118 | |
|
119 | 0 | if (nIds >= 1){ |
120 | 0 | cpuid(info, 1); |
121 | 0 | cpu_feature->HW_SSE = (info[3] & (1 << 25)) != 0; |
122 | 0 | cpu_feature->HW_SSE2 = (info[3] & (1 << 26)) != 0; |
123 | 0 | cpu_feature->HW_SSE41 = (info[2] & (1 << 19)) != 0; |
124 | 0 | cpu_feature->HW_AVX2 = (info[2] & (1 << 28)) != 0 && (info[2] & (1 << 12)) != 0; |
125 | 0 | if (cpu_feature->HW_AVX2 && nIds >= 7) { |
126 | 0 | cpuid(info, 7); |
127 | 0 | cpu_feature->HW_AVX2 = cpu_feature->HW_AVX2 && (info[1] & (1 << 5)) != 0; |
128 | 0 | } else { |
129 | 0 | cpu_feature->HW_AVX2 = 0; |
130 | 0 | } |
131 | 0 | } |
132 | 0 | else { |
133 | 0 | cpu_feature->HW_SSE = 0; |
134 | 0 | cpu_feature->HW_SSE2 = 0; |
135 | 0 | cpu_feature->HW_SSE41 = 0; |
136 | 0 | cpu_feature->HW_AVX2 = 0; |
137 | 0 | } |
138 | 0 | } |
139 | | |
140 | | static int opus_select_arch_impl(void) |
141 | 0 | { |
142 | 0 | CPU_Feature cpu_feature; |
143 | 0 | int arch; |
144 | |
|
145 | 0 | opus_cpu_feature_check(&cpu_feature); |
146 | |
|
147 | 0 | arch = 0; |
148 | 0 | if (!cpu_feature.HW_SSE) |
149 | 0 | { |
150 | 0 | return arch; |
151 | 0 | } |
152 | 0 | arch++; |
153 | |
|
154 | 0 | if (!cpu_feature.HW_SSE2) |
155 | 0 | { |
156 | 0 | return arch; |
157 | 0 | } |
158 | 0 | arch++; |
159 | |
|
160 | 0 | if (!cpu_feature.HW_SSE41) |
161 | 0 | { |
162 | 0 | return arch; |
163 | 0 | } |
164 | 0 | arch++; |
165 | |
|
166 | 0 | if (!cpu_feature.HW_AVX2) |
167 | 0 | { |
168 | 0 | return arch; |
169 | 0 | } |
170 | 0 | arch++; |
171 | |
|
172 | 0 | return arch; |
173 | 0 | } |
174 | | |
175 | 0 | int opus_select_arch(void) { |
176 | 0 | int arch = opus_select_arch_impl(); |
177 | | #ifdef FUZZING |
178 | | /* Randomly downgrade the architecture. */ |
179 | | arch = rand()%(arch+1); |
180 | | #endif |
181 | 0 | return arch; |
182 | 0 | } |
183 | | |
184 | | #endif |