/src/mozilla-central/mozglue/build/SSE.h
Line | Count | Source (jump to first uncovered line) |
1 | | /* vim: set shiftwidth=2 tabstop=8 autoindent cindent expandtab: */ |
2 | | /* This Source Code Form is subject to the terms of the Mozilla Public |
3 | | * License, v. 2.0. If a copy of the MPL was not distributed with this |
4 | | * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ |
5 | | |
6 | | /* compile-time and runtime tests for whether to use SSE instructions */ |
7 | | |
8 | | #ifndef mozilla_SSE_h_ |
9 | | #define mozilla_SSE_h_ |
10 | | |
11 | | // for definition of MFBT_DATA |
12 | | #include "mozilla/Types.h" |
13 | | |
14 | | /** |
15 | | * The public interface of this header consists of a set of macros and |
16 | | * functions for Intel CPU features. |
17 | | * |
18 | | * DETECTING ISA EXTENSIONS |
19 | | * ======================== |
20 | | * |
21 | | * This header provides the following functions for determining whether the |
22 | | * current CPU supports a particular instruction set extension: |
23 | | * |
24 | | * mozilla::supports_mmx |
25 | | * mozilla::supports_sse |
26 | | * mozilla::supports_sse2 |
27 | | * mozilla::supports_sse3 |
28 | | * mozilla::supports_ssse3 |
29 | | * mozilla::supports_sse4a |
30 | | * mozilla::supports_sse4_1 |
31 | | * mozilla::supports_sse4_2 |
32 | | * mozilla::supports_avx |
33 | | * mozilla::supports_avx2 |
34 | | * mozilla::supports_aes |
35 | | * |
36 | | * If you're writing code using inline assembly, you should guard it with a |
37 | | * call to one of these functions. For instance: |
38 | | * |
39 | | * if (mozilla::supports_sse2()) { |
40 | | * asm(" ... "); |
41 | | * } |
42 | | * else { |
43 | | * ... |
44 | | * } |
45 | | * |
46 | | * Note that these functions depend on cpuid intrinsics only available in gcc |
47 | | * 4.3 or later and MSVC 8.0 (Visual C++ 2005) or later, so they return false |
48 | | * in older compilers. (This could be fixed by replacing the code with inline |
49 | | * assembly.) |
50 | | * |
51 | | * |
52 | | * USING INTRINSICS |
53 | | * ================ |
54 | | * |
55 | | * This header also provides support for coding using CPU intrinsics. |
56 | | * |
57 | | * For each mozilla::supports_abc function, we define a MOZILLA_MAY_SUPPORT_ABC |
58 | | * macro which indicates that the target/compiler combination we're using is |
59 | | * compatible with the ABC extension. For instance, x86_64 with MSVC 2003 is |
60 | | * compatible with SSE2 but not SSE3, since although there exist x86_64 CPUs |
61 | | * with SSE3 support, MSVC 2003 only supports through SSE2. |
62 | | * |
63 | | * Until gcc fixes #pragma target [1] [2] or our x86 builds require SSE2, |
64 | | * you'll need to separate code using intrinsics into a file separate from your |
65 | | * regular code. Here's the recommended pattern: |
66 | | * |
67 | | * #ifdef MOZILLA_MAY_SUPPORT_ABC |
68 | | * namespace mozilla { |
69 | | * namespace ABC { |
70 | | * void foo(); |
71 | | * } |
72 | | * } |
73 | | * #endif |
74 | | * |
75 | | * void foo() { |
76 | | * #ifdef MOZILLA_MAY_SUPPORT_ABC |
77 | | * if (mozilla::supports_abc()) { |
78 | | * mozilla::ABC::foo(); // in a separate file |
79 | | * return; |
80 | | * } |
81 | | * #endif |
82 | | * |
83 | | * foo_unvectorized(); |
84 | | * } |
85 | | * |
86 | | * You'll need to define mozilla::ABC::foo() in a separate file and add the |
87 | | * -mabc flag when using gcc. |
88 | | * |
89 | | * [1] http://gcc.gnu.org/bugzilla/show_bug.cgi?id=39787 and |
90 | | * [2] http://gcc.gnu.org/bugzilla/show_bug.cgi?id=41201 being fixed. |
91 | | * |
92 | | */ |
93 | | |
94 | | #if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) |
95 | | |
96 | | #ifdef __MMX__ |
97 | | // It's ok to use MMX instructions based on the -march option (or |
98 | | // the default for x86_64 or for Intel Mac). |
99 | | #define MOZILLA_PRESUME_MMX 1 |
100 | | #endif |
101 | | #ifdef __SSE__ |
102 | | // It's ok to use SSE instructions based on the -march option (or |
103 | | // the default for x86_64 or for Intel Mac). |
104 | | #define MOZILLA_PRESUME_SSE 1 |
105 | | #endif |
106 | | #ifdef __SSE2__ |
107 | | // It's ok to use SSE2 instructions based on the -march option (or |
108 | | // the default for x86_64 or for Intel Mac). |
109 | | #define MOZILLA_PRESUME_SSE2 1 |
110 | | #endif |
111 | | #ifdef __SSE3__ |
112 | | // It's ok to use SSE3 instructions based on the -march option (or the |
113 | | // default for Intel Mac). |
114 | | #define MOZILLA_PRESUME_SSE3 1 |
115 | | #endif |
116 | | #ifdef __SSSE3__ |
117 | | // It's ok to use SSSE3 instructions based on the -march option. |
118 | | #define MOZILLA_PRESUME_SSSE3 1 |
119 | | #endif |
120 | | #ifdef __SSE4A__ |
121 | | // It's ok to use SSE4A instructions based on the -march option. |
122 | | #define MOZILLA_PRESUME_SSE4A 1 |
123 | | #endif |
124 | | #ifdef __SSE4_1__ |
125 | | // It's ok to use SSE4.1 instructions based on the -march option. |
126 | | #define MOZILLA_PRESUME_SSE4_1 1 |
127 | | #endif |
128 | | #ifdef __SSE4_2__ |
129 | | // It's ok to use SSE4.2 instructions based on the -march option. |
130 | | #define MOZILLA_PRESUME_SSE4_2 1 |
131 | | #endif |
132 | | #ifdef __AVX__ |
133 | | // It's ok to use AVX instructions based on the -march option. |
134 | | #define MOZILLA_PRESUME_AVX 1 |
135 | | #endif |
136 | | #ifdef __AVX2__ |
137 | | // It's ok to use AVX instructions based on the -march option. |
138 | | #define MOZILLA_PRESUME_AVX2 1 |
139 | | #endif |
140 | | #ifdef __AES__ |
141 | | // It's ok to use AES instructions based on the -march option. |
142 | | #define MOZILLA_PRESUME_AES 1 |
143 | | #endif |
144 | | |
145 | | |
146 | | |
147 | | #ifdef HAVE_CPUID_H |
148 | | #define MOZILLA_SSE_HAVE_CPUID_DETECTION |
149 | | #endif |
150 | | |
151 | | #elif defined(_MSC_VER) && (defined(_M_IX86) || defined(_M_AMD64)) |
152 | | |
153 | | #define MOZILLA_SSE_HAVE_CPUID_DETECTION |
154 | | |
155 | | #if defined(_M_IX86_FP) |
156 | | |
157 | | #if _M_IX86_FP >= 1 |
158 | | // It's ok to use SSE instructions based on the /arch option |
159 | | #define MOZILLA_PRESUME_SSE |
160 | | #endif |
161 | | #if _M_IX86_FP >= 2 |
162 | | // It's ok to use SSE2 instructions based on the /arch option |
163 | | #define MOZILLA_PRESUME_SSE2 |
164 | | #endif |
165 | | |
166 | | #elif defined(_M_AMD64) |
167 | | // MSVC for AMD64 doesn't support MMX, so don't presume it here. |
168 | | |
169 | | // SSE is always available on AMD64. |
170 | | #define MOZILLA_PRESUME_SSE |
171 | | // SSE2 is always available on AMD64. |
172 | | #define MOZILLA_PRESUME_SSE2 |
173 | | #endif |
174 | | |
175 | | #elif defined(__SUNPRO_CC) && (defined(__i386) || defined(__x86_64__)) |
176 | | // Sun Studio on x86 or amd64 |
177 | | |
178 | | #define MOZILLA_SSE_HAVE_CPUID_DETECTION |
179 | | |
180 | | #if defined(__x86_64__) |
181 | | // MMX is always available on AMD64. |
182 | | #define MOZILLA_PRESUME_MMX |
183 | | // SSE is always available on AMD64. |
184 | | #define MOZILLA_PRESUME_SSE |
185 | | // SSE2 is always available on AMD64. |
186 | | #define MOZILLA_PRESUME_SSE2 |
187 | | #endif |
188 | | |
189 | | #endif |
190 | | |
191 | | namespace mozilla { |
192 | | |
193 | | namespace sse_private { |
194 | | #if defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
195 | | #if !defined(MOZILLA_PRESUME_MMX) |
196 | | extern bool MFBT_DATA mmx_enabled; |
197 | | #endif |
198 | | #if !defined(MOZILLA_PRESUME_SSE) |
199 | | extern bool MFBT_DATA sse_enabled; |
200 | | #endif |
201 | | #if !defined(MOZILLA_PRESUME_SSE2) |
202 | | extern bool MFBT_DATA sse2_enabled; |
203 | | #endif |
204 | | #if !defined(MOZILLA_PRESUME_SSE3) |
205 | | extern bool MFBT_DATA sse3_enabled; |
206 | | #endif |
207 | | #if !defined(MOZILLA_PRESUME_SSSE3) |
208 | | extern bool MFBT_DATA ssse3_enabled; |
209 | | #endif |
210 | | #if !defined(MOZILLA_PRESUME_SSE4A) |
211 | | extern bool MFBT_DATA sse4a_enabled; |
212 | | #endif |
213 | | #if !defined(MOZILLA_PRESUME_SSE4_1) |
214 | | extern bool MFBT_DATA sse4_1_enabled; |
215 | | #endif |
216 | | #if !defined(MOZILLA_PRESUME_SSE4_2) |
217 | | extern bool MFBT_DATA sse4_2_enabled; |
218 | | #endif |
219 | | #if !defined(MOZILLA_PRESUME_AVX) |
220 | | extern bool MFBT_DATA avx_enabled; |
221 | | #endif |
222 | | #if !defined(MOZILLA_PRESUME_AVX2) |
223 | | extern bool MFBT_DATA avx2_enabled; |
224 | | #endif |
225 | | #if !defined(MOZILLA_PRESUME_AES) |
226 | | extern bool MFBT_DATA aes_enabled; |
227 | | #endif |
228 | | |
229 | | |
230 | | #endif |
231 | | } // namespace sse_private |
232 | | |
233 | | #if defined(MOZILLA_PRESUME_MMX) |
234 | | #define MOZILLA_MAY_SUPPORT_MMX 1 |
235 | 0 | inline bool supports_mmx() { return true; } |
236 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
237 | | #if !(defined(_MSC_VER) && defined(_M_AMD64)) |
238 | | // Define MOZILLA_MAY_SUPPORT_MMX only if we're not on MSVC for |
239 | | // AMD64, since that compiler doesn't support MMX. |
240 | | #define MOZILLA_MAY_SUPPORT_MMX 1 |
241 | | #endif |
242 | | inline bool supports_mmx() { return sse_private::mmx_enabled; } |
243 | | #else |
244 | | inline bool supports_mmx() { return false; } |
245 | | #endif |
246 | | |
247 | | #if defined(MOZILLA_PRESUME_SSE) |
248 | | #define MOZILLA_MAY_SUPPORT_SSE 1 |
249 | 0 | inline bool supports_sse() { return true; } |
250 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
251 | | #define MOZILLA_MAY_SUPPORT_SSE 1 |
252 | | inline bool supports_sse() { return sse_private::sse_enabled; } |
253 | | #else |
254 | | inline bool supports_sse() { return false; } |
255 | | #endif |
256 | | |
257 | | #if defined(MOZILLA_PRESUME_SSE2) |
258 | | #define MOZILLA_MAY_SUPPORT_SSE2 1 |
259 | 0 | inline bool supports_sse2() { return true; } |
260 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
261 | | #define MOZILLA_MAY_SUPPORT_SSE2 1 |
262 | | inline bool supports_sse2() { return sse_private::sse2_enabled; } |
263 | | #else |
264 | | inline bool supports_sse2() { return false; } |
265 | | #endif |
266 | | |
267 | | #if defined(MOZILLA_PRESUME_SSE3) |
268 | | #define MOZILLA_MAY_SUPPORT_SSE3 1 |
269 | | inline bool supports_sse3() { return true; } |
270 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
271 | | #define MOZILLA_MAY_SUPPORT_SSE3 1 |
272 | 0 | inline bool supports_sse3() { return sse_private::sse3_enabled; } |
273 | | #else |
274 | | inline bool supports_sse3() { return false; } |
275 | | #endif |
276 | | |
277 | | #if defined(MOZILLA_PRESUME_SSSE3) |
278 | | #define MOZILLA_MAY_SUPPORT_SSSE3 1 |
279 | | inline bool supports_ssse3() { return true; } |
280 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
281 | | #define MOZILLA_MAY_SUPPORT_SSSE3 1 |
282 | 0 | inline bool supports_ssse3() { return sse_private::ssse3_enabled; } |
283 | | #else |
284 | | inline bool supports_ssse3() { return false; } |
285 | | #endif |
286 | | |
287 | | #if defined(MOZILLA_PRESUME_SSE4A) |
288 | | #define MOZILLA_MAY_SUPPORT_SSE4A 1 |
289 | | inline bool supports_sse4a() { return true; } |
290 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
291 | | #define MOZILLA_MAY_SUPPORT_SSE4A 1 |
292 | 0 | inline bool supports_sse4a() { return sse_private::sse4a_enabled; } |
293 | | #else |
294 | | inline bool supports_sse4a() { return false; } |
295 | | #endif |
296 | | |
297 | | #if defined(MOZILLA_PRESUME_SSE4_1) |
298 | | #define MOZILLA_MAY_SUPPORT_SSE4_1 1 |
299 | | inline bool supports_sse4_1() { return true; } |
300 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
301 | | #define MOZILLA_MAY_SUPPORT_SSE4_1 1 |
302 | 0 | inline bool supports_sse4_1() { return sse_private::sse4_1_enabled; } |
303 | | #else |
304 | | inline bool supports_sse4_1() { return false; } |
305 | | #endif |
306 | | |
307 | | #if defined(MOZILLA_PRESUME_SSE4_2) |
308 | | #define MOZILLA_MAY_SUPPORT_SSE4_2 1 |
309 | | inline bool supports_sse4_2() { return true; } |
310 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
311 | | #define MOZILLA_MAY_SUPPORT_SSE4_2 1 |
312 | 0 | inline bool supports_sse4_2() { return sse_private::sse4_2_enabled; } |
313 | | #else |
314 | | inline bool supports_sse4_2() { return false; } |
315 | | #endif |
316 | | |
317 | | #if defined(MOZILLA_PRESUME_AVX) |
318 | | #define MOZILLA_MAY_SUPPORT_AVX 1 |
319 | | inline bool supports_avx() { return true; } |
320 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
321 | | #define MOZILLA_MAY_SUPPORT_AVX 1 |
322 | 0 | inline bool supports_avx() { return sse_private::avx_enabled; } |
323 | | #else |
324 | | inline bool supports_avx() { return false; } |
325 | | #endif |
326 | | |
327 | | #if defined(MOZILLA_PRESUME_AVX2) |
328 | | #define MOZILLA_MAY_SUPPORT_AVX2 1 |
329 | | inline bool supports_avx2() { return true; } |
330 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
331 | | #define MOZILLA_MAY_SUPPORT_AVX2 1 |
332 | 0 | inline bool supports_avx2() { return sse_private::avx2_enabled; } |
333 | | #else |
334 | | inline bool supports_avx2() { return false; } |
335 | | #endif |
336 | | |
337 | | #if defined(MOZILLA_PRESUME_AES) |
338 | | #define MOZILLA_MAY_SUPPORT_AES 1 |
339 | | inline bool supports_aes() { return true; } |
340 | | #elif defined(MOZILLA_SSE_HAVE_CPUID_DETECTION) |
341 | | #define MOZILLA_MAY_SUPPORT_AES 1 |
342 | 0 | inline bool supports_aes() { return sse_private::aes_enabled; } |
343 | | #else |
344 | | inline bool supports_aes() { return false; } |
345 | | #endif |
346 | | |
347 | | |
348 | | } // namespace mozilla |
349 | | |
350 | | #endif /* !defined(mozilla_SSE_h_) */ |