clang  12.0.0git
ia32intrin.h
Go to the documentation of this file.
1 /* ===-------- ia32intrin.h ---------------------------------------------------===
2  *
3  * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4  * See https://llvm.org/LICENSE.txt for license information.
5  * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6  *
7  *===-----------------------------------------------------------------------===
8  */
9 
10 #ifndef __X86INTRIN_H
11 #error "Never use <ia32intrin.h> directly; include <x86intrin.h> instead."
12 #endif
13 
14 #ifndef __IA32INTRIN_H
15 #define __IA32INTRIN_H
16 
/* Attribute sets used by the function definitions in this file:
 *   __DEFAULT_FN_ATTRS            always-inline, no debug info.
 *   __DEFAULT_FN_ATTRS_SSE42      as above, plus the "sse4.2" target feature.
 *   __DEFAULT_FN_ATTRS_CAST       always-inline; also constexpr in C++11 and
 *                                 later.
 *   __DEFAULT_FN_ATTRS_CONSTEXPR  __DEFAULT_FN_ATTRS; also constexpr in C++11
 *                                 and later.
 */
#define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__))
#define __DEFAULT_FN_ATTRS_SSE42                                               \
  __attribute__((__always_inline__, __nodebug__, __target__("sse4.2")))

#if !defined(__cplusplus) || (__cplusplus < 201103L)
/* C, or C++ before C++11: constexpr is not available. */
#define __DEFAULT_FN_ATTRS_CAST __attribute__((__always_inline__))
#define __DEFAULT_FN_ATTRS_CONSTEXPR __DEFAULT_FN_ATTRS
#else
#define __DEFAULT_FN_ATTRS_CAST __attribute__((__always_inline__)) constexpr
#define __DEFAULT_FN_ATTRS_CONSTEXPR __DEFAULT_FN_ATTRS constexpr
#endif
28 
29 /** Find the first set bit starting from the lsb. Result is undefined if
30  * input is 0.
31  *
32  * \headerfile <x86intrin.h>
33  *
34  * This intrinsic corresponds to the <c> BSF </c> instruction or the
35  * <c> TZCNT </c> instruction.
36  *
37  * \param __A
38  * A 32-bit integer operand.
39  * \returns A 32-bit integer containing the bit number.
40  */
41 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
42 __bsfd(int __A) {
43  return __builtin_ctz(__A);
44 }
45 
46 /** Find the first set bit starting from the msb. Result is undefined if
47  * input is 0.
48  *
49  * \headerfile <x86intrin.h>
50  *
51  * This intrinsic corresponds to the <c> BSR </c> instruction or the
52  * <c> LZCNT </c> instruction and an <c> XOR </c>.
53  *
54  * \param __A
55  * A 32-bit integer operand.
56  * \returns A 32-bit integer containing the bit number.
57  */
58 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
59 __bsrd(int __A) {
60  return 31 - __builtin_clz(__A);
61 }
62 
63 /** Swaps the bytes in the input. Converting little endian to big endian or
64  * vice versa.
65  *
66  * \headerfile <x86intrin.h>
67  *
68  * This intrinsic corresponds to the <c> BSWAP </c> instruction.
69  *
70  * \param __A
71  * A 32-bit integer operand.
72  * \returns A 32-bit integer containing the swapped bytes.
73  */
74 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
75 __bswapd(int __A) {
76  return __builtin_bswap32(__A);
77 }
78 
79 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
80 _bswap(int __A) {
81  return __builtin_bswap32(__A);
82 }
83 
/* Alternative spellings of the 32-bit bit-scan functions __bsfd and __bsrd. */
#define _bit_scan_forward(A) __bsfd((A))
#define _bit_scan_reverse(A) __bsrd((A))
86 
87 #ifdef __x86_64__
88 /** Find the first set bit starting from the lsb. Result is undefined if
89  * input is 0.
90  *
91  * \headerfile <x86intrin.h>
92  *
93  * This intrinsic corresponds to the <c> BSF </c> instruction or the
94  * <c> TZCNT </c> instruction.
95  *
96  * \param __A
97  * A 64-bit integer operand.
98  * \returns A 32-bit integer containing the bit number.
99  */
100 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
101 __bsfq(long long __A) {
102  return __builtin_ctzll(__A);
103 }
104 
105 /** Find the first set bit starting from the msb. Result is undefined if
106  * input is 0.
107  *
108  * \headerfile <x86intrin.h>
109  *
110  * This intrinsic corresponds to the <c> BSR </c> instruction or the
111  * <c> LZCNT </c> instruction and an <c> XOR </c>.
112  *
113  * \param __A
114  * A 64-bit integer operand.
115  * \returns A 32-bit integer containing the bit number.
116  */
117 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
118 __bsrq(long long __A) {
119  return 63 - __builtin_clzll(__A);
120 }
121 
122 /** Swaps the bytes in the input. Converting little endian to big endian or
123  * vice versa.
124  *
125  * \headerfile <x86intrin.h>
126  *
127  * This intrinsic corresponds to the <c> BSWAP </c> instruction.
128  *
129  * \param __A
130  * A 64-bit integer operand.
131  * \returns A 64-bit integer containing the swapped bytes.
132  */
133 static __inline__ long long __DEFAULT_FN_ATTRS_CONSTEXPR
134 __bswapq(long long __A) {
135  return __builtin_bswap64(__A);
136 }
137 
/* Alternative spelling of the 64-bit byte swap __bswapq. */
#define _bswap64(A) __bswapq((A))
139 #endif
140 
141 /** Counts the number of bits in the source operand having a value of 1.
142  *
143  * \headerfile <x86intrin.h>
144  *
145  * This intrinsic corresponds to the <c> POPCNT </c> instruction or a
146  * a sequence of arithmetic and logic ops to calculate it.
147  *
148  * \param __A
149  * An unsigned 32-bit integer operand.
150  * \returns A 32-bit integer containing the number of bits with value 1 in the
151  * source operand.
152  */
153 static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR
154 __popcntd(unsigned int __A)
155 {
156  return __builtin_popcount(__A);
157 }
158 
/* Alternative spelling of the 32-bit population count __popcntd. */
#define _popcnt32(A) __popcntd((A))
160 
161 #ifdef __x86_64__
162 /** Counts the number of bits in the source operand having a value of 1.
163  *
164  * \headerfile <x86intrin.h>
165  *
166  * This intrinsic corresponds to the <c> POPCNT </c> instruction or a
167  * a sequence of arithmetic and logic ops to calculate it.
168  *
169  * \param __A
170  * An unsigned 64-bit integer operand.
171  * \returns A 64-bit integer containing the number of bits with value 1 in the
172  * source operand.
173  */
174 static __inline__ long long __DEFAULT_FN_ATTRS_CONSTEXPR
175 __popcntq(unsigned long long __A)
176 {
177  return __builtin_popcountll(__A);
178 }
179 
/* Alternative spelling of the 64-bit population count __popcntq. */
#define _popcnt64(A) __popcntq((A))
181 #endif /* __x86_64__ */
182 
183 #ifdef __x86_64__
184 static __inline__ unsigned long long __DEFAULT_FN_ATTRS
185 __readeflags(void)
186 {
187  return __builtin_ia32_readeflags_u64();
188 }
189 
190 static __inline__ void __DEFAULT_FN_ATTRS
191 __writeeflags(unsigned long long __f)
192 {
193  __builtin_ia32_writeeflags_u64(__f);
194 }
195 
196 #else /* !__x86_64__ */
197 static __inline__ unsigned int __DEFAULT_FN_ATTRS
199 {
200  return __builtin_ia32_readeflags_u32();
201 }
202 
203 static __inline__ void __DEFAULT_FN_ATTRS
204 __writeeflags(unsigned int __f)
205 {
206  __builtin_ia32_writeeflags_u32(__f);
207 }
208 #endif /* !__x86_64__ */
209 
210 /** Cast a 32-bit float value to a 32-bit unsigned integer value
211  *
212  * \headerfile <x86intrin.h>
213  * This intrinsic corresponds to the <c> VMOVD / MOVD </c> instruction in x86_64,
214  * and corresponds to the <c> VMOVL / MOVL </c> instruction in ia32.
215  *
216  * \param __A
217  * A 32-bit float value.
218  * \returns a 32-bit unsigned integer containing the converted value.
219  */
220 static __inline__ unsigned int __DEFAULT_FN_ATTRS_CAST
221 _castf32_u32(float __A) {
222  return __builtin_bit_cast(unsigned int, __A);
223 }
224 
225 /** Cast a 64-bit float value to a 64-bit unsigned integer value
226  *
227  * \headerfile <x86intrin.h>
228  * This intrinsic corresponds to the <c> VMOVQ / MOVQ </c> instruction in x86_64,
229  * and corresponds to the <c> VMOVL / MOVL </c> instruction in ia32.
230  *
231  * \param __A
232  * A 64-bit float value.
233  * \returns a 64-bit unsigned integer containing the converted value.
234  */
235 static __inline__ unsigned long long __DEFAULT_FN_ATTRS_CAST
236 _castf64_u64(double __A) {
237  return __builtin_bit_cast(unsigned long long, __A);
238 }
239 
240 /** Cast a 32-bit unsigned integer value to a 32-bit float value
241  *
242  * \headerfile <x86intrin.h>
243  * This intrinsic corresponds to the <c> VMOVQ / MOVQ </c> instruction in x86_64,
244  * and corresponds to the <c> FLDS </c> instruction in ia32.
245  *
246  * \param __A
247  * A 32-bit unsigned integer value.
248  * \returns a 32-bit float value containing the converted value.
249  */
250 static __inline__ float __DEFAULT_FN_ATTRS_CAST
251 _castu32_f32(unsigned int __A) {
252  return __builtin_bit_cast(float, __A);
253 }
254 
255 /** Cast a 64-bit unsigned integer value to a 64-bit float value
256  *
257  * \headerfile <x86intrin.h>
258  * This intrinsic corresponds to the <c> VMOVQ / MOVQ </c> instruction in x86_64,
259  * and corresponds to the <c> FLDL </c> instruction in ia32.
260  *
261  * \param __A
262  * A 64-bit unsigned integer value.
263  * \returns a 64-bit float value containing the converted value.
264  */
265 static __inline__ double __DEFAULT_FN_ATTRS_CAST
266 _castu64_f64(unsigned long long __A) {
267  return __builtin_bit_cast(double, __A);
268 }
269 
270 /** Adds the unsigned integer operand to the CRC-32C checksum of the
271  * unsigned char operand.
272  *
273  * \headerfile <x86intrin.h>
274  *
275  * This intrinsic corresponds to the <c> CRC32B </c> instruction.
276  *
277  * \param __C
278  * An unsigned integer operand to add to the CRC-32C checksum of operand
279  * \a __D.
280  * \param __D
281  * An unsigned 8-bit integer operand used to compute the CRC-32C checksum.
282  * \returns The result of adding operand \a __C to the CRC-32C checksum of
283  * operand \a __D.
284  */
285 static __inline__ unsigned int __DEFAULT_FN_ATTRS_SSE42
286 __crc32b(unsigned int __C, unsigned char __D)
287 {
288  return __builtin_ia32_crc32qi(__C, __D);
289 }
290 
291 /** Adds the unsigned integer operand to the CRC-32C checksum of the
292  * unsigned short operand.
293  *
294  * \headerfile <x86intrin.h>
295  *
296  * This intrinsic corresponds to the <c> CRC32W </c> instruction.
297  *
298  * \param __C
299  * An unsigned integer operand to add to the CRC-32C checksum of operand
300  * \a __D.
301  * \param __D
302  * An unsigned 16-bit integer operand used to compute the CRC-32C checksum.
303  * \returns The result of adding operand \a __C to the CRC-32C checksum of
304  * operand \a __D.
305  */
306 static __inline__ unsigned int __DEFAULT_FN_ATTRS_SSE42
307 __crc32w(unsigned int __C, unsigned short __D)
308 {
309  return __builtin_ia32_crc32hi(__C, __D);
310 }
311 
312 /** Adds the unsigned integer operand to the CRC-32C checksum of the
313  * second unsigned integer operand.
314  *
315  * \headerfile <x86intrin.h>
316  *
317  * This intrinsic corresponds to the <c> CRC32D </c> instruction.
318  *
319  * \param __C
320  * An unsigned integer operand to add to the CRC-32C checksum of operand
321  * \a __D.
322  * \param __D
323  * An unsigned 32-bit integer operand used to compute the CRC-32C checksum.
324  * \returns The result of adding operand \a __C to the CRC-32C checksum of
325  * operand \a __D.
326  */
327 static __inline__ unsigned int __DEFAULT_FN_ATTRS_SSE42
328 __crc32d(unsigned int __C, unsigned int __D)
329 {
330  return __builtin_ia32_crc32si(__C, __D);
331 }
332 
333 #ifdef __x86_64__
334 /** Adds the unsigned integer operand to the CRC-32C checksum of the
335  * unsigned 64-bit integer operand.
336  *
337  * \headerfile <x86intrin.h>
338  *
339  * This intrinsic corresponds to the <c> CRC32Q </c> instruction.
340  *
341  * \param __C
342  * An unsigned integer operand to add to the CRC-32C checksum of operand
343  * \a __D.
344  * \param __D
345  * An unsigned 64-bit integer operand used to compute the CRC-32C checksum.
346  * \returns The result of adding operand \a __C to the CRC-32C checksum of
347  * operand \a __D.
348  */
349 static __inline__ unsigned long long __DEFAULT_FN_ATTRS_SSE42
350 __crc32q(unsigned long long __C, unsigned long long __D)
351 {
352  return __builtin_ia32_crc32di(__C, __D);
353 }
354 #endif /* __x86_64__ */
355 
356 static __inline__ unsigned long long __DEFAULT_FN_ATTRS
357 __rdpmc(int __A) {
358  return __builtin_ia32_rdpmc(__A);
359 }
360 
361 /* __rdtscp */
362 static __inline__ unsigned long long __DEFAULT_FN_ATTRS
363 __rdtscp(unsigned int *__A) {
364  return __builtin_ia32_rdtscp(__A);
365 }
366 
/* Single-underscore spellings that forward to __rdtsc and __rdpmc. */
#define _rdtsc() __rdtsc()

#define _rdpmc(A) __rdpmc(A)
370 
371 static __inline__ void __DEFAULT_FN_ATTRS
372 _wbinvd(void) {
373  __builtin_ia32_wbinvd();
374 }
375 
376 static __inline__ unsigned char __DEFAULT_FN_ATTRS_CONSTEXPR
377 __rolb(unsigned char __X, int __C) {
378  return __builtin_rotateleft8(__X, __C);
379 }
380 
381 static __inline__ unsigned char __DEFAULT_FN_ATTRS_CONSTEXPR
382 __rorb(unsigned char __X, int __C) {
383  return __builtin_rotateright8(__X, __C);
384 }
385 
386 static __inline__ unsigned short __DEFAULT_FN_ATTRS_CONSTEXPR
387 __rolw(unsigned short __X, int __C) {
388  return __builtin_rotateleft16(__X, __C);
389 }
390 
391 static __inline__ unsigned short __DEFAULT_FN_ATTRS_CONSTEXPR
392 __rorw(unsigned short __X, int __C) {
393  return __builtin_rotateright16(__X, __C);
394 }
395 
396 static __inline__ unsigned int __DEFAULT_FN_ATTRS_CONSTEXPR
397 __rold(unsigned int __X, int __C) {
398  return __builtin_rotateleft32(__X, __C);
399 }
400 
401 static __inline__ unsigned int __DEFAULT_FN_ATTRS_CONSTEXPR
402 __rord(unsigned int __X, int __C) {
403  return __builtin_rotateright32(__X, __C);
404 }
405 
406 #ifdef __x86_64__
407 static __inline__ unsigned long long __DEFAULT_FN_ATTRS_CONSTEXPR
408 __rolq(unsigned long long __X, int __C) {
409  return __builtin_rotateleft64(__X, __C);
410 }
411 
412 static __inline__ unsigned long long __DEFAULT_FN_ATTRS_CONSTEXPR
413 __rorq(unsigned long long __X, int __C) {
414  return __builtin_rotateright64(__X, __C);
415 }
416 #endif /* __x86_64__ */
417 
/* MSVC already provides _lrotl, _lrotr, _rotl and _rotr as builtins, so these
 * aliases are defined only for other compilers. */
#if !defined(_MSC_VER)
/* _lrotl/_lrotr rotate a long: use the 64-bit rotates when long is 64 bits
 * wide (__LP64__) and the 32-bit rotates otherwise. */
#if defined(__LP64__)
#define _lrotl(a,b) __rolq((a), (b))
#define _lrotr(a,b) __rorq((a), (b))
#else
#define _lrotl(a,b) __rold((a), (b))
#define _lrotr(a,b) __rord((a), (b))
#endif
/* _rotl/_rotr always use the 32-bit rotates. */
#define _rotl(a,b) __rold((a), (b))
#define _rotr(a,b) __rord((a), (b))
#endif /* !_MSC_VER */
431 
/* The 16-bit rotate aliases are not compiler builtins, so they have to be
 * defined in every mode. */
#define _rotwl(a,b) __rolw((a), (b))
#define _rotwr(a,b) __rorw((a), (b))
435 
/* The attribute helper macros are private to this header; remove them so
 * they are not visible after it has been included. */
#undef __DEFAULT_FN_ATTRS_CONSTEXPR
#undef __DEFAULT_FN_ATTRS_SSE42
#undef __DEFAULT_FN_ATTRS_CAST
#undef __DEFAULT_FN_ATTRS
440 
441 #endif /* __IA32INTRIN_H */
static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR _bswap(int __A)
Definition: ia32intrin.h:80
static __inline__ unsigned int __DEFAULT_FN_ATTRS_CONSTEXPR __rord(unsigned int __X, int __C)
Definition: ia32intrin.h:402
static __inline__ unsigned int __DEFAULT_FN_ATTRS __readeflags(void)
Definition: ia32intrin.h:198
static __inline__ float __DEFAULT_FN_ATTRS_CAST _castu32_f32(unsigned int __A)
Cast a 32-bit unsigned integer value to a 32-bit float value.
Definition: ia32intrin.h:251
static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR __bswapd(int __A)
Swaps the bytes in the input.
Definition: ia32intrin.h:75
static __inline__ void short __D
Definition: immintrin.h:351
#define __DEFAULT_FN_ATTRS_CAST
Definition: ia32intrin.h:25
static __inline__ unsigned int __DEFAULT_FN_ATTRS_CONSTEXPR __rold(unsigned int __X, int __C)
Definition: ia32intrin.h:397
static __inline__ unsigned int __DEFAULT_FN_ATTRS_CAST _castf32_u32(float __A)
Cast a 32-bit float value to a 32-bit unsigned integer value.
Definition: ia32intrin.h:221
static __inline__ unsigned int __DEFAULT_FN_ATTRS_SSE42 __crc32b(unsigned int __C, unsigned char __D)
Adds the unsigned integer operand to the CRC-32C checksum of the unsigned char operand.
Definition: ia32intrin.h:286
static __inline__ unsigned int __DEFAULT_FN_ATTRS_SSE42 __crc32d(unsigned int __C, unsigned int __D)
Adds the unsigned integer operand to the CRC-32C checksum of the second unsigned integer operand.
Definition: ia32intrin.h:328
static __inline__ unsigned short __DEFAULT_FN_ATTRS_CONSTEXPR __rorw(unsigned short __X, int __C)
Definition: ia32intrin.h:392
static __inline__ void __DEFAULT_FN_ATTRS __writeeflags(unsigned int __f)
Definition: ia32intrin.h:204
static __inline__ unsigned long long __DEFAULT_FN_ATTRS __rdtscp(unsigned int *__A)
Definition: ia32intrin.h:363
static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR __popcntd(unsigned int __A)
Counts the number of bits in the source operand having a value of 1.
Definition: ia32intrin.h:154
static __inline__ unsigned long long __DEFAULT_FN_ATTRS_CAST _castf64_u64(double __A)
Cast a 64-bit float value to a 64-bit unsigned integer value.
Definition: ia32intrin.h:236
#define __DEFAULT_FN_ATTRS_SSE42
Definition: ia32intrin.h:19
#define __DEFAULT_FN_ATTRS_CONSTEXPR
Definition: ia32intrin.h:26
static __inline__ unsigned char __DEFAULT_FN_ATTRS_CONSTEXPR __rolb(unsigned char __X, int __C)
Definition: ia32intrin.h:377
static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR __bsfd(int __A)
Find the first set bit starting from the lsb.
Definition: ia32intrin.h:42
static __inline__ int __DEFAULT_FN_ATTRS_CONSTEXPR __bsrd(int __A)
Find the first set bit starting from the msb.
Definition: ia32intrin.h:59
static __inline__ unsigned short __DEFAULT_FN_ATTRS_CONSTEXPR __rolw(unsigned short __X, int __C)
Definition: ia32intrin.h:387
static __inline__ unsigned int __DEFAULT_FN_ATTRS_SSE42 __crc32w(unsigned int __C, unsigned short __D)
Adds the unsigned integer operand to the CRC-32C checksum of the unsigned short operand.
Definition: ia32intrin.h:307
#define __DEFAULT_FN_ATTRS
Definition: ia32intrin.h:18
static __inline__ unsigned long long __DEFAULT_FN_ATTRS __rdpmc(int __A)
Definition: ia32intrin.h:357
static __inline__ double __DEFAULT_FN_ATTRS_CAST _castu64_f64(unsigned long long __A)
Cast a 64-bit unsigned integer value to a 64-bit float value.
Definition: ia32intrin.h:266
static __inline__ void __DEFAULT_FN_ATTRS _wbinvd(void)
Definition: ia32intrin.h:372
static __inline__ unsigned char __DEFAULT_FN_ATTRS_CONSTEXPR __rorb(unsigned char __X, int __C)
Definition: ia32intrin.h:382