1 /*===---- bmi2intrin.h - BMI2 intrinsics -----------------------------------===
2  *
3  * Permission is hereby granted, free of charge, to any person obtaining a copy
4  * of this software and associated documentation files (the "Software"), to deal
5  * in the Software without restriction, including without limitation the rights
6  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7  * copies of the Software, and to permit persons to whom the Software is
8  * furnished to do so, subject to the following conditions:
9  *
10  * The above copyright notice and this permission notice shall be included in
11  * all copies or substantial portions of the Software.
12  *
13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19  * THE SOFTWARE.
20  *
21  *===-----------------------------------------------------------------------===
22  */
23 
24 #if !defined __X86INTRIN_H && !defined __IMMINTRIN_H
25 #error "Never use <bmi2intrin.h> directly; include <x86intrin.h> instead."
26 #endif
27 
28 #ifndef __BMI2__
29 # error "BMI2 instruction set not enabled"
30 #endif /* __BMI2__ */
31 
32 #ifndef __BMI2INTRIN_H
33 #define __BMI2INTRIN_H
34 
/* Forwards __X and __Y, unchanged and in that order, to the compiler builtin
 * __builtin_ia32_bzhi_si and returns the builtin's result.
 *
 * NOTE(review): the builtin presumably lowers to the BMI2 BZHI instruction
 * (__X with the bits at index __Y and above cleared) -- confirm against the
 * Intel SDM before relying on this description.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_bzhi_u32(unsigned int __X, unsigned int __Y)
{
  return __builtin_ia32_bzhi_si(__X, __Y);
}
40 
/* Forwards __X and __Y, unchanged and in that order, to the compiler builtin
 * __builtin_ia32_pdep_si and returns the builtin's result.
 *
 * NOTE(review): the builtin presumably lowers to the BMI2 PDEP instruction
 * (low-order bits of __X deposited at the bit positions set in mask __Y) --
 * confirm against the Intel SDM before relying on this description.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_pdep_u32(unsigned int __X, unsigned int __Y)
{
  return __builtin_ia32_pdep_si(__X, __Y);
}
46 
/* Forwards __X and __Y, unchanged and in that order, to the compiler builtin
 * __builtin_ia32_pext_si and returns the builtin's result.
 *
 * NOTE(review): the builtin presumably lowers to the BMI2 PEXT instruction
 * (bits of __X selected by mask __Y packed into the low-order result bits) --
 * confirm against the Intel SDM before relying on this description.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_pext_u32(unsigned int __X, unsigned int __Y)
{
  return __builtin_ia32_pext_si(__X, __Y);
}
52 
53 #ifdef  __x86_64__
54 
/* 64-bit counterpart of _bzhi_u32: forwards __X and __Y, unchanged and in
 * that order, to the compiler builtin __builtin_ia32_bzhi_di and returns the
 * builtin's result.
 *
 * NOTE(review): the builtin presumably lowers to the 64-bit form of the BMI2
 * BZHI instruction -- confirm against the Intel SDM.
 */
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__))
_bzhi_u64(unsigned long long __X, unsigned long long __Y)
{
  return __builtin_ia32_bzhi_di(__X, __Y);
}
60 
/* 64-bit counterpart of _pdep_u32: forwards __X and __Y, unchanged and in
 * that order, to the compiler builtin __builtin_ia32_pdep_di and returns the
 * builtin's result.
 *
 * NOTE(review): the builtin presumably lowers to the 64-bit form of the BMI2
 * PDEP instruction -- confirm against the Intel SDM.
 */
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__))
_pdep_u64(unsigned long long __X, unsigned long long __Y)
{
  return __builtin_ia32_pdep_di(__X, __Y);
}
66 
/* 64-bit counterpart of _pext_u32: forwards __X and __Y, unchanged and in
 * that order, to the compiler builtin __builtin_ia32_pext_di and returns the
 * builtin's result.
 *
 * NOTE(review): the builtin presumably lowers to the 64-bit form of the BMI2
 * PEXT instruction -- confirm against the Intel SDM.
 */
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__))
_pext_u64(unsigned long long __X, unsigned long long __Y)
{
  return __builtin_ia32_pext_di(__X, __Y);
}
72 
/* Unsigned 64 x 64 -> 128-bit multiply.
 *
 * __X, __Y: the two factors.
 * __P:      destination for the upper 64 bits of the product; it is written
 *           unconditionally, so it must point to writable storage.
 *
 * Returns the lower 64 bits of the product.
 */
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__))
_mulx_u64(unsigned long long __X, unsigned long long __Y,
          unsigned long long *__P)
{
  /* Widen one operand first so the multiplication is carried out in 128 bits
     and the high half is not lost. */
  unsigned __int128 __res = (unsigned __int128) __X * __Y;
  *__P = (unsigned long long) (__res >> 64);
  return (unsigned long long) __res;
}
81 
82 #else /* !__x86_64__ */
83 
/* Unsigned 32 x 32 -> 64-bit multiply.
 *
 * __X, __Y: the two factors.
 * __P:      destination for the upper 32 bits of the product; it is written
 *           unconditionally, so it must point to writable storage.
 *
 * Returns the lower 32 bits of the product.
 *
 * NOTE(review): this definition sits in the !__x86_64__ branch of the
 * enclosing conditional, so x86_64 builds get no _mulx_u32 from this header.
 * Confirm whether it should be hoisted out of the conditional.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_mulx_u32(unsigned int __X, unsigned int __Y, unsigned int *__P)
{
  /* Widen one operand first so the multiplication is carried out in 64 bits
     and the high half is not lost. */
  unsigned long long __res = (unsigned long long) __X * __Y;
  *__P = (unsigned int) (__res >> 32);
  return (unsigned int) __res;
}
91 
92 #endif /* !__x86_64__  */
93 
94 #endif /* __BMI2INTRIN_H */
95