/*===---- tbmintrin.h - TBM intrinsics -------------------------------------===
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 *===-----------------------------------------------------------------------===
 */
23*67e74705SXin Li
24*67e74705SXin Li #ifndef __X86INTRIN_H
25*67e74705SXin Li #error "Never use <tbmintrin.h> directly; include <x86intrin.h> instead."
26*67e74705SXin Li #endif
27*67e74705SXin Li
28*67e74705SXin Li #ifndef __TBMINTRIN_H
29*67e74705SXin Li #define __TBMINTRIN_H
30*67e74705SXin Li
/* Define the default attributes for the functions in this file:
 *   __always_inline__  - force each wrapper to be inlined at its call site,
 *   __nodebug__        - emit no debug info for the wrappers themselves,
 *   __target__("tbm")  - compile the wrappers with the TBM feature enabled.
 * The macro is #undef'd again at the end of this header.
 */
#define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__, __target__("tbm")))
33*67e74705SXin Li
/* 32-bit bit-field extract: forwards both operands, cast to unsigned int, to
 * __builtin_ia32_bextri_u32 and yields the result as unsigned int.
 *
 * NOTE(review): `b` is presumably the BEXTR control word and likely has to be
 * a compile-time constant (which would explain why this is a macro rather than
 * an inline function) - confirm against the TBM documentation.
 */
#define __bextri_u32(a, b) \
  ((unsigned int)__builtin_ia32_bextri_u32((unsigned int)(a), \
                                           (unsigned int)(b)))
37*67e74705SXin Li
38*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blcfill_u32(unsigned int __a)39*67e74705SXin Li __blcfill_u32(unsigned int __a)
40*67e74705SXin Li {
41*67e74705SXin Li return __a & (__a + 1);
42*67e74705SXin Li }
43*67e74705SXin Li
44*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blci_u32(unsigned int __a)45*67e74705SXin Li __blci_u32(unsigned int __a)
46*67e74705SXin Li {
47*67e74705SXin Li return __a | ~(__a + 1);
48*67e74705SXin Li }
49*67e74705SXin Li
50*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blcic_u32(unsigned int __a)51*67e74705SXin Li __blcic_u32(unsigned int __a)
52*67e74705SXin Li {
53*67e74705SXin Li return ~__a & (__a + 1);
54*67e74705SXin Li }
55*67e74705SXin Li
56*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blcmsk_u32(unsigned int __a)57*67e74705SXin Li __blcmsk_u32(unsigned int __a)
58*67e74705SXin Li {
59*67e74705SXin Li return __a ^ (__a + 1);
60*67e74705SXin Li }
61*67e74705SXin Li
62*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blcs_u32(unsigned int __a)63*67e74705SXin Li __blcs_u32(unsigned int __a)
64*67e74705SXin Li {
65*67e74705SXin Li return __a | (__a + 1);
66*67e74705SXin Li }
67*67e74705SXin Li
68*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blsfill_u32(unsigned int __a)69*67e74705SXin Li __blsfill_u32(unsigned int __a)
70*67e74705SXin Li {
71*67e74705SXin Li return __a | (__a - 1);
72*67e74705SXin Li }
73*67e74705SXin Li
74*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__blsic_u32(unsigned int __a)75*67e74705SXin Li __blsic_u32(unsigned int __a)
76*67e74705SXin Li {
77*67e74705SXin Li return ~__a | (__a - 1);
78*67e74705SXin Li }
79*67e74705SXin Li
80*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__t1mskc_u32(unsigned int __a)81*67e74705SXin Li __t1mskc_u32(unsigned int __a)
82*67e74705SXin Li {
83*67e74705SXin Li return ~__a | (__a + 1);
84*67e74705SXin Li }
85*67e74705SXin Li
86*67e74705SXin Li static __inline__ unsigned int __DEFAULT_FN_ATTRS
__tzmsk_u32(unsigned int __a)87*67e74705SXin Li __tzmsk_u32(unsigned int __a)
88*67e74705SXin Li {
89*67e74705SXin Li return ~__a & (__a - 1);
90*67e74705SXin Li }
91*67e74705SXin Li
92*67e74705SXin Li #ifdef __x86_64__
93*67e74705SXin Li #define __bextri_u64(a, b) \
94*67e74705SXin Li ((unsigned long long)__builtin_ia32_bextri_u64((unsigned long long)(a), \
95*67e74705SXin Li (unsigned long long)(b)))
96*67e74705SXin Li
97*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blcfill_u64(unsigned long long __a)98*67e74705SXin Li __blcfill_u64(unsigned long long __a)
99*67e74705SXin Li {
100*67e74705SXin Li return __a & (__a + 1);
101*67e74705SXin Li }
102*67e74705SXin Li
103*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blci_u64(unsigned long long __a)104*67e74705SXin Li __blci_u64(unsigned long long __a)
105*67e74705SXin Li {
106*67e74705SXin Li return __a | ~(__a + 1);
107*67e74705SXin Li }
108*67e74705SXin Li
109*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blcic_u64(unsigned long long __a)110*67e74705SXin Li __blcic_u64(unsigned long long __a)
111*67e74705SXin Li {
112*67e74705SXin Li return ~__a & (__a + 1);
113*67e74705SXin Li }
114*67e74705SXin Li
115*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blcmsk_u64(unsigned long long __a)116*67e74705SXin Li __blcmsk_u64(unsigned long long __a)
117*67e74705SXin Li {
118*67e74705SXin Li return __a ^ (__a + 1);
119*67e74705SXin Li }
120*67e74705SXin Li
121*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blcs_u64(unsigned long long __a)122*67e74705SXin Li __blcs_u64(unsigned long long __a)
123*67e74705SXin Li {
124*67e74705SXin Li return __a | (__a + 1);
125*67e74705SXin Li }
126*67e74705SXin Li
127*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blsfill_u64(unsigned long long __a)128*67e74705SXin Li __blsfill_u64(unsigned long long __a)
129*67e74705SXin Li {
130*67e74705SXin Li return __a | (__a - 1);
131*67e74705SXin Li }
132*67e74705SXin Li
133*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__blsic_u64(unsigned long long __a)134*67e74705SXin Li __blsic_u64(unsigned long long __a)
135*67e74705SXin Li {
136*67e74705SXin Li return ~__a | (__a - 1);
137*67e74705SXin Li }
138*67e74705SXin Li
139*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__t1mskc_u64(unsigned long long __a)140*67e74705SXin Li __t1mskc_u64(unsigned long long __a)
141*67e74705SXin Li {
142*67e74705SXin Li return ~__a | (__a + 1);
143*67e74705SXin Li }
144*67e74705SXin Li
145*67e74705SXin Li static __inline__ unsigned long long __DEFAULT_FN_ATTRS
__tzmsk_u64(unsigned long long __a)146*67e74705SXin Li __tzmsk_u64(unsigned long long __a)
147*67e74705SXin Li {
148*67e74705SXin Li return ~__a & (__a - 1);
149*67e74705SXin Li }
150*67e74705SXin Li #endif
151*67e74705SXin Li
152*67e74705SXin Li #undef __DEFAULT_FN_ATTRS
153*67e74705SXin Li
154*67e74705SXin Li #endif /* __TBMINTRIN_H */
155