xref: /aosp_15_r20/external/mesa3d/src/util/bitscan.h (revision 6104692788411f58d303aa86923a9ff6ecaded22)
1*61046927SAndroid Build Coastguard Worker /**************************************************************************
2*61046927SAndroid Build Coastguard Worker  *
3*61046927SAndroid Build Coastguard Worker  * Copyright 2008 VMware, Inc.
4*61046927SAndroid Build Coastguard Worker  * All Rights Reserved.
5*61046927SAndroid Build Coastguard Worker  *
6*61046927SAndroid Build Coastguard Worker  * Permission is hereby granted, free of charge, to any person obtaining a
7*61046927SAndroid Build Coastguard Worker  * copy of this software and associated documentation files (the
8*61046927SAndroid Build Coastguard Worker  * "Software"), to deal in the Software without restriction, including
9*61046927SAndroid Build Coastguard Worker  * without limitation the rights to use, copy, modify, merge, publish,
10*61046927SAndroid Build Coastguard Worker  * distribute, sub license, and/or sell copies of the Software, and to
11*61046927SAndroid Build Coastguard Worker  * permit persons to whom the Software is furnished to do so, subject to
12*61046927SAndroid Build Coastguard Worker  * the following conditions:
13*61046927SAndroid Build Coastguard Worker  *
14*61046927SAndroid Build Coastguard Worker  * The above copyright notice and this permission notice (including the
15*61046927SAndroid Build Coastguard Worker  * next paragraph) shall be included in all copies or substantial portions
16*61046927SAndroid Build Coastguard Worker  * of the Software.
17*61046927SAndroid Build Coastguard Worker  *
18*61046927SAndroid Build Coastguard Worker  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19*61046927SAndroid Build Coastguard Worker  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20*61046927SAndroid Build Coastguard Worker  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21*61046927SAndroid Build Coastguard Worker  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22*61046927SAndroid Build Coastguard Worker  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23*61046927SAndroid Build Coastguard Worker  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24*61046927SAndroid Build Coastguard Worker  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25*61046927SAndroid Build Coastguard Worker  *
26*61046927SAndroid Build Coastguard Worker  **************************************************************************/
27*61046927SAndroid Build Coastguard Worker 
28*61046927SAndroid Build Coastguard Worker 
29*61046927SAndroid Build Coastguard Worker #ifndef BITSCAN_H
30*61046927SAndroid Build Coastguard Worker #define BITSCAN_H
31*61046927SAndroid Build Coastguard Worker 
32*61046927SAndroid Build Coastguard Worker #include <assert.h>
33*61046927SAndroid Build Coastguard Worker #include <stdint.h>
34*61046927SAndroid Build Coastguard Worker #include <stdbool.h>
35*61046927SAndroid Build Coastguard Worker #include <string.h>
36*61046927SAndroid Build Coastguard Worker 
37*61046927SAndroid Build Coastguard Worker #if defined(_MSC_VER)
38*61046927SAndroid Build Coastguard Worker #include <intrin.h>
39*61046927SAndroid Build Coastguard Worker #endif
40*61046927SAndroid Build Coastguard Worker 
41*61046927SAndroid Build Coastguard Worker #if defined(__POPCNT__)
42*61046927SAndroid Build Coastguard Worker #include <popcntintrin.h>
43*61046927SAndroid Build Coastguard Worker #endif
44*61046927SAndroid Build Coastguard Worker 
45*61046927SAndroid Build Coastguard Worker #include "macros.h"
46*61046927SAndroid Build Coastguard Worker 
47*61046927SAndroid Build Coastguard Worker #ifdef __cplusplus
48*61046927SAndroid Build Coastguard Worker extern "C" {
49*61046927SAndroid Build Coastguard Worker #endif
50*61046927SAndroid Build Coastguard Worker 
51*61046927SAndroid Build Coastguard Worker 
/**
 * ffs(): report the 1-based position of the lowest set bit of a word.
 * The least significant bit is position 1; the result is 0 when the
 * argument has no bits set.
 *
 * The compiler builtin is used when the build detected one, an
 * intrinsic-based implementation is supplied for MSVC, and otherwise an
 * externally provided ffs() is expected.
 */
#ifdef HAVE___BUILTIN_FFS
#define ffs __builtin_ffs
#elif defined(_MSC_VER) && (_M_IX86 || _M_ARM || _M_AMD64 || _M_IA64)
static inline int
ffs(int i)
{
   unsigned long bit_pos;

   /* A zero return from the intrinsic means no set bit was found. */
   if (!_BitScanForward(&bit_pos, i))
      return 0;

   return bit_pos + 1;
}
#else
extern int
ffs(int i);
#endif
72*61046927SAndroid Build Coastguard Worker 
/**
 * ffsll(): 64-bit flavour of ffs().  Reports the 1-based position of the
 * lowest set bit of a long long, or 0 when no bit is set.
 *
 * The compiler builtin is used when the build detected one, an
 * intrinsic-based implementation is supplied for 64-bit MSVC targets, and
 * otherwise an externally provided ffsll() is expected.
 */
#ifdef HAVE___BUILTIN_FFSLL
#define ffsll __builtin_ffsll
#elif defined(_MSC_VER) && (_M_AMD64 || _M_ARM64 || _M_IA64)
static inline int
ffsll(long long int i)
{
   unsigned long bit_pos;

   /* A zero return from the intrinsic means no set bit was found. */
   if (!_BitScanForward64(&bit_pos, i))
      return 0;

   return bit_pos + 1;
}
#else
extern int
ffsll(long long int val);
#endif
89*61046927SAndroid Build Coastguard Worker 
90*61046927SAndroid Build Coastguard Worker 
/* Destructively loop over all of the bits in a mask as in:
 *
 * while (mymask) {
 *   int i = u_bit_scan(&mymask);
 *   ... process element i
 * }
 *
 * Returns the zero-based index of the lowest set bit of *mask and clears
 * that bit in *mask.  If *mask is zero, -1 is returned and *mask is left
 * unchanged.
 */
static inline int
u_bit_scan(unsigned *mask)
{
   const int i = ffs(*mask) - 1;

   /* Clear the lowest set bit without shifting by i: for an empty mask i is
    * -1 and "1u << i" would be undefined behavior, whereas "m & (m - 1)"
    * simply leaves zero as zero.
    */
   *mask &= *mask - 1;
   return i;
}
106*61046927SAndroid Build Coastguard Worker 
/* Iterate over the set bits of a 32-bit value, lowest bit first:
 *
 * u_foreach_bit(i, mask) {
 *   ... process bit index i
 * }
 *
 * "b" is declared by the macro as a uint32_t scoped to the loop, and
 * "dword" is evaluated exactly once.
 *
 * The bit being cleared is built from an unsigned one: "1 << 31" would
 * overflow a signed int when bit 31 of the value is set.
 */
#define u_foreach_bit(b, dword)                          \
   for (uint32_t __dword = (dword), b;                   \
        ((b) = ffs(__dword) - 1, __dword);               \
        __dword &= ~(1u << (b)))
111*61046927SAndroid Build Coastguard Worker 
/* 64-bit version of u_bit_scan().
 *
 * Returns the zero-based index of the lowest set bit of *mask and clears
 * that bit in *mask.  If *mask is zero, -1 is returned and *mask is left
 * unchanged.
 */
static inline int
u_bit_scan64(uint64_t *mask)
{
   const int i = ffsll(*mask) - 1;

   /* Clear the lowest set bit without shifting by i: for an empty mask i is
    * -1 and shifting by it would be undefined behavior, whereas
    * "m & (m - 1)" simply leaves zero as zero.
    */
   *mask &= *mask - 1;
   return i;
}
119*61046927SAndroid Build Coastguard Worker 
/* Iterate over the set bits of a 64-bit value, lowest bit first:
 *
 * u_foreach_bit64(i, mask) {
 *   ... process bit index i
 * }
 *
 * "b" is declared by the macro as a uint64_t scoped to the loop, and
 * "dword" is evaluated exactly once.
 */
#define u_foreach_bit64(b, dword)                        \
   for (uint64_t __dword = (dword), b;                   \
        ((b) = ffsll(__dword) - 1, __dword);             \
        __dword &= ~(((uint64_t)1) << (b)))
124*61046927SAndroid Build Coastguard Worker 
/* Test whether a uint32_t value is a power of two.
 *
 * \note
 * Zero is accepted as well, i.e. it is treated as a power of two.
 */
static inline bool
util_is_power_of_two_or_zero(uint32_t v)
{
   const bool pot_or_zero = IS_POT(v);

   return pot_or_zero;
}
135*61046927SAndroid Build Coastguard Worker 
/* Test whether a uint64_t value is a power of two.
 *
 * \note
 * Zero is accepted as well, i.e. it is treated as a power of two.
 */
static inline bool
util_is_power_of_two_or_zero64(uint64_t v)
{
   const bool pot_or_zero = IS_POT(v);

   return pot_or_zero;
}
146*61046927SAndroid Build Coastguard Worker 
/* Test whether a uint32_t value is a power of two.
 *
 * \note
 * Zero is \b not treated as a power of two.
 */
static inline bool
util_is_power_of_two_nonzero(uint32_t v)
{
   /* Note that __POPCNT__ and HAVE___BUILTIN_POPCOUNT mean different things.
    * HAVE___BUILTIN_POPCOUNT only says that the __builtin_popcount function
    * exists, while __POPCNT__ says that _mm_popcnt_u32 exists and is a
    * native instruction.
    *
    * Keying this on SSE 4.2 compile-time flags instead has two drawbacks.
    * First, there is currently no build infrastructure for SSE 4.2 (only
    * 4.1), so that would have to be added.  Second, some AMD CPUs support
    * POPCNT but not SSE 4.2 (e.g., Barcelona).
    */
#ifdef __POPCNT__
   const bool single_bit = (_mm_popcnt_u32(v) == 1);
#else
   const bool single_bit = IS_POT_NONZERO(v);
#endif

   return single_bit;
}
170*61046927SAndroid Build Coastguard Worker 
/* Test whether a uint64_t value is a power of two.
 *
 * \note
 * Zero is \b not treated as a power of two.
 */
static inline bool
util_is_power_of_two_nonzero64(uint64_t v)
{
   const bool single_bit = IS_POT_NONZERO(v);

   return single_bit;
}
181*61046927SAndroid Build Coastguard Worker 
/* Test whether a pointer-sized integer (size_t/uintptr_t/intptr_t) value is
 * a power of two.
 *
 * \note
 * Zero is \b not treated as a power of two.
 */
static inline bool
util_is_power_of_two_nonzero_uintptr(uintptr_t v)
{
   const bool single_bit = IS_POT_NONZERO(v);

   return single_bit;
}
192*61046927SAndroid Build Coastguard Worker 
/* For looping over a bitmask when you want to loop over consecutive bits
 * manually, for example:
 *
 * while (mask) {
 *    int start, count, i;
 *
 *    u_bit_scan_consecutive_range(&mask, &start, &count);
 *
 *    for (i = 0; i < count; i++)
 *       ... process element (start+i)
 * }
 *
 * On return *start holds the index of the lowest set bit, *count the length
 * of the run of set bits beginning there, and that run has been cleared
 * from *mask.  For an empty mask the result is *start = -1, *count = 0 and
 * *mask stays zero.
 */
static inline void
u_bit_scan_consecutive_range(unsigned *mask, int *start, int *count)
{
   /* ffs(0) - 1 is -1, and shifting by a negative amount is undefined, so
    * the empty mask is reported as an empty range up front.
    */
   if (*mask == 0) {
      *start = -1;
      *count = 0;
      return;
   }

   /* A completely filled mask needs a run length of 32, which the shifts
    * below cannot express ("1u << 32" is undefined).
    */
   if (*mask == 0xffffffff) {
      *start = 0;
      *count = 32;
      *mask = 0;
      return;
   }

   *start = ffs(*mask) - 1;
   /* After shifting the run down to bit 0, its length is the position of the
    * first zero bit, i.e. the first set bit of the complement.
    */
   *count = ffs(~(*mask >> *start)) - 1;
   *mask &= ~(((1u << *count) - 1) << *start);
}
218*61046927SAndroid Build Coastguard Worker 
/* 64-bit version of u_bit_scan_consecutive_range().
 *
 * On return *start holds the index of the lowest set bit, *count the length
 * of the run of set bits beginning there, and that run has been cleared
 * from *mask.  For an empty mask the result is *start = -1, *count = 0 and
 * *mask stays zero.
 */
static inline void
u_bit_scan_consecutive_range64(uint64_t *mask, int *start, int *count)
{
   /* ffsll(0) - 1 is -1, and shifting by a negative amount is undefined, so
    * the empty mask is reported as an empty range up front.
    */
   if (*mask == 0) {
      *start = -1;
      *count = 0;
      return;
   }

   /* A completely filled mask needs a run length of 64, which the shifts
    * below cannot express (shifting a 64-bit one by 64 is undefined).
    */
   if (*mask == ~0ull) {
      *start = 0;
      *count = 64;
      *mask = 0;
      return;
   }

   *start = ffsll(*mask) - 1;
   /* After shifting the run down to bit 0, its length is the position of the
    * first zero bit, i.e. the first set bit of the complement.
    */
   *count = ffsll(~(*mask >> *start)) - 1;
   *mask &= ~(((((uint64_t)1) << *count) - 1) << *start);
}
232*61046927SAndroid Build Coastguard Worker 
233*61046927SAndroid Build Coastguard Worker 
/**
 * Locate the most significant set bit of a word, counting the least
 * significant bit as position 1.
 * The result is 0 when the word has no bits set.
 * This is ffs() scanning from the other end.
 */
static inline unsigned
util_last_bit(unsigned u)
{
#if defined(HAVE___BUILTIN_CLZ)
   if (u == 0)
      return 0;

   return 32 - __builtin_clz(u);
#elif defined(_MSC_VER) && (_M_IX86 || _M_ARM || _M_AMD64 || _M_IA64)
   unsigned long top;

   if (!_BitScanReverse(&top, u))
      return 0;

   return top + 1;
#else
   /* Portable fallback: count how many right shifts empty the word. */
   unsigned pos;

   for (pos = 0; u != 0; u >>= 1)
      pos++;

   return pos;
#endif
}
259*61046927SAndroid Build Coastguard Worker 
/**
 * Locate the most significant set bit of a 64-bit word, counting the least
 * significant bit as position 1.
 * The result is 0 when the word has no bits set.
 * This is ffsll() scanning from the other end.
 */
static inline unsigned
util_last_bit64(uint64_t u)
{
#if defined(HAVE___BUILTIN_CLZLL)
   if (u == 0)
      return 0;

   return 64 - __builtin_clzll(u);
#elif defined(_MSC_VER) && (_M_AMD64 || _M_ARM64 || _M_IA64)
   unsigned long top;

   if (!_BitScanReverse64(&top, u))
      return 0;

   return top + 1;
#else
   /* Portable fallback: count how many right shifts empty the word. */
   unsigned pos;

   for (pos = 0; u != 0; u >>= 1)
      pos++;

   return pos;
#endif
}
285*61046927SAndroid Build Coastguard Worker 
/**
 * Locate the most significant bit of a signed word that differs from its
 * sign bit, counting the least significant bit as position 1.
 * The result is 0 when there is no such bit.
 */
static inline unsigned
util_last_bit_signed(int i)
{
   /* For negative values the bits are inverted first, so that the bits
    * differing from the sign bit become the set bits to search.
    */
   const unsigned bits = (i >= 0) ? (unsigned)i : ~(unsigned)i;

   return util_last_bit(bits);
}
299*61046927SAndroid Build Coastguard Worker 
/* Returns a bitfield in which the first count bits starting at start are
 * set.
 *
 * start + count must not exceed 32 (checked with assert()).  A count of 0
 * yields 0 for every permitted start, including start == 32.
 */
static inline unsigned
u_bit_consecutive(unsigned start, unsigned count)
{
   assert(start + count <= 32);

   /* An empty run has no bits.  Returning here also keeps start == 32 away
    * from the shift below, where shifting by the full width is undefined.
    */
   if (count == 0)
      return 0;

   /* "1u << 32" is undefined, so the full-width run is special-cased. */
   if (count == 32)
      return ~0u;

   return ((1u << count) - 1) << start;
}
311*61046927SAndroid Build Coastguard Worker 
/* 64-bit version of u_bit_consecutive(): returns a bitfield in which the
 * first count bits starting at start are set.
 *
 * start + count must not exceed 64 (checked with assert()).  A count of 0
 * yields 0 for every permitted start, including start == 64.
 */
static inline uint64_t
u_bit_consecutive64(unsigned start, unsigned count)
{
   assert(start + count <= 64);

   /* An empty run has no bits.  Returning here also keeps start == 64 away
    * from the shift below, where shifting by the full width is undefined.
    */
   if (count == 0)
      return 0;

   /* Shifting a 64-bit one by 64 is undefined, so the full-width run is
    * special-cased.
    */
   if (count == 64)
      return ~(uint64_t)0;

   return (((uint64_t)1 << count) - 1) << start;
}
320*61046927SAndroid Build Coastguard Worker 
/**
 * Count the bits that are set in n.
 */
static inline unsigned
util_bitcount(unsigned n)
{
#if defined(HAVE___BUILTIN_POPCOUNT)
   return __builtin_popcount(n);
#else
   /* K&R classic bitcount.
    *
    * Every pass strips the lowest set bit from n, so the loop runs once per
    * set bit rather than once per bit position below the highest set bit.
    */
   unsigned bits = 0;

   while (n != 0) {
      n &= n - 1;
      bits++;
   }

   return bits;
#endif
}
343*61046927SAndroid Build Coastguard Worker 
/**
 * Count the bits set in n with the native popcnt instruction.
 * It is up to the caller to make sure the CPU actually supports popcnt.
 *
 * gcc doesn't emit the instruction by itself unless -mpopcnt or a -march=
 * that includes popcnt is given, hence the inline assembly.
 */
static inline unsigned
util_popcnt_inline_asm(unsigned n)
{
#if defined(USE_X86_64_ASM) || defined(USE_X86_ASM)
   uint32_t result;

   __asm volatile("popcnt %1, %0" : "=r"(result) : "r"(n));
   return result;
#else
   /* We should never get here by accident, but I'm sure it'll happen.
    * Without x86 inline assembly the generic bit count is used instead.
    */
   return util_bitcount(n);
#endif
}
363*61046927SAndroid Build Coastguard Worker 
/**
 * Count the bits that are set in a 64-bit value.
 */
static inline unsigned
util_bitcount64(uint64_t n)
{
#ifdef HAVE___BUILTIN_POPCOUNTLL
   return __builtin_popcountll(n);
#else
   /* Without the builtin, the low part and the bits above bit 31 are
    * counted separately through util_bitcount().
    */
   const unsigned low_part = (unsigned)n;
   const unsigned high_part = (unsigned)(n >> 32);

   return util_bitcount(low_part) + util_bitcount(high_part);
#endif
}
373*61046927SAndroid Build Coastguard Worker 
374*61046927SAndroid Build Coastguard Worker /**
375*61046927SAndroid Build Coastguard Worker  * Widens the given bit mask by a multiplier, meaning that it will
376*61046927SAndroid Build Coastguard Worker  * replicate each bit by that amount.
377*61046927SAndroid Build Coastguard Worker  *
378*61046927SAndroid Build Coastguard Worker  * For example:
379*61046927SAndroid Build Coastguard Worker  * 0b101 widened by 2 will become: 0b110011
380*61046927SAndroid Build Coastguard Worker  *
381*61046927SAndroid Build Coastguard Worker  * This is typically used in shader I/O to transform a 64-bit
382*61046927SAndroid Build Coastguard Worker  * writemask to a 32-bit writemask.
383*61046927SAndroid Build Coastguard Worker  */
384*61046927SAndroid Build Coastguard Worker static inline uint32_t
util_widen_mask(uint32_t mask,unsigned multiplier)385*61046927SAndroid Build Coastguard Worker util_widen_mask(uint32_t mask, unsigned multiplier)
386*61046927SAndroid Build Coastguard Worker {
387*61046927SAndroid Build Coastguard Worker    uint32_t new_mask = 0;
388*61046927SAndroid Build Coastguard Worker    u_foreach_bit(i, mask)
389*61046927SAndroid Build Coastguard Worker       new_mask |= ((1u << multiplier) - 1u) << (i * multiplier);
390*61046927SAndroid Build Coastguard Worker    return new_mask;
391*61046927SAndroid Build Coastguard Worker }
392*61046927SAndroid Build Coastguard Worker 
393*61046927SAndroid Build Coastguard Worker #ifdef __cplusplus
394*61046927SAndroid Build Coastguard Worker }
395*61046927SAndroid Build Coastguard Worker 
/* util_bitcount has large measurable overhead (~2%), so using the POPCNT
 * instruction via inline assembly is recommended when the CPU supports it.
 * This enum is the selector for that choice.
 */
enum util_popcnt {
   POPCNT_NO = 0,
   POPCNT_YES = 1,
   POPCNT_INVALID = 2,
};
404*61046927SAndroid Build Coastguard Worker 
405*61046927SAndroid Build Coastguard Worker /* Convenient function to select popcnt through a C++ template argument.
406*61046927SAndroid Build Coastguard Worker  * This should be used as part of larger functions that are optimized
407*61046927SAndroid Build Coastguard Worker  * as a whole.
408*61046927SAndroid Build Coastguard Worker  */
409*61046927SAndroid Build Coastguard Worker template<util_popcnt POPCNT> inline unsigned
util_bitcount_fast(unsigned n)410*61046927SAndroid Build Coastguard Worker util_bitcount_fast(unsigned n)
411*61046927SAndroid Build Coastguard Worker {
412*61046927SAndroid Build Coastguard Worker    if (POPCNT == POPCNT_YES)
413*61046927SAndroid Build Coastguard Worker       return util_popcnt_inline_asm(n);
414*61046927SAndroid Build Coastguard Worker    else
415*61046927SAndroid Build Coastguard Worker       return util_bitcount(n);
416*61046927SAndroid Build Coastguard Worker }
417*61046927SAndroid Build Coastguard Worker 
418*61046927SAndroid Build Coastguard Worker #endif /* __cplusplus */
419*61046927SAndroid Build Coastguard Worker 
420*61046927SAndroid Build Coastguard Worker #endif /* BITSCAN_H */
421