xref: /aosp_15_r20/external/vixl/src/compiler-intrinsics-vixl.cc (revision f5c631da2f1efdd72b5fd1e20510e4042af13d77)
1*f5c631daSSadaf Ebrahimi // Copyright 2015, VIXL authors
2*f5c631daSSadaf Ebrahimi // All rights reserved.
3*f5c631daSSadaf Ebrahimi //
4*f5c631daSSadaf Ebrahimi // Redistribution and use in source and binary forms, with or without
5*f5c631daSSadaf Ebrahimi // modification, are permitted provided that the following conditions are met:
6*f5c631daSSadaf Ebrahimi //
7*f5c631daSSadaf Ebrahimi //   * Redistributions of source code must retain the above copyright notice,
8*f5c631daSSadaf Ebrahimi //     this list of conditions and the following disclaimer.
9*f5c631daSSadaf Ebrahimi //   * Redistributions in binary form must reproduce the above copyright notice,
10*f5c631daSSadaf Ebrahimi //     this list of conditions and the following disclaimer in the documentation
11*f5c631daSSadaf Ebrahimi //     and/or other materials provided with the distribution.
12*f5c631daSSadaf Ebrahimi //   * Neither the name of ARM Limited nor the names of its contributors may be
13*f5c631daSSadaf Ebrahimi //     used to endorse or promote products derived from this software without
14*f5c631daSSadaf Ebrahimi //     specific prior written permission.
15*f5c631daSSadaf Ebrahimi //
16*f5c631daSSadaf Ebrahimi // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS CONTRIBUTORS "AS IS" AND
17*f5c631daSSadaf Ebrahimi // ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18*f5c631daSSadaf Ebrahimi // WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19*f5c631daSSadaf Ebrahimi // DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
20*f5c631daSSadaf Ebrahimi // FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21*f5c631daSSadaf Ebrahimi // DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
22*f5c631daSSadaf Ebrahimi // SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
23*f5c631daSSadaf Ebrahimi // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24*f5c631daSSadaf Ebrahimi // OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
25*f5c631daSSadaf Ebrahimi // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*f5c631daSSadaf Ebrahimi 
27*f5c631daSSadaf Ebrahimi #include "compiler-intrinsics-vixl.h"
28*f5c631daSSadaf Ebrahimi #include "utils-vixl.h"
29*f5c631daSSadaf Ebrahimi 
30*f5c631daSSadaf Ebrahimi namespace vixl {
31*f5c631daSSadaf Ebrahimi 
32*f5c631daSSadaf Ebrahimi 
CountLeadingSignBitsFallBack(int64_t value,int width)33*f5c631daSSadaf Ebrahimi int CountLeadingSignBitsFallBack(int64_t value, int width) {
34*f5c631daSSadaf Ebrahimi   VIXL_ASSERT(IsPowerOf2(width) && (width <= 64));
35*f5c631daSSadaf Ebrahimi   if (width < 64) VIXL_ASSERT(IsIntN(width, value));
36*f5c631daSSadaf Ebrahimi   if (value >= 0) {
37*f5c631daSSadaf Ebrahimi     return CountLeadingZeros(value, width) - 1;
38*f5c631daSSadaf Ebrahimi   } else {
39*f5c631daSSadaf Ebrahimi     return CountLeadingZeros(~value, width) - 1;
40*f5c631daSSadaf Ebrahimi   }
41*f5c631daSSadaf Ebrahimi }
42*f5c631daSSadaf Ebrahimi 
43*f5c631daSSadaf Ebrahimi 
CountLeadingZerosFallBack(uint64_t value,int width)44*f5c631daSSadaf Ebrahimi int CountLeadingZerosFallBack(uint64_t value, int width) {
45*f5c631daSSadaf Ebrahimi   VIXL_ASSERT(IsPowerOf2(width) && (width <= 64));
46*f5c631daSSadaf Ebrahimi   if (value == 0) {
47*f5c631daSSadaf Ebrahimi     return width;
48*f5c631daSSadaf Ebrahimi   }
49*f5c631daSSadaf Ebrahimi   int count = 0;
50*f5c631daSSadaf Ebrahimi   value = value << (64 - width);
51*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0xffffffff00000000)) == 0) {
52*f5c631daSSadaf Ebrahimi     count += 32;
53*f5c631daSSadaf Ebrahimi     value = value << 32;
54*f5c631daSSadaf Ebrahimi   }
55*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0xffff000000000000)) == 0) {
56*f5c631daSSadaf Ebrahimi     count += 16;
57*f5c631daSSadaf Ebrahimi     value = value << 16;
58*f5c631daSSadaf Ebrahimi   }
59*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0xff00000000000000)) == 0) {
60*f5c631daSSadaf Ebrahimi     count += 8;
61*f5c631daSSadaf Ebrahimi     value = value << 8;
62*f5c631daSSadaf Ebrahimi   }
63*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0xf000000000000000)) == 0) {
64*f5c631daSSadaf Ebrahimi     count += 4;
65*f5c631daSSadaf Ebrahimi     value = value << 4;
66*f5c631daSSadaf Ebrahimi   }
67*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0xc000000000000000)) == 0) {
68*f5c631daSSadaf Ebrahimi     count += 2;
69*f5c631daSSadaf Ebrahimi     value = value << 2;
70*f5c631daSSadaf Ebrahimi   }
71*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0x8000000000000000)) == 0) {
72*f5c631daSSadaf Ebrahimi     count += 1;
73*f5c631daSSadaf Ebrahimi   }
74*f5c631daSSadaf Ebrahimi   count += (value == 0);
75*f5c631daSSadaf Ebrahimi   return count;
76*f5c631daSSadaf Ebrahimi }
77*f5c631daSSadaf Ebrahimi 
78*f5c631daSSadaf Ebrahimi 
CountSetBitsFallBack(uint64_t value,int width)79*f5c631daSSadaf Ebrahimi int CountSetBitsFallBack(uint64_t value, int width) {
80*f5c631daSSadaf Ebrahimi   VIXL_ASSERT(IsPowerOf2(width) && (width <= 64));
81*f5c631daSSadaf Ebrahimi 
82*f5c631daSSadaf Ebrahimi   // Mask out unused bits to ensure that they are not counted.
83*f5c631daSSadaf Ebrahimi   value &= (UINT64_C(0xffffffffffffffff) >> (64 - width));
84*f5c631daSSadaf Ebrahimi 
85*f5c631daSSadaf Ebrahimi   // Add up the set bits.
86*f5c631daSSadaf Ebrahimi   // The algorithm works by adding pairs of bit fields together iteratively,
87*f5c631daSSadaf Ebrahimi   // where the size of each bit field doubles each time.
88*f5c631daSSadaf Ebrahimi   // An example for an 8-bit value:
89*f5c631daSSadaf Ebrahimi   // Bits:  h  g  f  e  d  c  b  a
90*f5c631daSSadaf Ebrahimi   //         \ |   \ |   \ |   \ |
91*f5c631daSSadaf Ebrahimi   // value = h+g   f+e   d+c   b+a
92*f5c631daSSadaf Ebrahimi   //            \    |      \    |
93*f5c631daSSadaf Ebrahimi   // value =   h+g+f+e     d+c+b+a
94*f5c631daSSadaf Ebrahimi   //                  \          |
95*f5c631daSSadaf Ebrahimi   // value =       h+g+f+e+d+c+b+a
96*f5c631daSSadaf Ebrahimi   const uint64_t kMasks[] = {
97*f5c631daSSadaf Ebrahimi       UINT64_C(0x5555555555555555),
98*f5c631daSSadaf Ebrahimi       UINT64_C(0x3333333333333333),
99*f5c631daSSadaf Ebrahimi       UINT64_C(0x0f0f0f0f0f0f0f0f),
100*f5c631daSSadaf Ebrahimi       UINT64_C(0x00ff00ff00ff00ff),
101*f5c631daSSadaf Ebrahimi       UINT64_C(0x0000ffff0000ffff),
102*f5c631daSSadaf Ebrahimi       UINT64_C(0x00000000ffffffff),
103*f5c631daSSadaf Ebrahimi   };
104*f5c631daSSadaf Ebrahimi 
105*f5c631daSSadaf Ebrahimi   for (unsigned i = 0; i < (sizeof(kMasks) / sizeof(kMasks[0])); i++) {
106*f5c631daSSadaf Ebrahimi     int shift = 1 << i;
107*f5c631daSSadaf Ebrahimi     value = ((value >> shift) & kMasks[i]) + (value & kMasks[i]);
108*f5c631daSSadaf Ebrahimi   }
109*f5c631daSSadaf Ebrahimi 
110*f5c631daSSadaf Ebrahimi   return static_cast<int>(value);
111*f5c631daSSadaf Ebrahimi }
112*f5c631daSSadaf Ebrahimi 
113*f5c631daSSadaf Ebrahimi 
CountTrailingZerosFallBack(uint64_t value,int width)114*f5c631daSSadaf Ebrahimi int CountTrailingZerosFallBack(uint64_t value, int width) {
115*f5c631daSSadaf Ebrahimi   VIXL_ASSERT(IsPowerOf2(width) && (width <= 64));
116*f5c631daSSadaf Ebrahimi   int count = 0;
117*f5c631daSSadaf Ebrahimi   value = value << (64 - width);
118*f5c631daSSadaf Ebrahimi   if ((value & UINT64_C(0xffffffff)) == 0) {
119*f5c631daSSadaf Ebrahimi     count += 32;
120*f5c631daSSadaf Ebrahimi     value = value >> 32;
121*f5c631daSSadaf Ebrahimi   }
122*f5c631daSSadaf Ebrahimi   if ((value & 0xffff) == 0) {
123*f5c631daSSadaf Ebrahimi     count += 16;
124*f5c631daSSadaf Ebrahimi     value = value >> 16;
125*f5c631daSSadaf Ebrahimi   }
126*f5c631daSSadaf Ebrahimi   if ((value & 0xff) == 0) {
127*f5c631daSSadaf Ebrahimi     count += 8;
128*f5c631daSSadaf Ebrahimi     value = value >> 8;
129*f5c631daSSadaf Ebrahimi   }
130*f5c631daSSadaf Ebrahimi   if ((value & 0xf) == 0) {
131*f5c631daSSadaf Ebrahimi     count += 4;
132*f5c631daSSadaf Ebrahimi     value = value >> 4;
133*f5c631daSSadaf Ebrahimi   }
134*f5c631daSSadaf Ebrahimi   if ((value & 0x3) == 0) {
135*f5c631daSSadaf Ebrahimi     count += 2;
136*f5c631daSSadaf Ebrahimi     value = value >> 2;
137*f5c631daSSadaf Ebrahimi   }
138*f5c631daSSadaf Ebrahimi   if ((value & 0x1) == 0) {
139*f5c631daSSadaf Ebrahimi     count += 1;
140*f5c631daSSadaf Ebrahimi   }
141*f5c631daSSadaf Ebrahimi   count += (value == 0);
142*f5c631daSSadaf Ebrahimi   return count - (64 - width);
143*f5c631daSSadaf Ebrahimi }
144*f5c631daSSadaf Ebrahimi 
145*f5c631daSSadaf Ebrahimi 
146*f5c631daSSadaf Ebrahimi }  // namespace vixl
147