// Copyright 2015, VIXL authors
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
//   * Redistributions of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//   * Redistributions in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//   * Neither the name of ARM Limited nor the names of its contributors may be
//     used to endorse or promote products derived from this software without
//     specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.

#if defined(__aarch64__) && (defined(__ANDROID__) || defined(__linux__))
#include <sys/auxv.h>
#define VIXL_USE_LINUX_HWCAP 1
#endif

#include "../utils-vixl.h"

#include "cpu-aarch64.h"

namespace vixl {
namespace aarch64 {

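// Each Field constant below records the least-significant bit position of an
// ID register field. Fields are at most Field::kMaxWidthInBits (four bits)
// wide, and are unsigned unless constructed with Field::kSigned.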
const IDRegister::Field AA64PFR0::kFP(16, Field::kSigned);
const IDRegister::Field AA64PFR0::kAdvSIMD(20, Field::kSigned);
const IDRegister::Field AA64PFR0::kRAS(28);
const IDRegister::Field AA64PFR0::kSVE(32);
const IDRegister::Field AA64PFR0::kDIT(48);
const IDRegister::Field AA64PFR0::kCSV2(56);
const IDRegister::Field AA64PFR0::kCSV3(60);

const IDRegister::Field AA64PFR1::kBT(0);
const IDRegister::Field AA64PFR1::kSSBS(4);
const IDRegister::Field AA64PFR1::kMTE(8);

const IDRegister::Field AA64ISAR0::kAES(4);
const IDRegister::Field AA64ISAR0::kSHA1(8);
const IDRegister::Field AA64ISAR0::kSHA2(12);
const IDRegister::Field AA64ISAR0::kCRC32(16);
const IDRegister::Field AA64ISAR0::kAtomic(20);
const IDRegister::Field AA64ISAR0::kRDM(28);
const IDRegister::Field AA64ISAR0::kSHA3(32);
const IDRegister::Field AA64ISAR0::kSM3(36);
const IDRegister::Field AA64ISAR0::kSM4(40);
const IDRegister::Field AA64ISAR0::kDP(44);
const IDRegister::Field AA64ISAR0::kFHM(48);
const IDRegister::Field AA64ISAR0::kTS(52);
const IDRegister::Field AA64ISAR0::kRNDR(60);

const IDRegister::Field AA64ISAR1::kDPB(0);
const IDRegister::Field AA64ISAR1::kAPA(4);
const IDRegister::Field AA64ISAR1::kAPI(8);
const IDRegister::Field AA64ISAR1::kJSCVT(12);
const IDRegister::Field AA64ISAR1::kFCMA(16);
const IDRegister::Field AA64ISAR1::kLRCPC(20);
const IDRegister::Field AA64ISAR1::kGPA(24);
const IDRegister::Field AA64ISAR1::kGPI(28);
const IDRegister::Field AA64ISAR1::kFRINTTS(32);
const IDRegister::Field AA64ISAR1::kSB(36);
const IDRegister::Field AA64ISAR1::kSPECRES(40);
const IDRegister::Field AA64ISAR1::kBF16(44);
const IDRegister::Field AA64ISAR1::kDGH(48);
const IDRegister::Field AA64ISAR1::kI8MM(52);

const IDRegister::Field AA64ISAR2::kRPRES(4);

const IDRegister::Field AA64MMFR0::kECV(60);

const IDRegister::Field AA64MMFR1::kLO(16);
const IDRegister::Field AA64MMFR1::kAFP(44);

const IDRegister::Field AA64MMFR2::kAT(32);

const IDRegister::Field AA64ZFR0::kSVEver(0);
const IDRegister::Field AA64ZFR0::kAES(4);
const IDRegister::Field AA64ZFR0::kBitPerm(16);
const IDRegister::Field AA64ZFR0::kBF16(20);
const IDRegister::Field AA64ZFR0::kSHA3(32);
const IDRegister::Field AA64ZFR0::kSM4(40);
const IDRegister::Field AA64ZFR0::kI8MM(44);
const IDRegister::Field AA64ZFR0::kF32MM(52);
const IDRegister::Field AA64ZFR0::kF64MM(56);

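// kFP and kAdvSIMD are signed fields: a value of -1 (0b1111) means the feature
// is not implemented, so `>= 0` tests for basic support and `>= 1` for the
// half-precision extensions.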
CPUFeatures AA64PFR0::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kFP) >= 0) f.Combine(CPUFeatures::kFP);
  if (Get(kFP) >= 1) f.Combine(CPUFeatures::kFPHalf);
  if (Get(kAdvSIMD) >= 0) f.Combine(CPUFeatures::kNEON);
  if (Get(kAdvSIMD) >= 1) f.Combine(CPUFeatures::kNEONHalf);
  if (Get(kRAS) >= 1) f.Combine(CPUFeatures::kRAS);
  if (Get(kSVE) >= 1) f.Combine(CPUFeatures::kSVE);
  if (Get(kDIT) >= 1) f.Combine(CPUFeatures::kDIT);
  if (Get(kCSV2) >= 1) f.Combine(CPUFeatures::kCSV2);
  if (Get(kCSV2) >= 2) f.Combine(CPUFeatures::kSCXTNUM);
  if (Get(kCSV3) >= 1) f.Combine(CPUFeatures::kCSV3);
  return f;
}

CPUFeatures AA64PFR1::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kBT) >= 1) f.Combine(CPUFeatures::kBTI);
  if (Get(kSSBS) >= 1) f.Combine(CPUFeatures::kSSBS);
  if (Get(kSSBS) >= 2) f.Combine(CPUFeatures::kSSBSControl);
  if (Get(kMTE) >= 1) f.Combine(CPUFeatures::kMTEInstructions);
  if (Get(kMTE) >= 2) f.Combine(CPUFeatures::kMTE);
  return f;
}

CPUFeatures AA64ISAR0::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kAES) >= 1) f.Combine(CPUFeatures::kAES);
  if (Get(kAES) >= 2) f.Combine(CPUFeatures::kPmull1Q);
  if (Get(kSHA1) >= 1) f.Combine(CPUFeatures::kSHA1);
  if (Get(kSHA2) >= 1) f.Combine(CPUFeatures::kSHA2);
  if (Get(kSHA2) >= 2) f.Combine(CPUFeatures::kSHA512);
  if (Get(kCRC32) >= 1) f.Combine(CPUFeatures::kCRC32);
  if (Get(kAtomic) >= 1) f.Combine(CPUFeatures::kAtomics);
  if (Get(kRDM) >= 1) f.Combine(CPUFeatures::kRDM);
  if (Get(kSHA3) >= 1) f.Combine(CPUFeatures::kSHA3);
  if (Get(kSM3) >= 1) f.Combine(CPUFeatures::kSM3);
  if (Get(kSM4) >= 1) f.Combine(CPUFeatures::kSM4);
  if (Get(kDP) >= 1) f.Combine(CPUFeatures::kDotProduct);
  if (Get(kFHM) >= 1) f.Combine(CPUFeatures::kFHM);
  if (Get(kTS) >= 1) f.Combine(CPUFeatures::kFlagM);
  if (Get(kTS) >= 2) f.Combine(CPUFeatures::kAXFlag);
  if (Get(kRNDR) >= 1) f.Combine(CPUFeatures::kRNG);
  return f;
}

CPUFeatures AA64ISAR1::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kDPB) >= 1) f.Combine(CPUFeatures::kDCPoP);
  if (Get(kDPB) >= 2) f.Combine(CPUFeatures::kDCCVADP);
  if (Get(kJSCVT) >= 1) f.Combine(CPUFeatures::kJSCVT);
  if (Get(kFCMA) >= 1) f.Combine(CPUFeatures::kFcma);
  if (Get(kLRCPC) >= 1) f.Combine(CPUFeatures::kRCpc);
  if (Get(kLRCPC) >= 2) f.Combine(CPUFeatures::kRCpcImm);
  if (Get(kFRINTTS) >= 1) f.Combine(CPUFeatures::kFrintToFixedSizedInt);
  if (Get(kSB) >= 1) f.Combine(CPUFeatures::kSB);
  if (Get(kSPECRES) >= 1) f.Combine(CPUFeatures::kSPECRES);
  if (Get(kBF16) >= 1) f.Combine(CPUFeatures::kBF16);
  if (Get(kDGH) >= 1) f.Combine(CPUFeatures::kDGH);
  if (Get(kI8MM) >= 1) f.Combine(CPUFeatures::kI8MM);

  // Only one of these fields should be non-zero, but they have the same
  // encodings, so merge the logic.
  int apx = std::max(Get(kAPI), Get(kAPA));
  if (apx >= 1) {
    f.Combine(CPUFeatures::kPAuth);
    // APA (rather than API) indicates QARMA.
    if (Get(kAPA) >= 1) f.Combine(CPUFeatures::kPAuthQARMA);
    if (apx == 0b0010) f.Combine(CPUFeatures::kPAuthEnhancedPAC);
    if (apx >= 0b0011) f.Combine(CPUFeatures::kPAuthEnhancedPAC2);
    if (apx >= 0b0100) f.Combine(CPUFeatures::kPAuthFPAC);
    if (apx >= 0b0101) f.Combine(CPUFeatures::kPAuthFPACCombined);
  }

  if (Get(kGPI) >= 1) f.Combine(CPUFeatures::kPAuthGeneric);
  if (Get(kGPA) >= 1) {
    f.Combine(CPUFeatures::kPAuthGeneric, CPUFeatures::kPAuthGenericQARMA);
  }
  return f;
}

CPUFeatures AA64ISAR2::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kRPRES) >= 1) f.Combine(CPUFeatures::kRPRES);
  return f;
}

CPUFeatures AA64MMFR0::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kECV) >= 1) f.Combine(CPUFeatures::kECV);
  return f;
}

CPUFeatures AA64MMFR1::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kLO) >= 1) f.Combine(CPUFeatures::kLORegions);
  if (Get(kAFP) >= 1) f.Combine(CPUFeatures::kAFP);
  return f;
}

CPUFeatures AA64MMFR2::GetCPUFeatures() const {
  CPUFeatures f;
  if (Get(kAT) >= 1) f.Combine(CPUFeatures::kUSCAT);
  return f;
}

CPUFeatures AA64ZFR0::GetCPUFeatures() const {
  // This register is only available with SVE, but reads as zero in its
  // absence, so it's always safe to read.
  CPUFeatures f;
  if (Get(kF64MM) >= 1) f.Combine(CPUFeatures::kSVEF64MM);
  if (Get(kF32MM) >= 1) f.Combine(CPUFeatures::kSVEF32MM);
  if (Get(kI8MM) >= 1) f.Combine(CPUFeatures::kSVEI8MM);
  if (Get(kSM4) >= 1) f.Combine(CPUFeatures::kSVESM4);
  if (Get(kSHA3) >= 1) f.Combine(CPUFeatures::kSVESHA3);
  if (Get(kBF16) >= 1) f.Combine(CPUFeatures::kSVEBF16);
  if (Get(kBitPerm) >= 1) f.Combine(CPUFeatures::kSVEBitPerm);
  if (Get(kAES) >= 1) f.Combine(CPUFeatures::kSVEAES);
  if (Get(kAES) >= 2) f.Combine(CPUFeatures::kSVEPmull128);
  if (Get(kSVEver) >= 1) f.Combine(CPUFeatures::kSVE2);
  return f;
}

int IDRegister::Get(IDRegister::Field field) const {
  int msb = field.GetMsb();
  int lsb = field.GetLsb();
  VIXL_STATIC_ASSERT(static_cast<size_t>(Field::kMaxWidthInBits) <
                     (sizeof(int) * kBitsPerByte));
  switch (field.GetType()) {
    case Field::kSigned:
      return static_cast<int>(ExtractSignedBitfield64(msb, lsb, value_));
    case Field::kUnsigned:
      return static_cast<int>(ExtractUnsignedBitfield64(msb, lsb, value_));
  }
  VIXL_UNREACHABLE();
  return 0;
}
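// For example, with AA64ISAR0::kCRC32 at lsb 16, a raw register value of
// 0x0000000000010000 makes Get(kCRC32) return 1 (bits [19:16] == 0b0001),
// which AA64ISAR0::GetCPUFeatures() above maps to CPUFeatures::kCRC32.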

CPUFeatures CPU::InferCPUFeaturesFromIDRegisters() {
  CPUFeatures f;
#define VIXL_COMBINE_ID_REG(NAME, MRS_ARG) \
  f.Combine(Read##NAME().GetCPUFeatures());
  VIXL_AARCH64_ID_REG_LIST(VIXL_COMBINE_ID_REG)
#undef VIXL_COMBINE_ID_REG
  return f;
}
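// For each register in VIXL_AARCH64_ID_REG_LIST, the macro above expands to a
// statement such as `f.Combine(ReadAA64PFR0().GetCPUFeatures());`, so every
// supported ID register contributes its features to the result.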

CPUFeatures CPU::InferCPUFeaturesFromOS(
    CPUFeatures::QueryIDRegistersOption option) {
  CPUFeatures features;

#if VIXL_USE_LINUX_HWCAP
  // Map each set bit onto a feature. Ideally, we'd use HWCAP_* macros rather
  // than explicit bits, but explicit bits allow us to identify features that
  // the toolchain doesn't know about.
  static const CPUFeatures::Feature kFeatureBits[] =
      {// Bits 0-7
       CPUFeatures::kFP,
       CPUFeatures::kNEON,
       CPUFeatures::kNone,  // "EVTSTRM", which VIXL doesn't track.
       CPUFeatures::kAES,
       CPUFeatures::kPmull1Q,
       CPUFeatures::kSHA1,
       CPUFeatures::kSHA2,
       CPUFeatures::kCRC32,
       // Bits 8-15
       CPUFeatures::kAtomics,
       CPUFeatures::kFPHalf,
       CPUFeatures::kNEONHalf,
       CPUFeatures::kIDRegisterEmulation,
       CPUFeatures::kRDM,
       CPUFeatures::kJSCVT,
       CPUFeatures::kFcma,
       CPUFeatures::kRCpc,
       // Bits 16-23
       CPUFeatures::kDCPoP,
       CPUFeatures::kSHA3,
       CPUFeatures::kSM3,
       CPUFeatures::kSM4,
       CPUFeatures::kDotProduct,
       CPUFeatures::kSHA512,
       CPUFeatures::kSVE,
       CPUFeatures::kFHM,
       // Bits 24-31
       CPUFeatures::kDIT,
       CPUFeatures::kUSCAT,
       CPUFeatures::kRCpcImm,
       CPUFeatures::kFlagM,
       CPUFeatures::kSSBSControl,
       CPUFeatures::kSB,
       CPUFeatures::kPAuth,
       CPUFeatures::kPAuthGeneric,
       // Bits 32-39
       CPUFeatures::kDCCVADP,
       CPUFeatures::kSVE2,
       CPUFeatures::kSVEAES,
       CPUFeatures::kSVEPmull128,
       CPUFeatures::kSVEBitPerm,
       CPUFeatures::kSVESHA3,
       CPUFeatures::kSVESM4,
       CPUFeatures::kAXFlag,
       // Bits 40-47
       CPUFeatures::kFrintToFixedSizedInt,
       CPUFeatures::kSVEI8MM,
       CPUFeatures::kSVEF32MM,
       CPUFeatures::kSVEF64MM,
       CPUFeatures::kSVEBF16,
       CPUFeatures::kI8MM,
       CPUFeatures::kBF16,
       CPUFeatures::kDGH,
       // Bits 48+
       CPUFeatures::kRNG,
       CPUFeatures::kBTI,
       CPUFeatures::kMTE,
       CPUFeatures::kECV,
       CPUFeatures::kAFP,
       CPUFeatures::kRPRES};
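  // The index into kFeatureBits is the HWCAP bit number: for example, Linux
  // defines HWCAP_SVE as bit 22, which matches CPUFeatures::kSVE above.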

  uint64_t hwcap_low32 = getauxval(AT_HWCAP);
  uint64_t hwcap_high32 = getauxval(AT_HWCAP2);
  VIXL_ASSERT(IsUint32(hwcap_low32));
  VIXL_ASSERT(IsUint32(hwcap_high32));
  uint64_t hwcap = hwcap_low32 | (hwcap_high32 << 32);

  VIXL_STATIC_ASSERT(ArrayLength(kFeatureBits) < 64);
  for (size_t i = 0; i < ArrayLength(kFeatureBits); i++) {
    if (hwcap & (UINT64_C(1) << i)) features.Combine(kFeatureBits[i]);
  }
  // MTE support in HWCAP2 signifies FEAT_MTE1 and FEAT_MTE2 support.
  if (features.Has(CPUFeatures::kMTE)) {
    features.Combine(CPUFeatures::kMTEInstructions);
  }
#endif  // VIXL_USE_LINUX_HWCAP

  if ((option == CPUFeatures::kQueryIDRegistersIfAvailable) &&
      (features.Has(CPUFeatures::kIDRegisterEmulation))) {
    features.Combine(InferCPUFeaturesFromIDRegisters());
  }
  return features;
}

#ifdef __aarch64__
#define VIXL_READ_ID_REG(NAME, MRS_ARG)        \
  NAME CPU::Read##NAME() {                     \
    uint64_t value = 0;                        \
    __asm__("mrs %0, " MRS_ARG : "=r"(value)); \
    return NAME(value);                        \
  }
#else  // __aarch64__
#define VIXL_READ_ID_REG(NAME, MRS_ARG) \
  NAME CPU::Read##NAME() {              \
    VIXL_UNREACHABLE();                 \
    return NAME(0);                     \
  }
#endif  // __aarch64__

VIXL_AARCH64_ID_REG_LIST(VIXL_READ_ID_REG)

#undef VIXL_READ_ID_REG


// Initialise to smallest possible cache size.
unsigned CPU::dcache_line_size_ = 1;
unsigned CPU::icache_line_size_ = 1;


// Currently computes I and D cache line size.
void CPU::SetUp() {
  uint32_t cache_type_register = GetCacheType();

  // The cache type register holds information about the caches, including the
  // I and D cache line sizes.
  static const int kDCacheLineSizeShift = 16;
  static const int kICacheLineSizeShift = 0;
  static const uint32_t kDCacheLineSizeMask = 0xf << kDCacheLineSizeShift;
  static const uint32_t kICacheLineSizeMask = 0xf << kICacheLineSizeShift;

  // The cache type register holds the size of the I and D cache lines, in
  // words, as a power of two.
  uint32_t dcache_line_size_power_of_two =
      (cache_type_register & kDCacheLineSizeMask) >> kDCacheLineSizeShift;
  uint32_t icache_line_size_power_of_two =
      (cache_type_register & kICacheLineSizeMask) >> kICacheLineSizeShift;

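  // For example, a DminLine field value of 4 means 2^4 = 16 words per line,
  // giving a D-cache line size of 4 << 4 = 64 bytes.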
  dcache_line_size_ = 4 << dcache_line_size_power_of_two;
  icache_line_size_ = 4 << icache_line_size_power_of_two;
}


uint32_t CPU::GetCacheType() {
#ifdef __aarch64__
  uint64_t cache_type_register;
  // Copy the content of the cache type register to a core register.
  __asm__ __volatile__("mrs %[ctr], ctr_el0"  // NOLINT(runtime/references)
                       : [ctr] "=r"(cache_type_register));
  VIXL_ASSERT(IsUint32(cache_type_register));
  return static_cast<uint32_t>(cache_type_register);
#else
  // This will lead to a cache with 1-byte-long lines, which is fine since
  // neither EnsureIAndDCacheCoherency nor the simulator will need this
  // information.
  return 0;
#endif
}


// Query the SVE vector length. This requires CPUFeatures::kSVE.
int CPU::ReadSVEVectorLengthInBits() {
#ifdef __aarch64__
  uint64_t vl;
  // To support compilers that don't understand `rdvl`, encode the value
  // directly and move it manually.
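  // RDVL xd, #imm returns imm multiplied by the vector length in bytes, so
  // `rdvl x0, #8` yields the vector length in bits.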
  __asm__(
      "   .word 0x04bf5100\n"  // rdvl x0, #8
      "   mov %[vl], x0\n"
      : [vl] "=r"(vl)
      :
      : "x0");
  VIXL_ASSERT(vl <= INT_MAX);
  return static_cast<int>(vl);
#else
  VIXL_UNREACHABLE();
  return 0;
#endif
}


void CPU::EnsureIAndDCacheCoherency(void *address, size_t length) {
#ifdef __aarch64__
  // Implement the cache synchronisation for all targets where AArch64 is the
  // host, even if we're building the simulator for an AArch64 host. This
  // allows for cases where the user wants to simulate code as well as run it
  // natively.

  if (length == 0) {
    return;
  }

  // The code below assumes user space cache operations are allowed.

  // Work out the line sizes for each cache, and use them to determine the
  // start addresses.
  uintptr_t start = reinterpret_cast<uintptr_t>(address);
  uintptr_t dsize = static_cast<uintptr_t>(dcache_line_size_);
  uintptr_t isize = static_cast<uintptr_t>(icache_line_size_);
  uintptr_t dline = start & ~(dsize - 1);
  uintptr_t iline = start & ~(isize - 1);

  // Cache line sizes are always a power of 2.
  VIXL_ASSERT(IsPowerOf2(dsize));
  VIXL_ASSERT(IsPowerOf2(isize));
  uintptr_t end = start + length;

  do {
    __asm__ __volatile__(
        // Clean each line of the D cache containing the target data.
        //
        // dc       : Data Cache maintenance
        //     c    : Clean
        //      va  : by (Virtual) Address
        //        u : to the point of Unification
        // The point of unification for a processor is the point by which the
        // instruction and data caches are guaranteed to see the same copy of a
        // memory location. See ARM DDI 0406B page B2-12 for more information.
        "   dc    cvau, %[dline]\n"
        :
        : [dline] "r"(dline)
        // This code does not write to memory, but the "memory" dependency
        // prevents GCC from reordering the code.
        : "memory");
    dline += dsize;
  } while (dline < end);

  __asm__ __volatile__(
      // Make sure that the data cache operations (above) complete before the
      // instruction cache operations (below).
      //
      // dsb      : Data Synchronisation Barrier
      //      ish : Inner SHareable domain
      //
      // The point of unification for an Inner Shareable shareability domain is
      // the point by which the instruction and data caches of all the
      // processors in that Inner Shareable shareability domain are guaranteed
      // to see the same copy of a memory location. See ARM DDI 0406B page
      // B2-12 for more information.
      "   dsb   ish\n"
      :
      :
      : "memory");

  do {
    __asm__ __volatile__(
        // Invalidate each line of the I cache containing the target data.
        //
        // ic      : Instruction Cache maintenance
        //    i    : Invalidate
        //     va  : by Address
        //       u : to the point of Unification
        "   ic   ivau, %[iline]\n"
        :
        : [iline] "r"(iline)
        : "memory");
    iline += isize;
  } while (iline < end);

  __asm__ __volatile__(
      // Make sure that the instruction cache operations (above) take effect
      // before the isb (below).
      "   dsb  ish\n"

      // Ensure that any instructions already in the pipeline are discarded and
      // reloaded from the new data.
      // isb : Instruction Synchronisation Barrier
      "   isb\n"
      :
      :
      : "memory");
#else
  // If the host isn't AArch64, we must be using the simulator, so this
  // function doesn't have to do anything.
  USE(address, length);
#endif
}
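
// Illustrative (hypothetical) usage: a JIT writes generated instructions to a
// buffer, then synchronises the caches before branching to the new code:
//
//   CPU::SetUp();
//   EmitCode(buffer, &size);  // Hypothetical code generator.
//   CPU::EnsureIAndDCacheCoherency(buffer, size);
//   reinterpret_cast<void (*)()>(buffer)();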

}  // namespace aarch64
}  // namespace vixl