1 //===-- TargetParser - Parser for target features ---------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements a target parser to recognise hardware features such as
10 // FPU/CPU/ARCH names as well as specific support such as HDIV, etc.
11 //
12 //===----------------------------------------------------------------------===//
13
14 #include "llvm/TargetParser/TargetParser.h"
15 #include "llvm/ADT/ArrayRef.h"
16 #include "llvm/ADT/StringSwitch.h"
17 #include "llvm/TargetParser/Triple.h"
18
19 using namespace llvm;
20 using namespace AMDGPU;
21
22 namespace {
23
24 struct GPUInfo {
25 StringLiteral Name;
26 StringLiteral CanonicalName;
27 AMDGPU::GPUKind Kind;
28 unsigned Features;
29 };
30
31 constexpr GPUInfo R600GPUs[] = {
32 // Name Canonical Kind Features
33 // Name
34 {{"r600"}, {"r600"}, GK_R600, FEATURE_NONE },
35 {{"rv630"}, {"r600"}, GK_R600, FEATURE_NONE },
36 {{"rv635"}, {"r600"}, GK_R600, FEATURE_NONE },
37 {{"r630"}, {"r630"}, GK_R630, FEATURE_NONE },
38 {{"rs780"}, {"rs880"}, GK_RS880, FEATURE_NONE },
39 {{"rs880"}, {"rs880"}, GK_RS880, FEATURE_NONE },
40 {{"rv610"}, {"rs880"}, GK_RS880, FEATURE_NONE },
41 {{"rv620"}, {"rs880"}, GK_RS880, FEATURE_NONE },
42 {{"rv670"}, {"rv670"}, GK_RV670, FEATURE_NONE },
43 {{"rv710"}, {"rv710"}, GK_RV710, FEATURE_NONE },
44 {{"rv730"}, {"rv730"}, GK_RV730, FEATURE_NONE },
45 {{"rv740"}, {"rv770"}, GK_RV770, FEATURE_NONE },
46 {{"rv770"}, {"rv770"}, GK_RV770, FEATURE_NONE },
47 {{"cedar"}, {"cedar"}, GK_CEDAR, FEATURE_NONE },
48 {{"palm"}, {"cedar"}, GK_CEDAR, FEATURE_NONE },
49 {{"cypress"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA },
50 {{"hemlock"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA },
51 {{"juniper"}, {"juniper"}, GK_JUNIPER, FEATURE_NONE },
52 {{"redwood"}, {"redwood"}, GK_REDWOOD, FEATURE_NONE },
53 {{"sumo"}, {"sumo"}, GK_SUMO, FEATURE_NONE },
54 {{"sumo2"}, {"sumo"}, GK_SUMO, FEATURE_NONE },
55 {{"barts"}, {"barts"}, GK_BARTS, FEATURE_NONE },
56 {{"caicos"}, {"caicos"}, GK_CAICOS, FEATURE_NONE },
57 {{"aruba"}, {"cayman"}, GK_CAYMAN, FEATURE_FMA },
58 {{"cayman"}, {"cayman"}, GK_CAYMAN, FEATURE_FMA },
59 {{"turks"}, {"turks"}, GK_TURKS, FEATURE_NONE }
60 };
61
62 // This table should be sorted by the value of GPUKind
63 // Don't bother listing the implicitly true features
64 constexpr GPUInfo AMDGCNGPUs[] = {
65 // Name Canonical Kind Features
66 // Name
67 {{"gfx600"}, {"gfx600"}, GK_GFX600, FEATURE_FAST_FMA_F32},
68 {{"tahiti"}, {"gfx600"}, GK_GFX600, FEATURE_FAST_FMA_F32},
69 {{"gfx601"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},
70 {{"pitcairn"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},
71 {{"verde"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},
72 {{"gfx602"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},
73 {{"hainan"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},
74 {{"oland"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},
75 {{"gfx700"}, {"gfx700"}, GK_GFX700, FEATURE_NONE},
76 {{"kaveri"}, {"gfx700"}, GK_GFX700, FEATURE_NONE},
77 {{"gfx701"}, {"gfx701"}, GK_GFX701, FEATURE_FAST_FMA_F32},
78 {{"hawaii"}, {"gfx701"}, GK_GFX701, FEATURE_FAST_FMA_F32},
79 {{"gfx702"}, {"gfx702"}, GK_GFX702, FEATURE_FAST_FMA_F32},
80 {{"gfx703"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},
81 {{"kabini"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},
82 {{"mullins"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},
83 {{"gfx704"}, {"gfx704"}, GK_GFX704, FEATURE_NONE},
84 {{"bonaire"}, {"gfx704"}, GK_GFX704, FEATURE_NONE},
85 {{"gfx705"}, {"gfx705"}, GK_GFX705, FEATURE_NONE},
86 {{"gfx801"}, {"gfx801"}, GK_GFX801, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
87 {{"carrizo"}, {"gfx801"}, GK_GFX801, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
88 {{"gfx802"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},
89 {{"iceland"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},
90 {{"tonga"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},
91 {{"gfx803"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
92 {{"fiji"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
93 {{"polaris10"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
94 {{"polaris11"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
95 {{"gfx805"}, {"gfx805"}, GK_GFX805, FEATURE_FAST_DENORMAL_F32},
96 {{"tongapro"}, {"gfx805"}, GK_GFX805, FEATURE_FAST_DENORMAL_F32},
97 {{"gfx810"}, {"gfx810"}, GK_GFX810, FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
98 {{"stoney"}, {"gfx810"}, GK_GFX810, FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
99 {{"gfx900"}, {"gfx900"}, GK_GFX900, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
100 {{"gfx902"}, {"gfx902"}, GK_GFX902, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
101 {{"gfx904"}, {"gfx904"}, GK_GFX904, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
102 {{"gfx906"}, {"gfx906"}, GK_GFX906, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
103 {{"gfx908"}, {"gfx908"}, GK_GFX908, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
104 {{"gfx909"}, {"gfx909"}, GK_GFX909, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
105 {{"gfx90a"}, {"gfx90a"}, GK_GFX90A, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
106 {{"gfx90c"}, {"gfx90c"}, GK_GFX90C, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
107 {{"gfx940"}, {"gfx940"}, GK_GFX940, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
108 {{"gfx1010"}, {"gfx1010"}, GK_GFX1010, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK},
109 {{"gfx1011"}, {"gfx1011"}, GK_GFX1011, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK},
110 {{"gfx1012"}, {"gfx1012"}, GK_GFX1012, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK},
111 {{"gfx1013"}, {"gfx1013"}, GK_GFX1013, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK},
112 {{"gfx1030"}, {"gfx1030"}, GK_GFX1030, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
113 {{"gfx1031"}, {"gfx1031"}, GK_GFX1031, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
114 {{"gfx1032"}, {"gfx1032"}, GK_GFX1032, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
115 {{"gfx1033"}, {"gfx1033"}, GK_GFX1033, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
116 {{"gfx1034"}, {"gfx1034"}, GK_GFX1034, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
117 {{"gfx1035"}, {"gfx1035"}, GK_GFX1035, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
118 {{"gfx1036"}, {"gfx1036"}, GK_GFX1036, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
119 {{"gfx1100"}, {"gfx1100"}, GK_GFX1100, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
120 {{"gfx1101"}, {"gfx1101"}, GK_GFX1101, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
121 {{"gfx1102"}, {"gfx1102"}, GK_GFX1102, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
122 {{"gfx1103"}, {"gfx1103"}, GK_GFX1103, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32},
123 };
124
getArchEntry(AMDGPU::GPUKind AK,ArrayRef<GPUInfo> Table)125 const GPUInfo *getArchEntry(AMDGPU::GPUKind AK, ArrayRef<GPUInfo> Table) {
126 GPUInfo Search = { {""}, {""}, AK, AMDGPU::FEATURE_NONE };
127
128 auto I =
129 llvm::lower_bound(Table, Search, [](const GPUInfo &A, const GPUInfo &B) {
130 return A.Kind < B.Kind;
131 });
132
133 if (I == Table.end())
134 return nullptr;
135 return I;
136 }
137
138 } // namespace
139
getArchNameAMDGCN(GPUKind AK)140 StringRef llvm::AMDGPU::getArchNameAMDGCN(GPUKind AK) {
141 if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs))
142 return Entry->CanonicalName;
143 return "";
144 }
145
getArchNameR600(GPUKind AK)146 StringRef llvm::AMDGPU::getArchNameR600(GPUKind AK) {
147 if (const auto *Entry = getArchEntry(AK, R600GPUs))
148 return Entry->CanonicalName;
149 return "";
150 }
151
parseArchAMDGCN(StringRef CPU)152 AMDGPU::GPUKind llvm::AMDGPU::parseArchAMDGCN(StringRef CPU) {
153 for (const auto &C : AMDGCNGPUs) {
154 if (CPU == C.Name)
155 return C.Kind;
156 }
157
158 return AMDGPU::GPUKind::GK_NONE;
159 }
160
parseArchR600(StringRef CPU)161 AMDGPU::GPUKind llvm::AMDGPU::parseArchR600(StringRef CPU) {
162 for (const auto &C : R600GPUs) {
163 if (CPU == C.Name)
164 return C.Kind;
165 }
166
167 return AMDGPU::GPUKind::GK_NONE;
168 }
169
getArchAttrAMDGCN(GPUKind AK)170 unsigned AMDGPU::getArchAttrAMDGCN(GPUKind AK) {
171 if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs))
172 return Entry->Features;
173 return FEATURE_NONE;
174 }
175
getArchAttrR600(GPUKind AK)176 unsigned AMDGPU::getArchAttrR600(GPUKind AK) {
177 if (const auto *Entry = getArchEntry(AK, R600GPUs))
178 return Entry->Features;
179 return FEATURE_NONE;
180 }
181
fillValidArchListAMDGCN(SmallVectorImpl<StringRef> & Values)182 void AMDGPU::fillValidArchListAMDGCN(SmallVectorImpl<StringRef> &Values) {
183 // XXX: Should this only report unique canonical names?
184 for (const auto &C : AMDGCNGPUs)
185 Values.push_back(C.Name);
186 }
187
fillValidArchListR600(SmallVectorImpl<StringRef> & Values)188 void AMDGPU::fillValidArchListR600(SmallVectorImpl<StringRef> &Values) {
189 for (const auto &C : R600GPUs)
190 Values.push_back(C.Name);
191 }
192
getIsaVersion(StringRef GPU)193 AMDGPU::IsaVersion AMDGPU::getIsaVersion(StringRef GPU) {
194 AMDGPU::GPUKind AK = parseArchAMDGCN(GPU);
195 if (AK == AMDGPU::GPUKind::GK_NONE) {
196 if (GPU == "generic-hsa")
197 return {7, 0, 0};
198 if (GPU == "generic")
199 return {6, 0, 0};
200 return {0, 0, 0};
201 }
202
203 switch (AK) {
204 case GK_GFX600: return {6, 0, 0};
205 case GK_GFX601: return {6, 0, 1};
206 case GK_GFX602: return {6, 0, 2};
207 case GK_GFX700: return {7, 0, 0};
208 case GK_GFX701: return {7, 0, 1};
209 case GK_GFX702: return {7, 0, 2};
210 case GK_GFX703: return {7, 0, 3};
211 case GK_GFX704: return {7, 0, 4};
212 case GK_GFX705: return {7, 0, 5};
213 case GK_GFX801: return {8, 0, 1};
214 case GK_GFX802: return {8, 0, 2};
215 case GK_GFX803: return {8, 0, 3};
216 case GK_GFX805: return {8, 0, 5};
217 case GK_GFX810: return {8, 1, 0};
218 case GK_GFX900: return {9, 0, 0};
219 case GK_GFX902: return {9, 0, 2};
220 case GK_GFX904: return {9, 0, 4};
221 case GK_GFX906: return {9, 0, 6};
222 case GK_GFX908: return {9, 0, 8};
223 case GK_GFX909: return {9, 0, 9};
224 case GK_GFX90A: return {9, 0, 10};
225 case GK_GFX90C: return {9, 0, 12};
226 case GK_GFX940: return {9, 4, 0};
227 case GK_GFX1010: return {10, 1, 0};
228 case GK_GFX1011: return {10, 1, 1};
229 case GK_GFX1012: return {10, 1, 2};
230 case GK_GFX1013: return {10, 1, 3};
231 case GK_GFX1030: return {10, 3, 0};
232 case GK_GFX1031: return {10, 3, 1};
233 case GK_GFX1032: return {10, 3, 2};
234 case GK_GFX1033: return {10, 3, 3};
235 case GK_GFX1034: return {10, 3, 4};
236 case GK_GFX1035: return {10, 3, 5};
237 case GK_GFX1036: return {10, 3, 6};
238 case GK_GFX1100: return {11, 0, 0};
239 case GK_GFX1101: return {11, 0, 1};
240 case GK_GFX1102: return {11, 0, 2};
241 case GK_GFX1103: return {11, 0, 3};
242 default: return {0, 0, 0};
243 }
244 }
245
getCanonicalArchName(const Triple & T,StringRef Arch)246 StringRef AMDGPU::getCanonicalArchName(const Triple &T, StringRef Arch) {
247 assert(T.isAMDGPU());
248 auto ProcKind = T.isAMDGCN() ? parseArchAMDGCN(Arch) : parseArchR600(Arch);
249 if (ProcKind == GK_NONE)
250 return StringRef();
251
252 return T.isAMDGCN() ? getArchNameAMDGCN(ProcKind) : getArchNameR600(ProcKind);
253 }
254