1//===-- TargetParser - Parser for target features ---------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements a target parser to recognise hardware features such as
10// FPU/CPU/ARCH names as well as specific support such as HDIV, etc.
11//
12//===----------------------------------------------------------------------===//
13
14#include "llvm/TargetParser/TargetParser.h"
15#include "llvm/ADT/ArrayRef.h"
16#include "llvm/TargetParser/Triple.h"
17
18using namespace llvm;
19using namespace AMDGPU;
20
21/// Find KV in array using binary search.
22static const BasicSubtargetSubTypeKV *
23find(StringRef S, ArrayRef<BasicSubtargetSubTypeKV> A) {
24 // Binary search the array
25 auto F = llvm::lower_bound(Range&: A, Value&: S);
26 // If not found then return NULL
27 if (F == A.end() || StringRef(F->Key) != S)
28 return nullptr;
29 // Return the found array item
30 return F;
31}
32
33/// For each feature that is (transitively) implied by this feature, set it.
34static void setImpliedBits(FeatureBitset &Bits, const FeatureBitset &Implies,
35 ArrayRef<BasicSubtargetFeatureKV> FeatureTable) {
36 // OR the Implies bits in outside the loop. This allows the Implies for CPUs
37 // which might imply features not in FeatureTable to use this.
38 Bits |= Implies;
39 for (const auto &FE : FeatureTable)
40 if (Implies.test(I: FE.Value))
41 setImpliedBits(Bits, Implies: FE.Implies.getAsBitset(), FeatureTable);
42}
43
44std::optional<llvm::StringMap<bool>> llvm::getCPUDefaultTargetFeatures(
45 StringRef CPU, ArrayRef<BasicSubtargetSubTypeKV> ProcDesc,
46 ArrayRef<BasicSubtargetFeatureKV> ProcFeatures) {
47 if (CPU.empty())
48 return std::nullopt;
49
50 const BasicSubtargetSubTypeKV *CPUEntry = ::find(S: CPU, A: ProcDesc);
51 if (!CPUEntry)
52 return std::nullopt;
53
54 // Set the features implied by this CPU feature if there is a match.
55 FeatureBitset Bits;
56 llvm::StringMap<bool> DefaultFeatures;
57 setImpliedBits(Bits, Implies: CPUEntry->Implies.getAsBitset(), FeatureTable: ProcFeatures);
58
59 [[maybe_unused]] unsigned BitSize = Bits.size();
60 for (const BasicSubtargetFeatureKV &FE : ProcFeatures) {
61 assert(FE.Value < BitSize && "Target Feature is out of range");
62 if (Bits[FE.Value])
63 DefaultFeatures[FE.Key] = true;
64 }
65 return DefaultFeatures;
66}
67
68namespace {
69
70struct GPUInfo {
71 StringLiteral Name;
72 StringLiteral CanonicalName;
73 AMDGPU::GPUKind Kind;
74 unsigned Features;
75};
76
77constexpr GPUInfo R600GPUs[] = {
78 // Name Canonical Kind Features
79 // Name
80 {.Name: {"r600"}, .CanonicalName: {"r600"}, .Kind: GK_R600, .Features: FEATURE_NONE },
81 {.Name: {"rv630"}, .CanonicalName: {"r600"}, .Kind: GK_R600, .Features: FEATURE_NONE },
82 {.Name: {"rv635"}, .CanonicalName: {"r600"}, .Kind: GK_R600, .Features: FEATURE_NONE },
83 {.Name: {"r630"}, .CanonicalName: {"r630"}, .Kind: GK_R630, .Features: FEATURE_NONE },
84 {.Name: {"rs780"}, .CanonicalName: {"rs880"}, .Kind: GK_RS880, .Features: FEATURE_NONE },
85 {.Name: {"rs880"}, .CanonicalName: {"rs880"}, .Kind: GK_RS880, .Features: FEATURE_NONE },
86 {.Name: {"rv610"}, .CanonicalName: {"rs880"}, .Kind: GK_RS880, .Features: FEATURE_NONE },
87 {.Name: {"rv620"}, .CanonicalName: {"rs880"}, .Kind: GK_RS880, .Features: FEATURE_NONE },
88 {.Name: {"rv670"}, .CanonicalName: {"rv670"}, .Kind: GK_RV670, .Features: FEATURE_NONE },
89 {.Name: {"rv710"}, .CanonicalName: {"rv710"}, .Kind: GK_RV710, .Features: FEATURE_NONE },
90 {.Name: {"rv730"}, .CanonicalName: {"rv730"}, .Kind: GK_RV730, .Features: FEATURE_NONE },
91 {.Name: {"rv740"}, .CanonicalName: {"rv770"}, .Kind: GK_RV770, .Features: FEATURE_NONE },
92 {.Name: {"rv770"}, .CanonicalName: {"rv770"}, .Kind: GK_RV770, .Features: FEATURE_NONE },
93 {.Name: {"cedar"}, .CanonicalName: {"cedar"}, .Kind: GK_CEDAR, .Features: FEATURE_NONE },
94 {.Name: {"palm"}, .CanonicalName: {"cedar"}, .Kind: GK_CEDAR, .Features: FEATURE_NONE },
95 {.Name: {"cypress"}, .CanonicalName: {"cypress"}, .Kind: GK_CYPRESS, .Features: FEATURE_FMA },
96 {.Name: {"hemlock"}, .CanonicalName: {"cypress"}, .Kind: GK_CYPRESS, .Features: FEATURE_FMA },
97 {.Name: {"juniper"}, .CanonicalName: {"juniper"}, .Kind: GK_JUNIPER, .Features: FEATURE_NONE },
98 {.Name: {"redwood"}, .CanonicalName: {"redwood"}, .Kind: GK_REDWOOD, .Features: FEATURE_NONE },
99 {.Name: {"sumo"}, .CanonicalName: {"sumo"}, .Kind: GK_SUMO, .Features: FEATURE_NONE },
100 {.Name: {"sumo2"}, .CanonicalName: {"sumo"}, .Kind: GK_SUMO, .Features: FEATURE_NONE },
101 {.Name: {"barts"}, .CanonicalName: {"barts"}, .Kind: GK_BARTS, .Features: FEATURE_NONE },
102 {.Name: {"caicos"}, .CanonicalName: {"caicos"}, .Kind: GK_CAICOS, .Features: FEATURE_NONE },
103 {.Name: {"aruba"}, .CanonicalName: {"cayman"}, .Kind: GK_CAYMAN, .Features: FEATURE_FMA },
104 {.Name: {"cayman"}, .CanonicalName: {"cayman"}, .Kind: GK_CAYMAN, .Features: FEATURE_FMA },
105 {.Name: {"turks"}, .CanonicalName: {"turks"}, .Kind: GK_TURKS, .Features: FEATURE_NONE }
106};
107
108// This table should be sorted by the value of GPUKind
109// Don't bother listing the implicitly true features
110constexpr GPUInfo AMDGCNGPUs[] = {
111 // clang-format off
112 // Name Canonical Kind Features
113 // Name
114 {.Name: {"gfx600"}, .CanonicalName: {"gfx600"}, .Kind: GK_GFX600, .Features: FEATURE_FAST_FMA_F32},
115 {.Name: {"tahiti"}, .CanonicalName: {"gfx600"}, .Kind: GK_GFX600, .Features: FEATURE_FAST_FMA_F32},
116 {.Name: {"gfx601"}, .CanonicalName: {"gfx601"}, .Kind: GK_GFX601, .Features: FEATURE_NONE},
117 {.Name: {"pitcairn"}, .CanonicalName: {"gfx601"}, .Kind: GK_GFX601, .Features: FEATURE_NONE},
118 {.Name: {"verde"}, .CanonicalName: {"gfx601"}, .Kind: GK_GFX601, .Features: FEATURE_NONE},
119 {.Name: {"gfx602"}, .CanonicalName: {"gfx602"}, .Kind: GK_GFX602, .Features: FEATURE_NONE},
120 {.Name: {"hainan"}, .CanonicalName: {"gfx602"}, .Kind: GK_GFX602, .Features: FEATURE_NONE},
121 {.Name: {"oland"}, .CanonicalName: {"gfx602"}, .Kind: GK_GFX602, .Features: FEATURE_NONE},
122 {.Name: {"gfx700"}, .CanonicalName: {"gfx700"}, .Kind: GK_GFX700, .Features: FEATURE_NONE},
123 {.Name: {"kaveri"}, .CanonicalName: {"gfx700"}, .Kind: GK_GFX700, .Features: FEATURE_NONE},
124 {.Name: {"gfx701"}, .CanonicalName: {"gfx701"}, .Kind: GK_GFX701, .Features: FEATURE_FAST_FMA_F32},
125 {.Name: {"hawaii"}, .CanonicalName: {"gfx701"}, .Kind: GK_GFX701, .Features: FEATURE_FAST_FMA_F32},
126 {.Name: {"gfx702"}, .CanonicalName: {"gfx702"}, .Kind: GK_GFX702, .Features: FEATURE_FAST_FMA_F32},
127 {.Name: {"gfx703"}, .CanonicalName: {"gfx703"}, .Kind: GK_GFX703, .Features: FEATURE_NONE},
128 {.Name: {"kabini"}, .CanonicalName: {"gfx703"}, .Kind: GK_GFX703, .Features: FEATURE_NONE},
129 {.Name: {"mullins"}, .CanonicalName: {"gfx703"}, .Kind: GK_GFX703, .Features: FEATURE_NONE},
130 {.Name: {"gfx704"}, .CanonicalName: {"gfx704"}, .Kind: GK_GFX704, .Features: FEATURE_NONE},
131 {.Name: {"bonaire"}, .CanonicalName: {"gfx704"}, .Kind: GK_GFX704, .Features: FEATURE_NONE},
132 {.Name: {"gfx705"}, .CanonicalName: {"gfx705"}, .Kind: GK_GFX705, .Features: FEATURE_NONE},
133 {.Name: {"gfx801"}, .CanonicalName: {"gfx801"}, .Kind: GK_GFX801, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
134 {.Name: {"carrizo"}, .CanonicalName: {"gfx801"}, .Kind: GK_GFX801, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
135 {.Name: {"gfx802"}, .CanonicalName: {"gfx802"}, .Kind: GK_GFX802, .Features: FEATURE_FAST_DENORMAL_F32},
136 {.Name: {"iceland"}, .CanonicalName: {"gfx802"}, .Kind: GK_GFX802, .Features: FEATURE_FAST_DENORMAL_F32},
137 {.Name: {"tonga"}, .CanonicalName: {"gfx802"}, .Kind: GK_GFX802, .Features: FEATURE_FAST_DENORMAL_F32},
138 {.Name: {"gfx803"}, .CanonicalName: {"gfx803"}, .Kind: GK_GFX803, .Features: FEATURE_FAST_DENORMAL_F32},
139 {.Name: {"fiji"}, .CanonicalName: {"gfx803"}, .Kind: GK_GFX803, .Features: FEATURE_FAST_DENORMAL_F32},
140 {.Name: {"polaris10"}, .CanonicalName: {"gfx803"}, .Kind: GK_GFX803, .Features: FEATURE_FAST_DENORMAL_F32},
141 {.Name: {"polaris11"}, .CanonicalName: {"gfx803"}, .Kind: GK_GFX803, .Features: FEATURE_FAST_DENORMAL_F32},
142 {.Name: {"gfx805"}, .CanonicalName: {"gfx805"}, .Kind: GK_GFX805, .Features: FEATURE_FAST_DENORMAL_F32},
143 {.Name: {"tongapro"}, .CanonicalName: {"gfx805"}, .Kind: GK_GFX805, .Features: FEATURE_FAST_DENORMAL_F32},
144 {.Name: {"gfx810"}, .CanonicalName: {"gfx810"}, .Kind: GK_GFX810, .Features: FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
145 {.Name: {"stoney"}, .CanonicalName: {"gfx810"}, .Kind: GK_GFX810, .Features: FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
146 {.Name: {"gfx900"}, .CanonicalName: {"gfx900"}, .Kind: GK_GFX900, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
147 {.Name: {"gfx902"}, .CanonicalName: {"gfx902"}, .Kind: GK_GFX902, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
148 {.Name: {"gfx904"}, .CanonicalName: {"gfx904"}, .Kind: GK_GFX904, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
149 {.Name: {"gfx906"}, .CanonicalName: {"gfx906"}, .Kind: GK_GFX906, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
150 {.Name: {"gfx908"}, .CanonicalName: {"gfx908"}, .Kind: GK_GFX908, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
151 {.Name: {"gfx909"}, .CanonicalName: {"gfx909"}, .Kind: GK_GFX909, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
152 {.Name: {"gfx90a"}, .CanonicalName: {"gfx90a"}, .Kind: GK_GFX90A, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
153 {.Name: {"gfx90c"}, .CanonicalName: {"gfx90c"}, .Kind: GK_GFX90C, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
154 {.Name: {"gfx942"}, .CanonicalName: {"gfx942"}, .Kind: GK_GFX942, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
155 {.Name: {"gfx950"}, .CanonicalName: {"gfx950"}, .Kind: GK_GFX950, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
156 {.Name: {"gfx1010"}, .CanonicalName: {"gfx1010"}, .Kind: GK_GFX1010, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
157 {.Name: {"gfx1011"}, .CanonicalName: {"gfx1011"}, .Kind: GK_GFX1011, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
158 {.Name: {"gfx1012"}, .CanonicalName: {"gfx1012"}, .Kind: GK_GFX1012, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
159 {.Name: {"gfx1013"}, .CanonicalName: {"gfx1013"}, .Kind: GK_GFX1013, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
160 {.Name: {"gfx1030"}, .CanonicalName: {"gfx1030"}, .Kind: GK_GFX1030, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
161 {.Name: {"gfx1031"}, .CanonicalName: {"gfx1031"}, .Kind: GK_GFX1031, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
162 {.Name: {"gfx1032"}, .CanonicalName: {"gfx1032"}, .Kind: GK_GFX1032, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
163 {.Name: {"gfx1033"}, .CanonicalName: {"gfx1033"}, .Kind: GK_GFX1033, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
164 {.Name: {"gfx1034"}, .CanonicalName: {"gfx1034"}, .Kind: GK_GFX1034, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
165 {.Name: {"gfx1035"}, .CanonicalName: {"gfx1035"}, .Kind: GK_GFX1035, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
166 {.Name: {"gfx1036"}, .CanonicalName: {"gfx1036"}, .Kind: GK_GFX1036, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
167 {.Name: {"gfx1100"}, .CanonicalName: {"gfx1100"}, .Kind: GK_GFX1100, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
168 {.Name: {"gfx1101"}, .CanonicalName: {"gfx1101"}, .Kind: GK_GFX1101, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
169 {.Name: {"gfx1102"}, .CanonicalName: {"gfx1102"}, .Kind: GK_GFX1102, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
170 {.Name: {"gfx1103"}, .CanonicalName: {"gfx1103"}, .Kind: GK_GFX1103, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
171 {.Name: {"gfx1150"}, .CanonicalName: {"gfx1150"}, .Kind: GK_GFX1150, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
172 {.Name: {"gfx1151"}, .CanonicalName: {"gfx1151"}, .Kind: GK_GFX1151, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
173 {.Name: {"gfx1152"}, .CanonicalName: {"gfx1152"}, .Kind: GK_GFX1152, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
174 {.Name: {"gfx1153"}, .CanonicalName: {"gfx1153"}, .Kind: GK_GFX1153, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
175 {.Name: {"gfx1170"}, .CanonicalName: {"gfx1170"}, .Kind: GK_GFX1170, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
176 {.Name: {"gfx1200"}, .CanonicalName: {"gfx1200"}, .Kind: GK_GFX1200, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
177 {.Name: {"gfx1201"}, .CanonicalName: {"gfx1201"}, .Kind: GK_GFX1201, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
178 {.Name: {"gfx1250"}, .CanonicalName: {"gfx1250"}, .Kind: GK_GFX1250, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK_ALWAYS},
179 {.Name: {"gfx1251"}, .CanonicalName: {"gfx1251"}, .Kind: GK_GFX1251, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK_ALWAYS},
180 {.Name: {"gfx1310"}, .CanonicalName: {"gfx1310"}, .Kind: GK_GFX1310, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
181
182 {.Name: {"gfx9-generic"}, .CanonicalName: {"gfx9-generic"}, .Kind: GK_GFX9_GENERIC, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
183 {.Name: {"gfx10-1-generic"}, .CanonicalName: {"gfx10-1-generic"}, .Kind: GK_GFX10_1_GENERIC, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
184 {.Name: {"gfx10-3-generic"}, .CanonicalName: {"gfx10-3-generic"}, .Kind: GK_GFX10_3_GENERIC, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
185 {.Name: {"gfx11-generic"}, .CanonicalName: {"gfx11-generic"}, .Kind: GK_GFX11_GENERIC, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
186 {.Name: {"gfx12-generic"}, .CanonicalName: {"gfx12-generic"}, .Kind: GK_GFX12_GENERIC, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
187 {.Name: {"gfx9-4-generic"}, .CanonicalName: {"gfx9-4-generic"}, .Kind: GK_GFX9_4_GENERIC, .Features: FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
188 // clang-format on
189};
190
191const GPUInfo *getArchEntry(AMDGPU::GPUKind AK, ArrayRef<GPUInfo> Table) {
192 GPUInfo Search = { .Name: {""}, .CanonicalName: {""}, .Kind: AK, .Features: AMDGPU::FEATURE_NONE };
193
194 auto I =
195 llvm::lower_bound(Range&: Table, Value&: Search, C: [](const GPUInfo &A, const GPUInfo &B) {
196 return A.Kind < B.Kind;
197 });
198
199 if (I == Table.end() || I->Kind != Search.Kind)
200 return nullptr;
201 return I;
202}
203
204} // namespace
205
206StringRef llvm::AMDGPU::getArchFamilyNameAMDGCN(GPUKind AK) {
207 switch (AK) {
208 case AMDGPU::GK_GFX9_GENERIC:
209 case AMDGPU::GK_GFX9_4_GENERIC:
210 return "gfx9";
211 case AMDGPU::GK_GFX10_1_GENERIC:
212 case AMDGPU::GK_GFX10_3_GENERIC:
213 return "gfx10";
214 case AMDGPU::GK_GFX11_GENERIC:
215 return "gfx11";
216 case AMDGPU::GK_GFX12_GENERIC:
217 return "gfx12";
218 default: {
219 StringRef ArchName = getArchNameAMDGCN(AK);
220 return ArchName.empty() ? "" : ArchName.drop_back(N: 2);
221 }
222 }
223}
224
225StringRef llvm::AMDGPU::getArchNameAMDGCN(GPUKind AK) {
226 if (const auto *Entry = getArchEntry(AK, Table: AMDGCNGPUs))
227 return Entry->CanonicalName;
228 return "";
229}
230
231StringRef llvm::AMDGPU::getArchNameR600(GPUKind AK) {
232 if (const auto *Entry = getArchEntry(AK, Table: R600GPUs))
233 return Entry->CanonicalName;
234 return "";
235}
236
237AMDGPU::GPUKind llvm::AMDGPU::parseArchAMDGCN(StringRef CPU) {
238 for (const auto &C : AMDGCNGPUs) {
239 if (CPU == C.Name)
240 return C.Kind;
241 }
242
243 return AMDGPU::GPUKind::GK_NONE;
244}
245
246AMDGPU::GPUKind llvm::AMDGPU::parseArchR600(StringRef CPU) {
247 for (const auto &C : R600GPUs) {
248 if (CPU == C.Name)
249 return C.Kind;
250 }
251
252 return AMDGPU::GPUKind::GK_NONE;
253}
254
255unsigned AMDGPU::getArchAttrAMDGCN(GPUKind AK) {
256 if (const auto *Entry = getArchEntry(AK, Table: AMDGCNGPUs))
257 return Entry->Features;
258 return FEATURE_NONE;
259}
260
261unsigned AMDGPU::getArchAttrR600(GPUKind AK) {
262 if (const auto *Entry = getArchEntry(AK, Table: R600GPUs))
263 return Entry->Features;
264 return FEATURE_NONE;
265}
266
267void AMDGPU::fillValidArchListAMDGCN(SmallVectorImpl<StringRef> &Values) {
268 // XXX: Should this only report unique canonical names?
269 for (const auto &C : AMDGCNGPUs)
270 Values.push_back(Elt: C.Name);
271}
272
273void AMDGPU::fillValidArchListR600(SmallVectorImpl<StringRef> &Values) {
274 for (const auto &C : R600GPUs)
275 Values.push_back(Elt: C.Name);
276}
277
278AMDGPU::IsaVersion AMDGPU::getIsaVersion(StringRef GPU) {
279 AMDGPU::GPUKind AK = parseArchAMDGCN(CPU: GPU);
280 if (AK == AMDGPU::GPUKind::GK_NONE) {
281 if (GPU == "generic-hsa")
282 return {.Major: 7, .Minor: 0, .Stepping: 0};
283 if (GPU == "generic")
284 return {.Major: 6, .Minor: 0, .Stepping: 0};
285 return {.Major: 0, .Minor: 0, .Stepping: 0};
286 }
287
288 // clang-format off
289 switch (AK) {
290 case GK_GFX600: return {.Major: 6, .Minor: 0, .Stepping: 0};
291 case GK_GFX601: return {.Major: 6, .Minor: 0, .Stepping: 1};
292 case GK_GFX602: return {.Major: 6, .Minor: 0, .Stepping: 2};
293 case GK_GFX700: return {.Major: 7, .Minor: 0, .Stepping: 0};
294 case GK_GFX701: return {.Major: 7, .Minor: 0, .Stepping: 1};
295 case GK_GFX702: return {.Major: 7, .Minor: 0, .Stepping: 2};
296 case GK_GFX703: return {.Major: 7, .Minor: 0, .Stepping: 3};
297 case GK_GFX704: return {.Major: 7, .Minor: 0, .Stepping: 4};
298 case GK_GFX705: return {.Major: 7, .Minor: 0, .Stepping: 5};
299 case GK_GFX801: return {.Major: 8, .Minor: 0, .Stepping: 1};
300 case GK_GFX802: return {.Major: 8, .Minor: 0, .Stepping: 2};
301 case GK_GFX803: return {.Major: 8, .Minor: 0, .Stepping: 3};
302 case GK_GFX805: return {.Major: 8, .Minor: 0, .Stepping: 5};
303 case GK_GFX810: return {.Major: 8, .Minor: 1, .Stepping: 0};
304 case GK_GFX900: return {.Major: 9, .Minor: 0, .Stepping: 0};
305 case GK_GFX902: return {.Major: 9, .Minor: 0, .Stepping: 2};
306 case GK_GFX904: return {.Major: 9, .Minor: 0, .Stepping: 4};
307 case GK_GFX906: return {.Major: 9, .Minor: 0, .Stepping: 6};
308 case GK_GFX908: return {.Major: 9, .Minor: 0, .Stepping: 8};
309 case GK_GFX909: return {.Major: 9, .Minor: 0, .Stepping: 9};
310 case GK_GFX90A: return {.Major: 9, .Minor: 0, .Stepping: 10};
311 case GK_GFX90C: return {.Major: 9, .Minor: 0, .Stepping: 12};
312 case GK_GFX942: return {.Major: 9, .Minor: 4, .Stepping: 2};
313 case GK_GFX950: return {.Major: 9, .Minor: 5, .Stepping: 0};
314 case GK_GFX1010: return {.Major: 10, .Minor: 1, .Stepping: 0};
315 case GK_GFX1011: return {.Major: 10, .Minor: 1, .Stepping: 1};
316 case GK_GFX1012: return {.Major: 10, .Minor: 1, .Stepping: 2};
317 case GK_GFX1013: return {.Major: 10, .Minor: 1, .Stepping: 3};
318 case GK_GFX1030: return {.Major: 10, .Minor: 3, .Stepping: 0};
319 case GK_GFX1031: return {.Major: 10, .Minor: 3, .Stepping: 1};
320 case GK_GFX1032: return {.Major: 10, .Minor: 3, .Stepping: 2};
321 case GK_GFX1033: return {.Major: 10, .Minor: 3, .Stepping: 3};
322 case GK_GFX1034: return {.Major: 10, .Minor: 3, .Stepping: 4};
323 case GK_GFX1035: return {.Major: 10, .Minor: 3, .Stepping: 5};
324 case GK_GFX1036: return {.Major: 10, .Minor: 3, .Stepping: 6};
325 case GK_GFX1100: return {.Major: 11, .Minor: 0, .Stepping: 0};
326 case GK_GFX1101: return {.Major: 11, .Minor: 0, .Stepping: 1};
327 case GK_GFX1102: return {.Major: 11, .Minor: 0, .Stepping: 2};
328 case GK_GFX1103: return {.Major: 11, .Minor: 0, .Stepping: 3};
329 case GK_GFX1150: return {.Major: 11, .Minor: 5, .Stepping: 0};
330 case GK_GFX1151: return {.Major: 11, .Minor: 5, .Stepping: 1};
331 case GK_GFX1152: return {.Major: 11, .Minor: 5, .Stepping: 2};
332 case GK_GFX1153: return {.Major: 11, .Minor: 5, .Stepping: 3};
333 case GK_GFX1170: return {.Major: 11, .Minor: 7, .Stepping: 0};
334 case GK_GFX1200: return {.Major: 12, .Minor: 0, .Stepping: 0};
335 case GK_GFX1201: return {.Major: 12, .Minor: 0, .Stepping: 1};
336 case GK_GFX1250: return {.Major: 12, .Minor: 5, .Stepping: 0};
337 case GK_GFX1251: return {.Major: 12, .Minor: 5, .Stepping: 1};
338 case GK_GFX1310: return {.Major: 13, .Minor: 1, .Stepping: 0};
339
340 // Generic targets return the lowest common denominator
341 // within their family. That is, the ISA that is the most
342 // restricted in terms of features.
343 //
344 // gfx9-generic is tricky because there is no lowest
345 // common denominator, so we return gfx900 which has mad-mix
346 // but this family doesn't have it.
347 //
348 // This API should never be used to check for a particular
349 // feature anyway.
350 //
351 // TODO: Split up this API depending on its caller so
352 // generic target handling is more obvious and less risky.
353 case GK_GFX9_GENERIC: return {.Major: 9, .Minor: 0, .Stepping: 0};
354 case GK_GFX9_4_GENERIC: return {.Major: 9, .Minor: 4, .Stepping: 0};
355 case GK_GFX10_1_GENERIC: return {.Major: 10, .Minor: 1, .Stepping: 0};
356 case GK_GFX10_3_GENERIC: return {.Major: 10, .Minor: 3, .Stepping: 0};
357 case GK_GFX11_GENERIC: return {.Major: 11, .Minor: 0, .Stepping: 3};
358 case GK_GFX12_GENERIC: return {.Major: 12, .Minor: 0, .Stepping: 0};
359 default: return {.Major: 0, .Minor: 0, .Stepping: 0};
360 }
361 // clang-format on
362}
363
364StringRef AMDGPU::getCanonicalArchName(const Triple &T, StringRef Arch) {
365 assert(T.isAMDGPU());
366 auto ProcKind = T.isAMDGCN() ? parseArchAMDGCN(CPU: Arch) : parseArchR600(CPU: Arch);
367 if (ProcKind == GK_NONE)
368 return StringRef();
369
370 return T.isAMDGCN() ? getArchNameAMDGCN(AK: ProcKind) : getArchNameR600(AK: ProcKind);
371}
372
373static std::pair<FeatureError, StringRef>
374insertWaveSizeFeature(StringRef GPU, const Triple &T,
375 const StringMap<bool> &DefaultFeatures,
376 StringMap<bool> &Features) {
377 const bool IsNullGPU = GPU.empty();
378 const bool TargetHasWave32 = DefaultFeatures.count(Key: "wavefrontsize32");
379 const bool TargetHasWave64 = DefaultFeatures.count(Key: "wavefrontsize64");
380
381 auto Wave32Itr = Features.find(Key: "wavefrontsize32");
382 auto Wave64Itr = Features.find(Key: "wavefrontsize64");
383 const bool EnableWave32 =
384 Wave32Itr != Features.end() && Wave32Itr->getValue();
385 const bool EnableWave64 =
386 Wave64Itr != Features.end() && Wave64Itr->getValue();
387 const bool DisableWave32 =
388 Wave32Itr != Features.end() && !Wave32Itr->getValue();
389 const bool DisableWave64 =
390 Wave64Itr != Features.end() && !Wave64Itr->getValue();
391
392 if (EnableWave32 && EnableWave64)
393 return {AMDGPU::INVALID_FEATURE_COMBINATION,
394 "'+wavefrontsize32' and '+wavefrontsize64' are mutually exclusive"};
395 if (DisableWave32 && DisableWave64)
396 return {AMDGPU::INVALID_FEATURE_COMBINATION,
397 "'-wavefrontsize32' and '-wavefrontsize64' are mutually exclusive"};
398
399 if (!IsNullGPU) {
400 if (TargetHasWave64) {
401 if (EnableWave32)
402 return {AMDGPU::UNSUPPORTED_TARGET_FEATURE, "+wavefrontsize32"};
403 if (DisableWave64)
404 return {AMDGPU::UNSUPPORTED_TARGET_FEATURE, "-wavefrontsize64"};
405 }
406
407 if (TargetHasWave32) {
408 if (EnableWave64)
409 return {AMDGPU::UNSUPPORTED_TARGET_FEATURE, "+wavefrontsize64"};
410 if (DisableWave32)
411 return {AMDGPU::UNSUPPORTED_TARGET_FEATURE, "-wavefrontsize32"};
412 }
413 }
414
415 // Don't assume any wavesize with an unknown subtarget.
416 // Default to wave32 if target supports both.
417 if (!IsNullGPU && !EnableWave32 && !EnableWave64 && !TargetHasWave32 &&
418 !TargetHasWave64)
419 Features.insert(KV: std::make_pair(x: "wavefrontsize32", y: true));
420
421 for (const auto &Entry : DefaultFeatures) {
422 if (!Features.count(Key: Entry.getKey()))
423 Features[Entry.getKey()] = Entry.getValue();
424 }
425
426 return {NO_ERROR, StringRef()};
427}
428
429/// Fills Features map with default values for given target GPU.
430/// \p Features contains overriding target features and this function returns
431/// default target features with entries overridden by \p Features.
432static void fillAMDGCNFeatureMap(StringRef GPU, const Triple &T,
433 StringMap<bool> &Features) {
434 AMDGPU::GPUKind Kind = parseArchAMDGCN(CPU: GPU);
435 switch (Kind) {
436 case GK_GFX1310:
437 case GK_GFX1251:
438 case GK_GFX1250:
439 Features["ci-insts"] = true;
440 Features["dot7-insts"] = true;
441 Features["dot8-insts"] = true;
442 Features["dl-insts"] = true;
443 Features["16-bit-insts"] = true;
444 Features["dpp"] = true;
445 Features["gfx8-insts"] = true;
446 Features["gfx9-insts"] = true;
447 Features["gfx10-insts"] = true;
448 Features["gfx10-3-insts"] = true;
449 Features["gfx11-insts"] = true;
450 Features["gfx12-insts"] = true;
451 Features["gfx1250-insts"] = true;
452 Features["bitop3-insts"] = true;
453 Features["prng-inst"] = true;
454 Features["tanh-insts"] = true;
455 Features["tensor-cvt-lut-insts"] = true;
456 Features["transpose-load-f4f6-insts"] = true;
457 Features["bf16-trans-insts"] = true;
458 Features["bf16-cvt-insts"] = true;
459 Features["bf16-pk-insts"] = true;
460 Features["fp8-conversion-insts"] = true;
461 Features["fp8e5m3-insts"] = true;
462 Features["permlane16-swap"] = true;
463 Features["ashr-pk-insts"] = true;
464 Features["add-min-max-insts"] = true;
465 Features["pk-add-min-max-insts"] = true;
466 Features["atomic-buffer-pk-add-bf16-inst"] = true;
467 Features["vmem-pref-insts"] = true;
468 Features["atomic-fadd-rtn-insts"] = true;
469 Features["atomic-buffer-global-pk-add-f16-insts"] = true;
470 Features["atomic-flat-pk-add-16-insts"] = true;
471 Features["atomic-global-pk-add-bf16-inst"] = true;
472 Features["atomic-ds-pk-add-16-insts"] = true;
473 Features["setprio-inc-wg-inst"] = true;
474 Features["s-wakeup-barrier-inst"] = true;
475 Features["atomic-fmin-fmax-global-f32"] = true;
476 Features["atomic-fmin-fmax-global-f64"] = true;
477 Features["wavefrontsize32"] = true;
478 Features["clusters"] = true;
479 Features["mcast-load-insts"] = true;
480 Features["cube-insts"] = true;
481 Features["lerp-inst"] = true;
482 Features["sad-insts"] = true;
483 Features["qsad-insts"] = true;
484 Features["cvt-pknorm-vop2-insts"] = true;
485 break;
486 case GK_GFX1201:
487 case GK_GFX1200:
488 case GK_GFX12_GENERIC:
489 Features["ci-insts"] = true;
490 Features["dot7-insts"] = true;
491 Features["dot8-insts"] = true;
492 Features["dot9-insts"] = true;
493 Features["dot10-insts"] = true;
494 Features["dot11-insts"] = true;
495 Features["dot12-insts"] = true;
496 Features["dl-insts"] = true;
497 Features["atomic-ds-pk-add-16-insts"] = true;
498 Features["atomic-flat-pk-add-16-insts"] = true;
499 Features["atomic-buffer-global-pk-add-f16-insts"] = true;
500 Features["atomic-buffer-pk-add-bf16-inst"] = true;
501 Features["atomic-global-pk-add-bf16-inst"] = true;
502 Features["16-bit-insts"] = true;
503 Features["dpp"] = true;
504 Features["gfx8-insts"] = true;
505 Features["gfx9-insts"] = true;
506 Features["gfx10-insts"] = true;
507 Features["gfx10-3-insts"] = true;
508 Features["gfx11-insts"] = true;
509 Features["gfx12-insts"] = true;
510 Features["atomic-fadd-rtn-insts"] = true;
511 Features["image-insts"] = true;
512 Features["cube-insts"] = true;
513 Features["lerp-inst"] = true;
514 Features["sad-insts"] = true;
515 Features["qsad-insts"] = true;
516 Features["cvt-pknorm-vop2-insts"] = true;
517 Features["fp8-conversion-insts"] = true;
518 Features["wmma-128b-insts"] = true;
519 Features["atomic-fmin-fmax-global-f32"] = true;
520 break;
521 case GK_GFX1170:
522 Features["ci-insts"] = true;
523 Features["dot7-insts"] = true;
524 Features["dot8-insts"] = true;
525 Features["dot9-insts"] = true;
526 Features["dot10-insts"] = true;
527 Features["dot12-insts"] = true;
528 Features["dl-insts"] = true;
529 Features["16-bit-insts"] = true;
530 Features["dpp"] = true;
531 Features["gfx8-insts"] = true;
532 Features["gfx9-insts"] = true;
533 Features["gfx10-insts"] = true;
534 Features["gfx10-3-insts"] = true;
535 Features["gfx11-insts"] = true;
536 Features["atomic-fadd-rtn-insts"] = true;
537 Features["image-insts"] = true;
538 Features["cube-insts"] = true;
539 Features["lerp-inst"] = true;
540 Features["sad-insts"] = true;
541 Features["qsad-insts"] = true;
542 Features["cvt-pknorm-vop2-insts"] = true;
543 Features["gws"] = true;
544 Features["dot11-insts"] = true;
545 Features["fp8-conversion-insts"] = true;
546 Features["wmma-128b-insts"] = true;
547 Features["atomic-fmin-fmax-global-f32"] = true;
548 break;
549 case GK_GFX1153:
550 case GK_GFX1152:
551 case GK_GFX1151:
552 case GK_GFX1150:
553 case GK_GFX1103:
554 case GK_GFX1102:
555 case GK_GFX1101:
556 case GK_GFX1100:
557 case GK_GFX11_GENERIC:
558 Features["ci-insts"] = true;
559 Features["dot5-insts"] = true;
560 Features["dot7-insts"] = true;
561 Features["dot8-insts"] = true;
562 Features["dot9-insts"] = true;
563 Features["dot10-insts"] = true;
564 Features["dot12-insts"] = true;
565 Features["dl-insts"] = true;
566 Features["16-bit-insts"] = true;
567 Features["dpp"] = true;
568 Features["gfx8-insts"] = true;
569 Features["gfx9-insts"] = true;
570 Features["gfx10-insts"] = true;
571 Features["gfx10-3-insts"] = true;
572 Features["gfx11-insts"] = true;
573 Features["atomic-fadd-rtn-insts"] = true;
574 Features["image-insts"] = true;
575 Features["cube-insts"] = true;
576 Features["lerp-inst"] = true;
577 Features["sad-insts"] = true;
578 Features["qsad-insts"] = true;
579 Features["cvt-pknorm-vop2-insts"] = true;
580 Features["gws"] = true;
581 Features["wmma-256b-insts"] = true;
582 Features["atomic-fmin-fmax-global-f32"] = true;
583 break;
584 case GK_GFX1036:
585 case GK_GFX1035:
586 case GK_GFX1034:
587 case GK_GFX1033:
588 case GK_GFX1032:
589 case GK_GFX1031:
590 case GK_GFX1030:
591 case GK_GFX10_3_GENERIC:
592 Features["ci-insts"] = true;
593 Features["dot1-insts"] = true;
594 Features["dot2-insts"] = true;
595 Features["dot5-insts"] = true;
596 Features["dot6-insts"] = true;
597 Features["dot7-insts"] = true;
598 Features["dot10-insts"] = true;
599 Features["dl-insts"] = true;
600 Features["16-bit-insts"] = true;
601 Features["dpp"] = true;
602 Features["gfx8-insts"] = true;
603 Features["gfx9-insts"] = true;
604 Features["gfx10-insts"] = true;
605 Features["gfx10-3-insts"] = true;
606 Features["image-insts"] = true;
607 Features["s-memrealtime"] = true;
608 Features["s-memtime-inst"] = true;
609 Features["gws"] = true;
610 Features["vmem-to-lds-load-insts"] = true;
611 Features["atomic-fmin-fmax-global-f32"] = true;
612 Features["atomic-fmin-fmax-global-f64"] = true;
613 Features["cube-insts"] = true;
614 Features["lerp-inst"] = true;
615 Features["sad-insts"] = true;
616 Features["qsad-insts"] = true;
617 Features["cvt-pknorm-vop2-insts"] = true;
618 break;
619 case GK_GFX1012:
620 case GK_GFX1011:
621 Features["dot1-insts"] = true;
622 Features["dot2-insts"] = true;
623 Features["dot5-insts"] = true;
624 Features["dot6-insts"] = true;
625 Features["dot7-insts"] = true;
626 Features["dot10-insts"] = true;
627 [[fallthrough]];
628 case GK_GFX1013:
629 case GK_GFX1010:
630 case GK_GFX10_1_GENERIC:
631 Features["dl-insts"] = true;
632 Features["ci-insts"] = true;
633 Features["16-bit-insts"] = true;
634 Features["dpp"] = true;
635 Features["gfx8-insts"] = true;
636 Features["gfx9-insts"] = true;
637 Features["gfx10-insts"] = true;
638 Features["image-insts"] = true;
639 Features["s-memrealtime"] = true;
640 Features["s-memtime-inst"] = true;
641 Features["gws"] = true;
642 Features["vmem-to-lds-load-insts"] = true;
643 Features["atomic-fmin-fmax-global-f32"] = true;
644 Features["atomic-fmin-fmax-global-f64"] = true;
645 Features["cube-insts"] = true;
646 Features["lerp-inst"] = true;
647 Features["sad-insts"] = true;
648 Features["qsad-insts"] = true;
649 Features["cvt-pknorm-vop2-insts"] = true;
650 break;
651 case GK_GFX950:
652 Features["bitop3-insts"] = true;
653 Features["fp6bf6-cvt-scale-insts"] = true;
654 Features["fp4-cvt-scale-insts"] = true;
655 Features["bf8-cvt-scale-insts"] = true;
656 Features["fp8-cvt-scale-insts"] = true;
657 Features["f16bf16-to-fp6bf6-cvt-scale-insts"] = true;
658 Features["f32-to-f16bf16-cvt-sr-insts"] = true;
659 Features["prng-inst"] = true;
660 Features["permlane16-swap"] = true;
661 Features["permlane32-swap"] = true;
662 Features["ashr-pk-insts"] = true;
663 Features["dot12-insts"] = true;
664 Features["dot13-insts"] = true;
665 Features["atomic-buffer-pk-add-bf16-inst"] = true;
666 Features["gfx950-insts"] = true;
667 [[fallthrough]];
668 case GK_GFX942:
669 Features["fp8-insts"] = true;
670 Features["fp8-conversion-insts"] = true;
671 if (Kind != GK_GFX950)
672 Features["xf32-insts"] = true;
673 [[fallthrough]];
674 case GK_GFX9_4_GENERIC:
675 Features["gfx940-insts"] = true;
676 Features["atomic-ds-pk-add-16-insts"] = true;
677 Features["atomic-flat-pk-add-16-insts"] = true;
678 Features["atomic-global-pk-add-bf16-inst"] = true;
679 Features["gfx90a-insts"] = true;
680 Features["atomic-buffer-global-pk-add-f16-insts"] = true;
681 Features["atomic-fadd-rtn-insts"] = true;
682 Features["dot3-insts"] = true;
683 Features["dot4-insts"] = true;
684 Features["dot5-insts"] = true;
685 Features["dot6-insts"] = true;
686 Features["mai-insts"] = true;
687 Features["dl-insts"] = true;
688 Features["dot1-insts"] = true;
689 Features["dot2-insts"] = true;
690 Features["dot7-insts"] = true;
691 Features["dot10-insts"] = true;
692 Features["gfx9-insts"] = true;
693 Features["gfx8-insts"] = true;
694 Features["16-bit-insts"] = true;
695 Features["dpp"] = true;
696 Features["s-memrealtime"] = true;
697 Features["ci-insts"] = true;
698 Features["s-memtime-inst"] = true;
699 Features["gws"] = true;
700 Features["vmem-to-lds-load-insts"] = true;
701 Features["atomic-fmin-fmax-global-f64"] = true;
702 Features["wavefrontsize64"] = true;
703 Features["cube-insts"] = true;
704 Features["lerp-inst"] = true;
705 Features["sad-insts"] = true;
706 Features["qsad-insts"] = true;
707 Features["cvt-pknorm-vop2-insts"] = true;
708 break;
709 case GK_GFX90A:
710 Features["gfx90a-insts"] = true;
711 Features["atomic-buffer-global-pk-add-f16-insts"] = true;
712 Features["atomic-fadd-rtn-insts"] = true;
713 Features["atomic-fmin-fmax-global-f64"] = true;
714 [[fallthrough]];
715 case GK_GFX908:
716 Features["dot3-insts"] = true;
717 Features["dot4-insts"] = true;
718 Features["dot5-insts"] = true;
719 Features["dot6-insts"] = true;
720 Features["mai-insts"] = true;
721 [[fallthrough]];
722 case GK_GFX906:
723 Features["dl-insts"] = true;
724 Features["dot1-insts"] = true;
725 Features["dot2-insts"] = true;
726 Features["dot7-insts"] = true;
727 Features["dot10-insts"] = true;
728 [[fallthrough]];
729 case GK_GFX90C:
730 case GK_GFX909:
731 case GK_GFX904:
732 case GK_GFX902:
733 case GK_GFX900:
734 case GK_GFX9_GENERIC:
735 Features["gfx9-insts"] = true;
736 Features["vmem-to-lds-load-insts"] = true;
737 [[fallthrough]];
738 case GK_GFX810:
739 case GK_GFX805:
740 case GK_GFX803:
741 case GK_GFX802:
742 case GK_GFX801:
743 Features["gfx8-insts"] = true;
744 Features["16-bit-insts"] = true;
745 Features["dpp"] = true;
746 Features["s-memrealtime"] = true;
747 Features["ci-insts"] = true;
748 Features["image-insts"] = true;
749 Features["s-memtime-inst"] = true;
750 Features["gws"] = true;
751 Features["wavefrontsize64"] = true;
752 Features["cube-insts"] = true;
753 Features["lerp-inst"] = true;
754 Features["sad-insts"] = true;
755 Features["qsad-insts"] = true;
756 Features["cvt-pknorm-vop2-insts"] = true;
757 break;
758 case GK_GFX705:
759 case GK_GFX704:
760 case GK_GFX703:
761 case GK_GFX702:
762 case GK_GFX701:
763 case GK_GFX700:
764 Features["ci-insts"] = true;
765 Features["cube-insts"] = true;
766 Features["lerp-inst"] = true;
767 Features["sad-insts"] = true;
768 Features["qsad-insts"] = true;
769 Features["cvt-pknorm-vop2-insts"] = true;
770 Features["image-insts"] = true;
771 Features["s-memtime-inst"] = true;
772 Features["gws"] = true;
773 Features["atomic-fmin-fmax-global-f32"] = true;
774 Features["atomic-fmin-fmax-global-f64"] = true;
775 Features["wavefrontsize64"] = true;
776 break;
777 case GK_GFX602:
778 case GK_GFX601:
779 case GK_GFX600:
780 Features["image-insts"] = true;
781 Features["s-memtime-inst"] = true;
782 Features["gws"] = true;
783 Features["atomic-fmin-fmax-global-f32"] = true;
784 Features["atomic-fmin-fmax-global-f64"] = true;
785 Features["wavefrontsize64"] = true;
786 Features["cube-insts"] = true;
787 Features["lerp-inst"] = true;
788 Features["sad-insts"] = true;
789 Features["cvt-pknorm-vop2-insts"] = true;
790 break;
791 case GK_NONE:
792 break;
793 default:
794 llvm_unreachable("Unhandled GPU!");
795 }
796}
797
798/// Fills Features map with default values for given target GPU.
799/// \p Features contains overriding target features and this function returns
800/// default target features with entries overridden by \p Features.
801std::pair<FeatureError, StringRef>
802AMDGPU::fillAMDGPUFeatureMap(StringRef GPU, const Triple &T,
803 StringMap<bool> &Features) {
804 // XXX - What does the member GPU mean if device name string passed here?
805 if (T.isSPIRV() && T.getOS() == Triple::OSType::AMDHSA) {
806 // AMDGCN SPIRV must support the union of all AMDGCN features. This list
807 // should be kept in sorted order and updated whenever new features are
808 // added.
809 Features["16-bit-insts"] = true;
810 Features["ashr-pk-insts"] = true;
811 Features["atomic-buffer-pk-add-bf16-inst"] = true;
812 Features["atomic-buffer-global-pk-add-f16-insts"] = true;
813 Features["atomic-ds-pk-add-16-insts"] = true;
814 Features["atomic-fadd-rtn-insts"] = true;
815 Features["atomic-flat-pk-add-16-insts"] = true;
816 Features["atomic-global-pk-add-bf16-inst"] = true;
817 Features["bf16-trans-insts"] = true;
818 Features["bf16-cvt-insts"] = true;
819 Features["bf8-cvt-scale-insts"] = true;
820 Features["bitop3-insts"] = true;
821 Features["ci-insts"] = true;
822 Features["dl-insts"] = true;
823 Features["dot1-insts"] = true;
824 Features["dot2-insts"] = true;
825 Features["dot3-insts"] = true;
826 Features["dot4-insts"] = true;
827 Features["dot5-insts"] = true;
828 Features["dot6-insts"] = true;
829 Features["dot7-insts"] = true;
830 Features["dot8-insts"] = true;
831 Features["dot9-insts"] = true;
832 Features["dot10-insts"] = true;
833 Features["dot11-insts"] = true;
834 Features["dot12-insts"] = true;
835 Features["dot13-insts"] = true;
836 Features["dpp"] = true;
837 Features["f16bf16-to-fp6bf6-cvt-scale-insts"] = true;
838 Features["f32-to-f16bf16-cvt-sr-insts"] = true;
839 Features["fp4-cvt-scale-insts"] = true;
840 Features["fp6bf6-cvt-scale-insts"] = true;
841 Features["fp8e5m3-insts"] = true;
842 Features["fp8-conversion-insts"] = true;
843 Features["fp8-cvt-scale-insts"] = true;
844 Features["fp8-insts"] = true;
845 Features["gfx8-insts"] = true;
846 Features["gfx9-insts"] = true;
847 Features["gfx90a-insts"] = true;
848 Features["gfx940-insts"] = true;
849 Features["gfx950-insts"] = true;
850 Features["gfx10-insts"] = true;
851 Features["gfx10-3-insts"] = true;
852 Features["gfx11-insts"] = true;
853 Features["gfx12-insts"] = true;
854 Features["gfx1250-insts"] = true;
855 Features["gws"] = true;
856 Features["image-insts"] = true;
857 Features["mai-insts"] = true;
858 Features["permlane16-swap"] = true;
859 Features["permlane32-swap"] = true;
860 Features["prng-inst"] = true;
861 Features["setprio-inc-wg-inst"] = true;
862 Features["s-memrealtime"] = true;
863 Features["s-memtime-inst"] = true;
864 Features["tanh-insts"] = true;
865 Features["tensor-cvt-lut-insts"] = true;
866 Features["transpose-load-f4f6-insts"] = true;
867 Features["vmem-pref-insts"] = true;
868 Features["vmem-to-lds-load-insts"] = true;
869 Features["wavefrontsize32"] = true;
870 Features["wavefrontsize64"] = true;
871 } else if (T.isAMDGCN()) {
872 StringMap<bool> DefaultFeatures;
873 fillAMDGCNFeatureMap(GPU, T, Features&: DefaultFeatures);
874 return insertWaveSizeFeature(GPU, T, DefaultFeatures, Features);
875 } else {
876 if (GPU.empty())
877 GPU = "r600";
878
879 switch (llvm::AMDGPU::parseArchR600(CPU: GPU)) {
880 case GK_CAYMAN:
881 case GK_CYPRESS:
882 case GK_RV770:
883 case GK_RV670:
884 // TODO: Add fp64 when implemented.
885 break;
886 case GK_TURKS:
887 case GK_CAICOS:
888 case GK_BARTS:
889 case GK_SUMO:
890 case GK_REDWOOD:
891 case GK_JUNIPER:
892 case GK_CEDAR:
893 case GK_RV730:
894 case GK_RV710:
895 case GK_RS880:
896 case GK_R630:
897 case GK_R600:
898 break;
899 default:
900 llvm_unreachable("Unhandled GPU!");
901 }
902 }
903 return {NO_ERROR, StringRef()};
904}
905