1bdd1243dSDimitry Andric //===-- TargetParser - Parser for target features ---------------*- C++ -*-===//
2bdd1243dSDimitry Andric //
3bdd1243dSDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4bdd1243dSDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5bdd1243dSDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6bdd1243dSDimitry Andric //
7bdd1243dSDimitry Andric //===----------------------------------------------------------------------===//
8bdd1243dSDimitry Andric //
9bdd1243dSDimitry Andric // This file implements a target parser to recognise hardware features such as
10bdd1243dSDimitry Andric // FPU/CPU/ARCH names as well as specific support such as HDIV, etc.
11bdd1243dSDimitry Andric //
12bdd1243dSDimitry Andric //===----------------------------------------------------------------------===//
13bdd1243dSDimitry Andric
14bdd1243dSDimitry Andric #include "llvm/TargetParser/TargetParser.h"
15bdd1243dSDimitry Andric #include "llvm/ADT/ArrayRef.h"
16bdd1243dSDimitry Andric #include "llvm/TargetParser/Triple.h"
17bdd1243dSDimitry Andric
18bdd1243dSDimitry Andric using namespace llvm;
19bdd1243dSDimitry Andric using namespace AMDGPU;
20bdd1243dSDimitry Andric
21bdd1243dSDimitry Andric namespace {
22bdd1243dSDimitry Andric
23bdd1243dSDimitry Andric struct GPUInfo {
24bdd1243dSDimitry Andric StringLiteral Name;
25bdd1243dSDimitry Andric StringLiteral CanonicalName;
26bdd1243dSDimitry Andric AMDGPU::GPUKind Kind;
27bdd1243dSDimitry Andric unsigned Features;
28bdd1243dSDimitry Andric };
29bdd1243dSDimitry Andric
30bdd1243dSDimitry Andric constexpr GPUInfo R600GPUs[] = {
31bdd1243dSDimitry Andric // Name Canonical Kind Features
32bdd1243dSDimitry Andric // Name
33bdd1243dSDimitry Andric {{"r600"}, {"r600"}, GK_R600, FEATURE_NONE },
34bdd1243dSDimitry Andric {{"rv630"}, {"r600"}, GK_R600, FEATURE_NONE },
35bdd1243dSDimitry Andric {{"rv635"}, {"r600"}, GK_R600, FEATURE_NONE },
36bdd1243dSDimitry Andric {{"r630"}, {"r630"}, GK_R630, FEATURE_NONE },
37bdd1243dSDimitry Andric {{"rs780"}, {"rs880"}, GK_RS880, FEATURE_NONE },
38bdd1243dSDimitry Andric {{"rs880"}, {"rs880"}, GK_RS880, FEATURE_NONE },
39bdd1243dSDimitry Andric {{"rv610"}, {"rs880"}, GK_RS880, FEATURE_NONE },
40bdd1243dSDimitry Andric {{"rv620"}, {"rs880"}, GK_RS880, FEATURE_NONE },
41bdd1243dSDimitry Andric {{"rv670"}, {"rv670"}, GK_RV670, FEATURE_NONE },
42bdd1243dSDimitry Andric {{"rv710"}, {"rv710"}, GK_RV710, FEATURE_NONE },
43bdd1243dSDimitry Andric {{"rv730"}, {"rv730"}, GK_RV730, FEATURE_NONE },
44bdd1243dSDimitry Andric {{"rv740"}, {"rv770"}, GK_RV770, FEATURE_NONE },
45bdd1243dSDimitry Andric {{"rv770"}, {"rv770"}, GK_RV770, FEATURE_NONE },
46bdd1243dSDimitry Andric {{"cedar"}, {"cedar"}, GK_CEDAR, FEATURE_NONE },
47bdd1243dSDimitry Andric {{"palm"}, {"cedar"}, GK_CEDAR, FEATURE_NONE },
48bdd1243dSDimitry Andric {{"cypress"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA },
49bdd1243dSDimitry Andric {{"hemlock"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA },
50bdd1243dSDimitry Andric {{"juniper"}, {"juniper"}, GK_JUNIPER, FEATURE_NONE },
51bdd1243dSDimitry Andric {{"redwood"}, {"redwood"}, GK_REDWOOD, FEATURE_NONE },
52bdd1243dSDimitry Andric {{"sumo"}, {"sumo"}, GK_SUMO, FEATURE_NONE },
53bdd1243dSDimitry Andric {{"sumo2"}, {"sumo"}, GK_SUMO, FEATURE_NONE },
54bdd1243dSDimitry Andric {{"barts"}, {"barts"}, GK_BARTS, FEATURE_NONE },
55bdd1243dSDimitry Andric {{"caicos"}, {"caicos"}, GK_CAICOS, FEATURE_NONE },
56bdd1243dSDimitry Andric {{"aruba"}, {"cayman"}, GK_CAYMAN, FEATURE_FMA },
57bdd1243dSDimitry Andric {{"cayman"}, {"cayman"}, GK_CAYMAN, FEATURE_FMA },
58bdd1243dSDimitry Andric {{"turks"}, {"turks"}, GK_TURKS, FEATURE_NONE }
59bdd1243dSDimitry Andric };
60bdd1243dSDimitry Andric
61bdd1243dSDimitry Andric // This table should be sorted by the value of GPUKind
62bdd1243dSDimitry Andric // Don't bother listing the implicitly true features
63bdd1243dSDimitry Andric constexpr GPUInfo AMDGCNGPUs[] = {
64c9157d92SDimitry Andric // clang-format off
65bdd1243dSDimitry Andric // Name Canonical Kind Features
66bdd1243dSDimitry Andric // Name
67bdd1243dSDimitry Andric {{"gfx600"}, {"gfx600"}, GK_GFX600, FEATURE_FAST_FMA_F32},
68bdd1243dSDimitry Andric {{"tahiti"}, {"gfx600"}, GK_GFX600, FEATURE_FAST_FMA_F32},
69bdd1243dSDimitry Andric {{"gfx601"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},
70bdd1243dSDimitry Andric {{"pitcairn"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},
71bdd1243dSDimitry Andric {{"verde"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},
72bdd1243dSDimitry Andric {{"gfx602"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},
73bdd1243dSDimitry Andric {{"hainan"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},
74bdd1243dSDimitry Andric {{"oland"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},
75bdd1243dSDimitry Andric {{"gfx700"}, {"gfx700"}, GK_GFX700, FEATURE_NONE},
76bdd1243dSDimitry Andric {{"kaveri"}, {"gfx700"}, GK_GFX700, FEATURE_NONE},
77bdd1243dSDimitry Andric {{"gfx701"}, {"gfx701"}, GK_GFX701, FEATURE_FAST_FMA_F32},
78bdd1243dSDimitry Andric {{"hawaii"}, {"gfx701"}, GK_GFX701, FEATURE_FAST_FMA_F32},
79bdd1243dSDimitry Andric {{"gfx702"}, {"gfx702"}, GK_GFX702, FEATURE_FAST_FMA_F32},
80bdd1243dSDimitry Andric {{"gfx703"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},
81bdd1243dSDimitry Andric {{"kabini"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},
82bdd1243dSDimitry Andric {{"mullins"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},
83bdd1243dSDimitry Andric {{"gfx704"}, {"gfx704"}, GK_GFX704, FEATURE_NONE},
84bdd1243dSDimitry Andric {{"bonaire"}, {"gfx704"}, GK_GFX704, FEATURE_NONE},
85bdd1243dSDimitry Andric {{"gfx705"}, {"gfx705"}, GK_GFX705, FEATURE_NONE},
86bdd1243dSDimitry Andric {{"gfx801"}, {"gfx801"}, GK_GFX801, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
87bdd1243dSDimitry Andric {{"carrizo"}, {"gfx801"}, GK_GFX801, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
88bdd1243dSDimitry Andric {{"gfx802"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},
89bdd1243dSDimitry Andric {{"iceland"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},
90bdd1243dSDimitry Andric {{"tonga"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},
91bdd1243dSDimitry Andric {{"gfx803"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
92bdd1243dSDimitry Andric {{"fiji"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
93bdd1243dSDimitry Andric {{"polaris10"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
94bdd1243dSDimitry Andric {{"polaris11"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},
95bdd1243dSDimitry Andric {{"gfx805"}, {"gfx805"}, GK_GFX805, FEATURE_FAST_DENORMAL_F32},
96bdd1243dSDimitry Andric {{"tongapro"}, {"gfx805"}, GK_GFX805, FEATURE_FAST_DENORMAL_F32},
97bdd1243dSDimitry Andric {{"gfx810"}, {"gfx810"}, GK_GFX810, FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
98bdd1243dSDimitry Andric {{"stoney"}, {"gfx810"}, GK_GFX810, FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
99bdd1243dSDimitry Andric {{"gfx900"}, {"gfx900"}, GK_GFX900, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
100bdd1243dSDimitry Andric {{"gfx902"}, {"gfx902"}, GK_GFX902, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
101bdd1243dSDimitry Andric {{"gfx904"}, {"gfx904"}, GK_GFX904, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
102bdd1243dSDimitry Andric {{"gfx906"}, {"gfx906"}, GK_GFX906, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
103bdd1243dSDimitry Andric {{"gfx908"}, {"gfx908"}, GK_GFX908, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
104bdd1243dSDimitry Andric {{"gfx909"}, {"gfx909"}, GK_GFX909, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
105bdd1243dSDimitry Andric {{"gfx90a"}, {"gfx90a"}, GK_GFX90A, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
106bdd1243dSDimitry Andric {{"gfx90c"}, {"gfx90c"}, GK_GFX90C, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
107bdd1243dSDimitry Andric {{"gfx940"}, {"gfx940"}, GK_GFX940, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
108fe013be4SDimitry Andric {{"gfx941"}, {"gfx941"}, GK_GFX941, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
109fe013be4SDimitry Andric {{"gfx942"}, {"gfx942"}, GK_GFX942, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
110fe013be4SDimitry Andric {{"gfx1010"}, {"gfx1010"}, GK_GFX1010, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
111fe013be4SDimitry Andric {{"gfx1011"}, {"gfx1011"}, GK_GFX1011, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
112fe013be4SDimitry Andric {{"gfx1012"}, {"gfx1012"}, GK_GFX1012, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
113fe013be4SDimitry Andric {{"gfx1013"}, {"gfx1013"}, GK_GFX1013, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
114fe013be4SDimitry Andric {{"gfx1030"}, {"gfx1030"}, GK_GFX1030, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
115fe013be4SDimitry Andric {{"gfx1031"}, {"gfx1031"}, GK_GFX1031, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
116fe013be4SDimitry Andric {{"gfx1032"}, {"gfx1032"}, GK_GFX1032, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
117fe013be4SDimitry Andric {{"gfx1033"}, {"gfx1033"}, GK_GFX1033, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
118fe013be4SDimitry Andric {{"gfx1034"}, {"gfx1034"}, GK_GFX1034, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
119fe013be4SDimitry Andric {{"gfx1035"}, {"gfx1035"}, GK_GFX1035, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
120fe013be4SDimitry Andric {{"gfx1036"}, {"gfx1036"}, GK_GFX1036, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
121fe013be4SDimitry Andric {{"gfx1100"}, {"gfx1100"}, GK_GFX1100, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
122fe013be4SDimitry Andric {{"gfx1101"}, {"gfx1101"}, GK_GFX1101, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
123fe013be4SDimitry Andric {{"gfx1102"}, {"gfx1102"}, GK_GFX1102, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
124fe013be4SDimitry Andric {{"gfx1103"}, {"gfx1103"}, GK_GFX1103, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
125fe013be4SDimitry Andric {{"gfx1150"}, {"gfx1150"}, GK_GFX1150, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
126fe013be4SDimitry Andric {{"gfx1151"}, {"gfx1151"}, GK_GFX1151, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
127c9157d92SDimitry Andric {{"gfx1200"}, {"gfx1200"}, GK_GFX1200, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
128c9157d92SDimitry Andric {{"gfx1201"}, {"gfx1201"}, GK_GFX1201, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
129c9157d92SDimitry Andric // clang-format on
130bdd1243dSDimitry Andric };
131bdd1243dSDimitry Andric
getArchEntry(AMDGPU::GPUKind AK,ArrayRef<GPUInfo> Table)132bdd1243dSDimitry Andric const GPUInfo *getArchEntry(AMDGPU::GPUKind AK, ArrayRef<GPUInfo> Table) {
133bdd1243dSDimitry Andric GPUInfo Search = { {""}, {""}, AK, AMDGPU::FEATURE_NONE };
134bdd1243dSDimitry Andric
135bdd1243dSDimitry Andric auto I =
136bdd1243dSDimitry Andric llvm::lower_bound(Table, Search, [](const GPUInfo &A, const GPUInfo &B) {
137bdd1243dSDimitry Andric return A.Kind < B.Kind;
138bdd1243dSDimitry Andric });
139bdd1243dSDimitry Andric
140c9157d92SDimitry Andric if (I == Table.end() || I->Kind != Search.Kind)
141bdd1243dSDimitry Andric return nullptr;
142bdd1243dSDimitry Andric return I;
143bdd1243dSDimitry Andric }
144bdd1243dSDimitry Andric
145bdd1243dSDimitry Andric } // namespace
146bdd1243dSDimitry Andric
getArchNameAMDGCN(GPUKind AK)147bdd1243dSDimitry Andric StringRef llvm::AMDGPU::getArchNameAMDGCN(GPUKind AK) {
148bdd1243dSDimitry Andric if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs))
149bdd1243dSDimitry Andric return Entry->CanonicalName;
150bdd1243dSDimitry Andric return "";
151bdd1243dSDimitry Andric }
152bdd1243dSDimitry Andric
getArchNameR600(GPUKind AK)153bdd1243dSDimitry Andric StringRef llvm::AMDGPU::getArchNameR600(GPUKind AK) {
154bdd1243dSDimitry Andric if (const auto *Entry = getArchEntry(AK, R600GPUs))
155bdd1243dSDimitry Andric return Entry->CanonicalName;
156bdd1243dSDimitry Andric return "";
157bdd1243dSDimitry Andric }
158bdd1243dSDimitry Andric
parseArchAMDGCN(StringRef CPU)159bdd1243dSDimitry Andric AMDGPU::GPUKind llvm::AMDGPU::parseArchAMDGCN(StringRef CPU) {
160bdd1243dSDimitry Andric for (const auto &C : AMDGCNGPUs) {
161bdd1243dSDimitry Andric if (CPU == C.Name)
162bdd1243dSDimitry Andric return C.Kind;
163bdd1243dSDimitry Andric }
164bdd1243dSDimitry Andric
165bdd1243dSDimitry Andric return AMDGPU::GPUKind::GK_NONE;
166bdd1243dSDimitry Andric }
167bdd1243dSDimitry Andric
parseArchR600(StringRef CPU)168bdd1243dSDimitry Andric AMDGPU::GPUKind llvm::AMDGPU::parseArchR600(StringRef CPU) {
169bdd1243dSDimitry Andric for (const auto &C : R600GPUs) {
170bdd1243dSDimitry Andric if (CPU == C.Name)
171bdd1243dSDimitry Andric return C.Kind;
172bdd1243dSDimitry Andric }
173bdd1243dSDimitry Andric
174bdd1243dSDimitry Andric return AMDGPU::GPUKind::GK_NONE;
175bdd1243dSDimitry Andric }
176bdd1243dSDimitry Andric
getArchAttrAMDGCN(GPUKind AK)177bdd1243dSDimitry Andric unsigned AMDGPU::getArchAttrAMDGCN(GPUKind AK) {
178bdd1243dSDimitry Andric if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs))
179bdd1243dSDimitry Andric return Entry->Features;
180bdd1243dSDimitry Andric return FEATURE_NONE;
181bdd1243dSDimitry Andric }
182bdd1243dSDimitry Andric
getArchAttrR600(GPUKind AK)183bdd1243dSDimitry Andric unsigned AMDGPU::getArchAttrR600(GPUKind AK) {
184bdd1243dSDimitry Andric if (const auto *Entry = getArchEntry(AK, R600GPUs))
185bdd1243dSDimitry Andric return Entry->Features;
186bdd1243dSDimitry Andric return FEATURE_NONE;
187bdd1243dSDimitry Andric }
188bdd1243dSDimitry Andric
fillValidArchListAMDGCN(SmallVectorImpl<StringRef> & Values)189bdd1243dSDimitry Andric void AMDGPU::fillValidArchListAMDGCN(SmallVectorImpl<StringRef> &Values) {
190bdd1243dSDimitry Andric // XXX: Should this only report unique canonical names?
191bdd1243dSDimitry Andric for (const auto &C : AMDGCNGPUs)
192bdd1243dSDimitry Andric Values.push_back(C.Name);
193bdd1243dSDimitry Andric }
194bdd1243dSDimitry Andric
fillValidArchListR600(SmallVectorImpl<StringRef> & Values)195bdd1243dSDimitry Andric void AMDGPU::fillValidArchListR600(SmallVectorImpl<StringRef> &Values) {
196bdd1243dSDimitry Andric for (const auto &C : R600GPUs)
197bdd1243dSDimitry Andric Values.push_back(C.Name);
198bdd1243dSDimitry Andric }
199bdd1243dSDimitry Andric
getIsaVersion(StringRef GPU)200bdd1243dSDimitry Andric AMDGPU::IsaVersion AMDGPU::getIsaVersion(StringRef GPU) {
201bdd1243dSDimitry Andric AMDGPU::GPUKind AK = parseArchAMDGCN(GPU);
202bdd1243dSDimitry Andric if (AK == AMDGPU::GPUKind::GK_NONE) {
203bdd1243dSDimitry Andric if (GPU == "generic-hsa")
204bdd1243dSDimitry Andric return {7, 0, 0};
205bdd1243dSDimitry Andric if (GPU == "generic")
206bdd1243dSDimitry Andric return {6, 0, 0};
207bdd1243dSDimitry Andric return {0, 0, 0};
208bdd1243dSDimitry Andric }
209bdd1243dSDimitry Andric
210c9157d92SDimitry Andric // clang-format off
211bdd1243dSDimitry Andric switch (AK) {
212bdd1243dSDimitry Andric case GK_GFX600: return {6, 0, 0};
213bdd1243dSDimitry Andric case GK_GFX601: return {6, 0, 1};
214bdd1243dSDimitry Andric case GK_GFX602: return {6, 0, 2};
215bdd1243dSDimitry Andric case GK_GFX700: return {7, 0, 0};
216bdd1243dSDimitry Andric case GK_GFX701: return {7, 0, 1};
217bdd1243dSDimitry Andric case GK_GFX702: return {7, 0, 2};
218bdd1243dSDimitry Andric case GK_GFX703: return {7, 0, 3};
219bdd1243dSDimitry Andric case GK_GFX704: return {7, 0, 4};
220bdd1243dSDimitry Andric case GK_GFX705: return {7, 0, 5};
221bdd1243dSDimitry Andric case GK_GFX801: return {8, 0, 1};
222bdd1243dSDimitry Andric case GK_GFX802: return {8, 0, 2};
223bdd1243dSDimitry Andric case GK_GFX803: return {8, 0, 3};
224bdd1243dSDimitry Andric case GK_GFX805: return {8, 0, 5};
225bdd1243dSDimitry Andric case GK_GFX810: return {8, 1, 0};
226bdd1243dSDimitry Andric case GK_GFX900: return {9, 0, 0};
227bdd1243dSDimitry Andric case GK_GFX902: return {9, 0, 2};
228bdd1243dSDimitry Andric case GK_GFX904: return {9, 0, 4};
229bdd1243dSDimitry Andric case GK_GFX906: return {9, 0, 6};
230bdd1243dSDimitry Andric case GK_GFX908: return {9, 0, 8};
231bdd1243dSDimitry Andric case GK_GFX909: return {9, 0, 9};
232bdd1243dSDimitry Andric case GK_GFX90A: return {9, 0, 10};
233bdd1243dSDimitry Andric case GK_GFX90C: return {9, 0, 12};
234bdd1243dSDimitry Andric case GK_GFX940: return {9, 4, 0};
235fe013be4SDimitry Andric case GK_GFX941: return {9, 4, 1};
236fe013be4SDimitry Andric case GK_GFX942: return {9, 4, 2};
237bdd1243dSDimitry Andric case GK_GFX1010: return {10, 1, 0};
238bdd1243dSDimitry Andric case GK_GFX1011: return {10, 1, 1};
239bdd1243dSDimitry Andric case GK_GFX1012: return {10, 1, 2};
240bdd1243dSDimitry Andric case GK_GFX1013: return {10, 1, 3};
241bdd1243dSDimitry Andric case GK_GFX1030: return {10, 3, 0};
242bdd1243dSDimitry Andric case GK_GFX1031: return {10, 3, 1};
243bdd1243dSDimitry Andric case GK_GFX1032: return {10, 3, 2};
244bdd1243dSDimitry Andric case GK_GFX1033: return {10, 3, 3};
245bdd1243dSDimitry Andric case GK_GFX1034: return {10, 3, 4};
246bdd1243dSDimitry Andric case GK_GFX1035: return {10, 3, 5};
247bdd1243dSDimitry Andric case GK_GFX1036: return {10, 3, 6};
248bdd1243dSDimitry Andric case GK_GFX1100: return {11, 0, 0};
249bdd1243dSDimitry Andric case GK_GFX1101: return {11, 0, 1};
250bdd1243dSDimitry Andric case GK_GFX1102: return {11, 0, 2};
251bdd1243dSDimitry Andric case GK_GFX1103: return {11, 0, 3};
252fe013be4SDimitry Andric case GK_GFX1150: return {11, 5, 0};
253fe013be4SDimitry Andric case GK_GFX1151: return {11, 5, 1};
254c9157d92SDimitry Andric case GK_GFX1200: return {12, 0, 0};
255c9157d92SDimitry Andric case GK_GFX1201: return {12, 0, 1};
256bdd1243dSDimitry Andric default: return {0, 0, 0};
257bdd1243dSDimitry Andric }
258c9157d92SDimitry Andric // clang-format on
259bdd1243dSDimitry Andric }
260bdd1243dSDimitry Andric
getCanonicalArchName(const Triple & T,StringRef Arch)261bdd1243dSDimitry Andric StringRef AMDGPU::getCanonicalArchName(const Triple &T, StringRef Arch) {
262bdd1243dSDimitry Andric assert(T.isAMDGPU());
263bdd1243dSDimitry Andric auto ProcKind = T.isAMDGCN() ? parseArchAMDGCN(Arch) : parseArchR600(Arch);
264bdd1243dSDimitry Andric if (ProcKind == GK_NONE)
265bdd1243dSDimitry Andric return StringRef();
266bdd1243dSDimitry Andric
267bdd1243dSDimitry Andric return T.isAMDGCN() ? getArchNameAMDGCN(ProcKind) : getArchNameR600(ProcKind);
268bdd1243dSDimitry Andric }
269fe013be4SDimitry Andric
fillAMDGPUFeatureMap(StringRef GPU,const Triple & T,StringMap<bool> & Features)270fe013be4SDimitry Andric void AMDGPU::fillAMDGPUFeatureMap(StringRef GPU, const Triple &T,
271fe013be4SDimitry Andric StringMap<bool> &Features) {
272fe013be4SDimitry Andric // XXX - What does the member GPU mean if device name string passed here?
273fe013be4SDimitry Andric if (T.isAMDGCN()) {
274fe013be4SDimitry Andric switch (parseArchAMDGCN(GPU)) {
275c9157d92SDimitry Andric case GK_GFX1201:
276c9157d92SDimitry Andric case GK_GFX1200:
277c9157d92SDimitry Andric Features["ci-insts"] = true;
278c9157d92SDimitry Andric Features["dot7-insts"] = true;
279c9157d92SDimitry Andric Features["dot8-insts"] = true;
280c9157d92SDimitry Andric Features["dot9-insts"] = true;
281c9157d92SDimitry Andric Features["dot10-insts"] = true;
282c9157d92SDimitry Andric Features["dl-insts"] = true;
283a58f00eaSDimitry Andric Features["atomic-ds-pk-add-16-insts"] = true;
284a58f00eaSDimitry Andric Features["atomic-flat-pk-add-16-insts"] = true;
285a58f00eaSDimitry Andric Features["atomic-buffer-global-pk-add-f16-insts"] = true;
286a58f00eaSDimitry Andric Features["atomic-global-pk-add-bf16-inst"] = true;
287c9157d92SDimitry Andric Features["16-bit-insts"] = true;
288c9157d92SDimitry Andric Features["dpp"] = true;
289c9157d92SDimitry Andric Features["gfx8-insts"] = true;
290c9157d92SDimitry Andric Features["gfx9-insts"] = true;
291c9157d92SDimitry Andric Features["gfx10-insts"] = true;
292c9157d92SDimitry Andric Features["gfx10-3-insts"] = true;
293c9157d92SDimitry Andric Features["gfx11-insts"] = true;
294c9157d92SDimitry Andric Features["gfx12-insts"] = true;
295c9157d92SDimitry Andric Features["atomic-fadd-rtn-insts"] = true;
296c9157d92SDimitry Andric Features["image-insts"] = true;
297*b9d9368bSDimitry Andric Features["fp8-conversion-insts"] = true;
298c9157d92SDimitry Andric break;
299fe013be4SDimitry Andric case GK_GFX1151:
300fe013be4SDimitry Andric case GK_GFX1150:
301fe013be4SDimitry Andric case GK_GFX1103:
302fe013be4SDimitry Andric case GK_GFX1102:
303fe013be4SDimitry Andric case GK_GFX1101:
304fe013be4SDimitry Andric case GK_GFX1100:
305fe013be4SDimitry Andric Features["ci-insts"] = true;
306fe013be4SDimitry Andric Features["dot5-insts"] = true;
307fe013be4SDimitry Andric Features["dot7-insts"] = true;
308fe013be4SDimitry Andric Features["dot8-insts"] = true;
309fe013be4SDimitry Andric Features["dot9-insts"] = true;
310fe013be4SDimitry Andric Features["dot10-insts"] = true;
311fe013be4SDimitry Andric Features["dl-insts"] = true;
312fe013be4SDimitry Andric Features["16-bit-insts"] = true;
313fe013be4SDimitry Andric Features["dpp"] = true;
314fe013be4SDimitry Andric Features["gfx8-insts"] = true;
315fe013be4SDimitry Andric Features["gfx9-insts"] = true;
316fe013be4SDimitry Andric Features["gfx10-insts"] = true;
317fe013be4SDimitry Andric Features["gfx10-3-insts"] = true;
318fe013be4SDimitry Andric Features["gfx11-insts"] = true;
319fe013be4SDimitry Andric Features["atomic-fadd-rtn-insts"] = true;
320fe013be4SDimitry Andric Features["image-insts"] = true;
321c9157d92SDimitry Andric Features["gws"] = true;
322fe013be4SDimitry Andric break;
323fe013be4SDimitry Andric case GK_GFX1036:
324fe013be4SDimitry Andric case GK_GFX1035:
325fe013be4SDimitry Andric case GK_GFX1034:
326fe013be4SDimitry Andric case GK_GFX1033:
327fe013be4SDimitry Andric case GK_GFX1032:
328fe013be4SDimitry Andric case GK_GFX1031:
329fe013be4SDimitry Andric case GK_GFX1030:
330fe013be4SDimitry Andric Features["ci-insts"] = true;
331fe013be4SDimitry Andric Features["dot1-insts"] = true;
332fe013be4SDimitry Andric Features["dot2-insts"] = true;
333fe013be4SDimitry Andric Features["dot5-insts"] = true;
334fe013be4SDimitry Andric Features["dot6-insts"] = true;
335fe013be4SDimitry Andric Features["dot7-insts"] = true;
336fe013be4SDimitry Andric Features["dot10-insts"] = true;
337fe013be4SDimitry Andric Features["dl-insts"] = true;
338fe013be4SDimitry Andric Features["16-bit-insts"] = true;
339fe013be4SDimitry Andric Features["dpp"] = true;
340fe013be4SDimitry Andric Features["gfx8-insts"] = true;
341fe013be4SDimitry Andric Features["gfx9-insts"] = true;
342fe013be4SDimitry Andric Features["gfx10-insts"] = true;
343fe013be4SDimitry Andric Features["gfx10-3-insts"] = true;
344fe013be4SDimitry Andric Features["image-insts"] = true;
345fe013be4SDimitry Andric Features["s-memrealtime"] = true;
346fe013be4SDimitry Andric Features["s-memtime-inst"] = true;
347c9157d92SDimitry Andric Features["gws"] = true;
348fe013be4SDimitry Andric break;
349fe013be4SDimitry Andric case GK_GFX1012:
350fe013be4SDimitry Andric case GK_GFX1011:
351fe013be4SDimitry Andric Features["dot1-insts"] = true;
352fe013be4SDimitry Andric Features["dot2-insts"] = true;
353fe013be4SDimitry Andric Features["dot5-insts"] = true;
354fe013be4SDimitry Andric Features["dot6-insts"] = true;
355fe013be4SDimitry Andric Features["dot7-insts"] = true;
356fe013be4SDimitry Andric Features["dot10-insts"] = true;
357fe013be4SDimitry Andric [[fallthrough]];
358fe013be4SDimitry Andric case GK_GFX1013:
359fe013be4SDimitry Andric case GK_GFX1010:
360fe013be4SDimitry Andric Features["dl-insts"] = true;
361fe013be4SDimitry Andric Features["ci-insts"] = true;
362fe013be4SDimitry Andric Features["16-bit-insts"] = true;
363fe013be4SDimitry Andric Features["dpp"] = true;
364fe013be4SDimitry Andric Features["gfx8-insts"] = true;
365fe013be4SDimitry Andric Features["gfx9-insts"] = true;
366fe013be4SDimitry Andric Features["gfx10-insts"] = true;
367fe013be4SDimitry Andric Features["image-insts"] = true;
368fe013be4SDimitry Andric Features["s-memrealtime"] = true;
369fe013be4SDimitry Andric Features["s-memtime-inst"] = true;
370c9157d92SDimitry Andric Features["gws"] = true;
371fe013be4SDimitry Andric break;
372fe013be4SDimitry Andric case GK_GFX942:
373fe013be4SDimitry Andric case GK_GFX941:
374fe013be4SDimitry Andric case GK_GFX940:
375fe013be4SDimitry Andric Features["gfx940-insts"] = true;
376fe013be4SDimitry Andric Features["fp8-insts"] = true;
377a58f00eaSDimitry Andric Features["fp8-conversion-insts"] = true;
378fe013be4SDimitry Andric Features["atomic-ds-pk-add-16-insts"] = true;
379fe013be4SDimitry Andric Features["atomic-flat-pk-add-16-insts"] = true;
380fe013be4SDimitry Andric Features["atomic-global-pk-add-bf16-inst"] = true;
381fe013be4SDimitry Andric Features["gfx90a-insts"] = true;
382fe013be4SDimitry Andric Features["atomic-buffer-global-pk-add-f16-insts"] = true;
383fe013be4SDimitry Andric Features["atomic-fadd-rtn-insts"] = true;
384fe013be4SDimitry Andric Features["dot3-insts"] = true;
385fe013be4SDimitry Andric Features["dot4-insts"] = true;
386fe013be4SDimitry Andric Features["dot5-insts"] = true;
387fe013be4SDimitry Andric Features["dot6-insts"] = true;
388fe013be4SDimitry Andric Features["mai-insts"] = true;
389fe013be4SDimitry Andric Features["dl-insts"] = true;
390fe013be4SDimitry Andric Features["dot1-insts"] = true;
391fe013be4SDimitry Andric Features["dot2-insts"] = true;
392fe013be4SDimitry Andric Features["dot7-insts"] = true;
393fe013be4SDimitry Andric Features["dot10-insts"] = true;
394fe013be4SDimitry Andric Features["gfx9-insts"] = true;
395fe013be4SDimitry Andric Features["gfx8-insts"] = true;
396fe013be4SDimitry Andric Features["16-bit-insts"] = true;
397fe013be4SDimitry Andric Features["dpp"] = true;
398fe013be4SDimitry Andric Features["s-memrealtime"] = true;
399fe013be4SDimitry Andric Features["ci-insts"] = true;
400fe013be4SDimitry Andric Features["s-memtime-inst"] = true;
401c9157d92SDimitry Andric Features["gws"] = true;
402fe013be4SDimitry Andric break;
403fe013be4SDimitry Andric case GK_GFX90A:
404fe013be4SDimitry Andric Features["gfx90a-insts"] = true;
405fe013be4SDimitry Andric Features["atomic-buffer-global-pk-add-f16-insts"] = true;
406fe013be4SDimitry Andric Features["atomic-fadd-rtn-insts"] = true;
407fe013be4SDimitry Andric [[fallthrough]];
408fe013be4SDimitry Andric case GK_GFX908:
409fe013be4SDimitry Andric Features["dot3-insts"] = true;
410fe013be4SDimitry Andric Features["dot4-insts"] = true;
411fe013be4SDimitry Andric Features["dot5-insts"] = true;
412fe013be4SDimitry Andric Features["dot6-insts"] = true;
413fe013be4SDimitry Andric Features["mai-insts"] = true;
414fe013be4SDimitry Andric [[fallthrough]];
415fe013be4SDimitry Andric case GK_GFX906:
416fe013be4SDimitry Andric Features["dl-insts"] = true;
417fe013be4SDimitry Andric Features["dot1-insts"] = true;
418fe013be4SDimitry Andric Features["dot2-insts"] = true;
419fe013be4SDimitry Andric Features["dot7-insts"] = true;
420fe013be4SDimitry Andric Features["dot10-insts"] = true;
421fe013be4SDimitry Andric [[fallthrough]];
422fe013be4SDimitry Andric case GK_GFX90C:
423fe013be4SDimitry Andric case GK_GFX909:
424fe013be4SDimitry Andric case GK_GFX904:
425fe013be4SDimitry Andric case GK_GFX902:
426fe013be4SDimitry Andric case GK_GFX900:
427fe013be4SDimitry Andric Features["gfx9-insts"] = true;
428fe013be4SDimitry Andric [[fallthrough]];
429fe013be4SDimitry Andric case GK_GFX810:
430fe013be4SDimitry Andric case GK_GFX805:
431fe013be4SDimitry Andric case GK_GFX803:
432fe013be4SDimitry Andric case GK_GFX802:
433fe013be4SDimitry Andric case GK_GFX801:
434fe013be4SDimitry Andric Features["gfx8-insts"] = true;
435fe013be4SDimitry Andric Features["16-bit-insts"] = true;
436fe013be4SDimitry Andric Features["dpp"] = true;
437fe013be4SDimitry Andric Features["s-memrealtime"] = true;
438fe013be4SDimitry Andric [[fallthrough]];
439fe013be4SDimitry Andric case GK_GFX705:
440fe013be4SDimitry Andric case GK_GFX704:
441fe013be4SDimitry Andric case GK_GFX703:
442fe013be4SDimitry Andric case GK_GFX702:
443fe013be4SDimitry Andric case GK_GFX701:
444fe013be4SDimitry Andric case GK_GFX700:
445fe013be4SDimitry Andric Features["ci-insts"] = true;
446fe013be4SDimitry Andric [[fallthrough]];
447fe013be4SDimitry Andric case GK_GFX602:
448fe013be4SDimitry Andric case GK_GFX601:
449fe013be4SDimitry Andric case GK_GFX600:
450fe013be4SDimitry Andric Features["image-insts"] = true;
451fe013be4SDimitry Andric Features["s-memtime-inst"] = true;
452c9157d92SDimitry Andric Features["gws"] = true;
453fe013be4SDimitry Andric break;
454fe013be4SDimitry Andric case GK_NONE:
455fe013be4SDimitry Andric break;
456fe013be4SDimitry Andric default:
457fe013be4SDimitry Andric llvm_unreachable("Unhandled GPU!");
458fe013be4SDimitry Andric }
459fe013be4SDimitry Andric } else {
460fe013be4SDimitry Andric if (GPU.empty())
461fe013be4SDimitry Andric GPU = "r600";
462fe013be4SDimitry Andric
463fe013be4SDimitry Andric switch (llvm::AMDGPU::parseArchR600(GPU)) {
464fe013be4SDimitry Andric case GK_CAYMAN:
465fe013be4SDimitry Andric case GK_CYPRESS:
466fe013be4SDimitry Andric case GK_RV770:
467fe013be4SDimitry Andric case GK_RV670:
468fe013be4SDimitry Andric // TODO: Add fp64 when implemented.
469fe013be4SDimitry Andric break;
470fe013be4SDimitry Andric case GK_TURKS:
471fe013be4SDimitry Andric case GK_CAICOS:
472fe013be4SDimitry Andric case GK_BARTS:
473fe013be4SDimitry Andric case GK_SUMO:
474fe013be4SDimitry Andric case GK_REDWOOD:
475fe013be4SDimitry Andric case GK_JUNIPER:
476fe013be4SDimitry Andric case GK_CEDAR:
477fe013be4SDimitry Andric case GK_RV730:
478fe013be4SDimitry Andric case GK_RV710:
479fe013be4SDimitry Andric case GK_RS880:
480fe013be4SDimitry Andric case GK_R630:
481fe013be4SDimitry Andric case GK_R600:
482fe013be4SDimitry Andric break;
483fe013be4SDimitry Andric default:
484fe013be4SDimitry Andric llvm_unreachable("Unhandled GPU!");
485fe013be4SDimitry Andric }
486fe013be4SDimitry Andric }
487fe013be4SDimitry Andric }
488fe013be4SDimitry Andric
isWave32Capable(StringRef GPU,const Triple & T)489fe013be4SDimitry Andric static bool isWave32Capable(StringRef GPU, const Triple &T) {
490fe013be4SDimitry Andric bool IsWave32Capable = false;
491fe013be4SDimitry Andric // XXX - What does the member GPU mean if device name string passed here?
492fe013be4SDimitry Andric if (T.isAMDGCN()) {
493fe013be4SDimitry Andric switch (parseArchAMDGCN(GPU)) {
494c9157d92SDimitry Andric case GK_GFX1201:
495c9157d92SDimitry Andric case GK_GFX1200:
496fe013be4SDimitry Andric case GK_GFX1151:
497fe013be4SDimitry Andric case GK_GFX1150:
498fe013be4SDimitry Andric case GK_GFX1103:
499fe013be4SDimitry Andric case GK_GFX1102:
500fe013be4SDimitry Andric case GK_GFX1101:
501fe013be4SDimitry Andric case GK_GFX1100:
502fe013be4SDimitry Andric case GK_GFX1036:
503fe013be4SDimitry Andric case GK_GFX1035:
504fe013be4SDimitry Andric case GK_GFX1034:
505fe013be4SDimitry Andric case GK_GFX1033:
506fe013be4SDimitry Andric case GK_GFX1032:
507fe013be4SDimitry Andric case GK_GFX1031:
508fe013be4SDimitry Andric case GK_GFX1030:
509fe013be4SDimitry Andric case GK_GFX1012:
510fe013be4SDimitry Andric case GK_GFX1011:
511fe013be4SDimitry Andric case GK_GFX1013:
512fe013be4SDimitry Andric case GK_GFX1010:
513fe013be4SDimitry Andric IsWave32Capable = true;
514fe013be4SDimitry Andric break;
515fe013be4SDimitry Andric default:
516fe013be4SDimitry Andric break;
517fe013be4SDimitry Andric }
518fe013be4SDimitry Andric }
519fe013be4SDimitry Andric return IsWave32Capable;
520fe013be4SDimitry Andric }
521fe013be4SDimitry Andric
insertWaveSizeFeature(StringRef GPU,const Triple & T,StringMap<bool> & Features,std::string & ErrorMsg)522fe013be4SDimitry Andric bool AMDGPU::insertWaveSizeFeature(StringRef GPU, const Triple &T,
523fe013be4SDimitry Andric StringMap<bool> &Features,
524fe013be4SDimitry Andric std::string &ErrorMsg) {
525fe013be4SDimitry Andric bool IsWave32Capable = isWave32Capable(GPU, T);
526fe013be4SDimitry Andric const bool IsNullGPU = GPU.empty();
527fe013be4SDimitry Andric // FIXME: Not diagnosing wavefrontsize32 on wave64 only targets.
528fe013be4SDimitry Andric const bool HaveWave32 =
529fe013be4SDimitry Andric (IsWave32Capable || IsNullGPU) && Features.count("wavefrontsize32");
530fe013be4SDimitry Andric const bool HaveWave64 = Features.count("wavefrontsize64");
531fe013be4SDimitry Andric if (HaveWave32 && HaveWave64) {
532fe013be4SDimitry Andric ErrorMsg = "'wavefrontsize32' and 'wavefrontsize64' are mutually exclusive";
533fe013be4SDimitry Andric return false;
534fe013be4SDimitry Andric }
535fe013be4SDimitry Andric // Don't assume any wavesize with an unknown subtarget.
536fe013be4SDimitry Andric if (!IsNullGPU) {
537fe013be4SDimitry Andric // Default to wave32 if available, or wave64 if not
538fe013be4SDimitry Andric if (!HaveWave32 && !HaveWave64) {
539fe013be4SDimitry Andric StringRef DefaultWaveSizeFeature =
540fe013be4SDimitry Andric IsWave32Capable ? "wavefrontsize32" : "wavefrontsize64";
541fe013be4SDimitry Andric Features.insert(std::make_pair(DefaultWaveSizeFeature, true));
542fe013be4SDimitry Andric }
543fe013be4SDimitry Andric }
544fe013be4SDimitry Andric return true;
545fe013be4SDimitry Andric }
546