xref: /freebsd/contrib/llvm-project/clang/lib/Basic/Targets/AMDGPU.cpp (revision 5f757f3ff9144b609b3c433dfd370cc6bdc191ad)
10b57cec5SDimitry Andric //===--- AMDGPU.cpp - Implement AMDGPU target feature support -------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file implements AMDGPU TargetInfo objects.
100b57cec5SDimitry Andric //
110b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric 
130b57cec5SDimitry Andric #include "AMDGPU.h"
140b57cec5SDimitry Andric #include "clang/Basic/Builtins.h"
150b57cec5SDimitry Andric #include "clang/Basic/CodeGenOptions.h"
16bdd1243dSDimitry Andric #include "clang/Basic/Diagnostic.h"
170b57cec5SDimitry Andric #include "clang/Basic/LangOptions.h"
180b57cec5SDimitry Andric #include "clang/Basic/MacroBuilder.h"
190b57cec5SDimitry Andric #include "clang/Basic/TargetBuiltins.h"
200b57cec5SDimitry Andric using namespace clang;
210b57cec5SDimitry Andric using namespace clang::targets;
220b57cec5SDimitry Andric 
230b57cec5SDimitry Andric namespace clang {
240b57cec5SDimitry Andric namespace targets {
250b57cec5SDimitry Andric 
260b57cec5SDimitry Andric // If you edit the description strings, make sure you update
270b57cec5SDimitry Andric // getPointerWidthV().
280b57cec5SDimitry Andric 
290b57cec5SDimitry Andric static const char *const DataLayoutStringR600 =
300b57cec5SDimitry Andric     "e-p:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128"
31e8d8bef9SDimitry Andric     "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1";
320b57cec5SDimitry Andric 
// Data layout description handed to resetDataLayout() for AMDGCN triples.
// The adjacent literals concatenate into one string; they are split by
// category (pointer specs, integer/vector alignments, trailing options)
// purely for readability.
static const char *const DataLayoutStringAMDGCN =
    "e-p:64:64"
    "-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32"
    "-p7:160:256:256:32-p8:128:128-p9:192:256:256:32"
    "-i64:64"
    "-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512"
    "-v1024:1024-v2048:2048"
    "-n32:64-S32-A5-G1"
    "-ni:7:8:9";
390b57cec5SDimitry Andric 
400b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsGenMap = {
41*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // Default
42*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global
43*5f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // opencl_local
44*5f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
45*5f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // opencl_private
46*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // opencl_generic
47*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_device
48*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_host
49*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // cuda_device
50*5f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
51*5f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // cuda_shared
52*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global
53*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global_device
54*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global_host
55*5f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // sycl_local
56*5f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // sycl_private
57*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_sptr
58*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_uptr
59*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr64
60*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // hlsl_groupshared
610b57cec5SDimitry Andric };
620b57cec5SDimitry Andric 
630b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsPrivMap = {
64*5f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // Default
65*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global
66*5f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // opencl_local
67*5f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
68*5f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // opencl_private
69*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // opencl_generic
70*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_device
71*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_host
72*5f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // cuda_device
73*5f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
74*5f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // cuda_shared
75fe6060f1SDimitry Andric     // SYCL address space values for this map are dummy
76*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global
77*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_device
78*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_host
79*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_local
80*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_private
81*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_sptr
82*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_uptr
83*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // ptr64
84*5f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // hlsl_groupshared
85480093f4SDimitry Andric 
860b57cec5SDimitry Andric };
870b57cec5SDimitry Andric } // namespace targets
880b57cec5SDimitry Andric } // namespace clang
890b57cec5SDimitry Andric 
90bdd1243dSDimitry Andric static constexpr Builtin::Info BuiltinInfo[] = {
910b57cec5SDimitry Andric #define BUILTIN(ID, TYPE, ATTRS)                                               \
92bdd1243dSDimitry Andric   {#ID, TYPE, ATTRS, nullptr, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
930b57cec5SDimitry Andric #define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE)                               \
94bdd1243dSDimitry Andric   {#ID, TYPE, ATTRS, FEATURE, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
950b57cec5SDimitry Andric #include "clang/Basic/BuiltinsAMDGPU.def"
960b57cec5SDimitry Andric };
970b57cec5SDimitry Andric 
980b57cec5SDimitry Andric const char *const AMDGPUTargetInfo::GCCRegNames[] = {
990b57cec5SDimitry Andric   "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7", "v8",
1000b57cec5SDimitry Andric   "v9", "v10", "v11", "v12", "v13", "v14", "v15", "v16", "v17",
1010b57cec5SDimitry Andric   "v18", "v19", "v20", "v21", "v22", "v23", "v24", "v25", "v26",
1020b57cec5SDimitry Andric   "v27", "v28", "v29", "v30", "v31", "v32", "v33", "v34", "v35",
1030b57cec5SDimitry Andric   "v36", "v37", "v38", "v39", "v40", "v41", "v42", "v43", "v44",
1040b57cec5SDimitry Andric   "v45", "v46", "v47", "v48", "v49", "v50", "v51", "v52", "v53",
1050b57cec5SDimitry Andric   "v54", "v55", "v56", "v57", "v58", "v59", "v60", "v61", "v62",
1060b57cec5SDimitry Andric   "v63", "v64", "v65", "v66", "v67", "v68", "v69", "v70", "v71",
1070b57cec5SDimitry Andric   "v72", "v73", "v74", "v75", "v76", "v77", "v78", "v79", "v80",
1080b57cec5SDimitry Andric   "v81", "v82", "v83", "v84", "v85", "v86", "v87", "v88", "v89",
1090b57cec5SDimitry Andric   "v90", "v91", "v92", "v93", "v94", "v95", "v96", "v97", "v98",
1100b57cec5SDimitry Andric   "v99", "v100", "v101", "v102", "v103", "v104", "v105", "v106", "v107",
1110b57cec5SDimitry Andric   "v108", "v109", "v110", "v111", "v112", "v113", "v114", "v115", "v116",
1120b57cec5SDimitry Andric   "v117", "v118", "v119", "v120", "v121", "v122", "v123", "v124", "v125",
1130b57cec5SDimitry Andric   "v126", "v127", "v128", "v129", "v130", "v131", "v132", "v133", "v134",
1140b57cec5SDimitry Andric   "v135", "v136", "v137", "v138", "v139", "v140", "v141", "v142", "v143",
1150b57cec5SDimitry Andric   "v144", "v145", "v146", "v147", "v148", "v149", "v150", "v151", "v152",
1160b57cec5SDimitry Andric   "v153", "v154", "v155", "v156", "v157", "v158", "v159", "v160", "v161",
1170b57cec5SDimitry Andric   "v162", "v163", "v164", "v165", "v166", "v167", "v168", "v169", "v170",
1180b57cec5SDimitry Andric   "v171", "v172", "v173", "v174", "v175", "v176", "v177", "v178", "v179",
1190b57cec5SDimitry Andric   "v180", "v181", "v182", "v183", "v184", "v185", "v186", "v187", "v188",
1200b57cec5SDimitry Andric   "v189", "v190", "v191", "v192", "v193", "v194", "v195", "v196", "v197",
1210b57cec5SDimitry Andric   "v198", "v199", "v200", "v201", "v202", "v203", "v204", "v205", "v206",
1220b57cec5SDimitry Andric   "v207", "v208", "v209", "v210", "v211", "v212", "v213", "v214", "v215",
1230b57cec5SDimitry Andric   "v216", "v217", "v218", "v219", "v220", "v221", "v222", "v223", "v224",
1240b57cec5SDimitry Andric   "v225", "v226", "v227", "v228", "v229", "v230", "v231", "v232", "v233",
1250b57cec5SDimitry Andric   "v234", "v235", "v236", "v237", "v238", "v239", "v240", "v241", "v242",
1260b57cec5SDimitry Andric   "v243", "v244", "v245", "v246", "v247", "v248", "v249", "v250", "v251",
1270b57cec5SDimitry Andric   "v252", "v253", "v254", "v255", "s0", "s1", "s2", "s3", "s4",
1280b57cec5SDimitry Andric   "s5", "s6", "s7", "s8", "s9", "s10", "s11", "s12", "s13",
1290b57cec5SDimitry Andric   "s14", "s15", "s16", "s17", "s18", "s19", "s20", "s21", "s22",
1300b57cec5SDimitry Andric   "s23", "s24", "s25", "s26", "s27", "s28", "s29", "s30", "s31",
1310b57cec5SDimitry Andric   "s32", "s33", "s34", "s35", "s36", "s37", "s38", "s39", "s40",
1320b57cec5SDimitry Andric   "s41", "s42", "s43", "s44", "s45", "s46", "s47", "s48", "s49",
1330b57cec5SDimitry Andric   "s50", "s51", "s52", "s53", "s54", "s55", "s56", "s57", "s58",
1340b57cec5SDimitry Andric   "s59", "s60", "s61", "s62", "s63", "s64", "s65", "s66", "s67",
1350b57cec5SDimitry Andric   "s68", "s69", "s70", "s71", "s72", "s73", "s74", "s75", "s76",
1360b57cec5SDimitry Andric   "s77", "s78", "s79", "s80", "s81", "s82", "s83", "s84", "s85",
1370b57cec5SDimitry Andric   "s86", "s87", "s88", "s89", "s90", "s91", "s92", "s93", "s94",
1380b57cec5SDimitry Andric   "s95", "s96", "s97", "s98", "s99", "s100", "s101", "s102", "s103",
1390b57cec5SDimitry Andric   "s104", "s105", "s106", "s107", "s108", "s109", "s110", "s111", "s112",
1400b57cec5SDimitry Andric   "s113", "s114", "s115", "s116", "s117", "s118", "s119", "s120", "s121",
1410b57cec5SDimitry Andric   "s122", "s123", "s124", "s125", "s126", "s127", "exec", "vcc", "scc",
1420b57cec5SDimitry Andric   "m0", "flat_scratch", "exec_lo", "exec_hi", "vcc_lo", "vcc_hi",
1435ffd83dbSDimitry Andric   "flat_scratch_lo", "flat_scratch_hi",
1445ffd83dbSDimitry Andric   "a0", "a1", "a2", "a3", "a4", "a5", "a6", "a7", "a8",
1455ffd83dbSDimitry Andric   "a9", "a10", "a11", "a12", "a13", "a14", "a15", "a16", "a17",
1465ffd83dbSDimitry Andric   "a18", "a19", "a20", "a21", "a22", "a23", "a24", "a25", "a26",
1475ffd83dbSDimitry Andric   "a27", "a28", "a29", "a30", "a31", "a32", "a33", "a34", "a35",
1485ffd83dbSDimitry Andric   "a36", "a37", "a38", "a39", "a40", "a41", "a42", "a43", "a44",
1495ffd83dbSDimitry Andric   "a45", "a46", "a47", "a48", "a49", "a50", "a51", "a52", "a53",
1505ffd83dbSDimitry Andric   "a54", "a55", "a56", "a57", "a58", "a59", "a60", "a61", "a62",
1515ffd83dbSDimitry Andric   "a63", "a64", "a65", "a66", "a67", "a68", "a69", "a70", "a71",
1525ffd83dbSDimitry Andric   "a72", "a73", "a74", "a75", "a76", "a77", "a78", "a79", "a80",
1535ffd83dbSDimitry Andric   "a81", "a82", "a83", "a84", "a85", "a86", "a87", "a88", "a89",
1545ffd83dbSDimitry Andric   "a90", "a91", "a92", "a93", "a94", "a95", "a96", "a97", "a98",
1555ffd83dbSDimitry Andric   "a99", "a100", "a101", "a102", "a103", "a104", "a105", "a106", "a107",
1565ffd83dbSDimitry Andric   "a108", "a109", "a110", "a111", "a112", "a113", "a114", "a115", "a116",
1575ffd83dbSDimitry Andric   "a117", "a118", "a119", "a120", "a121", "a122", "a123", "a124", "a125",
1585ffd83dbSDimitry Andric   "a126", "a127", "a128", "a129", "a130", "a131", "a132", "a133", "a134",
1595ffd83dbSDimitry Andric   "a135", "a136", "a137", "a138", "a139", "a140", "a141", "a142", "a143",
1605ffd83dbSDimitry Andric   "a144", "a145", "a146", "a147", "a148", "a149", "a150", "a151", "a152",
1615ffd83dbSDimitry Andric   "a153", "a154", "a155", "a156", "a157", "a158", "a159", "a160", "a161",
1625ffd83dbSDimitry Andric   "a162", "a163", "a164", "a165", "a166", "a167", "a168", "a169", "a170",
1635ffd83dbSDimitry Andric   "a171", "a172", "a173", "a174", "a175", "a176", "a177", "a178", "a179",
1645ffd83dbSDimitry Andric   "a180", "a181", "a182", "a183", "a184", "a185", "a186", "a187", "a188",
1655ffd83dbSDimitry Andric   "a189", "a190", "a191", "a192", "a193", "a194", "a195", "a196", "a197",
1665ffd83dbSDimitry Andric   "a198", "a199", "a200", "a201", "a202", "a203", "a204", "a205", "a206",
1675ffd83dbSDimitry Andric   "a207", "a208", "a209", "a210", "a211", "a212", "a213", "a214", "a215",
1685ffd83dbSDimitry Andric   "a216", "a217", "a218", "a219", "a220", "a221", "a222", "a223", "a224",
1695ffd83dbSDimitry Andric   "a225", "a226", "a227", "a228", "a229", "a230", "a231", "a232", "a233",
1705ffd83dbSDimitry Andric   "a234", "a235", "a236", "a237", "a238", "a239", "a240", "a241", "a242",
1715ffd83dbSDimitry Andric   "a243", "a244", "a245", "a246", "a247", "a248", "a249", "a250", "a251",
1725ffd83dbSDimitry Andric   "a252", "a253", "a254", "a255"
1730b57cec5SDimitry Andric };
1740b57cec5SDimitry Andric 
1750b57cec5SDimitry Andric ArrayRef<const char *> AMDGPUTargetInfo::getGCCRegNames() const {
176bdd1243dSDimitry Andric   return llvm::ArrayRef(GCCRegNames);
1770b57cec5SDimitry Andric }
1780b57cec5SDimitry Andric 
1790b57cec5SDimitry Andric bool AMDGPUTargetInfo::initFeatureMap(
1800b57cec5SDimitry Andric     llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags, StringRef CPU,
1810b57cec5SDimitry Andric     const std::vector<std::string> &FeatureVec) const {
1820b57cec5SDimitry Andric 
1830b57cec5SDimitry Andric   using namespace llvm::AMDGPU;
18406c3fb27SDimitry Andric   fillAMDGPUFeatureMap(CPU, getTriple(), Features);
185bdd1243dSDimitry Andric   if (!TargetInfo::initFeatureMap(Features, Diags, CPU, FeatureVec))
186bdd1243dSDimitry Andric     return false;
187bdd1243dSDimitry Andric 
188bdd1243dSDimitry Andric   // TODO: Should move this logic into TargetParser
18906c3fb27SDimitry Andric   std::string ErrorMsg;
19006c3fb27SDimitry Andric   if (!insertWaveSizeFeature(CPU, getTriple(), Features, ErrorMsg)) {
19106c3fb27SDimitry Andric     Diags.Report(diag::err_invalid_feature_combination) << ErrorMsg;
192bdd1243dSDimitry Andric     return false;
193bdd1243dSDimitry Andric   }
194bdd1243dSDimitry Andric 
195bdd1243dSDimitry Andric   return true;
1960b57cec5SDimitry Andric }
1970b57cec5SDimitry Andric 
1980b57cec5SDimitry Andric void AMDGPUTargetInfo::fillValidCPUList(
1990b57cec5SDimitry Andric     SmallVectorImpl<StringRef> &Values) const {
2000b57cec5SDimitry Andric   if (isAMDGCN(getTriple()))
2010b57cec5SDimitry Andric     llvm::AMDGPU::fillValidArchListAMDGCN(Values);
2020b57cec5SDimitry Andric   else
2030b57cec5SDimitry Andric     llvm::AMDGPU::fillValidArchListR600(Values);
2040b57cec5SDimitry Andric }
2050b57cec5SDimitry Andric 
2060b57cec5SDimitry Andric void AMDGPUTargetInfo::setAddressSpaceMap(bool DefaultIsPrivate) {
2070b57cec5SDimitry Andric   AddrSpaceMap = DefaultIsPrivate ? &AMDGPUDefIsPrivMap : &AMDGPUDefIsGenMap;
2080b57cec5SDimitry Andric }
2090b57cec5SDimitry Andric 
2100b57cec5SDimitry Andric AMDGPUTargetInfo::AMDGPUTargetInfo(const llvm::Triple &Triple,
2110b57cec5SDimitry Andric                                    const TargetOptions &Opts)
2120b57cec5SDimitry Andric     : TargetInfo(Triple),
2130b57cec5SDimitry Andric       GPUKind(isAMDGCN(Triple) ?
2140b57cec5SDimitry Andric               llvm::AMDGPU::parseArchAMDGCN(Opts.CPU) :
2150b57cec5SDimitry Andric               llvm::AMDGPU::parseArchR600(Opts.CPU)),
2160b57cec5SDimitry Andric       GPUFeatures(isAMDGCN(Triple) ?
2170b57cec5SDimitry Andric                   llvm::AMDGPU::getArchAttrAMDGCN(GPUKind) :
2180b57cec5SDimitry Andric                   llvm::AMDGPU::getArchAttrR600(GPUKind)) {
2190b57cec5SDimitry Andric   resetDataLayout(isAMDGCN(getTriple()) ? DataLayoutStringAMDGCN
2200b57cec5SDimitry Andric                                         : DataLayoutStringR600);
2210b57cec5SDimitry Andric 
2220b57cec5SDimitry Andric   setAddressSpaceMap(Triple.getOS() == llvm::Triple::Mesa3D ||
2230b57cec5SDimitry Andric                      !isAMDGCN(Triple));
2240b57cec5SDimitry Andric   UseAddrSpaceMapMangling = true;
2250b57cec5SDimitry Andric 
226bdd1243dSDimitry Andric   if (isAMDGCN(Triple)) {
227bdd1243dSDimitry Andric     // __bf16 is always available as a load/store only type on AMDGCN.
228bdd1243dSDimitry Andric     BFloat16Width = BFloat16Align = 16;
229bdd1243dSDimitry Andric     BFloat16Format = &llvm::APFloat::BFloat();
230bdd1243dSDimitry Andric   }
231bdd1243dSDimitry Andric 
2320b57cec5SDimitry Andric   HasLegalHalfType = true;
2330b57cec5SDimitry Andric   HasFloat16 = true;
234e8d8bef9SDimitry Andric   WavefrontSize = GPUFeatures & llvm::AMDGPU::FEATURE_WAVE32 ? 32 : 64;
235e8d8bef9SDimitry Andric   AllowAMDGPUUnsafeFPAtomics = Opts.AllowAMDGPUUnsafeFPAtomics;
2360b57cec5SDimitry Andric 
237bdd1243dSDimitry Andric   // Set pointer width and alignment for the generic address space.
238bdd1243dSDimitry Andric   PointerWidth = PointerAlign = getPointerWidthV(LangAS::Default);
2390b57cec5SDimitry Andric   if (getMaxPointerWidth() == 64) {
2400b57cec5SDimitry Andric     LongWidth = LongAlign = 64;
2410b57cec5SDimitry Andric     SizeType = UnsignedLong;
2420b57cec5SDimitry Andric     PtrDiffType = SignedLong;
2430b57cec5SDimitry Andric     IntPtrType = SignedLong;
2440b57cec5SDimitry Andric   }
2450b57cec5SDimitry Andric 
2460b57cec5SDimitry Andric   MaxAtomicPromoteWidth = MaxAtomicInlineWidth = 64;
24706c3fb27SDimitry Andric   CUMode = !(GPUFeatures & llvm::AMDGPU::FEATURE_WGP);
248*5f757f3fSDimitry Andric   for (auto F : {"image-insts", "gws"})
249*5f757f3fSDimitry Andric     ReadOnlyFeatures.insert(F);
250*5f757f3fSDimitry Andric   HalfArgsAndReturns = true;
2510b57cec5SDimitry Andric }
2520b57cec5SDimitry Andric 
253fe6060f1SDimitry Andric void AMDGPUTargetInfo::adjust(DiagnosticsEngine &Diags, LangOptions &Opts) {
254fe6060f1SDimitry Andric   TargetInfo::adjust(Diags, Opts);
2550b57cec5SDimitry Andric   // ToDo: There are still a few places using default address space as private
2560b57cec5SDimitry Andric   // address space in OpenCL, which needs to be cleaned up, then Opts.OpenCL
2570b57cec5SDimitry Andric   // can be removed from the following line.
2580b57cec5SDimitry Andric   setAddressSpaceMap(/*DefaultIsPrivate=*/Opts.OpenCL ||
2590b57cec5SDimitry Andric                      !isAMDGCN(getTriple()));
2600b57cec5SDimitry Andric }
2610b57cec5SDimitry Andric 
2620b57cec5SDimitry Andric ArrayRef<Builtin::Info> AMDGPUTargetInfo::getTargetBuiltins() const {
263bdd1243dSDimitry Andric   return llvm::ArrayRef(BuiltinInfo,
264bdd1243dSDimitry Andric                         clang::AMDGPU::LastTSBuiltin - Builtin::FirstTSBuiltin);
2650b57cec5SDimitry Andric }
2660b57cec5SDimitry Andric 
2670b57cec5SDimitry Andric void AMDGPUTargetInfo::getTargetDefines(const LangOptions &Opts,
2680b57cec5SDimitry Andric                                         MacroBuilder &Builder) const {
2690b57cec5SDimitry Andric   Builder.defineMacro("__AMD__");
2700b57cec5SDimitry Andric   Builder.defineMacro("__AMDGPU__");
2710b57cec5SDimitry Andric 
2720b57cec5SDimitry Andric   if (isAMDGCN(getTriple()))
2730b57cec5SDimitry Andric     Builder.defineMacro("__AMDGCN__");
2740b57cec5SDimitry Andric   else
2750b57cec5SDimitry Andric     Builder.defineMacro("__R600__");
2760b57cec5SDimitry Andric 
2770b57cec5SDimitry Andric   if (GPUKind != llvm::AMDGPU::GK_NONE) {
2780b57cec5SDimitry Andric     StringRef CanonName = isAMDGCN(getTriple()) ?
2790b57cec5SDimitry Andric       getArchNameAMDGCN(GPUKind) : getArchNameR600(GPUKind);
2800b57cec5SDimitry Andric     Builder.defineMacro(Twine("__") + Twine(CanonName) + Twine("__"));
28181ad6265SDimitry Andric     // Emit macros for gfx family e.g. gfx906 -> __GFX9__, gfx1030 -> __GFX10___
28281ad6265SDimitry Andric     if (isAMDGCN(getTriple())) {
283*5f757f3fSDimitry Andric       assert(CanonName.starts_with("gfx") && "Invalid amdgcn canonical name");
28481ad6265SDimitry Andric       Builder.defineMacro(Twine("__") + Twine(CanonName.drop_back(2).upper()) +
28581ad6265SDimitry Andric                           Twine("__"));
28681ad6265SDimitry Andric     }
287e8d8bef9SDimitry Andric     if (isAMDGCN(getTriple())) {
288e8d8bef9SDimitry Andric       Builder.defineMacro("__amdgcn_processor__",
289e8d8bef9SDimitry Andric                           Twine("\"") + Twine(CanonName) + Twine("\""));
290e8d8bef9SDimitry Andric       Builder.defineMacro("__amdgcn_target_id__",
29181ad6265SDimitry Andric                           Twine("\"") + Twine(*getTargetID()) + Twine("\""));
292e8d8bef9SDimitry Andric       for (auto F : getAllPossibleTargetIDFeatures(getTriple(), CanonName)) {
293e8d8bef9SDimitry Andric         auto Loc = OffloadArchFeatures.find(F);
294e8d8bef9SDimitry Andric         if (Loc != OffloadArchFeatures.end()) {
295e8d8bef9SDimitry Andric           std::string NewF = F.str();
296e8d8bef9SDimitry Andric           std::replace(NewF.begin(), NewF.end(), '-', '_');
297e8d8bef9SDimitry Andric           Builder.defineMacro(Twine("__amdgcn_feature_") + Twine(NewF) +
298e8d8bef9SDimitry Andric                                   Twine("__"),
299e8d8bef9SDimitry Andric                               Loc->second ? "1" : "0");
300e8d8bef9SDimitry Andric         }
301e8d8bef9SDimitry Andric       }
302e8d8bef9SDimitry Andric     }
3030b57cec5SDimitry Andric   }
3040b57cec5SDimitry Andric 
30581ad6265SDimitry Andric   if (AllowAMDGPUUnsafeFPAtomics)
30681ad6265SDimitry Andric     Builder.defineMacro("__AMDGCN_UNSAFE_FP_ATOMICS__");
30781ad6265SDimitry Andric 
3080b57cec5SDimitry Andric   // TODO: __HAS_FMAF__, __HAS_LDEXPF__, __HAS_FP64__ are deprecated and will be
3090b57cec5SDimitry Andric   // removed in the near future.
3100b57cec5SDimitry Andric   if (hasFMAF())
3110b57cec5SDimitry Andric     Builder.defineMacro("__HAS_FMAF__");
3120b57cec5SDimitry Andric   if (hasFastFMAF())
3130b57cec5SDimitry Andric     Builder.defineMacro("FP_FAST_FMAF");
3140b57cec5SDimitry Andric   if (hasLDEXPF())
3150b57cec5SDimitry Andric     Builder.defineMacro("__HAS_LDEXPF__");
3160b57cec5SDimitry Andric   if (hasFP64())
3170b57cec5SDimitry Andric     Builder.defineMacro("__HAS_FP64__");
3180b57cec5SDimitry Andric   if (hasFastFMA())
3190b57cec5SDimitry Andric     Builder.defineMacro("FP_FAST_FMA");
320e8d8bef9SDimitry Andric 
32106c3fb27SDimitry Andric   Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE__", Twine(WavefrontSize));
32206c3fb27SDimitry Andric   // ToDo: deprecate this macro for naming consistency.
323e8d8bef9SDimitry Andric   Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE", Twine(WavefrontSize));
32406c3fb27SDimitry Andric   Builder.defineMacro("__AMDGCN_CUMODE__", Twine(CUMode));
3250b57cec5SDimitry Andric }
3260b57cec5SDimitry Andric 
3270b57cec5SDimitry Andric void AMDGPUTargetInfo::setAuxTarget(const TargetInfo *Aux) {
3280b57cec5SDimitry Andric   assert(HalfFormat == Aux->HalfFormat);
3290b57cec5SDimitry Andric   assert(FloatFormat == Aux->FloatFormat);
3300b57cec5SDimitry Andric   assert(DoubleFormat == Aux->DoubleFormat);
3310b57cec5SDimitry Andric 
3320b57cec5SDimitry Andric   // On x86_64 long double is 80-bit extended precision format, which is
3330b57cec5SDimitry Andric   // not supported by AMDGPU. 128-bit floating point format is also not
3340b57cec5SDimitry Andric   // supported by AMDGPU. Therefore keep its own format for these two types.
3350b57cec5SDimitry Andric   auto SaveLongDoubleFormat = LongDoubleFormat;
3360b57cec5SDimitry Andric   auto SaveFloat128Format = Float128Format;
33781ad6265SDimitry Andric   auto SaveLongDoubleWidth = LongDoubleWidth;
33881ad6265SDimitry Andric   auto SaveLongDoubleAlign = LongDoubleAlign;
3390b57cec5SDimitry Andric   copyAuxTarget(Aux);
3400b57cec5SDimitry Andric   LongDoubleFormat = SaveLongDoubleFormat;
3410b57cec5SDimitry Andric   Float128Format = SaveFloat128Format;
34281ad6265SDimitry Andric   LongDoubleWidth = SaveLongDoubleWidth;
34381ad6265SDimitry Andric   LongDoubleAlign = SaveLongDoubleAlign;
3445ffd83dbSDimitry Andric   // For certain builtin types support on the host target, claim they are
3455ffd83dbSDimitry Andric   // support to pass the compilation of the host code during the device-side
3465ffd83dbSDimitry Andric   // compilation.
3475ffd83dbSDimitry Andric   // FIXME: As the side effect, we also accept `__float128` uses in the device
3485ffd83dbSDimitry Andric   // code. To rejct these builtin types supported in the host target but not in
3495ffd83dbSDimitry Andric   // the device target, one approach would support `device_builtin` attribute
3505ffd83dbSDimitry Andric   // so that we could tell the device builtin types from the host ones. The
3515ffd83dbSDimitry Andric   // also solves the different representations of the same builtin type, such
3525ffd83dbSDimitry Andric   // as `size_t` in the MSVC environment.
3535ffd83dbSDimitry Andric   if (Aux->hasFloat128Type()) {
3545ffd83dbSDimitry Andric     HasFloat128 = true;
3555ffd83dbSDimitry Andric     Float128Format = DoubleFormat;
3565ffd83dbSDimitry Andric   }
3570b57cec5SDimitry Andric }
358