xref: /freebsd/contrib/llvm-project/clang/lib/Basic/Targets/AMDGPU.cpp (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
10b57cec5SDimitry Andric //===--- AMDGPU.cpp - Implement AMDGPU target feature support -------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file implements AMDGPU TargetInfo objects.
100b57cec5SDimitry Andric //
110b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric 
130b57cec5SDimitry Andric #include "AMDGPU.h"
140b57cec5SDimitry Andric #include "clang/Basic/Builtins.h"
150b57cec5SDimitry Andric #include "clang/Basic/CodeGenOptions.h"
16bdd1243dSDimitry Andric #include "clang/Basic/Diagnostic.h"
170b57cec5SDimitry Andric #include "clang/Basic/LangOptions.h"
180b57cec5SDimitry Andric #include "clang/Basic/MacroBuilder.h"
190b57cec5SDimitry Andric #include "clang/Basic/TargetBuiltins.h"
20*0fca6ea1SDimitry Andric #include "llvm/ADT/SmallString.h"
210b57cec5SDimitry Andric using namespace clang;
220b57cec5SDimitry Andric using namespace clang::targets;
230b57cec5SDimitry Andric 
240b57cec5SDimitry Andric namespace clang {
250b57cec5SDimitry Andric namespace targets {
260b57cec5SDimitry Andric 
// If you edit the description strings, make sure you update
// getPointerWidthV().

// LLVM data layout description used for non-amdgcn (R600) triples. The
// literal is split by component group purely for readability; adjacent
// pieces are concatenated by the compiler into a single string.
static const char *const DataLayoutStringR600 =
    "e-p:32:32"
    "-i64:64"
    "-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512"
    "-v1024:1024-v2048:2048"
    "-n32:64-S32-A5-G1";
330b57cec5SDimitry Andric 
// LLVM data layout description used for amdgcn triples. The literal is split
// by component group purely for readability; adjacent pieces are concatenated
// by the compiler into a single string. Keep getPointerWidthV() in sync with
// the pointer entries when editing.
static const char *const DataLayoutStringAMDGCN =
    "e-p:64:64"
    "-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32"
    "-p7:160:256:256:32-p8:128:128-p9:192:256:256:32"
    "-i64:64"
    "-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512"
    "-v1024:1024-v2048:2048"
    "-n32:64-S32-A5-G1"
    "-ni:7:8:9";
400b57cec5SDimitry Andric 
410b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsGenMap = {
425f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // Default
435f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global
445f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // opencl_local
455f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
465f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // opencl_private
475f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // opencl_generic
485f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_device
495f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_host
505f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // cuda_device
515f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
525f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // cuda_shared
535f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global
545f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global_device
555f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global_host
565f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // sycl_local
575f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // sycl_private
585f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_sptr
595f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_uptr
605f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr64
615f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // hlsl_groupshared
620b57cec5SDimitry Andric };
630b57cec5SDimitry Andric 
640b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsPrivMap = {
655f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // Default
665f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global
675f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // opencl_local
685f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
695f757f3fSDimitry Andric     llvm::AMDGPUAS::PRIVATE_ADDRESS,  // opencl_private
705f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS,     // opencl_generic
715f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_device
725f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_host
735f757f3fSDimitry Andric     llvm::AMDGPUAS::GLOBAL_ADDRESS,   // cuda_device
745f757f3fSDimitry Andric     llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
755f757f3fSDimitry Andric     llvm::AMDGPUAS::LOCAL_ADDRESS,    // cuda_shared
76fe6060f1SDimitry Andric     // SYCL address space values for this map are dummy
775f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global
785f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_device
795f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_host
805f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_local
815f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_private
825f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_sptr
835f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_uptr
845f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // ptr64
855f757f3fSDimitry Andric     llvm::AMDGPUAS::FLAT_ADDRESS, // hlsl_groupshared
86480093f4SDimitry Andric 
870b57cec5SDimitry Andric };
880b57cec5SDimitry Andric } // namespace targets
890b57cec5SDimitry Andric } // namespace clang
900b57cec5SDimitry Andric 
91bdd1243dSDimitry Andric static constexpr Builtin::Info BuiltinInfo[] = {
920b57cec5SDimitry Andric #define BUILTIN(ID, TYPE, ATTRS)                                               \
93bdd1243dSDimitry Andric   {#ID, TYPE, ATTRS, nullptr, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
940b57cec5SDimitry Andric #define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE)                               \
95bdd1243dSDimitry Andric   {#ID, TYPE, ATTRS, FEATURE, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
960b57cec5SDimitry Andric #include "clang/Basic/BuiltinsAMDGPU.def"
970b57cec5SDimitry Andric };
980b57cec5SDimitry Andric 
990b57cec5SDimitry Andric const char *const AMDGPUTargetInfo::GCCRegNames[] = {
1000b57cec5SDimitry Andric   "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7", "v8",
1010b57cec5SDimitry Andric   "v9", "v10", "v11", "v12", "v13", "v14", "v15", "v16", "v17",
1020b57cec5SDimitry Andric   "v18", "v19", "v20", "v21", "v22", "v23", "v24", "v25", "v26",
1030b57cec5SDimitry Andric   "v27", "v28", "v29", "v30", "v31", "v32", "v33", "v34", "v35",
1040b57cec5SDimitry Andric   "v36", "v37", "v38", "v39", "v40", "v41", "v42", "v43", "v44",
1050b57cec5SDimitry Andric   "v45", "v46", "v47", "v48", "v49", "v50", "v51", "v52", "v53",
1060b57cec5SDimitry Andric   "v54", "v55", "v56", "v57", "v58", "v59", "v60", "v61", "v62",
1070b57cec5SDimitry Andric   "v63", "v64", "v65", "v66", "v67", "v68", "v69", "v70", "v71",
1080b57cec5SDimitry Andric   "v72", "v73", "v74", "v75", "v76", "v77", "v78", "v79", "v80",
1090b57cec5SDimitry Andric   "v81", "v82", "v83", "v84", "v85", "v86", "v87", "v88", "v89",
1100b57cec5SDimitry Andric   "v90", "v91", "v92", "v93", "v94", "v95", "v96", "v97", "v98",
1110b57cec5SDimitry Andric   "v99", "v100", "v101", "v102", "v103", "v104", "v105", "v106", "v107",
1120b57cec5SDimitry Andric   "v108", "v109", "v110", "v111", "v112", "v113", "v114", "v115", "v116",
1130b57cec5SDimitry Andric   "v117", "v118", "v119", "v120", "v121", "v122", "v123", "v124", "v125",
1140b57cec5SDimitry Andric   "v126", "v127", "v128", "v129", "v130", "v131", "v132", "v133", "v134",
1150b57cec5SDimitry Andric   "v135", "v136", "v137", "v138", "v139", "v140", "v141", "v142", "v143",
1160b57cec5SDimitry Andric   "v144", "v145", "v146", "v147", "v148", "v149", "v150", "v151", "v152",
1170b57cec5SDimitry Andric   "v153", "v154", "v155", "v156", "v157", "v158", "v159", "v160", "v161",
1180b57cec5SDimitry Andric   "v162", "v163", "v164", "v165", "v166", "v167", "v168", "v169", "v170",
1190b57cec5SDimitry Andric   "v171", "v172", "v173", "v174", "v175", "v176", "v177", "v178", "v179",
1200b57cec5SDimitry Andric   "v180", "v181", "v182", "v183", "v184", "v185", "v186", "v187", "v188",
1210b57cec5SDimitry Andric   "v189", "v190", "v191", "v192", "v193", "v194", "v195", "v196", "v197",
1220b57cec5SDimitry Andric   "v198", "v199", "v200", "v201", "v202", "v203", "v204", "v205", "v206",
1230b57cec5SDimitry Andric   "v207", "v208", "v209", "v210", "v211", "v212", "v213", "v214", "v215",
1240b57cec5SDimitry Andric   "v216", "v217", "v218", "v219", "v220", "v221", "v222", "v223", "v224",
1250b57cec5SDimitry Andric   "v225", "v226", "v227", "v228", "v229", "v230", "v231", "v232", "v233",
1260b57cec5SDimitry Andric   "v234", "v235", "v236", "v237", "v238", "v239", "v240", "v241", "v242",
1270b57cec5SDimitry Andric   "v243", "v244", "v245", "v246", "v247", "v248", "v249", "v250", "v251",
1280b57cec5SDimitry Andric   "v252", "v253", "v254", "v255", "s0", "s1", "s2", "s3", "s4",
1290b57cec5SDimitry Andric   "s5", "s6", "s7", "s8", "s9", "s10", "s11", "s12", "s13",
1300b57cec5SDimitry Andric   "s14", "s15", "s16", "s17", "s18", "s19", "s20", "s21", "s22",
1310b57cec5SDimitry Andric   "s23", "s24", "s25", "s26", "s27", "s28", "s29", "s30", "s31",
1320b57cec5SDimitry Andric   "s32", "s33", "s34", "s35", "s36", "s37", "s38", "s39", "s40",
1330b57cec5SDimitry Andric   "s41", "s42", "s43", "s44", "s45", "s46", "s47", "s48", "s49",
1340b57cec5SDimitry Andric   "s50", "s51", "s52", "s53", "s54", "s55", "s56", "s57", "s58",
1350b57cec5SDimitry Andric   "s59", "s60", "s61", "s62", "s63", "s64", "s65", "s66", "s67",
1360b57cec5SDimitry Andric   "s68", "s69", "s70", "s71", "s72", "s73", "s74", "s75", "s76",
1370b57cec5SDimitry Andric   "s77", "s78", "s79", "s80", "s81", "s82", "s83", "s84", "s85",
1380b57cec5SDimitry Andric   "s86", "s87", "s88", "s89", "s90", "s91", "s92", "s93", "s94",
1390b57cec5SDimitry Andric   "s95", "s96", "s97", "s98", "s99", "s100", "s101", "s102", "s103",
1400b57cec5SDimitry Andric   "s104", "s105", "s106", "s107", "s108", "s109", "s110", "s111", "s112",
1410b57cec5SDimitry Andric   "s113", "s114", "s115", "s116", "s117", "s118", "s119", "s120", "s121",
1420b57cec5SDimitry Andric   "s122", "s123", "s124", "s125", "s126", "s127", "exec", "vcc", "scc",
1430b57cec5SDimitry Andric   "m0", "flat_scratch", "exec_lo", "exec_hi", "vcc_lo", "vcc_hi",
1445ffd83dbSDimitry Andric   "flat_scratch_lo", "flat_scratch_hi",
1455ffd83dbSDimitry Andric   "a0", "a1", "a2", "a3", "a4", "a5", "a6", "a7", "a8",
1465ffd83dbSDimitry Andric   "a9", "a10", "a11", "a12", "a13", "a14", "a15", "a16", "a17",
1475ffd83dbSDimitry Andric   "a18", "a19", "a20", "a21", "a22", "a23", "a24", "a25", "a26",
1485ffd83dbSDimitry Andric   "a27", "a28", "a29", "a30", "a31", "a32", "a33", "a34", "a35",
1495ffd83dbSDimitry Andric   "a36", "a37", "a38", "a39", "a40", "a41", "a42", "a43", "a44",
1505ffd83dbSDimitry Andric   "a45", "a46", "a47", "a48", "a49", "a50", "a51", "a52", "a53",
1515ffd83dbSDimitry Andric   "a54", "a55", "a56", "a57", "a58", "a59", "a60", "a61", "a62",
1525ffd83dbSDimitry Andric   "a63", "a64", "a65", "a66", "a67", "a68", "a69", "a70", "a71",
1535ffd83dbSDimitry Andric   "a72", "a73", "a74", "a75", "a76", "a77", "a78", "a79", "a80",
1545ffd83dbSDimitry Andric   "a81", "a82", "a83", "a84", "a85", "a86", "a87", "a88", "a89",
1555ffd83dbSDimitry Andric   "a90", "a91", "a92", "a93", "a94", "a95", "a96", "a97", "a98",
1565ffd83dbSDimitry Andric   "a99", "a100", "a101", "a102", "a103", "a104", "a105", "a106", "a107",
1575ffd83dbSDimitry Andric   "a108", "a109", "a110", "a111", "a112", "a113", "a114", "a115", "a116",
1585ffd83dbSDimitry Andric   "a117", "a118", "a119", "a120", "a121", "a122", "a123", "a124", "a125",
1595ffd83dbSDimitry Andric   "a126", "a127", "a128", "a129", "a130", "a131", "a132", "a133", "a134",
1605ffd83dbSDimitry Andric   "a135", "a136", "a137", "a138", "a139", "a140", "a141", "a142", "a143",
1615ffd83dbSDimitry Andric   "a144", "a145", "a146", "a147", "a148", "a149", "a150", "a151", "a152",
1625ffd83dbSDimitry Andric   "a153", "a154", "a155", "a156", "a157", "a158", "a159", "a160", "a161",
1635ffd83dbSDimitry Andric   "a162", "a163", "a164", "a165", "a166", "a167", "a168", "a169", "a170",
1645ffd83dbSDimitry Andric   "a171", "a172", "a173", "a174", "a175", "a176", "a177", "a178", "a179",
1655ffd83dbSDimitry Andric   "a180", "a181", "a182", "a183", "a184", "a185", "a186", "a187", "a188",
1665ffd83dbSDimitry Andric   "a189", "a190", "a191", "a192", "a193", "a194", "a195", "a196", "a197",
1675ffd83dbSDimitry Andric   "a198", "a199", "a200", "a201", "a202", "a203", "a204", "a205", "a206",
1685ffd83dbSDimitry Andric   "a207", "a208", "a209", "a210", "a211", "a212", "a213", "a214", "a215",
1695ffd83dbSDimitry Andric   "a216", "a217", "a218", "a219", "a220", "a221", "a222", "a223", "a224",
1705ffd83dbSDimitry Andric   "a225", "a226", "a227", "a228", "a229", "a230", "a231", "a232", "a233",
1715ffd83dbSDimitry Andric   "a234", "a235", "a236", "a237", "a238", "a239", "a240", "a241", "a242",
1725ffd83dbSDimitry Andric   "a243", "a244", "a245", "a246", "a247", "a248", "a249", "a250", "a251",
1735ffd83dbSDimitry Andric   "a252", "a253", "a254", "a255"
1740b57cec5SDimitry Andric };
1750b57cec5SDimitry Andric 
getGCCRegNames() const1760b57cec5SDimitry Andric ArrayRef<const char *> AMDGPUTargetInfo::getGCCRegNames() const {
177bdd1243dSDimitry Andric   return llvm::ArrayRef(GCCRegNames);
1780b57cec5SDimitry Andric }
1790b57cec5SDimitry Andric 
initFeatureMap(llvm::StringMap<bool> & Features,DiagnosticsEngine & Diags,StringRef CPU,const std::vector<std::string> & FeatureVec) const1800b57cec5SDimitry Andric bool AMDGPUTargetInfo::initFeatureMap(
1810b57cec5SDimitry Andric     llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags, StringRef CPU,
1820b57cec5SDimitry Andric     const std::vector<std::string> &FeatureVec) const {
1830b57cec5SDimitry Andric 
1840b57cec5SDimitry Andric   using namespace llvm::AMDGPU;
18506c3fb27SDimitry Andric   fillAMDGPUFeatureMap(CPU, getTriple(), Features);
186bdd1243dSDimitry Andric   if (!TargetInfo::initFeatureMap(Features, Diags, CPU, FeatureVec))
187bdd1243dSDimitry Andric     return false;
188bdd1243dSDimitry Andric 
189bdd1243dSDimitry Andric   // TODO: Should move this logic into TargetParser
190*0fca6ea1SDimitry Andric   auto HasError = insertWaveSizeFeature(CPU, getTriple(), Features);
191*0fca6ea1SDimitry Andric   switch (HasError.first) {
192*0fca6ea1SDimitry Andric   default:
193*0fca6ea1SDimitry Andric     break;
194*0fca6ea1SDimitry Andric   case llvm::AMDGPU::INVALID_FEATURE_COMBINATION:
195*0fca6ea1SDimitry Andric     Diags.Report(diag::err_invalid_feature_combination) << HasError.second;
196*0fca6ea1SDimitry Andric     return false;
197*0fca6ea1SDimitry Andric   case llvm::AMDGPU::UNSUPPORTED_TARGET_FEATURE:
198*0fca6ea1SDimitry Andric     Diags.Report(diag::err_opt_not_valid_on_target) << HasError.second;
199bdd1243dSDimitry Andric     return false;
200bdd1243dSDimitry Andric   }
201bdd1243dSDimitry Andric 
202bdd1243dSDimitry Andric   return true;
2030b57cec5SDimitry Andric }
2040b57cec5SDimitry Andric 
fillValidCPUList(SmallVectorImpl<StringRef> & Values) const2050b57cec5SDimitry Andric void AMDGPUTargetInfo::fillValidCPUList(
2060b57cec5SDimitry Andric     SmallVectorImpl<StringRef> &Values) const {
2070b57cec5SDimitry Andric   if (isAMDGCN(getTriple()))
2080b57cec5SDimitry Andric     llvm::AMDGPU::fillValidArchListAMDGCN(Values);
2090b57cec5SDimitry Andric   else
2100b57cec5SDimitry Andric     llvm::AMDGPU::fillValidArchListR600(Values);
2110b57cec5SDimitry Andric }
2120b57cec5SDimitry Andric 
setAddressSpaceMap(bool DefaultIsPrivate)2130b57cec5SDimitry Andric void AMDGPUTargetInfo::setAddressSpaceMap(bool DefaultIsPrivate) {
2140b57cec5SDimitry Andric   AddrSpaceMap = DefaultIsPrivate ? &AMDGPUDefIsPrivMap : &AMDGPUDefIsGenMap;
2150b57cec5SDimitry Andric }
2160b57cec5SDimitry Andric 
AMDGPUTargetInfo(const llvm::Triple & Triple,const TargetOptions & Opts)2170b57cec5SDimitry Andric AMDGPUTargetInfo::AMDGPUTargetInfo(const llvm::Triple &Triple,
2180b57cec5SDimitry Andric                                    const TargetOptions &Opts)
2190b57cec5SDimitry Andric     : TargetInfo(Triple),
2200b57cec5SDimitry Andric       GPUKind(isAMDGCN(Triple) ?
2210b57cec5SDimitry Andric               llvm::AMDGPU::parseArchAMDGCN(Opts.CPU) :
2220b57cec5SDimitry Andric               llvm::AMDGPU::parseArchR600(Opts.CPU)),
2230b57cec5SDimitry Andric       GPUFeatures(isAMDGCN(Triple) ?
2240b57cec5SDimitry Andric                   llvm::AMDGPU::getArchAttrAMDGCN(GPUKind) :
2250b57cec5SDimitry Andric                   llvm::AMDGPU::getArchAttrR600(GPUKind)) {
2260b57cec5SDimitry Andric   resetDataLayout(isAMDGCN(getTriple()) ? DataLayoutStringAMDGCN
2270b57cec5SDimitry Andric                                         : DataLayoutStringR600);
2280b57cec5SDimitry Andric 
2290b57cec5SDimitry Andric   setAddressSpaceMap(Triple.getOS() == llvm::Triple::Mesa3D ||
2300b57cec5SDimitry Andric                      !isAMDGCN(Triple));
2310b57cec5SDimitry Andric   UseAddrSpaceMapMangling = true;
2320b57cec5SDimitry Andric 
233bdd1243dSDimitry Andric   if (isAMDGCN(Triple)) {
234bdd1243dSDimitry Andric     // __bf16 is always available as a load/store only type on AMDGCN.
235bdd1243dSDimitry Andric     BFloat16Width = BFloat16Align = 16;
236bdd1243dSDimitry Andric     BFloat16Format = &llvm::APFloat::BFloat();
237bdd1243dSDimitry Andric   }
238bdd1243dSDimitry Andric 
2390b57cec5SDimitry Andric   HasLegalHalfType = true;
2400b57cec5SDimitry Andric   HasFloat16 = true;
241*0fca6ea1SDimitry Andric   WavefrontSize = (GPUFeatures & llvm::AMDGPU::FEATURE_WAVE32) ? 32 : 64;
242e8d8bef9SDimitry Andric   AllowAMDGPUUnsafeFPAtomics = Opts.AllowAMDGPUUnsafeFPAtomics;
2430b57cec5SDimitry Andric 
244bdd1243dSDimitry Andric   // Set pointer width and alignment for the generic address space.
245bdd1243dSDimitry Andric   PointerWidth = PointerAlign = getPointerWidthV(LangAS::Default);
2460b57cec5SDimitry Andric   if (getMaxPointerWidth() == 64) {
2470b57cec5SDimitry Andric     LongWidth = LongAlign = 64;
2480b57cec5SDimitry Andric     SizeType = UnsignedLong;
2490b57cec5SDimitry Andric     PtrDiffType = SignedLong;
2500b57cec5SDimitry Andric     IntPtrType = SignedLong;
2510b57cec5SDimitry Andric   }
2520b57cec5SDimitry Andric 
2530b57cec5SDimitry Andric   MaxAtomicPromoteWidth = MaxAtomicInlineWidth = 64;
25406c3fb27SDimitry Andric   CUMode = !(GPUFeatures & llvm::AMDGPU::FEATURE_WGP);
2555f757f3fSDimitry Andric   for (auto F : {"image-insts", "gws"})
2565f757f3fSDimitry Andric     ReadOnlyFeatures.insert(F);
2575f757f3fSDimitry Andric   HalfArgsAndReturns = true;
2580b57cec5SDimitry Andric }
2590b57cec5SDimitry Andric 
adjust(DiagnosticsEngine & Diags,LangOptions & Opts)260fe6060f1SDimitry Andric void AMDGPUTargetInfo::adjust(DiagnosticsEngine &Diags, LangOptions &Opts) {
261fe6060f1SDimitry Andric   TargetInfo::adjust(Diags, Opts);
2620b57cec5SDimitry Andric   // ToDo: There are still a few places using default address space as private
2630b57cec5SDimitry Andric   // address space in OpenCL, which needs to be cleaned up, then Opts.OpenCL
2640b57cec5SDimitry Andric   // can be removed from the following line.
2650b57cec5SDimitry Andric   setAddressSpaceMap(/*DefaultIsPrivate=*/Opts.OpenCL ||
2660b57cec5SDimitry Andric                      !isAMDGCN(getTriple()));
2670b57cec5SDimitry Andric }
2680b57cec5SDimitry Andric 
getTargetBuiltins() const2690b57cec5SDimitry Andric ArrayRef<Builtin::Info> AMDGPUTargetInfo::getTargetBuiltins() const {
270bdd1243dSDimitry Andric   return llvm::ArrayRef(BuiltinInfo,
271bdd1243dSDimitry Andric                         clang::AMDGPU::LastTSBuiltin - Builtin::FirstTSBuiltin);
2720b57cec5SDimitry Andric }
2730b57cec5SDimitry Andric 
getTargetDefines(const LangOptions & Opts,MacroBuilder & Builder) const2740b57cec5SDimitry Andric void AMDGPUTargetInfo::getTargetDefines(const LangOptions &Opts,
2750b57cec5SDimitry Andric                                         MacroBuilder &Builder) const {
2760b57cec5SDimitry Andric   Builder.defineMacro("__AMD__");
2770b57cec5SDimitry Andric   Builder.defineMacro("__AMDGPU__");
2780b57cec5SDimitry Andric 
2790b57cec5SDimitry Andric   if (isAMDGCN(getTriple()))
2800b57cec5SDimitry Andric     Builder.defineMacro("__AMDGCN__");
2810b57cec5SDimitry Andric   else
2820b57cec5SDimitry Andric     Builder.defineMacro("__R600__");
2830b57cec5SDimitry Andric 
284*0fca6ea1SDimitry Andric   // Legacy HIP host code relies on these default attributes to be defined.
285*0fca6ea1SDimitry Andric   bool IsHIPHost = Opts.HIP && !Opts.CUDAIsDevice;
286*0fca6ea1SDimitry Andric   if (GPUKind == llvm::AMDGPU::GK_NONE && !IsHIPHost)
287*0fca6ea1SDimitry Andric     return;
288*0fca6ea1SDimitry Andric 
289*0fca6ea1SDimitry Andric   llvm::SmallString<16> CanonName =
290*0fca6ea1SDimitry Andric       (isAMDGCN(getTriple()) ? getArchNameAMDGCN(GPUKind)
291*0fca6ea1SDimitry Andric                              : getArchNameR600(GPUKind));
292*0fca6ea1SDimitry Andric 
293*0fca6ea1SDimitry Andric   // Sanitize the name of generic targets.
294*0fca6ea1SDimitry Andric   // e.g. gfx10-1-generic -> gfx10_1_generic
295*0fca6ea1SDimitry Andric   if (GPUKind >= llvm::AMDGPU::GK_AMDGCN_GENERIC_FIRST &&
296*0fca6ea1SDimitry Andric       GPUKind <= llvm::AMDGPU::GK_AMDGCN_GENERIC_LAST) {
297*0fca6ea1SDimitry Andric     std::replace(CanonName.begin(), CanonName.end(), '-', '_');
298*0fca6ea1SDimitry Andric   }
299*0fca6ea1SDimitry Andric 
3000b57cec5SDimitry Andric   Builder.defineMacro(Twine("__") + Twine(CanonName) + Twine("__"));
30181ad6265SDimitry Andric   // Emit macros for gfx family e.g. gfx906 -> __GFX9__, gfx1030 -> __GFX10___
302*0fca6ea1SDimitry Andric   if (isAMDGCN(getTriple()) && !IsHIPHost) {
303*0fca6ea1SDimitry Andric     assert(StringRef(CanonName).starts_with("gfx") &&
304*0fca6ea1SDimitry Andric            "Invalid amdgcn canonical name");
305*0fca6ea1SDimitry Andric     StringRef CanonFamilyName = getArchFamilyNameAMDGCN(GPUKind);
306*0fca6ea1SDimitry Andric     Builder.defineMacro(Twine("__") + Twine(CanonFamilyName.upper()) +
30781ad6265SDimitry Andric                         Twine("__"));
308e8d8bef9SDimitry Andric     Builder.defineMacro("__amdgcn_processor__",
309e8d8bef9SDimitry Andric                         Twine("\"") + Twine(CanonName) + Twine("\""));
310e8d8bef9SDimitry Andric     Builder.defineMacro("__amdgcn_target_id__",
31181ad6265SDimitry Andric                         Twine("\"") + Twine(*getTargetID()) + Twine("\""));
312e8d8bef9SDimitry Andric     for (auto F : getAllPossibleTargetIDFeatures(getTriple(), CanonName)) {
313e8d8bef9SDimitry Andric       auto Loc = OffloadArchFeatures.find(F);
314e8d8bef9SDimitry Andric       if (Loc != OffloadArchFeatures.end()) {
315e8d8bef9SDimitry Andric         std::string NewF = F.str();
316e8d8bef9SDimitry Andric         std::replace(NewF.begin(), NewF.end(), '-', '_');
317e8d8bef9SDimitry Andric         Builder.defineMacro(Twine("__amdgcn_feature_") + Twine(NewF) +
318e8d8bef9SDimitry Andric                                 Twine("__"),
319e8d8bef9SDimitry Andric                             Loc->second ? "1" : "0");
320e8d8bef9SDimitry Andric       }
321e8d8bef9SDimitry Andric     }
322e8d8bef9SDimitry Andric   }
3230b57cec5SDimitry Andric 
32481ad6265SDimitry Andric   if (AllowAMDGPUUnsafeFPAtomics)
32581ad6265SDimitry Andric     Builder.defineMacro("__AMDGCN_UNSAFE_FP_ATOMICS__");
32681ad6265SDimitry Andric 
3270b57cec5SDimitry Andric   // TODO: __HAS_FMAF__, __HAS_LDEXPF__, __HAS_FP64__ are deprecated and will be
3280b57cec5SDimitry Andric   // removed in the near future.
3290b57cec5SDimitry Andric   if (hasFMAF())
3300b57cec5SDimitry Andric     Builder.defineMacro("__HAS_FMAF__");
3310b57cec5SDimitry Andric   if (hasFastFMAF())
3320b57cec5SDimitry Andric     Builder.defineMacro("FP_FAST_FMAF");
3330b57cec5SDimitry Andric   if (hasLDEXPF())
3340b57cec5SDimitry Andric     Builder.defineMacro("__HAS_LDEXPF__");
3350b57cec5SDimitry Andric   if (hasFP64())
3360b57cec5SDimitry Andric     Builder.defineMacro("__HAS_FP64__");
3370b57cec5SDimitry Andric   if (hasFastFMA())
3380b57cec5SDimitry Andric     Builder.defineMacro("FP_FAST_FMA");
339e8d8bef9SDimitry Andric 
34006c3fb27SDimitry Andric   Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE__", Twine(WavefrontSize));
34106c3fb27SDimitry Andric   // ToDo: deprecate this macro for naming consistency.
342e8d8bef9SDimitry Andric   Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE", Twine(WavefrontSize));
34306c3fb27SDimitry Andric   Builder.defineMacro("__AMDGCN_CUMODE__", Twine(CUMode));
3440b57cec5SDimitry Andric }
3450b57cec5SDimitry Andric 
setAuxTarget(const TargetInfo * Aux)3460b57cec5SDimitry Andric void AMDGPUTargetInfo::setAuxTarget(const TargetInfo *Aux) {
3470b57cec5SDimitry Andric   assert(HalfFormat == Aux->HalfFormat);
3480b57cec5SDimitry Andric   assert(FloatFormat == Aux->FloatFormat);
3490b57cec5SDimitry Andric   assert(DoubleFormat == Aux->DoubleFormat);
3500b57cec5SDimitry Andric 
3510b57cec5SDimitry Andric   // On x86_64 long double is 80-bit extended precision format, which is
3520b57cec5SDimitry Andric   // not supported by AMDGPU. 128-bit floating point format is also not
3530b57cec5SDimitry Andric   // supported by AMDGPU. Therefore keep its own format for these two types.
3540b57cec5SDimitry Andric   auto SaveLongDoubleFormat = LongDoubleFormat;
3550b57cec5SDimitry Andric   auto SaveFloat128Format = Float128Format;
35681ad6265SDimitry Andric   auto SaveLongDoubleWidth = LongDoubleWidth;
35781ad6265SDimitry Andric   auto SaveLongDoubleAlign = LongDoubleAlign;
3580b57cec5SDimitry Andric   copyAuxTarget(Aux);
3590b57cec5SDimitry Andric   LongDoubleFormat = SaveLongDoubleFormat;
3600b57cec5SDimitry Andric   Float128Format = SaveFloat128Format;
36181ad6265SDimitry Andric   LongDoubleWidth = SaveLongDoubleWidth;
36281ad6265SDimitry Andric   LongDoubleAlign = SaveLongDoubleAlign;
3635ffd83dbSDimitry Andric   // For certain builtin types support on the host target, claim they are
3645ffd83dbSDimitry Andric   // support to pass the compilation of the host code during the device-side
3655ffd83dbSDimitry Andric   // compilation.
3665ffd83dbSDimitry Andric   // FIXME: As the side effect, we also accept `__float128` uses in the device
3675ffd83dbSDimitry Andric   // code. To rejct these builtin types supported in the host target but not in
3685ffd83dbSDimitry Andric   // the device target, one approach would support `device_builtin` attribute
3695ffd83dbSDimitry Andric   // so that we could tell the device builtin types from the host ones. The
3705ffd83dbSDimitry Andric   // also solves the different representations of the same builtin type, such
3715ffd83dbSDimitry Andric   // as `size_t` in the MSVC environment.
3725ffd83dbSDimitry Andric   if (Aux->hasFloat128Type()) {
3735ffd83dbSDimitry Andric     HasFloat128 = true;
3745ffd83dbSDimitry Andric     Float128Format = DoubleFormat;
3755ffd83dbSDimitry Andric   }
3760b57cec5SDimitry Andric }
377