10b57cec5SDimitry Andric //===--- AMDGPU.cpp - Implement AMDGPU target feature support -------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file implements AMDGPU TargetInfo objects.
100b57cec5SDimitry Andric //
110b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric
130b57cec5SDimitry Andric #include "AMDGPU.h"
140b57cec5SDimitry Andric #include "clang/Basic/Builtins.h"
150b57cec5SDimitry Andric #include "clang/Basic/CodeGenOptions.h"
16bdd1243dSDimitry Andric #include "clang/Basic/Diagnostic.h"
170b57cec5SDimitry Andric #include "clang/Basic/LangOptions.h"
180b57cec5SDimitry Andric #include "clang/Basic/MacroBuilder.h"
190b57cec5SDimitry Andric #include "clang/Basic/TargetBuiltins.h"
20*0fca6ea1SDimitry Andric #include "llvm/ADT/SmallString.h"
210b57cec5SDimitry Andric using namespace clang;
220b57cec5SDimitry Andric using namespace clang::targets;
230b57cec5SDimitry Andric
240b57cec5SDimitry Andric namespace clang {
250b57cec5SDimitry Andric namespace targets {
260b57cec5SDimitry Andric
270b57cec5SDimitry Andric // If you edit the description strings, make sure you update
280b57cec5SDimitry Andric // getPointerWidthV().
290b57cec5SDimitry Andric
// LLVM data layout description used for R600 (non-amdgcn) triples. The
// literal is split one layout component (or component family) per line; the
// concatenated string is what gets handed to resetDataLayout().
static const char *const DataLayoutStringR600 =
    "e"        // little-endian
    "-p:32:32" // default pointers: 32-bit size, 32-bit ABI alignment
    "-i64:64"  // i64 ABI alignment
    "-v16:16-v24:32-v32:32-v48:64-v96:128"              // vector alignments
    "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048" // (continued)
    "-n32:64"                                           // native int widths
    "-S32"                                              // stack alignment
    "-A5"                                               // alloca addrspace
    "-G1";                                              // globals addrspace
330b57cec5SDimitry Andric
// LLVM data layout description used for amdgcn triples. The literal is split
// one layout component (or component family) per line; the concatenated
// string is what gets handed to resetDataLayout().
static const char *const DataLayoutStringAMDGCN =
    "e"        // little-endian
    "-p:64:64" // default (addrspace 0) pointers: 64-bit
    "-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32" // addrspaces 1-6
    "-p7:160:256:256:32-p8:128:128-p9:192:256:256:32"        // addrspaces 7-9
    "-i64:64"                                                // i64 alignment
    "-v16:16-v24:32-v32:32-v48:64-v96:128"              // vector alignments
    "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048" // (continued)
    "-n32:64"                                           // native int widths
    "-S32"                                              // stack alignment
    "-A5"                                               // alloca addrspace
    "-G1"                                               // globals addrspace
    "-ni:7:8:9"; // non-integral pointer address spaces
400b57cec5SDimitry Andric
410b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsGenMap = {
425f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // Default
435f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global
445f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // opencl_local
455f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
465f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // opencl_private
475f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // opencl_generic
485f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_device
495f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_host
505f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // cuda_device
515f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
525f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // cuda_shared
535f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // sycl_global
545f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // sycl_global_device
555f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // sycl_global_host
565f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // sycl_local
575f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // sycl_private
585f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_sptr
595f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_uptr
605f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr64
615f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // hlsl_groupshared
620b57cec5SDimitry Andric };
630b57cec5SDimitry Andric
640b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsPrivMap = {
655f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // Default
665f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global
675f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // opencl_local
685f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
695f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // opencl_private
705f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // opencl_generic
715f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_device
725f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_host
735f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // cuda_device
745f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
755f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // cuda_shared
76fe6060f1SDimitry Andric // SYCL address space values for this map are dummy
775f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global
785f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_device
795f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_host
805f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_local
815f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_private
825f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_sptr
835f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_uptr
845f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr64
855f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // hlsl_groupshared
86480093f4SDimitry Andric
870b57cec5SDimitry Andric };
880b57cec5SDimitry Andric } // namespace targets
890b57cec5SDimitry Andric } // namespace clang
900b57cec5SDimitry Andric
91bdd1243dSDimitry Andric static constexpr Builtin::Info BuiltinInfo[] = {
920b57cec5SDimitry Andric #define BUILTIN(ID, TYPE, ATTRS) \
93bdd1243dSDimitry Andric {#ID, TYPE, ATTRS, nullptr, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
940b57cec5SDimitry Andric #define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE) \
95bdd1243dSDimitry Andric {#ID, TYPE, ATTRS, FEATURE, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
960b57cec5SDimitry Andric #include "clang/Basic/BuiltinsAMDGPU.def"
970b57cec5SDimitry Andric };
980b57cec5SDimitry Andric
990b57cec5SDimitry Andric const char *const AMDGPUTargetInfo::GCCRegNames[] = {
1000b57cec5SDimitry Andric "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7", "v8",
1010b57cec5SDimitry Andric "v9", "v10", "v11", "v12", "v13", "v14", "v15", "v16", "v17",
1020b57cec5SDimitry Andric "v18", "v19", "v20", "v21", "v22", "v23", "v24", "v25", "v26",
1030b57cec5SDimitry Andric "v27", "v28", "v29", "v30", "v31", "v32", "v33", "v34", "v35",
1040b57cec5SDimitry Andric "v36", "v37", "v38", "v39", "v40", "v41", "v42", "v43", "v44",
1050b57cec5SDimitry Andric "v45", "v46", "v47", "v48", "v49", "v50", "v51", "v52", "v53",
1060b57cec5SDimitry Andric "v54", "v55", "v56", "v57", "v58", "v59", "v60", "v61", "v62",
1070b57cec5SDimitry Andric "v63", "v64", "v65", "v66", "v67", "v68", "v69", "v70", "v71",
1080b57cec5SDimitry Andric "v72", "v73", "v74", "v75", "v76", "v77", "v78", "v79", "v80",
1090b57cec5SDimitry Andric "v81", "v82", "v83", "v84", "v85", "v86", "v87", "v88", "v89",
1100b57cec5SDimitry Andric "v90", "v91", "v92", "v93", "v94", "v95", "v96", "v97", "v98",
1110b57cec5SDimitry Andric "v99", "v100", "v101", "v102", "v103", "v104", "v105", "v106", "v107",
1120b57cec5SDimitry Andric "v108", "v109", "v110", "v111", "v112", "v113", "v114", "v115", "v116",
1130b57cec5SDimitry Andric "v117", "v118", "v119", "v120", "v121", "v122", "v123", "v124", "v125",
1140b57cec5SDimitry Andric "v126", "v127", "v128", "v129", "v130", "v131", "v132", "v133", "v134",
1150b57cec5SDimitry Andric "v135", "v136", "v137", "v138", "v139", "v140", "v141", "v142", "v143",
1160b57cec5SDimitry Andric "v144", "v145", "v146", "v147", "v148", "v149", "v150", "v151", "v152",
1170b57cec5SDimitry Andric "v153", "v154", "v155", "v156", "v157", "v158", "v159", "v160", "v161",
1180b57cec5SDimitry Andric "v162", "v163", "v164", "v165", "v166", "v167", "v168", "v169", "v170",
1190b57cec5SDimitry Andric "v171", "v172", "v173", "v174", "v175", "v176", "v177", "v178", "v179",
1200b57cec5SDimitry Andric "v180", "v181", "v182", "v183", "v184", "v185", "v186", "v187", "v188",
1210b57cec5SDimitry Andric "v189", "v190", "v191", "v192", "v193", "v194", "v195", "v196", "v197",
1220b57cec5SDimitry Andric "v198", "v199", "v200", "v201", "v202", "v203", "v204", "v205", "v206",
1230b57cec5SDimitry Andric "v207", "v208", "v209", "v210", "v211", "v212", "v213", "v214", "v215",
1240b57cec5SDimitry Andric "v216", "v217", "v218", "v219", "v220", "v221", "v222", "v223", "v224",
1250b57cec5SDimitry Andric "v225", "v226", "v227", "v228", "v229", "v230", "v231", "v232", "v233",
1260b57cec5SDimitry Andric "v234", "v235", "v236", "v237", "v238", "v239", "v240", "v241", "v242",
1270b57cec5SDimitry Andric "v243", "v244", "v245", "v246", "v247", "v248", "v249", "v250", "v251",
1280b57cec5SDimitry Andric "v252", "v253", "v254", "v255", "s0", "s1", "s2", "s3", "s4",
1290b57cec5SDimitry Andric "s5", "s6", "s7", "s8", "s9", "s10", "s11", "s12", "s13",
1300b57cec5SDimitry Andric "s14", "s15", "s16", "s17", "s18", "s19", "s20", "s21", "s22",
1310b57cec5SDimitry Andric "s23", "s24", "s25", "s26", "s27", "s28", "s29", "s30", "s31",
1320b57cec5SDimitry Andric "s32", "s33", "s34", "s35", "s36", "s37", "s38", "s39", "s40",
1330b57cec5SDimitry Andric "s41", "s42", "s43", "s44", "s45", "s46", "s47", "s48", "s49",
1340b57cec5SDimitry Andric "s50", "s51", "s52", "s53", "s54", "s55", "s56", "s57", "s58",
1350b57cec5SDimitry Andric "s59", "s60", "s61", "s62", "s63", "s64", "s65", "s66", "s67",
1360b57cec5SDimitry Andric "s68", "s69", "s70", "s71", "s72", "s73", "s74", "s75", "s76",
1370b57cec5SDimitry Andric "s77", "s78", "s79", "s80", "s81", "s82", "s83", "s84", "s85",
1380b57cec5SDimitry Andric "s86", "s87", "s88", "s89", "s90", "s91", "s92", "s93", "s94",
1390b57cec5SDimitry Andric "s95", "s96", "s97", "s98", "s99", "s100", "s101", "s102", "s103",
1400b57cec5SDimitry Andric "s104", "s105", "s106", "s107", "s108", "s109", "s110", "s111", "s112",
1410b57cec5SDimitry Andric "s113", "s114", "s115", "s116", "s117", "s118", "s119", "s120", "s121",
1420b57cec5SDimitry Andric "s122", "s123", "s124", "s125", "s126", "s127", "exec", "vcc", "scc",
1430b57cec5SDimitry Andric "m0", "flat_scratch", "exec_lo", "exec_hi", "vcc_lo", "vcc_hi",
1445ffd83dbSDimitry Andric "flat_scratch_lo", "flat_scratch_hi",
1455ffd83dbSDimitry Andric "a0", "a1", "a2", "a3", "a4", "a5", "a6", "a7", "a8",
1465ffd83dbSDimitry Andric "a9", "a10", "a11", "a12", "a13", "a14", "a15", "a16", "a17",
1475ffd83dbSDimitry Andric "a18", "a19", "a20", "a21", "a22", "a23", "a24", "a25", "a26",
1485ffd83dbSDimitry Andric "a27", "a28", "a29", "a30", "a31", "a32", "a33", "a34", "a35",
1495ffd83dbSDimitry Andric "a36", "a37", "a38", "a39", "a40", "a41", "a42", "a43", "a44",
1505ffd83dbSDimitry Andric "a45", "a46", "a47", "a48", "a49", "a50", "a51", "a52", "a53",
1515ffd83dbSDimitry Andric "a54", "a55", "a56", "a57", "a58", "a59", "a60", "a61", "a62",
1525ffd83dbSDimitry Andric "a63", "a64", "a65", "a66", "a67", "a68", "a69", "a70", "a71",
1535ffd83dbSDimitry Andric "a72", "a73", "a74", "a75", "a76", "a77", "a78", "a79", "a80",
1545ffd83dbSDimitry Andric "a81", "a82", "a83", "a84", "a85", "a86", "a87", "a88", "a89",
1555ffd83dbSDimitry Andric "a90", "a91", "a92", "a93", "a94", "a95", "a96", "a97", "a98",
1565ffd83dbSDimitry Andric "a99", "a100", "a101", "a102", "a103", "a104", "a105", "a106", "a107",
1575ffd83dbSDimitry Andric "a108", "a109", "a110", "a111", "a112", "a113", "a114", "a115", "a116",
1585ffd83dbSDimitry Andric "a117", "a118", "a119", "a120", "a121", "a122", "a123", "a124", "a125",
1595ffd83dbSDimitry Andric "a126", "a127", "a128", "a129", "a130", "a131", "a132", "a133", "a134",
1605ffd83dbSDimitry Andric "a135", "a136", "a137", "a138", "a139", "a140", "a141", "a142", "a143",
1615ffd83dbSDimitry Andric "a144", "a145", "a146", "a147", "a148", "a149", "a150", "a151", "a152",
1625ffd83dbSDimitry Andric "a153", "a154", "a155", "a156", "a157", "a158", "a159", "a160", "a161",
1635ffd83dbSDimitry Andric "a162", "a163", "a164", "a165", "a166", "a167", "a168", "a169", "a170",
1645ffd83dbSDimitry Andric "a171", "a172", "a173", "a174", "a175", "a176", "a177", "a178", "a179",
1655ffd83dbSDimitry Andric "a180", "a181", "a182", "a183", "a184", "a185", "a186", "a187", "a188",
1665ffd83dbSDimitry Andric "a189", "a190", "a191", "a192", "a193", "a194", "a195", "a196", "a197",
1675ffd83dbSDimitry Andric "a198", "a199", "a200", "a201", "a202", "a203", "a204", "a205", "a206",
1685ffd83dbSDimitry Andric "a207", "a208", "a209", "a210", "a211", "a212", "a213", "a214", "a215",
1695ffd83dbSDimitry Andric "a216", "a217", "a218", "a219", "a220", "a221", "a222", "a223", "a224",
1705ffd83dbSDimitry Andric "a225", "a226", "a227", "a228", "a229", "a230", "a231", "a232", "a233",
1715ffd83dbSDimitry Andric "a234", "a235", "a236", "a237", "a238", "a239", "a240", "a241", "a242",
1725ffd83dbSDimitry Andric "a243", "a244", "a245", "a246", "a247", "a248", "a249", "a250", "a251",
1735ffd83dbSDimitry Andric "a252", "a253", "a254", "a255"
1740b57cec5SDimitry Andric };
1750b57cec5SDimitry Andric
getGCCRegNames() const1760b57cec5SDimitry Andric ArrayRef<const char *> AMDGPUTargetInfo::getGCCRegNames() const {
177bdd1243dSDimitry Andric return llvm::ArrayRef(GCCRegNames);
1780b57cec5SDimitry Andric }
1790b57cec5SDimitry Andric
initFeatureMap(llvm::StringMap<bool> & Features,DiagnosticsEngine & Diags,StringRef CPU,const std::vector<std::string> & FeatureVec) const1800b57cec5SDimitry Andric bool AMDGPUTargetInfo::initFeatureMap(
1810b57cec5SDimitry Andric llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags, StringRef CPU,
1820b57cec5SDimitry Andric const std::vector<std::string> &FeatureVec) const {
1830b57cec5SDimitry Andric
1840b57cec5SDimitry Andric using namespace llvm::AMDGPU;
18506c3fb27SDimitry Andric fillAMDGPUFeatureMap(CPU, getTriple(), Features);
186bdd1243dSDimitry Andric if (!TargetInfo::initFeatureMap(Features, Diags, CPU, FeatureVec))
187bdd1243dSDimitry Andric return false;
188bdd1243dSDimitry Andric
189bdd1243dSDimitry Andric // TODO: Should move this logic into TargetParser
190*0fca6ea1SDimitry Andric auto HasError = insertWaveSizeFeature(CPU, getTriple(), Features);
191*0fca6ea1SDimitry Andric switch (HasError.first) {
192*0fca6ea1SDimitry Andric default:
193*0fca6ea1SDimitry Andric break;
194*0fca6ea1SDimitry Andric case llvm::AMDGPU::INVALID_FEATURE_COMBINATION:
195*0fca6ea1SDimitry Andric Diags.Report(diag::err_invalid_feature_combination) << HasError.second;
196*0fca6ea1SDimitry Andric return false;
197*0fca6ea1SDimitry Andric case llvm::AMDGPU::UNSUPPORTED_TARGET_FEATURE:
198*0fca6ea1SDimitry Andric Diags.Report(diag::err_opt_not_valid_on_target) << HasError.second;
199bdd1243dSDimitry Andric return false;
200bdd1243dSDimitry Andric }
201bdd1243dSDimitry Andric
202bdd1243dSDimitry Andric return true;
2030b57cec5SDimitry Andric }
2040b57cec5SDimitry Andric
fillValidCPUList(SmallVectorImpl<StringRef> & Values) const2050b57cec5SDimitry Andric void AMDGPUTargetInfo::fillValidCPUList(
2060b57cec5SDimitry Andric SmallVectorImpl<StringRef> &Values) const {
2070b57cec5SDimitry Andric if (isAMDGCN(getTriple()))
2080b57cec5SDimitry Andric llvm::AMDGPU::fillValidArchListAMDGCN(Values);
2090b57cec5SDimitry Andric else
2100b57cec5SDimitry Andric llvm::AMDGPU::fillValidArchListR600(Values);
2110b57cec5SDimitry Andric }
2120b57cec5SDimitry Andric
setAddressSpaceMap(bool DefaultIsPrivate)2130b57cec5SDimitry Andric void AMDGPUTargetInfo::setAddressSpaceMap(bool DefaultIsPrivate) {
2140b57cec5SDimitry Andric AddrSpaceMap = DefaultIsPrivate ? &AMDGPUDefIsPrivMap : &AMDGPUDefIsGenMap;
2150b57cec5SDimitry Andric }
2160b57cec5SDimitry Andric
AMDGPUTargetInfo(const llvm::Triple & Triple,const TargetOptions & Opts)2170b57cec5SDimitry Andric AMDGPUTargetInfo::AMDGPUTargetInfo(const llvm::Triple &Triple,
2180b57cec5SDimitry Andric const TargetOptions &Opts)
2190b57cec5SDimitry Andric : TargetInfo(Triple),
2200b57cec5SDimitry Andric GPUKind(isAMDGCN(Triple) ?
2210b57cec5SDimitry Andric llvm::AMDGPU::parseArchAMDGCN(Opts.CPU) :
2220b57cec5SDimitry Andric llvm::AMDGPU::parseArchR600(Opts.CPU)),
2230b57cec5SDimitry Andric GPUFeatures(isAMDGCN(Triple) ?
2240b57cec5SDimitry Andric llvm::AMDGPU::getArchAttrAMDGCN(GPUKind) :
2250b57cec5SDimitry Andric llvm::AMDGPU::getArchAttrR600(GPUKind)) {
2260b57cec5SDimitry Andric resetDataLayout(isAMDGCN(getTriple()) ? DataLayoutStringAMDGCN
2270b57cec5SDimitry Andric : DataLayoutStringR600);
2280b57cec5SDimitry Andric
2290b57cec5SDimitry Andric setAddressSpaceMap(Triple.getOS() == llvm::Triple::Mesa3D ||
2300b57cec5SDimitry Andric !isAMDGCN(Triple));
2310b57cec5SDimitry Andric UseAddrSpaceMapMangling = true;
2320b57cec5SDimitry Andric
233bdd1243dSDimitry Andric if (isAMDGCN(Triple)) {
234bdd1243dSDimitry Andric // __bf16 is always available as a load/store only type on AMDGCN.
235bdd1243dSDimitry Andric BFloat16Width = BFloat16Align = 16;
236bdd1243dSDimitry Andric BFloat16Format = &llvm::APFloat::BFloat();
237bdd1243dSDimitry Andric }
238bdd1243dSDimitry Andric
2390b57cec5SDimitry Andric HasLegalHalfType = true;
2400b57cec5SDimitry Andric HasFloat16 = true;
241*0fca6ea1SDimitry Andric WavefrontSize = (GPUFeatures & llvm::AMDGPU::FEATURE_WAVE32) ? 32 : 64;
242e8d8bef9SDimitry Andric AllowAMDGPUUnsafeFPAtomics = Opts.AllowAMDGPUUnsafeFPAtomics;
2430b57cec5SDimitry Andric
244bdd1243dSDimitry Andric // Set pointer width and alignment for the generic address space.
245bdd1243dSDimitry Andric PointerWidth = PointerAlign = getPointerWidthV(LangAS::Default);
2460b57cec5SDimitry Andric if (getMaxPointerWidth() == 64) {
2470b57cec5SDimitry Andric LongWidth = LongAlign = 64;
2480b57cec5SDimitry Andric SizeType = UnsignedLong;
2490b57cec5SDimitry Andric PtrDiffType = SignedLong;
2500b57cec5SDimitry Andric IntPtrType = SignedLong;
2510b57cec5SDimitry Andric }
2520b57cec5SDimitry Andric
2530b57cec5SDimitry Andric MaxAtomicPromoteWidth = MaxAtomicInlineWidth = 64;
25406c3fb27SDimitry Andric CUMode = !(GPUFeatures & llvm::AMDGPU::FEATURE_WGP);
2555f757f3fSDimitry Andric for (auto F : {"image-insts", "gws"})
2565f757f3fSDimitry Andric ReadOnlyFeatures.insert(F);
2575f757f3fSDimitry Andric HalfArgsAndReturns = true;
2580b57cec5SDimitry Andric }
2590b57cec5SDimitry Andric
adjust(DiagnosticsEngine & Diags,LangOptions & Opts)260fe6060f1SDimitry Andric void AMDGPUTargetInfo::adjust(DiagnosticsEngine &Diags, LangOptions &Opts) {
261fe6060f1SDimitry Andric TargetInfo::adjust(Diags, Opts);
2620b57cec5SDimitry Andric // ToDo: There are still a few places using default address space as private
2630b57cec5SDimitry Andric // address space in OpenCL, which needs to be cleaned up, then Opts.OpenCL
2640b57cec5SDimitry Andric // can be removed from the following line.
2650b57cec5SDimitry Andric setAddressSpaceMap(/*DefaultIsPrivate=*/Opts.OpenCL ||
2660b57cec5SDimitry Andric !isAMDGCN(getTriple()));
2670b57cec5SDimitry Andric }
2680b57cec5SDimitry Andric
getTargetBuiltins() const2690b57cec5SDimitry Andric ArrayRef<Builtin::Info> AMDGPUTargetInfo::getTargetBuiltins() const {
270bdd1243dSDimitry Andric return llvm::ArrayRef(BuiltinInfo,
271bdd1243dSDimitry Andric clang::AMDGPU::LastTSBuiltin - Builtin::FirstTSBuiltin);
2720b57cec5SDimitry Andric }
2730b57cec5SDimitry Andric
getTargetDefines(const LangOptions & Opts,MacroBuilder & Builder) const2740b57cec5SDimitry Andric void AMDGPUTargetInfo::getTargetDefines(const LangOptions &Opts,
2750b57cec5SDimitry Andric MacroBuilder &Builder) const {
2760b57cec5SDimitry Andric Builder.defineMacro("__AMD__");
2770b57cec5SDimitry Andric Builder.defineMacro("__AMDGPU__");
2780b57cec5SDimitry Andric
2790b57cec5SDimitry Andric if (isAMDGCN(getTriple()))
2800b57cec5SDimitry Andric Builder.defineMacro("__AMDGCN__");
2810b57cec5SDimitry Andric else
2820b57cec5SDimitry Andric Builder.defineMacro("__R600__");
2830b57cec5SDimitry Andric
284*0fca6ea1SDimitry Andric // Legacy HIP host code relies on these default attributes to be defined.
285*0fca6ea1SDimitry Andric bool IsHIPHost = Opts.HIP && !Opts.CUDAIsDevice;
286*0fca6ea1SDimitry Andric if (GPUKind == llvm::AMDGPU::GK_NONE && !IsHIPHost)
287*0fca6ea1SDimitry Andric return;
288*0fca6ea1SDimitry Andric
289*0fca6ea1SDimitry Andric llvm::SmallString<16> CanonName =
290*0fca6ea1SDimitry Andric (isAMDGCN(getTriple()) ? getArchNameAMDGCN(GPUKind)
291*0fca6ea1SDimitry Andric : getArchNameR600(GPUKind));
292*0fca6ea1SDimitry Andric
293*0fca6ea1SDimitry Andric // Sanitize the name of generic targets.
294*0fca6ea1SDimitry Andric // e.g. gfx10-1-generic -> gfx10_1_generic
295*0fca6ea1SDimitry Andric if (GPUKind >= llvm::AMDGPU::GK_AMDGCN_GENERIC_FIRST &&
296*0fca6ea1SDimitry Andric GPUKind <= llvm::AMDGPU::GK_AMDGCN_GENERIC_LAST) {
297*0fca6ea1SDimitry Andric std::replace(CanonName.begin(), CanonName.end(), '-', '_');
298*0fca6ea1SDimitry Andric }
299*0fca6ea1SDimitry Andric
3000b57cec5SDimitry Andric Builder.defineMacro(Twine("__") + Twine(CanonName) + Twine("__"));
30181ad6265SDimitry Andric // Emit macros for gfx family e.g. gfx906 -> __GFX9__, gfx1030 -> __GFX10___
302*0fca6ea1SDimitry Andric if (isAMDGCN(getTriple()) && !IsHIPHost) {
303*0fca6ea1SDimitry Andric assert(StringRef(CanonName).starts_with("gfx") &&
304*0fca6ea1SDimitry Andric "Invalid amdgcn canonical name");
305*0fca6ea1SDimitry Andric StringRef CanonFamilyName = getArchFamilyNameAMDGCN(GPUKind);
306*0fca6ea1SDimitry Andric Builder.defineMacro(Twine("__") + Twine(CanonFamilyName.upper()) +
30781ad6265SDimitry Andric Twine("__"));
308e8d8bef9SDimitry Andric Builder.defineMacro("__amdgcn_processor__",
309e8d8bef9SDimitry Andric Twine("\"") + Twine(CanonName) + Twine("\""));
310e8d8bef9SDimitry Andric Builder.defineMacro("__amdgcn_target_id__",
31181ad6265SDimitry Andric Twine("\"") + Twine(*getTargetID()) + Twine("\""));
312e8d8bef9SDimitry Andric for (auto F : getAllPossibleTargetIDFeatures(getTriple(), CanonName)) {
313e8d8bef9SDimitry Andric auto Loc = OffloadArchFeatures.find(F);
314e8d8bef9SDimitry Andric if (Loc != OffloadArchFeatures.end()) {
315e8d8bef9SDimitry Andric std::string NewF = F.str();
316e8d8bef9SDimitry Andric std::replace(NewF.begin(), NewF.end(), '-', '_');
317e8d8bef9SDimitry Andric Builder.defineMacro(Twine("__amdgcn_feature_") + Twine(NewF) +
318e8d8bef9SDimitry Andric Twine("__"),
319e8d8bef9SDimitry Andric Loc->second ? "1" : "0");
320e8d8bef9SDimitry Andric }
321e8d8bef9SDimitry Andric }
322e8d8bef9SDimitry Andric }
3230b57cec5SDimitry Andric
32481ad6265SDimitry Andric if (AllowAMDGPUUnsafeFPAtomics)
32581ad6265SDimitry Andric Builder.defineMacro("__AMDGCN_UNSAFE_FP_ATOMICS__");
32681ad6265SDimitry Andric
3270b57cec5SDimitry Andric // TODO: __HAS_FMAF__, __HAS_LDEXPF__, __HAS_FP64__ are deprecated and will be
3280b57cec5SDimitry Andric // removed in the near future.
3290b57cec5SDimitry Andric if (hasFMAF())
3300b57cec5SDimitry Andric Builder.defineMacro("__HAS_FMAF__");
3310b57cec5SDimitry Andric if (hasFastFMAF())
3320b57cec5SDimitry Andric Builder.defineMacro("FP_FAST_FMAF");
3330b57cec5SDimitry Andric if (hasLDEXPF())
3340b57cec5SDimitry Andric Builder.defineMacro("__HAS_LDEXPF__");
3350b57cec5SDimitry Andric if (hasFP64())
3360b57cec5SDimitry Andric Builder.defineMacro("__HAS_FP64__");
3370b57cec5SDimitry Andric if (hasFastFMA())
3380b57cec5SDimitry Andric Builder.defineMacro("FP_FAST_FMA");
339e8d8bef9SDimitry Andric
34006c3fb27SDimitry Andric Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE__", Twine(WavefrontSize));
34106c3fb27SDimitry Andric // ToDo: deprecate this macro for naming consistency.
342e8d8bef9SDimitry Andric Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE", Twine(WavefrontSize));
34306c3fb27SDimitry Andric Builder.defineMacro("__AMDGCN_CUMODE__", Twine(CUMode));
3440b57cec5SDimitry Andric }
3450b57cec5SDimitry Andric
setAuxTarget(const TargetInfo * Aux)3460b57cec5SDimitry Andric void AMDGPUTargetInfo::setAuxTarget(const TargetInfo *Aux) {
3470b57cec5SDimitry Andric assert(HalfFormat == Aux->HalfFormat);
3480b57cec5SDimitry Andric assert(FloatFormat == Aux->FloatFormat);
3490b57cec5SDimitry Andric assert(DoubleFormat == Aux->DoubleFormat);
3500b57cec5SDimitry Andric
3510b57cec5SDimitry Andric // On x86_64 long double is 80-bit extended precision format, which is
3520b57cec5SDimitry Andric // not supported by AMDGPU. 128-bit floating point format is also not
3530b57cec5SDimitry Andric // supported by AMDGPU. Therefore keep its own format for these two types.
3540b57cec5SDimitry Andric auto SaveLongDoubleFormat = LongDoubleFormat;
3550b57cec5SDimitry Andric auto SaveFloat128Format = Float128Format;
35681ad6265SDimitry Andric auto SaveLongDoubleWidth = LongDoubleWidth;
35781ad6265SDimitry Andric auto SaveLongDoubleAlign = LongDoubleAlign;
3580b57cec5SDimitry Andric copyAuxTarget(Aux);
3590b57cec5SDimitry Andric LongDoubleFormat = SaveLongDoubleFormat;
3600b57cec5SDimitry Andric Float128Format = SaveFloat128Format;
36181ad6265SDimitry Andric LongDoubleWidth = SaveLongDoubleWidth;
36281ad6265SDimitry Andric LongDoubleAlign = SaveLongDoubleAlign;
3635ffd83dbSDimitry Andric // For certain builtin types support on the host target, claim they are
3645ffd83dbSDimitry Andric // support to pass the compilation of the host code during the device-side
3655ffd83dbSDimitry Andric // compilation.
3665ffd83dbSDimitry Andric // FIXME: As the side effect, we also accept `__float128` uses in the device
3675ffd83dbSDimitry Andric // code. To rejct these builtin types supported in the host target but not in
3685ffd83dbSDimitry Andric // the device target, one approach would support `device_builtin` attribute
3695ffd83dbSDimitry Andric // so that we could tell the device builtin types from the host ones. The
3705ffd83dbSDimitry Andric // also solves the different representations of the same builtin type, such
3715ffd83dbSDimitry Andric // as `size_t` in the MSVC environment.
3725ffd83dbSDimitry Andric if (Aux->hasFloat128Type()) {
3735ffd83dbSDimitry Andric HasFloat128 = true;
3745ffd83dbSDimitry Andric Float128Format = DoubleFormat;
3755ffd83dbSDimitry Andric }
3760b57cec5SDimitry Andric }
377