10b57cec5SDimitry Andric //===--- AMDGPU.cpp - Implement AMDGPU target feature support -------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric // 90b57cec5SDimitry Andric // This file implements AMDGPU TargetInfo objects. 100b57cec5SDimitry Andric // 110b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric #include "AMDGPU.h" 140b57cec5SDimitry Andric #include "clang/Basic/Builtins.h" 150b57cec5SDimitry Andric #include "clang/Basic/CodeGenOptions.h" 16bdd1243dSDimitry Andric #include "clang/Basic/Diagnostic.h" 170b57cec5SDimitry Andric #include "clang/Basic/LangOptions.h" 180b57cec5SDimitry Andric #include "clang/Basic/MacroBuilder.h" 190b57cec5SDimitry Andric #include "clang/Basic/TargetBuiltins.h" 200b57cec5SDimitry Andric using namespace clang; 210b57cec5SDimitry Andric using namespace clang::targets; 220b57cec5SDimitry Andric 230b57cec5SDimitry Andric namespace clang { 240b57cec5SDimitry Andric namespace targets { 250b57cec5SDimitry Andric 260b57cec5SDimitry Andric // If you edit the description strings, make sure you update 270b57cec5SDimitry Andric // getPointerWidthV(). 280b57cec5SDimitry Andric 290b57cec5SDimitry Andric static const char *const DataLayoutStringR600 = 300b57cec5SDimitry Andric "e-p:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128" 31e8d8bef9SDimitry Andric "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1"; 320b57cec5SDimitry Andric 330b57cec5SDimitry Andric static const char *const DataLayoutStringAMDGCN = 340b57cec5SDimitry Andric "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32" 35*5f757f3fSDimitry Andric "-p7:160:256:256:32-p8:128:128-p9:192:256:256:32-i64:64-v16:16-v24:32-v32:" 36*5f757f3fSDimitry Andric "32-v48:64-v96:128" 37e8d8bef9SDimitry Andric "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1" 38*5f757f3fSDimitry Andric "-ni:7:8:9"; 390b57cec5SDimitry Andric 400b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsGenMap = { 41*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // Default 42*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global 43*5f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // opencl_local 44*5f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant 45*5f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // opencl_private 46*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // opencl_generic 47*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_device 48*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_host 49*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // cuda_device 50*5f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant 51*5f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // cuda_shared 52*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // sycl_global 53*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // sycl_global_device 54*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // sycl_global_host 55*5f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // sycl_local 56*5f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // sycl_private 57*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_sptr 58*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_uptr 59*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr64 60*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // hlsl_groupshared 610b57cec5SDimitry Andric }; 620b57cec5SDimitry Andric 630b57cec5SDimitry Andric const LangASMap AMDGPUTargetInfo::AMDGPUDefIsPrivMap = { 64*5f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // Default 65*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global 66*5f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // opencl_local 67*5f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant 68*5f757f3fSDimitry Andric llvm::AMDGPUAS::PRIVATE_ADDRESS, // opencl_private 69*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // opencl_generic 70*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_device 71*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // opencl_global_host 72*5f757f3fSDimitry Andric llvm::AMDGPUAS::GLOBAL_ADDRESS, // cuda_device 73*5f757f3fSDimitry Andric llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant 74*5f757f3fSDimitry Andric llvm::AMDGPUAS::LOCAL_ADDRESS, // cuda_shared 75fe6060f1SDimitry Andric // SYCL address space values for this map are dummy 76*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global 77*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_device 78*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_global_host 79*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_local 80*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // sycl_private 81*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_sptr 82*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr32_uptr 83*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // ptr64 84*5f757f3fSDimitry Andric llvm::AMDGPUAS::FLAT_ADDRESS, // hlsl_groupshared 85480093f4SDimitry Andric 860b57cec5SDimitry Andric }; 870b57cec5SDimitry Andric } // namespace targets 880b57cec5SDimitry Andric } // namespace clang 890b57cec5SDimitry Andric 90bdd1243dSDimitry Andric static constexpr Builtin::Info BuiltinInfo[] = { 910b57cec5SDimitry Andric #define BUILTIN(ID, TYPE, ATTRS) \ 92bdd1243dSDimitry Andric {#ID, TYPE, ATTRS, nullptr, HeaderDesc::NO_HEADER, ALL_LANGUAGES}, 930b57cec5SDimitry Andric #define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE) \ 94bdd1243dSDimitry Andric {#ID, TYPE, ATTRS, FEATURE, HeaderDesc::NO_HEADER, ALL_LANGUAGES}, 950b57cec5SDimitry Andric #include "clang/Basic/BuiltinsAMDGPU.def" 960b57cec5SDimitry Andric }; 970b57cec5SDimitry Andric 980b57cec5SDimitry Andric const char *const AMDGPUTargetInfo::GCCRegNames[] = { 990b57cec5SDimitry Andric "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7", "v8", 1000b57cec5SDimitry Andric "v9", "v10", "v11", "v12", "v13", "v14", "v15", "v16", "v17", 1010b57cec5SDimitry Andric "v18", "v19", "v20", "v21", "v22", "v23", "v24", "v25", "v26", 1020b57cec5SDimitry Andric "v27", "v28", "v29", "v30", "v31", "v32", "v33", "v34", "v35", 1030b57cec5SDimitry Andric "v36", "v37", "v38", "v39", "v40", "v41", "v42", "v43", "v44", 1040b57cec5SDimitry Andric "v45", "v46", "v47", "v48", "v49", "v50", "v51", "v52", "v53", 1050b57cec5SDimitry Andric "v54", "v55", "v56", "v57", "v58", "v59", "v60", "v61", "v62", 1060b57cec5SDimitry Andric "v63", "v64", "v65", "v66", "v67", "v68", "v69", "v70", "v71", 1070b57cec5SDimitry Andric "v72", "v73", "v74", "v75", "v76", "v77", "v78", "v79", "v80", 1080b57cec5SDimitry Andric "v81", "v82", "v83", "v84", "v85", "v86", "v87", "v88", "v89", 1090b57cec5SDimitry Andric "v90", "v91", "v92", "v93", "v94", "v95", "v96", "v97", "v98", 1100b57cec5SDimitry Andric "v99", "v100", "v101", "v102", "v103", "v104", "v105", "v106", "v107", 1110b57cec5SDimitry Andric "v108", "v109", "v110", "v111", "v112", "v113", "v114", "v115", "v116", 1120b57cec5SDimitry Andric "v117", "v118", "v119", "v120", "v121", "v122", "v123", "v124", "v125", 1130b57cec5SDimitry Andric "v126", "v127", "v128", "v129", "v130", "v131", "v132", "v133", "v134", 1140b57cec5SDimitry Andric "v135", "v136", "v137", "v138", "v139", "v140", "v141", "v142", "v143", 1150b57cec5SDimitry Andric "v144", "v145", "v146", "v147", "v148", "v149", "v150", "v151", "v152", 1160b57cec5SDimitry Andric "v153", "v154", "v155", "v156", "v157", "v158", "v159", "v160", "v161", 1170b57cec5SDimitry Andric "v162", "v163", "v164", "v165", "v166", "v167", "v168", "v169", "v170", 1180b57cec5SDimitry Andric "v171", "v172", "v173", "v174", "v175", "v176", "v177", "v178", "v179", 1190b57cec5SDimitry Andric "v180", "v181", "v182", "v183", "v184", "v185", "v186", "v187", "v188", 1200b57cec5SDimitry Andric "v189", "v190", "v191", "v192", "v193", "v194", "v195", "v196", "v197", 1210b57cec5SDimitry Andric "v198", "v199", "v200", "v201", "v202", "v203", "v204", "v205", "v206", 1220b57cec5SDimitry Andric "v207", "v208", "v209", "v210", "v211", "v212", "v213", "v214", "v215", 1230b57cec5SDimitry Andric "v216", "v217", "v218", "v219", "v220", "v221", "v222", "v223", "v224", 1240b57cec5SDimitry Andric "v225", "v226", "v227", "v228", "v229", "v230", "v231", "v232", "v233", 1250b57cec5SDimitry Andric "v234", "v235", "v236", "v237", "v238", "v239", "v240", "v241", "v242", 1260b57cec5SDimitry Andric "v243", "v244", "v245", "v246", "v247", "v248", "v249", "v250", "v251", 1270b57cec5SDimitry Andric "v252", "v253", "v254", "v255", "s0", "s1", "s2", "s3", "s4", 1280b57cec5SDimitry Andric "s5", "s6", "s7", "s8", "s9", "s10", "s11", "s12", "s13", 1290b57cec5SDimitry Andric "s14", "s15", "s16", "s17", "s18", "s19", "s20", "s21", "s22", 1300b57cec5SDimitry Andric "s23", "s24", "s25", "s26", "s27", "s28", "s29", "s30", "s31", 1310b57cec5SDimitry Andric "s32", "s33", "s34", "s35", "s36", "s37", "s38", "s39", "s40", 1320b57cec5SDimitry Andric "s41", "s42", "s43", "s44", "s45", "s46", "s47", "s48", "s49", 1330b57cec5SDimitry Andric "s50", "s51", "s52", "s53", "s54", "s55", "s56", "s57", "s58", 1340b57cec5SDimitry Andric "s59", "s60", "s61", "s62", "s63", "s64", "s65", "s66", "s67", 1350b57cec5SDimitry Andric "s68", "s69", "s70", "s71", "s72", "s73", "s74", "s75", "s76", 1360b57cec5SDimitry Andric "s77", "s78", "s79", "s80", "s81", "s82", "s83", "s84", "s85", 1370b57cec5SDimitry Andric "s86", "s87", "s88", "s89", "s90", "s91", "s92", "s93", "s94", 1380b57cec5SDimitry Andric "s95", "s96", "s97", "s98", "s99", "s100", "s101", "s102", "s103", 1390b57cec5SDimitry Andric "s104", "s105", "s106", "s107", "s108", "s109", "s110", "s111", "s112", 1400b57cec5SDimitry Andric "s113", "s114", "s115", "s116", "s117", "s118", "s119", "s120", "s121", 1410b57cec5SDimitry Andric "s122", "s123", "s124", "s125", "s126", "s127", "exec", "vcc", "scc", 1420b57cec5SDimitry Andric "m0", "flat_scratch", "exec_lo", "exec_hi", "vcc_lo", "vcc_hi", 1435ffd83dbSDimitry Andric "flat_scratch_lo", "flat_scratch_hi", 1445ffd83dbSDimitry Andric "a0", "a1", "a2", "a3", "a4", "a5", "a6", "a7", "a8", 1455ffd83dbSDimitry Andric "a9", "a10", "a11", "a12", "a13", "a14", "a15", "a16", "a17", 1465ffd83dbSDimitry Andric "a18", "a19", "a20", "a21", "a22", "a23", "a24", "a25", "a26", 1475ffd83dbSDimitry Andric "a27", "a28", "a29", "a30", "a31", "a32", "a33", "a34", "a35", 1485ffd83dbSDimitry Andric "a36", "a37", "a38", "a39", "a40", "a41", "a42", "a43", "a44", 1495ffd83dbSDimitry Andric "a45", "a46", "a47", "a48", "a49", "a50", "a51", "a52", "a53", 1505ffd83dbSDimitry Andric "a54", "a55", "a56", "a57", "a58", "a59", "a60", "a61", "a62", 1515ffd83dbSDimitry Andric "a63", "a64", "a65", "a66", "a67", "a68", "a69", "a70", "a71", 1525ffd83dbSDimitry Andric "a72", "a73", "a74", "a75", "a76", "a77", "a78", "a79", "a80", 1535ffd83dbSDimitry Andric "a81", "a82", "a83", "a84", "a85", "a86", "a87", "a88", "a89", 1545ffd83dbSDimitry Andric "a90", "a91", "a92", "a93", "a94", "a95", "a96", "a97", "a98", 1555ffd83dbSDimitry Andric "a99", "a100", "a101", "a102", "a103", "a104", "a105", "a106", "a107", 1565ffd83dbSDimitry Andric "a108", "a109", "a110", "a111", "a112", "a113", "a114", "a115", "a116", 1575ffd83dbSDimitry Andric "a117", "a118", "a119", "a120", "a121", "a122", "a123", "a124", "a125", 1585ffd83dbSDimitry Andric "a126", "a127", "a128", "a129", "a130", "a131", "a132", "a133", "a134", 1595ffd83dbSDimitry Andric "a135", "a136", "a137", "a138", "a139", "a140", "a141", "a142", "a143", 1605ffd83dbSDimitry Andric "a144", "a145", "a146", "a147", "a148", "a149", "a150", "a151", "a152", 1615ffd83dbSDimitry Andric "a153", "a154", "a155", "a156", "a157", "a158", "a159", "a160", "a161", 1625ffd83dbSDimitry Andric "a162", "a163", "a164", "a165", "a166", "a167", "a168", "a169", "a170", 1635ffd83dbSDimitry Andric "a171", "a172", "a173", "a174", "a175", "a176", "a177", "a178", "a179", 1645ffd83dbSDimitry Andric "a180", "a181", "a182", "a183", "a184", "a185", "a186", "a187", "a188", 1655ffd83dbSDimitry Andric "a189", "a190", "a191", "a192", "a193", "a194", "a195", "a196", "a197", 1665ffd83dbSDimitry Andric "a198", "a199", "a200", "a201", "a202", "a203", "a204", "a205", "a206", 1675ffd83dbSDimitry Andric "a207", "a208", "a209", "a210", "a211", "a212", "a213", "a214", "a215", 1685ffd83dbSDimitry Andric "a216", "a217", "a218", "a219", "a220", "a221", "a222", "a223", "a224", 1695ffd83dbSDimitry Andric "a225", "a226", "a227", "a228", "a229", "a230", "a231", "a232", "a233", 1705ffd83dbSDimitry Andric "a234", "a235", "a236", "a237", "a238", "a239", "a240", "a241", "a242", 1715ffd83dbSDimitry Andric "a243", "a244", "a245", "a246", "a247", "a248", "a249", "a250", "a251", 1725ffd83dbSDimitry Andric "a252", "a253", "a254", "a255" 1730b57cec5SDimitry Andric }; 1740b57cec5SDimitry Andric 1750b57cec5SDimitry Andric ArrayRef<const char *> AMDGPUTargetInfo::getGCCRegNames() const { 176bdd1243dSDimitry Andric return llvm::ArrayRef(GCCRegNames); 1770b57cec5SDimitry Andric } 1780b57cec5SDimitry Andric 1790b57cec5SDimitry Andric bool AMDGPUTargetInfo::initFeatureMap( 1800b57cec5SDimitry Andric llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags, StringRef CPU, 1810b57cec5SDimitry Andric const std::vector<std::string> &FeatureVec) const { 1820b57cec5SDimitry Andric 1830b57cec5SDimitry Andric using namespace llvm::AMDGPU; 18406c3fb27SDimitry Andric fillAMDGPUFeatureMap(CPU, getTriple(), Features); 185bdd1243dSDimitry Andric if (!TargetInfo::initFeatureMap(Features, Diags, CPU, FeatureVec)) 186bdd1243dSDimitry Andric return false; 187bdd1243dSDimitry Andric 188bdd1243dSDimitry Andric // TODO: Should move this logic into TargetParser 18906c3fb27SDimitry Andric std::string ErrorMsg; 19006c3fb27SDimitry Andric if (!insertWaveSizeFeature(CPU, getTriple(), Features, ErrorMsg)) { 19106c3fb27SDimitry Andric Diags.Report(diag::err_invalid_feature_combination) << ErrorMsg; 192bdd1243dSDimitry Andric return false; 193bdd1243dSDimitry Andric } 194bdd1243dSDimitry Andric 195bdd1243dSDimitry Andric return true; 1960b57cec5SDimitry Andric } 1970b57cec5SDimitry Andric 1980b57cec5SDimitry Andric void AMDGPUTargetInfo::fillValidCPUList( 1990b57cec5SDimitry Andric SmallVectorImpl<StringRef> &Values) const { 2000b57cec5SDimitry Andric if (isAMDGCN(getTriple())) 2010b57cec5SDimitry Andric llvm::AMDGPU::fillValidArchListAMDGCN(Values); 2020b57cec5SDimitry Andric else 2030b57cec5SDimitry Andric llvm::AMDGPU::fillValidArchListR600(Values); 2040b57cec5SDimitry Andric } 2050b57cec5SDimitry Andric 2060b57cec5SDimitry Andric void AMDGPUTargetInfo::setAddressSpaceMap(bool DefaultIsPrivate) { 2070b57cec5SDimitry Andric AddrSpaceMap = DefaultIsPrivate ? &AMDGPUDefIsPrivMap : &AMDGPUDefIsGenMap; 2080b57cec5SDimitry Andric } 2090b57cec5SDimitry Andric 2100b57cec5SDimitry Andric AMDGPUTargetInfo::AMDGPUTargetInfo(const llvm::Triple &Triple, 2110b57cec5SDimitry Andric const TargetOptions &Opts) 2120b57cec5SDimitry Andric : TargetInfo(Triple), 2130b57cec5SDimitry Andric GPUKind(isAMDGCN(Triple) ? 2140b57cec5SDimitry Andric llvm::AMDGPU::parseArchAMDGCN(Opts.CPU) : 2150b57cec5SDimitry Andric llvm::AMDGPU::parseArchR600(Opts.CPU)), 2160b57cec5SDimitry Andric GPUFeatures(isAMDGCN(Triple) ? 2170b57cec5SDimitry Andric llvm::AMDGPU::getArchAttrAMDGCN(GPUKind) : 2180b57cec5SDimitry Andric llvm::AMDGPU::getArchAttrR600(GPUKind)) { 2190b57cec5SDimitry Andric resetDataLayout(isAMDGCN(getTriple()) ? DataLayoutStringAMDGCN 2200b57cec5SDimitry Andric : DataLayoutStringR600); 2210b57cec5SDimitry Andric 2220b57cec5SDimitry Andric setAddressSpaceMap(Triple.getOS() == llvm::Triple::Mesa3D || 2230b57cec5SDimitry Andric !isAMDGCN(Triple)); 2240b57cec5SDimitry Andric UseAddrSpaceMapMangling = true; 2250b57cec5SDimitry Andric 226bdd1243dSDimitry Andric if (isAMDGCN(Triple)) { 227bdd1243dSDimitry Andric // __bf16 is always available as a load/store only type on AMDGCN. 228bdd1243dSDimitry Andric BFloat16Width = BFloat16Align = 16; 229bdd1243dSDimitry Andric BFloat16Format = &llvm::APFloat::BFloat(); 230bdd1243dSDimitry Andric } 231bdd1243dSDimitry Andric 2320b57cec5SDimitry Andric HasLegalHalfType = true; 2330b57cec5SDimitry Andric HasFloat16 = true; 234e8d8bef9SDimitry Andric WavefrontSize = GPUFeatures & llvm::AMDGPU::FEATURE_WAVE32 ? 32 : 64; 235e8d8bef9SDimitry Andric AllowAMDGPUUnsafeFPAtomics = Opts.AllowAMDGPUUnsafeFPAtomics; 2360b57cec5SDimitry Andric 237bdd1243dSDimitry Andric // Set pointer width and alignment for the generic address space. 238bdd1243dSDimitry Andric PointerWidth = PointerAlign = getPointerWidthV(LangAS::Default); 2390b57cec5SDimitry Andric if (getMaxPointerWidth() == 64) { 2400b57cec5SDimitry Andric LongWidth = LongAlign = 64; 2410b57cec5SDimitry Andric SizeType = UnsignedLong; 2420b57cec5SDimitry Andric PtrDiffType = SignedLong; 2430b57cec5SDimitry Andric IntPtrType = SignedLong; 2440b57cec5SDimitry Andric } 2450b57cec5SDimitry Andric 2460b57cec5SDimitry Andric MaxAtomicPromoteWidth = MaxAtomicInlineWidth = 64; 24706c3fb27SDimitry Andric CUMode = !(GPUFeatures & llvm::AMDGPU::FEATURE_WGP); 248*5f757f3fSDimitry Andric for (auto F : {"image-insts", "gws"}) 249*5f757f3fSDimitry Andric ReadOnlyFeatures.insert(F); 250*5f757f3fSDimitry Andric HalfArgsAndReturns = true; 2510b57cec5SDimitry Andric } 2520b57cec5SDimitry Andric 253fe6060f1SDimitry Andric void AMDGPUTargetInfo::adjust(DiagnosticsEngine &Diags, LangOptions &Opts) { 254fe6060f1SDimitry Andric TargetInfo::adjust(Diags, Opts); 2550b57cec5SDimitry Andric // ToDo: There are still a few places using default address space as private 2560b57cec5SDimitry Andric // address space in OpenCL, which needs to be cleaned up, then Opts.OpenCL 2570b57cec5SDimitry Andric // can be removed from the following line. 2580b57cec5SDimitry Andric setAddressSpaceMap(/*DefaultIsPrivate=*/Opts.OpenCL || 2590b57cec5SDimitry Andric !isAMDGCN(getTriple())); 2600b57cec5SDimitry Andric } 2610b57cec5SDimitry Andric 2620b57cec5SDimitry Andric ArrayRef<Builtin::Info> AMDGPUTargetInfo::getTargetBuiltins() const { 263bdd1243dSDimitry Andric return llvm::ArrayRef(BuiltinInfo, 264bdd1243dSDimitry Andric clang::AMDGPU::LastTSBuiltin - Builtin::FirstTSBuiltin); 2650b57cec5SDimitry Andric } 2660b57cec5SDimitry Andric 2670b57cec5SDimitry Andric void AMDGPUTargetInfo::getTargetDefines(const LangOptions &Opts, 2680b57cec5SDimitry Andric MacroBuilder &Builder) const { 2690b57cec5SDimitry Andric Builder.defineMacro("__AMD__"); 2700b57cec5SDimitry Andric Builder.defineMacro("__AMDGPU__"); 2710b57cec5SDimitry Andric 2720b57cec5SDimitry Andric if (isAMDGCN(getTriple())) 2730b57cec5SDimitry Andric Builder.defineMacro("__AMDGCN__"); 2740b57cec5SDimitry Andric else 2750b57cec5SDimitry Andric Builder.defineMacro("__R600__"); 2760b57cec5SDimitry Andric 2770b57cec5SDimitry Andric if (GPUKind != llvm::AMDGPU::GK_NONE) { 2780b57cec5SDimitry Andric StringRef CanonName = isAMDGCN(getTriple()) ? 2790b57cec5SDimitry Andric getArchNameAMDGCN(GPUKind) : getArchNameR600(GPUKind); 2800b57cec5SDimitry Andric Builder.defineMacro(Twine("__") + Twine(CanonName) + Twine("__")); 28181ad6265SDimitry Andric // Emit macros for gfx family e.g. gfx906 -> __GFX9__, gfx1030 -> __GFX10___ 28281ad6265SDimitry Andric if (isAMDGCN(getTriple())) { 283*5f757f3fSDimitry Andric assert(CanonName.starts_with("gfx") && "Invalid amdgcn canonical name"); 28481ad6265SDimitry Andric Builder.defineMacro(Twine("__") + Twine(CanonName.drop_back(2).upper()) + 28581ad6265SDimitry Andric Twine("__")); 28681ad6265SDimitry Andric } 287e8d8bef9SDimitry Andric if (isAMDGCN(getTriple())) { 288e8d8bef9SDimitry Andric Builder.defineMacro("__amdgcn_processor__", 289e8d8bef9SDimitry Andric Twine("\"") + Twine(CanonName) + Twine("\"")); 290e8d8bef9SDimitry Andric Builder.defineMacro("__amdgcn_target_id__", 29181ad6265SDimitry Andric Twine("\"") + Twine(*getTargetID()) + Twine("\"")); 292e8d8bef9SDimitry Andric for (auto F : getAllPossibleTargetIDFeatures(getTriple(), CanonName)) { 293e8d8bef9SDimitry Andric auto Loc = OffloadArchFeatures.find(F); 294e8d8bef9SDimitry Andric if (Loc != OffloadArchFeatures.end()) { 295e8d8bef9SDimitry Andric std::string NewF = F.str(); 296e8d8bef9SDimitry Andric std::replace(NewF.begin(), NewF.end(), '-', '_'); 297e8d8bef9SDimitry Andric Builder.defineMacro(Twine("__amdgcn_feature_") + Twine(NewF) + 298e8d8bef9SDimitry Andric Twine("__"), 299e8d8bef9SDimitry Andric Loc->second ? "1" : "0"); 300e8d8bef9SDimitry Andric } 301e8d8bef9SDimitry Andric } 302e8d8bef9SDimitry Andric } 3030b57cec5SDimitry Andric } 3040b57cec5SDimitry Andric 30581ad6265SDimitry Andric if (AllowAMDGPUUnsafeFPAtomics) 30681ad6265SDimitry Andric Builder.defineMacro("__AMDGCN_UNSAFE_FP_ATOMICS__"); 30781ad6265SDimitry Andric 3080b57cec5SDimitry Andric // TODO: __HAS_FMAF__, __HAS_LDEXPF__, __HAS_FP64__ are deprecated and will be 3090b57cec5SDimitry Andric // removed in the near future. 3100b57cec5SDimitry Andric if (hasFMAF()) 3110b57cec5SDimitry Andric Builder.defineMacro("__HAS_FMAF__"); 3120b57cec5SDimitry Andric if (hasFastFMAF()) 3130b57cec5SDimitry Andric Builder.defineMacro("FP_FAST_FMAF"); 3140b57cec5SDimitry Andric if (hasLDEXPF()) 3150b57cec5SDimitry Andric Builder.defineMacro("__HAS_LDEXPF__"); 3160b57cec5SDimitry Andric if (hasFP64()) 3170b57cec5SDimitry Andric Builder.defineMacro("__HAS_FP64__"); 3180b57cec5SDimitry Andric if (hasFastFMA()) 3190b57cec5SDimitry Andric Builder.defineMacro("FP_FAST_FMA"); 320e8d8bef9SDimitry Andric 32106c3fb27SDimitry Andric Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE__", Twine(WavefrontSize)); 32206c3fb27SDimitry Andric // ToDo: deprecate this macro for naming consistency. 323e8d8bef9SDimitry Andric Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE", Twine(WavefrontSize)); 32406c3fb27SDimitry Andric Builder.defineMacro("__AMDGCN_CUMODE__", Twine(CUMode)); 3250b57cec5SDimitry Andric } 3260b57cec5SDimitry Andric 3270b57cec5SDimitry Andric void AMDGPUTargetInfo::setAuxTarget(const TargetInfo *Aux) { 3280b57cec5SDimitry Andric assert(HalfFormat == Aux->HalfFormat); 3290b57cec5SDimitry Andric assert(FloatFormat == Aux->FloatFormat); 3300b57cec5SDimitry Andric assert(DoubleFormat == Aux->DoubleFormat); 3310b57cec5SDimitry Andric 3320b57cec5SDimitry Andric // On x86_64 long double is 80-bit extended precision format, which is 3330b57cec5SDimitry Andric // not supported by AMDGPU. 128-bit floating point format is also not 3340b57cec5SDimitry Andric // supported by AMDGPU. Therefore keep its own format for these two types. 3350b57cec5SDimitry Andric auto SaveLongDoubleFormat = LongDoubleFormat; 3360b57cec5SDimitry Andric auto SaveFloat128Format = Float128Format; 33781ad6265SDimitry Andric auto SaveLongDoubleWidth = LongDoubleWidth; 33881ad6265SDimitry Andric auto SaveLongDoubleAlign = LongDoubleAlign; 3390b57cec5SDimitry Andric copyAuxTarget(Aux); 3400b57cec5SDimitry Andric LongDoubleFormat = SaveLongDoubleFormat; 3410b57cec5SDimitry Andric Float128Format = SaveFloat128Format; 34281ad6265SDimitry Andric LongDoubleWidth = SaveLongDoubleWidth; 34381ad6265SDimitry Andric LongDoubleAlign = SaveLongDoubleAlign; 3445ffd83dbSDimitry Andric // For certain builtin types support on the host target, claim they are 3455ffd83dbSDimitry Andric // support to pass the compilation of the host code during the device-side 3465ffd83dbSDimitry Andric // compilation. 3475ffd83dbSDimitry Andric // FIXME: As the side effect, we also accept `__float128` uses in the device 3485ffd83dbSDimitry Andric // code. To rejct these builtin types supported in the host target but not in 3495ffd83dbSDimitry Andric // the device target, one approach would support `device_builtin` attribute 3505ffd83dbSDimitry Andric // so that we could tell the device builtin types from the host ones. The 3515ffd83dbSDimitry Andric // also solves the different representations of the same builtin type, such 3525ffd83dbSDimitry Andric // as `size_t` in the MSVC environment. 3535ffd83dbSDimitry Andric if (Aux->hasFloat128Type()) { 3545ffd83dbSDimitry Andric HasFloat128 = true; 3555ffd83dbSDimitry Andric Float128Format = DoubleFormat; 3565ffd83dbSDimitry Andric } 3570b57cec5SDimitry Andric } 358