10b57cec5SDimitry Andric //===--- AMDGPU.cpp - Implement AMDGPU target feature support -------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric // 90b57cec5SDimitry Andric // This file implements AMDGPU TargetInfo objects. 100b57cec5SDimitry Andric // 110b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric #include "AMDGPU.h" 140b57cec5SDimitry Andric #include "clang/Basic/Builtins.h" 150b57cec5SDimitry Andric #include "clang/Basic/CodeGenOptions.h" 16bdd1243dSDimitry Andric #include "clang/Basic/Diagnostic.h" 170b57cec5SDimitry Andric #include "clang/Basic/LangOptions.h" 180b57cec5SDimitry Andric #include "clang/Basic/MacroBuilder.h" 190b57cec5SDimitry Andric #include "clang/Basic/TargetBuiltins.h" 20*0fca6ea1SDimitry Andric #include "llvm/ADT/SmallString.h" 210b57cec5SDimitry Andric using namespace clang; 220b57cec5SDimitry Andric using namespace clang::targets; 230b57cec5SDimitry Andric 240b57cec5SDimitry Andric namespace clang { 250b57cec5SDimitry Andric namespace targets { 260b57cec5SDimitry Andric 270b57cec5SDimitry Andric // If you edit the description strings, make sure you update 280b57cec5SDimitry Andric // getPointerWidthV(). 

// LLVM data layout description used when the target triple is not amdgcn
// (see the AMDGPUTargetInfo constructor, which selects between the two
// strings). The string is assembled from adjacent literals; the pieces are
// concatenated by the compiler with no separator.
static const char *const DataLayoutStringR600 =
    "e-p:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128"
    "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1";

// LLVM data layout description used when the target triple is amdgcn.
// Compared with the R600 string it additionally carries per-address-space
// pointer entries (p1 .. p9) and a trailing "-ni:7:8:9" component.
// NOTE(review): per the LLVM DataLayout syntax "ni" lists non-integral
// address spaces -- confirm against the LLVM LangRef before editing.
static const char *const DataLayoutStringAMDGCN =
    "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32"
    "-p7:160:256:256:32-p8:128:128-p9:192:256:256:32-i64:64-v16:16-v24:32-v32:"
    "32-v48:64-v96:128"
    "-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1"
    "-ni:7:8:9";

// Language-address-space -> AMDGPU target-address-space table installed by
// setAddressSpaceMap(/*DefaultIsPrivate=*/false). The table is positional:
// each initializer is tagged with the language address space it stands for,
// and the untagged Default entry maps to FLAT_ADDRESS.
// NOTE(review): the entry order presumably has to match clang's LangAS
// enumeration -- confirm before inserting or reordering entries.
const LangASMap AMDGPUTargetInfo::AMDGPUDefIsGenMap = {
    llvm::AMDGPUAS::FLAT_ADDRESS,     // Default
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global
    llvm::AMDGPUAS::LOCAL_ADDRESS,    // opencl_local
    llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
    llvm::AMDGPUAS::PRIVATE_ADDRESS,  // opencl_private
    llvm::AMDGPUAS::FLAT_ADDRESS,     // opencl_generic
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_device
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_host
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // cuda_device
    llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
    llvm::AMDGPUAS::LOCAL_ADDRESS,    // cuda_shared
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global_device
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // sycl_global_host
    llvm::AMDGPUAS::LOCAL_ADDRESS,    // sycl_local
    llvm::AMDGPUAS::PRIVATE_ADDRESS,  // sycl_private
    llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_sptr
    llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_uptr
    llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr64
    llvm::AMDGPUAS::FLAT_ADDRESS,     // hlsl_groupshared
};

// Counterpart of AMDGPUDefIsGenMap installed by
// setAddressSpaceMap(/*DefaultIsPrivate=*/true): identical layout, but the
// Default entry maps to PRIVATE_ADDRESS and the SYCL entries are placeholders
// (all FLAT_ADDRESS).
const LangASMap AMDGPUTargetInfo::AMDGPUDefIsPrivMap = {
    llvm::AMDGPUAS::PRIVATE_ADDRESS,  // Default
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global
    llvm::AMDGPUAS::LOCAL_ADDRESS,    // opencl_local
    llvm::AMDGPUAS::CONSTANT_ADDRESS, // opencl_constant
    llvm::AMDGPUAS::PRIVATE_ADDRESS,  // opencl_private
    llvm::AMDGPUAS::FLAT_ADDRESS,     // opencl_generic
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_device
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // opencl_global_host
    llvm::AMDGPUAS::GLOBAL_ADDRESS,   // cuda_device
    llvm::AMDGPUAS::CONSTANT_ADDRESS, // cuda_constant
    llvm::AMDGPUAS::LOCAL_ADDRESS,    // cuda_shared
    // SYCL address space values for this map are dummy
    llvm::AMDGPUAS::FLAT_ADDRESS,     // sycl_global
    llvm::AMDGPUAS::FLAT_ADDRESS,     // sycl_global_device
    llvm::AMDGPUAS::FLAT_ADDRESS,     // sycl_global_host
    llvm::AMDGPUAS::FLAT_ADDRESS,     // sycl_local
    llvm::AMDGPUAS::FLAT_ADDRESS,     // sycl_private
    llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_sptr
    llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr32_uptr
    llvm::AMDGPUAS::FLAT_ADDRESS,     // ptr64
    llvm::AMDGPUAS::FLAT_ADDRESS,     // hlsl_groupshared

};
} // namespace targets
} // namespace clang

// Table of AMDGPU builtins, generated by expanding every BUILTIN /
// TARGET_BUILTIN entry of BuiltinsAMDGPU.def into a Builtin::Info initializer.
// BUILTIN entries get a null feature string; TARGET_BUILTIN entries carry the
// FEATURE argument from the .def file. All entries use
// HeaderDesc::NO_HEADER and ALL_LANGUAGES. Exposed through
// AMDGPUTargetInfo::getTargetBuiltins().
static constexpr Builtin::Info BuiltinInfo[] = {
#define BUILTIN(ID, TYPE, ATTRS)                                               \
  {#ID, TYPE, ATTRS, nullptr, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
#define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE)                               \
  {#ID, TYPE, ATTRS, FEATURE, HeaderDesc::NO_HEADER, ALL_LANGUAGES},
#include "clang/Basic/BuiltinsAMDGPU.def"
};

// Register names returned by getGCCRegNames(). The table lists, in order:
//   v0 .. v255,
//   s0 .. s127,
//   exec, vcc, scc, m0, flat_scratch and the *_lo / *_hi halves of exec, vcc
//   and flat_scratch,
//   a0 .. a255.
// NOTE(review): presumably these are the names accepted in inline-asm
// register constraints/clobbers -- confirm against the TargetInfo contract.
const char *const AMDGPUTargetInfo::GCCRegNames[] = {
  "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7", "v8",
  "v9", "v10", "v11", "v12", "v13", "v14", "v15", "v16", "v17",
  "v18", "v19", "v20", "v21", "v22", "v23", "v24", "v25", "v26",
  "v27", "v28", "v29", "v30", "v31", "v32", "v33", "v34", "v35",
  "v36", "v37", "v38", "v39", "v40", "v41", "v42", "v43", "v44",
  "v45", "v46", "v47", "v48", "v49", "v50", "v51", "v52", "v53",
  "v54", "v55", "v56", "v57", "v58", "v59", "v60", "v61", "v62",
  "v63", "v64", "v65", "v66", "v67", "v68", "v69", "v70", "v71",
  "v72", "v73", "v74", "v75", "v76", "v77", "v78", "v79", "v80",
  "v81", "v82", "v83", "v84", "v85", "v86", "v87", "v88", "v89",
  "v90", "v91", "v92", "v93", "v94", "v95", "v96", "v97", "v98",
  "v99", "v100", "v101", "v102", "v103", "v104", "v105", "v106", "v107",
  "v108", "v109", "v110", "v111", "v112", "v113", "v114", "v115", "v116",
  "v117", "v118", "v119", "v120", "v121", "v122", "v123", "v124", "v125",
  "v126", "v127", "v128", "v129", "v130", "v131", "v132", "v133", "v134",
  "v135", "v136", "v137", "v138", "v139", "v140", "v141", "v142", "v143",
  "v144", "v145", "v146", "v147", "v148", "v149", "v150", "v151", "v152",
  "v153", "v154", "v155", "v156", "v157", "v158", "v159", "v160", "v161",
  "v162", "v163", "v164", "v165", "v166", "v167", "v168", "v169", "v170",
  "v171", "v172", "v173", "v174", "v175", "v176", "v177", "v178", "v179",
  "v180", "v181", "v182", "v183", "v184", "v185", "v186", "v187", "v188",
  "v189", "v190", "v191", "v192", "v193", "v194", "v195", "v196", "v197",
  "v198", "v199", "v200", "v201", "v202", "v203", "v204", "v205", "v206",
  "v207", "v208", "v209", "v210", "v211", "v212", "v213", "v214", "v215",
  "v216", "v217", "v218", "v219", "v220", "v221", "v222", "v223", "v224",
  "v225", "v226", "v227", "v228", "v229", "v230", "v231", "v232", "v233",
  "v234", "v235", "v236", "v237", "v238", "v239", "v240", "v241", "v242",
  "v243", "v244", "v245", "v246", "v247", "v248", "v249", "v250", "v251",
  "v252", "v253", "v254", "v255", "s0", "s1", "s2", "s3", "s4",
  "s5", "s6", "s7", "s8", "s9", "s10", "s11", "s12", "s13",
  "s14", "s15", "s16", "s17", "s18", "s19", "s20", "s21", "s22",
  "s23", "s24", "s25", "s26", "s27", "s28", "s29", "s30", "s31",
  "s32", "s33", "s34", "s35", "s36", "s37", "s38", "s39", "s40",
  "s41", "s42", "s43", "s44", "s45", "s46", "s47", "s48", "s49",
  "s50", "s51", "s52", "s53", "s54", "s55", "s56", "s57", "s58",
  "s59", "s60", "s61", "s62", "s63", "s64", "s65", "s66", "s67",
  "s68", "s69", "s70", "s71", "s72", "s73", "s74", "s75", "s76",
  "s77", "s78", "s79", "s80", "s81", "s82", "s83", "s84", "s85",
  "s86", "s87", "s88", "s89", "s90", "s91", "s92", "s93", "s94",
  "s95", "s96", "s97", "s98", "s99", "s100", "s101", "s102", "s103",
  "s104", "s105", "s106", "s107", "s108", "s109", "s110", "s111", "s112",
  "s113", "s114", "s115", "s116", "s117", "s118", "s119", "s120", "s121",
  "s122", "s123", "s124", "s125", "s126", "s127", "exec", "vcc", "scc",
  "m0", "flat_scratch", "exec_lo", "exec_hi", "vcc_lo", "vcc_hi",
  "flat_scratch_lo", "flat_scratch_hi",
  "a0", "a1", "a2", "a3", "a4", "a5", "a6", "a7", "a8",
  "a9", "a10", "a11", "a12", "a13", "a14", "a15", "a16", "a17",
  "a18", "a19", "a20", "a21", "a22", "a23", "a24", "a25", "a26",
  "a27", "a28", "a29", "a30", "a31", "a32", "a33", "a34", "a35",
  "a36", "a37", "a38", "a39", "a40", "a41", "a42", "a43", "a44",
  "a45", "a46", "a47", "a48", "a49", "a50", "a51", "a52", "a53",
  "a54", "a55", "a56", "a57", "a58", "a59", "a60", "a61", "a62",
  "a63", "a64", "a65", "a66", "a67", "a68", "a69", "a70", "a71",
  "a72", "a73", "a74", "a75", "a76", "a77", "a78", "a79", "a80",
  "a81", "a82", "a83", "a84", "a85", "a86", "a87", "a88", "a89",
  "a90", "a91", "a92", "a93", "a94", "a95", "a96", "a97", "a98",
  "a99", "a100", "a101", "a102", "a103", "a104", "a105", "a106", "a107",
  "a108", "a109", "a110", "a111", "a112", "a113", "a114", "a115", "a116",
  "a117", "a118", "a119", "a120", "a121", "a122", "a123", "a124", "a125",
  "a126", "a127", "a128", "a129", "a130", "a131", "a132", "a133", "a134",
  "a135", "a136", "a137", "a138", "a139", "a140", "a141", "a142", "a143",
  "a144", "a145", "a146", "a147", "a148", "a149", "a150", "a151", "a152",
  "a153", "a154", "a155", "a156", "a157", "a158", "a159", "a160", "a161",
  "a162", "a163", "a164", "a165", "a166", "a167", "a168", "a169", "a170",
  "a171", "a172", "a173", "a174", "a175", "a176", "a177", "a178", "a179",
  "a180", "a181", "a182", "a183", "a184", "a185", "a186", "a187", "a188",
  "a189", "a190", "a191", "a192", "a193", "a194", "a195", "a196", "a197",
  "a198", "a199", "a200", "a201", "a202", "a203", "a204", "a205", "a206",
  "a207", "a208", "a209", "a210", "a211", "a212", "a213", "a214", "a215",
  "a216", "a217", "a218", "a219", "a220", "a221", "a222", "a223", "a224",
  "a225", "a226", "a227", "a228", "a229", "a230", "a231", "a232", "a233",
  "a234", "a235", "a236", "a237", "a238", "a239", "a240", "a241", "a242",
  "a243", "a244", "a245", "a246", "a247", "a248", "a249", "a250", "a251",
  "a252", "a253", "a254", "a255"
};

// Returns a non-owning view over the whole GCCRegNames table.
ArrayRef<const char *> AMDGPUTargetInfo::getGCCRegNames() const {
  return llvm::ArrayRef(GCCRegNames);
}
1790b57cec5SDimitry Andric 1800b57cec5SDimitry Andric bool AMDGPUTargetInfo::initFeatureMap( 1810b57cec5SDimitry Andric llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags, StringRef CPU, 1820b57cec5SDimitry Andric const std::vector<std::string> &FeatureVec) const { 1830b57cec5SDimitry Andric 1840b57cec5SDimitry Andric using namespace llvm::AMDGPU; 18506c3fb27SDimitry Andric fillAMDGPUFeatureMap(CPU, getTriple(), Features); 186bdd1243dSDimitry Andric if (!TargetInfo::initFeatureMap(Features, Diags, CPU, FeatureVec)) 187bdd1243dSDimitry Andric return false; 188bdd1243dSDimitry Andric 189bdd1243dSDimitry Andric // TODO: Should move this logic into TargetParser 190*0fca6ea1SDimitry Andric auto HasError = insertWaveSizeFeature(CPU, getTriple(), Features); 191*0fca6ea1SDimitry Andric switch (HasError.first) { 192*0fca6ea1SDimitry Andric default: 193*0fca6ea1SDimitry Andric break; 194*0fca6ea1SDimitry Andric case llvm::AMDGPU::INVALID_FEATURE_COMBINATION: 195*0fca6ea1SDimitry Andric Diags.Report(diag::err_invalid_feature_combination) << HasError.second; 196*0fca6ea1SDimitry Andric return false; 197*0fca6ea1SDimitry Andric case llvm::AMDGPU::UNSUPPORTED_TARGET_FEATURE: 198*0fca6ea1SDimitry Andric Diags.Report(diag::err_opt_not_valid_on_target) << HasError.second; 199bdd1243dSDimitry Andric return false; 200bdd1243dSDimitry Andric } 201bdd1243dSDimitry Andric 202bdd1243dSDimitry Andric return true; 2030b57cec5SDimitry Andric } 2040b57cec5SDimitry Andric 2050b57cec5SDimitry Andric void AMDGPUTargetInfo::fillValidCPUList( 2060b57cec5SDimitry Andric SmallVectorImpl<StringRef> &Values) const { 2070b57cec5SDimitry Andric if (isAMDGCN(getTriple())) 2080b57cec5SDimitry Andric llvm::AMDGPU::fillValidArchListAMDGCN(Values); 2090b57cec5SDimitry Andric else 2100b57cec5SDimitry Andric llvm::AMDGPU::fillValidArchListR600(Values); 2110b57cec5SDimitry Andric } 2120b57cec5SDimitry Andric 2130b57cec5SDimitry Andric void AMDGPUTargetInfo::setAddressSpaceMap(bool DefaultIsPrivate) { 
2140b57cec5SDimitry Andric AddrSpaceMap = DefaultIsPrivate ? &AMDGPUDefIsPrivMap : &AMDGPUDefIsGenMap; 2150b57cec5SDimitry Andric } 2160b57cec5SDimitry Andric 2170b57cec5SDimitry Andric AMDGPUTargetInfo::AMDGPUTargetInfo(const llvm::Triple &Triple, 2180b57cec5SDimitry Andric const TargetOptions &Opts) 2190b57cec5SDimitry Andric : TargetInfo(Triple), 2200b57cec5SDimitry Andric GPUKind(isAMDGCN(Triple) ? 2210b57cec5SDimitry Andric llvm::AMDGPU::parseArchAMDGCN(Opts.CPU) : 2220b57cec5SDimitry Andric llvm::AMDGPU::parseArchR600(Opts.CPU)), 2230b57cec5SDimitry Andric GPUFeatures(isAMDGCN(Triple) ? 2240b57cec5SDimitry Andric llvm::AMDGPU::getArchAttrAMDGCN(GPUKind) : 2250b57cec5SDimitry Andric llvm::AMDGPU::getArchAttrR600(GPUKind)) { 2260b57cec5SDimitry Andric resetDataLayout(isAMDGCN(getTriple()) ? DataLayoutStringAMDGCN 2270b57cec5SDimitry Andric : DataLayoutStringR600); 2280b57cec5SDimitry Andric 2290b57cec5SDimitry Andric setAddressSpaceMap(Triple.getOS() == llvm::Triple::Mesa3D || 2300b57cec5SDimitry Andric !isAMDGCN(Triple)); 2310b57cec5SDimitry Andric UseAddrSpaceMapMangling = true; 2320b57cec5SDimitry Andric 233bdd1243dSDimitry Andric if (isAMDGCN(Triple)) { 234bdd1243dSDimitry Andric // __bf16 is always available as a load/store only type on AMDGCN. 235bdd1243dSDimitry Andric BFloat16Width = BFloat16Align = 16; 236bdd1243dSDimitry Andric BFloat16Format = &llvm::APFloat::BFloat(); 237bdd1243dSDimitry Andric } 238bdd1243dSDimitry Andric 2390b57cec5SDimitry Andric HasLegalHalfType = true; 2400b57cec5SDimitry Andric HasFloat16 = true; 241*0fca6ea1SDimitry Andric WavefrontSize = (GPUFeatures & llvm::AMDGPU::FEATURE_WAVE32) ? 32 : 64; 242e8d8bef9SDimitry Andric AllowAMDGPUUnsafeFPAtomics = Opts.AllowAMDGPUUnsafeFPAtomics; 2430b57cec5SDimitry Andric 244bdd1243dSDimitry Andric // Set pointer width and alignment for the generic address space. 
245bdd1243dSDimitry Andric PointerWidth = PointerAlign = getPointerWidthV(LangAS::Default); 2460b57cec5SDimitry Andric if (getMaxPointerWidth() == 64) { 2470b57cec5SDimitry Andric LongWidth = LongAlign = 64; 2480b57cec5SDimitry Andric SizeType = UnsignedLong; 2490b57cec5SDimitry Andric PtrDiffType = SignedLong; 2500b57cec5SDimitry Andric IntPtrType = SignedLong; 2510b57cec5SDimitry Andric } 2520b57cec5SDimitry Andric 2530b57cec5SDimitry Andric MaxAtomicPromoteWidth = MaxAtomicInlineWidth = 64; 25406c3fb27SDimitry Andric CUMode = !(GPUFeatures & llvm::AMDGPU::FEATURE_WGP); 2555f757f3fSDimitry Andric for (auto F : {"image-insts", "gws"}) 2565f757f3fSDimitry Andric ReadOnlyFeatures.insert(F); 2575f757f3fSDimitry Andric HalfArgsAndReturns = true; 2580b57cec5SDimitry Andric } 2590b57cec5SDimitry Andric 260fe6060f1SDimitry Andric void AMDGPUTargetInfo::adjust(DiagnosticsEngine &Diags, LangOptions &Opts) { 261fe6060f1SDimitry Andric TargetInfo::adjust(Diags, Opts); 2620b57cec5SDimitry Andric // ToDo: There are still a few places using default address space as private 2630b57cec5SDimitry Andric // address space in OpenCL, which needs to be cleaned up, then Opts.OpenCL 2640b57cec5SDimitry Andric // can be removed from the following line. 
2650b57cec5SDimitry Andric setAddressSpaceMap(/*DefaultIsPrivate=*/Opts.OpenCL || 2660b57cec5SDimitry Andric !isAMDGCN(getTriple())); 2670b57cec5SDimitry Andric } 2680b57cec5SDimitry Andric 2690b57cec5SDimitry Andric ArrayRef<Builtin::Info> AMDGPUTargetInfo::getTargetBuiltins() const { 270bdd1243dSDimitry Andric return llvm::ArrayRef(BuiltinInfo, 271bdd1243dSDimitry Andric clang::AMDGPU::LastTSBuiltin - Builtin::FirstTSBuiltin); 2720b57cec5SDimitry Andric } 2730b57cec5SDimitry Andric 2740b57cec5SDimitry Andric void AMDGPUTargetInfo::getTargetDefines(const LangOptions &Opts, 2750b57cec5SDimitry Andric MacroBuilder &Builder) const { 2760b57cec5SDimitry Andric Builder.defineMacro("__AMD__"); 2770b57cec5SDimitry Andric Builder.defineMacro("__AMDGPU__"); 2780b57cec5SDimitry Andric 2790b57cec5SDimitry Andric if (isAMDGCN(getTriple())) 2800b57cec5SDimitry Andric Builder.defineMacro("__AMDGCN__"); 2810b57cec5SDimitry Andric else 2820b57cec5SDimitry Andric Builder.defineMacro("__R600__"); 2830b57cec5SDimitry Andric 284*0fca6ea1SDimitry Andric // Legacy HIP host code relies on these default attributes to be defined. 285*0fca6ea1SDimitry Andric bool IsHIPHost = Opts.HIP && !Opts.CUDAIsDevice; 286*0fca6ea1SDimitry Andric if (GPUKind == llvm::AMDGPU::GK_NONE && !IsHIPHost) 287*0fca6ea1SDimitry Andric return; 288*0fca6ea1SDimitry Andric 289*0fca6ea1SDimitry Andric llvm::SmallString<16> CanonName = 290*0fca6ea1SDimitry Andric (isAMDGCN(getTriple()) ? getArchNameAMDGCN(GPUKind) 291*0fca6ea1SDimitry Andric : getArchNameR600(GPUKind)); 292*0fca6ea1SDimitry Andric 293*0fca6ea1SDimitry Andric // Sanitize the name of generic targets. 294*0fca6ea1SDimitry Andric // e.g. 
gfx10-1-generic -> gfx10_1_generic 295*0fca6ea1SDimitry Andric if (GPUKind >= llvm::AMDGPU::GK_AMDGCN_GENERIC_FIRST && 296*0fca6ea1SDimitry Andric GPUKind <= llvm::AMDGPU::GK_AMDGCN_GENERIC_LAST) { 297*0fca6ea1SDimitry Andric std::replace(CanonName.begin(), CanonName.end(), '-', '_'); 298*0fca6ea1SDimitry Andric } 299*0fca6ea1SDimitry Andric 3000b57cec5SDimitry Andric Builder.defineMacro(Twine("__") + Twine(CanonName) + Twine("__")); 30181ad6265SDimitry Andric // Emit macros for gfx family e.g. gfx906 -> __GFX9__, gfx1030 -> __GFX10___ 302*0fca6ea1SDimitry Andric if (isAMDGCN(getTriple()) && !IsHIPHost) { 303*0fca6ea1SDimitry Andric assert(StringRef(CanonName).starts_with("gfx") && 304*0fca6ea1SDimitry Andric "Invalid amdgcn canonical name"); 305*0fca6ea1SDimitry Andric StringRef CanonFamilyName = getArchFamilyNameAMDGCN(GPUKind); 306*0fca6ea1SDimitry Andric Builder.defineMacro(Twine("__") + Twine(CanonFamilyName.upper()) + 30781ad6265SDimitry Andric Twine("__")); 308e8d8bef9SDimitry Andric Builder.defineMacro("__amdgcn_processor__", 309e8d8bef9SDimitry Andric Twine("\"") + Twine(CanonName) + Twine("\"")); 310e8d8bef9SDimitry Andric Builder.defineMacro("__amdgcn_target_id__", 31181ad6265SDimitry Andric Twine("\"") + Twine(*getTargetID()) + Twine("\"")); 312e8d8bef9SDimitry Andric for (auto F : getAllPossibleTargetIDFeatures(getTriple(), CanonName)) { 313e8d8bef9SDimitry Andric auto Loc = OffloadArchFeatures.find(F); 314e8d8bef9SDimitry Andric if (Loc != OffloadArchFeatures.end()) { 315e8d8bef9SDimitry Andric std::string NewF = F.str(); 316e8d8bef9SDimitry Andric std::replace(NewF.begin(), NewF.end(), '-', '_'); 317e8d8bef9SDimitry Andric Builder.defineMacro(Twine("__amdgcn_feature_") + Twine(NewF) + 318e8d8bef9SDimitry Andric Twine("__"), 319e8d8bef9SDimitry Andric Loc->second ? 
"1" : "0"); 320e8d8bef9SDimitry Andric } 321e8d8bef9SDimitry Andric } 322e8d8bef9SDimitry Andric } 3230b57cec5SDimitry Andric 32481ad6265SDimitry Andric if (AllowAMDGPUUnsafeFPAtomics) 32581ad6265SDimitry Andric Builder.defineMacro("__AMDGCN_UNSAFE_FP_ATOMICS__"); 32681ad6265SDimitry Andric 3270b57cec5SDimitry Andric // TODO: __HAS_FMAF__, __HAS_LDEXPF__, __HAS_FP64__ are deprecated and will be 3280b57cec5SDimitry Andric // removed in the near future. 3290b57cec5SDimitry Andric if (hasFMAF()) 3300b57cec5SDimitry Andric Builder.defineMacro("__HAS_FMAF__"); 3310b57cec5SDimitry Andric if (hasFastFMAF()) 3320b57cec5SDimitry Andric Builder.defineMacro("FP_FAST_FMAF"); 3330b57cec5SDimitry Andric if (hasLDEXPF()) 3340b57cec5SDimitry Andric Builder.defineMacro("__HAS_LDEXPF__"); 3350b57cec5SDimitry Andric if (hasFP64()) 3360b57cec5SDimitry Andric Builder.defineMacro("__HAS_FP64__"); 3370b57cec5SDimitry Andric if (hasFastFMA()) 3380b57cec5SDimitry Andric Builder.defineMacro("FP_FAST_FMA"); 339e8d8bef9SDimitry Andric 34006c3fb27SDimitry Andric Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE__", Twine(WavefrontSize)); 34106c3fb27SDimitry Andric // ToDo: deprecate this macro for naming consistency. 342e8d8bef9SDimitry Andric Builder.defineMacro("__AMDGCN_WAVEFRONT_SIZE", Twine(WavefrontSize)); 34306c3fb27SDimitry Andric Builder.defineMacro("__AMDGCN_CUMODE__", Twine(CUMode)); 3440b57cec5SDimitry Andric } 3450b57cec5SDimitry Andric 3460b57cec5SDimitry Andric void AMDGPUTargetInfo::setAuxTarget(const TargetInfo *Aux) { 3470b57cec5SDimitry Andric assert(HalfFormat == Aux->HalfFormat); 3480b57cec5SDimitry Andric assert(FloatFormat == Aux->FloatFormat); 3490b57cec5SDimitry Andric assert(DoubleFormat == Aux->DoubleFormat); 3500b57cec5SDimitry Andric 3510b57cec5SDimitry Andric // On x86_64 long double is 80-bit extended precision format, which is 3520b57cec5SDimitry Andric // not supported by AMDGPU. 
128-bit floating point format is also not 3530b57cec5SDimitry Andric // supported by AMDGPU. Therefore keep its own format for these two types. 3540b57cec5SDimitry Andric auto SaveLongDoubleFormat = LongDoubleFormat; 3550b57cec5SDimitry Andric auto SaveFloat128Format = Float128Format; 35681ad6265SDimitry Andric auto SaveLongDoubleWidth = LongDoubleWidth; 35781ad6265SDimitry Andric auto SaveLongDoubleAlign = LongDoubleAlign; 3580b57cec5SDimitry Andric copyAuxTarget(Aux); 3590b57cec5SDimitry Andric LongDoubleFormat = SaveLongDoubleFormat; 3600b57cec5SDimitry Andric Float128Format = SaveFloat128Format; 36181ad6265SDimitry Andric LongDoubleWidth = SaveLongDoubleWidth; 36281ad6265SDimitry Andric LongDoubleAlign = SaveLongDoubleAlign; 3635ffd83dbSDimitry Andric // For certain builtin types support on the host target, claim they are 3645ffd83dbSDimitry Andric // support to pass the compilation of the host code during the device-side 3655ffd83dbSDimitry Andric // compilation. 3665ffd83dbSDimitry Andric // FIXME: As the side effect, we also accept `__float128` uses in the device 3675ffd83dbSDimitry Andric // code. To rejct these builtin types supported in the host target but not in 3685ffd83dbSDimitry Andric // the device target, one approach would support `device_builtin` attribute 3695ffd83dbSDimitry Andric // so that we could tell the device builtin types from the host ones. The 3705ffd83dbSDimitry Andric // also solves the different representations of the same builtin type, such 3715ffd83dbSDimitry Andric // as `size_t` in the MSVC environment. 3725ffd83dbSDimitry Andric if (Aux->hasFloat128Type()) { 3735ffd83dbSDimitry Andric HasFloat128 = true; 3745ffd83dbSDimitry Andric Float128Format = DoubleFormat; 3755ffd83dbSDimitry Andric } 3760b57cec5SDimitry Andric } 377