10b57cec5SDimitry Andric //===-- AMDGPUMachineFunctionInfo.h -------------------------------*- C++ -*-=// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H 100b57cec5SDimitry Andric #define LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H 110b57cec5SDimitry Andric 12e8d8bef9SDimitry Andric #include "Utils/AMDGPUBaseInfo.h" 130b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h" 140b57cec5SDimitry Andric #include "llvm/CodeGen/MachineFunction.h" 1581ad6265SDimitry Andric #include "llvm/IR/DataLayout.h" 16fcaf7f86SDimitry Andric #include "llvm/IR/Function.h" 1781ad6265SDimitry Andric #include "llvm/IR/GlobalValue.h" 1881ad6265SDimitry Andric #include "llvm/IR/GlobalVariable.h" 190b57cec5SDimitry Andric 200b57cec5SDimitry Andric namespace llvm { 210b57cec5SDimitry Andric 22bdd1243dSDimitry Andric class AMDGPUSubtarget; 23bdd1243dSDimitry Andric 240b57cec5SDimitry Andric class AMDGPUMachineFunction : public MachineFunctionInfo { 250b57cec5SDimitry Andric /// A map to keep track of local memory objects and their offsets within the 260b57cec5SDimitry Andric /// local memory space. 270b57cec5SDimitry Andric SmallDenseMap<const GlobalValue *, unsigned, 4> LocalMemoryObjects; 280b57cec5SDimitry Andric 290b57cec5SDimitry Andric protected: 305ffd83dbSDimitry Andric uint64_t ExplicitKernArgSize = 0; // Cache for this. 318bcb0991SDimitry Andric Align MaxKernArgAlign; // Cache for this. 320b57cec5SDimitry Andric 330b57cec5SDimitry Andric /// Number of bytes in the LDS that are being used. 3481ad6265SDimitry Andric uint32_t LDSSize = 0; 3581ad6265SDimitry Andric uint32_t GDSSize = 0; 360b57cec5SDimitry Andric 37e8d8bef9SDimitry Andric /// Number of bytes in the LDS allocated statically. This field is only used 38e8d8bef9SDimitry Andric /// in the instruction selector and not part of the machine function info. 3981ad6265SDimitry Andric uint32_t StaticLDSSize = 0; 4081ad6265SDimitry Andric uint32_t StaticGDSSize = 0; 41e8d8bef9SDimitry Andric 42e8d8bef9SDimitry Andric /// Align for dynamic shared memory if any. Dynamic shared memory is 43e8d8bef9SDimitry Andric /// allocated directly after the static one, i.e., LDSSize. Need to pad 44e8d8bef9SDimitry Andric /// LDSSize to ensure that dynamic one is aligned accordingly. 45e8d8bef9SDimitry Andric /// The maximal alignment is updated during IR translation or lowering 46e8d8bef9SDimitry Andric /// stages. 47e8d8bef9SDimitry Andric Align DynLDSAlign; 48e8d8bef9SDimitry Andric 49e8d8bef9SDimitry Andric // Kernels + shaders. i.e. functions called by the hardware and not called 500b57cec5SDimitry Andric // by other functions. 515ffd83dbSDimitry Andric bool IsEntryFunction = false; 520b57cec5SDimitry Andric 53e8d8bef9SDimitry Andric // Entry points called by other functions instead of directly by the hardware. 54e8d8bef9SDimitry Andric bool IsModuleEntryFunction = false; 55e8d8bef9SDimitry Andric 56*5f757f3fSDimitry Andric // Functions with the amdgpu_cs_chain or amdgpu_cs_chain_preserve CC. 57*5f757f3fSDimitry Andric bool IsChainFunction = false; 58*5f757f3fSDimitry Andric 595ffd83dbSDimitry Andric bool NoSignedZerosFPMath = false; 600b57cec5SDimitry Andric 610b57cec5SDimitry Andric // Function may be memory bound. 625ffd83dbSDimitry Andric bool MemoryBound = false; 630b57cec5SDimitry Andric 640b57cec5SDimitry Andric // Kernel may need limited waves per EU for better performance. 655ffd83dbSDimitry Andric bool WaveLimiter = false; 660b57cec5SDimitry Andric 670b57cec5SDimitry Andric public: 68bdd1243dSDimitry Andric AMDGPUMachineFunction(const Function &F, const AMDGPUSubtarget &ST); 690b57cec5SDimitry Andric 700b57cec5SDimitry Andric uint64_t getExplicitKernArgSize() const { 710b57cec5SDimitry Andric return ExplicitKernArgSize; 720b57cec5SDimitry Andric } 730b57cec5SDimitry Andric 7481ad6265SDimitry Andric Align getMaxKernArgAlign() const { return MaxKernArgAlign; } 750b57cec5SDimitry Andric 7681ad6265SDimitry Andric uint32_t getLDSSize() const { 770b57cec5SDimitry Andric return LDSSize; 780b57cec5SDimitry Andric } 790b57cec5SDimitry Andric 8081ad6265SDimitry Andric uint32_t getGDSSize() const { 8181ad6265SDimitry Andric return GDSSize; 8281ad6265SDimitry Andric } 8381ad6265SDimitry Andric 840b57cec5SDimitry Andric bool isEntryFunction() const { 850b57cec5SDimitry Andric return IsEntryFunction; 860b57cec5SDimitry Andric } 870b57cec5SDimitry Andric 88e8d8bef9SDimitry Andric bool isModuleEntryFunction() const { return IsModuleEntryFunction; } 89e8d8bef9SDimitry Andric 90*5f757f3fSDimitry Andric bool isChainFunction() const { return IsChainFunction; } 91*5f757f3fSDimitry Andric 92*5f757f3fSDimitry Andric // The stack is empty upon entry to this function. 93*5f757f3fSDimitry Andric bool isBottomOfStack() const { 94*5f757f3fSDimitry Andric return isEntryFunction() || isChainFunction(); 95*5f757f3fSDimitry Andric } 96*5f757f3fSDimitry Andric 970b57cec5SDimitry Andric bool hasNoSignedZerosFPMath() const { 980b57cec5SDimitry Andric return NoSignedZerosFPMath; 990b57cec5SDimitry Andric } 1000b57cec5SDimitry Andric 1010b57cec5SDimitry Andric bool isMemoryBound() const { 1020b57cec5SDimitry Andric return MemoryBound; 1030b57cec5SDimitry Andric } 1040b57cec5SDimitry Andric 1050b57cec5SDimitry Andric bool needsWaveLimiter() const { 1060b57cec5SDimitry Andric return WaveLimiter; 1070b57cec5SDimitry Andric } 1080b57cec5SDimitry Andric 109bdd1243dSDimitry Andric unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalVariable &GV) { 110bdd1243dSDimitry Andric return allocateLDSGlobal(DL, GV, DynLDSAlign); 111bdd1243dSDimitry Andric } 112e8d8bef9SDimitry Andric 113bdd1243dSDimitry Andric unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalVariable &GV, 114bdd1243dSDimitry Andric Align Trailing); 115bdd1243dSDimitry Andric 116bdd1243dSDimitry Andric static std::optional<uint32_t> getLDSKernelIdMetadata(const Function &F); 11706c3fb27SDimitry Andric static std::optional<uint32_t> getLDSAbsoluteAddress(const GlobalValue &GV); 118fcaf7f86SDimitry Andric 119e8d8bef9SDimitry Andric Align getDynLDSAlign() const { return DynLDSAlign; } 120e8d8bef9SDimitry Andric 12106c3fb27SDimitry Andric void setDynLDSAlign(const Function &F, const GlobalVariable &GV); 1220b57cec5SDimitry Andric }; 1230b57cec5SDimitry Andric 1240b57cec5SDimitry Andric } 1250b57cec5SDimitry Andric #endif 126