xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUMachineFunction.h (revision 5f757f3ff9144b609b3c433dfd370cc6bdc191ad)
//===-- AMDGPUMachineFunction.h ---------------------------------*- C++ -*-===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H
100b57cec5SDimitry Andric #define LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H
110b57cec5SDimitry Andric 
12e8d8bef9SDimitry Andric #include "Utils/AMDGPUBaseInfo.h"
130b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h"
140b57cec5SDimitry Andric #include "llvm/CodeGen/MachineFunction.h"
1581ad6265SDimitry Andric #include "llvm/IR/DataLayout.h"
16fcaf7f86SDimitry Andric #include "llvm/IR/Function.h"
1781ad6265SDimitry Andric #include "llvm/IR/GlobalValue.h"
1881ad6265SDimitry Andric #include "llvm/IR/GlobalVariable.h"
190b57cec5SDimitry Andric 
200b57cec5SDimitry Andric namespace llvm {
210b57cec5SDimitry Andric 
22bdd1243dSDimitry Andric class AMDGPUSubtarget;
23bdd1243dSDimitry Andric 
240b57cec5SDimitry Andric class AMDGPUMachineFunction : public MachineFunctionInfo {
250b57cec5SDimitry Andric   /// A map to keep track of local memory objects and their offsets within the
260b57cec5SDimitry Andric   /// local memory space.
270b57cec5SDimitry Andric   SmallDenseMap<const GlobalValue *, unsigned, 4> LocalMemoryObjects;
280b57cec5SDimitry Andric 
290b57cec5SDimitry Andric protected:
305ffd83dbSDimitry Andric   uint64_t ExplicitKernArgSize = 0; // Cache for this.
318bcb0991SDimitry Andric   Align MaxKernArgAlign;        // Cache for this.
320b57cec5SDimitry Andric 
330b57cec5SDimitry Andric   /// Number of bytes in the LDS that are being used.
3481ad6265SDimitry Andric   uint32_t LDSSize = 0;
3581ad6265SDimitry Andric   uint32_t GDSSize = 0;
360b57cec5SDimitry Andric 
37e8d8bef9SDimitry Andric   /// Number of bytes in the LDS allocated statically. This field is only used
38e8d8bef9SDimitry Andric   /// in the instruction selector and not part of the machine function info.
3981ad6265SDimitry Andric   uint32_t StaticLDSSize = 0;
4081ad6265SDimitry Andric   uint32_t StaticGDSSize = 0;
41e8d8bef9SDimitry Andric 
42e8d8bef9SDimitry Andric   /// Align for dynamic shared memory if any. Dynamic shared memory is
43e8d8bef9SDimitry Andric   /// allocated directly after the static one, i.e., LDSSize. Need to pad
44e8d8bef9SDimitry Andric   /// LDSSize to ensure that dynamic one is aligned accordingly.
45e8d8bef9SDimitry Andric   /// The maximal alignment is updated during IR translation or lowering
46e8d8bef9SDimitry Andric   /// stages.
47e8d8bef9SDimitry Andric   Align DynLDSAlign;
48e8d8bef9SDimitry Andric 
49e8d8bef9SDimitry Andric   // Kernels + shaders. i.e. functions called by the hardware and not called
500b57cec5SDimitry Andric   // by other functions.
515ffd83dbSDimitry Andric   bool IsEntryFunction = false;
520b57cec5SDimitry Andric 
53e8d8bef9SDimitry Andric   // Entry points called by other functions instead of directly by the hardware.
54e8d8bef9SDimitry Andric   bool IsModuleEntryFunction = false;
55e8d8bef9SDimitry Andric 
56*5f757f3fSDimitry Andric   // Functions with the amdgpu_cs_chain or amdgpu_cs_chain_preserve CC.
57*5f757f3fSDimitry Andric   bool IsChainFunction = false;
58*5f757f3fSDimitry Andric 
595ffd83dbSDimitry Andric   bool NoSignedZerosFPMath = false;
600b57cec5SDimitry Andric 
610b57cec5SDimitry Andric   // Function may be memory bound.
625ffd83dbSDimitry Andric   bool MemoryBound = false;
630b57cec5SDimitry Andric 
640b57cec5SDimitry Andric   // Kernel may need limited waves per EU for better performance.
655ffd83dbSDimitry Andric   bool WaveLimiter = false;
660b57cec5SDimitry Andric 
670b57cec5SDimitry Andric public:
68bdd1243dSDimitry Andric   AMDGPUMachineFunction(const Function &F, const AMDGPUSubtarget &ST);
690b57cec5SDimitry Andric 
700b57cec5SDimitry Andric   uint64_t getExplicitKernArgSize() const {
710b57cec5SDimitry Andric     return ExplicitKernArgSize;
720b57cec5SDimitry Andric   }
730b57cec5SDimitry Andric 
7481ad6265SDimitry Andric   Align getMaxKernArgAlign() const { return MaxKernArgAlign; }
750b57cec5SDimitry Andric 
7681ad6265SDimitry Andric   uint32_t getLDSSize() const {
770b57cec5SDimitry Andric     return LDSSize;
780b57cec5SDimitry Andric   }
790b57cec5SDimitry Andric 
8081ad6265SDimitry Andric   uint32_t getGDSSize() const {
8181ad6265SDimitry Andric     return GDSSize;
8281ad6265SDimitry Andric   }
8381ad6265SDimitry Andric 
840b57cec5SDimitry Andric   bool isEntryFunction() const {
850b57cec5SDimitry Andric     return IsEntryFunction;
860b57cec5SDimitry Andric   }
870b57cec5SDimitry Andric 
88e8d8bef9SDimitry Andric   bool isModuleEntryFunction() const { return IsModuleEntryFunction; }
89e8d8bef9SDimitry Andric 
90*5f757f3fSDimitry Andric   bool isChainFunction() const { return IsChainFunction; }
91*5f757f3fSDimitry Andric 
92*5f757f3fSDimitry Andric   // The stack is empty upon entry to this function.
93*5f757f3fSDimitry Andric   bool isBottomOfStack() const {
94*5f757f3fSDimitry Andric     return isEntryFunction() || isChainFunction();
95*5f757f3fSDimitry Andric   }
96*5f757f3fSDimitry Andric 
970b57cec5SDimitry Andric   bool hasNoSignedZerosFPMath() const {
980b57cec5SDimitry Andric     return NoSignedZerosFPMath;
990b57cec5SDimitry Andric   }
1000b57cec5SDimitry Andric 
1010b57cec5SDimitry Andric   bool isMemoryBound() const {
1020b57cec5SDimitry Andric     return MemoryBound;
1030b57cec5SDimitry Andric   }
1040b57cec5SDimitry Andric 
1050b57cec5SDimitry Andric   bool needsWaveLimiter() const {
1060b57cec5SDimitry Andric     return WaveLimiter;
1070b57cec5SDimitry Andric   }
1080b57cec5SDimitry Andric 
109bdd1243dSDimitry Andric   unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalVariable &GV) {
110bdd1243dSDimitry Andric     return allocateLDSGlobal(DL, GV, DynLDSAlign);
111bdd1243dSDimitry Andric   }
112e8d8bef9SDimitry Andric 
113bdd1243dSDimitry Andric   unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalVariable &GV,
114bdd1243dSDimitry Andric                              Align Trailing);
115bdd1243dSDimitry Andric 
116bdd1243dSDimitry Andric   static std::optional<uint32_t> getLDSKernelIdMetadata(const Function &F);
11706c3fb27SDimitry Andric   static std::optional<uint32_t> getLDSAbsoluteAddress(const GlobalValue &GV);
118fcaf7f86SDimitry Andric 
119e8d8bef9SDimitry Andric   Align getDynLDSAlign() const { return DynLDSAlign; }
120e8d8bef9SDimitry Andric 
12106c3fb27SDimitry Andric   void setDynLDSAlign(const Function &F, const GlobalVariable &GV);
1220b57cec5SDimitry Andric };
1230b57cec5SDimitry Andric 
1240b57cec5SDimitry Andric }
1250b57cec5SDimitry Andric #endif
126