xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUMachineFunction.cpp (revision 04eeddc0aa8e0a417a16eaf9d7d095207f4a8623)
//===-- AMDGPUMachineFunction.cpp -----------------------------------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #include "AMDGPUMachineFunction.h"
100b57cec5SDimitry Andric #include "AMDGPUPerfHintAnalysis.h"
11e8d8bef9SDimitry Andric #include "AMDGPUSubtarget.h"
120b57cec5SDimitry Andric #include "llvm/CodeGen/MachineModuleInfo.h"
13e8d8bef9SDimitry Andric #include "llvm/Target/TargetMachine.h"
140b57cec5SDimitry Andric 
150b57cec5SDimitry Andric using namespace llvm;
160b57cec5SDimitry Andric 
17e8d8bef9SDimitry Andric AMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF)
18*04eeddc0SDimitry Andric     : Mode(MF.getFunction()), IsEntryFunction(AMDGPU::isEntryFunctionCC(
19*04eeddc0SDimitry Andric                                   MF.getFunction().getCallingConv())),
20e8d8bef9SDimitry Andric       IsModuleEntryFunction(
21e8d8bef9SDimitry Andric           AMDGPU::isModuleEntryFunctionCC(MF.getFunction().getCallingConv())),
225ffd83dbSDimitry Andric       NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath) {
230b57cec5SDimitry Andric   const AMDGPUSubtarget &ST = AMDGPUSubtarget::get(MF);
240b57cec5SDimitry Andric 
250b57cec5SDimitry Andric   // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset,
260b57cec5SDimitry Andric   // except reserved size is not correctly aligned.
270b57cec5SDimitry Andric   const Function &F = MF.getFunction();
280b57cec5SDimitry Andric 
290b57cec5SDimitry Andric   Attribute MemBoundAttr = F.getFnAttribute("amdgpu-memory-bound");
30fe6060f1SDimitry Andric   MemoryBound = MemBoundAttr.getValueAsBool();
310b57cec5SDimitry Andric 
320b57cec5SDimitry Andric   Attribute WaveLimitAttr = F.getFnAttribute("amdgpu-wave-limiter");
33fe6060f1SDimitry Andric   WaveLimiter = WaveLimitAttr.getValueAsBool();
340b57cec5SDimitry Andric 
350b57cec5SDimitry Andric   CallingConv::ID CC = F.getCallingConv();
360b57cec5SDimitry Andric   if (CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL)
370b57cec5SDimitry Andric     ExplicitKernArgSize = ST.getExplicitKernArgSize(F, MaxKernArgAlign);
380b57cec5SDimitry Andric }
390b57cec5SDimitry Andric 
400b57cec5SDimitry Andric unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL,
415ffd83dbSDimitry Andric                                                   const GlobalVariable &GV) {
420b57cec5SDimitry Andric   auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0));
430b57cec5SDimitry Andric   if (!Entry.second)
440b57cec5SDimitry Andric     return Entry.first->second;
450b57cec5SDimitry Andric 
465ffd83dbSDimitry Andric   Align Alignment =
475ffd83dbSDimitry Andric       DL.getValueOrABITypeAlignment(GV.getAlign(), GV.getValueType());
480b57cec5SDimitry Andric 
490b57cec5SDimitry Andric   /// TODO: We should sort these to minimize wasted space due to alignment
500b57cec5SDimitry Andric   /// padding. Currently the padding is decided by the first encountered use
510b57cec5SDimitry Andric   /// during lowering.
52e8d8bef9SDimitry Andric   unsigned Offset = StaticLDSSize = alignTo(StaticLDSSize, Alignment);
530b57cec5SDimitry Andric 
540b57cec5SDimitry Andric   Entry.first->second = Offset;
55e8d8bef9SDimitry Andric   StaticLDSSize += DL.getTypeAllocSize(GV.getValueType());
56e8d8bef9SDimitry Andric 
57e8d8bef9SDimitry Andric   // Update the LDS size considering the padding to align the dynamic shared
58e8d8bef9SDimitry Andric   // memory.
59e8d8bef9SDimitry Andric   LDSSize = alignTo(StaticLDSSize, DynLDSAlign);
600b57cec5SDimitry Andric 
610b57cec5SDimitry Andric   return Offset;
620b57cec5SDimitry Andric }
63e8d8bef9SDimitry Andric 
64fe6060f1SDimitry Andric void AMDGPUMachineFunction::allocateModuleLDSGlobal(const Module *M) {
65fe6060f1SDimitry Andric   if (isModuleEntryFunction()) {
66fe6060f1SDimitry Andric     const GlobalVariable *GV = M->getNamedGlobal("llvm.amdgcn.module.lds");
67fe6060f1SDimitry Andric     if (GV) {
68fe6060f1SDimitry Andric       unsigned Offset = allocateLDSGlobal(M->getDataLayout(), *GV);
69fe6060f1SDimitry Andric       (void)Offset;
70fe6060f1SDimitry Andric       assert(Offset == 0 &&
71fe6060f1SDimitry Andric              "Module LDS expected to be allocated before other LDS");
72fe6060f1SDimitry Andric     }
73fe6060f1SDimitry Andric   }
74fe6060f1SDimitry Andric }
75fe6060f1SDimitry Andric 
76e8d8bef9SDimitry Andric void AMDGPUMachineFunction::setDynLDSAlign(const DataLayout &DL,
77e8d8bef9SDimitry Andric                                            const GlobalVariable &GV) {
78e8d8bef9SDimitry Andric   assert(DL.getTypeAllocSize(GV.getValueType()).isZero());
79e8d8bef9SDimitry Andric 
80e8d8bef9SDimitry Andric   Align Alignment =
81e8d8bef9SDimitry Andric       DL.getValueOrABITypeAlignment(GV.getAlign(), GV.getValueType());
82e8d8bef9SDimitry Andric   if (Alignment <= DynLDSAlign)
83e8d8bef9SDimitry Andric     return;
84e8d8bef9SDimitry Andric 
85e8d8bef9SDimitry Andric   LDSSize = alignTo(StaticLDSSize, Alignment);
86e8d8bef9SDimitry Andric   DynLDSAlign = Alignment;
87e8d8bef9SDimitry Andric }
88