xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUMachineFunction.cpp (revision 0b57cec536236d46e3dba9bd041533462f33dbb7)
1*0b57cec5SDimitry Andric //===-- AMDGPUMachineFunction.cpp -----------------------------------------===//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric 
9*0b57cec5SDimitry Andric #include "AMDGPUMachineFunction.h"
10*0b57cec5SDimitry Andric #include "AMDGPUSubtarget.h"
11*0b57cec5SDimitry Andric #include "AMDGPUPerfHintAnalysis.h"
12*0b57cec5SDimitry Andric #include "llvm/CodeGen/MachineModuleInfo.h"
13*0b57cec5SDimitry Andric 
14*0b57cec5SDimitry Andric using namespace llvm;
15*0b57cec5SDimitry Andric 
16*0b57cec5SDimitry Andric AMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF) :
17*0b57cec5SDimitry Andric   MachineFunctionInfo(),
18*0b57cec5SDimitry Andric   LocalMemoryObjects(),
19*0b57cec5SDimitry Andric   ExplicitKernArgSize(0),
20*0b57cec5SDimitry Andric   MaxKernArgAlign(0),
21*0b57cec5SDimitry Andric   LDSSize(0),
22*0b57cec5SDimitry Andric   IsEntryFunction(AMDGPU::isEntryFunctionCC(MF.getFunction().getCallingConv())),
23*0b57cec5SDimitry Andric   NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath),
24*0b57cec5SDimitry Andric   MemoryBound(false),
25*0b57cec5SDimitry Andric   WaveLimiter(false) {
26*0b57cec5SDimitry Andric   const AMDGPUSubtarget &ST = AMDGPUSubtarget::get(MF);
27*0b57cec5SDimitry Andric 
28*0b57cec5SDimitry Andric   // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset,
29*0b57cec5SDimitry Andric   // except reserved size is not correctly aligned.
30*0b57cec5SDimitry Andric   const Function &F = MF.getFunction();
31*0b57cec5SDimitry Andric 
32*0b57cec5SDimitry Andric   Attribute MemBoundAttr = F.getFnAttribute("amdgpu-memory-bound");
33*0b57cec5SDimitry Andric   MemoryBound = MemBoundAttr.isStringAttribute() &&
34*0b57cec5SDimitry Andric                 MemBoundAttr.getValueAsString() == "true";
35*0b57cec5SDimitry Andric 
36*0b57cec5SDimitry Andric   Attribute WaveLimitAttr = F.getFnAttribute("amdgpu-wave-limiter");
37*0b57cec5SDimitry Andric   WaveLimiter = WaveLimitAttr.isStringAttribute() &&
38*0b57cec5SDimitry Andric                 WaveLimitAttr.getValueAsString() == "true";
39*0b57cec5SDimitry Andric 
40*0b57cec5SDimitry Andric   CallingConv::ID CC = F.getCallingConv();
41*0b57cec5SDimitry Andric   if (CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL)
42*0b57cec5SDimitry Andric     ExplicitKernArgSize = ST.getExplicitKernArgSize(F, MaxKernArgAlign);
43*0b57cec5SDimitry Andric }
44*0b57cec5SDimitry Andric 
45*0b57cec5SDimitry Andric unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL,
46*0b57cec5SDimitry Andric                                                   const GlobalValue &GV) {
47*0b57cec5SDimitry Andric   auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0));
48*0b57cec5SDimitry Andric   if (!Entry.second)
49*0b57cec5SDimitry Andric     return Entry.first->second;
50*0b57cec5SDimitry Andric 
51*0b57cec5SDimitry Andric   unsigned Align = GV.getAlignment();
52*0b57cec5SDimitry Andric   if (Align == 0)
53*0b57cec5SDimitry Andric     Align = DL.getABITypeAlignment(GV.getValueType());
54*0b57cec5SDimitry Andric 
55*0b57cec5SDimitry Andric   /// TODO: We should sort these to minimize wasted space due to alignment
56*0b57cec5SDimitry Andric   /// padding. Currently the padding is decided by the first encountered use
57*0b57cec5SDimitry Andric   /// during lowering.
58*0b57cec5SDimitry Andric   unsigned Offset = LDSSize = alignTo(LDSSize, Align);
59*0b57cec5SDimitry Andric 
60*0b57cec5SDimitry Andric   Entry.first->second = Offset;
61*0b57cec5SDimitry Andric   LDSSize += DL.getTypeAllocSize(GV.getValueType());
62*0b57cec5SDimitry Andric 
63*0b57cec5SDimitry Andric   return Offset;
64*0b57cec5SDimitry Andric }
65