10b57cec5SDimitry Andric //===-- AMDGPUMachineFunctionInfo.cpp ---------------------------------------=// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #include "AMDGPUMachineFunction.h" 100b57cec5SDimitry Andric #include "AMDGPUPerfHintAnalysis.h" 11e8d8bef9SDimitry Andric #include "AMDGPUSubtarget.h" 120b57cec5SDimitry Andric #include "llvm/CodeGen/MachineModuleInfo.h" 13e8d8bef9SDimitry Andric #include "llvm/Target/TargetMachine.h" 140b57cec5SDimitry Andric 150b57cec5SDimitry Andric using namespace llvm; 160b57cec5SDimitry Andric 17e8d8bef9SDimitry Andric AMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF) 18e8d8bef9SDimitry Andric : MachineFunctionInfo(), Mode(MF.getFunction()), 19e8d8bef9SDimitry Andric IsEntryFunction( 20e8d8bef9SDimitry Andric AMDGPU::isEntryFunctionCC(MF.getFunction().getCallingConv())), 21e8d8bef9SDimitry Andric IsModuleEntryFunction( 22e8d8bef9SDimitry Andric AMDGPU::isModuleEntryFunctionCC(MF.getFunction().getCallingConv())), 235ffd83dbSDimitry Andric NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath) { 240b57cec5SDimitry Andric const AMDGPUSubtarget &ST = AMDGPUSubtarget::get(MF); 250b57cec5SDimitry Andric 260b57cec5SDimitry Andric // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset, 270b57cec5SDimitry Andric // except reserved size is not correctly aligned. 280b57cec5SDimitry Andric const Function &F = MF.getFunction(); 290b57cec5SDimitry Andric 300b57cec5SDimitry Andric Attribute MemBoundAttr = F.getFnAttribute("amdgpu-memory-bound"); 31*fe6060f1SDimitry Andric MemoryBound = MemBoundAttr.getValueAsBool(); 320b57cec5SDimitry Andric 330b57cec5SDimitry Andric Attribute WaveLimitAttr = F.getFnAttribute("amdgpu-wave-limiter"); 34*fe6060f1SDimitry Andric WaveLimiter = WaveLimitAttr.getValueAsBool(); 350b57cec5SDimitry Andric 360b57cec5SDimitry Andric CallingConv::ID CC = F.getCallingConv(); 370b57cec5SDimitry Andric if (CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL) 380b57cec5SDimitry Andric ExplicitKernArgSize = ST.getExplicitKernArgSize(F, MaxKernArgAlign); 390b57cec5SDimitry Andric } 400b57cec5SDimitry Andric 410b57cec5SDimitry Andric unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL, 425ffd83dbSDimitry Andric const GlobalVariable &GV) { 430b57cec5SDimitry Andric auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0)); 440b57cec5SDimitry Andric if (!Entry.second) 450b57cec5SDimitry Andric return Entry.first->second; 460b57cec5SDimitry Andric 475ffd83dbSDimitry Andric Align Alignment = 485ffd83dbSDimitry Andric DL.getValueOrABITypeAlignment(GV.getAlign(), GV.getValueType()); 490b57cec5SDimitry Andric 500b57cec5SDimitry Andric /// TODO: We should sort these to minimize wasted space due to alignment 510b57cec5SDimitry Andric /// padding. Currently the padding is decided by the first encountered use 520b57cec5SDimitry Andric /// during lowering. 53e8d8bef9SDimitry Andric unsigned Offset = StaticLDSSize = alignTo(StaticLDSSize, Alignment); 540b57cec5SDimitry Andric 550b57cec5SDimitry Andric Entry.first->second = Offset; 56e8d8bef9SDimitry Andric StaticLDSSize += DL.getTypeAllocSize(GV.getValueType()); 57e8d8bef9SDimitry Andric 58e8d8bef9SDimitry Andric // Update the LDS size considering the padding to align the dynamic shared 59e8d8bef9SDimitry Andric // memory. 60e8d8bef9SDimitry Andric LDSSize = alignTo(StaticLDSSize, DynLDSAlign); 610b57cec5SDimitry Andric 620b57cec5SDimitry Andric return Offset; 630b57cec5SDimitry Andric } 64e8d8bef9SDimitry Andric 65*fe6060f1SDimitry Andric void AMDGPUMachineFunction::allocateModuleLDSGlobal(const Module *M) { 66*fe6060f1SDimitry Andric if (isModuleEntryFunction()) { 67*fe6060f1SDimitry Andric const GlobalVariable *GV = M->getNamedGlobal("llvm.amdgcn.module.lds"); 68*fe6060f1SDimitry Andric if (GV) { 69*fe6060f1SDimitry Andric unsigned Offset = allocateLDSGlobal(M->getDataLayout(), *GV); 70*fe6060f1SDimitry Andric (void)Offset; 71*fe6060f1SDimitry Andric assert(Offset == 0 && 72*fe6060f1SDimitry Andric "Module LDS expected to be allocated before other LDS"); 73*fe6060f1SDimitry Andric } 74*fe6060f1SDimitry Andric } 75*fe6060f1SDimitry Andric } 76*fe6060f1SDimitry Andric 77e8d8bef9SDimitry Andric void AMDGPUMachineFunction::setDynLDSAlign(const DataLayout &DL, 78e8d8bef9SDimitry Andric const GlobalVariable &GV) { 79e8d8bef9SDimitry Andric assert(DL.getTypeAllocSize(GV.getValueType()).isZero()); 80e8d8bef9SDimitry Andric 81e8d8bef9SDimitry Andric Align Alignment = 82e8d8bef9SDimitry Andric DL.getValueOrABITypeAlignment(GV.getAlign(), GV.getValueType()); 83e8d8bef9SDimitry Andric if (Alignment <= DynLDSAlign) 84e8d8bef9SDimitry Andric return; 85e8d8bef9SDimitry Andric 86e8d8bef9SDimitry Andric LDSSize = alignTo(StaticLDSSize, Alignment); 87e8d8bef9SDimitry Andric DynLDSAlign = Alignment; 88e8d8bef9SDimitry Andric } 89