10b57cec5SDimitry Andric //===-- AMDGPU.h - MachineFunction passes hw codegen --------------*- C++ -*-=// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric /// \file 80b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 90b57cec5SDimitry Andric 100b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPU_H 110b57cec5SDimitry Andric #define LLVM_LIB_TARGET_AMDGPU_AMDGPU_H 120b57cec5SDimitry Andric 13e8d8bef9SDimitry Andric #include "llvm/IR/PassManager.h" 141fd87a68SDimitry Andric #include "llvm/Pass.h" 155ffd83dbSDimitry Andric #include "llvm/Support/CodeGen.h" 160b57cec5SDimitry Andric 170b57cec5SDimitry Andric namespace llvm { 180b57cec5SDimitry Andric 190b57cec5SDimitry Andric class TargetMachine; 200b57cec5SDimitry Andric 215ffd83dbSDimitry Andric // GlobalISel passes 225ffd83dbSDimitry Andric void initializeAMDGPUPreLegalizerCombinerPass(PassRegistry &); 235ffd83dbSDimitry Andric FunctionPass *createAMDGPUPreLegalizeCombiner(bool IsOptNone); 245ffd83dbSDimitry Andric void initializeAMDGPUPostLegalizerCombinerPass(PassRegistry &); 255ffd83dbSDimitry Andric FunctionPass *createAMDGPUPostLegalizeCombiner(bool IsOptNone); 265ffd83dbSDimitry Andric FunctionPass *createAMDGPURegBankCombiner(bool IsOptNone); 275ffd83dbSDimitry Andric void initializeAMDGPURegBankCombinerPass(PassRegistry &); 285ffd83dbSDimitry Andric 29*06c3fb27SDimitry Andric void initializeAMDGPURegBankSelectPass(PassRegistry &); 30*06c3fb27SDimitry Andric 310b57cec5SDimitry Andric // SI Passes 320b57cec5SDimitry Andric FunctionPass *createGCNDPPCombinePass(); 330b57cec5SDimitry Andric FunctionPass *createSIAnnotateControlFlowPass(); 340b57cec5SDimitry Andric FunctionPass *createSIFoldOperandsPass(); 350b57cec5SDimitry Andric FunctionPass *createSIPeepholeSDWAPass(); 360b57cec5SDimitry Andric FunctionPass *createSILowerI1CopiesPass(); 370b57cec5SDimitry Andric FunctionPass *createSIShrinkInstructionsPass(); 380b57cec5SDimitry Andric FunctionPass *createSILoadStoreOptimizerPass(); 390b57cec5SDimitry Andric FunctionPass *createSIWholeQuadModePass(); 400b57cec5SDimitry Andric FunctionPass *createSIFixControlFlowLiveIntervalsPass(); 410b57cec5SDimitry Andric FunctionPass *createSIOptimizeExecMaskingPreRAPass(); 42fe6060f1SDimitry Andric FunctionPass *createSIOptimizeVGPRLiveRangePass(); 430b57cec5SDimitry Andric FunctionPass *createSIFixSGPRCopiesPass(); 44*06c3fb27SDimitry Andric FunctionPass *createLowerWWMCopiesPass(); 450b57cec5SDimitry Andric FunctionPass *createSIMemoryLegalizerPass(); 460b57cec5SDimitry Andric FunctionPass *createSIInsertWaitcntsPass(); 470b57cec5SDimitry Andric FunctionPass *createSIPreAllocateWWMRegsPass(); 480b57cec5SDimitry Andric FunctionPass *createSIFormMemoryClausesPass(); 495ffd83dbSDimitry Andric 505ffd83dbSDimitry Andric FunctionPass *createSIPostRABundlerPass(); 515ffd83dbSDimitry Andric FunctionPass *createAMDGPUSimplifyLibCallsPass(const TargetMachine *); 520b57cec5SDimitry Andric FunctionPass *createAMDGPUUseNativeCallsPass(); 53*06c3fb27SDimitry Andric ModulePass *createAMDGPURemoveIncompatibleFunctionsPass(const TargetMachine *); 540b57cec5SDimitry Andric FunctionPass *createAMDGPUCodeGenPreparePass(); 55e8d8bef9SDimitry Andric FunctionPass *createAMDGPULateCodeGenPreparePass(); 560b57cec5SDimitry Andric FunctionPass *createAMDGPUMachineCFGStructurizerPass(); 570b57cec5SDimitry Andric FunctionPass *createAMDGPURewriteOutArgumentsPass(); 58fe6060f1SDimitry Andric ModulePass *createAMDGPULowerModuleLDSPass(); 590b57cec5SDimitry Andric FunctionPass *createSIModeRegisterPass(); 60fe6060f1SDimitry Andric FunctionPass *createGCNPreRAOptimizationsPass(); 610b57cec5SDimitry Andric 62e8d8bef9SDimitry Andric struct AMDGPUSimplifyLibCallsPass : PassInfoMixin<AMDGPUSimplifyLibCallsPass> { 63e8d8bef9SDimitry Andric AMDGPUSimplifyLibCallsPass(TargetMachine &TM) : TM(TM) {} 64e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 65e8d8bef9SDimitry Andric 66e8d8bef9SDimitry Andric private: 67e8d8bef9SDimitry Andric TargetMachine &TM; 68e8d8bef9SDimitry Andric }; 69e8d8bef9SDimitry Andric 70e8d8bef9SDimitry Andric struct AMDGPUUseNativeCallsPass : PassInfoMixin<AMDGPUUseNativeCallsPass> { 71e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 72e8d8bef9SDimitry Andric }; 73e8d8bef9SDimitry Andric 740b57cec5SDimitry Andric void initializeAMDGPUDAGToDAGISelPass(PassRegistry&); 750b57cec5SDimitry Andric 760b57cec5SDimitry Andric void initializeAMDGPUMachineCFGStructurizerPass(PassRegistry&); 770b57cec5SDimitry Andric extern char &AMDGPUMachineCFGStructurizerID; 780b57cec5SDimitry Andric 790b57cec5SDimitry Andric void initializeAMDGPUAlwaysInlinePass(PassRegistry&); 800b57cec5SDimitry Andric 810b57cec5SDimitry Andric Pass *createAMDGPUAnnotateKernelFeaturesPass(); 82fe6060f1SDimitry Andric Pass *createAMDGPUAttributorPass(); 83fe6060f1SDimitry Andric void initializeAMDGPUAttributorPass(PassRegistry &); 840b57cec5SDimitry Andric void initializeAMDGPUAnnotateKernelFeaturesPass(PassRegistry &); 850b57cec5SDimitry Andric extern char &AMDGPUAnnotateKernelFeaturesID; 860b57cec5SDimitry Andric 87*06c3fb27SDimitry Andric // DPP/Iterative option enables the atomic optimizer with given strategy 88*06c3fb27SDimitry Andric // whereas None disables the atomic optimizer. 89*06c3fb27SDimitry Andric enum class ScanOptions { DPP, Iterative, None }; 90*06c3fb27SDimitry Andric FunctionPass *createAMDGPUAtomicOptimizerPass(ScanOptions ScanStrategy); 910b57cec5SDimitry Andric void initializeAMDGPUAtomicOptimizerPass(PassRegistry &); 920b57cec5SDimitry Andric extern char &AMDGPUAtomicOptimizerID; 930b57cec5SDimitry Andric 94bdd1243dSDimitry Andric ModulePass *createAMDGPUCtorDtorLoweringLegacyPass(); 95bdd1243dSDimitry Andric void initializeAMDGPUCtorDtorLoweringLegacyPass(PassRegistry &); 96bdd1243dSDimitry Andric extern char &AMDGPUCtorDtorLoweringLegacyPassID; 97349cc55cSDimitry Andric 980b57cec5SDimitry Andric FunctionPass *createAMDGPULowerKernelArgumentsPass(); 990b57cec5SDimitry Andric void initializeAMDGPULowerKernelArgumentsPass(PassRegistry &); 1000b57cec5SDimitry Andric extern char &AMDGPULowerKernelArgumentsID; 1010b57cec5SDimitry Andric 102349cc55cSDimitry Andric FunctionPass *createAMDGPUPromoteKernelArgumentsPass(); 103349cc55cSDimitry Andric void initializeAMDGPUPromoteKernelArgumentsPass(PassRegistry &); 104349cc55cSDimitry Andric extern char &AMDGPUPromoteKernelArgumentsID; 105349cc55cSDimitry Andric 106349cc55cSDimitry Andric struct AMDGPUPromoteKernelArgumentsPass 107349cc55cSDimitry Andric : PassInfoMixin<AMDGPUPromoteKernelArgumentsPass> { 108349cc55cSDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 109349cc55cSDimitry Andric }; 110349cc55cSDimitry Andric 1110b57cec5SDimitry Andric ModulePass *createAMDGPULowerKernelAttributesPass(); 1120b57cec5SDimitry Andric void initializeAMDGPULowerKernelAttributesPass(PassRegistry &); 1130b57cec5SDimitry Andric extern char &AMDGPULowerKernelAttributesID; 1140b57cec5SDimitry Andric 115e8d8bef9SDimitry Andric struct AMDGPULowerKernelAttributesPass 116e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPULowerKernelAttributesPass> { 117e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 118e8d8bef9SDimitry Andric }; 119e8d8bef9SDimitry Andric 120fe6060f1SDimitry Andric void initializeAMDGPULowerModuleLDSPass(PassRegistry &); 121fe6060f1SDimitry Andric extern char &AMDGPULowerModuleLDSID; 122fe6060f1SDimitry Andric 123fe6060f1SDimitry Andric struct AMDGPULowerModuleLDSPass : PassInfoMixin<AMDGPULowerModuleLDSPass> { 124fe6060f1SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 125fe6060f1SDimitry Andric }; 126fe6060f1SDimitry Andric 1270b57cec5SDimitry Andric void initializeAMDGPURewriteOutArgumentsPass(PassRegistry &); 1280b57cec5SDimitry Andric extern char &AMDGPURewriteOutArgumentsID; 1290b57cec5SDimitry Andric 1300b57cec5SDimitry Andric void initializeGCNDPPCombinePass(PassRegistry &); 1310b57cec5SDimitry Andric extern char &GCNDPPCombineID; 1320b57cec5SDimitry Andric 1330b57cec5SDimitry Andric void initializeSIFoldOperandsPass(PassRegistry &); 1340b57cec5SDimitry Andric extern char &SIFoldOperandsID; 1350b57cec5SDimitry Andric 1360b57cec5SDimitry Andric void initializeSIPeepholeSDWAPass(PassRegistry &); 1370b57cec5SDimitry Andric extern char &SIPeepholeSDWAID; 1380b57cec5SDimitry Andric 1390b57cec5SDimitry Andric void initializeSIShrinkInstructionsPass(PassRegistry&); 1400b57cec5SDimitry Andric extern char &SIShrinkInstructionsID; 1410b57cec5SDimitry Andric 1420b57cec5SDimitry Andric void initializeSIFixSGPRCopiesPass(PassRegistry &); 1430b57cec5SDimitry Andric extern char &SIFixSGPRCopiesID; 1440b57cec5SDimitry Andric 1450b57cec5SDimitry Andric void initializeSIFixVGPRCopiesPass(PassRegistry &); 1460b57cec5SDimitry Andric extern char &SIFixVGPRCopiesID; 1470b57cec5SDimitry Andric 148*06c3fb27SDimitry Andric void initializeSILowerWWMCopiesPass(PassRegistry &); 149*06c3fb27SDimitry Andric extern char &SILowerWWMCopiesID; 150*06c3fb27SDimitry Andric 1510b57cec5SDimitry Andric void initializeSILowerI1CopiesPass(PassRegistry &); 1520b57cec5SDimitry Andric extern char &SILowerI1CopiesID; 1530b57cec5SDimitry Andric 1540b57cec5SDimitry Andric void initializeSILowerSGPRSpillsPass(PassRegistry &); 1550b57cec5SDimitry Andric extern char &SILowerSGPRSpillsID; 1560b57cec5SDimitry Andric 1570b57cec5SDimitry Andric void initializeSILoadStoreOptimizerPass(PassRegistry &); 1580b57cec5SDimitry Andric extern char &SILoadStoreOptimizerID; 1590b57cec5SDimitry Andric 1600b57cec5SDimitry Andric void initializeSIWholeQuadModePass(PassRegistry &); 1610b57cec5SDimitry Andric extern char &SIWholeQuadModeID; 1620b57cec5SDimitry Andric 1630b57cec5SDimitry Andric void initializeSILowerControlFlowPass(PassRegistry &); 1640b57cec5SDimitry Andric extern char &SILowerControlFlowID; 1650b57cec5SDimitry Andric 1665ffd83dbSDimitry Andric void initializeSIPreEmitPeepholePass(PassRegistry &); 1675ffd83dbSDimitry Andric extern char &SIPreEmitPeepholeID; 1685ffd83dbSDimitry Andric 169fe6060f1SDimitry Andric void initializeSILateBranchLoweringPass(PassRegistry &); 170fe6060f1SDimitry Andric extern char &SILateBranchLoweringPassID; 1710b57cec5SDimitry Andric 1720b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPass(PassRegistry &); 1730b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingID; 1740b57cec5SDimitry Andric 1750b57cec5SDimitry Andric void initializeSIPreAllocateWWMRegsPass(PassRegistry &); 1760b57cec5SDimitry Andric extern char &SIPreAllocateWWMRegsID; 1770b57cec5SDimitry Andric 1780b57cec5SDimitry Andric void initializeAMDGPUSimplifyLibCallsPass(PassRegistry &); 1790b57cec5SDimitry Andric extern char &AMDGPUSimplifyLibCallsID; 1800b57cec5SDimitry Andric 1810b57cec5SDimitry Andric void initializeAMDGPUUseNativeCallsPass(PassRegistry &); 1820b57cec5SDimitry Andric extern char &AMDGPUUseNativeCallsID; 1830b57cec5SDimitry Andric 1840b57cec5SDimitry Andric void initializeAMDGPUPerfHintAnalysisPass(PassRegistry &); 1850b57cec5SDimitry Andric extern char &AMDGPUPerfHintAnalysisID; 1860b57cec5SDimitry Andric 1870b57cec5SDimitry Andric // Passes common to R600 and SI 1880b57cec5SDimitry Andric FunctionPass *createAMDGPUPromoteAlloca(); 1890b57cec5SDimitry Andric void initializeAMDGPUPromoteAllocaPass(PassRegistry&); 1900b57cec5SDimitry Andric extern char &AMDGPUPromoteAllocaID; 1910b57cec5SDimitry Andric 1925ffd83dbSDimitry Andric FunctionPass *createAMDGPUPromoteAllocaToVector(); 1935ffd83dbSDimitry Andric void initializeAMDGPUPromoteAllocaToVectorPass(PassRegistry&); 1945ffd83dbSDimitry Andric extern char &AMDGPUPromoteAllocaToVectorID; 1955ffd83dbSDimitry Andric 196e8d8bef9SDimitry Andric struct AMDGPUPromoteAllocaPass : PassInfoMixin<AMDGPUPromoteAllocaPass> { 197e8d8bef9SDimitry Andric AMDGPUPromoteAllocaPass(TargetMachine &TM) : TM(TM) {} 198e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 199e8d8bef9SDimitry Andric 200e8d8bef9SDimitry Andric private: 201e8d8bef9SDimitry Andric TargetMachine &TM; 202e8d8bef9SDimitry Andric }; 203e8d8bef9SDimitry Andric 204e8d8bef9SDimitry Andric struct AMDGPUPromoteAllocaToVectorPass 205e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPUPromoteAllocaToVectorPass> { 206e8d8bef9SDimitry Andric AMDGPUPromoteAllocaToVectorPass(TargetMachine &TM) : TM(TM) {} 207e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 208e8d8bef9SDimitry Andric 209e8d8bef9SDimitry Andric private: 210e8d8bef9SDimitry Andric TargetMachine &TM; 211e8d8bef9SDimitry Andric }; 212e8d8bef9SDimitry Andric 213*06c3fb27SDimitry Andric struct AMDGPUAtomicOptimizerPass : PassInfoMixin<AMDGPUAtomicOptimizerPass> { 214*06c3fb27SDimitry Andric AMDGPUAtomicOptimizerPass(TargetMachine &TM, ScanOptions ScanImpl) 215*06c3fb27SDimitry Andric : TM(TM), ScanImpl(ScanImpl) {} 216*06c3fb27SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 217*06c3fb27SDimitry Andric 218*06c3fb27SDimitry Andric private: 219*06c3fb27SDimitry Andric TargetMachine &TM; 220*06c3fb27SDimitry Andric ScanOptions ScanImpl; 221*06c3fb27SDimitry Andric }; 222*06c3fb27SDimitry Andric 2230b57cec5SDimitry Andric Pass *createAMDGPUStructurizeCFGPass(); 224bdd1243dSDimitry Andric FunctionPass *createAMDGPUISelDag(TargetMachine &TM, 225bdd1243dSDimitry Andric CodeGenOpt::Level OptLevel); 2260b57cec5SDimitry Andric ModulePass *createAMDGPUAlwaysInlinePass(bool GlobalOpt = true); 227e8d8bef9SDimitry Andric 228e8d8bef9SDimitry Andric struct AMDGPUAlwaysInlinePass : PassInfoMixin<AMDGPUAlwaysInlinePass> { 229e8d8bef9SDimitry Andric AMDGPUAlwaysInlinePass(bool GlobalOpt = true) : GlobalOpt(GlobalOpt) {} 230e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 231e8d8bef9SDimitry Andric 232e8d8bef9SDimitry Andric private: 233e8d8bef9SDimitry Andric bool GlobalOpt; 234e8d8bef9SDimitry Andric }; 235e8d8bef9SDimitry Andric 236*06c3fb27SDimitry Andric class AMDGPUCodeGenPreparePass 237*06c3fb27SDimitry Andric : public PassInfoMixin<AMDGPUCodeGenPreparePass> { 238*06c3fb27SDimitry Andric private: 239*06c3fb27SDimitry Andric TargetMachine &TM; 240*06c3fb27SDimitry Andric 241*06c3fb27SDimitry Andric public: 242*06c3fb27SDimitry Andric AMDGPUCodeGenPreparePass(TargetMachine &TM) : TM(TM){}; 243*06c3fb27SDimitry Andric PreservedAnalyses run(Function &, FunctionAnalysisManager &); 244*06c3fb27SDimitry Andric }; 245*06c3fb27SDimitry Andric 2460b57cec5SDimitry Andric FunctionPass *createAMDGPUAnnotateUniformValues(); 2470b57cec5SDimitry Andric 2488bcb0991SDimitry Andric ModulePass *createAMDGPUPrintfRuntimeBinding(); 2498bcb0991SDimitry Andric void initializeAMDGPUPrintfRuntimeBindingPass(PassRegistry&); 2508bcb0991SDimitry Andric extern char &AMDGPUPrintfRuntimeBindingID; 2518bcb0991SDimitry Andric 252fe6060f1SDimitry Andric void initializeAMDGPUResourceUsageAnalysisPass(PassRegistry &); 253fe6060f1SDimitry Andric extern char &AMDGPUResourceUsageAnalysisID; 254fe6060f1SDimitry Andric 255e8d8bef9SDimitry Andric struct AMDGPUPrintfRuntimeBindingPass 256e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPUPrintfRuntimeBindingPass> { 257e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 258e8d8bef9SDimitry Andric }; 259e8d8bef9SDimitry Andric 2600b57cec5SDimitry Andric ModulePass* createAMDGPUUnifyMetadataPass(); 2610b57cec5SDimitry Andric void initializeAMDGPUUnifyMetadataPass(PassRegistry&); 2620b57cec5SDimitry Andric extern char &AMDGPUUnifyMetadataID; 2630b57cec5SDimitry Andric 264e8d8bef9SDimitry Andric struct AMDGPUUnifyMetadataPass : PassInfoMixin<AMDGPUUnifyMetadataPass> { 265e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 266e8d8bef9SDimitry Andric }; 267e8d8bef9SDimitry Andric 2680b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPreRAPass(PassRegistry&); 2690b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingPreRAID; 2700b57cec5SDimitry Andric 271fe6060f1SDimitry Andric void initializeSIOptimizeVGPRLiveRangePass(PassRegistry &); 272fe6060f1SDimitry Andric extern char &SIOptimizeVGPRLiveRangeID; 273fe6060f1SDimitry Andric 2740b57cec5SDimitry Andric void initializeAMDGPUAnnotateUniformValuesPass(PassRegistry&); 2750b57cec5SDimitry Andric extern char &AMDGPUAnnotateUniformValuesPassID; 2760b57cec5SDimitry Andric 2770b57cec5SDimitry Andric void initializeAMDGPUCodeGenPreparePass(PassRegistry&); 2780b57cec5SDimitry Andric extern char &AMDGPUCodeGenPrepareID; 2790b57cec5SDimitry Andric 280*06c3fb27SDimitry Andric void initializeAMDGPURemoveIncompatibleFunctionsPass(PassRegistry &); 281*06c3fb27SDimitry Andric extern char &AMDGPURemoveIncompatibleFunctionsID; 282*06c3fb27SDimitry Andric 283e8d8bef9SDimitry Andric void initializeAMDGPULateCodeGenPreparePass(PassRegistry &); 284e8d8bef9SDimitry Andric extern char &AMDGPULateCodeGenPrepareID; 285e8d8bef9SDimitry Andric 286bdd1243dSDimitry Andric FunctionPass *createAMDGPURewriteUndefForPHIPass(); 287bdd1243dSDimitry Andric void initializeAMDGPURewriteUndefForPHIPass(PassRegistry &); 288bdd1243dSDimitry Andric extern char &AMDGPURewriteUndefForPHIPassID; 289bdd1243dSDimitry Andric 2900b57cec5SDimitry Andric void initializeSIAnnotateControlFlowPass(PassRegistry&); 2910b57cec5SDimitry Andric extern char &SIAnnotateControlFlowPassID; 2920b57cec5SDimitry Andric 2930b57cec5SDimitry Andric void initializeSIMemoryLegalizerPass(PassRegistry&); 2940b57cec5SDimitry Andric extern char &SIMemoryLegalizerID; 2950b57cec5SDimitry Andric 2960b57cec5SDimitry Andric void initializeSIModeRegisterPass(PassRegistry&); 2970b57cec5SDimitry Andric extern char &SIModeRegisterID; 2980b57cec5SDimitry Andric 29981ad6265SDimitry Andric void initializeAMDGPUInsertDelayAluPass(PassRegistry &); 30081ad6265SDimitry Andric extern char &AMDGPUInsertDelayAluID; 30181ad6265SDimitry Andric 3025ffd83dbSDimitry Andric void initializeSIInsertHardClausesPass(PassRegistry &); 3035ffd83dbSDimitry Andric extern char &SIInsertHardClausesID; 3045ffd83dbSDimitry Andric 3050b57cec5SDimitry Andric void initializeSIInsertWaitcntsPass(PassRegistry&); 3060b57cec5SDimitry Andric extern char &SIInsertWaitcntsID; 3070b57cec5SDimitry Andric 3080b57cec5SDimitry Andric void initializeSIFormMemoryClausesPass(PassRegistry&); 3090b57cec5SDimitry Andric extern char &SIFormMemoryClausesID; 3100b57cec5SDimitry Andric 3115ffd83dbSDimitry Andric void initializeSIPostRABundlerPass(PassRegistry&); 3125ffd83dbSDimitry Andric extern char &SIPostRABundlerID; 3135ffd83dbSDimitry Andric 314753f127fSDimitry Andric void initializeGCNCreateVOPDPass(PassRegistry &); 315753f127fSDimitry Andric extern char &GCNCreateVOPDID; 316753f127fSDimitry Andric 3170b57cec5SDimitry Andric void initializeAMDGPUUnifyDivergentExitNodesPass(PassRegistry&); 3180b57cec5SDimitry Andric extern char &AMDGPUUnifyDivergentExitNodesID; 3190b57cec5SDimitry Andric 3200b57cec5SDimitry Andric ImmutablePass *createAMDGPUAAWrapperPass(); 3210b57cec5SDimitry Andric void initializeAMDGPUAAWrapperPassPass(PassRegistry&); 3220b57cec5SDimitry Andric ImmutablePass *createAMDGPUExternalAAWrapperPass(); 3230b57cec5SDimitry Andric void initializeAMDGPUExternalAAWrapperPass(PassRegistry&); 3240b57cec5SDimitry Andric 3250b57cec5SDimitry Andric void initializeAMDGPUArgumentUsageInfoPass(PassRegistry &); 3260b57cec5SDimitry Andric 3270b57cec5SDimitry Andric ModulePass *createAMDGPUOpenCLEnqueuedBlockLoweringPass(); 3280b57cec5SDimitry Andric void initializeAMDGPUOpenCLEnqueuedBlockLoweringPass(PassRegistry &); 3290b57cec5SDimitry Andric extern char &AMDGPUOpenCLEnqueuedBlockLoweringID; 3300b57cec5SDimitry Andric 3310b57cec5SDimitry Andric void initializeGCNNSAReassignPass(PassRegistry &); 3320b57cec5SDimitry Andric extern char &GCNNSAReassignID; 3330b57cec5SDimitry Andric 334*06c3fb27SDimitry Andric void initializeGCNPreRALongBranchRegPass(PassRegistry &); 335*06c3fb27SDimitry Andric extern char &GCNPreRALongBranchRegID; 336*06c3fb27SDimitry Andric 337fe6060f1SDimitry Andric void initializeGCNPreRAOptimizationsPass(PassRegistry &); 338fe6060f1SDimitry Andric extern char &GCNPreRAOptimizationsID; 339fe6060f1SDimitry Andric 34081ad6265SDimitry Andric FunctionPass *createAMDGPUSetWavePriorityPass(); 34181ad6265SDimitry Andric void initializeAMDGPUSetWavePriorityPass(PassRegistry &); 34281ad6265SDimitry Andric 343*06c3fb27SDimitry Andric void initializeGCNRewritePartialRegUsesPass(llvm::PassRegistry &); 344*06c3fb27SDimitry Andric extern char &GCNRewritePartialRegUsesID; 345*06c3fb27SDimitry Andric 3460b57cec5SDimitry Andric namespace AMDGPU { 3470b57cec5SDimitry Andric enum TargetIndex { 3480b57cec5SDimitry Andric TI_CONSTDATA_START, 3490b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD0, 3500b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD1, 3510b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD2, 3520b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD3 3530b57cec5SDimitry Andric }; 3540b57cec5SDimitry Andric } 3550b57cec5SDimitry Andric 3560b57cec5SDimitry Andric /// OpenCL uses address spaces to differentiate between 3570b57cec5SDimitry Andric /// various memory regions on the hardware. On the CPU 3580b57cec5SDimitry Andric /// all of the address spaces point to the same memory, 3590b57cec5SDimitry Andric /// however on the GPU, each address space points to 3600b57cec5SDimitry Andric /// a separate piece of memory that is unique from other 3610b57cec5SDimitry Andric /// memory locations. 3620b57cec5SDimitry Andric namespace AMDGPUAS { 3630b57cec5SDimitry Andric enum : unsigned { 3640b57cec5SDimitry Andric // The maximum value for flat, generic, local, private, constant and region. 365*06c3fb27SDimitry Andric MAX_AMDGPU_ADDRESS = 8, 3660b57cec5SDimitry Andric 3670b57cec5SDimitry Andric FLAT_ADDRESS = 0, ///< Address space for flat memory. 3680b57cec5SDimitry Andric GLOBAL_ADDRESS = 1, ///< Address space for global memory (RAT0, VTX0). 3690b57cec5SDimitry Andric REGION_ADDRESS = 2, ///< Address space for region memory. (GDS) 3700b57cec5SDimitry Andric 3710b57cec5SDimitry Andric CONSTANT_ADDRESS = 4, ///< Address space for constant memory (VTX2). 3720b57cec5SDimitry Andric LOCAL_ADDRESS = 3, ///< Address space for local memory. 3730b57cec5SDimitry Andric PRIVATE_ADDRESS = 5, ///< Address space for private memory. 3740b57cec5SDimitry Andric 3750b57cec5SDimitry Andric CONSTANT_ADDRESS_32BIT = 6, ///< Address space for 32-bit constant memory. 3760b57cec5SDimitry Andric 3770b57cec5SDimitry Andric BUFFER_FAT_POINTER = 7, ///< Address space for 160-bit buffer fat pointers. 378*06c3fb27SDimitry Andric ///< Not used in backend. 379*06c3fb27SDimitry Andric 380*06c3fb27SDimitry Andric BUFFER_RESOURCE = 8, ///< Address space for 128-bit buffer resources. 381*06c3fb27SDimitry Andric 382*06c3fb27SDimitry Andric /// Internal address spaces. Can be freely renumbered. 383*06c3fb27SDimitry Andric STREAMOUT_REGISTER = 128, ///< Address space for GS NGG Streamout registers. 384*06c3fb27SDimitry Andric /// end Internal address spaces. 3850b57cec5SDimitry Andric 386349cc55cSDimitry Andric /// Address space for direct addressable parameter memory (CONST0). 3870b57cec5SDimitry Andric PARAM_D_ADDRESS = 6, 388349cc55cSDimitry Andric /// Address space for indirect addressable parameter memory (VTX1). 3890b57cec5SDimitry Andric PARAM_I_ADDRESS = 7, 3900b57cec5SDimitry Andric 3910b57cec5SDimitry Andric // Do not re-order the CONSTANT_BUFFER_* enums. Several places depend on 3920b57cec5SDimitry Andric // this order to be able to dynamically index a constant buffer, for 3930b57cec5SDimitry Andric // example: 3940b57cec5SDimitry Andric // 3950b57cec5SDimitry Andric // ConstantBufferAS = CONSTANT_BUFFER_0 + CBIdx 3960b57cec5SDimitry Andric 3970b57cec5SDimitry Andric CONSTANT_BUFFER_0 = 8, 3980b57cec5SDimitry Andric CONSTANT_BUFFER_1 = 9, 3990b57cec5SDimitry Andric CONSTANT_BUFFER_2 = 10, 4000b57cec5SDimitry Andric CONSTANT_BUFFER_3 = 11, 4010b57cec5SDimitry Andric CONSTANT_BUFFER_4 = 12, 4020b57cec5SDimitry Andric CONSTANT_BUFFER_5 = 13, 4030b57cec5SDimitry Andric CONSTANT_BUFFER_6 = 14, 4040b57cec5SDimitry Andric CONSTANT_BUFFER_7 = 15, 4050b57cec5SDimitry Andric CONSTANT_BUFFER_8 = 16, 4060b57cec5SDimitry Andric CONSTANT_BUFFER_9 = 17, 4070b57cec5SDimitry Andric CONSTANT_BUFFER_10 = 18, 4080b57cec5SDimitry Andric CONSTANT_BUFFER_11 = 19, 4090b57cec5SDimitry Andric CONSTANT_BUFFER_12 = 20, 4100b57cec5SDimitry Andric CONSTANT_BUFFER_13 = 21, 4110b57cec5SDimitry Andric CONSTANT_BUFFER_14 = 22, 4120b57cec5SDimitry Andric CONSTANT_BUFFER_15 = 23, 4130b57cec5SDimitry Andric 4140b57cec5SDimitry Andric // Some places use this if the address space can't be determined. 4150b57cec5SDimitry Andric UNKNOWN_ADDRESS_SPACE = ~0u, 4160b57cec5SDimitry Andric }; 4170b57cec5SDimitry Andric } 4180b57cec5SDimitry Andric 419e8d8bef9SDimitry Andric namespace AMDGPU { 420e8d8bef9SDimitry Andric 421e8d8bef9SDimitry Andric // FIXME: Missing constant_32bit 422e8d8bef9SDimitry Andric inline bool isFlatGlobalAddrSpace(unsigned AS) { 423e8d8bef9SDimitry Andric return AS == AMDGPUAS::GLOBAL_ADDRESS || 424e8d8bef9SDimitry Andric AS == AMDGPUAS::FLAT_ADDRESS || 425e8d8bef9SDimitry Andric AS == AMDGPUAS::CONSTANT_ADDRESS || 426e8d8bef9SDimitry Andric AS > AMDGPUAS::MAX_AMDGPU_ADDRESS; 427e8d8bef9SDimitry Andric } 428*06c3fb27SDimitry Andric 429*06c3fb27SDimitry Andric inline bool isExtendedGlobalAddrSpace(unsigned AS) { 430*06c3fb27SDimitry Andric return AS == AMDGPUAS::GLOBAL_ADDRESS || AS == AMDGPUAS::CONSTANT_ADDRESS || 431*06c3fb27SDimitry Andric AS == AMDGPUAS::CONSTANT_ADDRESS_32BIT || 432*06c3fb27SDimitry Andric AS > AMDGPUAS::MAX_AMDGPU_ADDRESS; 433*06c3fb27SDimitry Andric } 434*06c3fb27SDimitry Andric 435*06c3fb27SDimitry Andric static inline bool addrspacesMayAlias(unsigned AS1, unsigned AS2) { 436*06c3fb27SDimitry Andric static_assert(AMDGPUAS::MAX_AMDGPU_ADDRESS <= 8, "Addr space out of range"); 437*06c3fb27SDimitry Andric 438*06c3fb27SDimitry Andric if (AS1 > AMDGPUAS::MAX_AMDGPU_ADDRESS || AS2 > AMDGPUAS::MAX_AMDGPU_ADDRESS) 439*06c3fb27SDimitry Andric return true; 440*06c3fb27SDimitry Andric 441*06c3fb27SDimitry Andric // This array is indexed by address space value enum elements 0 ... to 8 442*06c3fb27SDimitry Andric // clang-format off 443*06c3fb27SDimitry Andric static const bool ASAliasRules[9][9] = { 444*06c3fb27SDimitry Andric /* Flat Global Region Group Constant Private Const32 BufFatPtr BufRsrc */ 445*06c3fb27SDimitry Andric /* Flat */ {true, true, false, true, true, true, true, true, true}, 446*06c3fb27SDimitry Andric /* Global */ {true, true, false, false, true, false, true, true, true}, 447*06c3fb27SDimitry Andric /* Region */ {false, false, true, false, false, false, false, false, false}, 448*06c3fb27SDimitry Andric /* Group */ {true, false, false, true, false, false, false, false, false}, 449*06c3fb27SDimitry Andric /* Constant */ {true, true, false, false, false, false, true, true, true}, 450*06c3fb27SDimitry Andric /* Private */ {true, false, false, false, false, true, false, false, false}, 451*06c3fb27SDimitry Andric /* Constant 32-bit */ {true, true, false, false, true, false, false, true, true}, 452*06c3fb27SDimitry Andric /* Buffer Fat Ptr */ {true, true, false, false, true, false, true, true, true}, 453*06c3fb27SDimitry Andric /* Buffer Resource */ {true, true, false, false, true, false, true, true, true}, 454*06c3fb27SDimitry Andric }; 455*06c3fb27SDimitry Andric // clang-format on 456*06c3fb27SDimitry Andric 457*06c3fb27SDimitry Andric return ASAliasRules[AS1][AS2]; 458*06c3fb27SDimitry Andric } 459*06c3fb27SDimitry Andric 460e8d8bef9SDimitry Andric } 461e8d8bef9SDimitry Andric 462e8d8bef9SDimitry Andric } // End namespace llvm 463e8d8bef9SDimitry Andric 4640b57cec5SDimitry Andric #endif 465