xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPU.h (revision 06c3fb2749bda94cb5201f81ffdb8fa6c3161b2e)
10b57cec5SDimitry Andric //===-- AMDGPU.h - MachineFunction passes hw codegen --------------*- C++ -*-=//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric /// \file
80b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
90b57cec5SDimitry Andric 
100b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPU_H
110b57cec5SDimitry Andric #define LLVM_LIB_TARGET_AMDGPU_AMDGPU_H
120b57cec5SDimitry Andric 
13e8d8bef9SDimitry Andric #include "llvm/IR/PassManager.h"
141fd87a68SDimitry Andric #include "llvm/Pass.h"
155ffd83dbSDimitry Andric #include "llvm/Support/CodeGen.h"
160b57cec5SDimitry Andric 
170b57cec5SDimitry Andric namespace llvm {
180b57cec5SDimitry Andric 
190b57cec5SDimitry Andric class TargetMachine;
200b57cec5SDimitry Andric 
215ffd83dbSDimitry Andric // GlobalISel passes
225ffd83dbSDimitry Andric void initializeAMDGPUPreLegalizerCombinerPass(PassRegistry &);
235ffd83dbSDimitry Andric FunctionPass *createAMDGPUPreLegalizeCombiner(bool IsOptNone);
245ffd83dbSDimitry Andric void initializeAMDGPUPostLegalizerCombinerPass(PassRegistry &);
255ffd83dbSDimitry Andric FunctionPass *createAMDGPUPostLegalizeCombiner(bool IsOptNone);
265ffd83dbSDimitry Andric FunctionPass *createAMDGPURegBankCombiner(bool IsOptNone);
275ffd83dbSDimitry Andric void initializeAMDGPURegBankCombinerPass(PassRegistry &);
285ffd83dbSDimitry Andric 
29*06c3fb27SDimitry Andric void initializeAMDGPURegBankSelectPass(PassRegistry &);
30*06c3fb27SDimitry Andric 
310b57cec5SDimitry Andric // SI Passes
320b57cec5SDimitry Andric FunctionPass *createGCNDPPCombinePass();
330b57cec5SDimitry Andric FunctionPass *createSIAnnotateControlFlowPass();
340b57cec5SDimitry Andric FunctionPass *createSIFoldOperandsPass();
350b57cec5SDimitry Andric FunctionPass *createSIPeepholeSDWAPass();
360b57cec5SDimitry Andric FunctionPass *createSILowerI1CopiesPass();
370b57cec5SDimitry Andric FunctionPass *createSIShrinkInstructionsPass();
380b57cec5SDimitry Andric FunctionPass *createSILoadStoreOptimizerPass();
390b57cec5SDimitry Andric FunctionPass *createSIWholeQuadModePass();
400b57cec5SDimitry Andric FunctionPass *createSIFixControlFlowLiveIntervalsPass();
410b57cec5SDimitry Andric FunctionPass *createSIOptimizeExecMaskingPreRAPass();
42fe6060f1SDimitry Andric FunctionPass *createSIOptimizeVGPRLiveRangePass();
430b57cec5SDimitry Andric FunctionPass *createSIFixSGPRCopiesPass();
44*06c3fb27SDimitry Andric FunctionPass *createLowerWWMCopiesPass();
450b57cec5SDimitry Andric FunctionPass *createSIMemoryLegalizerPass();
460b57cec5SDimitry Andric FunctionPass *createSIInsertWaitcntsPass();
470b57cec5SDimitry Andric FunctionPass *createSIPreAllocateWWMRegsPass();
480b57cec5SDimitry Andric FunctionPass *createSIFormMemoryClausesPass();
495ffd83dbSDimitry Andric 
505ffd83dbSDimitry Andric FunctionPass *createSIPostRABundlerPass();
515ffd83dbSDimitry Andric FunctionPass *createAMDGPUSimplifyLibCallsPass(const TargetMachine *);
520b57cec5SDimitry Andric FunctionPass *createAMDGPUUseNativeCallsPass();
53*06c3fb27SDimitry Andric ModulePass *createAMDGPURemoveIncompatibleFunctionsPass(const TargetMachine *);
540b57cec5SDimitry Andric FunctionPass *createAMDGPUCodeGenPreparePass();
55e8d8bef9SDimitry Andric FunctionPass *createAMDGPULateCodeGenPreparePass();
560b57cec5SDimitry Andric FunctionPass *createAMDGPUMachineCFGStructurizerPass();
570b57cec5SDimitry Andric FunctionPass *createAMDGPURewriteOutArgumentsPass();
58fe6060f1SDimitry Andric ModulePass *createAMDGPULowerModuleLDSPass();
590b57cec5SDimitry Andric FunctionPass *createSIModeRegisterPass();
60fe6060f1SDimitry Andric FunctionPass *createGCNPreRAOptimizationsPass();
610b57cec5SDimitry Andric 
62e8d8bef9SDimitry Andric struct AMDGPUSimplifyLibCallsPass : PassInfoMixin<AMDGPUSimplifyLibCallsPass> {
63e8d8bef9SDimitry Andric   AMDGPUSimplifyLibCallsPass(TargetMachine &TM) : TM(TM) {}
64e8d8bef9SDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
65e8d8bef9SDimitry Andric 
66e8d8bef9SDimitry Andric private:
67e8d8bef9SDimitry Andric   TargetMachine &TM;
68e8d8bef9SDimitry Andric };
69e8d8bef9SDimitry Andric 
70e8d8bef9SDimitry Andric struct AMDGPUUseNativeCallsPass : PassInfoMixin<AMDGPUUseNativeCallsPass> {
71e8d8bef9SDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
72e8d8bef9SDimitry Andric };
73e8d8bef9SDimitry Andric 
740b57cec5SDimitry Andric void initializeAMDGPUDAGToDAGISelPass(PassRegistry&);
750b57cec5SDimitry Andric 
760b57cec5SDimitry Andric void initializeAMDGPUMachineCFGStructurizerPass(PassRegistry&);
770b57cec5SDimitry Andric extern char &AMDGPUMachineCFGStructurizerID;
780b57cec5SDimitry Andric 
790b57cec5SDimitry Andric void initializeAMDGPUAlwaysInlinePass(PassRegistry&);
800b57cec5SDimitry Andric 
810b57cec5SDimitry Andric Pass *createAMDGPUAnnotateKernelFeaturesPass();
82fe6060f1SDimitry Andric Pass *createAMDGPUAttributorPass();
83fe6060f1SDimitry Andric void initializeAMDGPUAttributorPass(PassRegistry &);
840b57cec5SDimitry Andric void initializeAMDGPUAnnotateKernelFeaturesPass(PassRegistry &);
850b57cec5SDimitry Andric extern char &AMDGPUAnnotateKernelFeaturesID;
860b57cec5SDimitry Andric 
87*06c3fb27SDimitry Andric // DPP/Iterative option enables the atomic optimizer with given strategy
88*06c3fb27SDimitry Andric // whereas None disables the atomic optimizer.
89*06c3fb27SDimitry Andric enum class ScanOptions { DPP, Iterative, None };
90*06c3fb27SDimitry Andric FunctionPass *createAMDGPUAtomicOptimizerPass(ScanOptions ScanStrategy);
910b57cec5SDimitry Andric void initializeAMDGPUAtomicOptimizerPass(PassRegistry &);
920b57cec5SDimitry Andric extern char &AMDGPUAtomicOptimizerID;
930b57cec5SDimitry Andric 
94bdd1243dSDimitry Andric ModulePass *createAMDGPUCtorDtorLoweringLegacyPass();
95bdd1243dSDimitry Andric void initializeAMDGPUCtorDtorLoweringLegacyPass(PassRegistry &);
96bdd1243dSDimitry Andric extern char &AMDGPUCtorDtorLoweringLegacyPassID;
97349cc55cSDimitry Andric 
980b57cec5SDimitry Andric FunctionPass *createAMDGPULowerKernelArgumentsPass();
990b57cec5SDimitry Andric void initializeAMDGPULowerKernelArgumentsPass(PassRegistry &);
1000b57cec5SDimitry Andric extern char &AMDGPULowerKernelArgumentsID;
1010b57cec5SDimitry Andric 
102349cc55cSDimitry Andric FunctionPass *createAMDGPUPromoteKernelArgumentsPass();
103349cc55cSDimitry Andric void initializeAMDGPUPromoteKernelArgumentsPass(PassRegistry &);
104349cc55cSDimitry Andric extern char &AMDGPUPromoteKernelArgumentsID;
105349cc55cSDimitry Andric 
106349cc55cSDimitry Andric struct AMDGPUPromoteKernelArgumentsPass
107349cc55cSDimitry Andric     : PassInfoMixin<AMDGPUPromoteKernelArgumentsPass> {
108349cc55cSDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
109349cc55cSDimitry Andric };
110349cc55cSDimitry Andric 
1110b57cec5SDimitry Andric ModulePass *createAMDGPULowerKernelAttributesPass();
1120b57cec5SDimitry Andric void initializeAMDGPULowerKernelAttributesPass(PassRegistry &);
1130b57cec5SDimitry Andric extern char &AMDGPULowerKernelAttributesID;
1140b57cec5SDimitry Andric 
115e8d8bef9SDimitry Andric struct AMDGPULowerKernelAttributesPass
116e8d8bef9SDimitry Andric     : PassInfoMixin<AMDGPULowerKernelAttributesPass> {
117e8d8bef9SDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
118e8d8bef9SDimitry Andric };
119e8d8bef9SDimitry Andric 
120fe6060f1SDimitry Andric void initializeAMDGPULowerModuleLDSPass(PassRegistry &);
121fe6060f1SDimitry Andric extern char &AMDGPULowerModuleLDSID;
122fe6060f1SDimitry Andric 
123fe6060f1SDimitry Andric struct AMDGPULowerModuleLDSPass : PassInfoMixin<AMDGPULowerModuleLDSPass> {
124fe6060f1SDimitry Andric   PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM);
125fe6060f1SDimitry Andric };
126fe6060f1SDimitry Andric 
1270b57cec5SDimitry Andric void initializeAMDGPURewriteOutArgumentsPass(PassRegistry &);
1280b57cec5SDimitry Andric extern char &AMDGPURewriteOutArgumentsID;
1290b57cec5SDimitry Andric 
1300b57cec5SDimitry Andric void initializeGCNDPPCombinePass(PassRegistry &);
1310b57cec5SDimitry Andric extern char &GCNDPPCombineID;
1320b57cec5SDimitry Andric 
1330b57cec5SDimitry Andric void initializeSIFoldOperandsPass(PassRegistry &);
1340b57cec5SDimitry Andric extern char &SIFoldOperandsID;
1350b57cec5SDimitry Andric 
1360b57cec5SDimitry Andric void initializeSIPeepholeSDWAPass(PassRegistry &);
1370b57cec5SDimitry Andric extern char &SIPeepholeSDWAID;
1380b57cec5SDimitry Andric 
1390b57cec5SDimitry Andric void initializeSIShrinkInstructionsPass(PassRegistry&);
1400b57cec5SDimitry Andric extern char &SIShrinkInstructionsID;
1410b57cec5SDimitry Andric 
1420b57cec5SDimitry Andric void initializeSIFixSGPRCopiesPass(PassRegistry &);
1430b57cec5SDimitry Andric extern char &SIFixSGPRCopiesID;
1440b57cec5SDimitry Andric 
1450b57cec5SDimitry Andric void initializeSIFixVGPRCopiesPass(PassRegistry &);
1460b57cec5SDimitry Andric extern char &SIFixVGPRCopiesID;
1470b57cec5SDimitry Andric 
148*06c3fb27SDimitry Andric void initializeSILowerWWMCopiesPass(PassRegistry &);
149*06c3fb27SDimitry Andric extern char &SILowerWWMCopiesID;
150*06c3fb27SDimitry Andric 
1510b57cec5SDimitry Andric void initializeSILowerI1CopiesPass(PassRegistry &);
1520b57cec5SDimitry Andric extern char &SILowerI1CopiesID;
1530b57cec5SDimitry Andric 
1540b57cec5SDimitry Andric void initializeSILowerSGPRSpillsPass(PassRegistry &);
1550b57cec5SDimitry Andric extern char &SILowerSGPRSpillsID;
1560b57cec5SDimitry Andric 
1570b57cec5SDimitry Andric void initializeSILoadStoreOptimizerPass(PassRegistry &);
1580b57cec5SDimitry Andric extern char &SILoadStoreOptimizerID;
1590b57cec5SDimitry Andric 
1600b57cec5SDimitry Andric void initializeSIWholeQuadModePass(PassRegistry &);
1610b57cec5SDimitry Andric extern char &SIWholeQuadModeID;
1620b57cec5SDimitry Andric 
1630b57cec5SDimitry Andric void initializeSILowerControlFlowPass(PassRegistry &);
1640b57cec5SDimitry Andric extern char &SILowerControlFlowID;
1650b57cec5SDimitry Andric 
1665ffd83dbSDimitry Andric void initializeSIPreEmitPeepholePass(PassRegistry &);
1675ffd83dbSDimitry Andric extern char &SIPreEmitPeepholeID;
1685ffd83dbSDimitry Andric 
169fe6060f1SDimitry Andric void initializeSILateBranchLoweringPass(PassRegistry &);
170fe6060f1SDimitry Andric extern char &SILateBranchLoweringPassID;
1710b57cec5SDimitry Andric 
1720b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPass(PassRegistry &);
1730b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingID;
1740b57cec5SDimitry Andric 
1750b57cec5SDimitry Andric void initializeSIPreAllocateWWMRegsPass(PassRegistry &);
1760b57cec5SDimitry Andric extern char &SIPreAllocateWWMRegsID;
1770b57cec5SDimitry Andric 
1780b57cec5SDimitry Andric void initializeAMDGPUSimplifyLibCallsPass(PassRegistry &);
1790b57cec5SDimitry Andric extern char &AMDGPUSimplifyLibCallsID;
1800b57cec5SDimitry Andric 
1810b57cec5SDimitry Andric void initializeAMDGPUUseNativeCallsPass(PassRegistry &);
1820b57cec5SDimitry Andric extern char &AMDGPUUseNativeCallsID;
1830b57cec5SDimitry Andric 
1840b57cec5SDimitry Andric void initializeAMDGPUPerfHintAnalysisPass(PassRegistry &);
1850b57cec5SDimitry Andric extern char &AMDGPUPerfHintAnalysisID;
1860b57cec5SDimitry Andric 
1870b57cec5SDimitry Andric // Passes common to R600 and SI
1880b57cec5SDimitry Andric FunctionPass *createAMDGPUPromoteAlloca();
1890b57cec5SDimitry Andric void initializeAMDGPUPromoteAllocaPass(PassRegistry&);
1900b57cec5SDimitry Andric extern char &AMDGPUPromoteAllocaID;
1910b57cec5SDimitry Andric 
1925ffd83dbSDimitry Andric FunctionPass *createAMDGPUPromoteAllocaToVector();
1935ffd83dbSDimitry Andric void initializeAMDGPUPromoteAllocaToVectorPass(PassRegistry&);
1945ffd83dbSDimitry Andric extern char &AMDGPUPromoteAllocaToVectorID;
1955ffd83dbSDimitry Andric 
196e8d8bef9SDimitry Andric struct AMDGPUPromoteAllocaPass : PassInfoMixin<AMDGPUPromoteAllocaPass> {
197e8d8bef9SDimitry Andric   AMDGPUPromoteAllocaPass(TargetMachine &TM) : TM(TM) {}
198e8d8bef9SDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
199e8d8bef9SDimitry Andric 
200e8d8bef9SDimitry Andric private:
201e8d8bef9SDimitry Andric   TargetMachine &TM;
202e8d8bef9SDimitry Andric };
203e8d8bef9SDimitry Andric 
204e8d8bef9SDimitry Andric struct AMDGPUPromoteAllocaToVectorPass
205e8d8bef9SDimitry Andric     : PassInfoMixin<AMDGPUPromoteAllocaToVectorPass> {
206e8d8bef9SDimitry Andric   AMDGPUPromoteAllocaToVectorPass(TargetMachine &TM) : TM(TM) {}
207e8d8bef9SDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
208e8d8bef9SDimitry Andric 
209e8d8bef9SDimitry Andric private:
210e8d8bef9SDimitry Andric   TargetMachine &TM;
211e8d8bef9SDimitry Andric };
212e8d8bef9SDimitry Andric 
213*06c3fb27SDimitry Andric struct AMDGPUAtomicOptimizerPass : PassInfoMixin<AMDGPUAtomicOptimizerPass> {
214*06c3fb27SDimitry Andric   AMDGPUAtomicOptimizerPass(TargetMachine &TM, ScanOptions ScanImpl)
215*06c3fb27SDimitry Andric       : TM(TM), ScanImpl(ScanImpl) {}
216*06c3fb27SDimitry Andric   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
217*06c3fb27SDimitry Andric 
218*06c3fb27SDimitry Andric private:
219*06c3fb27SDimitry Andric   TargetMachine &TM;
220*06c3fb27SDimitry Andric   ScanOptions ScanImpl;
221*06c3fb27SDimitry Andric };
222*06c3fb27SDimitry Andric 
2230b57cec5SDimitry Andric Pass *createAMDGPUStructurizeCFGPass();
224bdd1243dSDimitry Andric FunctionPass *createAMDGPUISelDag(TargetMachine &TM,
225bdd1243dSDimitry Andric                                   CodeGenOpt::Level OptLevel);
2260b57cec5SDimitry Andric ModulePass *createAMDGPUAlwaysInlinePass(bool GlobalOpt = true);
227e8d8bef9SDimitry Andric 
228e8d8bef9SDimitry Andric struct AMDGPUAlwaysInlinePass : PassInfoMixin<AMDGPUAlwaysInlinePass> {
229e8d8bef9SDimitry Andric   AMDGPUAlwaysInlinePass(bool GlobalOpt = true) : GlobalOpt(GlobalOpt) {}
230e8d8bef9SDimitry Andric   PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM);
231e8d8bef9SDimitry Andric 
232e8d8bef9SDimitry Andric private:
233e8d8bef9SDimitry Andric   bool GlobalOpt;
234e8d8bef9SDimitry Andric };
235e8d8bef9SDimitry Andric 
236*06c3fb27SDimitry Andric class AMDGPUCodeGenPreparePass
237*06c3fb27SDimitry Andric     : public PassInfoMixin<AMDGPUCodeGenPreparePass> {
238*06c3fb27SDimitry Andric private:
239*06c3fb27SDimitry Andric   TargetMachine &TM;
240*06c3fb27SDimitry Andric 
241*06c3fb27SDimitry Andric public:
242*06c3fb27SDimitry Andric   AMDGPUCodeGenPreparePass(TargetMachine &TM) : TM(TM){};
243*06c3fb27SDimitry Andric   PreservedAnalyses run(Function &, FunctionAnalysisManager &);
244*06c3fb27SDimitry Andric };
245*06c3fb27SDimitry Andric 
2460b57cec5SDimitry Andric FunctionPass *createAMDGPUAnnotateUniformValues();
2470b57cec5SDimitry Andric 
2488bcb0991SDimitry Andric ModulePass *createAMDGPUPrintfRuntimeBinding();
2498bcb0991SDimitry Andric void initializeAMDGPUPrintfRuntimeBindingPass(PassRegistry&);
2508bcb0991SDimitry Andric extern char &AMDGPUPrintfRuntimeBindingID;
2518bcb0991SDimitry Andric 
252fe6060f1SDimitry Andric void initializeAMDGPUResourceUsageAnalysisPass(PassRegistry &);
253fe6060f1SDimitry Andric extern char &AMDGPUResourceUsageAnalysisID;
254fe6060f1SDimitry Andric 
255e8d8bef9SDimitry Andric struct AMDGPUPrintfRuntimeBindingPass
256e8d8bef9SDimitry Andric     : PassInfoMixin<AMDGPUPrintfRuntimeBindingPass> {
257e8d8bef9SDimitry Andric   PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM);
258e8d8bef9SDimitry Andric };
259e8d8bef9SDimitry Andric 
2600b57cec5SDimitry Andric ModulePass* createAMDGPUUnifyMetadataPass();
2610b57cec5SDimitry Andric void initializeAMDGPUUnifyMetadataPass(PassRegistry&);
2620b57cec5SDimitry Andric extern char &AMDGPUUnifyMetadataID;
2630b57cec5SDimitry Andric 
264e8d8bef9SDimitry Andric struct AMDGPUUnifyMetadataPass : PassInfoMixin<AMDGPUUnifyMetadataPass> {
265e8d8bef9SDimitry Andric   PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM);
266e8d8bef9SDimitry Andric };
267e8d8bef9SDimitry Andric 
2680b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPreRAPass(PassRegistry&);
2690b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingPreRAID;
2700b57cec5SDimitry Andric 
271fe6060f1SDimitry Andric void initializeSIOptimizeVGPRLiveRangePass(PassRegistry &);
272fe6060f1SDimitry Andric extern char &SIOptimizeVGPRLiveRangeID;
273fe6060f1SDimitry Andric 
2740b57cec5SDimitry Andric void initializeAMDGPUAnnotateUniformValuesPass(PassRegistry&);
2750b57cec5SDimitry Andric extern char &AMDGPUAnnotateUniformValuesPassID;
2760b57cec5SDimitry Andric 
2770b57cec5SDimitry Andric void initializeAMDGPUCodeGenPreparePass(PassRegistry&);
2780b57cec5SDimitry Andric extern char &AMDGPUCodeGenPrepareID;
2790b57cec5SDimitry Andric 
280*06c3fb27SDimitry Andric void initializeAMDGPURemoveIncompatibleFunctionsPass(PassRegistry &);
281*06c3fb27SDimitry Andric extern char &AMDGPURemoveIncompatibleFunctionsID;
282*06c3fb27SDimitry Andric 
283e8d8bef9SDimitry Andric void initializeAMDGPULateCodeGenPreparePass(PassRegistry &);
284e8d8bef9SDimitry Andric extern char &AMDGPULateCodeGenPrepareID;
285e8d8bef9SDimitry Andric 
286bdd1243dSDimitry Andric FunctionPass *createAMDGPURewriteUndefForPHIPass();
287bdd1243dSDimitry Andric void initializeAMDGPURewriteUndefForPHIPass(PassRegistry &);
288bdd1243dSDimitry Andric extern char &AMDGPURewriteUndefForPHIPassID;
289bdd1243dSDimitry Andric 
2900b57cec5SDimitry Andric void initializeSIAnnotateControlFlowPass(PassRegistry&);
2910b57cec5SDimitry Andric extern char &SIAnnotateControlFlowPassID;
2920b57cec5SDimitry Andric 
2930b57cec5SDimitry Andric void initializeSIMemoryLegalizerPass(PassRegistry&);
2940b57cec5SDimitry Andric extern char &SIMemoryLegalizerID;
2950b57cec5SDimitry Andric 
2960b57cec5SDimitry Andric void initializeSIModeRegisterPass(PassRegistry&);
2970b57cec5SDimitry Andric extern char &SIModeRegisterID;
2980b57cec5SDimitry Andric 
29981ad6265SDimitry Andric void initializeAMDGPUInsertDelayAluPass(PassRegistry &);
30081ad6265SDimitry Andric extern char &AMDGPUInsertDelayAluID;
30181ad6265SDimitry Andric 
3025ffd83dbSDimitry Andric void initializeSIInsertHardClausesPass(PassRegistry &);
3035ffd83dbSDimitry Andric extern char &SIInsertHardClausesID;
3045ffd83dbSDimitry Andric 
3050b57cec5SDimitry Andric void initializeSIInsertWaitcntsPass(PassRegistry&);
3060b57cec5SDimitry Andric extern char &SIInsertWaitcntsID;
3070b57cec5SDimitry Andric 
3080b57cec5SDimitry Andric void initializeSIFormMemoryClausesPass(PassRegistry&);
3090b57cec5SDimitry Andric extern char &SIFormMemoryClausesID;
3100b57cec5SDimitry Andric 
3115ffd83dbSDimitry Andric void initializeSIPostRABundlerPass(PassRegistry&);
3125ffd83dbSDimitry Andric extern char &SIPostRABundlerID;
3135ffd83dbSDimitry Andric 
314753f127fSDimitry Andric void initializeGCNCreateVOPDPass(PassRegistry &);
315753f127fSDimitry Andric extern char &GCNCreateVOPDID;
316753f127fSDimitry Andric 
3170b57cec5SDimitry Andric void initializeAMDGPUUnifyDivergentExitNodesPass(PassRegistry&);
3180b57cec5SDimitry Andric extern char &AMDGPUUnifyDivergentExitNodesID;
3190b57cec5SDimitry Andric 
3200b57cec5SDimitry Andric ImmutablePass *createAMDGPUAAWrapperPass();
3210b57cec5SDimitry Andric void initializeAMDGPUAAWrapperPassPass(PassRegistry&);
3220b57cec5SDimitry Andric ImmutablePass *createAMDGPUExternalAAWrapperPass();
3230b57cec5SDimitry Andric void initializeAMDGPUExternalAAWrapperPass(PassRegistry&);
3240b57cec5SDimitry Andric 
3250b57cec5SDimitry Andric void initializeAMDGPUArgumentUsageInfoPass(PassRegistry &);
3260b57cec5SDimitry Andric 
3270b57cec5SDimitry Andric ModulePass *createAMDGPUOpenCLEnqueuedBlockLoweringPass();
3280b57cec5SDimitry Andric void initializeAMDGPUOpenCLEnqueuedBlockLoweringPass(PassRegistry &);
3290b57cec5SDimitry Andric extern char &AMDGPUOpenCLEnqueuedBlockLoweringID;
3300b57cec5SDimitry Andric 
3310b57cec5SDimitry Andric void initializeGCNNSAReassignPass(PassRegistry &);
3320b57cec5SDimitry Andric extern char &GCNNSAReassignID;
3330b57cec5SDimitry Andric 
334*06c3fb27SDimitry Andric void initializeGCNPreRALongBranchRegPass(PassRegistry &);
335*06c3fb27SDimitry Andric extern char &GCNPreRALongBranchRegID;
336*06c3fb27SDimitry Andric 
337fe6060f1SDimitry Andric void initializeGCNPreRAOptimizationsPass(PassRegistry &);
338fe6060f1SDimitry Andric extern char &GCNPreRAOptimizationsID;
339fe6060f1SDimitry Andric 
34081ad6265SDimitry Andric FunctionPass *createAMDGPUSetWavePriorityPass();
34181ad6265SDimitry Andric void initializeAMDGPUSetWavePriorityPass(PassRegistry &);
34281ad6265SDimitry Andric 
343*06c3fb27SDimitry Andric void initializeGCNRewritePartialRegUsesPass(llvm::PassRegistry &);
344*06c3fb27SDimitry Andric extern char &GCNRewritePartialRegUsesID;
345*06c3fb27SDimitry Andric 
3460b57cec5SDimitry Andric namespace AMDGPU {
3470b57cec5SDimitry Andric enum TargetIndex {
3480b57cec5SDimitry Andric   TI_CONSTDATA_START,
3490b57cec5SDimitry Andric   TI_SCRATCH_RSRC_DWORD0,
3500b57cec5SDimitry Andric   TI_SCRATCH_RSRC_DWORD1,
3510b57cec5SDimitry Andric   TI_SCRATCH_RSRC_DWORD2,
3520b57cec5SDimitry Andric   TI_SCRATCH_RSRC_DWORD3
3530b57cec5SDimitry Andric };
3540b57cec5SDimitry Andric }
3550b57cec5SDimitry Andric 
3560b57cec5SDimitry Andric /// OpenCL uses address spaces to differentiate between
3570b57cec5SDimitry Andric /// various memory regions on the hardware. On the CPU
3580b57cec5SDimitry Andric /// all of the address spaces point to the same memory,
3590b57cec5SDimitry Andric /// however on the GPU, each address space points to
3600b57cec5SDimitry Andric /// a separate piece of memory that is unique from other
3610b57cec5SDimitry Andric /// memory locations.
3620b57cec5SDimitry Andric namespace AMDGPUAS {
3630b57cec5SDimitry Andric enum : unsigned {
3640b57cec5SDimitry Andric   // The maximum value for flat, generic, local, private, constant and region.
365*06c3fb27SDimitry Andric   MAX_AMDGPU_ADDRESS = 8,
3660b57cec5SDimitry Andric 
3670b57cec5SDimitry Andric   FLAT_ADDRESS = 0,   ///< Address space for flat memory.
3680b57cec5SDimitry Andric   GLOBAL_ADDRESS = 1, ///< Address space for global memory (RAT0, VTX0).
3690b57cec5SDimitry Andric   REGION_ADDRESS = 2, ///< Address space for region memory. (GDS)
3700b57cec5SDimitry Andric 
3710b57cec5SDimitry Andric   CONSTANT_ADDRESS = 4, ///< Address space for constant memory (VTX2).
3720b57cec5SDimitry Andric   LOCAL_ADDRESS = 3,    ///< Address space for local memory.
3730b57cec5SDimitry Andric   PRIVATE_ADDRESS = 5,  ///< Address space for private memory.
3740b57cec5SDimitry Andric 
3750b57cec5SDimitry Andric   CONSTANT_ADDRESS_32BIT = 6, ///< Address space for 32-bit constant memory.
3760b57cec5SDimitry Andric 
3770b57cec5SDimitry Andric   BUFFER_FAT_POINTER = 7, ///< Address space for 160-bit buffer fat pointers.
378*06c3fb27SDimitry Andric                           ///< Not used in backend.
379*06c3fb27SDimitry Andric 
380*06c3fb27SDimitry Andric   BUFFER_RESOURCE = 8, ///< Address space for 128-bit buffer resources.
381*06c3fb27SDimitry Andric 
382*06c3fb27SDimitry Andric   /// Internal address spaces. Can be freely renumbered.
383*06c3fb27SDimitry Andric   STREAMOUT_REGISTER = 128, ///< Address space for GS NGG Streamout registers.
384*06c3fb27SDimitry Andric   /// end Internal address spaces.
3850b57cec5SDimitry Andric 
386349cc55cSDimitry Andric   /// Address space for direct addressable parameter memory (CONST0).
3870b57cec5SDimitry Andric   PARAM_D_ADDRESS = 6,
388349cc55cSDimitry Andric   /// Address space for indirect addressable parameter memory (VTX1).
3890b57cec5SDimitry Andric   PARAM_I_ADDRESS = 7,
3900b57cec5SDimitry Andric 
3910b57cec5SDimitry Andric   // Do not re-order the CONSTANT_BUFFER_* enums.  Several places depend on
3920b57cec5SDimitry Andric   // this order to be able to dynamically index a constant buffer, for
3930b57cec5SDimitry Andric   // example:
3940b57cec5SDimitry Andric   //
3950b57cec5SDimitry Andric   // ConstantBufferAS = CONSTANT_BUFFER_0 + CBIdx
3960b57cec5SDimitry Andric 
3970b57cec5SDimitry Andric   CONSTANT_BUFFER_0 = 8,
3980b57cec5SDimitry Andric   CONSTANT_BUFFER_1 = 9,
3990b57cec5SDimitry Andric   CONSTANT_BUFFER_2 = 10,
4000b57cec5SDimitry Andric   CONSTANT_BUFFER_3 = 11,
4010b57cec5SDimitry Andric   CONSTANT_BUFFER_4 = 12,
4020b57cec5SDimitry Andric   CONSTANT_BUFFER_5 = 13,
4030b57cec5SDimitry Andric   CONSTANT_BUFFER_6 = 14,
4040b57cec5SDimitry Andric   CONSTANT_BUFFER_7 = 15,
4050b57cec5SDimitry Andric   CONSTANT_BUFFER_8 = 16,
4060b57cec5SDimitry Andric   CONSTANT_BUFFER_9 = 17,
4070b57cec5SDimitry Andric   CONSTANT_BUFFER_10 = 18,
4080b57cec5SDimitry Andric   CONSTANT_BUFFER_11 = 19,
4090b57cec5SDimitry Andric   CONSTANT_BUFFER_12 = 20,
4100b57cec5SDimitry Andric   CONSTANT_BUFFER_13 = 21,
4110b57cec5SDimitry Andric   CONSTANT_BUFFER_14 = 22,
4120b57cec5SDimitry Andric   CONSTANT_BUFFER_15 = 23,
4130b57cec5SDimitry Andric 
4140b57cec5SDimitry Andric   // Some places use this if the address space can't be determined.
4150b57cec5SDimitry Andric   UNKNOWN_ADDRESS_SPACE = ~0u,
4160b57cec5SDimitry Andric };
4170b57cec5SDimitry Andric }
4180b57cec5SDimitry Andric 
419e8d8bef9SDimitry Andric namespace AMDGPU {
420e8d8bef9SDimitry Andric 
421e8d8bef9SDimitry Andric // FIXME: Missing constant_32bit
422e8d8bef9SDimitry Andric inline bool isFlatGlobalAddrSpace(unsigned AS) {
423e8d8bef9SDimitry Andric   return AS == AMDGPUAS::GLOBAL_ADDRESS ||
424e8d8bef9SDimitry Andric          AS == AMDGPUAS::FLAT_ADDRESS ||
425e8d8bef9SDimitry Andric          AS == AMDGPUAS::CONSTANT_ADDRESS ||
426e8d8bef9SDimitry Andric          AS > AMDGPUAS::MAX_AMDGPU_ADDRESS;
427e8d8bef9SDimitry Andric }
428*06c3fb27SDimitry Andric 
429*06c3fb27SDimitry Andric inline bool isExtendedGlobalAddrSpace(unsigned AS) {
430*06c3fb27SDimitry Andric   return AS == AMDGPUAS::GLOBAL_ADDRESS || AS == AMDGPUAS::CONSTANT_ADDRESS ||
431*06c3fb27SDimitry Andric          AS == AMDGPUAS::CONSTANT_ADDRESS_32BIT ||
432*06c3fb27SDimitry Andric          AS > AMDGPUAS::MAX_AMDGPU_ADDRESS;
433*06c3fb27SDimitry Andric }
434*06c3fb27SDimitry Andric 
435*06c3fb27SDimitry Andric static inline bool addrspacesMayAlias(unsigned AS1, unsigned AS2) {
436*06c3fb27SDimitry Andric   static_assert(AMDGPUAS::MAX_AMDGPU_ADDRESS <= 8, "Addr space out of range");
437*06c3fb27SDimitry Andric 
438*06c3fb27SDimitry Andric   if (AS1 > AMDGPUAS::MAX_AMDGPU_ADDRESS || AS2 > AMDGPUAS::MAX_AMDGPU_ADDRESS)
439*06c3fb27SDimitry Andric     return true;
440*06c3fb27SDimitry Andric 
441*06c3fb27SDimitry Andric   // This array is indexed by address space value enum elements 0 ... to 8
442*06c3fb27SDimitry Andric   // clang-format off
443*06c3fb27SDimitry Andric   static const bool ASAliasRules[9][9] = {
444*06c3fb27SDimitry Andric     /*                   Flat   Global Region  Group Constant Private Const32 BufFatPtr BufRsrc */
445*06c3fb27SDimitry Andric     /* Flat     */        {true,  true,  false, true,  true,  true,  true,  true,  true},
446*06c3fb27SDimitry Andric     /* Global   */        {true,  true,  false, false, true,  false, true,  true,  true},
447*06c3fb27SDimitry Andric     /* Region   */        {false, false, true,  false, false, false, false, false, false},
448*06c3fb27SDimitry Andric     /* Group    */        {true,  false, false, true,  false, false, false, false, false},
449*06c3fb27SDimitry Andric     /* Constant */        {true,  true,  false, false, false, false, true,  true,  true},
450*06c3fb27SDimitry Andric     /* Private  */        {true,  false, false, false, false, true,  false, false, false},
451*06c3fb27SDimitry Andric     /* Constant 32-bit */ {true,  true,  false, false, true,  false, false, true,  true},
452*06c3fb27SDimitry Andric     /* Buffer Fat Ptr  */ {true,  true,  false, false, true,  false, true,  true,  true},
453*06c3fb27SDimitry Andric     /* Buffer Resource */ {true,  true,  false, false, true,  false, true,  true,  true},
454*06c3fb27SDimitry Andric   };
455*06c3fb27SDimitry Andric   // clang-format on
456*06c3fb27SDimitry Andric 
457*06c3fb27SDimitry Andric   return ASAliasRules[AS1][AS2];
458*06c3fb27SDimitry Andric }
459*06c3fb27SDimitry Andric 
460e8d8bef9SDimitry Andric }
461e8d8bef9SDimitry Andric 
462e8d8bef9SDimitry Andric } // End namespace llvm
463e8d8bef9SDimitry Andric 
4640b57cec5SDimitry Andric #endif
465