10b57cec5SDimitry Andric //===-- AMDGPU.h - MachineFunction passes hw codegen --------------*- C++ -*-=// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric /// \file 80b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 90b57cec5SDimitry Andric 100b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPU_H 110b57cec5SDimitry Andric #define LLVM_LIB_TARGET_AMDGPU_AMDGPU_H 120b57cec5SDimitry Andric 13*e8d8bef9SDimitry Andric #include "llvm/IR/PassManager.h" 145ffd83dbSDimitry Andric #include "llvm/Support/CodeGen.h" 150b57cec5SDimitry Andric 160b57cec5SDimitry Andric namespace llvm { 170b57cec5SDimitry Andric 180b57cec5SDimitry Andric class AMDGPUTargetMachine; 190b57cec5SDimitry Andric class FunctionPass; 200b57cec5SDimitry Andric class GCNTargetMachine; 215ffd83dbSDimitry Andric class ImmutablePass; 220b57cec5SDimitry Andric class ModulePass; 230b57cec5SDimitry Andric class Pass; 240b57cec5SDimitry Andric class Target; 250b57cec5SDimitry Andric class TargetMachine; 260b57cec5SDimitry Andric class TargetOptions; 270b57cec5SDimitry Andric class PassRegistry; 280b57cec5SDimitry Andric class Module; 290b57cec5SDimitry Andric 305ffd83dbSDimitry Andric // GlobalISel passes 315ffd83dbSDimitry Andric void initializeAMDGPUPreLegalizerCombinerPass(PassRegistry &); 325ffd83dbSDimitry Andric FunctionPass *createAMDGPUPreLegalizeCombiner(bool IsOptNone); 335ffd83dbSDimitry Andric void initializeAMDGPUPostLegalizerCombinerPass(PassRegistry &); 345ffd83dbSDimitry Andric FunctionPass *createAMDGPUPostLegalizeCombiner(bool IsOptNone); 355ffd83dbSDimitry Andric FunctionPass *createAMDGPURegBankCombiner(bool IsOptNone); 365ffd83dbSDimitry Andric void initializeAMDGPURegBankCombinerPass(PassRegistry &); 375ffd83dbSDimitry Andric 380b57cec5SDimitry Andric // R600 Passes 390b57cec5SDimitry Andric FunctionPass *createR600VectorRegMerger(); 400b57cec5SDimitry Andric FunctionPass *createR600ExpandSpecialInstrsPass(); 410b57cec5SDimitry Andric FunctionPass *createR600EmitClauseMarkers(); 420b57cec5SDimitry Andric FunctionPass *createR600ClauseMergePass(); 430b57cec5SDimitry Andric FunctionPass *createR600Packetizer(); 440b57cec5SDimitry Andric FunctionPass *createR600ControlFlowFinalizer(); 450b57cec5SDimitry Andric FunctionPass *createAMDGPUCFGStructurizerPass(); 460b57cec5SDimitry Andric FunctionPass *createR600ISelDag(TargetMachine *TM, CodeGenOpt::Level OptLevel); 470b57cec5SDimitry Andric 480b57cec5SDimitry Andric // SI Passes 490b57cec5SDimitry Andric FunctionPass *createGCNDPPCombinePass(); 500b57cec5SDimitry Andric FunctionPass *createSIAnnotateControlFlowPass(); 510b57cec5SDimitry Andric FunctionPass *createSIFoldOperandsPass(); 520b57cec5SDimitry Andric FunctionPass *createSIPeepholeSDWAPass(); 530b57cec5SDimitry Andric FunctionPass *createSILowerI1CopiesPass(); 540b57cec5SDimitry Andric FunctionPass *createSIAddIMGInitPass(); 550b57cec5SDimitry Andric FunctionPass *createSIShrinkInstructionsPass(); 560b57cec5SDimitry Andric FunctionPass *createSILoadStoreOptimizerPass(); 570b57cec5SDimitry Andric FunctionPass *createSIWholeQuadModePass(); 580b57cec5SDimitry Andric FunctionPass *createSIFixControlFlowLiveIntervalsPass(); 590b57cec5SDimitry Andric FunctionPass *createSIOptimizeExecMaskingPreRAPass(); 600b57cec5SDimitry Andric FunctionPass *createSIFixSGPRCopiesPass(); 610b57cec5SDimitry Andric FunctionPass *createSIMemoryLegalizerPass(); 620b57cec5SDimitry Andric FunctionPass *createSIInsertWaitcntsPass(); 630b57cec5SDimitry Andric FunctionPass *createSIPreAllocateWWMRegsPass(); 640b57cec5SDimitry Andric FunctionPass *createSIFormMemoryClausesPass(); 655ffd83dbSDimitry Andric 665ffd83dbSDimitry Andric FunctionPass *createSIPostRABundlerPass(); 675ffd83dbSDimitry Andric FunctionPass *createAMDGPUSimplifyLibCallsPass(const TargetMachine *); 680b57cec5SDimitry Andric FunctionPass *createAMDGPUUseNativeCallsPass(); 690b57cec5SDimitry Andric FunctionPass *createAMDGPUCodeGenPreparePass(); 70*e8d8bef9SDimitry Andric FunctionPass *createAMDGPULateCodeGenPreparePass(); 710b57cec5SDimitry Andric FunctionPass *createAMDGPUMachineCFGStructurizerPass(); 720b57cec5SDimitry Andric FunctionPass *createAMDGPUPropagateAttributesEarlyPass(const TargetMachine *); 730b57cec5SDimitry Andric ModulePass *createAMDGPUPropagateAttributesLatePass(const TargetMachine *); 740b57cec5SDimitry Andric FunctionPass *createAMDGPURewriteOutArgumentsPass(); 750b57cec5SDimitry Andric FunctionPass *createSIModeRegisterPass(); 760b57cec5SDimitry Andric 77*e8d8bef9SDimitry Andric struct AMDGPUSimplifyLibCallsPass : PassInfoMixin<AMDGPUSimplifyLibCallsPass> { 78*e8d8bef9SDimitry Andric AMDGPUSimplifyLibCallsPass(TargetMachine &TM) : TM(TM) {} 79*e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 80*e8d8bef9SDimitry Andric 81*e8d8bef9SDimitry Andric private: 82*e8d8bef9SDimitry Andric TargetMachine &TM; 83*e8d8bef9SDimitry Andric }; 84*e8d8bef9SDimitry Andric 85*e8d8bef9SDimitry Andric struct AMDGPUUseNativeCallsPass : PassInfoMixin<AMDGPUUseNativeCallsPass> { 86*e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 87*e8d8bef9SDimitry Andric }; 88*e8d8bef9SDimitry Andric 890b57cec5SDimitry Andric void initializeAMDGPUDAGToDAGISelPass(PassRegistry&); 900b57cec5SDimitry Andric 910b57cec5SDimitry Andric void initializeAMDGPUMachineCFGStructurizerPass(PassRegistry&); 920b57cec5SDimitry Andric extern char &AMDGPUMachineCFGStructurizerID; 930b57cec5SDimitry Andric 940b57cec5SDimitry Andric void initializeAMDGPUAlwaysInlinePass(PassRegistry&); 950b57cec5SDimitry Andric 960b57cec5SDimitry Andric Pass *createAMDGPUAnnotateKernelFeaturesPass(); 970b57cec5SDimitry Andric void initializeAMDGPUAnnotateKernelFeaturesPass(PassRegistry &); 980b57cec5SDimitry Andric extern char &AMDGPUAnnotateKernelFeaturesID; 990b57cec5SDimitry Andric 1000b57cec5SDimitry Andric FunctionPass *createAMDGPUAtomicOptimizerPass(); 1010b57cec5SDimitry Andric void initializeAMDGPUAtomicOptimizerPass(PassRegistry &); 1020b57cec5SDimitry Andric extern char &AMDGPUAtomicOptimizerID; 1030b57cec5SDimitry Andric 1040b57cec5SDimitry Andric ModulePass *createAMDGPULowerIntrinsicsPass(); 1050b57cec5SDimitry Andric void initializeAMDGPULowerIntrinsicsPass(PassRegistry &); 1060b57cec5SDimitry Andric extern char &AMDGPULowerIntrinsicsID; 1070b57cec5SDimitry Andric 1080b57cec5SDimitry Andric ModulePass *createAMDGPUFixFunctionBitcastsPass(); 1090b57cec5SDimitry Andric void initializeAMDGPUFixFunctionBitcastsPass(PassRegistry &); 1100b57cec5SDimitry Andric extern char &AMDGPUFixFunctionBitcastsID; 1110b57cec5SDimitry Andric 1120b57cec5SDimitry Andric FunctionPass *createAMDGPULowerKernelArgumentsPass(); 1130b57cec5SDimitry Andric void initializeAMDGPULowerKernelArgumentsPass(PassRegistry &); 1140b57cec5SDimitry Andric extern char &AMDGPULowerKernelArgumentsID; 1150b57cec5SDimitry Andric 1160b57cec5SDimitry Andric ModulePass *createAMDGPULowerKernelAttributesPass(); 1170b57cec5SDimitry Andric void initializeAMDGPULowerKernelAttributesPass(PassRegistry &); 1180b57cec5SDimitry Andric extern char &AMDGPULowerKernelAttributesID; 1190b57cec5SDimitry Andric 120*e8d8bef9SDimitry Andric struct AMDGPULowerKernelAttributesPass 121*e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPULowerKernelAttributesPass> { 122*e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 123*e8d8bef9SDimitry Andric }; 124*e8d8bef9SDimitry Andric 1250b57cec5SDimitry Andric void initializeAMDGPUPropagateAttributesEarlyPass(PassRegistry &); 1260b57cec5SDimitry Andric extern char &AMDGPUPropagateAttributesEarlyID; 1270b57cec5SDimitry Andric 128*e8d8bef9SDimitry Andric struct AMDGPUPropagateAttributesEarlyPass 129*e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPUPropagateAttributesEarlyPass> { 130*e8d8bef9SDimitry Andric AMDGPUPropagateAttributesEarlyPass(TargetMachine &TM) : TM(TM) {} 131*e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 132*e8d8bef9SDimitry Andric 133*e8d8bef9SDimitry Andric private: 134*e8d8bef9SDimitry Andric TargetMachine &TM; 135*e8d8bef9SDimitry Andric }; 136*e8d8bef9SDimitry Andric 1370b57cec5SDimitry Andric void initializeAMDGPUPropagateAttributesLatePass(PassRegistry &); 1380b57cec5SDimitry Andric extern char &AMDGPUPropagateAttributesLateID; 1390b57cec5SDimitry Andric 140*e8d8bef9SDimitry Andric struct AMDGPUPropagateAttributesLatePass 141*e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPUPropagateAttributesLatePass> { 142*e8d8bef9SDimitry Andric AMDGPUPropagateAttributesLatePass(TargetMachine &TM) : TM(TM) {} 143*e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 144*e8d8bef9SDimitry Andric 145*e8d8bef9SDimitry Andric private: 146*e8d8bef9SDimitry Andric TargetMachine &TM; 147*e8d8bef9SDimitry Andric }; 148*e8d8bef9SDimitry Andric 1490b57cec5SDimitry Andric void initializeAMDGPURewriteOutArgumentsPass(PassRegistry &); 1500b57cec5SDimitry Andric extern char &AMDGPURewriteOutArgumentsID; 1510b57cec5SDimitry Andric 1520b57cec5SDimitry Andric void initializeGCNDPPCombinePass(PassRegistry &); 1530b57cec5SDimitry Andric extern char &GCNDPPCombineID; 1540b57cec5SDimitry Andric 1550b57cec5SDimitry Andric void initializeR600ClauseMergePassPass(PassRegistry &); 1560b57cec5SDimitry Andric extern char &R600ClauseMergePassID; 1570b57cec5SDimitry Andric 1580b57cec5SDimitry Andric void initializeR600ControlFlowFinalizerPass(PassRegistry &); 1590b57cec5SDimitry Andric extern char &R600ControlFlowFinalizerID; 1600b57cec5SDimitry Andric 1610b57cec5SDimitry Andric void initializeR600ExpandSpecialInstrsPassPass(PassRegistry &); 1620b57cec5SDimitry Andric extern char &R600ExpandSpecialInstrsPassID; 1630b57cec5SDimitry Andric 1640b57cec5SDimitry Andric void initializeR600VectorRegMergerPass(PassRegistry &); 1650b57cec5SDimitry Andric extern char &R600VectorRegMergerID; 1660b57cec5SDimitry Andric 1670b57cec5SDimitry Andric void initializeR600PacketizerPass(PassRegistry &); 1680b57cec5SDimitry Andric extern char &R600PacketizerID; 1690b57cec5SDimitry Andric 1700b57cec5SDimitry Andric void initializeSIFoldOperandsPass(PassRegistry &); 1710b57cec5SDimitry Andric extern char &SIFoldOperandsID; 1720b57cec5SDimitry Andric 1730b57cec5SDimitry Andric void initializeSIPeepholeSDWAPass(PassRegistry &); 1740b57cec5SDimitry Andric extern char &SIPeepholeSDWAID; 1750b57cec5SDimitry Andric 1760b57cec5SDimitry Andric void initializeSIShrinkInstructionsPass(PassRegistry&); 1770b57cec5SDimitry Andric extern char &SIShrinkInstructionsID; 1780b57cec5SDimitry Andric 1790b57cec5SDimitry Andric void initializeSIFixSGPRCopiesPass(PassRegistry &); 1800b57cec5SDimitry Andric extern char &SIFixSGPRCopiesID; 1810b57cec5SDimitry Andric 1820b57cec5SDimitry Andric void initializeSIFixVGPRCopiesPass(PassRegistry &); 1830b57cec5SDimitry Andric extern char &SIFixVGPRCopiesID; 1840b57cec5SDimitry Andric 1850b57cec5SDimitry Andric void initializeSILowerI1CopiesPass(PassRegistry &); 1860b57cec5SDimitry Andric extern char &SILowerI1CopiesID; 1870b57cec5SDimitry Andric 1880b57cec5SDimitry Andric void initializeSILowerSGPRSpillsPass(PassRegistry &); 1890b57cec5SDimitry Andric extern char &SILowerSGPRSpillsID; 1900b57cec5SDimitry Andric 1910b57cec5SDimitry Andric void initializeSILoadStoreOptimizerPass(PassRegistry &); 1920b57cec5SDimitry Andric extern char &SILoadStoreOptimizerID; 1930b57cec5SDimitry Andric 1940b57cec5SDimitry Andric void initializeSIWholeQuadModePass(PassRegistry &); 1950b57cec5SDimitry Andric extern char &SIWholeQuadModeID; 1960b57cec5SDimitry Andric 1970b57cec5SDimitry Andric void initializeSILowerControlFlowPass(PassRegistry &); 1980b57cec5SDimitry Andric extern char &SILowerControlFlowID; 1990b57cec5SDimitry Andric 2005ffd83dbSDimitry Andric void initializeSIRemoveShortExecBranchesPass(PassRegistry &); 2015ffd83dbSDimitry Andric extern char &SIRemoveShortExecBranchesID; 2025ffd83dbSDimitry Andric 2035ffd83dbSDimitry Andric void initializeSIPreEmitPeepholePass(PassRegistry &); 2045ffd83dbSDimitry Andric extern char &SIPreEmitPeepholeID; 2055ffd83dbSDimitry Andric 2060b57cec5SDimitry Andric void initializeSIInsertSkipsPass(PassRegistry &); 2070b57cec5SDimitry Andric extern char &SIInsertSkipsPassID; 2080b57cec5SDimitry Andric 2090b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPass(PassRegistry &); 2100b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingID; 2110b57cec5SDimitry Andric 2120b57cec5SDimitry Andric void initializeSIPreAllocateWWMRegsPass(PassRegistry &); 2130b57cec5SDimitry Andric extern char &SIPreAllocateWWMRegsID; 2140b57cec5SDimitry Andric 2150b57cec5SDimitry Andric void initializeAMDGPUSimplifyLibCallsPass(PassRegistry &); 2160b57cec5SDimitry Andric extern char &AMDGPUSimplifyLibCallsID; 2170b57cec5SDimitry Andric 2180b57cec5SDimitry Andric void initializeAMDGPUUseNativeCallsPass(PassRegistry &); 2190b57cec5SDimitry Andric extern char &AMDGPUUseNativeCallsID; 2200b57cec5SDimitry Andric 2210b57cec5SDimitry Andric void initializeSIAddIMGInitPass(PassRegistry &); 2220b57cec5SDimitry Andric extern char &SIAddIMGInitID; 2230b57cec5SDimitry Andric 2240b57cec5SDimitry Andric void initializeAMDGPUPerfHintAnalysisPass(PassRegistry &); 2250b57cec5SDimitry Andric extern char &AMDGPUPerfHintAnalysisID; 2260b57cec5SDimitry Andric 2270b57cec5SDimitry Andric // Passes common to R600 and SI 2280b57cec5SDimitry Andric FunctionPass *createAMDGPUPromoteAlloca(); 2290b57cec5SDimitry Andric void initializeAMDGPUPromoteAllocaPass(PassRegistry&); 2300b57cec5SDimitry Andric extern char &AMDGPUPromoteAllocaID; 2310b57cec5SDimitry Andric 2325ffd83dbSDimitry Andric FunctionPass *createAMDGPUPromoteAllocaToVector(); 2335ffd83dbSDimitry Andric void initializeAMDGPUPromoteAllocaToVectorPass(PassRegistry&); 2345ffd83dbSDimitry Andric extern char &AMDGPUPromoteAllocaToVectorID; 2355ffd83dbSDimitry Andric 236*e8d8bef9SDimitry Andric struct AMDGPUPromoteAllocaPass : PassInfoMixin<AMDGPUPromoteAllocaPass> { 237*e8d8bef9SDimitry Andric AMDGPUPromoteAllocaPass(TargetMachine &TM) : TM(TM) {} 238*e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 239*e8d8bef9SDimitry Andric 240*e8d8bef9SDimitry Andric private: 241*e8d8bef9SDimitry Andric TargetMachine &TM; 242*e8d8bef9SDimitry Andric }; 243*e8d8bef9SDimitry Andric 244*e8d8bef9SDimitry Andric struct AMDGPUPromoteAllocaToVectorPass 245*e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPUPromoteAllocaToVectorPass> { 246*e8d8bef9SDimitry Andric AMDGPUPromoteAllocaToVectorPass(TargetMachine &TM) : TM(TM) {} 247*e8d8bef9SDimitry Andric PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM); 248*e8d8bef9SDimitry Andric 249*e8d8bef9SDimitry Andric private: 250*e8d8bef9SDimitry Andric TargetMachine &TM; 251*e8d8bef9SDimitry Andric }; 252*e8d8bef9SDimitry Andric 2530b57cec5SDimitry Andric Pass *createAMDGPUStructurizeCFGPass(); 2540b57cec5SDimitry Andric FunctionPass *createAMDGPUISelDag( 2550b57cec5SDimitry Andric TargetMachine *TM = nullptr, 2560b57cec5SDimitry Andric CodeGenOpt::Level OptLevel = CodeGenOpt::Default); 2570b57cec5SDimitry Andric ModulePass *createAMDGPUAlwaysInlinePass(bool GlobalOpt = true); 258*e8d8bef9SDimitry Andric 259*e8d8bef9SDimitry Andric struct AMDGPUAlwaysInlinePass : PassInfoMixin<AMDGPUAlwaysInlinePass> { 260*e8d8bef9SDimitry Andric AMDGPUAlwaysInlinePass(bool GlobalOpt = true) : GlobalOpt(GlobalOpt) {} 261*e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 262*e8d8bef9SDimitry Andric 263*e8d8bef9SDimitry Andric private: 264*e8d8bef9SDimitry Andric bool GlobalOpt; 265*e8d8bef9SDimitry Andric }; 266*e8d8bef9SDimitry Andric 2670b57cec5SDimitry Andric ModulePass *createR600OpenCLImageTypeLoweringPass(); 2680b57cec5SDimitry Andric FunctionPass *createAMDGPUAnnotateUniformValues(); 2690b57cec5SDimitry Andric 2708bcb0991SDimitry Andric ModulePass *createAMDGPUPrintfRuntimeBinding(); 2718bcb0991SDimitry Andric void initializeAMDGPUPrintfRuntimeBindingPass(PassRegistry&); 2728bcb0991SDimitry Andric extern char &AMDGPUPrintfRuntimeBindingID; 2738bcb0991SDimitry Andric 274*e8d8bef9SDimitry Andric struct AMDGPUPrintfRuntimeBindingPass 275*e8d8bef9SDimitry Andric : PassInfoMixin<AMDGPUPrintfRuntimeBindingPass> { 276*e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 277*e8d8bef9SDimitry Andric }; 278*e8d8bef9SDimitry Andric 2790b57cec5SDimitry Andric ModulePass* createAMDGPUUnifyMetadataPass(); 2800b57cec5SDimitry Andric void initializeAMDGPUUnifyMetadataPass(PassRegistry&); 2810b57cec5SDimitry Andric extern char &AMDGPUUnifyMetadataID; 2820b57cec5SDimitry Andric 283*e8d8bef9SDimitry Andric struct AMDGPUUnifyMetadataPass : PassInfoMixin<AMDGPUUnifyMetadataPass> { 284*e8d8bef9SDimitry Andric PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM); 285*e8d8bef9SDimitry Andric }; 286*e8d8bef9SDimitry Andric 2870b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPreRAPass(PassRegistry&); 2880b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingPreRAID; 2890b57cec5SDimitry Andric 2900b57cec5SDimitry Andric void initializeAMDGPUAnnotateUniformValuesPass(PassRegistry&); 2910b57cec5SDimitry Andric extern char &AMDGPUAnnotateUniformValuesPassID; 2920b57cec5SDimitry Andric 2930b57cec5SDimitry Andric void initializeAMDGPUCodeGenPreparePass(PassRegistry&); 2940b57cec5SDimitry Andric extern char &AMDGPUCodeGenPrepareID; 2950b57cec5SDimitry Andric 296*e8d8bef9SDimitry Andric void initializeAMDGPULateCodeGenPreparePass(PassRegistry &); 297*e8d8bef9SDimitry Andric extern char &AMDGPULateCodeGenPrepareID; 298*e8d8bef9SDimitry Andric 2990b57cec5SDimitry Andric void initializeSIAnnotateControlFlowPass(PassRegistry&); 3000b57cec5SDimitry Andric extern char &SIAnnotateControlFlowPassID; 3010b57cec5SDimitry Andric 3020b57cec5SDimitry Andric void initializeSIMemoryLegalizerPass(PassRegistry&); 3030b57cec5SDimitry Andric extern char &SIMemoryLegalizerID; 3040b57cec5SDimitry Andric 3050b57cec5SDimitry Andric void initializeSIModeRegisterPass(PassRegistry&); 3060b57cec5SDimitry Andric extern char &SIModeRegisterID; 3070b57cec5SDimitry Andric 3085ffd83dbSDimitry Andric void initializeSIInsertHardClausesPass(PassRegistry &); 3095ffd83dbSDimitry Andric extern char &SIInsertHardClausesID; 3105ffd83dbSDimitry Andric 3110b57cec5SDimitry Andric void initializeSIInsertWaitcntsPass(PassRegistry&); 3120b57cec5SDimitry Andric extern char &SIInsertWaitcntsID; 3130b57cec5SDimitry Andric 3140b57cec5SDimitry Andric void initializeSIFormMemoryClausesPass(PassRegistry&); 3150b57cec5SDimitry Andric extern char &SIFormMemoryClausesID; 3160b57cec5SDimitry Andric 3175ffd83dbSDimitry Andric void initializeSIPostRABundlerPass(PassRegistry&); 3185ffd83dbSDimitry Andric extern char &SIPostRABundlerID; 3195ffd83dbSDimitry Andric 3200b57cec5SDimitry Andric void initializeAMDGPUUnifyDivergentExitNodesPass(PassRegistry&); 3210b57cec5SDimitry Andric extern char &AMDGPUUnifyDivergentExitNodesID; 3220b57cec5SDimitry Andric 3230b57cec5SDimitry Andric ImmutablePass *createAMDGPUAAWrapperPass(); 3240b57cec5SDimitry Andric void initializeAMDGPUAAWrapperPassPass(PassRegistry&); 3250b57cec5SDimitry Andric ImmutablePass *createAMDGPUExternalAAWrapperPass(); 3260b57cec5SDimitry Andric void initializeAMDGPUExternalAAWrapperPass(PassRegistry&); 3270b57cec5SDimitry Andric 3280b57cec5SDimitry Andric void initializeAMDGPUArgumentUsageInfoPass(PassRegistry &); 3290b57cec5SDimitry Andric 3300b57cec5SDimitry Andric ModulePass *createAMDGPUOpenCLEnqueuedBlockLoweringPass(); 3310b57cec5SDimitry Andric void initializeAMDGPUOpenCLEnqueuedBlockLoweringPass(PassRegistry &); 3320b57cec5SDimitry Andric extern char &AMDGPUOpenCLEnqueuedBlockLoweringID; 3330b57cec5SDimitry Andric 3340b57cec5SDimitry Andric void initializeGCNRegBankReassignPass(PassRegistry &); 3350b57cec5SDimitry Andric extern char &GCNRegBankReassignID; 3360b57cec5SDimitry Andric 3370b57cec5SDimitry Andric void initializeGCNNSAReassignPass(PassRegistry &); 3380b57cec5SDimitry Andric extern char &GCNNSAReassignID; 3390b57cec5SDimitry Andric 3400b57cec5SDimitry Andric namespace AMDGPU { 3410b57cec5SDimitry Andric enum TargetIndex { 3420b57cec5SDimitry Andric TI_CONSTDATA_START, 3430b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD0, 3440b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD1, 3450b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD2, 3460b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD3 3470b57cec5SDimitry Andric }; 3480b57cec5SDimitry Andric } 3490b57cec5SDimitry Andric 3500b57cec5SDimitry Andric /// OpenCL uses address spaces to differentiate between 3510b57cec5SDimitry Andric /// various memory regions on the hardware. On the CPU 3520b57cec5SDimitry Andric /// all of the address spaces point to the same memory, 3530b57cec5SDimitry Andric /// however on the GPU, each address space points to 3540b57cec5SDimitry Andric /// a separate piece of memory that is unique from other 3550b57cec5SDimitry Andric /// memory locations. 3560b57cec5SDimitry Andric namespace AMDGPUAS { 3570b57cec5SDimitry Andric enum : unsigned { 3580b57cec5SDimitry Andric // The maximum value for flat, generic, local, private, constant and region. 3590b57cec5SDimitry Andric MAX_AMDGPU_ADDRESS = 7, 3600b57cec5SDimitry Andric 3610b57cec5SDimitry Andric FLAT_ADDRESS = 0, ///< Address space for flat memory. 3620b57cec5SDimitry Andric GLOBAL_ADDRESS = 1, ///< Address space for global memory (RAT0, VTX0). 3630b57cec5SDimitry Andric REGION_ADDRESS = 2, ///< Address space for region memory. (GDS) 3640b57cec5SDimitry Andric 3650b57cec5SDimitry Andric CONSTANT_ADDRESS = 4, ///< Address space for constant memory (VTX2). 3660b57cec5SDimitry Andric LOCAL_ADDRESS = 3, ///< Address space for local memory. 3670b57cec5SDimitry Andric PRIVATE_ADDRESS = 5, ///< Address space for private memory. 3680b57cec5SDimitry Andric 3690b57cec5SDimitry Andric CONSTANT_ADDRESS_32BIT = 6, ///< Address space for 32-bit constant memory. 3700b57cec5SDimitry Andric 3710b57cec5SDimitry Andric BUFFER_FAT_POINTER = 7, ///< Address space for 160-bit buffer fat pointers. 3720b57cec5SDimitry Andric 3730b57cec5SDimitry Andric /// Address space for direct addressible parameter memory (CONST0). 3740b57cec5SDimitry Andric PARAM_D_ADDRESS = 6, 3750b57cec5SDimitry Andric /// Address space for indirect addressible parameter memory (VTX1). 3760b57cec5SDimitry Andric PARAM_I_ADDRESS = 7, 3770b57cec5SDimitry Andric 3780b57cec5SDimitry Andric // Do not re-order the CONSTANT_BUFFER_* enums. Several places depend on 3790b57cec5SDimitry Andric // this order to be able to dynamically index a constant buffer, for 3800b57cec5SDimitry Andric // example: 3810b57cec5SDimitry Andric // 3820b57cec5SDimitry Andric // ConstantBufferAS = CONSTANT_BUFFER_0 + CBIdx 3830b57cec5SDimitry Andric 3840b57cec5SDimitry Andric CONSTANT_BUFFER_0 = 8, 3850b57cec5SDimitry Andric CONSTANT_BUFFER_1 = 9, 3860b57cec5SDimitry Andric CONSTANT_BUFFER_2 = 10, 3870b57cec5SDimitry Andric CONSTANT_BUFFER_3 = 11, 3880b57cec5SDimitry Andric CONSTANT_BUFFER_4 = 12, 3890b57cec5SDimitry Andric CONSTANT_BUFFER_5 = 13, 3900b57cec5SDimitry Andric CONSTANT_BUFFER_6 = 14, 3910b57cec5SDimitry Andric CONSTANT_BUFFER_7 = 15, 3920b57cec5SDimitry Andric CONSTANT_BUFFER_8 = 16, 3930b57cec5SDimitry Andric CONSTANT_BUFFER_9 = 17, 3940b57cec5SDimitry Andric CONSTANT_BUFFER_10 = 18, 3950b57cec5SDimitry Andric CONSTANT_BUFFER_11 = 19, 3960b57cec5SDimitry Andric CONSTANT_BUFFER_12 = 20, 3970b57cec5SDimitry Andric CONSTANT_BUFFER_13 = 21, 3980b57cec5SDimitry Andric CONSTANT_BUFFER_14 = 22, 3990b57cec5SDimitry Andric CONSTANT_BUFFER_15 = 23, 4000b57cec5SDimitry Andric 4010b57cec5SDimitry Andric // Some places use this if the address space can't be determined. 4020b57cec5SDimitry Andric UNKNOWN_ADDRESS_SPACE = ~0u, 4030b57cec5SDimitry Andric }; 4040b57cec5SDimitry Andric } 4050b57cec5SDimitry Andric 406*e8d8bef9SDimitry Andric namespace AMDGPU { 407*e8d8bef9SDimitry Andric 408*e8d8bef9SDimitry Andric // FIXME: Missing constant_32bit 409*e8d8bef9SDimitry Andric inline bool isFlatGlobalAddrSpace(unsigned AS) { 410*e8d8bef9SDimitry Andric return AS == AMDGPUAS::GLOBAL_ADDRESS || 411*e8d8bef9SDimitry Andric AS == AMDGPUAS::FLAT_ADDRESS || 412*e8d8bef9SDimitry Andric AS == AMDGPUAS::CONSTANT_ADDRESS || 413*e8d8bef9SDimitry Andric AS > AMDGPUAS::MAX_AMDGPU_ADDRESS; 414*e8d8bef9SDimitry Andric } 415*e8d8bef9SDimitry Andric } 416*e8d8bef9SDimitry Andric 417*e8d8bef9SDimitry Andric } // End namespace llvm 418*e8d8bef9SDimitry Andric 4190b57cec5SDimitry Andric #endif 420