10b57cec5SDimitry Andric //===-- AMDGPU.h - MachineFunction passes hw codegen --------------*- C++ -*-=// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric /// \file 80b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 90b57cec5SDimitry Andric 100b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPU_H 110b57cec5SDimitry Andric #define LLVM_LIB_TARGET_AMDGPU_AMDGPU_H 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric #include "llvm/Target/TargetMachine.h" 140b57cec5SDimitry Andric 150b57cec5SDimitry Andric namespace llvm { 160b57cec5SDimitry Andric 170b57cec5SDimitry Andric class AMDGPUTargetMachine; 180b57cec5SDimitry Andric class FunctionPass; 190b57cec5SDimitry Andric class GCNTargetMachine; 200b57cec5SDimitry Andric class ModulePass; 210b57cec5SDimitry Andric class Pass; 220b57cec5SDimitry Andric class Target; 230b57cec5SDimitry Andric class TargetMachine; 240b57cec5SDimitry Andric class TargetOptions; 250b57cec5SDimitry Andric class PassRegistry; 260b57cec5SDimitry Andric class Module; 270b57cec5SDimitry Andric 280b57cec5SDimitry Andric // R600 Passes 290b57cec5SDimitry Andric FunctionPass *createR600VectorRegMerger(); 300b57cec5SDimitry Andric FunctionPass *createR600ExpandSpecialInstrsPass(); 310b57cec5SDimitry Andric FunctionPass *createR600EmitClauseMarkers(); 320b57cec5SDimitry Andric FunctionPass *createR600ClauseMergePass(); 330b57cec5SDimitry Andric FunctionPass *createR600Packetizer(); 340b57cec5SDimitry Andric FunctionPass *createR600ControlFlowFinalizer(); 350b57cec5SDimitry Andric FunctionPass *createAMDGPUCFGStructurizerPass(); 360b57cec5SDimitry Andric FunctionPass *createR600ISelDag(TargetMachine *TM, CodeGenOpt::Level OptLevel); 370b57cec5SDimitry Andric 380b57cec5SDimitry Andric // SI Passes 390b57cec5SDimitry Andric FunctionPass *createGCNDPPCombinePass(); 400b57cec5SDimitry Andric FunctionPass *createSIAnnotateControlFlowPass(); 410b57cec5SDimitry Andric FunctionPass *createSIFoldOperandsPass(); 420b57cec5SDimitry Andric FunctionPass *createSIPeepholeSDWAPass(); 430b57cec5SDimitry Andric FunctionPass *createSILowerI1CopiesPass(); 440b57cec5SDimitry Andric FunctionPass *createSIFixupVectorISelPass(); 450b57cec5SDimitry Andric FunctionPass *createSIAddIMGInitPass(); 460b57cec5SDimitry Andric FunctionPass *createSIShrinkInstructionsPass(); 470b57cec5SDimitry Andric FunctionPass *createSILoadStoreOptimizerPass(); 480b57cec5SDimitry Andric FunctionPass *createSIWholeQuadModePass(); 490b57cec5SDimitry Andric FunctionPass *createSIFixControlFlowLiveIntervalsPass(); 500b57cec5SDimitry Andric FunctionPass *createSIOptimizeExecMaskingPreRAPass(); 510b57cec5SDimitry Andric FunctionPass *createSIFixSGPRCopiesPass(); 520b57cec5SDimitry Andric FunctionPass *createSIMemoryLegalizerPass(); 530b57cec5SDimitry Andric FunctionPass *createSIInsertWaitcntsPass(); 540b57cec5SDimitry Andric FunctionPass *createSIPreAllocateWWMRegsPass(); 550b57cec5SDimitry Andric FunctionPass *createSIFormMemoryClausesPass(); 560b57cec5SDimitry Andric FunctionPass *createAMDGPUSimplifyLibCallsPass(const TargetOptions &, 570b57cec5SDimitry Andric const TargetMachine *); 580b57cec5SDimitry Andric FunctionPass *createAMDGPUUseNativeCallsPass(); 590b57cec5SDimitry Andric FunctionPass *createAMDGPUCodeGenPreparePass(); 600b57cec5SDimitry Andric FunctionPass *createAMDGPUMachineCFGStructurizerPass(); 610b57cec5SDimitry Andric FunctionPass *createAMDGPUPropagateAttributesEarlyPass(const TargetMachine *); 620b57cec5SDimitry Andric ModulePass *createAMDGPUPropagateAttributesLatePass(const TargetMachine *); 630b57cec5SDimitry Andric FunctionPass *createAMDGPURewriteOutArgumentsPass(); 640b57cec5SDimitry Andric FunctionPass *createSIModeRegisterPass(); 650b57cec5SDimitry Andric 660b57cec5SDimitry Andric void initializeAMDGPUDAGToDAGISelPass(PassRegistry&); 670b57cec5SDimitry Andric 680b57cec5SDimitry Andric void initializeAMDGPUMachineCFGStructurizerPass(PassRegistry&); 690b57cec5SDimitry Andric extern char &AMDGPUMachineCFGStructurizerID; 700b57cec5SDimitry Andric 710b57cec5SDimitry Andric void initializeAMDGPUAlwaysInlinePass(PassRegistry&); 720b57cec5SDimitry Andric 730b57cec5SDimitry Andric Pass *createAMDGPUAnnotateKernelFeaturesPass(); 740b57cec5SDimitry Andric void initializeAMDGPUAnnotateKernelFeaturesPass(PassRegistry &); 750b57cec5SDimitry Andric extern char &AMDGPUAnnotateKernelFeaturesID; 760b57cec5SDimitry Andric 770b57cec5SDimitry Andric FunctionPass *createAMDGPUAtomicOptimizerPass(); 780b57cec5SDimitry Andric void initializeAMDGPUAtomicOptimizerPass(PassRegistry &); 790b57cec5SDimitry Andric extern char &AMDGPUAtomicOptimizerID; 800b57cec5SDimitry Andric 810b57cec5SDimitry Andric ModulePass *createAMDGPULowerIntrinsicsPass(); 820b57cec5SDimitry Andric void initializeAMDGPULowerIntrinsicsPass(PassRegistry &); 830b57cec5SDimitry Andric extern char &AMDGPULowerIntrinsicsID; 840b57cec5SDimitry Andric 850b57cec5SDimitry Andric ModulePass *createAMDGPUFixFunctionBitcastsPass(); 860b57cec5SDimitry Andric void initializeAMDGPUFixFunctionBitcastsPass(PassRegistry &); 870b57cec5SDimitry Andric extern char &AMDGPUFixFunctionBitcastsID; 880b57cec5SDimitry Andric 890b57cec5SDimitry Andric FunctionPass *createAMDGPULowerKernelArgumentsPass(); 900b57cec5SDimitry Andric void initializeAMDGPULowerKernelArgumentsPass(PassRegistry &); 910b57cec5SDimitry Andric extern char &AMDGPULowerKernelArgumentsID; 920b57cec5SDimitry Andric 930b57cec5SDimitry Andric ModulePass *createAMDGPULowerKernelAttributesPass(); 940b57cec5SDimitry Andric void initializeAMDGPULowerKernelAttributesPass(PassRegistry &); 950b57cec5SDimitry Andric extern char &AMDGPULowerKernelAttributesID; 960b57cec5SDimitry Andric 970b57cec5SDimitry Andric void initializeAMDGPUPropagateAttributesEarlyPass(PassRegistry &); 980b57cec5SDimitry Andric extern char &AMDGPUPropagateAttributesEarlyID; 990b57cec5SDimitry Andric 1000b57cec5SDimitry Andric void initializeAMDGPUPropagateAttributesLatePass(PassRegistry &); 1010b57cec5SDimitry Andric extern char &AMDGPUPropagateAttributesLateID; 1020b57cec5SDimitry Andric 1030b57cec5SDimitry Andric void initializeAMDGPURewriteOutArgumentsPass(PassRegistry &); 1040b57cec5SDimitry Andric extern char &AMDGPURewriteOutArgumentsID; 1050b57cec5SDimitry Andric 1060b57cec5SDimitry Andric void initializeGCNDPPCombinePass(PassRegistry &); 1070b57cec5SDimitry Andric extern char &GCNDPPCombineID; 1080b57cec5SDimitry Andric 1090b57cec5SDimitry Andric void initializeR600ClauseMergePassPass(PassRegistry &); 1100b57cec5SDimitry Andric extern char &R600ClauseMergePassID; 1110b57cec5SDimitry Andric 1120b57cec5SDimitry Andric void initializeR600ControlFlowFinalizerPass(PassRegistry &); 1130b57cec5SDimitry Andric extern char &R600ControlFlowFinalizerID; 1140b57cec5SDimitry Andric 1150b57cec5SDimitry Andric void initializeR600ExpandSpecialInstrsPassPass(PassRegistry &); 1160b57cec5SDimitry Andric extern char &R600ExpandSpecialInstrsPassID; 1170b57cec5SDimitry Andric 1180b57cec5SDimitry Andric void initializeR600VectorRegMergerPass(PassRegistry &); 1190b57cec5SDimitry Andric extern char &R600VectorRegMergerID; 1200b57cec5SDimitry Andric 1210b57cec5SDimitry Andric void initializeR600PacketizerPass(PassRegistry &); 1220b57cec5SDimitry Andric extern char &R600PacketizerID; 1230b57cec5SDimitry Andric 1240b57cec5SDimitry Andric void initializeSIFoldOperandsPass(PassRegistry &); 1250b57cec5SDimitry Andric extern char &SIFoldOperandsID; 1260b57cec5SDimitry Andric 1270b57cec5SDimitry Andric void initializeSIPeepholeSDWAPass(PassRegistry &); 1280b57cec5SDimitry Andric extern char &SIPeepholeSDWAID; 1290b57cec5SDimitry Andric 1300b57cec5SDimitry Andric void initializeSIShrinkInstructionsPass(PassRegistry&); 1310b57cec5SDimitry Andric extern char &SIShrinkInstructionsID; 1320b57cec5SDimitry Andric 1330b57cec5SDimitry Andric void initializeSIFixSGPRCopiesPass(PassRegistry &); 1340b57cec5SDimitry Andric extern char &SIFixSGPRCopiesID; 1350b57cec5SDimitry Andric 1360b57cec5SDimitry Andric void initializeSIFixVGPRCopiesPass(PassRegistry &); 1370b57cec5SDimitry Andric extern char &SIFixVGPRCopiesID; 1380b57cec5SDimitry Andric 1390b57cec5SDimitry Andric void initializeSIFixupVectorISelPass(PassRegistry &); 1400b57cec5SDimitry Andric extern char &SIFixupVectorISelID; 1410b57cec5SDimitry Andric 1420b57cec5SDimitry Andric void initializeSILowerI1CopiesPass(PassRegistry &); 1430b57cec5SDimitry Andric extern char &SILowerI1CopiesID; 1440b57cec5SDimitry Andric 1450b57cec5SDimitry Andric void initializeSILowerSGPRSpillsPass(PassRegistry &); 1460b57cec5SDimitry Andric extern char &SILowerSGPRSpillsID; 1470b57cec5SDimitry Andric 1480b57cec5SDimitry Andric void initializeSILoadStoreOptimizerPass(PassRegistry &); 1490b57cec5SDimitry Andric extern char &SILoadStoreOptimizerID; 1500b57cec5SDimitry Andric 1510b57cec5SDimitry Andric void initializeSIWholeQuadModePass(PassRegistry &); 1520b57cec5SDimitry Andric extern char &SIWholeQuadModeID; 1530b57cec5SDimitry Andric 1540b57cec5SDimitry Andric void initializeSILowerControlFlowPass(PassRegistry &); 1550b57cec5SDimitry Andric extern char &SILowerControlFlowID; 1560b57cec5SDimitry Andric 1570b57cec5SDimitry Andric void initializeSIInsertSkipsPass(PassRegistry &); 1580b57cec5SDimitry Andric extern char &SIInsertSkipsPassID; 1590b57cec5SDimitry Andric 1600b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPass(PassRegistry &); 1610b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingID; 1620b57cec5SDimitry Andric 1630b57cec5SDimitry Andric void initializeSIPreAllocateWWMRegsPass(PassRegistry &); 1640b57cec5SDimitry Andric extern char &SIPreAllocateWWMRegsID; 1650b57cec5SDimitry Andric 1660b57cec5SDimitry Andric void initializeAMDGPUSimplifyLibCallsPass(PassRegistry &); 1670b57cec5SDimitry Andric extern char &AMDGPUSimplifyLibCallsID; 1680b57cec5SDimitry Andric 1690b57cec5SDimitry Andric void initializeAMDGPUUseNativeCallsPass(PassRegistry &); 1700b57cec5SDimitry Andric extern char &AMDGPUUseNativeCallsID; 1710b57cec5SDimitry Andric 1720b57cec5SDimitry Andric void initializeSIAddIMGInitPass(PassRegistry &); 1730b57cec5SDimitry Andric extern char &SIAddIMGInitID; 1740b57cec5SDimitry Andric 1750b57cec5SDimitry Andric void initializeAMDGPUPerfHintAnalysisPass(PassRegistry &); 1760b57cec5SDimitry Andric extern char &AMDGPUPerfHintAnalysisID; 1770b57cec5SDimitry Andric 1780b57cec5SDimitry Andric // Passes common to R600 and SI 1790b57cec5SDimitry Andric FunctionPass *createAMDGPUPromoteAlloca(); 1800b57cec5SDimitry Andric void initializeAMDGPUPromoteAllocaPass(PassRegistry&); 1810b57cec5SDimitry Andric extern char &AMDGPUPromoteAllocaID; 1820b57cec5SDimitry Andric 1830b57cec5SDimitry Andric Pass *createAMDGPUStructurizeCFGPass(); 1840b57cec5SDimitry Andric FunctionPass *createAMDGPUISelDag( 1850b57cec5SDimitry Andric TargetMachine *TM = nullptr, 1860b57cec5SDimitry Andric CodeGenOpt::Level OptLevel = CodeGenOpt::Default); 1870b57cec5SDimitry Andric ModulePass *createAMDGPUAlwaysInlinePass(bool GlobalOpt = true); 1880b57cec5SDimitry Andric ModulePass *createR600OpenCLImageTypeLoweringPass(); 1890b57cec5SDimitry Andric FunctionPass *createAMDGPUAnnotateUniformValues(); 1900b57cec5SDimitry Andric 191*8bcb0991SDimitry Andric ModulePass *createAMDGPUPrintfRuntimeBinding(); 192*8bcb0991SDimitry Andric void initializeAMDGPUPrintfRuntimeBindingPass(PassRegistry&); 193*8bcb0991SDimitry Andric extern char &AMDGPUPrintfRuntimeBindingID; 194*8bcb0991SDimitry Andric 1950b57cec5SDimitry Andric ModulePass* createAMDGPUUnifyMetadataPass(); 1960b57cec5SDimitry Andric void initializeAMDGPUUnifyMetadataPass(PassRegistry&); 1970b57cec5SDimitry Andric extern char &AMDGPUUnifyMetadataID; 1980b57cec5SDimitry Andric 1990b57cec5SDimitry Andric void initializeSIOptimizeExecMaskingPreRAPass(PassRegistry&); 2000b57cec5SDimitry Andric extern char &SIOptimizeExecMaskingPreRAID; 2010b57cec5SDimitry Andric 2020b57cec5SDimitry Andric void initializeAMDGPUAnnotateUniformValuesPass(PassRegistry&); 2030b57cec5SDimitry Andric extern char &AMDGPUAnnotateUniformValuesPassID; 2040b57cec5SDimitry Andric 2050b57cec5SDimitry Andric void initializeAMDGPUCodeGenPreparePass(PassRegistry&); 2060b57cec5SDimitry Andric extern char &AMDGPUCodeGenPrepareID; 2070b57cec5SDimitry Andric 2080b57cec5SDimitry Andric void initializeSIAnnotateControlFlowPass(PassRegistry&); 2090b57cec5SDimitry Andric extern char &SIAnnotateControlFlowPassID; 2100b57cec5SDimitry Andric 2110b57cec5SDimitry Andric void initializeSIMemoryLegalizerPass(PassRegistry&); 2120b57cec5SDimitry Andric extern char &SIMemoryLegalizerID; 2130b57cec5SDimitry Andric 2140b57cec5SDimitry Andric void initializeSIModeRegisterPass(PassRegistry&); 2150b57cec5SDimitry Andric extern char &SIModeRegisterID; 2160b57cec5SDimitry Andric 2170b57cec5SDimitry Andric void initializeSIInsertWaitcntsPass(PassRegistry&); 2180b57cec5SDimitry Andric extern char &SIInsertWaitcntsID; 2190b57cec5SDimitry Andric 2200b57cec5SDimitry Andric void initializeSIFormMemoryClausesPass(PassRegistry&); 2210b57cec5SDimitry Andric extern char &SIFormMemoryClausesID; 2220b57cec5SDimitry Andric 2230b57cec5SDimitry Andric void initializeAMDGPUUnifyDivergentExitNodesPass(PassRegistry&); 2240b57cec5SDimitry Andric extern char &AMDGPUUnifyDivergentExitNodesID; 2250b57cec5SDimitry Andric 2260b57cec5SDimitry Andric ImmutablePass *createAMDGPUAAWrapperPass(); 2270b57cec5SDimitry Andric void initializeAMDGPUAAWrapperPassPass(PassRegistry&); 2280b57cec5SDimitry Andric ImmutablePass *createAMDGPUExternalAAWrapperPass(); 2290b57cec5SDimitry Andric void initializeAMDGPUExternalAAWrapperPass(PassRegistry&); 2300b57cec5SDimitry Andric 2310b57cec5SDimitry Andric void initializeAMDGPUArgumentUsageInfoPass(PassRegistry &); 2320b57cec5SDimitry Andric 2330b57cec5SDimitry Andric Pass *createAMDGPUFunctionInliningPass(); 2340b57cec5SDimitry Andric void initializeAMDGPUInlinerPass(PassRegistry&); 2350b57cec5SDimitry Andric 2360b57cec5SDimitry Andric ModulePass *createAMDGPUOpenCLEnqueuedBlockLoweringPass(); 2370b57cec5SDimitry Andric void initializeAMDGPUOpenCLEnqueuedBlockLoweringPass(PassRegistry &); 2380b57cec5SDimitry Andric extern char &AMDGPUOpenCLEnqueuedBlockLoweringID; 2390b57cec5SDimitry Andric 2400b57cec5SDimitry Andric void initializeGCNRegBankReassignPass(PassRegistry &); 2410b57cec5SDimitry Andric extern char &GCNRegBankReassignID; 2420b57cec5SDimitry Andric 2430b57cec5SDimitry Andric void initializeGCNNSAReassignPass(PassRegistry &); 2440b57cec5SDimitry Andric extern char &GCNNSAReassignID; 2450b57cec5SDimitry Andric 2460b57cec5SDimitry Andric namespace AMDGPU { 2470b57cec5SDimitry Andric enum TargetIndex { 2480b57cec5SDimitry Andric TI_CONSTDATA_START, 2490b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD0, 2500b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD1, 2510b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD2, 2520b57cec5SDimitry Andric TI_SCRATCH_RSRC_DWORD3 2530b57cec5SDimitry Andric }; 2540b57cec5SDimitry Andric } 2550b57cec5SDimitry Andric 2560b57cec5SDimitry Andric } // End namespace llvm 2570b57cec5SDimitry Andric 2580b57cec5SDimitry Andric /// OpenCL uses address spaces to differentiate between 2590b57cec5SDimitry Andric /// various memory regions on the hardware. On the CPU 2600b57cec5SDimitry Andric /// all of the address spaces point to the same memory, 2610b57cec5SDimitry Andric /// however on the GPU, each address space points to 2620b57cec5SDimitry Andric /// a separate piece of memory that is unique from other 2630b57cec5SDimitry Andric /// memory locations. 2640b57cec5SDimitry Andric namespace AMDGPUAS { 2650b57cec5SDimitry Andric enum : unsigned { 2660b57cec5SDimitry Andric // The maximum value for flat, generic, local, private, constant and region. 2670b57cec5SDimitry Andric MAX_AMDGPU_ADDRESS = 7, 2680b57cec5SDimitry Andric 2690b57cec5SDimitry Andric FLAT_ADDRESS = 0, ///< Address space for flat memory. 2700b57cec5SDimitry Andric GLOBAL_ADDRESS = 1, ///< Address space for global memory (RAT0, VTX0). 2710b57cec5SDimitry Andric REGION_ADDRESS = 2, ///< Address space for region memory. (GDS) 2720b57cec5SDimitry Andric 2730b57cec5SDimitry Andric CONSTANT_ADDRESS = 4, ///< Address space for constant memory (VTX2). 2740b57cec5SDimitry Andric LOCAL_ADDRESS = 3, ///< Address space for local memory. 2750b57cec5SDimitry Andric PRIVATE_ADDRESS = 5, ///< Address space for private memory. 2760b57cec5SDimitry Andric 2770b57cec5SDimitry Andric CONSTANT_ADDRESS_32BIT = 6, ///< Address space for 32-bit constant memory. 2780b57cec5SDimitry Andric 2790b57cec5SDimitry Andric BUFFER_FAT_POINTER = 7, ///< Address space for 160-bit buffer fat pointers. 2800b57cec5SDimitry Andric 2810b57cec5SDimitry Andric /// Address space for direct addressible parameter memory (CONST0). 2820b57cec5SDimitry Andric PARAM_D_ADDRESS = 6, 2830b57cec5SDimitry Andric /// Address space for indirect addressible parameter memory (VTX1). 2840b57cec5SDimitry Andric PARAM_I_ADDRESS = 7, 2850b57cec5SDimitry Andric 2860b57cec5SDimitry Andric // Do not re-order the CONSTANT_BUFFER_* enums. Several places depend on 2870b57cec5SDimitry Andric // this order to be able to dynamically index a constant buffer, for 2880b57cec5SDimitry Andric // example: 2890b57cec5SDimitry Andric // 2900b57cec5SDimitry Andric // ConstantBufferAS = CONSTANT_BUFFER_0 + CBIdx 2910b57cec5SDimitry Andric 2920b57cec5SDimitry Andric CONSTANT_BUFFER_0 = 8, 2930b57cec5SDimitry Andric CONSTANT_BUFFER_1 = 9, 2940b57cec5SDimitry Andric CONSTANT_BUFFER_2 = 10, 2950b57cec5SDimitry Andric CONSTANT_BUFFER_3 = 11, 2960b57cec5SDimitry Andric CONSTANT_BUFFER_4 = 12, 2970b57cec5SDimitry Andric CONSTANT_BUFFER_5 = 13, 2980b57cec5SDimitry Andric CONSTANT_BUFFER_6 = 14, 2990b57cec5SDimitry Andric CONSTANT_BUFFER_7 = 15, 3000b57cec5SDimitry Andric CONSTANT_BUFFER_8 = 16, 3010b57cec5SDimitry Andric CONSTANT_BUFFER_9 = 17, 3020b57cec5SDimitry Andric CONSTANT_BUFFER_10 = 18, 3030b57cec5SDimitry Andric CONSTANT_BUFFER_11 = 19, 3040b57cec5SDimitry Andric CONSTANT_BUFFER_12 = 20, 3050b57cec5SDimitry Andric CONSTANT_BUFFER_13 = 21, 3060b57cec5SDimitry Andric CONSTANT_BUFFER_14 = 22, 3070b57cec5SDimitry Andric CONSTANT_BUFFER_15 = 23, 3080b57cec5SDimitry Andric 3090b57cec5SDimitry Andric // Some places use this if the address space can't be determined. 3100b57cec5SDimitry Andric UNKNOWN_ADDRESS_SPACE = ~0u, 3110b57cec5SDimitry Andric }; 3120b57cec5SDimitry Andric } 3130b57cec5SDimitry Andric 3140b57cec5SDimitry Andric #endif 315