xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.h (revision da477bcdc0c335171bb0ed3813f570026de6df85)
1 //===- AMDGPUInstructionSelector --------------------------------*- C++ -*-==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 /// \file
9 /// This file declares the targeting of the InstructionSelector class for
10 /// AMDGPU.
11 //===----------------------------------------------------------------------===//
12 
13 #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUINSTRUCTIONSELECTOR_H
14 #define LLVM_LIB_TARGET_AMDGPU_AMDGPUINSTRUCTIONSELECTOR_H
15 
16 #include "AMDGPU.h"
17 #include "AMDGPUArgumentUsageInfo.h"
18 #include "llvm/ADT/ArrayRef.h"
19 #include "llvm/ADT/SmallVector.h"
20 #include "llvm/CodeGen/Register.h"
21 #include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
22 #include "llvm/IR/InstrTypes.h"
23 
24 namespace {
25 #define GET_GLOBALISEL_PREDICATE_BITSET
26 #define AMDGPUSubtarget GCNSubtarget
27 #include "AMDGPUGenGlobalISel.inc"
28 #undef GET_GLOBALISEL_PREDICATE_BITSET
29 #undef AMDGPUSubtarget
30 }
31 
32 namespace llvm {
33 
34 namespace AMDGPU {
35 struct ImageDimIntrinsicInfo;
36 }
37 
38 class AMDGPUInstrInfo;
39 class AMDGPURegisterBankInfo;
40 class GCNSubtarget;
41 class MachineInstr;
42 class MachineIRBuilder;
43 class MachineOperand;
44 class MachineRegisterInfo;
45 class RegisterBank;
46 class SIInstrInfo;
47 class SIMachineFunctionInfo;
48 class SIRegisterInfo;
49 
50 class AMDGPUInstructionSelector : public InstructionSelector {
51 private:
52   MachineRegisterInfo *MRI;
53 
54 public:
55   AMDGPUInstructionSelector(const GCNSubtarget &STI,
56                             const AMDGPURegisterBankInfo &RBI,
57                             const AMDGPUTargetMachine &TM);
58 
59   bool select(MachineInstr &I) override;
60   static const char *getName();
61 
62   void setupMF(MachineFunction &MF, GISelKnownBits &KB,
63                CodeGenCoverage &CoverageInfo) override;
64 
65 private:
66   struct GEPInfo {
67     const MachineInstr &GEP;
68     SmallVector<unsigned, 2> SgprParts;
69     SmallVector<unsigned, 2> VgprParts;
70     int64_t Imm;
71     GEPInfo(const MachineInstr &GEP) : GEP(GEP), Imm(0) { }
72   };
73 
74   bool isInstrUniform(const MachineInstr &MI) const;
75   bool isVCC(Register Reg, const MachineRegisterInfo &MRI) const;
76 
77   const RegisterBank *getArtifactRegBank(
78     Register Reg, const MachineRegisterInfo &MRI,
79     const TargetRegisterInfo &TRI) const;
80 
81   /// tblgen-erated 'select' implementation.
82   bool selectImpl(MachineInstr &I, CodeGenCoverage &CoverageInfo) const;
83 
84   MachineOperand getSubOperand64(MachineOperand &MO,
85                                  const TargetRegisterClass &SubRC,
86                                  unsigned SubIdx) const;
87 
88   bool constrainCopyLikeIntrin(MachineInstr &MI, unsigned NewOpc) const;
89   bool selectCOPY(MachineInstr &I) const;
90   bool selectPHI(MachineInstr &I) const;
91   bool selectG_TRUNC(MachineInstr &I) const;
92   bool selectG_SZA_EXT(MachineInstr &I) const;
93   bool selectG_CONSTANT(MachineInstr &I) const;
94   bool selectG_FNEG(MachineInstr &I) const;
95   bool selectG_FABS(MachineInstr &I) const;
96   bool selectG_AND_OR_XOR(MachineInstr &I) const;
97   bool selectG_ADD_SUB(MachineInstr &I) const;
98   bool selectG_UADDO_USUBO_UADDE_USUBE(MachineInstr &I) const;
99   bool selectG_EXTRACT(MachineInstr &I) const;
100   bool selectG_MERGE_VALUES(MachineInstr &I) const;
101   bool selectG_UNMERGE_VALUES(MachineInstr &I) const;
102   bool selectG_BUILD_VECTOR_TRUNC(MachineInstr &I) const;
103   bool selectG_PTR_ADD(MachineInstr &I) const;
104   bool selectG_IMPLICIT_DEF(MachineInstr &I) const;
105   bool selectG_INSERT(MachineInstr &I) const;
106 
107   bool selectInterpP1F16(MachineInstr &MI) const;
108   bool selectDivScale(MachineInstr &MI) const;
109   bool selectIntrinsicIcmp(MachineInstr &MI) const;
110   bool selectBallot(MachineInstr &I) const;
111   bool selectG_INTRINSIC(MachineInstr &I) const;
112 
113   bool selectEndCfIntrinsic(MachineInstr &MI) const;
114   bool selectDSOrderedIntrinsic(MachineInstr &MI, Intrinsic::ID IID) const;
115   bool selectDSGWSIntrinsic(MachineInstr &MI, Intrinsic::ID IID) const;
116   bool selectDSAppendConsume(MachineInstr &MI, bool IsAppend) const;
117 
118   bool selectImageIntrinsic(MachineInstr &MI,
119                             const AMDGPU::ImageDimIntrinsicInfo *Intr) const;
120   bool selectG_INTRINSIC_W_SIDE_EFFECTS(MachineInstr &I) const;
121   int getS_CMPOpcode(CmpInst::Predicate P, unsigned Size) const;
122   bool selectG_ICMP(MachineInstr &I) const;
123   bool hasVgprParts(ArrayRef<GEPInfo> AddrInfo) const;
124   void getAddrModeInfo(const MachineInstr &Load, const MachineRegisterInfo &MRI,
125                        SmallVectorImpl<GEPInfo> &AddrInfo) const;
126   bool selectSMRD(MachineInstr &I, ArrayRef<GEPInfo> AddrInfo) const;
127 
128   void initM0(MachineInstr &I) const;
129   bool selectG_LOAD_ATOMICRMW(MachineInstr &I) const;
130   bool selectG_AMDGPU_ATOMIC_CMPXCHG(MachineInstr &I) const;
131   bool selectG_STORE(MachineInstr &I) const;
132   bool selectG_SELECT(MachineInstr &I) const;
133   bool selectG_BRCOND(MachineInstr &I) const;
134   bool selectG_FRAME_INDEX_GLOBAL_VALUE(MachineInstr &I) const;
135   bool selectG_PTRMASK(MachineInstr &I) const;
136   bool selectG_EXTRACT_VECTOR_ELT(MachineInstr &I) const;
137   bool selectG_INSERT_VECTOR_ELT(MachineInstr &I) const;
138   bool selectG_SHUFFLE_VECTOR(MachineInstr &I) const;
139 
140   std::pair<Register, unsigned>
141   selectVOP3ModsImpl(MachineOperand &Root) const;
142 
143   InstructionSelector::ComplexRendererFns
144   selectVCSRC(MachineOperand &Root) const;
145 
146   InstructionSelector::ComplexRendererFns
147   selectVSRC0(MachineOperand &Root) const;
148 
149   InstructionSelector::ComplexRendererFns
150   selectVOP3Mods0(MachineOperand &Root) const;
151   InstructionSelector::ComplexRendererFns
152   selectVOP3OMods(MachineOperand &Root) const;
153   InstructionSelector::ComplexRendererFns
154   selectVOP3Mods(MachineOperand &Root) const;
155 
156   ComplexRendererFns selectVOP3NoMods(MachineOperand &Root) const;
157 
158   InstructionSelector::ComplexRendererFns
159   selectVOP3Mods_nnan(MachineOperand &Root) const;
160 
161   std::pair<Register, unsigned>
162   selectVOP3PModsImpl(Register Src, const MachineRegisterInfo &MRI) const;
163 
164   InstructionSelector::ComplexRendererFns
165   selectVOP3PMods(MachineOperand &Root) const;
166 
167   InstructionSelector::ComplexRendererFns
168   selectVOP3OpSelMods(MachineOperand &Root) const;
169 
170   InstructionSelector::ComplexRendererFns
171   selectSmrdImm(MachineOperand &Root) const;
172   InstructionSelector::ComplexRendererFns
173   selectSmrdImm32(MachineOperand &Root) const;
174   InstructionSelector::ComplexRendererFns
175   selectSmrdSgpr(MachineOperand &Root) const;
176 
177   template <bool Signed>
178   InstructionSelector::ComplexRendererFns
179   selectFlatOffsetImpl(MachineOperand &Root) const;
180   InstructionSelector::ComplexRendererFns
181   selectFlatOffset(MachineOperand &Root) const;
182 
183   InstructionSelector::ComplexRendererFns
184   selectFlatOffsetSigned(MachineOperand &Root) const;
185 
186   InstructionSelector::ComplexRendererFns
187   selectMUBUFScratchOffen(MachineOperand &Root) const;
188   InstructionSelector::ComplexRendererFns
189   selectMUBUFScratchOffset(MachineOperand &Root) const;
190 
191   bool isDSOffsetLegal(Register Base, int64_t Offset,
192                        unsigned OffsetBits) const;
193 
194   std::pair<Register, unsigned>
195   selectDS1Addr1OffsetImpl(MachineOperand &Root) const;
196   InstructionSelector::ComplexRendererFns
197   selectDS1Addr1Offset(MachineOperand &Root) const;
198 
199   std::pair<Register, unsigned>
200   selectDS64Bit4ByteAlignedImpl(MachineOperand &Root) const;
201   InstructionSelector::ComplexRendererFns
202   selectDS64Bit4ByteAligned(MachineOperand &Root) const;
203 
204   std::pair<Register, int64_t>
205   getPtrBaseWithConstantOffset(Register Root,
206                                const MachineRegisterInfo &MRI) const;
207 
208   // Parse out a chain of up to two g_ptr_add instructions.
209   // g_ptr_add (n0, _)
210   // g_ptr_add (n0, (n1 = g_ptr_add n2, n3))
211   struct MUBUFAddressData {
212     Register N0, N2, N3;
213     int64_t Offset = 0;
214   };
215 
216   bool shouldUseAddr64(MUBUFAddressData AddrData) const;
217 
218   void splitIllegalMUBUFOffset(MachineIRBuilder &B,
219                                Register &SOffset, int64_t &ImmOffset) const;
220 
221   MUBUFAddressData parseMUBUFAddress(Register Src) const;
222 
223   bool selectMUBUFAddr64Impl(MachineOperand &Root, Register &VAddr,
224                              Register &RSrcReg, Register &SOffset,
225                              int64_t &Offset) const;
226 
227   bool selectMUBUFOffsetImpl(MachineOperand &Root, Register &RSrcReg,
228                              Register &SOffset, int64_t &Offset) const;
229 
230   InstructionSelector::ComplexRendererFns
231   selectMUBUFAddr64(MachineOperand &Root) const;
232 
233   InstructionSelector::ComplexRendererFns
234   selectMUBUFOffset(MachineOperand &Root) const;
235 
236   InstructionSelector::ComplexRendererFns
237   selectMUBUFOffsetAtomic(MachineOperand &Root) const;
238 
239   InstructionSelector::ComplexRendererFns
240   selectMUBUFAddr64Atomic(MachineOperand &Root) const;
241 
242   ComplexRendererFns selectSMRDBufferImm(MachineOperand &Root) const;
243   ComplexRendererFns selectSMRDBufferImm32(MachineOperand &Root) const;
244 
245   void renderTruncImm32(MachineInstrBuilder &MIB, const MachineInstr &MI,
246                         int OpIdx = -1) const;
247 
248   void renderTruncTImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
249                        int OpIdx) const;
250 
251   void renderTruncTImm1(MachineInstrBuilder &MIB, const MachineInstr &MI,
252                         int OpIdx) const {
253     renderTruncTImm(MIB, MI, OpIdx);
254   }
255 
256   void renderTruncTImm8(MachineInstrBuilder &MIB, const MachineInstr &MI,
257                         int OpIdx) const {
258     renderTruncTImm(MIB, MI, OpIdx);
259   }
260 
261   void renderTruncTImm16(MachineInstrBuilder &MIB, const MachineInstr &MI,
262                         int OpIdx) const {
263     renderTruncTImm(MIB, MI, OpIdx);
264   }
265 
266   void renderTruncTImm32(MachineInstrBuilder &MIB, const MachineInstr &MI,
267                         int OpIdx) const {
268     renderTruncTImm(MIB, MI, OpIdx);
269   }
270 
271   void renderNegateImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
272                        int OpIdx) const;
273 
274   void renderBitcastImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
275                         int OpIdx) const;
276 
277   void renderPopcntImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
278                        int OpIdx) const;
279   void renderExtractGLC(MachineInstrBuilder &MIB, const MachineInstr &MI,
280                         int OpIdx) const;
281   void renderExtractSLC(MachineInstrBuilder &MIB, const MachineInstr &MI,
282                         int OpIdx) const;
283   void renderExtractDLC(MachineInstrBuilder &MIB, const MachineInstr &MI,
284                         int OpIdx) const;
285   void renderExtractSWZ(MachineInstrBuilder &MIB, const MachineInstr &MI,
286                         int OpIdx) const;
287 
288   bool isInlineImmediate16(int64_t Imm) const;
289   bool isInlineImmediate32(int64_t Imm) const;
290   bool isInlineImmediate64(int64_t Imm) const;
291   bool isInlineImmediate(const APFloat &Imm) const;
292 
293   const SIInstrInfo &TII;
294   const SIRegisterInfo &TRI;
295   const AMDGPURegisterBankInfo &RBI;
296   const AMDGPUTargetMachine &TM;
297   const GCNSubtarget &STI;
298   bool EnableLateStructurizeCFG;
299 #define GET_GLOBALISEL_PREDICATES_DECL
300 #define AMDGPUSubtarget GCNSubtarget
301 #include "AMDGPUGenGlobalISel.inc"
302 #undef GET_GLOBALISEL_PREDICATES_DECL
303 #undef AMDGPUSubtarget
304 
305 #define GET_GLOBALISEL_TEMPORARIES_DECL
306 #include "AMDGPUGenGlobalISel.inc"
307 #undef GET_GLOBALISEL_TEMPORARIES_DECL
308 };
309 
310 } // End llvm namespace.
311 #endif
312