]> CyberLeo.Net >> Repos - FreeBSD/FreeBSD.git/blob - contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.h
Import tzdata 2020b
[FreeBSD/FreeBSD.git] / contrib / llvm-project / llvm / lib / Target / AMDGPU / AMDGPUInstructionSelector.h
1 //===- AMDGPUInstructionSelector --------------------------------*- C++ -*-==//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 /// \file
9 /// This file declares the targeting of the InstructionSelector class for
10 /// AMDGPU.
11 //===----------------------------------------------------------------------===//
12
13 #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUINSTRUCTIONSELECTOR_H
14 #define LLVM_LIB_TARGET_AMDGPU_AMDGPUINSTRUCTIONSELECTOR_H
15
16 #include "AMDGPU.h"
17 #include "AMDGPUArgumentUsageInfo.h"
18 #include "llvm/ADT/ArrayRef.h"
19 #include "llvm/ADT/SmallVector.h"
20 #include "llvm/CodeGen/Register.h"
21 #include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
22 #include "llvm/IR/InstrTypes.h"
23
24 namespace {
25 #define GET_GLOBALISEL_PREDICATE_BITSET
26 #define AMDGPUSubtarget GCNSubtarget
27 #include "AMDGPUGenGlobalISel.inc"
28 #undef GET_GLOBALISEL_PREDICATE_BITSET
29 #undef AMDGPUSubtarget
30 }
31
32 namespace llvm {
33
34 namespace AMDGPU {
35 struct ImageDimIntrinsicInfo;
36 }
37
38 class AMDGPUInstrInfo;
39 class AMDGPURegisterBankInfo;
40 class GCNSubtarget;
41 class MachineInstr;
42 class MachineIRBuilder;
43 class MachineOperand;
44 class MachineRegisterInfo;
45 class RegisterBank;
46 class SIInstrInfo;
47 class SIMachineFunctionInfo;
48 class SIRegisterInfo;
49
50 class AMDGPUInstructionSelector : public InstructionSelector {
51 private:
52   MachineRegisterInfo *MRI;
53
54 public:
55   AMDGPUInstructionSelector(const GCNSubtarget &STI,
56                             const AMDGPURegisterBankInfo &RBI,
57                             const AMDGPUTargetMachine &TM);
58
59   bool select(MachineInstr &I) override;
60   static const char *getName();
61
62   void setupMF(MachineFunction &MF, GISelKnownBits &KB,
63                CodeGenCoverage &CoverageInfo) override;
64
65 private:
66   struct GEPInfo {
67     const MachineInstr &GEP;
68     SmallVector<unsigned, 2> SgprParts;
69     SmallVector<unsigned, 2> VgprParts;
70     int64_t Imm;
71     GEPInfo(const MachineInstr &GEP) : GEP(GEP), Imm(0) { }
72   };
73
74   bool isInstrUniform(const MachineInstr &MI) const;
75   bool isVCC(Register Reg, const MachineRegisterInfo &MRI) const;
76
77   const RegisterBank *getArtifactRegBank(
78     Register Reg, const MachineRegisterInfo &MRI,
79     const TargetRegisterInfo &TRI) const;
80
81   /// tblgen-erated 'select' implementation.
82   bool selectImpl(MachineInstr &I, CodeGenCoverage &CoverageInfo) const;
83
84   MachineOperand getSubOperand64(MachineOperand &MO,
85                                  const TargetRegisterClass &SubRC,
86                                  unsigned SubIdx) const;
87
88   bool constrainCopyLikeIntrin(MachineInstr &MI, unsigned NewOpc) const;
89   bool selectCOPY(MachineInstr &I) const;
90   bool selectPHI(MachineInstr &I) const;
91   bool selectG_TRUNC(MachineInstr &I) const;
92   bool selectG_SZA_EXT(MachineInstr &I) const;
93   bool selectG_CONSTANT(MachineInstr &I) const;
94   bool selectG_FNEG(MachineInstr &I) const;
95   bool selectG_FABS(MachineInstr &I) const;
96   bool selectG_AND_OR_XOR(MachineInstr &I) const;
97   bool selectG_ADD_SUB(MachineInstr &I) const;
98   bool selectG_UADDO_USUBO_UADDE_USUBE(MachineInstr &I) const;
99   bool selectG_EXTRACT(MachineInstr &I) const;
100   bool selectG_MERGE_VALUES(MachineInstr &I) const;
101   bool selectG_UNMERGE_VALUES(MachineInstr &I) const;
102   bool selectG_BUILD_VECTOR_TRUNC(MachineInstr &I) const;
103   bool selectG_PTR_ADD(MachineInstr &I) const;
104   bool selectG_IMPLICIT_DEF(MachineInstr &I) const;
105   bool selectG_INSERT(MachineInstr &I) const;
106
107   bool selectInterpP1F16(MachineInstr &MI) const;
108   bool selectDivScale(MachineInstr &MI) const;
109   bool selectIntrinsicIcmp(MachineInstr &MI) const;
110   bool selectBallot(MachineInstr &I) const;
111   bool selectG_INTRINSIC(MachineInstr &I) const;
112
113   bool selectEndCfIntrinsic(MachineInstr &MI) const;
114   bool selectDSOrderedIntrinsic(MachineInstr &MI, Intrinsic::ID IID) const;
115   bool selectDSGWSIntrinsic(MachineInstr &MI, Intrinsic::ID IID) const;
116   bool selectDSAppendConsume(MachineInstr &MI, bool IsAppend) const;
117
118   bool selectImageIntrinsic(MachineInstr &MI,
119                             const AMDGPU::ImageDimIntrinsicInfo *Intr) const;
120   bool selectG_INTRINSIC_W_SIDE_EFFECTS(MachineInstr &I) const;
121   int getS_CMPOpcode(CmpInst::Predicate P, unsigned Size) const;
122   bool selectG_ICMP(MachineInstr &I) const;
123   bool hasVgprParts(ArrayRef<GEPInfo> AddrInfo) const;
124   void getAddrModeInfo(const MachineInstr &Load, const MachineRegisterInfo &MRI,
125                        SmallVectorImpl<GEPInfo> &AddrInfo) const;
126   bool selectSMRD(MachineInstr &I, ArrayRef<GEPInfo> AddrInfo) const;
127
128   void initM0(MachineInstr &I) const;
129   bool selectG_LOAD_ATOMICRMW(MachineInstr &I) const;
130   bool selectG_AMDGPU_ATOMIC_CMPXCHG(MachineInstr &I) const;
131   bool selectG_STORE(MachineInstr &I) const;
132   bool selectG_SELECT(MachineInstr &I) const;
133   bool selectG_BRCOND(MachineInstr &I) const;
134   bool selectG_FRAME_INDEX_GLOBAL_VALUE(MachineInstr &I) const;
135   bool selectG_PTRMASK(MachineInstr &I) const;
136   bool selectG_EXTRACT_VECTOR_ELT(MachineInstr &I) const;
137   bool selectG_INSERT_VECTOR_ELT(MachineInstr &I) const;
138   bool selectG_SHUFFLE_VECTOR(MachineInstr &I) const;
139
140   std::pair<Register, unsigned>
141   selectVOP3ModsImpl(MachineOperand &Root) const;
142
143   InstructionSelector::ComplexRendererFns
144   selectVCSRC(MachineOperand &Root) const;
145
146   InstructionSelector::ComplexRendererFns
147   selectVSRC0(MachineOperand &Root) const;
148
149   InstructionSelector::ComplexRendererFns
150   selectVOP3Mods0(MachineOperand &Root) const;
151   InstructionSelector::ComplexRendererFns
152   selectVOP3OMods(MachineOperand &Root) const;
153   InstructionSelector::ComplexRendererFns
154   selectVOP3Mods(MachineOperand &Root) const;
155
156   ComplexRendererFns selectVOP3NoMods(MachineOperand &Root) const;
157
158   InstructionSelector::ComplexRendererFns
159   selectVOP3Mods_nnan(MachineOperand &Root) const;
160
161   std::pair<Register, unsigned>
162   selectVOP3PModsImpl(Register Src, const MachineRegisterInfo &MRI) const;
163
164   InstructionSelector::ComplexRendererFns
165   selectVOP3PMods(MachineOperand &Root) const;
166
167   InstructionSelector::ComplexRendererFns
168   selectVOP3OpSelMods(MachineOperand &Root) const;
169
170   InstructionSelector::ComplexRendererFns
171   selectSmrdImm(MachineOperand &Root) const;
172   InstructionSelector::ComplexRendererFns
173   selectSmrdImm32(MachineOperand &Root) const;
174   InstructionSelector::ComplexRendererFns
175   selectSmrdSgpr(MachineOperand &Root) const;
176
177   template <bool Signed>
178   InstructionSelector::ComplexRendererFns
179   selectFlatOffsetImpl(MachineOperand &Root) const;
180   InstructionSelector::ComplexRendererFns
181   selectFlatOffset(MachineOperand &Root) const;
182
183   InstructionSelector::ComplexRendererFns
184   selectFlatOffsetSigned(MachineOperand &Root) const;
185
186   InstructionSelector::ComplexRendererFns
187   selectMUBUFScratchOffen(MachineOperand &Root) const;
188   InstructionSelector::ComplexRendererFns
189   selectMUBUFScratchOffset(MachineOperand &Root) const;
190
191   bool isDSOffsetLegal(Register Base, int64_t Offset,
192                        unsigned OffsetBits) const;
193
194   std::pair<Register, unsigned>
195   selectDS1Addr1OffsetImpl(MachineOperand &Root) const;
196   InstructionSelector::ComplexRendererFns
197   selectDS1Addr1Offset(MachineOperand &Root) const;
198
199   std::pair<Register, unsigned>
200   selectDS64Bit4ByteAlignedImpl(MachineOperand &Root) const;
201   InstructionSelector::ComplexRendererFns
202   selectDS64Bit4ByteAligned(MachineOperand &Root) const;
203
204   std::pair<Register, int64_t>
205   getPtrBaseWithConstantOffset(Register Root,
206                                const MachineRegisterInfo &MRI) const;
207
208   // Parse out a chain of up to two g_ptr_add instructions.
209   // g_ptr_add (n0, _)
210   // g_ptr_add (n0, (n1 = g_ptr_add n2, n3))
211   struct MUBUFAddressData {
212     Register N0, N2, N3;
213     int64_t Offset = 0;
214   };
215
216   bool shouldUseAddr64(MUBUFAddressData AddrData) const;
217
218   void splitIllegalMUBUFOffset(MachineIRBuilder &B,
219                                Register &SOffset, int64_t &ImmOffset) const;
220
221   MUBUFAddressData parseMUBUFAddress(Register Src) const;
222
223   bool selectMUBUFAddr64Impl(MachineOperand &Root, Register &VAddr,
224                              Register &RSrcReg, Register &SOffset,
225                              int64_t &Offset) const;
226
227   bool selectMUBUFOffsetImpl(MachineOperand &Root, Register &RSrcReg,
228                              Register &SOffset, int64_t &Offset) const;
229
230   InstructionSelector::ComplexRendererFns
231   selectMUBUFAddr64(MachineOperand &Root) const;
232
233   InstructionSelector::ComplexRendererFns
234   selectMUBUFOffset(MachineOperand &Root) const;
235
236   InstructionSelector::ComplexRendererFns
237   selectMUBUFOffsetAtomic(MachineOperand &Root) const;
238
239   InstructionSelector::ComplexRendererFns
240   selectMUBUFAddr64Atomic(MachineOperand &Root) const;
241
242   ComplexRendererFns selectSMRDBufferImm(MachineOperand &Root) const;
243   ComplexRendererFns selectSMRDBufferImm32(MachineOperand &Root) const;
244
245   void renderTruncImm32(MachineInstrBuilder &MIB, const MachineInstr &MI,
246                         int OpIdx = -1) const;
247
248   void renderTruncTImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
249                        int OpIdx) const;
250
251   void renderTruncTImm1(MachineInstrBuilder &MIB, const MachineInstr &MI,
252                         int OpIdx) const {
253     renderTruncTImm(MIB, MI, OpIdx);
254   }
255
256   void renderTruncTImm8(MachineInstrBuilder &MIB, const MachineInstr &MI,
257                         int OpIdx) const {
258     renderTruncTImm(MIB, MI, OpIdx);
259   }
260
261   void renderTruncTImm16(MachineInstrBuilder &MIB, const MachineInstr &MI,
262                         int OpIdx) const {
263     renderTruncTImm(MIB, MI, OpIdx);
264   }
265
266   void renderTruncTImm32(MachineInstrBuilder &MIB, const MachineInstr &MI,
267                         int OpIdx) const {
268     renderTruncTImm(MIB, MI, OpIdx);
269   }
270
271   void renderNegateImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
272                        int OpIdx) const;
273
274   void renderBitcastImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
275                         int OpIdx) const;
276
277   void renderPopcntImm(MachineInstrBuilder &MIB, const MachineInstr &MI,
278                        int OpIdx) const;
279   void renderExtractGLC(MachineInstrBuilder &MIB, const MachineInstr &MI,
280                         int OpIdx) const;
281   void renderExtractSLC(MachineInstrBuilder &MIB, const MachineInstr &MI,
282                         int OpIdx) const;
283   void renderExtractDLC(MachineInstrBuilder &MIB, const MachineInstr &MI,
284                         int OpIdx) const;
285   void renderExtractSWZ(MachineInstrBuilder &MIB, const MachineInstr &MI,
286                         int OpIdx) const;
287
288   bool isInlineImmediate16(int64_t Imm) const;
289   bool isInlineImmediate32(int64_t Imm) const;
290   bool isInlineImmediate64(int64_t Imm) const;
291   bool isInlineImmediate(const APFloat &Imm) const;
292
293   const SIInstrInfo &TII;
294   const SIRegisterInfo &TRI;
295   const AMDGPURegisterBankInfo &RBI;
296   const AMDGPUTargetMachine &TM;
297   const GCNSubtarget &STI;
298   bool EnableLateStructurizeCFG;
299 #define GET_GLOBALISEL_PREDICATES_DECL
300 #define AMDGPUSubtarget GCNSubtarget
301 #include "AMDGPUGenGlobalISel.inc"
302 #undef GET_GLOBALISEL_PREDICATES_DECL
303 #undef AMDGPUSubtarget
304
305 #define GET_GLOBALISEL_TEMPORARIES_DECL
306 #include "AMDGPUGenGlobalISel.inc"
307 #undef GET_GLOBALISEL_TEMPORARIES_DECL
308 };
309
310 } // End llvm namespace.
311 #endif