1 //===- ARMInstructionSelector.cpp ----------------------------*- C++ -*-==//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 /// This file implements the targeting of the InstructionSelector class for ARM.
11 /// \todo This should be generated by TableGen.
12 //===----------------------------------------------------------------------===//
14 #include "ARMRegisterBankInfo.h"
15 #include "ARMSubtarget.h"
16 #include "ARMTargetMachine.h"
17 #include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
18 #include "llvm/CodeGen/MachineRegisterInfo.h"
19 #include "llvm/Support/Debug.h"
21 #define DEBUG_TYPE "arm-isel"
25 #ifndef LLVM_BUILD_GLOBAL_ISEL
26 #error "You shouldn't build this"
31 #define GET_GLOBALISEL_PREDICATE_BITSET
32 #include "ARMGenGlobalISel.inc"
33 #undef GET_GLOBALISEL_PREDICATE_BITSET
// ARM implementation of the GlobalISel InstructionSelector interface.
// Declares the hand-written entry point select(), the selectImpl() hook, the
// target objects the selector works with, and the predicate/temporary
// declarations pulled in from ARMGenGlobalISel.inc.
35 class ARMInstructionSelector : public InstructionSelector {
// Builds a selector from the target machine, the subtarget and the register
// bank information.
37 ARMInstructionSelector(const ARMBaseTargetMachine &TM, const ARMSubtarget &STI,
38 const ARMRegisterBankInfo &RBI);
// Selects a single instruction; overrides the base class entry point.
40 bool select(MachineInstr &I) const override;
// NOTE(review): presumably defined by the GET_GLOBALISEL_IMPL section of
// ARMGenGlobalISel.inc that is included further down in this file - confirm.
43 bool selectImpl(MachineInstr &I) const;
// Target objects used during selection. TII and TRI are obtained from the
// subtarget in the constructor; TM, RBI and STI are the constructor arguments.
45 const ARMBaseInstrInfo &TII;
46 const ARMBaseRegisterInfo &TRI;
47 const ARMBaseTargetMachine &TM;
48 const ARMRegisterBankInfo &RBI;
49 const ARMSubtarget &STI;
// Predicate declarations coming from the GET_GLOBALISEL_PREDICATES_DECL section
// of ARMGenGlobalISel.inc.
51 #define GET_GLOBALISEL_PREDICATES_DECL
52 #include "ARMGenGlobalISel.inc"
53 #undef GET_GLOBALISEL_PREDICATES_DECL
55 // We declare the temporaries used by selectImpl() in the class to minimize the
56 // cost of constructing placeholder values.
57 #define GET_GLOBALISEL_TEMPORARIES_DECL
58 #include "ARMGenGlobalISel.inc"
59 #undef GET_GLOBALISEL_TEMPORARIES_DECL
61 } // end anonymous namespace
// Factory function: allocates an ARMInstructionSelector with `new` from the
// given target machine, subtarget and register bank info, and returns it.
// NOTE(review): the caller presumably takes ownership of the returned object -
// confirm against the call site.
65 createARMInstructionSelector(const ARMBaseTargetMachine &TM,
66 const ARMSubtarget &STI,
67 const ARMRegisterBankInfo &RBI) {
68 return new ARMInstructionSelector(TM, STI, RBI);
// File-level variable initialised to 0.
// NOTE(review): presumably only exists because the generated code included
// below refers to a name `zero_reg` - confirm before removing or renaming.
72 unsigned zero_reg = 0;
// Pull in the GET_GLOBALISEL_IMPL section of ARMGenGlobalISel.inc.
74 #define GET_GLOBALISEL_IMPL
75 #include "ARMGenGlobalISel.inc"
76 #undef GET_GLOBALISEL_IMPL
// Constructor. Takes the instruction info and register info from the
// subtarget, stores references to the target machine, register bank info and
// subtarget, and then continues the member initializer list with whatever the
// PREDICATES_INIT and TEMPORARIES_INIT sections of ARMGenGlobalISel.inc expand
// to.
78 ARMInstructionSelector::ARMInstructionSelector(const ARMBaseTargetMachine &TM,
79 const ARMSubtarget &STI,
80 const ARMRegisterBankInfo &RBI)
81 : InstructionSelector(), TII(*STI.getInstrInfo()),
82 TRI(*STI.getRegisterInfo()), TM(TM), RBI(RBI), STI(STI),
// The two includes below are part of the initializer list started above.
83 #define GET_GLOBALISEL_PREDICATES_INIT
84 #include "ARMGenGlobalISel.inc"
85 #undef GET_GLOBALISEL_PREDICATES_INIT
86 #define GET_GLOBALISEL_TEMPORARIES_INIT
87 #include "ARMGenGlobalISel.inc"
88 #undef GET_GLOBALISEL_TEMPORARIES_INIT
/// Handle a copy-like instruction by constraining its destination register
/// (operand 0) to a register class derived from the destination's register
/// bank and size.
///
/// \param I    the instruction whose operand 0 is the destination.
/// \param TII  used to print the opcode name in the debug message.
/// \param MRI  register info used to query the type and constrain the register.
/// \param TRI  passed to the register bank lookup.
/// \param RBI  used to look up the register bank and to constrain the register.
92 static bool selectCopy(MachineInstr &I, const TargetInstrInfo &TII,
93 MachineRegisterInfo &MRI, const TargetRegisterInfo &TRI,
94 const RegisterBankInfo &RBI) {
95 unsigned DstReg = I.getOperand(0).getReg();
// Physical destination registers are checked for before any bank lookup.
96 if (TargetRegisterInfo::isPhysicalRegister(DstReg))
99 const RegisterBank *RegBank = RBI.getRegBank(DstReg, MRI, TRI);
101 assert(RegBank && "Can't get reg bank for virtual register");
103 const unsigned DstSize = MRI.getType(DstReg).getSizeInBits();
// Only the GPR and FPR banks are expected here.
104 assert((RegBank->getID() == ARM::GPRRegBankID ||
105 RegBank->getID() == ARM::FPRRegBankID) &&
106 "Unsupported reg bank");
// Default to the GPR class; the FPR bank overrides this below.
108 const TargetRegisterClass *RC = &ARM::GPRRegClass;
// For the FPR bank the class depends on the destination size: SPR or, for a
// 64-bit destination, DPR. Any other size is treated as unreachable.
110 if (RegBank->getID() == ARM::FPRRegBankID) {
112 RC = &ARM::SPRRegClass;
113 else if (DstSize == 64)
114 RC = &ARM::DPRRegClass;
116 llvm_unreachable("Unsupported destination size");
119 // No need to constrain SrcReg. It will get constrained when
120 // we hit another of its uses or its defs.
121 // Copies do not have constraints.
// A failure to constrain the destination is reported through DEBUG output.
122 if (!RBI.constrainGenericRegister(DstReg, *RC, MRI)) {
123 DEBUG(dbgs() << "Failed to constrain " << TII.getName(I.getOpcode())
/// Rewrite a G_SEQUENCE in place into ARM::VMOVDRR.
///
/// The instruction wrapped by \p MIB is expected to have a 64-bit FPR-bank
/// register as operand 0 and 32-bit GPR-bank registers as operands 1 and 3;
/// operands 2 and 4 are dropped. Requires VFP2 (asserted).
///
/// \param MIB  builder wrapping the instruction to rewrite.
/// \param TII  provides the subtarget check and the VMOVDRR descriptor.
/// \param MRI  used to query operand types.
/// \param TRI  passed to the register bank lookups.
/// \param RBI  used to look up operand register banks.
130 static bool selectSequence(MachineInstrBuilder &MIB,
131 const ARMBaseInstrInfo &TII,
132 MachineRegisterInfo &MRI,
133 const TargetRegisterInfo &TRI,
134 const RegisterBankInfo &RBI) {
135 assert(TII.getSubtarget().hasVFP2() && "Can't select sequence without VFP");
137 // We only support G_SEQUENCE as a way to stick together two scalar GPRs
// into a single 64-bit register on the FPR bank.
// Operand 0: the 64-bit result on the FPR bank.
139 unsigned VReg0 = MIB->getOperand(0).getReg();
141 assert(MRI.getType(VReg0).getSizeInBits() == 64 &&
142 RBI.getRegBank(VReg0, MRI, TRI)->getID() == ARM::FPRRegBankID &&
143 "Unsupported operand for G_SEQUENCE");
// Operand 1: first 32-bit source on the GPR bank.
144 unsigned VReg1 = MIB->getOperand(1).getReg();
146 assert(MRI.getType(VReg1).getSizeInBits() == 32 &&
147 RBI.getRegBank(VReg1, MRI, TRI)->getID() == ARM::GPRRegBankID &&
148 "Unsupported operand for G_SEQUENCE");
// Operand 3: second 32-bit source on the GPR bank (operand 2 is skipped).
149 unsigned VReg2 = MIB->getOperand(3).getReg();
151 assert(MRI.getType(VReg2).getSizeInBits() == 32 &&
152 RBI.getRegBank(VReg2, MRI, TRI)->getID() == ARM::GPRRegBankID &&
153 "Unsupported operand for G_SEQUENCE");
155 // Remove the operands corresponding to the offsets.
// NOTE(review): the higher index is removed first, presumably so that index 2
// still refers to the intended operand afterwards - confirm.
156 MIB->RemoveOperand(4);
157 MIB->RemoveOperand(2);
// Switch the opcode and append the ARMCC::AL predicate operands.
159 MIB->setDesc(TII.get(ARM::VMOVDRR));
160 MIB.add(predOps(ARMCC::AL));
/// Rewrite a G_EXTRACT in place into ARM::VGETLNi32.
///
/// The instruction wrapped by \p MIB is expected to have a 32-bit GPR-bank
/// register as operand 0, a 64-bit FPR-bank register as operand 1 and an
/// immediate that is a multiple of 32 as operand 2. Requires VFP2 (asserted).
///
/// \param MIB  builder wrapping the instruction to rewrite.
/// \param TII  provides the subtarget check and the VGETLNi32 descriptor.
/// \param MRI  used to query operand types.
/// \param TRI  passed to the register bank lookups.
/// \param RBI  used to look up operand register banks.
165 static bool selectExtract(MachineInstrBuilder &MIB, const ARMBaseInstrInfo &TII,
166 MachineRegisterInfo &MRI,
167 const TargetRegisterInfo &TRI,
168 const RegisterBankInfo &RBI) {
169 assert(TII.getSubtarget().hasVFP2() && "Can't select extract without VFP");
171 // We only support G_EXTRACT as a way to break up one DPR into two GPRs.
// Operand 0: the 32-bit result on the GPR bank.
172 unsigned VReg0 = MIB->getOperand(0).getReg();
174 assert(MRI.getType(VReg0).getSizeInBits() == 32 &&
175 RBI.getRegBank(VReg0, MRI, TRI)->getID() == ARM::GPRRegBankID &&
176 "Unsupported operand for G_EXTRACT");
// Operand 1: the 64-bit source on the FPR bank.
177 unsigned VReg1 = MIB->getOperand(1).getReg();
179 assert(MRI.getType(VReg1).getSizeInBits() == 64 &&
180 RBI.getRegBank(VReg1, MRI, TRI)->getID() == ARM::FPRRegBankID &&
181 "Unsupported operand for G_EXTRACT");
// Operand 2: the offset immediate, which must be a multiple of 32.
182 assert(MIB->getOperand(2).getImm() % 32 == 0 &&
183 "Unsupported operand for G_EXTRACT");
185 // Rescale the offset in operand 2 by dividing it by 32 (no operand is
// removed here). NOTE(review): the result is presumably the 32-bit lane index
// that VGETLNi32 expects - confirm.
186 MIB->getOperand(2).setImm(MIB->getOperand(2).getImm() / 32);
// Switch the opcode and append the ARMCC::AL predicate operands.
188 MIB->setDesc(TII.get(ARM::VGETLNi32));
189 MIB.add(predOps(ARMCC::AL));
194 /// Select the opcode for simple extensions (that translate to a single SXT/UXT
195 /// instruction). Extension operations more complicated than that should not
196 /// invoke this. Returns the original opcode if it doesn't know how to select a
/// better one.
///
/// \param Opc   the generic opcode being selected.
/// \param Size  the source size; only 8 and 16 get past the size guard below.
198 static unsigned selectSimpleExtOpc(unsigned Opc, unsigned Size) {
199 using namespace TargetOpcode;
// Sizes other than 8 and 16 are filtered out first.
201 if (Size != 8 && Size != 16)
// SXTB/UXTB are picked for Size == 8, SXTH/UXTH otherwise (i.e. Size == 16).
205 return Size == 8 ? ARM::SXTB : ARM::SXTH;
208 return Size == 8 ? ARM::UXTB : ARM::UXTH;
213 /// Select the opcode for simple loads and stores. For types smaller than 32
214 /// bits, the value will be zero extended. Returns the original opcode if it
215 /// doesn't know how to select a better one.
///
/// \param Opc      the generic opcode; G_STORE selects the store variant of
///                 each pair below, anything else the load variant.
/// \param RegBank  register bank ID; the GPR and FPR banks are handled.
216 static unsigned selectLoadStoreOpCode(unsigned Opc, unsigned RegBank,
218 bool isStore = Opc == TargetOpcode::G_STORE;
// GPR bank candidates: STRBi12/LDRBi12, STRH/LDRH and STRi12/LDRi12.
// NOTE(review): presumably chosen by value size - confirm.
220 if (RegBank == ARM::GPRRegBankID) {
224 return isStore ? ARM::STRBi12 : ARM::LDRBi12;
226 return isStore ? ARM::STRH : ARM::LDRH;
228 return isStore ? ARM::STRi12 : ARM::LDRi12;
// FPR bank candidates: VSTRS/VLDRS and VSTRD/VLDRD.
// NOTE(review): presumably chosen by value size - confirm.
234 if (RegBank == ARM::FPRRegBankID) {
237 return isStore ? ARM::VSTRS : ARM::VLDRS;
239 return isStore ? ARM::VSTRD : ARM::VLDRD;
// Select a single instruction. The instruction must already be inside a basic
// block that belongs to a function (asserted). Opcodes that are not pre-ISel
// generic opcodes are handled up front; the remaining opcodes are dispatched
// through the switch below, which rewrites the instruction in place, and the
// final step constrains the register operands of the rewritten instruction.
248 bool ARMInstructionSelector::select(MachineInstr &I) const {
249 assert(I.getParent() && "Instruction should be in a basic block!");
250 assert(I.getParent()->getParent() && "Instruction should be in a function!");
252 auto &MBB = *I.getParent();
253 auto &MF = *MBB.getParent();
254 auto &MRI = MF.getRegInfo();
// Instructions that are not generic: copies are handed to selectCopy().
256 if (!isPreISelGenericOpcode(I.getOpcode())) {
258 return selectCopy(I, TII, MRI, TRI, RBI);
// Builder wrapping I so that extra operands can be appended to it in place.
266 MachineInstrBuilder MIB{MF, I};
269 using namespace TargetOpcode;
270 switch (I.getOpcode()) {
// Extensions: only 32-bit destinations are supported for now.
275 LLT DstTy = MRI.getType(I.getOperand(0).getReg());
276 // FIXME: Smaller destination sizes coming soon!
277 if (DstTy.getSizeInBits() != 32) {
278 DEBUG(dbgs() << "Unsupported destination size for extension");
282 LLT SrcTy = MRI.getType(I.getOperand(1).getReg());
283 unsigned SrcSize = SrcTy.getSizeInBits();
286 // ZExt boils down to & 0x1; for SExt we also subtract that from 0
287 I.setDesc(TII.get(ARM::ANDri));
288 MIB.addImm(1).add(predOps(ARMCC::AL)).add(condCodeOp());
// Remember the original destination; the AND is redirected to a fresh
// register so that a following RSBri can produce the final result.
291 unsigned SExtResult = I.getOperand(0).getReg();
293 // Use a new virtual register for the result of the AND
294 unsigned AndResult = MRI.createVirtualRegister(&ARM::GPRRegClass);
295 I.getOperand(0).setReg(AndResult);
// The RSBri is inserted immediately after I.
297 auto InsertBefore = std::next(I.getIterator());
299 BuildMI(MBB, InsertBefore, I.getDebugLoc(), TII.get(ARM::RSBri))
303 .add(predOps(ARMCC::AL))
// The newly built instruction needs its register operands constrained too.
305 if (!constrainSelectedInstRegOperands(*SubI, TII, TRI, RBI))
// Simple extensions map to a single SXT/UXT opcode; an unchanged opcode means
// selectSimpleExtOpc() could not pick one.
312 unsigned NewOpc = selectSimpleExtOpc(I.getOpcode(), SrcSize);
313 if (NewOpc == I.getOpcode())
315 I.setDesc(TII.get(NewOpc));
316 MIB.addImm(0).add(predOps(ARMCC::AL));
320 DEBUG(dbgs() << "Unsupported source size for extension");
327 // The high bits are undefined, so there's nothing special to do, just
328 // treat it as a copy.
329 auto SrcReg = I.getOperand(1).getReg();
330 auto DstReg = I.getOperand(0).getReg();
332 const auto &SrcRegBank = *RBI.getRegBank(SrcReg, MRI, TRI);
333 const auto &DstRegBank = *RBI.getRegBank(DstReg, MRI, TRI);
// Source and destination must live on the same bank, and that bank must be
// the GPR bank.
335 if (SrcRegBank.getID() != DstRegBank.getID()) {
336 DEBUG(dbgs() << "G_TRUNC/G_ANYEXT operands on different register banks\n");
340 if (SrcRegBank.getID() != ARM::GPRRegBankID) {
341 DEBUG(dbgs() << "G_TRUNC/G_ANYEXT on non-GPR not supported yet\n");
345 I.setDesc(TII.get(COPY));
346 return selectCopy(I, TII, MRI, TRI, RBI);
// Rewrite to ADDrr, appending the ARMCC::AL predicate operands and the
// operand produced by condCodeOp().
349 I.setDesc(TII.get(ARM::ADDrr));
350 MIB.add(predOps(ARMCC::AL)).add(condCodeOp());
353 // Add 0 to the given frame index and hope it will eventually be folded into
// its users.
355 I.setDesc(TII.get(ARM::ADDri));
356 MIB.addImm(0).add(predOps(ARMCC::AL)).add(condCodeOp());
// Constants: only 32-bit values living on the GPR bank are handled, via MOVi.
359 unsigned Reg = I.getOperand(0).getReg();
360 if (MRI.getType(Reg).getSizeInBits() != 32)
363 assert(RBI.getRegBank(Reg, MRI, TRI)->getID() == ARM::GPRRegBankID &&
364 "Expected constant to live in a GPR");
365 I.setDesc(TII.get(ARM::MOVi));
366 MIB.add(predOps(ARMCC::AL)).add(condCodeOp());
// Operand 1 holds the constant; values wider than 32 bits are checked for
// before it is converted to a plain immediate (zero-extended value).
368 auto &Val = I.getOperand(1);
370 if (Val.getCImm()->getBitWidth() > 32)
372 Val.ChangeToImmediate(Val.getCImm()->getZExtValue());
// Loads and stores: the first memory operand is inspected and atomic accesses
// are not supported.
383 const auto &MemOp = **I.memoperands_begin();
384 if (MemOp.getOrdering() != AtomicOrdering::NotAtomic) {
385 DEBUG(dbgs() << "Atomic load/store not supported yet\n");
389 unsigned Reg = I.getOperand(0).getReg();
390 unsigned RegBank = RBI.getRegBank(Reg, MRI, TRI)->getID();
392 LLT ValTy = MRI.getType(Reg);
393 const auto ValSize = ValTy.getSizeInBits();
395 assert((ValSize != 64 || TII.getSubtarget().hasVFP2()) &&
396 "Don't know how to load/store 64-bit value without VFP");
// A result that is still G_LOAD/G_STORE means no target opcode was found.
398 const auto NewOpc = selectLoadStoreOpCode(I.getOpcode(), RegBank, ValSize);
399 if (NewOpc == G_LOAD || NewOpc == G_STORE)
402 I.setDesc(TII.get(NewOpc));
404 if (NewOpc == ARM::LDRH || NewOpc == ARM::STRH)
405 // LDRH has a funny addressing mode (there's already a FIXME for it).
// An immediate of 0 and the ARMCC::AL predicate operands are appended.
407 MIB.addImm(0).add(predOps(ARMCC::AL));
// Delegates to the static helper selectSequence() defined earlier in this file.
411 if (!selectSequence(MIB, TII, MRI, TRI, RBI))
// Delegates to the static helper selectExtract() defined earlier in this file.
416 if (!selectExtract(MIB, TII, MRI, TRI, RBI))
// Finally constrain the register operands of the rewritten instruction.
424 return constrainSelectedInstRegOperands(I, TII, TRI, RBI);