1 //===-- LanaiMemAluCombiner.cpp - Pass to combine memory & ALU operations -===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
9 // Simple pass to combine memory and ALU operations
11 // The Lanai ISA supports instructions where a load/store modifies the base
12 // register used in the load/store operation. This pass finds suitable
13 // load/store and ALU instructions and combines them into one instruction.
16 // ld [ %r6 -- ], %r12
17 // is a supported instruction that is not currently generated by the instruction
18 // selection pass of this backend. This pass generates these instructions by
23 // in the same machine basic block into one machine instruction.
24 //===----------------------------------------------------------------------===//
27 #include "LanaiTargetMachine.h"
28 #include "llvm/ADT/SmallSet.h"
29 #include "llvm/ADT/Statistic.h"
30 #include "llvm/CodeGen/MachineFunctionPass.h"
31 #include "llvm/CodeGen/MachineInstrBuilder.h"
32 #include "llvm/CodeGen/RegisterScavenging.h"
33 #include "llvm/CodeGen/TargetInstrInfo.h"
34 #include "llvm/Support/CommandLine.h"
37 #define GET_INSTRMAP_INFO
38 #include "LanaiGenInstrInfo.inc"
40 #define DEBUG_TYPE "lanai-mem-alu-combiner"
42 STATISTIC(NumLdStAluCombined, "Number of memory and ALU instructions combined");
44 static llvm::cl::opt<bool> DisableMemAluCombiner(
45 "disable-lanai-mem-alu-combiner", llvm::cl::init(false),
46 llvm::cl::desc("Do not combine ALU and memory operators"),
50 void initializeLanaiMemAluCombinerPass(PassRegistry &);
54 typedef MachineBasicBlock::iterator MbbIterator;
55 typedef MachineFunction::iterator MfIterator;
57 class LanaiMemAluCombiner : public MachineFunctionPass {
60 explicit LanaiMemAluCombiner() : MachineFunctionPass(ID) {
61 initializeLanaiMemAluCombinerPass(*PassRegistry::getPassRegistry());
64 StringRef getPassName() const override {
65 return "Lanai load / store optimization pass";
68 bool runOnMachineFunction(MachineFunction &F) override;
70 MachineFunctionProperties getRequiredProperties() const override {
71 return MachineFunctionProperties().set(
72 MachineFunctionProperties::Property::NoVRegs);
76 MbbIterator findClosestSuitableAluInstr(MachineBasicBlock *BB,
77 const MbbIterator &MemInstr,
79 void insertMergedInstruction(MachineBasicBlock *BB,
80 const MbbIterator &MemInstr,
81 const MbbIterator &AluInstr, bool Before);
82 bool combineMemAluInBasicBlock(MachineBasicBlock *BB);
84 // Target machine description which we query for register names, data
86 const TargetInstrInfo *TII;
90 char LanaiMemAluCombiner::ID = 0;
92 INITIALIZE_PASS(LanaiMemAluCombiner, DEBUG_TYPE,
93 "Lanai memory ALU combiner pass", false, false)
96 bool isSpls(uint16_t Opcode) { return Lanai::splsIdempotent(Opcode) == Opcode; }
98 // Determine the opcode for the merged instruction created by considering the
99 // old memory operation's opcode and whether the merged opcode will have an
101 unsigned mergedOpcode(unsigned OldOpcode, bool ImmediateOffset) {
106 return Lanai::LDW_RI;
107 return Lanai::LDW_RR;
111 return Lanai::LDHs_RI;
112 return Lanai::LDHs_RR;
116 return Lanai::LDHz_RI;
117 return Lanai::LDHz_RR;
121 return Lanai::LDBs_RI;
122 return Lanai::LDBs_RR;
126 return Lanai::LDBz_RI;
127 return Lanai::LDBz_RR;
136 return Lanai::STB_RI;
137 return Lanai::STB_RR;
141 return Lanai::STH_RI;
142 return Lanai::STH_RR;
148 // Check if the machine instruction has non-volatile memory operands of the type
149 // supported for combining with ALU instructions.
150 bool isNonVolatileMemoryOp(const MachineInstr &MI) {
151 if (!MI.hasOneMemOperand())
154 // Determine if the machine instruction is a supported memory operation by
155 // testing if the computed merge opcode is a valid memory operation opcode.
156 if (mergedOpcode(MI.getOpcode(), false) == 0)
159 const MachineMemOperand *MemOperand = *MI.memoperands_begin();
161 // Don't move volatile memory accesses
162 if (MemOperand->isVolatile())
168 // Test to see if two machine operands are of the same type. This test is less
169 // strict than the MachineOperand::isIdenticalTo function.
170 bool isSameOperand(const MachineOperand &Op1, const MachineOperand &Op2) {
171 if (Op1.getType() != Op2.getType())
174 switch (Op1.getType()) {
175 case MachineOperand::MO_Register:
176 return Op1.getReg() == Op2.getReg();
177 case MachineOperand::MO_Immediate:
178 return Op1.getImm() == Op2.getImm();
184 bool isZeroOperand(const MachineOperand &Op) {
185 return ((Op.isReg() && Op.getReg() == Lanai::R0) ||
186 (Op.isImm() && Op.getImm() == 0));
189 // Determines whether a register is used by an instruction.
190 bool InstrUsesReg(const MbbIterator &Instr, const MachineOperand *Reg) {
191 for (MachineInstr::const_mop_iterator Mop = Instr->operands_begin();
192 Mop != Instr->operands_end(); ++Mop) {
193 if (isSameOperand(*Mop, *Reg))
199 // Converts between machine opcode and AluCode.
200 // Flag using/modifying ALU operations should not be considered for merging and
201 // are omitted from this list.
202 LPAC::AluCode mergedAluCode(unsigned AluOpcode) {
204 case Lanai::ADD_I_LO:
207 case Lanai::SUB_I_LO:
210 case Lanai::AND_I_LO:
216 case Lanai::XOR_I_LO:
228 return LPAC::UNKNOWN;
232 // Insert a new combined memory and ALU operation instruction.
234 // This function builds a new machine instruction using the MachineInstrBuilder
235 // class and inserts it before the memory instruction.
236 void LanaiMemAluCombiner::insertMergedInstruction(MachineBasicBlock *BB,
237 const MbbIterator &MemInstr,
238 const MbbIterator &AluInstr,
240 // Insert new combined load/store + alu operation
241 MachineOperand Dest = MemInstr->getOperand(0);
242 MachineOperand Base = MemInstr->getOperand(1);
243 MachineOperand MemOffset = MemInstr->getOperand(2);
244 MachineOperand AluOffset = AluInstr->getOperand(2);
246 // Abort if ALU offset is not a register or immediate
247 assert((AluOffset.isReg() || AluOffset.isImm()) &&
248 "Unsupported operand type in merge");
250 // Determined merged instructions opcode and ALU code
251 LPAC::AluCode AluOpcode = mergedAluCode(AluInstr->getOpcode());
252 unsigned NewOpc = mergedOpcode(MemInstr->getOpcode(), AluOffset.isImm());
254 assert(AluOpcode != LPAC::UNKNOWN && "Unknown ALU code in merging");
255 assert(NewOpc != 0 && "Unknown merged node opcode");
257 // Build and insert new machine instruction
258 MachineInstrBuilder InstrBuilder =
259 BuildMI(*BB, MemInstr, MemInstr->getDebugLoc(), TII->get(NewOpc));
260 InstrBuilder.addReg(Dest.getReg(), getDefRegState(true));
261 InstrBuilder.addReg(Base.getReg(), getKillRegState(true));
263 // Add offset to machine instruction
264 if (AluOffset.isReg())
265 InstrBuilder.addReg(AluOffset.getReg());
266 else if (AluOffset.isImm())
267 InstrBuilder.addImm(AluOffset.getImm());
269 llvm_unreachable("Unsupported ld/st ALU merge.");
271 // Create a pre-op if the ALU operation preceded the memory operation or the
272 // MemOffset is non-zero (i.e. the memory value should be adjusted before
273 // accessing it), else create a post-op.
274 if (Before || !isZeroOperand(MemOffset))
275 InstrBuilder.addImm(LPAC::makePreOp(AluOpcode));
277 InstrBuilder.addImm(LPAC::makePostOp(AluOpcode));
279 // Transfer memory operands.
280 InstrBuilder->setMemRefs(MemInstr->memoperands_begin(),
281 MemInstr->memoperands_end());
284 // Function determines if ALU operation (in alu_iter) can be combined with
285 // a load/store with base and offset.
286 bool isSuitableAluInstr(bool IsSpls, const MbbIterator &AluIter,
287 const MachineOperand &Base,
288 const MachineOperand &Offset) {
289 // ALU operations have 3 operands
290 if (AluIter->getNumOperands() != 3)
293 MachineOperand &Dest = AluIter->getOperand(0);
294 MachineOperand &Op1 = AluIter->getOperand(1);
295 MachineOperand &Op2 = AluIter->getOperand(2);
297 // Only match instructions using the base register as destination and with the
298 // base and first operand equal
299 if (!isSameOperand(Dest, Base) || !isSameOperand(Dest, Op1))
303 // It is not a match if the 2nd operand in the ALU operation is an
304 // immediate but the ALU operation is not an addition.
305 if (AluIter->getOpcode() != Lanai::ADD_I_LO)
308 if (Offset.isReg() && Offset.getReg() == Lanai::R0)
311 if (Offset.isImm() &&
312 ((Offset.getImm() == 0 &&
313 // Check that the Op2 would fit in the immediate field of the
315 ((IsSpls && isInt<10>(Op2.getImm())) ||
316 (!IsSpls && isInt<16>(Op2.getImm())))) ||
317 Offset.getImm() == Op2.getImm()))
319 } else if (Op2.isReg()) {
320 // The Offset and 2nd operand are both registers and equal
321 if (Offset.isReg() && Op2.getReg() == Offset.getReg())
324 // Only consider operations with register or immediate values
330 MbbIterator LanaiMemAluCombiner::findClosestSuitableAluInstr(
331 MachineBasicBlock *BB, const MbbIterator &MemInstr, const bool Decrement) {
332 MachineOperand *Base = &MemInstr->getOperand(1);
333 MachineOperand *Offset = &MemInstr->getOperand(2);
334 bool IsSpls = isSpls(MemInstr->getOpcode());
336 MbbIterator First = MemInstr;
337 MbbIterator Last = Decrement ? BB->begin() : BB->end();
339 while (First != Last) {
340 Decrement ? --First : ++First;
345 // Skip over debug instructions
346 if (First->isDebugInstr())
349 if (isSuitableAluInstr(IsSpls, First, *Base, *Offset)) {
353 // Usage of the base or offset register is not a form suitable for merging.
355 if (InstrUsesReg(First, Base))
357 if (Offset->isReg() && InstrUsesReg(First, Offset))
365 bool LanaiMemAluCombiner::combineMemAluInBasicBlock(MachineBasicBlock *BB) {
366 bool Modified = false;
368 MbbIterator MBBIter = BB->begin(), End = BB->end();
369 while (MBBIter != End) {
370 bool IsMemOp = isNonVolatileMemoryOp(*MBBIter);
373 MachineOperand AluOperand = MBBIter->getOperand(3);
374 unsigned int DestReg = MBBIter->getOperand(0).getReg(),
375 BaseReg = MBBIter->getOperand(1).getReg();
376 assert(AluOperand.isImm() && "Unexpected memory operator type");
377 LPAC::AluCode AluOpcode = static_cast<LPAC::AluCode>(AluOperand.getImm());
379 // Skip memory operations that already modify the base register or if
380 // the destination and base register are the same
381 if (!LPAC::modifiesOp(AluOpcode) && DestReg != BaseReg) {
382 for (int Inc = 0; Inc <= 1; ++Inc) {
383 MbbIterator AluIter =
384 findClosestSuitableAluInstr(BB, MBBIter, Inc == 0);
385 if (AluIter != MBBIter) {
386 insertMergedInstruction(BB, MBBIter, AluIter, Inc == 0);
388 ++NumLdStAluCombined;
391 // Erase the matching ALU instruction
393 // Erase old load/store instruction
394 BB->erase(MBBIter++);
408 // Driver function that iterates over the machine basic building blocks of a
410 bool LanaiMemAluCombiner::runOnMachineFunction(MachineFunction &MF) {
411 if (DisableMemAluCombiner)
414 TII = MF.getSubtarget<LanaiSubtarget>().getInstrInfo();
415 bool Modified = false;
416 for (MfIterator MFI = MF.begin(); MFI != MF.end(); ++MFI) {
417 Modified |= combineMemAluInBasicBlock(&*MFI);
423 FunctionPass *llvm::createLanaiMemAluCombinerPass() {
424 return new LanaiMemAluCombiner();