1 //===------------- PPCExpandISEL.cpp - Expand ISEL instruction ------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // A pass that expands the ISEL instruction into an if-then-else sequence.
11 // This pass must be run post-RA since all operands must be physical registers.
12 //
13 //===----------------------------------------------------------------------===//
14
15 #include "PPC.h"
16 #include "PPCInstrInfo.h"
17 #include "PPCSubtarget.h"
18 #include "llvm/ADT/DenseMap.h"
19 #include "llvm/ADT/Statistic.h"
20 #include "llvm/CodeGen/LivePhysRegs.h"
21 #include "llvm/CodeGen/MachineFunctionPass.h"
22 #include "llvm/CodeGen/MachineInstrBuilder.h"
23 #include "llvm/CodeGen/MachineRegisterInfo.h"
24 #include "llvm/Support/CommandLine.h"
25 #include "llvm/Support/Debug.h"
26 #include "llvm/Support/raw_ostream.h"
27
28 using namespace llvm;
29
30 #define DEBUG_TYPE "ppc-expand-isel"
31
32 STATISTIC(NumExpanded, "Number of ISEL instructions expanded");
33 STATISTIC(NumRemoved, "Number of ISEL instructions removed");
34 STATISTIC(NumFolded, "Number of ISEL instructions folded");
35
36 // If -ppc-gen-isel=false is set, we will disable generating the ISEL
37 // instruction on all PPC targets. Otherwise, if the user set option
38 // -misel or the platform supports ISEL by default, still generate the
39 // ISEL instruction, else expand it.
40 static cl::opt<bool>
41 GenerateISEL("ppc-gen-isel",
42 cl::desc("Enable generating the ISEL instruction."),
43 cl::init(true), cl::Hidden);
44
45 namespace {
46 class PPCExpandISEL : public MachineFunctionPass {
47 DebugLoc dl;
48 MachineFunction *MF;
49 const TargetInstrInfo *TII;
50 bool IsTrueBlockRequired;
51 bool IsFalseBlockRequired;
52 MachineBasicBlock *TrueBlock;
53 MachineBasicBlock *FalseBlock;
54 MachineBasicBlock *NewSuccessor;
55 MachineBasicBlock::iterator TrueBlockI;
56 MachineBasicBlock::iterator FalseBlockI;
57
58 typedef SmallVector<MachineInstr *, 4> BlockISELList;
59 typedef SmallDenseMap<int, BlockISELList> ISELInstructionList;
60
61 // A map of MBB numbers to their lists of contained ISEL instructions.
62 // Please note when we traverse this list and expand ISEL, we only remove
63 // the ISEL from the MBB not from this list.
64 ISELInstructionList ISELInstructions;
65
66 /// Initialize the object.
67 void initialize(MachineFunction &MFParam);
68
69 void handleSpecialCases(BlockISELList &BIL, MachineBasicBlock *MBB);
70 void reorganizeBlockLayout(BlockISELList &BIL, MachineBasicBlock *MBB);
71 void populateBlocks(BlockISELList &BIL);
72 void expandMergeableISELs(BlockISELList &BIL);
73 void expandAndMergeISELs();
74
75 bool canMerge(MachineInstr *PrevPushedMI, MachineInstr *MI);
76
77 /// Is this instruction an ISEL or ISEL8?
isISEL(const MachineInstr & MI)78 static bool isISEL(const MachineInstr &MI) {
79 return (MI.getOpcode() == PPC::ISEL || MI.getOpcode() == PPC::ISEL8);
80 }
81
82 /// Is this instruction an ISEL8?
isISEL8(const MachineInstr & MI)83 static bool isISEL8(const MachineInstr &MI) {
84 return (MI.getOpcode() == PPC::ISEL8);
85 }
86
87 /// Are the two operands using the same register?
useSameRegister(const MachineOperand & Op1,const MachineOperand & Op2)88 bool useSameRegister(const MachineOperand &Op1, const MachineOperand &Op2) {
89 return (Op1.getReg() == Op2.getReg());
90 }
91
92 ///
93 /// Collect all ISEL instructions from the current function.
94 ///
95 /// Walk the current function and collect all the ISEL instructions that are
96 /// found. The instructions are placed in the ISELInstructions vector.
97 ///
98 /// \return true if any ISEL instructions were found, false otherwise
99 ///
100 bool collectISELInstructions();
101
102 public:
103 static char ID;
PPCExpandISEL()104 PPCExpandISEL() : MachineFunctionPass(ID) {
105 initializePPCExpandISELPass(*PassRegistry::getPassRegistry());
106 }
107
108 ///
109 /// Determine whether to generate the ISEL instruction or expand it.
110 ///
111 /// Expand ISEL instruction into if-then-else sequence when one of
112 /// the following two conditions hold:
113 /// (1) -ppc-gen-isel=false
114 /// (2) hasISEL() return false
115 /// Otherwise, still generate ISEL instruction.
116 /// The -ppc-gen-isel option is set to true by default. Which means the ISEL
117 /// instruction is still generated by default on targets that support them.
118 ///
119 /// \return true if ISEL should be expanded into if-then-else code sequence;
120 /// false if ISEL instruction should be generated, i.e. not expanded.
121 ///
122 static bool isExpandISELEnabled(const MachineFunction &MF);
123
124 #ifndef NDEBUG
125 void DumpISELInstructions() const;
126 #endif
127
runOnMachineFunction(MachineFunction & MF)128 bool runOnMachineFunction(MachineFunction &MF) override {
129 LLVM_DEBUG(dbgs() << "Function: "; MF.dump(); dbgs() << "\n");
130 initialize(MF);
131
132 if (!collectISELInstructions()) {
133 LLVM_DEBUG(dbgs() << "No ISEL instructions in this function\n");
134 return false;
135 }
136
137 #ifndef NDEBUG
138 DumpISELInstructions();
139 #endif
140
141 expandAndMergeISELs();
142
143 return true;
144 }
145 };
146 } // end anonymous namespace
147
initialize(MachineFunction & MFParam)148 void PPCExpandISEL::initialize(MachineFunction &MFParam) {
149 MF = &MFParam;
150 TII = MF->getSubtarget().getInstrInfo();
151 ISELInstructions.clear();
152 }
153
isExpandISELEnabled(const MachineFunction & MF)154 bool PPCExpandISEL::isExpandISELEnabled(const MachineFunction &MF) {
155 return !GenerateISEL || !MF.getSubtarget<PPCSubtarget>().hasISEL();
156 }
157
collectISELInstructions()158 bool PPCExpandISEL::collectISELInstructions() {
159 for (MachineBasicBlock &MBB : *MF) {
160 BlockISELList thisBlockISELs;
161 for (MachineInstr &MI : MBB)
162 if (isISEL(MI))
163 thisBlockISELs.push_back(&MI);
164 if (!thisBlockISELs.empty())
165 ISELInstructions.insert(std::make_pair(MBB.getNumber(), thisBlockISELs));
166 }
167 return !ISELInstructions.empty();
168 }
169
170 #ifndef NDEBUG
DumpISELInstructions() const171 void PPCExpandISEL::DumpISELInstructions() const {
172 for (const auto &I : ISELInstructions) {
173 LLVM_DEBUG(dbgs() << printMBBReference(*MF->getBlockNumbered(I.first))
174 << ":\n");
175 for (const auto &VI : I.second)
176 LLVM_DEBUG(dbgs() << " "; VI->print(dbgs()));
177 }
178 }
179 #endif
180
181 /// Contiguous ISELs that have the same condition can be merged.
canMerge(MachineInstr * PrevPushedMI,MachineInstr * MI)182 bool PPCExpandISEL::canMerge(MachineInstr *PrevPushedMI, MachineInstr *MI) {
183 // Same Condition Register?
184 if (!useSameRegister(PrevPushedMI->getOperand(3), MI->getOperand(3)))
185 return false;
186
187 MachineBasicBlock::iterator PrevPushedMBBI = *PrevPushedMI;
188 MachineBasicBlock::iterator MBBI = *MI;
189 return (std::prev(MBBI) == PrevPushedMBBI); // Contiguous ISELs?
190 }
191
expandAndMergeISELs()192 void PPCExpandISEL::expandAndMergeISELs() {
193 bool ExpandISELEnabled = isExpandISELEnabled(*MF);
194
195 for (auto &BlockList : ISELInstructions) {
196 LLVM_DEBUG(
197 dbgs() << "Expanding ISEL instructions in "
198 << printMBBReference(*MF->getBlockNumbered(BlockList.first))
199 << "\n");
200 BlockISELList &CurrentISELList = BlockList.second;
201 auto I = CurrentISELList.begin();
202 auto E = CurrentISELList.end();
203
204 while (I != E) {
205 assert(isISEL(**I) && "Expecting an ISEL instruction");
206 MachineOperand &Dest = (*I)->getOperand(0);
207 MachineOperand &TrueValue = (*I)->getOperand(1);
208 MachineOperand &FalseValue = (*I)->getOperand(2);
209
210 // Special case 1, all registers used by ISEL are the same one.
211 // The non-redundant isel 0, 0, 0, N would not satisfy these conditions
212 // as it would be ISEL %R0, %ZERO, %R0, %CRN.
213 if (useSameRegister(Dest, TrueValue) &&
214 useSameRegister(Dest, FalseValue)) {
215 LLVM_DEBUG(dbgs() << "Remove redundant ISEL instruction: " << **I
216 << "\n");
217 // FIXME: if the CR field used has no other uses, we could eliminate the
218 // instruction that defines it. This would have to be done manually
219 // since this pass runs too late to run DCE after it.
220 NumRemoved++;
221 (*I)->eraseFromParent();
222 I++;
223 } else if (useSameRegister(TrueValue, FalseValue)) {
224 // Special case 2, the two input registers used by ISEL are the same.
225 // Note: the non-foldable isel RX, 0, 0, N would not satisfy this
226 // condition as it would be ISEL %RX, %ZERO, %R0, %CRN, which makes it
227 // safe to fold ISEL to MR(OR) instead of ADDI.
228 MachineBasicBlock *MBB = (*I)->getParent();
229 LLVM_DEBUG(
230 dbgs() << "Fold the ISEL instruction to an unconditional copy:\n");
231 LLVM_DEBUG(dbgs() << "ISEL: " << **I << "\n");
232 NumFolded++;
233 // Note: we're using both the TrueValue and FalseValue operands so as
234 // not to lose the kill flag if it is set on either of them.
235 BuildMI(*MBB, (*I), dl, TII->get(isISEL8(**I) ? PPC::OR8 : PPC::OR))
236 .add(Dest)
237 .add(TrueValue)
238 .add(FalseValue);
239 (*I)->eraseFromParent();
240 I++;
241 } else if (ExpandISELEnabled) { // Normal cases expansion enabled
242 LLVM_DEBUG(dbgs() << "Expand ISEL instructions:\n");
243 LLVM_DEBUG(dbgs() << "ISEL: " << **I << "\n");
244 BlockISELList SubISELList;
245 SubISELList.push_back(*I++);
246 // Collect the ISELs that can be merged together.
247 // This will eat up ISEL instructions without considering whether they
248 // may be redundant or foldable to a register copy. So we still keep
249 // the handleSpecialCases() downstream to handle them.
250 while (I != E && canMerge(SubISELList.back(), *I)) {
251 LLVM_DEBUG(dbgs() << "ISEL: " << **I << "\n");
252 SubISELList.push_back(*I++);
253 }
254
255 expandMergeableISELs(SubISELList);
256 } else { // Normal cases expansion disabled
257 I++; // leave the ISEL as it is
258 }
259 } // end while
260 } // end for
261 }
262
handleSpecialCases(BlockISELList & BIL,MachineBasicBlock * MBB)263 void PPCExpandISEL::handleSpecialCases(BlockISELList &BIL,
264 MachineBasicBlock *MBB) {
265 IsTrueBlockRequired = false;
266 IsFalseBlockRequired = false;
267
268 auto MI = BIL.begin();
269 while (MI != BIL.end()) {
270 assert(isISEL(**MI) && "Expecting an ISEL instruction");
271 LLVM_DEBUG(dbgs() << "ISEL: " << **MI << "\n");
272
273 MachineOperand &Dest = (*MI)->getOperand(0);
274 MachineOperand &TrueValue = (*MI)->getOperand(1);
275 MachineOperand &FalseValue = (*MI)->getOperand(2);
276
277 // If at least one of the ISEL instructions satisfy the following
278 // condition, we need the True Block:
279 // The Dest Register and True Value Register are not the same
280 // Similarly, if at least one of the ISEL instructions satisfy the
281 // following condition, we need the False Block:
282 // The Dest Register and False Value Register are not the same.
283 bool IsADDIInstRequired = !useSameRegister(Dest, TrueValue);
284 bool IsORIInstRequired = !useSameRegister(Dest, FalseValue);
285
286 // Special case 1, all registers used by ISEL are the same one.
287 if (!IsADDIInstRequired && !IsORIInstRequired) {
288 LLVM_DEBUG(dbgs() << "Remove redundant ISEL instruction.");
289 // FIXME: if the CR field used has no other uses, we could eliminate the
290 // instruction that defines it. This would have to be done manually
291 // since this pass runs too late to run DCE after it.
292 NumRemoved++;
293 (*MI)->eraseFromParent();
294 // Setting MI to the erase result keeps the iterator valid and increased.
295 MI = BIL.erase(MI);
296 continue;
297 }
298
299 // Special case 2, the two input registers used by ISEL are the same.
300 // Note 1: We favor merging ISEL expansions over folding a single one. If
301 // the passed list has multiple merge-able ISEL's, we won't fold any.
302 // Note 2: There is no need to test for PPC::R0/PPC::X0 because PPC::ZERO/
303 // PPC::ZERO8 will be used for the first operand if the value is meant to
304 // be zero. In this case, the useSameRegister method will return false,
305 // thereby preventing this ISEL from being folded.
306 if (useSameRegister(TrueValue, FalseValue) && (BIL.size() == 1)) {
307 LLVM_DEBUG(
308 dbgs() << "Fold the ISEL instruction to an unconditional copy.");
309 NumFolded++;
310 // Note: we're using both the TrueValue and FalseValue operands so as
311 // not to lose the kill flag if it is set on either of them.
312 BuildMI(*MBB, (*MI), dl, TII->get(isISEL8(**MI) ? PPC::OR8 : PPC::OR))
313 .add(Dest)
314 .add(TrueValue)
315 .add(FalseValue);
316 (*MI)->eraseFromParent();
317 // Setting MI to the erase result keeps the iterator valid and increased.
318 MI = BIL.erase(MI);
319 continue;
320 }
321
322 IsTrueBlockRequired |= IsADDIInstRequired;
323 IsFalseBlockRequired |= IsORIInstRequired;
324 MI++;
325 }
326 }
327
reorganizeBlockLayout(BlockISELList & BIL,MachineBasicBlock * MBB)328 void PPCExpandISEL::reorganizeBlockLayout(BlockISELList &BIL,
329 MachineBasicBlock *MBB) {
330 if (BIL.empty())
331 return;
332
333 assert((IsTrueBlockRequired || IsFalseBlockRequired) &&
334 "Should have been handled by special cases earlier!");
335
336 MachineBasicBlock *Successor = nullptr;
337 const BasicBlock *LLVM_BB = MBB->getBasicBlock();
338 MachineBasicBlock::iterator MBBI = (*BIL.back());
339 NewSuccessor = (MBBI != MBB->getLastNonDebugInstr() || !MBB->canFallThrough())
340 // Another BB is needed to move the instructions that
341 // follow this ISEL. If the ISEL is the last instruction
342 // in a block that can't fall through, we also need a block
343 // to branch to.
344 ? MF->CreateMachineBasicBlock(LLVM_BB)
345 : nullptr;
346
347 MachineFunction::iterator It = MBB->getIterator();
348 ++It; // Point to the successor block of MBB.
349
350 // If NewSuccessor is NULL then the last ISEL in this group is the last
351 // non-debug instruction in this block. Find the fall-through successor
352 // of this block to use when updating the CFG below.
353 if (!NewSuccessor) {
354 for (auto &Succ : MBB->successors()) {
355 if (MBB->isLayoutSuccessor(Succ)) {
356 Successor = Succ;
357 break;
358 }
359 }
360 } else
361 Successor = NewSuccessor;
362
363 // The FalseBlock and TrueBlock are inserted after the MBB block but before
364 // its successor.
365 // Note this need to be done *after* the above setting the Successor code.
366 if (IsFalseBlockRequired) {
367 FalseBlock = MF->CreateMachineBasicBlock(LLVM_BB);
368 MF->insert(It, FalseBlock);
369 }
370
371 if (IsTrueBlockRequired) {
372 TrueBlock = MF->CreateMachineBasicBlock(LLVM_BB);
373 MF->insert(It, TrueBlock);
374 }
375
376 if (NewSuccessor) {
377 MF->insert(It, NewSuccessor);
378
379 // Transfer the rest of this block into the new successor block.
380 NewSuccessor->splice(NewSuccessor->end(), MBB,
381 std::next(MachineBasicBlock::iterator(BIL.back())),
382 MBB->end());
383 NewSuccessor->transferSuccessorsAndUpdatePHIs(MBB);
384
385 // Copy the original liveIns of MBB to NewSuccessor.
386 for (auto &LI : MBB->liveins())
387 NewSuccessor->addLiveIn(LI);
388
389 // After splitting the NewSuccessor block, Regs defined but not killed
390 // in MBB should be treated as liveins of NewSuccessor.
391 // Note: Cannot use stepBackward instead since we are using the Reg
392 // liveness state at the end of MBB (liveOut of MBB) as the liveIn for
393 // NewSuccessor. Otherwise, will cause cyclic dependence.
394 LivePhysRegs LPR(*MF->getSubtarget<PPCSubtarget>().getRegisterInfo());
395 SmallVector<std::pair<unsigned, const MachineOperand *>, 2> Clobbers;
396 for (MachineInstr &MI : *MBB)
397 LPR.stepForward(MI, Clobbers);
398 for (auto &LI : LPR)
399 NewSuccessor->addLiveIn(LI);
400 } else {
401 // Remove successor from MBB.
402 MBB->removeSuccessor(Successor);
403 }
404
405 // Note that this needs to be done *after* transfering the successors from MBB
406 // to the NewSuccessor block, otherwise these blocks will also be transferred
407 // as successors!
408 MBB->addSuccessor(IsTrueBlockRequired ? TrueBlock : Successor);
409 MBB->addSuccessor(IsFalseBlockRequired ? FalseBlock : Successor);
410
411 if (IsTrueBlockRequired) {
412 TrueBlockI = TrueBlock->begin();
413 TrueBlock->addSuccessor(Successor);
414 }
415
416 if (IsFalseBlockRequired) {
417 FalseBlockI = FalseBlock->begin();
418 FalseBlock->addSuccessor(Successor);
419 }
420
421 // Conditional branch to the TrueBlock or Successor
422 BuildMI(*MBB, BIL.back(), dl, TII->get(PPC::BC))
423 .add(BIL.back()->getOperand(3))
424 .addMBB(IsTrueBlockRequired ? TrueBlock : Successor);
425
426 // Jump over the true block to the new successor if the condition is false.
427 BuildMI(*(IsFalseBlockRequired ? FalseBlock : MBB),
428 (IsFalseBlockRequired ? FalseBlockI : BIL.back()), dl,
429 TII->get(PPC::B))
430 .addMBB(Successor);
431
432 if (IsFalseBlockRequired)
433 FalseBlockI = FalseBlock->begin(); // get the position of PPC::B
434 }
435
populateBlocks(BlockISELList & BIL)436 void PPCExpandISEL::populateBlocks(BlockISELList &BIL) {
437 for (auto &MI : BIL) {
438 assert(isISEL(*MI) && "Expecting an ISEL instruction");
439
440 MachineOperand &Dest = MI->getOperand(0); // location to store to
441 MachineOperand &TrueValue = MI->getOperand(1); // Value to store if
442 // condition is true
443 MachineOperand &FalseValue = MI->getOperand(2); // Value to store if
444 // condition is false
445 MachineOperand &ConditionRegister = MI->getOperand(3); // Condition
446
447 LLVM_DEBUG(dbgs() << "Dest: " << Dest << "\n");
448 LLVM_DEBUG(dbgs() << "TrueValue: " << TrueValue << "\n");
449 LLVM_DEBUG(dbgs() << "FalseValue: " << FalseValue << "\n");
450 LLVM_DEBUG(dbgs() << "ConditionRegister: " << ConditionRegister << "\n");
451
452 // If the Dest Register and True Value Register are not the same one, we
453 // need the True Block.
454 bool IsADDIInstRequired = !useSameRegister(Dest, TrueValue);
455 bool IsORIInstRequired = !useSameRegister(Dest, FalseValue);
456
457 if (IsADDIInstRequired) {
458 // Copy the result into the destination if the condition is true.
459 BuildMI(*TrueBlock, TrueBlockI, dl,
460 TII->get(isISEL8(*MI) ? PPC::ADDI8 : PPC::ADDI))
461 .add(Dest)
462 .add(TrueValue)
463 .add(MachineOperand::CreateImm(0));
464
465 // Add the LiveIn registers required by true block.
466 TrueBlock->addLiveIn(TrueValue.getReg());
467 }
468
469 if (IsORIInstRequired) {
470 // Add the LiveIn registers required by false block.
471 FalseBlock->addLiveIn(FalseValue.getReg());
472 }
473
474 if (NewSuccessor) {
475 // Add the LiveIn registers required by NewSuccessor block.
476 NewSuccessor->addLiveIn(Dest.getReg());
477 NewSuccessor->addLiveIn(TrueValue.getReg());
478 NewSuccessor->addLiveIn(FalseValue.getReg());
479 NewSuccessor->addLiveIn(ConditionRegister.getReg());
480 }
481
482 // Copy the value into the destination if the condition is false.
483 if (IsORIInstRequired)
484 BuildMI(*FalseBlock, FalseBlockI, dl,
485 TII->get(isISEL8(*MI) ? PPC::ORI8 : PPC::ORI))
486 .add(Dest)
487 .add(FalseValue)
488 .add(MachineOperand::CreateImm(0));
489
490 MI->eraseFromParent(); // Remove the ISEL instruction.
491
492 NumExpanded++;
493 }
494 }
495
expandMergeableISELs(BlockISELList & BIL)496 void PPCExpandISEL::expandMergeableISELs(BlockISELList &BIL) {
497 // At this stage all the ISELs of BIL are in the same MBB.
498 MachineBasicBlock *MBB = BIL.back()->getParent();
499
500 handleSpecialCases(BIL, MBB);
501 reorganizeBlockLayout(BIL, MBB);
502 populateBlocks(BIL);
503 }
504
505 INITIALIZE_PASS(PPCExpandISEL, DEBUG_TYPE, "PowerPC Expand ISEL Generation",
506 false, false)
507 char PPCExpandISEL::ID = 0;
508
createPPCExpandISELPass()509 FunctionPass *llvm::createPPCExpandISELPass() { return new PPCExpandISEL(); }
510