1 //===------------- PPCExpandISEL.cpp - Expand ISEL instruction ------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // A pass that expands the ISEL instruction into an if-then-else sequence.
10 // This pass must be run post-RA since all operands must be physical registers.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "PPC.h"
15 #include "PPCInstrInfo.h"
16 #include "PPCSubtarget.h"
17 #include "llvm/ADT/DenseMap.h"
18 #include "llvm/ADT/Statistic.h"
19 #include "llvm/CodeGen/LivePhysRegs.h"
20 #include "llvm/CodeGen/MachineFunctionPass.h"
21 #include "llvm/CodeGen/MachineInstrBuilder.h"
22 #include "llvm/CodeGen/MachineRegisterInfo.h"
23 #include "llvm/Support/CommandLine.h"
24 #include "llvm/Support/Debug.h"
25 #include "llvm/Support/raw_ostream.h"
26 
27 using namespace llvm;
28 
29 #define DEBUG_TYPE "ppc-expand-isel"
30 
31 STATISTIC(NumExpanded, "Number of ISEL instructions expanded");
32 STATISTIC(NumRemoved, "Number of ISEL instructions removed");
33 STATISTIC(NumFolded, "Number of ISEL instructions folded");
34 
35 // If -ppc-gen-isel=false is set, we will disable generating the ISEL
36 // instruction on all PPC targets. Otherwise, if the user set option
37 // -misel or the platform supports ISEL by default, still generate the
38 // ISEL instruction, else expand it.
39 static cl::opt<bool>
40     GenerateISEL("ppc-gen-isel",
41                  cl::desc("Enable generating the ISEL instruction."),
42                  cl::init(true), cl::Hidden);
43 
44 namespace {
45 class PPCExpandISEL : public MachineFunctionPass {
46   DebugLoc dl;
47   MachineFunction *MF;
48   const TargetInstrInfo *TII;
49   bool IsTrueBlockRequired;
50   bool IsFalseBlockRequired;
51   MachineBasicBlock *TrueBlock;
52   MachineBasicBlock *FalseBlock;
53   MachineBasicBlock *NewSuccessor;
54   MachineBasicBlock::iterator TrueBlockI;
55   MachineBasicBlock::iterator FalseBlockI;
56 
57   typedef SmallVector<MachineInstr *, 4> BlockISELList;
58   typedef SmallDenseMap<int, BlockISELList> ISELInstructionList;
59 
60   // A map of MBB numbers to their lists of contained ISEL instructions.
61   // Please note when we traverse this list and expand ISEL, we only remove
62   // the ISEL from the MBB not from this list.
63   ISELInstructionList ISELInstructions;
64 
65   /// Initialize the object.
66   void initialize(MachineFunction &MFParam);
67 
68   void handleSpecialCases(BlockISELList &BIL, MachineBasicBlock *MBB);
69   void reorganizeBlockLayout(BlockISELList &BIL, MachineBasicBlock *MBB);
70   void populateBlocks(BlockISELList &BIL);
71   void expandMergeableISELs(BlockISELList &BIL);
72   void expandAndMergeISELs();
73 
74   bool canMerge(MachineInstr *PrevPushedMI, MachineInstr *MI);
75 
76   ///  Is this instruction an ISEL or ISEL8?
77   static bool isISEL(const MachineInstr &MI) {
78     return (MI.getOpcode() == PPC::ISEL || MI.getOpcode() == PPC::ISEL8);
79   }
80 
81   ///  Is this instruction an ISEL8?
82   static bool isISEL8(const MachineInstr &MI) {
83     return (MI.getOpcode() == PPC::ISEL8);
84   }
85 
86   /// Are the two operands using the same register?
87   bool useSameRegister(const MachineOperand &Op1, const MachineOperand &Op2) {
88     return (Op1.getReg() == Op2.getReg());
89   }
90 
91   ///
92   ///  Collect all ISEL instructions from the current function.
93   ///
94   /// Walk the current function and collect all the ISEL instructions that are
95   /// found. The instructions are placed in the ISELInstructions vector.
96   ///
97   /// \return true if any ISEL instructions were found, false otherwise
98   ///
99   bool collectISELInstructions();
100 
101 public:
102   static char ID;
103   PPCExpandISEL() : MachineFunctionPass(ID) {
104     initializePPCExpandISELPass(*PassRegistry::getPassRegistry());
105   }
106 
107   ///
108   ///  Determine whether to generate the ISEL instruction or expand it.
109   ///
110   /// Expand ISEL instruction into if-then-else sequence when one of
111   /// the following two conditions hold:
112   /// (1) -ppc-gen-isel=false
113   /// (2) hasISEL() return false
114   /// Otherwise, still generate ISEL instruction.
115   /// The -ppc-gen-isel option is set to true by default. Which means the ISEL
116   /// instruction is still generated by default on targets that support them.
117   ///
118   /// \return true if ISEL should be expanded into if-then-else code sequence;
119   ///         false if ISEL instruction should be generated, i.e. not expanded.
120   ///
121   static bool isExpandISELEnabled(const MachineFunction &MF);
122 
123 #ifndef NDEBUG
124   void DumpISELInstructions() const;
125 #endif
126 
127   bool runOnMachineFunction(MachineFunction &MF) override {
128     LLVM_DEBUG(dbgs() << "Function: "; MF.dump(); dbgs() << "\n");
129     initialize(MF);
130 
131     if (!collectISELInstructions()) {
132       LLVM_DEBUG(dbgs() << "No ISEL instructions in this function\n");
133       return false;
134     }
135 
136 #ifndef NDEBUG
137     DumpISELInstructions();
138 #endif
139 
140     expandAndMergeISELs();
141 
142     return true;
143   }
144 };
145 } // end anonymous namespace
146 
147 void PPCExpandISEL::initialize(MachineFunction &MFParam) {
148   MF = &MFParam;
149   TII = MF->getSubtarget().getInstrInfo();
150   ISELInstructions.clear();
151 }
152 
153 bool PPCExpandISEL::isExpandISELEnabled(const MachineFunction &MF) {
154   return !GenerateISEL || !MF.getSubtarget<PPCSubtarget>().hasISEL();
155 }
156 
157 bool PPCExpandISEL::collectISELInstructions() {
158   for (MachineBasicBlock &MBB : *MF) {
159     BlockISELList thisBlockISELs;
160     for (MachineInstr &MI : MBB)
161       if (isISEL(MI))
162         thisBlockISELs.push_back(&MI);
163     if (!thisBlockISELs.empty())
164       ISELInstructions.insert(std::make_pair(MBB.getNumber(), thisBlockISELs));
165   }
166   return !ISELInstructions.empty();
167 }
168 
169 #ifndef NDEBUG
170 void PPCExpandISEL::DumpISELInstructions() const {
171   for (const auto &I : ISELInstructions) {
172     LLVM_DEBUG(dbgs() << printMBBReference(*MF->getBlockNumbered(I.first))
173                       << ":\n");
174     for (const auto &VI : I.second)
175       LLVM_DEBUG(dbgs() << "    "; VI->print(dbgs()));
176   }
177 }
178 #endif
179 
180 /// Contiguous ISELs that have the same condition can be merged.
181 bool PPCExpandISEL::canMerge(MachineInstr *PrevPushedMI, MachineInstr *MI) {
182   // Same Condition Register?
183   if (!useSameRegister(PrevPushedMI->getOperand(3), MI->getOperand(3)))
184     return false;
185 
186   MachineBasicBlock::iterator PrevPushedMBBI = *PrevPushedMI;
187   MachineBasicBlock::iterator MBBI = *MI;
188   return (std::prev(MBBI) == PrevPushedMBBI); // Contiguous ISELs?
189 }
190 
191 void PPCExpandISEL::expandAndMergeISELs() {
192   bool ExpandISELEnabled = isExpandISELEnabled(*MF);
193 
194   for (auto &BlockList : ISELInstructions) {
195     LLVM_DEBUG(
196         dbgs() << "Expanding ISEL instructions in "
197                << printMBBReference(*MF->getBlockNumbered(BlockList.first))
198                << "\n");
199     BlockISELList &CurrentISELList = BlockList.second;
200     auto I = CurrentISELList.begin();
201     auto E = CurrentISELList.end();
202 
203     while (I != E) {
204       assert(isISEL(**I) && "Expecting an ISEL instruction");
205       MachineOperand &Dest = (*I)->getOperand(0);
206       MachineOperand &TrueValue = (*I)->getOperand(1);
207       MachineOperand &FalseValue = (*I)->getOperand(2);
208 
209       // Special case 1, all registers used by ISEL are the same one.
210       // The non-redundant isel 0, 0, 0, N would not satisfy these conditions
211       // as it would be ISEL %R0, %ZERO, %R0, %CRN.
212       if (useSameRegister(Dest, TrueValue) &&
213           useSameRegister(Dest, FalseValue)) {
214         LLVM_DEBUG(dbgs() << "Remove redundant ISEL instruction: " << **I
215                           << "\n");
216         // FIXME: if the CR field used has no other uses, we could eliminate the
217         // instruction that defines it. This would have to be done manually
218         // since this pass runs too late to run DCE after it.
219         NumRemoved++;
220         (*I)->eraseFromParent();
221         I++;
222       } else if (useSameRegister(TrueValue, FalseValue)) {
223         // Special case 2, the two input registers used by ISEL are the same.
224         // Note: the non-foldable isel RX, 0, 0, N would not satisfy this
225         // condition as it would be ISEL %RX, %ZERO, %R0, %CRN, which makes it
226         // safe to fold ISEL to MR(OR) instead of ADDI.
227         MachineBasicBlock *MBB = (*I)->getParent();
228         LLVM_DEBUG(
229             dbgs() << "Fold the ISEL instruction to an unconditional copy:\n");
230         LLVM_DEBUG(dbgs() << "ISEL: " << **I << "\n");
231         NumFolded++;
232         // Note: we're using both the TrueValue and FalseValue operands so as
233         // not to lose the kill flag if it is set on either of them.
234         BuildMI(*MBB, (*I), dl, TII->get(isISEL8(**I) ? PPC::OR8 : PPC::OR))
235             .add(Dest)
236             .add(TrueValue)
237             .add(FalseValue);
238         (*I)->eraseFromParent();
239         I++;
240       } else if (ExpandISELEnabled) { // Normal cases expansion enabled
241         LLVM_DEBUG(dbgs() << "Expand ISEL instructions:\n");
242         LLVM_DEBUG(dbgs() << "ISEL: " << **I << "\n");
243         BlockISELList SubISELList;
244         SubISELList.push_back(*I++);
245         // Collect the ISELs that can be merged together.
246         // This will eat up ISEL instructions without considering whether they
247         // may be redundant or foldable to a register copy. So we still keep
248         // the handleSpecialCases() downstream to handle them.
249         while (I != E && canMerge(SubISELList.back(), *I)) {
250           LLVM_DEBUG(dbgs() << "ISEL: " << **I << "\n");
251           SubISELList.push_back(*I++);
252         }
253 
254         expandMergeableISELs(SubISELList);
255       } else { // Normal cases expansion disabled
256         I++; // leave the ISEL as it is
257       }
258     } // end while
259   } // end for
260 }
261 
262 void PPCExpandISEL::handleSpecialCases(BlockISELList &BIL,
263                                        MachineBasicBlock *MBB) {
264   IsTrueBlockRequired = false;
265   IsFalseBlockRequired = false;
266 
267   auto MI = BIL.begin();
268   while (MI != BIL.end()) {
269     assert(isISEL(**MI) && "Expecting an ISEL instruction");
270     LLVM_DEBUG(dbgs() << "ISEL: " << **MI << "\n");
271 
272     MachineOperand &Dest = (*MI)->getOperand(0);
273     MachineOperand &TrueValue = (*MI)->getOperand(1);
274     MachineOperand &FalseValue = (*MI)->getOperand(2);
275 
276     // If at least one of the ISEL instructions satisfy the following
277     // condition, we need the True Block:
278     // The Dest Register and True Value Register are not the same
279     // Similarly, if at least one of the ISEL instructions satisfy the
280     // following condition, we need the False Block:
281     // The Dest Register and False Value Register are not the same.
282     bool IsADDIInstRequired = !useSameRegister(Dest, TrueValue);
283     bool IsORIInstRequired = !useSameRegister(Dest, FalseValue);
284 
285     // Special case 1, all registers used by ISEL are the same one.
286     if (!IsADDIInstRequired && !IsORIInstRequired) {
287       LLVM_DEBUG(dbgs() << "Remove redundant ISEL instruction.");
288       // FIXME: if the CR field used has no other uses, we could eliminate the
289       // instruction that defines it. This would have to be done manually
290       // since this pass runs too late to run DCE after it.
291       NumRemoved++;
292       (*MI)->eraseFromParent();
293       // Setting MI to the erase result keeps the iterator valid and increased.
294       MI = BIL.erase(MI);
295       continue;
296     }
297 
298     // Special case 2, the two input registers used by ISEL are the same.
299     // Note 1: We favor merging ISEL expansions over folding a single one. If
300     // the passed list has multiple merge-able ISEL's, we won't fold any.
301     // Note 2: There is no need to test for PPC::R0/PPC::X0 because PPC::ZERO/
302     // PPC::ZERO8 will be used for the first operand if the value is meant to
303     // be zero. In this case, the useSameRegister method will return false,
304     // thereby preventing this ISEL from being folded.
305     if (useSameRegister(TrueValue, FalseValue) && (BIL.size() == 1)) {
306       LLVM_DEBUG(
307           dbgs() << "Fold the ISEL instruction to an unconditional copy.");
308       NumFolded++;
309       // Note: we're using both the TrueValue and FalseValue operands so as
310       // not to lose the kill flag if it is set on either of them.
311       BuildMI(*MBB, (*MI), dl, TII->get(isISEL8(**MI) ? PPC::OR8 : PPC::OR))
312           .add(Dest)
313           .add(TrueValue)
314           .add(FalseValue);
315       (*MI)->eraseFromParent();
316       // Setting MI to the erase result keeps the iterator valid and increased.
317       MI = BIL.erase(MI);
318       continue;
319     }
320 
321     IsTrueBlockRequired |= IsADDIInstRequired;
322     IsFalseBlockRequired |= IsORIInstRequired;
323     MI++;
324   }
325 }
326 
327 void PPCExpandISEL::reorganizeBlockLayout(BlockISELList &BIL,
328                                           MachineBasicBlock *MBB) {
329   if (BIL.empty())
330     return;
331 
332   assert((IsTrueBlockRequired || IsFalseBlockRequired) &&
333          "Should have been handled by special cases earlier!");
334 
335   MachineBasicBlock *Successor = nullptr;
336   const BasicBlock *LLVM_BB = MBB->getBasicBlock();
337   MachineBasicBlock::iterator MBBI = (*BIL.back());
338   NewSuccessor = (MBBI != MBB->getLastNonDebugInstr() || !MBB->canFallThrough())
339                      // Another BB is needed to move the instructions that
340                      // follow this ISEL.  If the ISEL is the last instruction
341                      // in a block that can't fall through, we also need a block
342                      // to branch to.
343                      ? MF->CreateMachineBasicBlock(LLVM_BB)
344                      : nullptr;
345 
346   MachineFunction::iterator It = MBB->getIterator();
347   ++It; // Point to the successor block of MBB.
348 
349   // If NewSuccessor is NULL then the last ISEL in this group is the last
350   // non-debug instruction in this block. Find the fall-through successor
351   // of this block to use when updating the CFG below.
352   if (!NewSuccessor) {
353     for (auto &Succ : MBB->successors()) {
354       if (MBB->isLayoutSuccessor(Succ)) {
355         Successor = Succ;
356         break;
357       }
358     }
359   } else
360     Successor = NewSuccessor;
361 
362   // The FalseBlock and TrueBlock are inserted after the MBB block but before
363   // its successor.
364   // Note this need to be done *after* the above setting the Successor code.
365   if (IsFalseBlockRequired) {
366     FalseBlock = MF->CreateMachineBasicBlock(LLVM_BB);
367     MF->insert(It, FalseBlock);
368   }
369 
370   if (IsTrueBlockRequired) {
371     TrueBlock = MF->CreateMachineBasicBlock(LLVM_BB);
372     MF->insert(It, TrueBlock);
373   }
374 
375   if (NewSuccessor) {
376     MF->insert(It, NewSuccessor);
377 
378     // Transfer the rest of this block into the new successor block.
379     NewSuccessor->splice(NewSuccessor->end(), MBB,
380                          std::next(MachineBasicBlock::iterator(BIL.back())),
381                          MBB->end());
382     NewSuccessor->transferSuccessorsAndUpdatePHIs(MBB);
383 
384     // Copy the original liveIns of MBB to NewSuccessor.
385     for (auto &LI : MBB->liveins())
386       NewSuccessor->addLiveIn(LI);
387 
388     // After splitting the NewSuccessor block, Regs defined but not killed
389     // in MBB should be treated as liveins of NewSuccessor.
390     // Note: Cannot use stepBackward instead since we are using the Reg
391     // liveness state at the end of MBB (liveOut of MBB) as the liveIn for
392     // NewSuccessor. Otherwise, will cause cyclic dependence.
393     LivePhysRegs LPR(*MF->getSubtarget<PPCSubtarget>().getRegisterInfo());
394     SmallVector<std::pair<MCPhysReg, const MachineOperand *>, 2> Clobbers;
395     for (MachineInstr &MI : *MBB)
396       LPR.stepForward(MI, Clobbers);
397     for (auto &LI : LPR)
398       NewSuccessor->addLiveIn(LI);
399   } else {
400     // Remove successor from MBB.
401     MBB->removeSuccessor(Successor);
402   }
403 
404   // Note that this needs to be done *after* transfering the successors from MBB
405   // to the NewSuccessor block, otherwise these blocks will also be transferred
406   // as successors!
407   MBB->addSuccessor(IsTrueBlockRequired ? TrueBlock : Successor);
408   MBB->addSuccessor(IsFalseBlockRequired ? FalseBlock : Successor);
409 
410   if (IsTrueBlockRequired) {
411     TrueBlockI = TrueBlock->begin();
412     TrueBlock->addSuccessor(Successor);
413   }
414 
415   if (IsFalseBlockRequired) {
416     FalseBlockI = FalseBlock->begin();
417     FalseBlock->addSuccessor(Successor);
418   }
419 
420   // Conditional branch to the TrueBlock or Successor
421   BuildMI(*MBB, BIL.back(), dl, TII->get(PPC::BC))
422       .add(BIL.back()->getOperand(3))
423       .addMBB(IsTrueBlockRequired ? TrueBlock : Successor);
424 
425   // Jump over the true block to the new successor if the condition is false.
426   BuildMI(*(IsFalseBlockRequired ? FalseBlock : MBB),
427           (IsFalseBlockRequired ? FalseBlockI : BIL.back()), dl,
428           TII->get(PPC::B))
429       .addMBB(Successor);
430 
431   if (IsFalseBlockRequired)
432     FalseBlockI = FalseBlock->begin(); // get the position of PPC::B
433 }
434 
435 void PPCExpandISEL::populateBlocks(BlockISELList &BIL) {
436   for (auto &MI : BIL) {
437     assert(isISEL(*MI) && "Expecting an ISEL instruction");
438 
439     MachineOperand &Dest = MI->getOperand(0);       // location to store to
440     MachineOperand &TrueValue = MI->getOperand(1);  // Value to store if
441                                                        // condition is true
442     MachineOperand &FalseValue = MI->getOperand(2); // Value to store if
443                                                        // condition is false
444     MachineOperand &ConditionRegister = MI->getOperand(3); // Condition
445 
446     LLVM_DEBUG(dbgs() << "Dest: " << Dest << "\n");
447     LLVM_DEBUG(dbgs() << "TrueValue: " << TrueValue << "\n");
448     LLVM_DEBUG(dbgs() << "FalseValue: " << FalseValue << "\n");
449     LLVM_DEBUG(dbgs() << "ConditionRegister: " << ConditionRegister << "\n");
450 
451     // If the Dest Register and True Value Register are not the same one, we
452     // need the True Block.
453     bool IsADDIInstRequired = !useSameRegister(Dest, TrueValue);
454     bool IsORIInstRequired = !useSameRegister(Dest, FalseValue);
455 
456     if (IsADDIInstRequired) {
457       // Copy the result into the destination if the condition is true.
458       BuildMI(*TrueBlock, TrueBlockI, dl,
459               TII->get(isISEL8(*MI) ? PPC::ADDI8 : PPC::ADDI))
460           .add(Dest)
461           .add(TrueValue)
462           .add(MachineOperand::CreateImm(0));
463 
464       // Add the LiveIn registers required by true block.
465       TrueBlock->addLiveIn(TrueValue.getReg());
466     }
467 
468     if (IsORIInstRequired) {
469       // Add the LiveIn registers required by false block.
470       FalseBlock->addLiveIn(FalseValue.getReg());
471     }
472 
473     if (NewSuccessor) {
474       // Add the LiveIn registers required by NewSuccessor block.
475       NewSuccessor->addLiveIn(Dest.getReg());
476       NewSuccessor->addLiveIn(TrueValue.getReg());
477       NewSuccessor->addLiveIn(FalseValue.getReg());
478       NewSuccessor->addLiveIn(ConditionRegister.getReg());
479     }
480 
481     // Copy the value into the destination if the condition is false.
482     if (IsORIInstRequired)
483       BuildMI(*FalseBlock, FalseBlockI, dl,
484               TII->get(isISEL8(*MI) ? PPC::ORI8 : PPC::ORI))
485           .add(Dest)
486           .add(FalseValue)
487           .add(MachineOperand::CreateImm(0));
488 
489     MI->eraseFromParent(); // Remove the ISEL instruction.
490 
491     NumExpanded++;
492   }
493 }
494 
495 void PPCExpandISEL::expandMergeableISELs(BlockISELList &BIL) {
496   // At this stage all the ISELs of BIL are in the same MBB.
497   MachineBasicBlock *MBB = BIL.back()->getParent();
498 
499   handleSpecialCases(BIL, MBB);
500   reorganizeBlockLayout(BIL, MBB);
501   populateBlocks(BIL);
502 }
503 
504 INITIALIZE_PASS(PPCExpandISEL, DEBUG_TYPE, "PowerPC Expand ISEL Generation",
505                 false, false)
506 char PPCExpandISEL::ID = 0;
507 
508 FunctionPass *llvm::createPPCExpandISELPass() { return new PPCExpandISEL(); }
509