| //===-- CoalesceBranches.cpp - Coalesce blocks with the same condition ---===// | 
 | // | 
 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
 | // See https://llvm.org/LICENSE.txt for license information. | 
 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
 | // | 
 | //===----------------------------------------------------------------------===// | 
 | /// | 
 | /// \file | 
 | /// Coalesce basic blocks guarded by the same branch condition into a single | 
 | /// basic block. | 
 | /// | 
 | //===----------------------------------------------------------------------===// | 
 |  | 
 | #include "PPC.h" | 
 | #include "llvm/ADT/BitVector.h" | 
 | #include "llvm/ADT/Statistic.h" | 
 | #include "llvm/CodeGen/MachineDominators.h" | 
 | #include "llvm/CodeGen/MachineFunctionPass.h" | 
 | #include "llvm/CodeGen/MachinePostDominators.h" | 
 | #include "llvm/CodeGen/MachineRegisterInfo.h" | 
 | #include "llvm/CodeGen/Passes.h" | 
 | #include "llvm/CodeGen/TargetFrameLowering.h" | 
 | #include "llvm/CodeGen/TargetInstrInfo.h" | 
 | #include "llvm/CodeGen/TargetSubtargetInfo.h" | 
 | #include "llvm/Support/Debug.h" | 
 |  | 
 | using namespace llvm; | 
 |  | 
 | #define DEBUG_TYPE "ppc-branch-coalescing" | 
 |  | 
 | STATISTIC(NumBlocksCoalesced, "Number of blocks coalesced"); | 
 | STATISTIC(NumPHINotMoved, "Number of PHI Nodes that cannot be merged"); | 
 | STATISTIC(NumBlocksNotCoalesced, "Number of blocks not coalesced"); | 
 |  | 
 | //===----------------------------------------------------------------------===// | 
 | //                               PPCBranchCoalescing | 
 | //===----------------------------------------------------------------------===// | 
 | /// | 
 | /// Improve scheduling by coalescing branches that depend on the same condition. | 
 | /// This pass looks for blocks that are guarded by the same branch condition | 
 | /// and attempts to merge the blocks together. Such opportunities arise from | 
 | /// the expansion of select statements in the IR. | 
 | /// | 
 | /// This pass does not handle implicit operands on branch statements. In order | 
 | /// to run on targets that use implicit operands, changes need to be made in the | 
 | /// canCoalesceBranch and canMerge methods. | 
 | /// | 
 | /// Example: the following LLVM IR | 
 | /// | 
 | ///     %test = icmp eq i32 %x 0 | 
 | ///     %tmp1 = select i1 %test, double %a, double 2.000000e-03 | 
 | ///     %tmp2 = select i1 %test, double %b, double 5.000000e-03 | 
 | /// | 
 | /// expands to the following machine code: | 
 | /// | 
 | /// %bb.0: derived from LLVM BB %entry | 
 | ///    liveins: %f1 %f3 %x6 | 
 | ///        <SNIP1> | 
 | ///        %0 = COPY %f1; F8RC:%0 | 
 | ///        %5 = CMPLWI killed %4, 0; CRRC:%5 GPRC:%4 | 
 | ///        %8 = LXSDX %zero8, killed %7, implicit %rm; | 
 | ///                    mem:LD8[ConstantPool] F8RC:%8 G8RC:%7 | 
 | ///        BCC 76, %5, <%bb.2>; CRRC:%5 | 
 | ///    Successors according to CFG: %bb.1(?%) %bb.2(?%) | 
 | /// | 
 | /// %bb.1: derived from LLVM BB %entry | 
 | ///    Predecessors according to CFG: %bb.0 | 
 | ///    Successors according to CFG: %bb.2(?%) | 
 | /// | 
 | /// %bb.2: derived from LLVM BB %entry | 
 | ///    Predecessors according to CFG: %bb.0 %bb.1 | 
 | ///        %9 = PHI %8, <%bb.1>, %0, <%bb.0>; | 
 | ///                    F8RC:%9,%8,%0 | 
 | ///        <SNIP2> | 
 | ///        BCC 76, %5, <%bb.4>; CRRC:%5 | 
 | ///    Successors according to CFG: %bb.3(?%) %bb.4(?%) | 
 | /// | 
 | /// %bb.3: derived from LLVM BB %entry | 
 | ///    Predecessors according to CFG: %bb.2 | 
 | ///    Successors according to CFG: %bb.4(?%) | 
 | /// | 
 | /// %bb.4: derived from LLVM BB %entry | 
 | ///    Predecessors according to CFG: %bb.2 %bb.3 | 
 | ///        %13 = PHI %12, <%bb.3>, %2, <%bb.2>; | 
 | ///                     F8RC:%13,%12,%2 | 
 | ///        <SNIP3> | 
 | ///        BLR8 implicit %lr8, implicit %rm, implicit %f1 | 
 | /// | 
 | /// When this pattern is detected, branch coalescing will try to collapse | 
 | /// it by moving code in %bb.2 to %bb.0 and/or %bb.4 and removing %bb.3. | 
 | /// | 
 | /// If all conditions are meet, IR should collapse to: | 
 | /// | 
 | /// %bb.0: derived from LLVM BB %entry | 
 | ///    liveins: %f1 %f3 %x6 | 
 | ///        <SNIP1> | 
 | ///        %0 = COPY %f1; F8RC:%0 | 
 | ///        %5 = CMPLWI killed %4, 0; CRRC:%5 GPRC:%4 | 
 | ///        %8 = LXSDX %zero8, killed %7, implicit %rm; | 
 | ///                     mem:LD8[ConstantPool] F8RC:%8 G8RC:%7 | 
 | ///        <SNIP2> | 
 | ///        BCC 76, %5, <%bb.4>; CRRC:%5 | 
 | ///    Successors according to CFG: %bb.1(0x2aaaaaaa / 0x80000000 = 33.33%) | 
 | ///      %bb.4(0x55555554 / 0x80000000 = 66.67%) | 
 | /// | 
 | /// %bb.1: derived from LLVM BB %entry | 
 | ///    Predecessors according to CFG: %bb.0 | 
 | ///    Successors according to CFG: %bb.4(0x40000000 / 0x80000000 = 50.00%) | 
 | /// | 
 | /// %bb.4: derived from LLVM BB %entry | 
 | ///    Predecessors according to CFG: %bb.0 %bb.1 | 
 | ///        %9 = PHI %8, <%bb.1>, %0, <%bb.0>; | 
 | ///                    F8RC:%9,%8,%0 | 
 | ///        %13 = PHI %12, <%bb.1>, %2, <%bb.0>; | 
 | ///                     F8RC:%13,%12,%2 | 
 | ///        <SNIP3> | 
 | ///        BLR8 implicit %lr8, implicit %rm, implicit %f1 | 
 | /// | 
 | /// Branch Coalescing does not split blocks, it moves everything in the same | 
 | /// direction ensuring it does not break use/definition semantics. | 
 | /// | 
 | /// PHI nodes and its corresponding use instructions are moved to its successor | 
 | /// block if there are no uses within the successor block PHI nodes.  PHI | 
 | /// node ordering cannot be assumed. | 
 | /// | 
 | /// Non-PHI can be moved up to the predecessor basic block or down to the | 
 | /// successor basic block following any PHI instructions. Whether it moves | 
 | /// up or down depends on whether the register(s) defined in the instructions | 
 | /// are used in current block or in any PHI instructions at the beginning of | 
 | /// the successor block. | 
 |  | 
 | namespace { | 
 |  | 
 | class PPCBranchCoalescing : public MachineFunctionPass { | 
 |   struct CoalescingCandidateInfo { | 
 |     MachineBasicBlock *BranchBlock;       // Block containing the branch | 
 |     MachineBasicBlock *BranchTargetBlock; // Block branched to | 
 |     MachineBasicBlock *FallThroughBlock;  // Fall-through if branch not taken | 
 |     SmallVector<MachineOperand, 4> Cond; | 
 |     bool MustMoveDown; | 
 |     bool MustMoveUp; | 
 |  | 
 |     CoalescingCandidateInfo(); | 
 |     void clear(); | 
 |   }; | 
 |  | 
 |   MachineDominatorTree *MDT; | 
 |   MachinePostDominatorTree *MPDT; | 
 |   const TargetInstrInfo *TII; | 
 |   MachineRegisterInfo *MRI; | 
 |  | 
 |   void initialize(MachineFunction &F); | 
 |   bool canCoalesceBranch(CoalescingCandidateInfo &Cand); | 
 |   bool identicalOperands(ArrayRef<MachineOperand> OperandList1, | 
 |                          ArrayRef<MachineOperand> OperandList2) const; | 
 |   bool validateCandidates(CoalescingCandidateInfo &SourceRegion, | 
 |                           CoalescingCandidateInfo &TargetRegion) const; | 
 |  | 
 | public: | 
 |   static char ID; | 
 |  | 
 |   PPCBranchCoalescing() : MachineFunctionPass(ID) { | 
 |     initializePPCBranchCoalescingPass(*PassRegistry::getPassRegistry()); | 
 |   } | 
 |  | 
 |   void getAnalysisUsage(AnalysisUsage &AU) const override { | 
 |     AU.addRequired<MachineDominatorTree>(); | 
 |     AU.addRequired<MachinePostDominatorTree>(); | 
 |     MachineFunctionPass::getAnalysisUsage(AU); | 
 |   } | 
 |  | 
 |   StringRef getPassName() const override { return "Branch Coalescing"; } | 
 |  | 
 |   bool mergeCandidates(CoalescingCandidateInfo &SourceRegion, | 
 |                        CoalescingCandidateInfo &TargetRegion); | 
 |   bool canMoveToBeginning(const MachineInstr &MI, | 
 |                           const MachineBasicBlock &MBB) const; | 
 |   bool canMoveToEnd(const MachineInstr &MI, | 
 |                     const MachineBasicBlock &MBB) const; | 
 |   bool canMerge(CoalescingCandidateInfo &SourceRegion, | 
 |                 CoalescingCandidateInfo &TargetRegion) const; | 
 |   void moveAndUpdatePHIs(MachineBasicBlock *SourceRegionMBB, | 
 |                          MachineBasicBlock *TargetRegionMBB); | 
 |   bool runOnMachineFunction(MachineFunction &MF) override; | 
 | }; | 
 | } // End anonymous namespace. | 
 |  | 
 | char PPCBranchCoalescing::ID = 0; | 
 | /// createPPCBranchCoalescingPass - returns an instance of the Branch Coalescing | 
 | /// Pass | 
 | FunctionPass *llvm::createPPCBranchCoalescingPass() { | 
 |   return new PPCBranchCoalescing(); | 
 | } | 
 |  | 
 | INITIALIZE_PASS_BEGIN(PPCBranchCoalescing, DEBUG_TYPE, | 
 |                       "Branch Coalescing", false, false) | 
 | INITIALIZE_PASS_DEPENDENCY(MachineDominatorTree) | 
 | INITIALIZE_PASS_DEPENDENCY(MachinePostDominatorTree) | 
 | INITIALIZE_PASS_END(PPCBranchCoalescing, DEBUG_TYPE, "Branch Coalescing", | 
 |                     false, false) | 
 |  | 
 | PPCBranchCoalescing::CoalescingCandidateInfo::CoalescingCandidateInfo() | 
 |     : BranchBlock(nullptr), BranchTargetBlock(nullptr), | 
 |       FallThroughBlock(nullptr), MustMoveDown(false), MustMoveUp(false) {} | 
 |  | 
 | void PPCBranchCoalescing::CoalescingCandidateInfo::clear() { | 
 |   BranchBlock = nullptr; | 
 |   BranchTargetBlock = nullptr; | 
 |   FallThroughBlock = nullptr; | 
 |   Cond.clear(); | 
 |   MustMoveDown = false; | 
 |   MustMoveUp = false; | 
 | } | 
 |  | 
 | void PPCBranchCoalescing::initialize(MachineFunction &MF) { | 
 |   MDT = &getAnalysis<MachineDominatorTree>(); | 
 |   MPDT = &getAnalysis<MachinePostDominatorTree>(); | 
 |   TII = MF.getSubtarget().getInstrInfo(); | 
 |   MRI = &MF.getRegInfo(); | 
 | } | 
 |  | 
 | /// | 
 | /// Analyze the branch statement to determine if it can be coalesced. This | 
 | /// method analyses the branch statement for the given candidate to determine | 
 | /// if it can be coalesced. If the branch can be coalesced, then the | 
 | /// BranchTargetBlock and the FallThroughBlock are recorded in the specified | 
 | /// Candidate. | 
 | /// | 
 | ///\param[in,out] Cand The coalescing candidate to analyze | 
 | ///\return true if and only if the branch can be coalesced, false otherwise | 
 | /// | 
 | bool PPCBranchCoalescing::canCoalesceBranch(CoalescingCandidateInfo &Cand) { | 
 |   LLVM_DEBUG(dbgs() << "Determine if branch block " | 
 |                     << Cand.BranchBlock->getNumber() << " can be coalesced:"); | 
 |   MachineBasicBlock *FalseMBB = nullptr; | 
 |  | 
 |   if (TII->analyzeBranch(*Cand.BranchBlock, Cand.BranchTargetBlock, FalseMBB, | 
 |                          Cand.Cond)) { | 
 |     LLVM_DEBUG(dbgs() << "TII unable to Analyze Branch - skip\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   for (auto &I : Cand.BranchBlock->terminators()) { | 
 |     LLVM_DEBUG(dbgs() << "Looking at terminator : " << I << "\n"); | 
 |     if (!I.isBranch()) | 
 |       continue; | 
 |  | 
 |     // The analyzeBranch method does not include any implicit operands. | 
 |     // This is not an issue on PPC but must be handled on other targets. | 
 |     // For this pass to be made target-independent, the analyzeBranch API | 
 |     // need to be updated to support implicit operands and there would | 
 |     // need to be a way to verify that any implicit operands would not be | 
 |     // clobbered by merging blocks.  This would include identifying the | 
 |     // implicit operands as well as the basic block they are defined in. | 
 |     // This could be done by changing the analyzeBranch API to have it also | 
 |     // record and return the implicit operands and the blocks where they are | 
 |     // defined. Alternatively, the BranchCoalescing code would need to be | 
 |     // extended to identify the implicit operands.  The analysis in canMerge | 
 |     // must then be extended to prove that none of the implicit operands are | 
 |     // changed in the blocks that are combined during coalescing. | 
 |     if (I.getNumOperands() != I.getNumExplicitOperands()) { | 
 |       LLVM_DEBUG(dbgs() << "Terminator contains implicit operands - skip : " | 
 |                         << I << "\n"); | 
 |       return false; | 
 |     } | 
 |   } | 
 |  | 
 |   if (Cand.BranchBlock->isEHPad() || Cand.BranchBlock->hasEHPadSuccessor()) { | 
 |     LLVM_DEBUG(dbgs() << "EH Pad - skip\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   // For now only consider triangles (i.e, BranchTargetBlock is set, | 
 |   // FalseMBB is null, and BranchTargetBlock is a successor to BranchBlock) | 
 |   if (!Cand.BranchTargetBlock || FalseMBB || | 
 |       !Cand.BranchBlock->isSuccessor(Cand.BranchTargetBlock)) { | 
 |     LLVM_DEBUG(dbgs() << "Does not form a triangle - skip\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   // Ensure there are only two successors | 
 |   if (Cand.BranchBlock->succ_size() != 2) { | 
 |     LLVM_DEBUG(dbgs() << "Does not have 2 successors - skip\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   // Sanity check - the block must be able to fall through | 
 |   assert(Cand.BranchBlock->canFallThrough() && | 
 |          "Expecting the block to fall through!"); | 
 |  | 
 |   // We have already ensured there are exactly two successors to | 
 |   // BranchBlock and that BranchTargetBlock is a successor to BranchBlock. | 
 |   // Ensure the single fall though block is empty. | 
 |   MachineBasicBlock *Succ = | 
 |     (*Cand.BranchBlock->succ_begin() == Cand.BranchTargetBlock) | 
 |     ? *Cand.BranchBlock->succ_rbegin() | 
 |     : *Cand.BranchBlock->succ_begin(); | 
 |  | 
 |   assert(Succ && "Expecting a valid fall-through block\n"); | 
 |  | 
 |   if (!Succ->empty()) { | 
 |     LLVM_DEBUG(dbgs() << "Fall-through block contains code -- skip\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   if (!Succ->isSuccessor(Cand.BranchTargetBlock)) { | 
 |     LLVM_DEBUG( | 
 |         dbgs() | 
 |         << "Successor of fall through block is not branch taken block\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   Cand.FallThroughBlock = Succ; | 
 |   LLVM_DEBUG(dbgs() << "Valid Candidate\n"); | 
 |   return true; | 
 | } | 
 |  | 
 | /// | 
 | /// Determine if the two operand lists are identical | 
 | /// | 
 | /// \param[in] OpList1 operand list | 
 | /// \param[in] OpList2 operand list | 
 | /// \return true if and only if the operands lists are identical | 
 | /// | 
 | bool PPCBranchCoalescing::identicalOperands( | 
 |     ArrayRef<MachineOperand> OpList1, ArrayRef<MachineOperand> OpList2) const { | 
 |  | 
 |   if (OpList1.size() != OpList2.size()) { | 
 |     LLVM_DEBUG(dbgs() << "Operand list is different size\n"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   for (unsigned i = 0; i < OpList1.size(); ++i) { | 
 |     const MachineOperand &Op1 = OpList1[i]; | 
 |     const MachineOperand &Op2 = OpList2[i]; | 
 |  | 
 |     LLVM_DEBUG(dbgs() << "Op1: " << Op1 << "\n" | 
 |                       << "Op2: " << Op2 << "\n"); | 
 |  | 
 |     if (Op1.isIdenticalTo(Op2)) { | 
 |       // filter out instructions with physical-register uses | 
 |       if (Op1.isReg() && TargetRegisterInfo::isPhysicalRegister(Op1.getReg()) | 
 |         // If the physical register is constant then we can assume the value | 
 |         // has not changed between uses. | 
 |           && !(Op1.isUse() && MRI->isConstantPhysReg(Op1.getReg()))) { | 
 |         LLVM_DEBUG(dbgs() << "The operands are not provably identical.\n"); | 
 |         return false; | 
 |       } | 
 |       LLVM_DEBUG(dbgs() << "Op1 and Op2 are identical!\n"); | 
 |       continue; | 
 |     } | 
 |  | 
 |     // If the operands are not identical, but are registers, check to see if the | 
 |     // definition of the register produces the same value. If they produce the | 
 |     // same value, consider them to be identical. | 
 |     if (Op1.isReg() && Op2.isReg() && | 
 |         TargetRegisterInfo::isVirtualRegister(Op1.getReg()) && | 
 |         TargetRegisterInfo::isVirtualRegister(Op2.getReg())) { | 
 |       MachineInstr *Op1Def = MRI->getVRegDef(Op1.getReg()); | 
 |       MachineInstr *Op2Def = MRI->getVRegDef(Op2.getReg()); | 
 |       if (TII->produceSameValue(*Op1Def, *Op2Def, MRI)) { | 
 |         LLVM_DEBUG(dbgs() << "Op1Def: " << *Op1Def << " and " << *Op2Def | 
 |                           << " produce the same value!\n"); | 
 |       } else { | 
 |         LLVM_DEBUG(dbgs() << "Operands produce different values\n"); | 
 |         return false; | 
 |       } | 
 |     } else { | 
 |       LLVM_DEBUG(dbgs() << "The operands are not provably identical.\n"); | 
 |       return false; | 
 |     } | 
 |   } | 
 |  | 
 |   return true; | 
 | } | 
 |  | 
 | /// | 
 | /// Moves ALL PHI instructions in SourceMBB to beginning of TargetMBB | 
 | /// and update them to refer to the new block.  PHI node ordering | 
 | /// cannot be assumed so it does not matter where the PHI instructions | 
 | /// are moved to in TargetMBB. | 
 | /// | 
 | /// \param[in] SourceMBB block to move PHI instructions from | 
 | /// \param[in] TargetMBB block to move PHI instructions to | 
 | /// | 
 | void PPCBranchCoalescing::moveAndUpdatePHIs(MachineBasicBlock *SourceMBB, | 
 |                                          MachineBasicBlock *TargetMBB) { | 
 |  | 
 |   MachineBasicBlock::iterator MI = SourceMBB->begin(); | 
 |   MachineBasicBlock::iterator ME = SourceMBB->getFirstNonPHI(); | 
 |  | 
 |   if (MI == ME) { | 
 |     LLVM_DEBUG(dbgs() << "SourceMBB contains no PHI instructions.\n"); | 
 |     return; | 
 |   } | 
 |  | 
 |   // Update all PHI instructions in SourceMBB and move to top of TargetMBB | 
 |   for (MachineBasicBlock::iterator Iter = MI; Iter != ME; Iter++) { | 
 |     MachineInstr &PHIInst = *Iter; | 
 |     for (unsigned i = 2, e = PHIInst.getNumOperands() + 1; i != e; i += 2) { | 
 |       MachineOperand &MO = PHIInst.getOperand(i); | 
 |       if (MO.getMBB() == SourceMBB) | 
 |         MO.setMBB(TargetMBB); | 
 |     } | 
 |   } | 
 |   TargetMBB->splice(TargetMBB->begin(), SourceMBB, MI, ME); | 
 | } | 
 |  | 
 | /// | 
 | /// This function checks if MI can be moved to the beginning of the TargetMBB | 
 | /// following PHI instructions. A MI instruction can be moved to beginning of | 
 | /// the TargetMBB if there are no uses of it within the TargetMBB PHI nodes. | 
 | /// | 
 | /// \param[in] MI the machine instruction to move. | 
 | /// \param[in] TargetMBB the machine basic block to move to | 
 | /// \return true if it is safe to move MI to beginning of TargetMBB, | 
 | ///         false otherwise. | 
 | /// | 
 | bool PPCBranchCoalescing::canMoveToBeginning(const MachineInstr &MI, | 
 |                                           const MachineBasicBlock &TargetMBB | 
 |                                           ) const { | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "Checking if " << MI << " can move to beginning of " | 
 |                     << TargetMBB.getNumber() << "\n"); | 
 |  | 
 |   for (auto &Def : MI.defs()) { // Looking at Def | 
 |     for (auto &Use : MRI->use_instructions(Def.getReg())) { | 
 |       if (Use.isPHI() && Use.getParent() == &TargetMBB) { | 
 |         LLVM_DEBUG(dbgs() << "    *** used in a PHI -- cannot move ***\n"); | 
 |         return false; | 
 |       } | 
 |     } | 
 |   } | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "  Safe to move to the beginning.\n"); | 
 |   return true; | 
 | } | 
 |  | 
 | /// | 
 | /// This function checks if MI can be moved to the end of the TargetMBB, | 
 | /// immediately before the first terminator.  A MI instruction can be moved | 
 | /// to then end of the TargetMBB if no PHI node defines what MI uses within | 
 | /// it's own MBB. | 
 | /// | 
 | /// \param[in] MI the machine instruction to move. | 
 | /// \param[in] TargetMBB the machine basic block to move to | 
 | /// \return true if it is safe to move MI to end of TargetMBB, | 
 | ///         false otherwise. | 
 | /// | 
 | bool PPCBranchCoalescing::canMoveToEnd(const MachineInstr &MI, | 
 |                                     const MachineBasicBlock &TargetMBB | 
 |                                     ) const { | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "Checking if " << MI << " can move to end of " | 
 |                     << TargetMBB.getNumber() << "\n"); | 
 |  | 
 |   for (auto &Use : MI.uses()) { | 
 |     if (Use.isReg() && TargetRegisterInfo::isVirtualRegister(Use.getReg())) { | 
 |       MachineInstr *DefInst = MRI->getVRegDef(Use.getReg()); | 
 |       if (DefInst->isPHI() && DefInst->getParent() == MI.getParent()) { | 
 |         LLVM_DEBUG(dbgs() << "    *** Cannot move this instruction ***\n"); | 
 |         return false; | 
 |       } else { | 
 |         LLVM_DEBUG( | 
 |             dbgs() << "    *** def is in another block -- safe to move!\n"); | 
 |       } | 
 |     } | 
 |   } | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "  Safe to move to the end.\n"); | 
 |   return true; | 
 | } | 
 |  | 
 | /// | 
 | /// This method checks to ensure the two coalescing candidates follows the | 
 | /// expected pattern required for coalescing. | 
 | /// | 
 | /// \param[in] SourceRegion The candidate to move statements from | 
 | /// \param[in] TargetRegion The candidate to move statements to | 
 | /// \return true if all instructions in SourceRegion.BranchBlock can be merged | 
 | /// into a block in TargetRegion; false otherwise. | 
 | /// | 
 | bool PPCBranchCoalescing::validateCandidates( | 
 |     CoalescingCandidateInfo &SourceRegion, | 
 |     CoalescingCandidateInfo &TargetRegion) const { | 
 |  | 
 |   if (TargetRegion.BranchTargetBlock != SourceRegion.BranchBlock) | 
 |     llvm_unreachable("Expecting SourceRegion to immediately follow TargetRegion"); | 
 |   else if (!MDT->dominates(TargetRegion.BranchBlock, SourceRegion.BranchBlock)) | 
 |     llvm_unreachable("Expecting TargetRegion to dominate SourceRegion"); | 
 |   else if (!MPDT->dominates(SourceRegion.BranchBlock, TargetRegion.BranchBlock)) | 
 |     llvm_unreachable("Expecting SourceRegion to post-dominate TargetRegion"); | 
 |   else if (!TargetRegion.FallThroughBlock->empty() || | 
 |            !SourceRegion.FallThroughBlock->empty()) | 
 |     llvm_unreachable("Expecting fall-through blocks to be empty"); | 
 |  | 
 |   return true; | 
 | } | 
 |  | 
 | /// | 
 | /// This method determines whether the two coalescing candidates can be merged. | 
 | /// In order to be merged, all instructions must be able to | 
 | ///   1. Move to the beginning of the SourceRegion.BranchTargetBlock; | 
 | ///   2. Move to the end of the TargetRegion.BranchBlock. | 
 | /// Merging involves moving the instructions in the | 
 | /// TargetRegion.BranchTargetBlock (also SourceRegion.BranchBlock). | 
 | /// | 
 | /// This function first try to move instructions from the | 
 | /// TargetRegion.BranchTargetBlock down, to the beginning of the | 
 | /// SourceRegion.BranchTargetBlock. This is not possible if any register defined | 
 | /// in TargetRegion.BranchTargetBlock is used in a PHI node in the | 
 | /// SourceRegion.BranchTargetBlock. In this case, check whether the statement | 
 | /// can be moved up, to the end of the TargetRegion.BranchBlock (immediately | 
 | /// before the branch statement). If it cannot move, then these blocks cannot | 
 | /// be merged. | 
 | /// | 
 | /// Note that there is no analysis for moving instructions past the fall-through | 
 | /// blocks because they are confirmed to be empty. An assert is thrown if they | 
 | /// are not. | 
 | /// | 
 | /// \param[in] SourceRegion The candidate to move statements from | 
 | /// \param[in] TargetRegion The candidate to move statements to | 
 | /// \return true if all instructions in SourceRegion.BranchBlock can be merged | 
 | ///         into a block in TargetRegion, false otherwise. | 
 | /// | 
 | bool PPCBranchCoalescing::canMerge(CoalescingCandidateInfo &SourceRegion, | 
 |                                 CoalescingCandidateInfo &TargetRegion) const { | 
 |   if (!validateCandidates(SourceRegion, TargetRegion)) | 
 |     return false; | 
 |  | 
 |   // Walk through PHI nodes first and see if they force the merge into the | 
 |   // SourceRegion.BranchTargetBlock. | 
 |   for (MachineBasicBlock::iterator | 
 |            I = SourceRegion.BranchBlock->instr_begin(), | 
 |            E = SourceRegion.BranchBlock->getFirstNonPHI(); | 
 |        I != E; ++I) { | 
 |     for (auto &Def : I->defs()) | 
 |       for (auto &Use : MRI->use_instructions(Def.getReg())) { | 
 |         if (Use.isPHI() && Use.getParent() == SourceRegion.BranchTargetBlock) { | 
 |           LLVM_DEBUG(dbgs() | 
 |                      << "PHI " << *I | 
 |                      << " defines register used in another " | 
 |                         "PHI within branch target block -- can't merge\n"); | 
 |           NumPHINotMoved++; | 
 |           return false; | 
 |         } | 
 |         if (Use.getParent() == SourceRegion.BranchBlock) { | 
 |           LLVM_DEBUG(dbgs() << "PHI " << *I | 
 |                             << " defines register used in this " | 
 |                                "block -- all must move down\n"); | 
 |           SourceRegion.MustMoveDown = true; | 
 |         } | 
 |       } | 
 |   } | 
 |  | 
 |   // Walk through the MI to see if they should be merged into | 
 |   // TargetRegion.BranchBlock (up) or SourceRegion.BranchTargetBlock (down) | 
 |   for (MachineBasicBlock::iterator | 
 |            I = SourceRegion.BranchBlock->getFirstNonPHI(), | 
 |            E = SourceRegion.BranchBlock->end(); | 
 |        I != E; ++I) { | 
 |     if (!canMoveToBeginning(*I, *SourceRegion.BranchTargetBlock)) { | 
 |       LLVM_DEBUG(dbgs() << "Instruction " << *I | 
 |                         << " cannot move down - must move up!\n"); | 
 |       SourceRegion.MustMoveUp = true; | 
 |     } | 
 |     if (!canMoveToEnd(*I, *TargetRegion.BranchBlock)) { | 
 |       LLVM_DEBUG(dbgs() << "Instruction " << *I | 
 |                         << " cannot move up - must move down!\n"); | 
 |       SourceRegion.MustMoveDown = true; | 
 |     } | 
 |   } | 
 |  | 
 |   return (SourceRegion.MustMoveUp && SourceRegion.MustMoveDown) ? false : true; | 
 | } | 
 |  | 
 | /// Merge the instructions from SourceRegion.BranchBlock, | 
 | /// SourceRegion.BranchTargetBlock, and SourceRegion.FallThroughBlock into | 
 | /// TargetRegion.BranchBlock, TargetRegion.BranchTargetBlock and | 
 | /// TargetRegion.FallThroughBlock respectively. | 
 | /// | 
 | /// The successors for blocks in TargetRegion will be updated to use the | 
 | /// successors from blocks in SourceRegion. Finally, the blocks in SourceRegion | 
 | /// will be removed from the function. | 
 | /// | 
 | /// A region consists of a BranchBlock, a FallThroughBlock, and a | 
 | /// BranchTargetBlock. Branch coalesce works on patterns where the | 
 | /// TargetRegion's BranchTargetBlock must also be the SourceRegions's | 
 | /// BranchBlock. | 
 | /// | 
 | ///  Before mergeCandidates: | 
 | /// | 
 | ///  +---------------------------+ | 
 | ///  |  TargetRegion.BranchBlock | | 
 | ///  +---------------------------+ | 
 | ///     /        | | 
 | ///    /   +--------------------------------+ | 
 | ///   |    |  TargetRegion.FallThroughBlock | | 
 | ///    \   +--------------------------------+ | 
 | ///     \        | | 
 | ///  +----------------------------------+ | 
 | ///  |  TargetRegion.BranchTargetBlock  | | 
 | ///  |  SourceRegion.BranchBlock        | | 
 | ///  +----------------------------------+ | 
 | ///     /        | | 
 | ///    /   +--------------------------------+ | 
 | ///   |    |  SourceRegion.FallThroughBlock | | 
 | ///    \   +--------------------------------+ | 
 | ///     \        | | 
 | ///  +----------------------------------+ | 
 | ///  |  SourceRegion.BranchTargetBlock  | | 
 | ///  +----------------------------------+ | 
 | /// | 
 | ///  After mergeCandidates: | 
 | /// | 
 | ///  +-----------------------------+ | 
 | ///  |  TargetRegion.BranchBlock   | | 
 | ///  |  SourceRegion.BranchBlock   | | 
 | ///  +-----------------------------+ | 
 | ///     /        | | 
 | ///    /   +---------------------------------+ | 
 | ///   |    |  TargetRegion.FallThroughBlock  | | 
 | ///   |    |  SourceRegion.FallThroughBlock  | | 
 | ///    \   +---------------------------------+ | 
 | ///     \        | | 
 | ///  +----------------------------------+ | 
 | ///  |  SourceRegion.BranchTargetBlock  | | 
 | ///  +----------------------------------+ | 
 | /// | 
 | /// \param[in] SourceRegion The candidate to move blocks from | 
 | /// \param[in] TargetRegion The candidate to move blocks to | 
 | /// | 
 | bool PPCBranchCoalescing::mergeCandidates(CoalescingCandidateInfo &SourceRegion, | 
 |                                        CoalescingCandidateInfo &TargetRegion) { | 
 |  | 
 |   if (SourceRegion.MustMoveUp && SourceRegion.MustMoveDown) { | 
 |     llvm_unreachable("Cannot have both MustMoveDown and MustMoveUp set!"); | 
 |     return false; | 
 |   } | 
 |  | 
 |   if (!validateCandidates(SourceRegion, TargetRegion)) | 
 |     return false; | 
 |  | 
 |   // Start the merging process by first handling the BranchBlock. | 
 |   // Move any PHIs in SourceRegion.BranchBlock down to the branch-taken block | 
 |   moveAndUpdatePHIs(SourceRegion.BranchBlock, SourceRegion.BranchTargetBlock); | 
 |  | 
 |   // Move remaining instructions in SourceRegion.BranchBlock into | 
 |   // TargetRegion.BranchBlock | 
 |   MachineBasicBlock::iterator firstInstr = | 
 |       SourceRegion.BranchBlock->getFirstNonPHI(); | 
 |   MachineBasicBlock::iterator lastInstr = | 
 |       SourceRegion.BranchBlock->getFirstTerminator(); | 
 |  | 
 |   MachineBasicBlock *Source = SourceRegion.MustMoveDown | 
 |                                   ? SourceRegion.BranchTargetBlock | 
 |                                   : TargetRegion.BranchBlock; | 
 |  | 
 |   MachineBasicBlock::iterator Target = | 
 |       SourceRegion.MustMoveDown | 
 |           ? SourceRegion.BranchTargetBlock->getFirstNonPHI() | 
 |           : TargetRegion.BranchBlock->getFirstTerminator(); | 
 |  | 
 |   Source->splice(Target, SourceRegion.BranchBlock, firstInstr, lastInstr); | 
 |  | 
 |   // Once PHI and instructions have been moved we need to clean up the | 
 |   // control flow. | 
 |  | 
 |   // Remove SourceRegion.FallThroughBlock before transferring successors of | 
 |   // SourceRegion.BranchBlock to TargetRegion.BranchBlock. | 
 |   SourceRegion.BranchBlock->removeSuccessor(SourceRegion.FallThroughBlock); | 
 |   TargetRegion.BranchBlock->transferSuccessorsAndUpdatePHIs( | 
 |       SourceRegion.BranchBlock); | 
 |   // Update branch in TargetRegion.BranchBlock to jump to | 
 |   // SourceRegion.BranchTargetBlock | 
 |   // In this case, TargetRegion.BranchTargetBlock == SourceRegion.BranchBlock. | 
 |   TargetRegion.BranchBlock->ReplaceUsesOfBlockWith( | 
 |       SourceRegion.BranchBlock, SourceRegion.BranchTargetBlock); | 
 |   // Remove the branch statement(s) in SourceRegion.BranchBlock | 
 |   MachineBasicBlock::iterator I = | 
 |       SourceRegion.BranchBlock->terminators().begin(); | 
 |   while (I != SourceRegion.BranchBlock->terminators().end()) { | 
 |     MachineInstr &CurrInst = *I; | 
 |     ++I; | 
 |     if (CurrInst.isBranch()) | 
 |       CurrInst.eraseFromParent(); | 
 |   } | 
 |  | 
 |   // Fall-through block should be empty since this is part of the condition | 
 |   // to coalesce the branches. | 
 |   assert(TargetRegion.FallThroughBlock->empty() && | 
 |          "FallThroughBlocks should be empty!"); | 
 |  | 
 |   // Transfer successor information and move PHIs down to the | 
 |   // branch-taken block. | 
 |   TargetRegion.FallThroughBlock->transferSuccessorsAndUpdatePHIs( | 
 |       SourceRegion.FallThroughBlock); | 
 |   TargetRegion.FallThroughBlock->removeSuccessor(SourceRegion.BranchBlock); | 
 |  | 
 |   // Remove the blocks from the function. | 
 |   assert(SourceRegion.BranchBlock->empty() && | 
 |          "Expecting branch block to be empty!"); | 
 |   SourceRegion.BranchBlock->eraseFromParent(); | 
 |  | 
 |   assert(SourceRegion.FallThroughBlock->empty() && | 
 |          "Expecting fall-through block to be empty!\n"); | 
 |   SourceRegion.FallThroughBlock->eraseFromParent(); | 
 |  | 
 |   NumBlocksCoalesced++; | 
 |   return true; | 
 | } | 
 |  | 
 | bool PPCBranchCoalescing::runOnMachineFunction(MachineFunction &MF) { | 
 |  | 
 |   if (skipFunction(MF.getFunction()) || MF.empty()) | 
 |     return false; | 
 |  | 
 |   bool didSomething = false; | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "******** Branch Coalescing ********\n"); | 
 |   initialize(MF); | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "Function: "; MF.dump(); dbgs() << "\n"); | 
 |  | 
 |   CoalescingCandidateInfo Cand1, Cand2; | 
 |   // Walk over blocks and find candidates to merge | 
 |   // Continue trying to merge with the first candidate found, as long as merging | 
 |   // is successfull. | 
 |   for (MachineBasicBlock &MBB : MF) { | 
 |     bool MergedCandidates = false; | 
 |     do { | 
 |       MergedCandidates = false; | 
 |       Cand1.clear(); | 
 |       Cand2.clear(); | 
 |  | 
 |       Cand1.BranchBlock = &MBB; | 
 |  | 
 |       // If unable to coalesce the branch, then continue to next block | 
 |       if (!canCoalesceBranch(Cand1)) | 
 |         break; | 
 |  | 
 |       Cand2.BranchBlock = Cand1.BranchTargetBlock; | 
 |       if (!canCoalesceBranch(Cand2)) | 
 |         break; | 
 |  | 
 |       // Sanity check | 
 |       // The branch-taken block of the second candidate should post-dominate the | 
 |       // first candidate | 
 |       assert(MPDT->dominates(Cand2.BranchTargetBlock, Cand1.BranchBlock) && | 
 |              "Branch-taken block should post-dominate first candidate"); | 
 |  | 
 |       if (!identicalOperands(Cand1.Cond, Cand2.Cond)) { | 
 |         LLVM_DEBUG(dbgs() << "Blocks " << Cand1.BranchBlock->getNumber() | 
 |                           << " and " << Cand2.BranchBlock->getNumber() | 
 |                           << " have different branches\n"); | 
 |         break; | 
 |       } | 
 |       if (!canMerge(Cand2, Cand1)) { | 
 |         LLVM_DEBUG(dbgs() << "Cannot merge blocks " | 
 |                           << Cand1.BranchBlock->getNumber() << " and " | 
 |                           << Cand2.BranchBlock->getNumber() << "\n"); | 
 |         NumBlocksNotCoalesced++; | 
 |         continue; | 
 |       } | 
 |       LLVM_DEBUG(dbgs() << "Merging blocks " << Cand1.BranchBlock->getNumber() | 
 |                         << " and " << Cand1.BranchTargetBlock->getNumber() | 
 |                         << "\n"); | 
 |       MergedCandidates = mergeCandidates(Cand2, Cand1); | 
 |       if (MergedCandidates) | 
 |         didSomething = true; | 
 |  | 
 |       LLVM_DEBUG(dbgs() << "Function after merging: "; MF.dump(); | 
 |                  dbgs() << "\n"); | 
 |     } while (MergedCandidates); | 
 |   } | 
 |  | 
 | #ifndef NDEBUG | 
 |   // Verify MF is still valid after branch coalescing | 
 |   if (didSomething) | 
 |     MF.verify(nullptr, "Error in code produced by branch coalescing"); | 
 | #endif // NDEBUG | 
 |  | 
 |   LLVM_DEBUG(dbgs() << "Finished Branch Coalescing\n"); | 
 |   return didSomething; | 
 | } |