//===-- CodePlacementOpt.cpp - Code Placement pass. -----------------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file implements the pass that optimizes code placement and aligns loop // headers to target-specific alignment boundaries. // //===----------------------------------------------------------------------===// #define DEBUG_TYPE "code-placement" #include "llvm/CodeGen/MachineLoopInfo.h" #include "llvm/CodeGen/MachineFunctionPass.h" #include "llvm/CodeGen/Passes.h" #include "llvm/Target/TargetInstrInfo.h" #include "llvm/Target/TargetLowering.h" #include "llvm/Target/TargetMachine.h" #include "llvm/Support/Compiler.h" #include "llvm/Support/Debug.h" #include "llvm/ADT/Statistic.h" using namespace llvm; STATISTIC(NumLoopsAligned, "Number of loops aligned"); STATISTIC(NumIntraElim, "Number of intra loop branches eliminated"); STATISTIC(NumIntraMoved, "Number of intra loop branches moved"); namespace { class CodePlacementOpt : public MachineFunctionPass { const MachineLoopInfo *MLI; const TargetInstrInfo *TII; const TargetLowering *TLI; public: static char ID; CodePlacementOpt() : MachineFunctionPass(ID) {} virtual bool runOnMachineFunction(MachineFunction &MF); virtual const char *getPassName() const { return "Code Placement Optimizer"; } virtual void getAnalysisUsage(AnalysisUsage &AU) const { AU.addRequired<MachineLoopInfo>(); AU.addPreservedID(MachineDominatorsID); MachineFunctionPass::getAnalysisUsage(AU); } private: bool HasFallthrough(MachineBasicBlock *MBB); bool HasAnalyzableTerminator(MachineBasicBlock *MBB); void Splice(MachineFunction &MF, MachineFunction::iterator InsertPt, MachineFunction::iterator Begin, MachineFunction::iterator End); bool EliminateUnconditionalJumpsToTop(MachineFunction &MF, MachineLoop *L); bool MoveDiscontiguousLoopBlocks(MachineFunction &MF, MachineLoop *L); bool OptimizeIntraLoopEdgesInLoopNest(MachineFunction &MF, MachineLoop *L); bool OptimizeIntraLoopEdges(MachineFunction &MF); bool AlignLoops(MachineFunction &MF); bool AlignLoop(MachineFunction &MF, MachineLoop *L, unsigned Align); }; char CodePlacementOpt::ID = 0; } // end anonymous namespace FunctionPass *llvm::createCodePlacementOptPass() { return new CodePlacementOpt(); } /// HasFallthrough - Test whether the given branch has a fallthrough, either as /// a plain fallthrough or as a fallthrough case of a conditional branch. /// bool CodePlacementOpt::HasFallthrough(MachineBasicBlock *MBB) { MachineBasicBlock *TBB = 0, *FBB = 0; SmallVector<MachineOperand, 4> Cond; if (TII->AnalyzeBranch(*MBB, TBB, FBB, Cond)) return false; // This conditional branch has no fallthrough. if (FBB) return false; // An unconditional branch has no fallthrough. if (Cond.empty() && TBB) return false; // It has a fallthrough. return true; } /// HasAnalyzableTerminator - Test whether AnalyzeBranch will succeed on MBB. /// This is called before major changes are begun to test whether it will be /// possible to complete the changes. /// /// Target-specific code is hereby encouraged to make AnalyzeBranch succeed /// whenever possible. /// bool CodePlacementOpt::HasAnalyzableTerminator(MachineBasicBlock *MBB) { // Conservatively ignore EH landing pads. if (MBB->isLandingPad()) return false; // Aggressively handle return blocks and similar constructs. if (MBB->succ_empty()) return true; // Ask the target's AnalyzeBranch if it can handle this block. MachineBasicBlock *TBB = 0, *FBB = 0; SmallVector<MachineOperand, 4> Cond; // Make sure the terminator is understood. if (TII->AnalyzeBranch(*MBB, TBB, FBB, Cond)) return false; // Ignore blocks which look like they might have EH-related control flow. // AnalyzeBranch thinks it knows how to analyze such things, but it doesn't // recognize the possibility of a control transfer through an unwind. // Such blocks contain EH_LABEL instructions, however they may be in the // middle of the block. Instead of searching for them, just check to see // if the CFG disagrees with AnalyzeBranch. if (1u + !Cond.empty() != MBB->succ_size()) return false; // Make sure we have the option of reversing the condition. if (!Cond.empty() && TII->ReverseBranchCondition(Cond)) return false; return true; } /// Splice - Move the sequence of instructions [Begin,End) to just before /// InsertPt. Update branch instructions as needed to account for broken /// fallthrough edges and to take advantage of newly exposed fallthrough /// opportunities. /// void CodePlacementOpt::Splice(MachineFunction &MF, MachineFunction::iterator InsertPt, MachineFunction::iterator Begin, MachineFunction::iterator End) { assert(Begin != MF.begin() && End != MF.begin() && InsertPt != MF.begin() && "Splice can't change the entry block!"); MachineFunction::iterator OldBeginPrior = prior(Begin); MachineFunction::iterator OldEndPrior = prior(End); MF.splice(InsertPt, Begin, End); prior(Begin)->updateTerminator(); OldBeginPrior->updateTerminator(); OldEndPrior->updateTerminator(); } /// EliminateUnconditionalJumpsToTop - Move blocks which unconditionally jump /// to the loop top to the top of the loop so that they have a fall through. /// This can introduce a branch on entry to the loop, but it can eliminate a /// branch within the loop. See the @simple case in /// test/CodeGen/X86/loop_blocks.ll for an example of this. bool CodePlacementOpt::EliminateUnconditionalJumpsToTop(MachineFunction &MF, MachineLoop *L) { bool Changed = false; MachineBasicBlock *TopMBB = L->getTopBlock(); bool BotHasFallthrough = HasFallthrough(L->getBottomBlock()); if (TopMBB == MF.begin() || HasAnalyzableTerminator(prior(MachineFunction::iterator(TopMBB)))) { new_top: for (MachineBasicBlock::pred_iterator PI = TopMBB->pred_begin(), PE = TopMBB->pred_end(); PI != PE; ++PI) { MachineBasicBlock *Pred = *PI; if (Pred == TopMBB) continue; if (HasFallthrough(Pred)) continue; if (!L->contains(Pred)) continue; // Verify that we can analyze all the loop entry edges before beginning // any changes which will require us to be able to analyze them. if (Pred == MF.begin()) continue; if (!HasAnalyzableTerminator(Pred)) continue; if (!HasAnalyzableTerminator(prior(MachineFunction::iterator(Pred)))) continue; // Move the block. DEBUG(dbgs() << "CGP: Moving blocks starting at BB#" << Pred->getNumber() << " to top of loop.\n"); Changed = true; // Move it and all the blocks that can reach it via fallthrough edges // exclusively, to keep existing fallthrough edges intact. MachineFunction::iterator Begin = Pred; MachineFunction::iterator End = llvm::next(Begin); while (Begin != MF.begin()) { MachineFunction::iterator Prior = prior(Begin); if (Prior == MF.begin()) break; // Stop when a non-fallthrough edge is found. if (!HasFallthrough(Prior)) break; // Stop if a block which could fall-through out of the loop is found. if (Prior->isSuccessor(End)) break; // If we've reached the top, stop scanning. if (Prior == MachineFunction::iterator(TopMBB)) { // We know top currently has a fall through (because we just checked // it) which would be lost if we do the transformation, so it isn't // worthwhile to do the transformation unless it would expose a new // fallthrough edge. if (!Prior->isSuccessor(End)) goto next_pred; // Otherwise we can stop scanning and procede to move the blocks. break; } // If we hit a switch or something complicated, don't move anything // for this predecessor. if (!HasAnalyzableTerminator(prior(MachineFunction::iterator(Prior)))) break; // Ok, the block prior to Begin will be moved along with the rest. // Extend the range to include it. Begin = Prior; ++NumIntraMoved; } // Move the blocks. Splice(MF, TopMBB, Begin, End); // Update TopMBB. TopMBB = L->getTopBlock(); // We have a new loop top. Iterate on it. We shouldn't have to do this // too many times if BranchFolding has done a reasonable job. goto new_top; next_pred:; } } // If the loop previously didn't exit with a fall-through and it now does, // we eliminated a branch. if (Changed && !BotHasFallthrough && HasFallthrough(L->getBottomBlock())) { ++NumIntraElim; } return Changed; } /// MoveDiscontiguousLoopBlocks - Move any loop blocks that are not in the /// portion of the loop contiguous with the header. This usually makes the loop /// contiguous, provided that AnalyzeBranch can handle all the relevant /// branching. See the @cfg_islands case in test/CodeGen/X86/loop_blocks.ll /// for an example of this. bool CodePlacementOpt::MoveDiscontiguousLoopBlocks(MachineFunction &MF, MachineLoop *L) { bool Changed = false; MachineBasicBlock *TopMBB = L->getTopBlock(); MachineBasicBlock *BotMBB = L->getBottomBlock(); // Determine a position to move orphaned loop blocks to. If TopMBB is not // entered via fallthrough and BotMBB is exited via fallthrough, prepend them // to the top of the loop to avoid losing that fallthrough. Otherwise append // them to the bottom, even if it previously had a fallthrough, on the theory // that it's worth an extra branch to keep the loop contiguous. MachineFunction::iterator InsertPt = llvm::next(MachineFunction::iterator(BotMBB)); bool InsertAtTop = false; if (TopMBB != MF.begin() && !HasFallthrough(prior(MachineFunction::iterator(TopMBB))) && HasFallthrough(BotMBB)) { InsertPt = TopMBB; InsertAtTop = true; } // Keep a record of which blocks are in the portion of the loop contiguous // with the loop header. SmallPtrSet<MachineBasicBlock *, 8> ContiguousBlocks; for (MachineFunction::iterator I = TopMBB, E = llvm::next(MachineFunction::iterator(BotMBB)); I != E; ++I) ContiguousBlocks.insert(I); // Find non-contigous blocks and fix them. if (InsertPt != MF.begin() && HasAnalyzableTerminator(prior(InsertPt))) for (MachineLoop::block_iterator BI = L->block_begin(), BE = L->block_end(); BI != BE; ++BI) { MachineBasicBlock *BB = *BI; // Verify that we can analyze all the loop entry edges before beginning // any changes which will require us to be able to analyze them. if (!HasAnalyzableTerminator(BB)) continue; if (!HasAnalyzableTerminator(prior(MachineFunction::iterator(BB)))) continue; // If the layout predecessor is part of the loop, this block will be // processed along with it. This keeps them in their relative order. if (BB != MF.begin() && L->contains(prior(MachineFunction::iterator(BB)))) continue; // Check to see if this block is already contiguous with the main // portion of the loop. if (!ContiguousBlocks.insert(BB)) continue; // Move the block. DEBUG(dbgs() << "CGP: Moving blocks starting at BB#" << BB->getNumber() << " to be contiguous with loop.\n"); Changed = true; // Process this block and all loop blocks contiguous with it, to keep // them in their relative order. MachineFunction::iterator Begin = BB; MachineFunction::iterator End = llvm::next(MachineFunction::iterator(BB)); for (; End != MF.end(); ++End) { if (!L->contains(End)) break; if (!HasAnalyzableTerminator(End)) break; ContiguousBlocks.insert(End); ++NumIntraMoved; } // If we're inserting at the bottom of the loop, and the code we're // moving originally had fall-through successors, bring the sucessors // up with the loop blocks to preserve the fall-through edges. if (!InsertAtTop) for (; End != MF.end(); ++End) { if (L->contains(End)) break; if (!HasAnalyzableTerminator(End)) break; if (!HasFallthrough(prior(End))) break; } // Move the blocks. This may invalidate TopMBB and/or BotMBB, but // we don't need them anymore at this point. Splice(MF, InsertPt, Begin, End); } return Changed; } /// OptimizeIntraLoopEdgesInLoopNest - Reposition loop blocks to minimize /// intra-loop branching and to form contiguous loops. /// /// This code takes the approach of making minor changes to the existing /// layout to fix specific loop-oriented problems. Also, it depends on /// AnalyzeBranch, which can't understand complex control instructions. /// bool CodePlacementOpt::OptimizeIntraLoopEdgesInLoopNest(MachineFunction &MF, MachineLoop *L) { bool Changed = false; // Do optimization for nested loops. for (MachineLoop::iterator I = L->begin(), E = L->end(); I != E; ++I) Changed |= OptimizeIntraLoopEdgesInLoopNest(MF, *I); // Do optimization for this loop. Changed |= EliminateUnconditionalJumpsToTop(MF, L); Changed |= MoveDiscontiguousLoopBlocks(MF, L); return Changed; } /// OptimizeIntraLoopEdges - Reposition loop blocks to minimize /// intra-loop branching and to form contiguous loops. /// bool CodePlacementOpt::OptimizeIntraLoopEdges(MachineFunction &MF) { bool Changed = false; if (!TLI->shouldOptimizeCodePlacement()) return Changed; // Do optimization for each loop in the function. for (MachineLoopInfo::iterator I = MLI->begin(), E = MLI->end(); I != E; ++I) if (!(*I)->getParentLoop()) Changed |= OptimizeIntraLoopEdgesInLoopNest(MF, *I); return Changed; } /// AlignLoops - Align loop headers to target preferred alignments. /// bool CodePlacementOpt::AlignLoops(MachineFunction &MF) { const Function *F = MF.getFunction(); if (F->hasFnAttr(Attribute::OptimizeForSize)) return false; unsigned Align = TLI->getPrefLoopAlignment(); if (!Align) return false; // Don't care about loop alignment. bool Changed = false; for (MachineLoopInfo::iterator I = MLI->begin(), E = MLI->end(); I != E; ++I) Changed |= AlignLoop(MF, *I, Align); return Changed; } /// AlignLoop - Align loop headers to target preferred alignments. /// bool CodePlacementOpt::AlignLoop(MachineFunction &MF, MachineLoop *L, unsigned Align) { bool Changed = false; // Do alignment for nested loops. for (MachineLoop::iterator I = L->begin(), E = L->end(); I != E; ++I) Changed |= AlignLoop(MF, *I, Align); L->getTopBlock()->setAlignment(Align); Changed = true; ++NumLoopsAligned; return Changed; } bool CodePlacementOpt::runOnMachineFunction(MachineFunction &MF) { MLI = &getAnalysis<MachineLoopInfo>(); if (MLI->empty()) return false; // No loops. TLI = MF.getTarget().getTargetLowering(); TII = MF.getTarget().getInstrInfo(); bool Changed = OptimizeIntraLoopEdges(MF); Changed |= AlignLoops(MF); return Changed; }