| //===---- BlockFrequencyImpl.h - Machine Block Frequency Implementation ---===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // Shared implementation of BlockFrequency for IR and Machine Instructions. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #ifndef LLVM_ANALYSIS_BLOCKFREQUENCYIMPL_H |
| #define LLVM_ANALYSIS_BLOCKFREQUENCYIMPL_H |
| |
| #include "llvm/BasicBlock.h" |
| #include "llvm/ADT/DenseMap.h" |
| #include "llvm/ADT/PostOrderIterator.h" |
| #include "llvm/CodeGen/MachineBasicBlock.h" |
| #include "llvm/CodeGen/MachineFunction.h" |
| #include "llvm/Support/BlockFrequency.h" |
| #include "llvm/Support/BranchProbability.h" |
| #include "llvm/Support/Debug.h" |
| #include "llvm/Support/raw_ostream.h" |
| #include <vector> |
| #include <sstream> |
| #include <string> |
| |
| namespace llvm { |
| |
| |
| class BlockFrequencyInfo; |
| class MachineBlockFrequencyInfo; |
| |
| /// BlockFrequencyImpl implements block frequency algorithm for IR and |
| /// Machine Instructions. Algorithm starts with value 1024 (START_FREQ) |
| /// for the entry block and then propagates frequencies using branch weights |
| /// from (Machine)BranchProbabilityInfo. LoopInfo is not required because |
| /// algorithm can find "backedges" by itself. |
| template<class BlockT, class FunctionT, class BlockProbInfoT> |
| class BlockFrequencyImpl { |
| |
| DenseMap<BlockT *, BlockFrequency> Freqs; |
| |
| BlockProbInfoT *BPI; |
| |
| FunctionT *Fn; |
| |
| typedef GraphTraits< Inverse<BlockT *> > GT; |
| |
| const uint32_t EntryFreq; |
| |
| std::string getBlockName(BasicBlock *BB) const { |
| return BB->getNameStr(); |
| } |
| |
| std::string getBlockName(MachineBasicBlock *MBB) const { |
| std::stringstream ss; |
| ss << "BB#" << MBB->getNumber(); |
| |
| if (const BasicBlock *BB = MBB->getBasicBlock()) |
| ss << " derived from LLVM BB " << BB->getNameStr(); |
| |
| return ss.str(); |
| } |
| |
| void setBlockFreq(BlockT *BB, BlockFrequency Freq) { |
| Freqs[BB] = Freq; |
| DEBUG(dbgs() << "Frequency(" << getBlockName(BB) << ") = " << Freq << "\n"); |
| } |
| |
| /// getEdgeFreq - Return edge frequency based on SRC frequency and Src -> Dst |
| /// edge probability. |
| BlockFrequency getEdgeFreq(BlockT *Src, BlockT *Dst) const { |
| BranchProbability Prob = BPI->getEdgeProbability(Src, Dst); |
| return getBlockFreq(Src) * Prob; |
| } |
| |
| /// incBlockFreq - Increase BB block frequency by FREQ. |
| /// |
| void incBlockFreq(BlockT *BB, BlockFrequency Freq) { |
| Freqs[BB] += Freq; |
| DEBUG(dbgs() << "Frequency(" << getBlockName(BB) << ") += " << Freq |
| << " --> " << Freqs[BB] << "\n"); |
| } |
| |
| /// divBlockFreq - Divide BB block frequency by PROB. If Prob = 0 do nothing. |
| /// |
| void divBlockFreq(BlockT *BB, BranchProbability Prob) { |
| uint64_t N = Prob.getNumerator(); |
| assert(N && "Illegal division by zero!"); |
| uint64_t D = Prob.getDenominator(); |
| uint64_t Freq = (Freqs[BB].getFrequency() * D) / N; |
| |
| // Should we assert it? |
| if (Freq > UINT32_MAX) |
| Freq = UINT32_MAX; |
| |
| Freqs[BB] = BlockFrequency(Freq); |
| DEBUG(dbgs() << "Frequency(" << getBlockName(BB) << ") /= (" << Prob |
| << ") --> " << Freqs[BB] << "\n"); |
| } |
| |
| // All blocks in postorder. |
| std::vector<BlockT *> POT; |
| |
| // Map Block -> Position in reverse-postorder list. |
| DenseMap<BlockT *, unsigned> RPO; |
| |
| // Cycle Probability for each bloch. |
| DenseMap<BlockT *, uint32_t> CycleProb; |
| |
| // (reverse-)postorder traversal iterators. |
| typedef typename std::vector<BlockT *>::iterator pot_iterator; |
| typedef typename std::vector<BlockT *>::reverse_iterator rpot_iterator; |
| |
| pot_iterator pot_begin() { return POT.begin(); } |
| pot_iterator pot_end() { return POT.end(); } |
| |
| rpot_iterator rpot_begin() { return POT.rbegin(); } |
| rpot_iterator rpot_end() { return POT.rend(); } |
| |
| rpot_iterator rpot_at(BlockT *BB) { |
| rpot_iterator I = rpot_begin(); |
| unsigned idx = RPO[BB]; |
| assert(idx); |
| std::advance(I, idx - 1); |
| |
| assert(*I == BB); |
| return I; |
| } |
| |
| |
| /// isReachable - Returns if BB block is reachable from the entry. |
| /// |
| bool isReachable(BlockT *BB) { |
| return RPO.count(BB); |
| } |
| |
| /// isBackedge - Return if edge Src -> Dst is a backedge. |
| /// |
| bool isBackedge(BlockT *Src, BlockT *Dst) { |
| assert(isReachable(Src)); |
| assert(isReachable(Dst)); |
| |
| unsigned a = RPO[Src]; |
| unsigned b = RPO[Dst]; |
| |
| return a >= b; |
| } |
| |
| /// getSingleBlockPred - return single BB block predecessor or NULL if |
| /// BB has none or more predecessors. |
| BlockT *getSingleBlockPred(BlockT *BB) { |
| typename GT::ChildIteratorType |
| PI = GraphTraits< Inverse<BlockT *> >::child_begin(BB), |
| PE = GraphTraits< Inverse<BlockT *> >::child_end(BB); |
| |
| if (PI == PE) |
| return 0; |
| |
| BlockT *Pred = *PI; |
| |
| ++PI; |
| if (PI != PE) |
| return 0; |
| |
| return Pred; |
| } |
| |
| void doBlock(BlockT *BB, BlockT *LoopHead, |
| SmallPtrSet<BlockT *, 8> &BlocksInLoop) { |
| |
| DEBUG(dbgs() << "doBlock(" << getBlockName(BB) << ")\n"); |
| setBlockFreq(BB, 0); |
| |
| if (BB == LoopHead) { |
| setBlockFreq(BB, EntryFreq); |
| return; |
| } |
| |
| if(BlockT *Pred = getSingleBlockPred(BB)) { |
| if (BlocksInLoop.count(Pred)) |
| setBlockFreq(BB, getEdgeFreq(Pred, BB)); |
| // TODO: else? irreducible, ignore it for now. |
| return; |
| } |
| |
| bool isInLoop = false; |
| bool isLoopHead = false; |
| |
| for (typename GT::ChildIteratorType |
| PI = GraphTraits< Inverse<BlockT *> >::child_begin(BB), |
| PE = GraphTraits< Inverse<BlockT *> >::child_end(BB); |
| PI != PE; ++PI) { |
| BlockT *Pred = *PI; |
| |
| if (isReachable(Pred) && isBackedge(Pred, BB)) { |
| isLoopHead = true; |
| } else if (BlocksInLoop.count(Pred)) { |
| incBlockFreq(BB, getEdgeFreq(Pred, BB)); |
| isInLoop = true; |
| } |
| // TODO: else? irreducible. |
| } |
| |
| if (!isInLoop) |
| return; |
| |
| if (!isLoopHead) |
| return; |
| |
| assert(EntryFreq >= CycleProb[BB]); |
| uint32_t CProb = CycleProb[BB]; |
| uint32_t Numerator = EntryFreq - CProb ? EntryFreq - CProb : 1; |
| divBlockFreq(BB, BranchProbability(Numerator, EntryFreq)); |
| } |
| |
| /// doLoop - Propagate block frequency down throught the loop. |
| void doLoop(BlockT *Head, BlockT *Tail) { |
| DEBUG(dbgs() << "doLoop(" << getBlockName(Head) << ", " |
| << getBlockName(Tail) << ")\n"); |
| |
| SmallPtrSet<BlockT *, 8> BlocksInLoop; |
| |
| for (rpot_iterator I = rpot_at(Head), E = rpot_at(Tail); ; ++I) { |
| BlockT *BB = *I; |
| doBlock(BB, Head, BlocksInLoop); |
| |
| BlocksInLoop.insert(BB); |
| if (I == E) |
| break; |
| } |
| |
| // Compute loop's cyclic probability using backedges probabilities. |
| for (typename GT::ChildIteratorType |
| PI = GraphTraits< Inverse<BlockT *> >::child_begin(Head), |
| PE = GraphTraits< Inverse<BlockT *> >::child_end(Head); |
| PI != PE; ++PI) { |
| BlockT *Pred = *PI; |
| assert(Pred); |
| if (isReachable(Pred) && isBackedge(Pred, Head)) { |
| uint64_t N = getEdgeFreq(Pred, Head).getFrequency(); |
| uint64_t D = getBlockFreq(Head).getFrequency(); |
| assert(N <= EntryFreq && "Backedge frequency must be <= EntryFreq!"); |
| uint64_t Res = (N * EntryFreq) / D; |
| |
| assert(Res <= UINT32_MAX); |
| CycleProb[Head] += (uint32_t) Res; |
| DEBUG(dbgs() << " CycleProb[" << getBlockName(Head) << "] += " << Res |
| << " --> " << CycleProb[Head] << "\n"); |
| } |
| } |
| } |
| |
| friend class BlockFrequencyInfo; |
| friend class MachineBlockFrequencyInfo; |
| |
| BlockFrequencyImpl() : EntryFreq(BlockFrequency::getEntryFrequency()) { } |
| |
| void doFunction(FunctionT *fn, BlockProbInfoT *bpi) { |
| Fn = fn; |
| BPI = bpi; |
| |
| // Clear everything. |
| RPO.clear(); |
| POT.clear(); |
| CycleProb.clear(); |
| Freqs.clear(); |
| |
| BlockT *EntryBlock = fn->begin(); |
| |
| copy(po_begin(EntryBlock), po_end(EntryBlock), back_inserter(POT)); |
| |
| unsigned RPOidx = 0; |
| for (rpot_iterator I = rpot_begin(), E = rpot_end(); I != E; ++I) { |
| BlockT *BB = *I; |
| RPO[BB] = ++RPOidx; |
| DEBUG(dbgs() << "RPO[" << getBlockName(BB) << "] = " << RPO[BB] << "\n"); |
| } |
| |
| // Travel over all blocks in postorder. |
| for (pot_iterator I = pot_begin(), E = pot_end(); I != E; ++I) { |
| BlockT *BB = *I; |
| BlockT *LastTail = 0; |
| DEBUG(dbgs() << "POT: " << getBlockName(BB) << "\n"); |
| |
| for (typename GT::ChildIteratorType |
| PI = GraphTraits< Inverse<BlockT *> >::child_begin(BB), |
| PE = GraphTraits< Inverse<BlockT *> >::child_end(BB); |
| PI != PE; ++PI) { |
| |
| BlockT *Pred = *PI; |
| if (isReachable(Pred) && isBackedge(Pred, BB) |
| && (!LastTail || RPO[Pred] > RPO[LastTail])) |
| LastTail = Pred; |
| } |
| |
| if (LastTail) |
| doLoop(BB, LastTail); |
| } |
| |
| // At the end assume the whole function as a loop, and travel over it once |
| // again. |
| doLoop(*(rpot_begin()), *(pot_begin())); |
| } |
| |
| public: |
| /// getBlockFreq - Return block frequency. Return 0 if we don't have it. |
| BlockFrequency getBlockFreq(BlockT *BB) const { |
| typename DenseMap<BlockT *, BlockFrequency>::const_iterator I = Freqs.find(BB); |
| if (I != Freqs.end()) |
| return I->second; |
| return 0; |
| } |
| |
| void print(raw_ostream &OS) const { |
| OS << "\n\n---- Block Freqs ----\n"; |
| for (typename FunctionT::iterator I = Fn->begin(), E = Fn->end(); I != E;) { |
| BlockT *BB = I++; |
| OS << " " << getBlockName(BB) << " = " << getBlockFreq(BB) << "\n"; |
| |
| for (typename GraphTraits<BlockT *>::ChildIteratorType |
| SI = GraphTraits<BlockT *>::child_begin(BB), |
| SE = GraphTraits<BlockT *>::child_end(BB); SI != SE; ++SI) { |
| BlockT *Succ = *SI; |
| OS << " " << getBlockName(BB) << " -> " << getBlockName(Succ) |
| << " = " << getEdgeFreq(BB, Succ) << "\n"; |
| } |
| } |
| } |
| |
| void dump() const { |
| print(dbgs()); |
| } |
| }; |
| |
| } |
| |
| #endif |