1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045 |
- //===- BranchProbabilityInfo.cpp - Branch Probability Analysis ------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // Loops should be simplified before this analysis.
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/Analysis/BranchProbabilityInfo.h"
- #include "llvm/ADT/PostOrderIterator.h"
- #include "llvm/ADT/SCCIterator.h"
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/ADT/SmallVector.h"
- #include "llvm/Analysis/LoopInfo.h"
- #include "llvm/Analysis/TargetLibraryInfo.h"
- #include "llvm/IR/Attributes.h"
- #include "llvm/IR/BasicBlock.h"
- #include "llvm/IR/CFG.h"
- #include "llvm/IR/Constants.h"
- #include "llvm/IR/Dominators.h"
- #include "llvm/IR/Function.h"
- #include "llvm/IR/InstrTypes.h"
- #include "llvm/IR/Instruction.h"
- #include "llvm/IR/Instructions.h"
- #include "llvm/IR/LLVMContext.h"
- #include "llvm/IR/Metadata.h"
- #include "llvm/IR/PassManager.h"
- #include "llvm/IR/Type.h"
- #include "llvm/IR/Value.h"
- #include "llvm/Pass.h"
- #include "llvm/Support/BranchProbability.h"
- #include "llvm/Support/Casting.h"
- #include "llvm/Support/Debug.h"
- #include "llvm/Support/raw_ostream.h"
- #include <cassert>
- #include <cstdint>
- #include <iterator>
- #include <utility>
- using namespace llvm;
- #define DEBUG_TYPE "branch-prob"
- static cl::opt<bool> PrintBranchProb(
- "print-bpi", cl::init(false), cl::Hidden,
- cl::desc("Print the branch probability info."));
- cl::opt<std::string> PrintBranchProbFuncName(
- "print-bpi-func-name", cl::Hidden,
- cl::desc("The option to specify the name of the function "
- "whose branch probability info is printed."));
- INITIALIZE_PASS_BEGIN(BranchProbabilityInfoWrapperPass, "branch-prob",
- "Branch Probability Analysis", false, true)
- INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
- INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
- INITIALIZE_PASS_END(BranchProbabilityInfoWrapperPass, "branch-prob",
- "Branch Probability Analysis", false, true)
- char BranchProbabilityInfoWrapperPass::ID = 0;
- // Weights are for internal use only. They are used by heuristics to help to
- // estimate edges' probability. Example:
- //
- // Using "Loop Branch Heuristics" we predict weights of edges for the
- // block BB2.
- // ...
- // |
- // V
- // BB1<-+
- // | |
- // | | (Weight = 124)
- // V |
- // BB2--+
- // |
- // | (Weight = 4)
- // V
- // BB3
- //
- // Probability of the edge BB2->BB1 = 124 / (124 + 4) = 0.96875
- // Probability of the edge BB2->BB3 = 4 / (124 + 4) = 0.03125
- static const uint32_t LBH_TAKEN_WEIGHT = 124;
- static const uint32_t LBH_NONTAKEN_WEIGHT = 4;
- // Unlikely edges within a loop are half as likely as other edges
- static const uint32_t LBH_UNLIKELY_WEIGHT = 62;
- /// Unreachable-terminating branch taken probability.
- ///
- /// This is the probability for a branch being taken to a block that terminates
- /// (eventually) in unreachable. These are predicted as unlikely as possible.
- /// All reachable probability will equally share the remaining part.
- static const BranchProbability UR_TAKEN_PROB = BranchProbability::getRaw(1);
- /// Weight for a branch taken going into a cold block.
- ///
- /// This is the weight for a branch taken toward a block marked
- /// cold. A block is marked cold if it's postdominated by a
- /// block containing a call to a cold function. Cold functions
- /// are those marked with attribute 'cold'.
- static const uint32_t CC_TAKEN_WEIGHT = 4;
- /// Weight for a branch not-taken into a cold block.
- ///
- /// This is the weight for a branch not taken toward a block marked
- /// cold.
- static const uint32_t CC_NONTAKEN_WEIGHT = 64;
- static const uint32_t PH_TAKEN_WEIGHT = 20;
- static const uint32_t PH_NONTAKEN_WEIGHT = 12;
- static const uint32_t ZH_TAKEN_WEIGHT = 20;
- static const uint32_t ZH_NONTAKEN_WEIGHT = 12;
- static const uint32_t FPH_TAKEN_WEIGHT = 20;
- static const uint32_t FPH_NONTAKEN_WEIGHT = 12;
- /// Invoke-terminating normal branch taken weight
- ///
- /// This is the weight for branching to the normal destination of an invoke
- /// instruction. We expect this to happen most of the time. Set the weight to an
- /// absurdly high value so that nested loops subsume it.
- static const uint32_t IH_TAKEN_WEIGHT = 1024 * 1024 - 1;
- /// Invoke-terminating normal branch not-taken weight.
- ///
- /// This is the weight for branching to the unwind destination of an invoke
- /// instruction. This is essentially never taken.
- static const uint32_t IH_NONTAKEN_WEIGHT = 1;
- /// Add \p BB to PostDominatedByUnreachable set if applicable.
- void
- BranchProbabilityInfo::updatePostDominatedByUnreachable(const BasicBlock *BB) {
- const Instruction *TI = BB->getTerminator();
- if (TI->getNumSuccessors() == 0) {
- if (isa<UnreachableInst>(TI) ||
- // If this block is terminated by a call to
- // @llvm.experimental.deoptimize then treat it like an unreachable since
- // the @llvm.experimental.deoptimize call is expected to practically
- // never execute.
- BB->getTerminatingDeoptimizeCall())
- PostDominatedByUnreachable.insert(BB);
- return;
- }
- // If the terminator is an InvokeInst, check only the normal destination block
- // as the unwind edge of InvokeInst is also very unlikely taken.
- if (auto *II = dyn_cast<InvokeInst>(TI)) {
- if (PostDominatedByUnreachable.count(II->getNormalDest()))
- PostDominatedByUnreachable.insert(BB);
- return;
- }
- for (auto *I : successors(BB))
- // If any of successor is not post dominated then BB is also not.
- if (!PostDominatedByUnreachable.count(I))
- return;
- PostDominatedByUnreachable.insert(BB);
- }
- /// Add \p BB to PostDominatedByColdCall set if applicable.
- void
- BranchProbabilityInfo::updatePostDominatedByColdCall(const BasicBlock *BB) {
- assert(!PostDominatedByColdCall.count(BB));
- const Instruction *TI = BB->getTerminator();
- if (TI->getNumSuccessors() == 0)
- return;
- // If all of successor are post dominated then BB is also done.
- if (llvm::all_of(successors(BB), [&](const BasicBlock *SuccBB) {
- return PostDominatedByColdCall.count(SuccBB);
- })) {
- PostDominatedByColdCall.insert(BB);
- return;
- }
- // If the terminator is an InvokeInst, check only the normal destination
- // block as the unwind edge of InvokeInst is also very unlikely taken.
- if (auto *II = dyn_cast<InvokeInst>(TI))
- if (PostDominatedByColdCall.count(II->getNormalDest())) {
- PostDominatedByColdCall.insert(BB);
- return;
- }
- // Otherwise, if the block itself contains a cold function, add it to the
- // set of blocks post-dominated by a cold call.
- for (auto &I : *BB)
- if (const CallInst *CI = dyn_cast<CallInst>(&I))
- if (CI->hasFnAttr(Attribute::Cold)) {
- PostDominatedByColdCall.insert(BB);
- return;
- }
- }
- /// Calculate edge weights for successors lead to unreachable.
- ///
- /// Predict that a successor which leads necessarily to an
- /// unreachable-terminated block as extremely unlikely.
- bool BranchProbabilityInfo::calcUnreachableHeuristics(const BasicBlock *BB) {
- const Instruction *TI = BB->getTerminator();
- (void) TI;
- assert(TI->getNumSuccessors() > 1 && "expected more than one successor!");
- assert(!isa<InvokeInst>(TI) &&
- "Invokes should have already been handled by calcInvokeHeuristics");
- SmallVector<unsigned, 4> UnreachableEdges;
- SmallVector<unsigned, 4> ReachableEdges;
- for (succ_const_iterator I = succ_begin(BB), E = succ_end(BB); I != E; ++I)
- if (PostDominatedByUnreachable.count(*I))
- UnreachableEdges.push_back(I.getSuccessorIndex());
- else
- ReachableEdges.push_back(I.getSuccessorIndex());
- // Skip probabilities if all were reachable.
- if (UnreachableEdges.empty())
- return false;
- if (ReachableEdges.empty()) {
- BranchProbability Prob(1, UnreachableEdges.size());
- for (unsigned SuccIdx : UnreachableEdges)
- setEdgeProbability(BB, SuccIdx, Prob);
- return true;
- }
- auto UnreachableProb = UR_TAKEN_PROB;
- auto ReachableProb =
- (BranchProbability::getOne() - UR_TAKEN_PROB * UnreachableEdges.size()) /
- ReachableEdges.size();
- for (unsigned SuccIdx : UnreachableEdges)
- setEdgeProbability(BB, SuccIdx, UnreachableProb);
- for (unsigned SuccIdx : ReachableEdges)
- setEdgeProbability(BB, SuccIdx, ReachableProb);
- return true;
- }
- // Propagate existing explicit probabilities from either profile data or
- // 'expect' intrinsic processing. Examine metadata against unreachable
- // heuristic. The probability of the edge coming to unreachable block is
- // set to min of metadata and unreachable heuristic.
- bool BranchProbabilityInfo::calcMetadataWeights(const BasicBlock *BB) {
- const Instruction *TI = BB->getTerminator();
- assert(TI->getNumSuccessors() > 1 && "expected more than one successor!");
- if (!(isa<BranchInst>(TI) || isa<SwitchInst>(TI) || isa<IndirectBrInst>(TI)))
- return false;
- MDNode *WeightsNode = TI->getMetadata(LLVMContext::MD_prof);
- if (!WeightsNode)
- return false;
- // Check that the number of successors is manageable.
- assert(TI->getNumSuccessors() < UINT32_MAX && "Too many successors");
- // Ensure there are weights for all of the successors. Note that the first
- // operand to the metadata node is a name, not a weight.
- if (WeightsNode->getNumOperands() != TI->getNumSuccessors() + 1)
- return false;
- // Build up the final weights that will be used in a temporary buffer.
- // Compute the sum of all weights to later decide whether they need to
- // be scaled to fit in 32 bits.
- uint64_t WeightSum = 0;
- SmallVector<uint32_t, 2> Weights;
- SmallVector<unsigned, 2> UnreachableIdxs;
- SmallVector<unsigned, 2> ReachableIdxs;
- Weights.reserve(TI->getNumSuccessors());
- for (unsigned i = 1, e = WeightsNode->getNumOperands(); i != e; ++i) {
- ConstantInt *Weight =
- mdconst::dyn_extract<ConstantInt>(WeightsNode->getOperand(i));
- if (!Weight)
- return false;
- assert(Weight->getValue().getActiveBits() <= 32 &&
- "Too many bits for uint32_t");
- Weights.push_back(Weight->getZExtValue());
- WeightSum += Weights.back();
- if (PostDominatedByUnreachable.count(TI->getSuccessor(i - 1)))
- UnreachableIdxs.push_back(i - 1);
- else
- ReachableIdxs.push_back(i - 1);
- }
- assert(Weights.size() == TI->getNumSuccessors() && "Checked above");
- // If the sum of weights does not fit in 32 bits, scale every weight down
- // accordingly.
- uint64_t ScalingFactor =
- (WeightSum > UINT32_MAX) ? WeightSum / UINT32_MAX + 1 : 1;
- if (ScalingFactor > 1) {
- WeightSum = 0;
- for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i) {
- Weights[i] /= ScalingFactor;
- WeightSum += Weights[i];
- }
- }
- assert(WeightSum <= UINT32_MAX &&
- "Expected weights to scale down to 32 bits");
- if (WeightSum == 0 || ReachableIdxs.size() == 0) {
- for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i)
- Weights[i] = 1;
- WeightSum = TI->getNumSuccessors();
- }
- // Set the probability.
- SmallVector<BranchProbability, 2> BP;
- for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i)
- BP.push_back({ Weights[i], static_cast<uint32_t>(WeightSum) });
- // Examine the metadata against unreachable heuristic.
- // If the unreachable heuristic is more strong then we use it for this edge.
- if (UnreachableIdxs.size() > 0 && ReachableIdxs.size() > 0) {
- auto ToDistribute = BranchProbability::getZero();
- auto UnreachableProb = UR_TAKEN_PROB;
- for (auto i : UnreachableIdxs)
- if (UnreachableProb < BP[i]) {
- ToDistribute += BP[i] - UnreachableProb;
- BP[i] = UnreachableProb;
- }
- // If we modified the probability of some edges then we must distribute
- // the difference between reachable blocks.
- if (ToDistribute > BranchProbability::getZero()) {
- BranchProbability PerEdge = ToDistribute / ReachableIdxs.size();
- for (auto i : ReachableIdxs)
- BP[i] += PerEdge;
- }
- }
- for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i)
- setEdgeProbability(BB, i, BP[i]);
- return true;
- }
- /// Calculate edge weights for edges leading to cold blocks.
- ///
- /// A cold block is one post-dominated by a block with a call to a
- /// cold function. Those edges are unlikely to be taken, so we give
- /// them relatively low weight.
- ///
- /// Return true if we could compute the weights for cold edges.
- /// Return false, otherwise.
- bool BranchProbabilityInfo::calcColdCallHeuristics(const BasicBlock *BB) {
- const Instruction *TI = BB->getTerminator();
- (void) TI;
- assert(TI->getNumSuccessors() > 1 && "expected more than one successor!");
- assert(!isa<InvokeInst>(TI) &&
- "Invokes should have already been handled by calcInvokeHeuristics");
- // Determine which successors are post-dominated by a cold block.
- SmallVector<unsigned, 4> ColdEdges;
- SmallVector<unsigned, 4> NormalEdges;
- for (succ_const_iterator I = succ_begin(BB), E = succ_end(BB); I != E; ++I)
- if (PostDominatedByColdCall.count(*I))
- ColdEdges.push_back(I.getSuccessorIndex());
- else
- NormalEdges.push_back(I.getSuccessorIndex());
- // Skip probabilities if no cold edges.
- if (ColdEdges.empty())
- return false;
- if (NormalEdges.empty()) {
- BranchProbability Prob(1, ColdEdges.size());
- for (unsigned SuccIdx : ColdEdges)
- setEdgeProbability(BB, SuccIdx, Prob);
- return true;
- }
- auto ColdProb = BranchProbability::getBranchProbability(
- CC_TAKEN_WEIGHT,
- (CC_TAKEN_WEIGHT + CC_NONTAKEN_WEIGHT) * uint64_t(ColdEdges.size()));
- auto NormalProb = BranchProbability::getBranchProbability(
- CC_NONTAKEN_WEIGHT,
- (CC_TAKEN_WEIGHT + CC_NONTAKEN_WEIGHT) * uint64_t(NormalEdges.size()));
- for (unsigned SuccIdx : ColdEdges)
- setEdgeProbability(BB, SuccIdx, ColdProb);
- for (unsigned SuccIdx : NormalEdges)
- setEdgeProbability(BB, SuccIdx, NormalProb);
- return true;
- }
- // Calculate Edge Weights using "Pointer Heuristics". Predict a comparison
- // between two pointer or pointer and NULL will fail.
- bool BranchProbabilityInfo::calcPointerHeuristics(const BasicBlock *BB) {
- const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator());
- if (!BI || !BI->isConditional())
- return false;
- Value *Cond = BI->getCondition();
- ICmpInst *CI = dyn_cast<ICmpInst>(Cond);
- if (!CI || !CI->isEquality())
- return false;
- Value *LHS = CI->getOperand(0);
- if (!LHS->getType()->isPointerTy())
- return false;
- assert(CI->getOperand(1)->getType()->isPointerTy());
- // p != 0 -> isProb = true
- // p == 0 -> isProb = false
- // p != q -> isProb = true
- // p == q -> isProb = false;
- unsigned TakenIdx = 0, NonTakenIdx = 1;
- bool isProb = CI->getPredicate() == ICmpInst::ICMP_NE;
- if (!isProb)
- std::swap(TakenIdx, NonTakenIdx);
- BranchProbability TakenProb(PH_TAKEN_WEIGHT,
- PH_TAKEN_WEIGHT + PH_NONTAKEN_WEIGHT);
- setEdgeProbability(BB, TakenIdx, TakenProb);
- setEdgeProbability(BB, NonTakenIdx, TakenProb.getCompl());
- return true;
- }
- static int getSCCNum(const BasicBlock *BB,
- const BranchProbabilityInfo::SccInfo &SccI) {
- auto SccIt = SccI.SccNums.find(BB);
- if (SccIt == SccI.SccNums.end())
- return -1;
- return SccIt->second;
- }
- // Consider any block that is an entry point to the SCC as a header.
- static bool isSCCHeader(const BasicBlock *BB, int SccNum,
- BranchProbabilityInfo::SccInfo &SccI) {
- assert(getSCCNum(BB, SccI) == SccNum);
- // Lazily compute the set of headers for a given SCC and cache the results
- // in the SccHeaderMap.
- if (SccI.SccHeaders.size() <= static_cast<unsigned>(SccNum))
- SccI.SccHeaders.resize(SccNum + 1);
- auto &HeaderMap = SccI.SccHeaders[SccNum];
- bool Inserted;
- BranchProbabilityInfo::SccHeaderMap::iterator HeaderMapIt;
- std::tie(HeaderMapIt, Inserted) = HeaderMap.insert(std::make_pair(BB, false));
- if (Inserted) {
- bool IsHeader = llvm::any_of(make_range(pred_begin(BB), pred_end(BB)),
- [&](const BasicBlock *Pred) {
- return getSCCNum(Pred, SccI) != SccNum;
- });
- HeaderMapIt->second = IsHeader;
- return IsHeader;
- } else
- return HeaderMapIt->second;
- }
- // Compute the unlikely successors to the block BB in the loop L, specifically
- // those that are unlikely because this is a loop, and add them to the
- // UnlikelyBlocks set.
- static void
- computeUnlikelySuccessors(const BasicBlock *BB, Loop *L,
- SmallPtrSetImpl<const BasicBlock*> &UnlikelyBlocks) {
- // Sometimes in a loop we have a branch whose condition is made false by
- // taking it. This is typically something like
- // int n = 0;
- // while (...) {
- // if (++n >= MAX) {
- // n = 0;
- // }
- // }
- // In this sort of situation taking the branch means that at the very least it
- // won't be taken again in the next iteration of the loop, so we should
- // consider it less likely than a typical branch.
- //
- // We detect this by looking back through the graph of PHI nodes that sets the
- // value that the condition depends on, and seeing if we can reach a successor
- // block which can be determined to make the condition false.
- //
- // FIXME: We currently consider unlikely blocks to be half as likely as other
- // blocks, but if we consider the example above the likelyhood is actually
- // 1/MAX. We could therefore be more precise in how unlikely we consider
- // blocks to be, but it would require more careful examination of the form
- // of the comparison expression.
- const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator());
- if (!BI || !BI->isConditional())
- return;
- // Check if the branch is based on an instruction compared with a constant
- CmpInst *CI = dyn_cast<CmpInst>(BI->getCondition());
- if (!CI || !isa<Instruction>(CI->getOperand(0)) ||
- !isa<Constant>(CI->getOperand(1)))
- return;
- // Either the instruction must be a PHI, or a chain of operations involving
- // constants that ends in a PHI which we can then collapse into a single value
- // if the PHI value is known.
- Instruction *CmpLHS = dyn_cast<Instruction>(CI->getOperand(0));
- PHINode *CmpPHI = dyn_cast<PHINode>(CmpLHS);
- Constant *CmpConst = dyn_cast<Constant>(CI->getOperand(1));
- // Collect the instructions until we hit a PHI
- SmallVector<BinaryOperator *, 1> InstChain;
- while (!CmpPHI && CmpLHS && isa<BinaryOperator>(CmpLHS) &&
- isa<Constant>(CmpLHS->getOperand(1))) {
- // Stop if the chain extends outside of the loop
- if (!L->contains(CmpLHS))
- return;
- InstChain.push_back(cast<BinaryOperator>(CmpLHS));
- CmpLHS = dyn_cast<Instruction>(CmpLHS->getOperand(0));
- if (CmpLHS)
- CmpPHI = dyn_cast<PHINode>(CmpLHS);
- }
- if (!CmpPHI || !L->contains(CmpPHI))
- return;
- // Trace the phi node to find all values that come from successors of BB
- SmallPtrSet<PHINode*, 8> VisitedInsts;
- SmallVector<PHINode*, 8> WorkList;
- WorkList.push_back(CmpPHI);
- VisitedInsts.insert(CmpPHI);
- while (!WorkList.empty()) {
- PHINode *P = WorkList.back();
- WorkList.pop_back();
- for (BasicBlock *B : P->blocks()) {
- // Skip blocks that aren't part of the loop
- if (!L->contains(B))
- continue;
- Value *V = P->getIncomingValueForBlock(B);
- // If the source is a PHI add it to the work list if we haven't
- // already visited it.
- if (PHINode *PN = dyn_cast<PHINode>(V)) {
- if (VisitedInsts.insert(PN).second)
- WorkList.push_back(PN);
- continue;
- }
- // If this incoming value is a constant and B is a successor of BB, then
- // we can constant-evaluate the compare to see if it makes the branch be
- // taken or not.
- Constant *CmpLHSConst = dyn_cast<Constant>(V);
- if (!CmpLHSConst ||
- std::find(succ_begin(BB), succ_end(BB), B) == succ_end(BB))
- continue;
- // First collapse InstChain
- for (Instruction *I : llvm::reverse(InstChain)) {
- CmpLHSConst = ConstantExpr::get(I->getOpcode(), CmpLHSConst,
- cast<Constant>(I->getOperand(1)), true);
- if (!CmpLHSConst)
- break;
- }
- if (!CmpLHSConst)
- continue;
- // Now constant-evaluate the compare
- Constant *Result = ConstantExpr::getCompare(CI->getPredicate(),
- CmpLHSConst, CmpConst, true);
- // If the result means we don't branch to the block then that block is
- // unlikely.
- if (Result &&
- ((Result->isZeroValue() && B == BI->getSuccessor(0)) ||
- (Result->isOneValue() && B == BI->getSuccessor(1))))
- UnlikelyBlocks.insert(B);
- }
- }
- }
- // Calculate Edge Weights using "Loop Branch Heuristics". Predict backedges
- // as taken, exiting edges as not-taken.
- bool BranchProbabilityInfo::calcLoopBranchHeuristics(const BasicBlock *BB,
- const LoopInfo &LI,
- SccInfo &SccI) {
- int SccNum;
- Loop *L = LI.getLoopFor(BB);
- if (!L) {
- SccNum = getSCCNum(BB, SccI);
- if (SccNum < 0)
- return false;
- }
- SmallPtrSet<const BasicBlock*, 8> UnlikelyBlocks;
- if (L)
- computeUnlikelySuccessors(BB, L, UnlikelyBlocks);
- SmallVector<unsigned, 8> BackEdges;
- SmallVector<unsigned, 8> ExitingEdges;
- SmallVector<unsigned, 8> InEdges; // Edges from header to the loop.
- SmallVector<unsigned, 8> UnlikelyEdges;
- for (succ_const_iterator I = succ_begin(BB), E = succ_end(BB); I != E; ++I) {
- // Use LoopInfo if we have it, otherwise fall-back to SCC info to catch
- // irreducible loops.
- if (L) {
- if (UnlikelyBlocks.count(*I) != 0)
- UnlikelyEdges.push_back(I.getSuccessorIndex());
- else if (!L->contains(*I))
- ExitingEdges.push_back(I.getSuccessorIndex());
- else if (L->getHeader() == *I)
- BackEdges.push_back(I.getSuccessorIndex());
- else
- InEdges.push_back(I.getSuccessorIndex());
- } else {
- if (getSCCNum(*I, SccI) != SccNum)
- ExitingEdges.push_back(I.getSuccessorIndex());
- else if (isSCCHeader(*I, SccNum, SccI))
- BackEdges.push_back(I.getSuccessorIndex());
- else
- InEdges.push_back(I.getSuccessorIndex());
- }
- }
- if (BackEdges.empty() && ExitingEdges.empty() && UnlikelyEdges.empty())
- return false;
- // Collect the sum of probabilities of back-edges/in-edges/exiting-edges, and
- // normalize them so that they sum up to one.
- unsigned Denom = (BackEdges.empty() ? 0 : LBH_TAKEN_WEIGHT) +
- (InEdges.empty() ? 0 : LBH_TAKEN_WEIGHT) +
- (UnlikelyEdges.empty() ? 0 : LBH_UNLIKELY_WEIGHT) +
- (ExitingEdges.empty() ? 0 : LBH_NONTAKEN_WEIGHT);
- if (uint32_t numBackEdges = BackEdges.size()) {
- BranchProbability TakenProb = BranchProbability(LBH_TAKEN_WEIGHT, Denom);
- auto Prob = TakenProb / numBackEdges;
- for (unsigned SuccIdx : BackEdges)
- setEdgeProbability(BB, SuccIdx, Prob);
- }
- if (uint32_t numInEdges = InEdges.size()) {
- BranchProbability TakenProb = BranchProbability(LBH_TAKEN_WEIGHT, Denom);
- auto Prob = TakenProb / numInEdges;
- for (unsigned SuccIdx : InEdges)
- setEdgeProbability(BB, SuccIdx, Prob);
- }
- if (uint32_t numExitingEdges = ExitingEdges.size()) {
- BranchProbability NotTakenProb = BranchProbability(LBH_NONTAKEN_WEIGHT,
- Denom);
- auto Prob = NotTakenProb / numExitingEdges;
- for (unsigned SuccIdx : ExitingEdges)
- setEdgeProbability(BB, SuccIdx, Prob);
- }
- if (uint32_t numUnlikelyEdges = UnlikelyEdges.size()) {
- BranchProbability UnlikelyProb = BranchProbability(LBH_UNLIKELY_WEIGHT,
- Denom);
- auto Prob = UnlikelyProb / numUnlikelyEdges;
- for (unsigned SuccIdx : UnlikelyEdges)
- setEdgeProbability(BB, SuccIdx, Prob);
- }
- return true;
- }
- bool BranchProbabilityInfo::calcZeroHeuristics(const BasicBlock *BB,
- const TargetLibraryInfo *TLI) {
- const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator());
- if (!BI || !BI->isConditional())
- return false;
- Value *Cond = BI->getCondition();
- ICmpInst *CI = dyn_cast<ICmpInst>(Cond);
- if (!CI)
- return false;
- auto GetConstantInt = [](Value *V) {
- if (auto *I = dyn_cast<BitCastInst>(V))
- return dyn_cast<ConstantInt>(I->getOperand(0));
- return dyn_cast<ConstantInt>(V);
- };
- Value *RHS = CI->getOperand(1);
- ConstantInt *CV = GetConstantInt(RHS);
- if (!CV)
- return false;
- // If the LHS is the result of AND'ing a value with a single bit bitmask,
- // we don't have information about probabilities.
- if (Instruction *LHS = dyn_cast<Instruction>(CI->getOperand(0)))
- if (LHS->getOpcode() == Instruction::And)
- if (ConstantInt *AndRHS = dyn_cast<ConstantInt>(LHS->getOperand(1)))
- if (AndRHS->getValue().isPowerOf2())
- return false;
- // Check if the LHS is the return value of a library function
- LibFunc Func = NumLibFuncs;
- if (TLI)
- if (CallInst *Call = dyn_cast<CallInst>(CI->getOperand(0)))
- if (Function *CalledFn = Call->getCalledFunction())
- TLI->getLibFunc(*CalledFn, Func);
- bool isProb;
- if (Func == LibFunc_strcasecmp ||
- Func == LibFunc_strcmp ||
- Func == LibFunc_strncasecmp ||
- Func == LibFunc_strncmp ||
- Func == LibFunc_memcmp) {
- // strcmp and similar functions return zero, negative, or positive, if the
- // first string is equal, less, or greater than the second. We consider it
- // likely that the strings are not equal, so a comparison with zero is
- // probably false, but also a comparison with any other number is also
- // probably false given that what exactly is returned for nonzero values is
- // not specified. Any kind of comparison other than equality we know
- // nothing about.
- switch (CI->getPredicate()) {
- case CmpInst::ICMP_EQ:
- isProb = false;
- break;
- case CmpInst::ICMP_NE:
- isProb = true;
- break;
- default:
- return false;
- }
- } else if (CV->isZero()) {
- switch (CI->getPredicate()) {
- case CmpInst::ICMP_EQ:
- // X == 0 -> Unlikely
- isProb = false;
- break;
- case CmpInst::ICMP_NE:
- // X != 0 -> Likely
- isProb = true;
- break;
- case CmpInst::ICMP_SLT:
- // X < 0 -> Unlikely
- isProb = false;
- break;
- case CmpInst::ICMP_SGT:
- // X > 0 -> Likely
- isProb = true;
- break;
- default:
- return false;
- }
- } else if (CV->isOne() && CI->getPredicate() == CmpInst::ICMP_SLT) {
- // InstCombine canonicalizes X <= 0 into X < 1.
- // X <= 0 -> Unlikely
- isProb = false;
- } else if (CV->isMinusOne()) {
- switch (CI->getPredicate()) {
- case CmpInst::ICMP_EQ:
- // X == -1 -> Unlikely
- isProb = false;
- break;
- case CmpInst::ICMP_NE:
- // X != -1 -> Likely
- isProb = true;
- break;
- case CmpInst::ICMP_SGT:
- // InstCombine canonicalizes X >= 0 into X > -1.
- // X >= 0 -> Likely
- isProb = true;
- break;
- default:
- return false;
- }
- } else {
- return false;
- }
- unsigned TakenIdx = 0, NonTakenIdx = 1;
- if (!isProb)
- std::swap(TakenIdx, NonTakenIdx);
- BranchProbability TakenProb(ZH_TAKEN_WEIGHT,
- ZH_TAKEN_WEIGHT + ZH_NONTAKEN_WEIGHT);
- setEdgeProbability(BB, TakenIdx, TakenProb);
- setEdgeProbability(BB, NonTakenIdx, TakenProb.getCompl());
- return true;
- }
- bool BranchProbabilityInfo::calcFloatingPointHeuristics(const BasicBlock *BB) {
- const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator());
- if (!BI || !BI->isConditional())
- return false;
- Value *Cond = BI->getCondition();
- FCmpInst *FCmp = dyn_cast<FCmpInst>(Cond);
- if (!FCmp)
- return false;
- bool isProb;
- if (FCmp->isEquality()) {
- // f1 == f2 -> Unlikely
- // f1 != f2 -> Likely
- isProb = !FCmp->isTrueWhenEqual();
- } else if (FCmp->getPredicate() == FCmpInst::FCMP_ORD) {
- // !isnan -> Likely
- isProb = true;
- } else if (FCmp->getPredicate() == FCmpInst::FCMP_UNO) {
- // isnan -> Unlikely
- isProb = false;
- } else {
- return false;
- }
- unsigned TakenIdx = 0, NonTakenIdx = 1;
- if (!isProb)
- std::swap(TakenIdx, NonTakenIdx);
- BranchProbability TakenProb(FPH_TAKEN_WEIGHT,
- FPH_TAKEN_WEIGHT + FPH_NONTAKEN_WEIGHT);
- setEdgeProbability(BB, TakenIdx, TakenProb);
- setEdgeProbability(BB, NonTakenIdx, TakenProb.getCompl());
- return true;
- }
- bool BranchProbabilityInfo::calcInvokeHeuristics(const BasicBlock *BB) {
- const InvokeInst *II = dyn_cast<InvokeInst>(BB->getTerminator());
- if (!II)
- return false;
- BranchProbability TakenProb(IH_TAKEN_WEIGHT,
- IH_TAKEN_WEIGHT + IH_NONTAKEN_WEIGHT);
- setEdgeProbability(BB, 0 /*Index for Normal*/, TakenProb);
- setEdgeProbability(BB, 1 /*Index for Unwind*/, TakenProb.getCompl());
- return true;
- }
- void BranchProbabilityInfo::releaseMemory() {
- Probs.clear();
- }
- void BranchProbabilityInfo::print(raw_ostream &OS) const {
- OS << "---- Branch Probabilities ----\n";
- // We print the probabilities from the last function the analysis ran over,
- // or the function it is currently running over.
- assert(LastF && "Cannot print prior to running over a function");
- for (const auto &BI : *LastF) {
- for (succ_const_iterator SI = succ_begin(&BI), SE = succ_end(&BI); SI != SE;
- ++SI) {
- printEdgeProbability(OS << " ", &BI, *SI);
- }
- }
- }
- bool BranchProbabilityInfo::
- isEdgeHot(const BasicBlock *Src, const BasicBlock *Dst) const {
- // Hot probability is at least 4/5 = 80%
- // FIXME: Compare against a static "hot" BranchProbability.
- return getEdgeProbability(Src, Dst) > BranchProbability(4, 5);
- }
- const BasicBlock *
- BranchProbabilityInfo::getHotSucc(const BasicBlock *BB) const {
- auto MaxProb = BranchProbability::getZero();
- const BasicBlock *MaxSucc = nullptr;
- for (succ_const_iterator I = succ_begin(BB), E = succ_end(BB); I != E; ++I) {
- const BasicBlock *Succ = *I;
- auto Prob = getEdgeProbability(BB, Succ);
- if (Prob > MaxProb) {
- MaxProb = Prob;
- MaxSucc = Succ;
- }
- }
- // Hot probability is at least 4/5 = 80%
- if (MaxProb > BranchProbability(4, 5))
- return MaxSucc;
- return nullptr;
- }
- /// Get the raw edge probability for the edge. If can't find it, return a
- /// default probability 1/N where N is the number of successors. Here an edge is
- /// specified using PredBlock and an
- /// index to the successors.
- BranchProbability
- BranchProbabilityInfo::getEdgeProbability(const BasicBlock *Src,
- unsigned IndexInSuccessors) const {
- auto I = Probs.find(std::make_pair(Src, IndexInSuccessors));
- if (I != Probs.end())
- return I->second;
- return {1, static_cast<uint32_t>(succ_size(Src))};
- }
- BranchProbability
- BranchProbabilityInfo::getEdgeProbability(const BasicBlock *Src,
- succ_const_iterator Dst) const {
- return getEdgeProbability(Src, Dst.getSuccessorIndex());
- }
- /// Get the raw edge probability calculated for the block pair. This returns the
- /// sum of all raw edge probabilities from Src to Dst.
- BranchProbability
- BranchProbabilityInfo::getEdgeProbability(const BasicBlock *Src,
- const BasicBlock *Dst) const {
- auto Prob = BranchProbability::getZero();
- bool FoundProb = false;
- for (succ_const_iterator I = succ_begin(Src), E = succ_end(Src); I != E; ++I)
- if (*I == Dst) {
- auto MapI = Probs.find(std::make_pair(Src, I.getSuccessorIndex()));
- if (MapI != Probs.end()) {
- FoundProb = true;
- Prob += MapI->second;
- }
- }
- uint32_t succ_num = std::distance(succ_begin(Src), succ_end(Src));
- return FoundProb ? Prob : BranchProbability(1, succ_num);
- }
- /// Set the edge probability for a given edge specified by PredBlock and an
- /// index to the successors.
- void BranchProbabilityInfo::setEdgeProbability(const BasicBlock *Src,
- unsigned IndexInSuccessors,
- BranchProbability Prob) {
- Probs[std::make_pair(Src, IndexInSuccessors)] = Prob;
- Handles.insert(BasicBlockCallbackVH(Src, this));
- LLVM_DEBUG(dbgs() << "set edge " << Src->getName() << " -> "
- << IndexInSuccessors << " successor probability to " << Prob
- << "\n");
- }
- raw_ostream &
- BranchProbabilityInfo::printEdgeProbability(raw_ostream &OS,
- const BasicBlock *Src,
- const BasicBlock *Dst) const {
- const BranchProbability Prob = getEdgeProbability(Src, Dst);
- OS << "edge " << Src->getName() << " -> " << Dst->getName()
- << " probability is " << Prob
- << (isEdgeHot(Src, Dst) ? " [HOT edge]\n" : "\n");
- return OS;
- }
- void BranchProbabilityInfo::eraseBlock(const BasicBlock *BB) {
- for (auto I = Probs.begin(), E = Probs.end(); I != E; ++I) {
- auto Key = I->first;
- if (Key.first == BB)
- Probs.erase(Key);
- }
- }
- void BranchProbabilityInfo::calculate(const Function &F, const LoopInfo &LI,
- const TargetLibraryInfo *TLI) {
- LLVM_DEBUG(dbgs() << "---- Branch Probability Info : " << F.getName()
- << " ----\n\n");
- LastF = &F; // Store the last function we ran on for printing.
- assert(PostDominatedByUnreachable.empty());
- assert(PostDominatedByColdCall.empty());
- // Record SCC numbers of blocks in the CFG to identify irreducible loops.
- // FIXME: We could only calculate this if the CFG is known to be irreducible
- // (perhaps cache this info in LoopInfo if we can easily calculate it there?).
- int SccNum = 0;
- SccInfo SccI;
- for (scc_iterator<const Function *> It = scc_begin(&F); !It.isAtEnd();
- ++It, ++SccNum) {
- // Ignore single-block SCCs since they either aren't loops or LoopInfo will
- // catch them.
- const std::vector<const BasicBlock *> &Scc = *It;
- if (Scc.size() == 1)
- continue;
- LLVM_DEBUG(dbgs() << "BPI: SCC " << SccNum << ":");
- for (auto *BB : Scc) {
- LLVM_DEBUG(dbgs() << " " << BB->getName());
- SccI.SccNums[BB] = SccNum;
- }
- LLVM_DEBUG(dbgs() << "\n");
- }
- // Walk the basic blocks in post-order so that we can build up state about
- // the successors of a block iteratively.
- for (auto BB : post_order(&F.getEntryBlock())) {
- LLVM_DEBUG(dbgs() << "Computing probabilities for " << BB->getName()
- << "\n");
- updatePostDominatedByUnreachable(BB);
- updatePostDominatedByColdCall(BB);
- // If there is no at least two successors, no sense to set probability.
- if (BB->getTerminator()->getNumSuccessors() < 2)
- continue;
- if (calcMetadataWeights(BB))
- continue;
- if (calcInvokeHeuristics(BB))
- continue;
- if (calcUnreachableHeuristics(BB))
- continue;
- if (calcColdCallHeuristics(BB))
- continue;
- if (calcLoopBranchHeuristics(BB, LI, SccI))
- continue;
- if (calcPointerHeuristics(BB))
- continue;
- if (calcZeroHeuristics(BB, TLI))
- continue;
- if (calcFloatingPointHeuristics(BB))
- continue;
- }
- PostDominatedByUnreachable.clear();
- PostDominatedByColdCall.clear();
- if (PrintBranchProb &&
- (PrintBranchProbFuncName.empty() ||
- F.getName().equals(PrintBranchProbFuncName))) {
- print(dbgs());
- }
- }
- void BranchProbabilityInfoWrapperPass::getAnalysisUsage(
- AnalysisUsage &AU) const {
- // We require DT so it's available when LI is available. The LI updating code
- // asserts that DT is also present so if we don't make sure that we have DT
- // here, that assert will trigger.
- AU.addRequired<DominatorTreeWrapperPass>();
- AU.addRequired<LoopInfoWrapperPass>();
- AU.addRequired<TargetLibraryInfoWrapperPass>();
- AU.setPreservesAll();
- }
- bool BranchProbabilityInfoWrapperPass::runOnFunction(Function &F) {
- const LoopInfo &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
- const TargetLibraryInfo &TLI =
- getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F);
- BPI.calculate(F, LI, &TLI);
- return false;
- }
- void BranchProbabilityInfoWrapperPass::releaseMemory() { BPI.releaseMemory(); }
- void BranchProbabilityInfoWrapperPass::print(raw_ostream &OS,
- const Module *) const {
- BPI.print(OS);
- }
- AnalysisKey BranchProbabilityAnalysis::Key;
- BranchProbabilityInfo
- BranchProbabilityAnalysis::run(Function &F, FunctionAnalysisManager &AM) {
- BranchProbabilityInfo BPI;
- BPI.calculate(F, AM.getResult<LoopAnalysis>(F), &AM.getResult<TargetLibraryAnalysis>(F));
- return BPI;
- }
- PreservedAnalyses
- BranchProbabilityPrinterPass::run(Function &F, FunctionAnalysisManager &AM) {
- OS << "Printing analysis results of BPI for function "
- << "'" << F.getName() << "':"
- << "\n";
- AM.getResult<BranchProbabilityAnalysis>(F).print(OS);
- return PreservedAnalyses::all();
- }
|