| //===- ProfileSummaryInfo.cpp - Global profile summary information --------===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file contains a pass that provides access to the global profile summary |
| // information. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "llvm/Analysis/ProfileSummaryInfo.h" |
| #include "llvm/Analysis/BlockFrequencyInfo.h" |
| #include "llvm/IR/BasicBlock.h" |
| #include "llvm/IR/CallSite.h" |
| #include "llvm/IR/Metadata.h" |
| #include "llvm/IR/Module.h" |
| #include "llvm/IR/ProfileSummary.h" |
| #include "llvm/InitializePasses.h" |
| #include "llvm/Support/CommandLine.h" |
| using namespace llvm; |
| |
| // The following two parameters determine the threshold for a count to be |
| // considered hot/cold. These two parameters are percentile values (multiplied |
| // by 10000). If the counts are sorted in descending order, the minimum count to |
| // reach ProfileSummaryCutoffHot gives the threshold to determine a hot count. |
| // Similarly, the minimum count to reach ProfileSummaryCutoffCold gives the |
| // threshold for determining cold count (everything <= this threshold is |
| // considered cold). |
| |
| static cl::opt<int> ProfileSummaryCutoffHot( |
| "profile-summary-cutoff-hot", cl::Hidden, cl::init(990000), cl::ZeroOrMore, |
| cl::desc("A count is hot if it exceeds the minimum count to" |
| " reach this percentile of total counts.")); |
| |
| static cl::opt<int> ProfileSummaryCutoffCold( |
| "profile-summary-cutoff-cold", cl::Hidden, cl::init(999999), cl::ZeroOrMore, |
| cl::desc("A count is cold if it is below the minimum count" |
| " to reach this percentile of total counts.")); |
| |
| static cl::opt<unsigned> ProfileSummaryHugeWorkingSetSizeThreshold( |
| "profile-summary-huge-working-set-size-threshold", cl::Hidden, |
| cl::init(15000), cl::ZeroOrMore, |
| cl::desc("The code working set size is considered huge if the number of" |
| " blocks required to reach the -profile-summary-cutoff-hot" |
| " percentile exceeds this count.")); |
| |
| static cl::opt<unsigned> ProfileSummaryLargeWorkingSetSizeThreshold( |
| "profile-summary-large-working-set-size-threshold", cl::Hidden, |
| cl::init(12500), cl::ZeroOrMore, |
| cl::desc("The code working set size is considered large if the number of" |
| " blocks required to reach the -profile-summary-cutoff-hot" |
| " percentile exceeds this count.")); |
| |
| // The next two options override the counts derived from summary computation and |
| // are useful for debugging purposes. |
| static cl::opt<int> ProfileSummaryHotCount( |
| "profile-summary-hot-count", cl::ReallyHidden, cl::ZeroOrMore, |
| cl::desc("A fixed hot count that overrides the count derived from" |
| " profile-summary-cutoff-hot")); |
| |
| static cl::opt<int> ProfileSummaryColdCount( |
| "profile-summary-cold-count", cl::ReallyHidden, cl::ZeroOrMore, |
| cl::desc("A fixed cold count that overrides the count derived from" |
| " profile-summary-cutoff-cold")); |
| |
| // Find the summary entry for a desired percentile of counts. |
| static const ProfileSummaryEntry &getEntryForPercentile(SummaryEntryVector &DS, |
| uint64_t Percentile) { |
| auto It = partition_point(DS, [=](const ProfileSummaryEntry &Entry) { |
| return Entry.Cutoff < Percentile; |
| }); |
| // The required percentile has to be <= one of the percentiles in the |
| // detailed summary. |
| if (It == DS.end()) |
| report_fatal_error("Desired percentile exceeds the maximum cutoff"); |
| return *It; |
| } |
| |
| // The profile summary metadata may be attached either by the frontend or by |
| // any backend passes (IR level instrumentation, for example). This method |
| // checks if the Summary is null and if so checks if the summary metadata is now |
| // available in the module and parses it to get the Summary object. Returns true |
| // if a valid Summary is available. |
| bool ProfileSummaryInfo::computeSummary() { |
| if (Summary) |
| return true; |
| // First try to get context sensitive ProfileSummary. |
| auto *SummaryMD = M.getProfileSummary(/* IsCS */ true); |
| if (SummaryMD) { |
| Summary.reset(ProfileSummary::getFromMD(SummaryMD)); |
| return true; |
| } |
| // This will actually return PSK_Instr or PSK_Sample summary. |
| SummaryMD = M.getProfileSummary(/* IsCS */ false); |
| if (!SummaryMD) |
| return false; |
| Summary.reset(ProfileSummary::getFromMD(SummaryMD)); |
| return true; |
| } |
| |
| Optional<uint64_t> |
| ProfileSummaryInfo::getProfileCount(const Instruction *Inst, |
| BlockFrequencyInfo *BFI, |
| bool AllowSynthetic) { |
| if (!Inst) |
| return None; |
| assert((isa<CallInst>(Inst) || isa<InvokeInst>(Inst)) && |
| "We can only get profile count for call/invoke instruction."); |
| if (hasSampleProfile()) { |
| // In sample PGO mode, check if there is a profile metadata on the |
| // instruction. If it is present, determine hotness solely based on that, |
| // since the sampled entry count may not be accurate. If there is no |
| // annotated on the instruction, return None. |
| uint64_t TotalCount; |
| if (Inst->extractProfTotalWeight(TotalCount)) |
| return TotalCount; |
| return None; |
| } |
| if (BFI) |
| return BFI->getBlockProfileCount(Inst->getParent(), AllowSynthetic); |
| return None; |
| } |
| |
| /// Returns true if the function's entry is hot. If it returns false, it |
| /// either means it is not hot or it is unknown whether it is hot or not (for |
| /// example, no profile data is available). |
| bool ProfileSummaryInfo::isFunctionEntryHot(const Function *F) { |
| if (!F || !computeSummary()) |
| return false; |
| auto FunctionCount = F->getEntryCount(); |
| // FIXME: The heuristic used below for determining hotness is based on |
| // preliminary SPEC tuning for inliner. This will eventually be a |
| // convenience method that calls isHotCount. |
| return FunctionCount && isHotCount(FunctionCount.getCount()); |
| } |
| |
| /// Returns true if the function contains hot code. This can include a hot |
| /// function entry count, hot basic block, or (in the case of Sample PGO) |
| /// hot total call edge count. |
| /// If it returns false, it either means it is not hot or it is unknown |
| /// (for example, no profile data is available). |
| bool ProfileSummaryInfo::isFunctionHotInCallGraph(const Function *F, |
| BlockFrequencyInfo &BFI) { |
| if (!F || !computeSummary()) |
| return false; |
| if (auto FunctionCount = F->getEntryCount()) |
| if (isHotCount(FunctionCount.getCount())) |
| return true; |
| |
| if (hasSampleProfile()) { |
| uint64_t TotalCallCount = 0; |
| for (const auto &BB : *F) |
| for (const auto &I : BB) |
| if (isa<CallInst>(I) || isa<InvokeInst>(I)) |
| if (auto CallCount = getProfileCount(&I, nullptr)) |
| TotalCallCount += CallCount.getValue(); |
| if (isHotCount(TotalCallCount)) |
| return true; |
| } |
| for (const auto &BB : *F) |
| if (isHotBlock(&BB, &BFI)) |
| return true; |
| return false; |
| } |
| |
| /// Returns true if the function only contains cold code. This means that |
| /// the function entry and blocks are all cold, and (in the case of Sample PGO) |
| /// the total call edge count is cold. |
| /// If it returns false, it either means it is not cold or it is unknown |
| /// (for example, no profile data is available). |
| bool ProfileSummaryInfo::isFunctionColdInCallGraph(const Function *F, |
| BlockFrequencyInfo &BFI) { |
| if (!F || !computeSummary()) |
| return false; |
| if (auto FunctionCount = F->getEntryCount()) |
| if (!isColdCount(FunctionCount.getCount())) |
| return false; |
| |
| if (hasSampleProfile()) { |
| uint64_t TotalCallCount = 0; |
| for (const auto &BB : *F) |
| for (const auto &I : BB) |
| if (isa<CallInst>(I) || isa<InvokeInst>(I)) |
| if (auto CallCount = getProfileCount(&I, nullptr)) |
| TotalCallCount += CallCount.getValue(); |
| if (!isColdCount(TotalCallCount)) |
| return false; |
| } |
| for (const auto &BB : *F) |
| if (!isColdBlock(&BB, &BFI)) |
| return false; |
| return true; |
| } |
| |
| // Like isFunctionHotInCallGraph but for a given cutoff. |
| bool ProfileSummaryInfo::isFunctionHotInCallGraphNthPercentile( |
| int PercentileCutoff, const Function *F, BlockFrequencyInfo &BFI) { |
| if (!F || !computeSummary()) |
| return false; |
| if (auto FunctionCount = F->getEntryCount()) |
| if (isHotCountNthPercentile(PercentileCutoff, FunctionCount.getCount())) |
| return true; |
| |
| if (hasSampleProfile()) { |
| uint64_t TotalCallCount = 0; |
| for (const auto &BB : *F) |
| for (const auto &I : BB) |
| if (isa<CallInst>(I) || isa<InvokeInst>(I)) |
| if (auto CallCount = getProfileCount(&I, nullptr)) |
| TotalCallCount += CallCount.getValue(); |
| if (isHotCountNthPercentile(PercentileCutoff, TotalCallCount)) |
| return true; |
| } |
| for (const auto &BB : *F) |
| if (isHotBlockNthPercentile(PercentileCutoff, &BB, &BFI)) |
| return true; |
| return false; |
| } |
| |
| /// Returns true if the function's entry is a cold. If it returns false, it |
| /// either means it is not cold or it is unknown whether it is cold or not (for |
| /// example, no profile data is available). |
| bool ProfileSummaryInfo::isFunctionEntryCold(const Function *F) { |
| if (!F) |
| return false; |
| if (F->hasFnAttribute(Attribute::Cold)) |
| return true; |
| if (!computeSummary()) |
| return false; |
| auto FunctionCount = F->getEntryCount(); |
| // FIXME: The heuristic used below for determining coldness is based on |
| // preliminary SPEC tuning for inliner. This will eventually be a |
| // convenience method that calls isHotCount. |
| return FunctionCount && isColdCount(FunctionCount.getCount()); |
| } |
| |
| /// Compute the hot and cold thresholds. |
| void ProfileSummaryInfo::computeThresholds() { |
| if (!computeSummary()) |
| return; |
| auto &DetailedSummary = Summary->getDetailedSummary(); |
| auto &HotEntry = |
| getEntryForPercentile(DetailedSummary, ProfileSummaryCutoffHot); |
| HotCountThreshold = HotEntry.MinCount; |
| if (ProfileSummaryHotCount.getNumOccurrences() > 0) |
| HotCountThreshold = ProfileSummaryHotCount; |
| auto &ColdEntry = |
| getEntryForPercentile(DetailedSummary, ProfileSummaryCutoffCold); |
| ColdCountThreshold = ColdEntry.MinCount; |
| if (ProfileSummaryColdCount.getNumOccurrences() > 0) |
| ColdCountThreshold = ProfileSummaryColdCount; |
| assert(ColdCountThreshold <= HotCountThreshold && |
| "Cold count threshold cannot exceed hot count threshold!"); |
| HasHugeWorkingSetSize = |
| HotEntry.NumCounts > ProfileSummaryHugeWorkingSetSizeThreshold; |
| HasLargeWorkingSetSize = |
| HotEntry.NumCounts > ProfileSummaryLargeWorkingSetSizeThreshold; |
| } |
| |
| Optional<uint64_t> ProfileSummaryInfo::computeThreshold(int PercentileCutoff) { |
| if (!computeSummary()) |
| return None; |
| auto iter = ThresholdCache.find(PercentileCutoff); |
| if (iter != ThresholdCache.end()) { |
| return iter->second; |
| } |
| auto &DetailedSummary = Summary->getDetailedSummary(); |
| auto &Entry = |
| getEntryForPercentile(DetailedSummary, PercentileCutoff); |
| uint64_t CountThreshold = Entry.MinCount; |
| ThresholdCache[PercentileCutoff] = CountThreshold; |
| return CountThreshold; |
| } |
| |
| bool ProfileSummaryInfo::hasHugeWorkingSetSize() { |
| if (!HasHugeWorkingSetSize) |
| computeThresholds(); |
| return HasHugeWorkingSetSize && HasHugeWorkingSetSize.getValue(); |
| } |
| |
| bool ProfileSummaryInfo::hasLargeWorkingSetSize() { |
| if (!HasLargeWorkingSetSize) |
| computeThresholds(); |
| return HasLargeWorkingSetSize && HasLargeWorkingSetSize.getValue(); |
| } |
| |
| bool ProfileSummaryInfo::isHotCount(uint64_t C) { |
| if (!HotCountThreshold) |
| computeThresholds(); |
| return HotCountThreshold && C >= HotCountThreshold.getValue(); |
| } |
| |
| bool ProfileSummaryInfo::isColdCount(uint64_t C) { |
| if (!ColdCountThreshold) |
| computeThresholds(); |
| return ColdCountThreshold && C <= ColdCountThreshold.getValue(); |
| } |
| |
| bool ProfileSummaryInfo::isHotCountNthPercentile(int PercentileCutoff, uint64_t C) { |
| auto CountThreshold = computeThreshold(PercentileCutoff); |
| return CountThreshold && C >= CountThreshold.getValue(); |
| } |
| |
| uint64_t ProfileSummaryInfo::getOrCompHotCountThreshold() { |
| if (!HotCountThreshold) |
| computeThresholds(); |
| return HotCountThreshold ? HotCountThreshold.getValue() : UINT64_MAX; |
| } |
| |
| uint64_t ProfileSummaryInfo::getOrCompColdCountThreshold() { |
| if (!ColdCountThreshold) |
| computeThresholds(); |
| return ColdCountThreshold ? ColdCountThreshold.getValue() : 0; |
| } |
| |
| bool ProfileSummaryInfo::isHotBlock(const BasicBlock *BB, BlockFrequencyInfo *BFI) { |
| auto Count = BFI->getBlockProfileCount(BB); |
| return Count && isHotCount(*Count); |
| } |
| |
| bool ProfileSummaryInfo::isColdBlock(const BasicBlock *BB, |
| BlockFrequencyInfo *BFI) { |
| auto Count = BFI->getBlockProfileCount(BB); |
| return Count && isColdCount(*Count); |
| } |
| |
| bool ProfileSummaryInfo::isHotBlockNthPercentile(int PercentileCutoff, |
| const BasicBlock *BB, |
| BlockFrequencyInfo *BFI) { |
| auto Count = BFI->getBlockProfileCount(BB); |
| return Count && isHotCountNthPercentile(PercentileCutoff, *Count); |
| } |
| |
| bool ProfileSummaryInfo::isHotCallSite(const CallSite &CS, |
| BlockFrequencyInfo *BFI) { |
| auto C = getProfileCount(CS.getInstruction(), BFI); |
| return C && isHotCount(*C); |
| } |
| |
| bool ProfileSummaryInfo::isColdCallSite(const CallSite &CS, |
| BlockFrequencyInfo *BFI) { |
| auto C = getProfileCount(CS.getInstruction(), BFI); |
| if (C) |
| return isColdCount(*C); |
| |
| // In SamplePGO, if the caller has been sampled, and there is no profile |
| // annotated on the callsite, we consider the callsite as cold. |
| return hasSampleProfile() && CS.getCaller()->hasProfileData(); |
| } |
| |
| INITIALIZE_PASS(ProfileSummaryInfoWrapperPass, "profile-summary-info", |
| "Profile summary info", false, true) |
| |
| ProfileSummaryInfoWrapperPass::ProfileSummaryInfoWrapperPass() |
| : ImmutablePass(ID) { |
| initializeProfileSummaryInfoWrapperPassPass(*PassRegistry::getPassRegistry()); |
| } |
| |
| bool ProfileSummaryInfoWrapperPass::doInitialization(Module &M) { |
| PSI.reset(new ProfileSummaryInfo(M)); |
| return false; |
| } |
| |
| bool ProfileSummaryInfoWrapperPass::doFinalization(Module &M) { |
| PSI.reset(); |
| return false; |
| } |
| |
| AnalysisKey ProfileSummaryAnalysis::Key; |
| ProfileSummaryInfo ProfileSummaryAnalysis::run(Module &M, |
| ModuleAnalysisManager &) { |
| return ProfileSummaryInfo(M); |
| } |
| |
| PreservedAnalyses ProfileSummaryPrinterPass::run(Module &M, |
| ModuleAnalysisManager &AM) { |
| ProfileSummaryInfo &PSI = AM.getResult<ProfileSummaryAnalysis>(M); |
| |
| OS << "Functions in " << M.getName() << " with hot/cold annotations: \n"; |
| for (auto &F : M) { |
| OS << F.getName(); |
| if (PSI.isFunctionEntryHot(&F)) |
| OS << " :hot entry "; |
| else if (PSI.isFunctionEntryCold(&F)) |
| OS << " :cold entry "; |
| OS << "\n"; |
| } |
| return PreservedAnalyses::all(); |
| } |
| |
| char ProfileSummaryInfoWrapperPass::ID = 0; |