//===- SampleProfileLoaderBaseUtil.cpp - Profile loader Util func ---------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file implements the SampleProfileLoader base utility functions. // //===----------------------------------------------------------------------===// #include "llvm/Transforms/Utils/SampleProfileLoaderBaseUtil.h" namespace llvm { cl::opt SampleProfileMaxPropagateIterations( "sample-profile-max-propagate-iterations", cl::init(100), cl::desc("Maximum number of iterations to go through when propagating " "sample block/edge weights through the CFG.")); cl::opt SampleProfileRecordCoverage( "sample-profile-check-record-coverage", cl::init(0), cl::value_desc("N"), cl::desc("Emit a warning if less than N% of records in the input profile " "are matched to the IR.")); cl::opt SampleProfileSampleCoverage( "sample-profile-check-sample-coverage", cl::init(0), cl::value_desc("N"), cl::desc("Emit a warning if less than N% of samples in the input profile " "are matched to the IR.")); cl::opt NoWarnSampleUnused( "no-warn-sample-unused", cl::init(false), cl::Hidden, cl::desc("Use this option to turn off/on warnings about function with " "samples but without debug information to use those samples. ")); namespace sampleprofutil { /// Return true if the given callsite is hot wrt to hot cutoff threshold. /// /// Functions that were inlined in the original binary will be represented /// in the inline stack in the sample profile. If the profile shows that /// the original inline decision was "good" (i.e., the callsite is executed /// frequently), then we will recreate the inline decision and apply the /// profile from the inlined callsite. /// /// To decide whether an inlined callsite is hot, we compare the callsite /// sample count with the hot cutoff computed by ProfileSummaryInfo, it is /// regarded as hot if the count is above the cutoff value. /// /// When ProfileAccurateForSymsInList is enabled and profile symbol list /// is present, functions in the profile symbol list but without profile will /// be regarded as cold and much less inlining will happen in CGSCC inlining /// pass, so we tend to lower the hot criteria here to allow more early /// inlining to happen for warm callsites and it is helpful for performance. bool callsiteIsHot(const FunctionSamples *CallsiteFS, ProfileSummaryInfo *PSI, bool ProfAccForSymsInList) { if (!CallsiteFS) return false; // The callsite was not inlined in the original binary. assert(PSI && "PSI is expected to be non null"); uint64_t CallsiteTotalSamples = CallsiteFS->getTotalSamples(); if (ProfAccForSymsInList) return !PSI->isColdCount(CallsiteTotalSamples); else return PSI->isHotCount(CallsiteTotalSamples); } /// Mark as used the sample record for the given function samples at /// (LineOffset, Discriminator). /// /// \returns true if this is the first time we mark the given record. bool SampleCoverageTracker::markSamplesUsed(const FunctionSamples *FS, uint32_t LineOffset, uint32_t Discriminator, uint64_t Samples) { LineLocation Loc(LineOffset, Discriminator); unsigned &Count = SampleCoverage[FS][Loc]; bool FirstTime = (++Count == 1); if (FirstTime) TotalUsedSamples += Samples; return FirstTime; } /// Return the number of sample records that were applied from this profile. /// /// This count does not include records from cold inlined callsites. unsigned SampleCoverageTracker::countUsedRecords(const FunctionSamples *FS, ProfileSummaryInfo *PSI) const { auto I = SampleCoverage.find(FS); // The size of the coverage map for FS represents the number of records // that were marked used at least once. unsigned Count = (I != SampleCoverage.end()) ? I->second.size() : 0; // If there are inlined callsites in this function, count the samples found // in the respective bodies. However, do not bother counting callees with 0 // total samples, these are callees that were never invoked at runtime. for (const auto &I : FS->getCallsiteSamples()) for (const auto &J : I.second) { const FunctionSamples *CalleeSamples = &J.second; if (callsiteIsHot(CalleeSamples, PSI, ProfAccForSymsInList)) Count += countUsedRecords(CalleeSamples, PSI); } return Count; } /// Return the number of sample records in the body of this profile. /// /// This count does not include records from cold inlined callsites. unsigned SampleCoverageTracker::countBodyRecords(const FunctionSamples *FS, ProfileSummaryInfo *PSI) const { unsigned Count = FS->getBodySamples().size(); // Only count records in hot callsites. for (const auto &I : FS->getCallsiteSamples()) for (const auto &J : I.second) { const FunctionSamples *CalleeSamples = &J.second; if (callsiteIsHot(CalleeSamples, PSI, ProfAccForSymsInList)) Count += countBodyRecords(CalleeSamples, PSI); } return Count; } /// Return the number of samples collected in the body of this profile. /// /// This count does not include samples from cold inlined callsites. uint64_t SampleCoverageTracker::countBodySamples(const FunctionSamples *FS, ProfileSummaryInfo *PSI) const { uint64_t Total = 0; for (const auto &I : FS->getBodySamples()) Total += I.second.getSamples(); // Only count samples in hot callsites. for (const auto &I : FS->getCallsiteSamples()) for (const auto &J : I.second) { const FunctionSamples *CalleeSamples = &J.second; if (callsiteIsHot(CalleeSamples, PSI, ProfAccForSymsInList)) Total += countBodySamples(CalleeSamples, PSI); } return Total; } /// Return the fraction of sample records used in this profile. /// /// The returned value is an unsigned integer in the range 0-100 indicating /// the percentage of sample records that were used while applying this /// profile to the associated function. unsigned SampleCoverageTracker::computeCoverage(unsigned Used, unsigned Total) const { assert(Used <= Total && "number of used records cannot exceed the total number of records"); return Total > 0 ? Used * 100 / Total : 100; } /// Create a global variable to flag FSDiscriminators are used. void createFSDiscriminatorVariable(Module *M) { const char *FSDiscriminatorVar = "__llvm_fs_discriminator__"; if (M->getGlobalVariable(FSDiscriminatorVar)) return; auto &Context = M->getContext(); // Place this variable to llvm.used so it won't be GC'ed. appendToUsed(*M, {new GlobalVariable(*M, Type::getInt1Ty(Context), true, GlobalValue::WeakODRLinkage, ConstantInt::getTrue(Context), FSDiscriminatorVar)}); } } // end of namespace sampleprofutil } // end of namespace llvm