xref: /freebsd/contrib/llvm-project/llvm/lib/ProfileData/ProfileSummaryBuilder.cpp (revision d409305fa3838fb39b38c26fc085fb729b8766d5)
//=-- ProfileSummaryBuilder.cpp - Profile summary computation ---------------=//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file contains support for computing profile summary data.
100b57cec5SDimitry Andric //
110b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric 
130b57cec5SDimitry Andric #include "llvm/IR/Attributes.h"
140b57cec5SDimitry Andric #include "llvm/IR/Function.h"
150b57cec5SDimitry Andric #include "llvm/IR/Metadata.h"
160b57cec5SDimitry Andric #include "llvm/IR/Type.h"
170b57cec5SDimitry Andric #include "llvm/ProfileData/InstrProf.h"
180b57cec5SDimitry Andric #include "llvm/ProfileData/ProfileCommon.h"
190b57cec5SDimitry Andric #include "llvm/ProfileData/SampleProf.h"
200b57cec5SDimitry Andric #include "llvm/Support/Casting.h"
21*d409305fSDimitry Andric #include "llvm/Support/CommandLine.h"
220b57cec5SDimitry Andric 
230b57cec5SDimitry Andric using namespace llvm;
240b57cec5SDimitry Andric 
25*d409305fSDimitry Andric cl::opt<bool> UseContextLessSummary(
26*d409305fSDimitry Andric     "profile-summary-contextless", cl::Hidden, cl::init(false), cl::ZeroOrMore,
27*d409305fSDimitry Andric     cl::desc("Merge context profiles before calculating thresholds."));
28*d409305fSDimitry Andric 
// Default cutoff points for the detailed summary. Each entry is expressed in
// units of 1 / ProfileSummary::Scale (Scale is 1000000), so dividing an entry
// by Scale yields the desired percentile of the total count.
static const uint32_t DefaultCutoffsData[] = {
    10000,  /*  1%      */
    100000, /* 10%      */
    200000, /* 20%      */
    300000, /* 30%      */
    400000, /* 40%      */
    500000, /* 50%      */
    600000, /* 60%      */
    700000, /* 70%      */
    800000, /* 80%      */
    900000, /* 90%      */
    950000, /* 95%      */
    990000, /* 99%      */
    999000, /* 99.9%    */
    999900, /* 99.99%   */
    999990, /* 99.999%  */
    999999  /* 99.9999% */
};
360b57cec5SDimitry Andric const ArrayRef<uint32_t> ProfileSummaryBuilder::DefaultCutoffs =
370b57cec5SDimitry Andric     DefaultCutoffsData;
380b57cec5SDimitry Andric 
395ffd83dbSDimitry Andric const ProfileSummaryEntry &
405ffd83dbSDimitry Andric ProfileSummaryBuilder::getEntryForPercentile(SummaryEntryVector &DS,
415ffd83dbSDimitry Andric                                              uint64_t Percentile) {
425ffd83dbSDimitry Andric   auto It = partition_point(DS, [=](const ProfileSummaryEntry &Entry) {
435ffd83dbSDimitry Andric     return Entry.Cutoff < Percentile;
445ffd83dbSDimitry Andric   });
455ffd83dbSDimitry Andric   // The required percentile has to be <= one of the percentiles in the
465ffd83dbSDimitry Andric   // detailed summary.
475ffd83dbSDimitry Andric   if (It == DS.end())
485ffd83dbSDimitry Andric     report_fatal_error("Desired percentile exceeds the maximum cutoff");
495ffd83dbSDimitry Andric   return *It;
505ffd83dbSDimitry Andric }
515ffd83dbSDimitry Andric 
520b57cec5SDimitry Andric void InstrProfSummaryBuilder::addRecord(const InstrProfRecord &R) {
530b57cec5SDimitry Andric   // The first counter is not necessarily an entry count for IR
540b57cec5SDimitry Andric   // instrumentation profiles.
550b57cec5SDimitry Andric   // Eventually MaxFunctionCount will become obsolete and this can be
560b57cec5SDimitry Andric   // removed.
570b57cec5SDimitry Andric   addEntryCount(R.Counts[0]);
580b57cec5SDimitry Andric   for (size_t I = 1, E = R.Counts.size(); I < E; ++I)
590b57cec5SDimitry Andric     addInternalCount(R.Counts[I]);
600b57cec5SDimitry Andric }
610b57cec5SDimitry Andric 
620b57cec5SDimitry Andric // To compute the detailed summary, we consider each line containing samples as
630b57cec5SDimitry Andric // equivalent to a block with a count in the instrumented profile.
640b57cec5SDimitry Andric void SampleProfileSummaryBuilder::addRecord(
650b57cec5SDimitry Andric     const sampleprof::FunctionSamples &FS, bool isCallsiteSample) {
660b57cec5SDimitry Andric   if (!isCallsiteSample) {
670b57cec5SDimitry Andric     NumFunctions++;
680b57cec5SDimitry Andric     if (FS.getHeadSamples() > MaxFunctionCount)
690b57cec5SDimitry Andric       MaxFunctionCount = FS.getHeadSamples();
700b57cec5SDimitry Andric   }
710b57cec5SDimitry Andric   for (const auto &I : FS.getBodySamples())
720b57cec5SDimitry Andric     addCount(I.second.getSamples());
730b57cec5SDimitry Andric   for (const auto &I : FS.getCallsiteSamples())
740b57cec5SDimitry Andric     for (const auto &CS : I.second)
750b57cec5SDimitry Andric       addRecord(CS.second, true);
760b57cec5SDimitry Andric }
770b57cec5SDimitry Andric 
780b57cec5SDimitry Andric // The argument to this method is a vector of cutoff percentages and the return
790b57cec5SDimitry Andric // value is a vector of (Cutoff, MinCount, NumCounts) triplets.
800b57cec5SDimitry Andric void ProfileSummaryBuilder::computeDetailedSummary() {
810b57cec5SDimitry Andric   if (DetailedSummaryCutoffs.empty())
820b57cec5SDimitry Andric     return;
830b57cec5SDimitry Andric   llvm::sort(DetailedSummaryCutoffs);
840b57cec5SDimitry Andric   auto Iter = CountFrequencies.begin();
850b57cec5SDimitry Andric   const auto End = CountFrequencies.end();
860b57cec5SDimitry Andric 
870b57cec5SDimitry Andric   uint32_t CountsSeen = 0;
880b57cec5SDimitry Andric   uint64_t CurrSum = 0, Count = 0;
890b57cec5SDimitry Andric 
900b57cec5SDimitry Andric   for (const uint32_t Cutoff : DetailedSummaryCutoffs) {
910b57cec5SDimitry Andric     assert(Cutoff <= 999999);
920b57cec5SDimitry Andric     APInt Temp(128, TotalCount);
930b57cec5SDimitry Andric     APInt N(128, Cutoff);
940b57cec5SDimitry Andric     APInt D(128, ProfileSummary::Scale);
950b57cec5SDimitry Andric     Temp *= N;
960b57cec5SDimitry Andric     Temp = Temp.sdiv(D);
970b57cec5SDimitry Andric     uint64_t DesiredCount = Temp.getZExtValue();
980b57cec5SDimitry Andric     assert(DesiredCount <= TotalCount);
990b57cec5SDimitry Andric     while (CurrSum < DesiredCount && Iter != End) {
1000b57cec5SDimitry Andric       Count = Iter->first;
1010b57cec5SDimitry Andric       uint32_t Freq = Iter->second;
1020b57cec5SDimitry Andric       CurrSum += (Count * Freq);
1030b57cec5SDimitry Andric       CountsSeen += Freq;
1040b57cec5SDimitry Andric       Iter++;
1050b57cec5SDimitry Andric     }
1060b57cec5SDimitry Andric     assert(CurrSum >= DesiredCount);
1070b57cec5SDimitry Andric     ProfileSummaryEntry PSE = {Cutoff, Count, CountsSeen};
1080b57cec5SDimitry Andric     DetailedSummary.push_back(PSE);
1090b57cec5SDimitry Andric   }
1100b57cec5SDimitry Andric }
1110b57cec5SDimitry Andric 
1120b57cec5SDimitry Andric std::unique_ptr<ProfileSummary> SampleProfileSummaryBuilder::getSummary() {
1130b57cec5SDimitry Andric   computeDetailedSummary();
1148bcb0991SDimitry Andric   return std::make_unique<ProfileSummary>(
1150b57cec5SDimitry Andric       ProfileSummary::PSK_Sample, DetailedSummary, TotalCount, MaxCount, 0,
1160b57cec5SDimitry Andric       MaxFunctionCount, NumCounts, NumFunctions);
1170b57cec5SDimitry Andric }
1180b57cec5SDimitry Andric 
119*d409305fSDimitry Andric std::unique_ptr<ProfileSummary>
120*d409305fSDimitry Andric SampleProfileSummaryBuilder::computeSummaryForProfiles(
121*d409305fSDimitry Andric     const StringMap<sampleprof::FunctionSamples> &Profiles) {
122*d409305fSDimitry Andric   assert(NumFunctions == 0 &&
123*d409305fSDimitry Andric          "This can only be called on an empty summary builder");
124*d409305fSDimitry Andric   StringMap<sampleprof::FunctionSamples> ContextLessProfiles;
125*d409305fSDimitry Andric   const StringMap<sampleprof::FunctionSamples> *ProfilesToUse = &Profiles;
126*d409305fSDimitry Andric   // For CSSPGO, context-sensitive profile effectively split a function profile
127*d409305fSDimitry Andric   // into many copies each representing the CFG profile of a particular calling
128*d409305fSDimitry Andric   // context. That makes the count distribution looks more flat as we now have
129*d409305fSDimitry Andric   // more function profiles each with lower counts, which in turn leads to lower
130*d409305fSDimitry Andric   // hot thresholds. To compensate for that, by defauly we merge context
131*d409305fSDimitry Andric   // profiles before coumputing profile summary.
132*d409305fSDimitry Andric   if (UseContextLessSummary || (sampleprof::FunctionSamples::ProfileIsCS &&
133*d409305fSDimitry Andric                                 !UseContextLessSummary.getNumOccurrences())) {
134*d409305fSDimitry Andric     for (const auto &I : Profiles) {
135*d409305fSDimitry Andric       ContextLessProfiles[I.second.getName()].merge(I.second);
136*d409305fSDimitry Andric     }
137*d409305fSDimitry Andric     ProfilesToUse = &ContextLessProfiles;
138*d409305fSDimitry Andric   }
139*d409305fSDimitry Andric 
140*d409305fSDimitry Andric   for (const auto &I : *ProfilesToUse) {
141*d409305fSDimitry Andric     const sampleprof::FunctionSamples &Profile = I.second;
142*d409305fSDimitry Andric     addRecord(Profile);
143*d409305fSDimitry Andric   }
144*d409305fSDimitry Andric 
145*d409305fSDimitry Andric   return getSummary();
146*d409305fSDimitry Andric }
147*d409305fSDimitry Andric 
1480b57cec5SDimitry Andric std::unique_ptr<ProfileSummary> InstrProfSummaryBuilder::getSummary() {
1490b57cec5SDimitry Andric   computeDetailedSummary();
1508bcb0991SDimitry Andric   return std::make_unique<ProfileSummary>(
1510b57cec5SDimitry Andric       ProfileSummary::PSK_Instr, DetailedSummary, TotalCount, MaxCount,
1520b57cec5SDimitry Andric       MaxInternalBlockCount, MaxFunctionCount, NumCounts, NumFunctions);
1530b57cec5SDimitry Andric }
1540b57cec5SDimitry Andric 
1550b57cec5SDimitry Andric void InstrProfSummaryBuilder::addEntryCount(uint64_t Count) {
1560b57cec5SDimitry Andric   NumFunctions++;
157e8d8bef9SDimitry Andric 
158e8d8bef9SDimitry Andric   // Skip invalid count.
159e8d8bef9SDimitry Andric   if (Count == (uint64_t)-1)
160e8d8bef9SDimitry Andric     return;
161e8d8bef9SDimitry Andric 
162e8d8bef9SDimitry Andric   addCount(Count);
1630b57cec5SDimitry Andric   if (Count > MaxFunctionCount)
1640b57cec5SDimitry Andric     MaxFunctionCount = Count;
1650b57cec5SDimitry Andric }
1660b57cec5SDimitry Andric 
1670b57cec5SDimitry Andric void InstrProfSummaryBuilder::addInternalCount(uint64_t Count) {
168e8d8bef9SDimitry Andric   // Skip invalid count.
169e8d8bef9SDimitry Andric   if (Count == (uint64_t)-1)
170e8d8bef9SDimitry Andric     return;
171e8d8bef9SDimitry Andric 
1720b57cec5SDimitry Andric   addCount(Count);
1730b57cec5SDimitry Andric   if (Count > MaxInternalBlockCount)
1740b57cec5SDimitry Andric     MaxInternalBlockCount = Count;
1750b57cec5SDimitry Andric }
176