xref: /freebsd/contrib/llvm-project/compiler-rt/lib/fuzzer/FuzzerTracePC.h (revision fe6060f10f634930ff71b7c50291ddc610da2475)
//===- FuzzerTracePC.h - Internal header for the Fuzzer ---------*- C++ -* ===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
// fuzzer::TracePC
//===----------------------------------------------------------------------===//
100b57cec5SDimitry Andric 
110b57cec5SDimitry Andric #ifndef LLVM_FUZZER_TRACE_PC
120b57cec5SDimitry Andric #define LLVM_FUZZER_TRACE_PC
130b57cec5SDimitry Andric 
140b57cec5SDimitry Andric #include "FuzzerDefs.h"
150b57cec5SDimitry Andric #include "FuzzerDictionary.h"
160b57cec5SDimitry Andric #include "FuzzerValueBitMap.h"
170b57cec5SDimitry Andric 
180b57cec5SDimitry Andric #include <set>
190b57cec5SDimitry Andric #include <unordered_map>
200b57cec5SDimitry Andric 
210b57cec5SDimitry Andric namespace fuzzer {
220b57cec5SDimitry Andric 
230b57cec5SDimitry Andric // TableOfRecentCompares (TORC) remembers the most recently performed
240b57cec5SDimitry Andric // comparisons of type T.
250b57cec5SDimitry Andric // We record the arguments of CMP instructions in this table unconditionally
260b57cec5SDimitry Andric // because it seems cheaper this way than to compute some expensive
270b57cec5SDimitry Andric // conditions inside __sanitizer_cov_trace_cmp*.
280b57cec5SDimitry Andric // After the unit has been executed we may decide to use the contents of
290b57cec5SDimitry Andric // this table to populate a Dictionary.
300b57cec5SDimitry Andric template<class T, size_t kSizeT>
310b57cec5SDimitry Andric struct TableOfRecentCompares {
320b57cec5SDimitry Andric   static const size_t kSize = kSizeT;
330b57cec5SDimitry Andric   struct Pair {
340b57cec5SDimitry Andric     T A, B;
350b57cec5SDimitry Andric   };
360b57cec5SDimitry Andric   ATTRIBUTE_NO_SANITIZE_ALL
370b57cec5SDimitry Andric   void Insert(size_t Idx, const T &Arg1, const T &Arg2) {
380b57cec5SDimitry Andric     Idx = Idx % kSize;
390b57cec5SDimitry Andric     Table[Idx].A = Arg1;
400b57cec5SDimitry Andric     Table[Idx].B = Arg2;
410b57cec5SDimitry Andric   }
420b57cec5SDimitry Andric 
430b57cec5SDimitry Andric   Pair Get(size_t I) { return Table[I % kSize]; }
440b57cec5SDimitry Andric 
450b57cec5SDimitry Andric   Pair Table[kSize];
460b57cec5SDimitry Andric };
470b57cec5SDimitry Andric 
480b57cec5SDimitry Andric template <size_t kSizeT>
490b57cec5SDimitry Andric struct MemMemTable {
500b57cec5SDimitry Andric   static const size_t kSize = kSizeT;
510b57cec5SDimitry Andric   Word MemMemWords[kSize];
520b57cec5SDimitry Andric   Word EmptyWord;
530b57cec5SDimitry Andric 
540b57cec5SDimitry Andric   void Add(const uint8_t *Data, size_t Size) {
550b57cec5SDimitry Andric     if (Size <= 2) return;
560b57cec5SDimitry Andric     Size = std::min(Size, Word::GetMaxSize());
57*fe6060f1SDimitry Andric     auto Idx = SimpleFastHash(Data, Size) % kSize;
580b57cec5SDimitry Andric     MemMemWords[Idx].Set(Data, Size);
590b57cec5SDimitry Andric   }
600b57cec5SDimitry Andric   const Word &Get(size_t Idx) {
610b57cec5SDimitry Andric     for (size_t i = 0; i < kSize; i++) {
620b57cec5SDimitry Andric       const Word &W = MemMemWords[(Idx + i) % kSize];
630b57cec5SDimitry Andric       if (W.size()) return W;
640b57cec5SDimitry Andric     }
650b57cec5SDimitry Andric     EmptyWord.Set(nullptr, 0);
660b57cec5SDimitry Andric     return EmptyWord;
670b57cec5SDimitry Andric   }
680b57cec5SDimitry Andric };
690b57cec5SDimitry Andric 
700b57cec5SDimitry Andric class TracePC {
710b57cec5SDimitry Andric  public:
720b57cec5SDimitry Andric   void HandleInline8bitCountersInit(uint8_t *Start, uint8_t *Stop);
730b57cec5SDimitry Andric   void HandlePCsInit(const uintptr_t *Start, const uintptr_t *Stop);
740b57cec5SDimitry Andric   void HandleCallerCallee(uintptr_t Caller, uintptr_t Callee);
750b57cec5SDimitry Andric   template <class T> void HandleCmp(uintptr_t PC, T Arg1, T Arg2);
760b57cec5SDimitry Andric   size_t GetTotalPCCoverage();
770b57cec5SDimitry Andric   void SetUseCounters(bool UC) { UseCounters = UC; }
780b57cec5SDimitry Andric   void SetUseValueProfileMask(uint32_t VPMask) { UseValueProfileMask = VPMask; }
790b57cec5SDimitry Andric   void SetPrintNewPCs(bool P) { DoPrintNewPCs = P; }
800b57cec5SDimitry Andric   void SetPrintNewFuncs(size_t P) { NumPrintNewFuncs = P; }
810b57cec5SDimitry Andric   void UpdateObservedPCs();
82*fe6060f1SDimitry Andric   template <class Callback> size_t CollectFeatures(Callback CB) const;
830b57cec5SDimitry Andric 
840b57cec5SDimitry Andric   void ResetMaps() {
850b57cec5SDimitry Andric     ValueProfileMap.Reset();
860b57cec5SDimitry Andric     ClearExtraCounters();
870b57cec5SDimitry Andric     ClearInlineCounters();
880b57cec5SDimitry Andric   }
890b57cec5SDimitry Andric 
900b57cec5SDimitry Andric   void ClearInlineCounters();
910b57cec5SDimitry Andric 
920b57cec5SDimitry Andric   void UpdateFeatureSet(size_t CurrentElementIdx, size_t CurrentElementSize);
930b57cec5SDimitry Andric   void PrintFeatureSet();
940b57cec5SDimitry Andric 
950b57cec5SDimitry Andric   void PrintModuleInfo();
960b57cec5SDimitry Andric 
97e8d8bef9SDimitry Andric   void PrintCoverage(bool PrintAllCounters);
980b57cec5SDimitry Andric 
990b57cec5SDimitry Andric   template<class CallBack>
1000b57cec5SDimitry Andric   void IterateCoveredFunctions(CallBack CB);
1010b57cec5SDimitry Andric 
1020b57cec5SDimitry Andric   void AddValueForMemcmp(void *caller_pc, const void *s1, const void *s2,
1030b57cec5SDimitry Andric                          size_t n, bool StopAtZero);
1040b57cec5SDimitry Andric 
1050b57cec5SDimitry Andric   TableOfRecentCompares<uint32_t, 32> TORC4;
1060b57cec5SDimitry Andric   TableOfRecentCompares<uint64_t, 32> TORC8;
1070b57cec5SDimitry Andric   TableOfRecentCompares<Word, 32> TORCW;
1080b57cec5SDimitry Andric   MemMemTable<1024> MMT;
1090b57cec5SDimitry Andric 
1100b57cec5SDimitry Andric   void RecordInitialStack();
1110b57cec5SDimitry Andric   uintptr_t GetMaxStackOffset() const;
1120b57cec5SDimitry Andric 
1130b57cec5SDimitry Andric   template<class CallBack>
1140b57cec5SDimitry Andric   void ForEachObservedPC(CallBack CB) {
1150b57cec5SDimitry Andric     for (auto PC : ObservedPCs)
1160b57cec5SDimitry Andric       CB(PC);
1170b57cec5SDimitry Andric   }
1180b57cec5SDimitry Andric 
1190b57cec5SDimitry Andric   void SetFocusFunction(const std::string &FuncName);
1200b57cec5SDimitry Andric   bool ObservedFocusFunction();
1210b57cec5SDimitry Andric 
1220b57cec5SDimitry Andric   struct PCTableEntry {
1230b57cec5SDimitry Andric     uintptr_t PC, PCFlags;
1240b57cec5SDimitry Andric   };
1250b57cec5SDimitry Andric 
1260b57cec5SDimitry Andric   uintptr_t PCTableEntryIdx(const PCTableEntry *TE);
1270b57cec5SDimitry Andric   const PCTableEntry *PCTableEntryByIdx(uintptr_t Idx);
1280b57cec5SDimitry Andric   static uintptr_t GetNextInstructionPc(uintptr_t PC);
1290b57cec5SDimitry Andric   bool PcIsFuncEntry(const PCTableEntry *TE) { return TE->PCFlags & 1; }
1300b57cec5SDimitry Andric 
1310b57cec5SDimitry Andric private:
1320b57cec5SDimitry Andric   bool UseCounters = false;
1330b57cec5SDimitry Andric   uint32_t UseValueProfileMask = false;
1340b57cec5SDimitry Andric   bool DoPrintNewPCs = false;
1350b57cec5SDimitry Andric   size_t NumPrintNewFuncs = 0;
1360b57cec5SDimitry Andric 
1370b57cec5SDimitry Andric   // Module represents the array of 8-bit counters split into regions
1380b57cec5SDimitry Andric   // such that every region, except maybe the first and the last one, is one
1390b57cec5SDimitry Andric   // full page.
1400b57cec5SDimitry Andric   struct Module {
1410b57cec5SDimitry Andric     struct Region {
1420b57cec5SDimitry Andric       uint8_t *Start, *Stop;
1430b57cec5SDimitry Andric       bool Enabled;
1440b57cec5SDimitry Andric       bool OneFullPage;
1450b57cec5SDimitry Andric     };
1460b57cec5SDimitry Andric     Region *Regions;
1470b57cec5SDimitry Andric     size_t NumRegions;
1480b57cec5SDimitry Andric     uint8_t *Start() { return Regions[0].Start; }
1490b57cec5SDimitry Andric     uint8_t *Stop()  { return Regions[NumRegions - 1].Stop; }
1500b57cec5SDimitry Andric     size_t Size()   { return Stop() - Start(); }
1510b57cec5SDimitry Andric     size_t  Idx(uint8_t *P) {
1520b57cec5SDimitry Andric       assert(P >= Start() && P < Stop());
1530b57cec5SDimitry Andric       return P - Start();
1540b57cec5SDimitry Andric     }
1550b57cec5SDimitry Andric   };
1560b57cec5SDimitry Andric 
1570b57cec5SDimitry Andric   Module Modules[4096];
1580b57cec5SDimitry Andric   size_t NumModules;  // linker-initialized.
1590b57cec5SDimitry Andric   size_t NumInline8bitCounters;
1600b57cec5SDimitry Andric 
1610b57cec5SDimitry Andric   template <class Callback>
1620b57cec5SDimitry Andric   void IterateCounterRegions(Callback CB) {
1630b57cec5SDimitry Andric     for (size_t m = 0; m < NumModules; m++)
1640b57cec5SDimitry Andric       for (size_t r = 0; r < Modules[m].NumRegions; r++)
1650b57cec5SDimitry Andric         CB(Modules[m].Regions[r]);
1660b57cec5SDimitry Andric   }
1670b57cec5SDimitry Andric 
1680b57cec5SDimitry Andric   struct { const PCTableEntry *Start, *Stop; } ModulePCTable[4096];
1690b57cec5SDimitry Andric   size_t NumPCTables;
1700b57cec5SDimitry Andric   size_t NumPCsInPCTables;
1710b57cec5SDimitry Andric 
1720b57cec5SDimitry Andric   Set<const PCTableEntry*> ObservedPCs;
1730b57cec5SDimitry Andric   std::unordered_map<uintptr_t, uintptr_t> ObservedFuncs;  // PC => Counter.
1740b57cec5SDimitry Andric 
1750b57cec5SDimitry Andric   uint8_t *FocusFunctionCounterPtr = nullptr;
1760b57cec5SDimitry Andric 
1770b57cec5SDimitry Andric   ValueBitMap ValueProfileMap;
1780b57cec5SDimitry Andric   uintptr_t InitialStack;
1790b57cec5SDimitry Andric };
1800b57cec5SDimitry Andric 
1810b57cec5SDimitry Andric template <class Callback>
1820b57cec5SDimitry Andric // void Callback(size_t FirstFeature, size_t Idx, uint8_t Value);
1830b57cec5SDimitry Andric ATTRIBUTE_NO_SANITIZE_ALL
1840b57cec5SDimitry Andric size_t ForEachNonZeroByte(const uint8_t *Begin, const uint8_t *End,
1850b57cec5SDimitry Andric                         size_t FirstFeature, Callback Handle8bitCounter) {
1860b57cec5SDimitry Andric   typedef uintptr_t LargeType;
1870b57cec5SDimitry Andric   const size_t Step = sizeof(LargeType) / sizeof(uint8_t);
1880b57cec5SDimitry Andric   const size_t StepMask = Step - 1;
1890b57cec5SDimitry Andric   auto P = Begin;
1900b57cec5SDimitry Andric   // Iterate by 1 byte until either the alignment boundary or the end.
1910b57cec5SDimitry Andric   for (; reinterpret_cast<uintptr_t>(P) & StepMask && P < End; P++)
1920b57cec5SDimitry Andric     if (uint8_t V = *P)
1930b57cec5SDimitry Andric       Handle8bitCounter(FirstFeature, P - Begin, V);
1940b57cec5SDimitry Andric 
1950b57cec5SDimitry Andric   // Iterate by Step bytes at a time.
196*fe6060f1SDimitry Andric   for (; P + Step <= End; P += Step)
197e8d8bef9SDimitry Andric     if (LargeType Bundle = *reinterpret_cast<const LargeType *>(P)) {
198e8d8bef9SDimitry Andric       Bundle = HostToLE(Bundle);
1990b57cec5SDimitry Andric       for (size_t I = 0; I < Step; I++, Bundle >>= 8)
2000b57cec5SDimitry Andric         if (uint8_t V = Bundle & 0xff)
2010b57cec5SDimitry Andric           Handle8bitCounter(FirstFeature, P - Begin + I, V);
202e8d8bef9SDimitry Andric     }
2030b57cec5SDimitry Andric 
2040b57cec5SDimitry Andric   // Iterate by 1 byte until the end.
2050b57cec5SDimitry Andric   for (; P < End; P++)
2060b57cec5SDimitry Andric     if (uint8_t V = *P)
2070b57cec5SDimitry Andric       Handle8bitCounter(FirstFeature, P - Begin, V);
2080b57cec5SDimitry Andric   return End - Begin;
2090b57cec5SDimitry Andric }
2100b57cec5SDimitry Andric 
// Maps a non-zero Counter to a bucket number in the range [0,7].
template<class T>
unsigned CounterToFeature(T Counter) {
  // Counters are grouped into buckets as shown below and the bucket number
  // is the resulting feature number.
  //
  // Counter bucket: [1] [2] [3] [4-7] [8-15] [16-31] [32-127] [128+]
  // Feature number:  0   1   2    3     4       5       6       7
  //
  // This is a heuristic taken from AFL (see
  // http://lcamtuf.coredump.cx/afl/technical_details.txt).
  //
  // This implementation may change in the future so clients should
  // not rely on it.
  assert(Counter);
  // Check the thresholds from the largest down; the first one reached wins.
  if (Counter >= 128) return 7;
  if (Counter >= 32) return 6;
  if (Counter >= 16) return 5;
  if (Counter >= 8) return 4;
  if (Counter >= 4) return 3;
  if (Counter >= 3) return 2;
  if (Counter >= 2) return 1;
  return 0;
}
2360b57cec5SDimitry Andric 
237*fe6060f1SDimitry Andric template <class Callback> // void Callback(uint32_t Feature)
238*fe6060f1SDimitry Andric ATTRIBUTE_NO_SANITIZE_ADDRESS ATTRIBUTE_NOINLINE size_t
239*fe6060f1SDimitry Andric TracePC::CollectFeatures(Callback HandleFeature) const {
2400b57cec5SDimitry Andric   auto Handle8bitCounter = [&](size_t FirstFeature,
2410b57cec5SDimitry Andric                                size_t Idx, uint8_t Counter) {
2420b57cec5SDimitry Andric     if (UseCounters)
243*fe6060f1SDimitry Andric       HandleFeature(static_cast<uint32_t>(FirstFeature + Idx * 8 +
244*fe6060f1SDimitry Andric                                           CounterToFeature(Counter)));
2450b57cec5SDimitry Andric     else
246*fe6060f1SDimitry Andric       HandleFeature(static_cast<uint32_t>(FirstFeature + Idx));
2470b57cec5SDimitry Andric   };
2480b57cec5SDimitry Andric 
2490b57cec5SDimitry Andric   size_t FirstFeature = 0;
2500b57cec5SDimitry Andric 
2510b57cec5SDimitry Andric   for (size_t i = 0; i < NumModules; i++) {
2520b57cec5SDimitry Andric     for (size_t r = 0; r < Modules[i].NumRegions; r++) {
2530b57cec5SDimitry Andric       if (!Modules[i].Regions[r].Enabled) continue;
2540b57cec5SDimitry Andric       FirstFeature += 8 * ForEachNonZeroByte(Modules[i].Regions[r].Start,
2550b57cec5SDimitry Andric                                              Modules[i].Regions[r].Stop,
2560b57cec5SDimitry Andric                                              FirstFeature, Handle8bitCounter);
2570b57cec5SDimitry Andric     }
2580b57cec5SDimitry Andric   }
2590b57cec5SDimitry Andric 
2600b57cec5SDimitry Andric   FirstFeature +=
2610b57cec5SDimitry Andric       8 * ForEachNonZeroByte(ExtraCountersBegin(), ExtraCountersEnd(),
2620b57cec5SDimitry Andric                              FirstFeature, Handle8bitCounter);
2630b57cec5SDimitry Andric 
2640b57cec5SDimitry Andric   if (UseValueProfileMask) {
2650b57cec5SDimitry Andric     ValueProfileMap.ForEach([&](size_t Idx) {
266*fe6060f1SDimitry Andric       HandleFeature(static_cast<uint32_t>(FirstFeature + Idx));
2670b57cec5SDimitry Andric     });
2680b57cec5SDimitry Andric     FirstFeature += ValueProfileMap.SizeInBits();
2690b57cec5SDimitry Andric   }
2700b57cec5SDimitry Andric 
2710b57cec5SDimitry Andric   // Step function, grows similar to 8 * Log_2(A).
272*fe6060f1SDimitry Andric   auto StackDepthStepFunction = [](size_t A) -> size_t {
273*fe6060f1SDimitry Andric     if (!A)
274*fe6060f1SDimitry Andric       return A;
275*fe6060f1SDimitry Andric     auto Log2 = Log(A);
276*fe6060f1SDimitry Andric     if (Log2 < 3)
277*fe6060f1SDimitry Andric       return A;
2780b57cec5SDimitry Andric     Log2 -= 3;
2790b57cec5SDimitry Andric     return (Log2 + 1) * 8 + ((A >> Log2) & 7);
2800b57cec5SDimitry Andric   };
2810b57cec5SDimitry Andric   assert(StackDepthStepFunction(1024) == 64);
2820b57cec5SDimitry Andric   assert(StackDepthStepFunction(1024 * 4) == 80);
2830b57cec5SDimitry Andric   assert(StackDepthStepFunction(1024 * 1024) == 144);
2840b57cec5SDimitry Andric 
285*fe6060f1SDimitry Andric   if (auto MaxStackOffset = GetMaxStackOffset()) {
286*fe6060f1SDimitry Andric     HandleFeature(static_cast<uint32_t>(
287*fe6060f1SDimitry Andric         FirstFeature + StackDepthStepFunction(MaxStackOffset / 8)));
288*fe6060f1SDimitry Andric     FirstFeature += StackDepthStepFunction(std::numeric_limits<size_t>::max());
289*fe6060f1SDimitry Andric   }
290*fe6060f1SDimitry Andric 
291*fe6060f1SDimitry Andric   return FirstFeature;
2920b57cec5SDimitry Andric }
2930b57cec5SDimitry Andric 
// Declaration of the global TracePC object TPC; its definition is not in
// this header.
extern TracePC TPC;
2950b57cec5SDimitry Andric 
2960b57cec5SDimitry Andric }  // namespace fuzzer
2970b57cec5SDimitry Andric 
2980b57cec5SDimitry Andric #endif  // LLVM_FUZZER_TRACE_PC
299