george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 1 | //===- FuzzerTracePC.h - Internal header for the Fuzzer ---------*- C++ -* ===// |
| 2 | // |
chandlerc | 4028449 | 2019-01-19 08:50:56 +0000 | [diff] [blame] | 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // fuzzer::TracePC |
| 9 | //===----------------------------------------------------------------------===// |
| 10 | |
| 11 | #ifndef LLVM_FUZZER_TRACE_PC |
| 12 | #define LLVM_FUZZER_TRACE_PC |
| 13 | |
| 14 | #include "FuzzerDefs.h" |
| 15 | #include "FuzzerDictionary.h" |
| 16 | #include "FuzzerValueBitMap.h" |
| 17 | |
| 18 | #include <set> |
kcc | b3080d0 | 2018-07-19 22:00:48 +0000 | [diff] [blame] | 19 | #include <unordered_map> |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 20 | |
| 21 | namespace fuzzer { |
| 22 | |
// TableOfRecentCompares (TORC) is a fixed-size table that keeps the operand
// pairs of the most recently performed comparisons of type T.
// The arguments of CMP instructions are written here unconditionally because
// that seems cheaper than computing some expensive condition inside
// __sanitizer_cov_trace_cmp*.
// After the unit has been executed, the contents of the table may be used to
// populate a Dictionary.
template <class T, size_t kSizeT>
struct TableOfRecentCompares {
  static const size_t kSize = kSizeT;

  // The two operands of one recorded comparison.
  struct Pair {
    T A, B;
  };

  // Stores (Arg1, Arg2) in slot `Idx % kSize`, overwriting the previous
  // contents of that slot.
  ATTRIBUTE_NO_SANITIZE_ALL
  void Insert(size_t Idx, const T &Arg1, const T &Arg2) {
    Pair &Slot = Table[Idx % kSize];
    Slot.A = Arg1;
    Slot.B = Arg2;
  }

  // Returns a copy of the pair stored in slot `I % kSize`.
  Pair Get(size_t I) {
    const size_t Slot = I % kSize;
    return Table[Slot];
  }

  Pair Table[kSize];
};
| 47 | |
| 48 | template <size_t kSizeT> |
| 49 | struct MemMemTable { |
| 50 | static const size_t kSize = kSizeT; |
| 51 | Word MemMemWords[kSize]; |
| 52 | Word EmptyWord; |
| 53 | |
| 54 | void Add(const uint8_t *Data, size_t Size) { |
| 55 | if (Size <= 2) return; |
| 56 | Size = std::min(Size, Word::GetMaxSize()); |
| 57 | size_t Idx = SimpleFastHash(Data, Size) % kSize; |
| 58 | MemMemWords[Idx].Set(Data, Size); |
| 59 | } |
| 60 | const Word &Get(size_t Idx) { |
| 61 | for (size_t i = 0; i < kSize; i++) { |
| 62 | const Word &W = MemMemWords[(Idx + i) % kSize]; |
| 63 | if (W.size()) return W; |
| 64 | } |
| 65 | EmptyWord.Set(nullptr, 0); |
| 66 | return EmptyWord; |
| 67 | } |
| 68 | }; |
| 69 | |
| 70 | class TracePC { |
dor1s | e6729cb | 2018-07-16 15:15:34 +0000 | [diff] [blame] | 71 | public: |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 72 | void HandleInline8bitCountersInit(uint8_t *Start, uint8_t *Stop); |
kcc | 98957a1 | 2017-08-25 19:29:47 +0000 | [diff] [blame] | 73 | void HandlePCsInit(const uintptr_t *Start, const uintptr_t *Stop); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 74 | void HandleCallerCallee(uintptr_t Caller, uintptr_t Callee); |
| 75 | template <class T> void HandleCmp(uintptr_t PC, T Arg1, T Arg2); |
| 76 | size_t GetTotalPCCoverage(); |
| 77 | void SetUseCounters(bool UC) { UseCounters = UC; } |
kcc | 3850d06 | 2018-07-03 22:33:09 +0000 | [diff] [blame] | 78 | void SetUseValueProfileMask(uint32_t VPMask) { UseValueProfileMask = VPMask; } |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 79 | void SetPrintNewPCs(bool P) { DoPrintNewPCs = P; } |
kcc | ec9da66 | 2017-08-28 22:52:22 +0000 | [diff] [blame] | 80 | void SetPrintNewFuncs(size_t P) { NumPrintNewFuncs = P; } |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 81 | void UpdateObservedPCs(); |
| 82 | template <class Callback> void CollectFeatures(Callback CB) const; |
| 83 | |
| 84 | void ResetMaps() { |
| 85 | ValueProfileMap.Reset(); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 86 | ClearExtraCounters(); |
| 87 | ClearInlineCounters(); |
| 88 | } |
| 89 | |
| 90 | void ClearInlineCounters(); |
| 91 | |
| 92 | void UpdateFeatureSet(size_t CurrentElementIdx, size_t CurrentElementSize); |
| 93 | void PrintFeatureSet(); |
| 94 | |
| 95 | void PrintModuleInfo(); |
| 96 | |
| 97 | void PrintCoverage(); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 98 | |
kcc | 85cad3d | 2018-05-11 01:17:52 +0000 | [diff] [blame] | 99 | template<class CallBack> |
| 100 | void IterateCoveredFunctions(CallBack CB); |
| 101 | |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 102 | void AddValueForMemcmp(void *caller_pc, const void *s1, const void *s2, |
| 103 | size_t n, bool StopAtZero); |
| 104 | |
| 105 | TableOfRecentCompares<uint32_t, 32> TORC4; |
| 106 | TableOfRecentCompares<uint64_t, 32> TORC8; |
| 107 | TableOfRecentCompares<Word, 32> TORCW; |
| 108 | MemMemTable<1024> MMT; |
| 109 | |
kcc | 1c0379f | 2017-08-22 01:28:32 +0000 | [diff] [blame] | 110 | void RecordInitialStack(); |
| 111 | uintptr_t GetMaxStackOffset() const; |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 112 | |
| 113 | template<class CallBack> |
| 114 | void ForEachObservedPC(CallBack CB) { |
| 115 | for (auto PC : ObservedPCs) |
| 116 | CB(PC); |
| 117 | } |
| 118 | |
kcc | 3acbe07 | 2018-05-16 23:26:37 +0000 | [diff] [blame] | 119 | void SetFocusFunction(const std::string &FuncName); |
| 120 | bool ObservedFocusFunction(); |
| 121 | |
kcc | 001e5f7 | 2019-02-14 23:12:33 +0000 | [diff] [blame] | 122 | struct PCTableEntry { |
| 123 | uintptr_t PC, PCFlags; |
| 124 | }; |
| 125 | |
| 126 | uintptr_t PCTableEntryIdx(const PCTableEntry *TE); |
kcc | 9c0ed93 | 2019-02-15 01:22:00 +0000 | [diff] [blame] | 127 | const PCTableEntry *PCTableEntryByIdx(uintptr_t Idx); |
| 128 | static uintptr_t GetNextInstructionPc(uintptr_t PC); |
| 129 | bool PcIsFuncEntry(const PCTableEntry *TE) { return TE->PCFlags & 1; } |
kcc | 001e5f7 | 2019-02-14 23:12:33 +0000 | [diff] [blame] | 130 | |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 131 | private: |
| 132 | bool UseCounters = false; |
kcc | 3850d06 | 2018-07-03 22:33:09 +0000 | [diff] [blame] | 133 | uint32_t UseValueProfileMask = false; |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 134 | bool DoPrintNewPCs = false; |
kcc | ec9da66 | 2017-08-28 22:52:22 +0000 | [diff] [blame] | 135 | size_t NumPrintNewFuncs = 0; |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 136 | |
kcc | e246920 | 2019-01-30 06:15:52 +0000 | [diff] [blame] | 137 | // Module represents the array of 8-bit counters split into regions |
| 138 | // such that every region, except maybe the first and the last one, is one |
| 139 | // full page. |
| 140 | struct Module { |
| 141 | struct Region { |
| 142 | uint8_t *Start, *Stop; |
| 143 | bool Enabled; |
| 144 | bool OneFullPage; |
| 145 | }; |
| 146 | Region *Regions; |
| 147 | size_t NumRegions; |
| 148 | uint8_t *Start() { return Regions[0].Start; } |
| 149 | uint8_t *Stop() { return Regions[NumRegions - 1].Stop; } |
| 150 | size_t Size() { return Stop() - Start(); } |
| 151 | size_t Idx(uint8_t *P) { |
| 152 | assert(P >= Start() && P < Stop()); |
| 153 | return P - Start(); |
| 154 | } |
| 155 | }; |
| 156 | |
| 157 | Module Modules[4096]; |
| 158 | size_t NumModules; // linker-initialized. |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 159 | size_t NumInline8bitCounters; |
| 160 | |
kcc | e246920 | 2019-01-30 06:15:52 +0000 | [diff] [blame] | 161 | template <class Callback> |
| 162 | void IterateCounterRegions(Callback CB) { |
| 163 | for (size_t m = 0; m < NumModules; m++) |
| 164 | for (size_t r = 0; r < Modules[m].NumRegions; r++) |
| 165 | CB(Modules[m].Regions[r]); |
| 166 | } |
| 167 | |
kcc | 98957a1 | 2017-08-25 19:29:47 +0000 | [diff] [blame] | 168 | struct { const PCTableEntry *Start, *Stop; } ModulePCTable[4096]; |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 169 | size_t NumPCTables; |
| 170 | size_t NumPCsInPCTables; |
| 171 | |
kcc | 001e5f7 | 2019-02-14 23:12:33 +0000 | [diff] [blame] | 172 | Set<const PCTableEntry*> ObservedPCs; |
kcc | b3080d0 | 2018-07-19 22:00:48 +0000 | [diff] [blame] | 173 | std::unordered_map<uintptr_t, uintptr_t> ObservedFuncs; // PC => Counter. |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 174 | |
kcc | e246920 | 2019-01-30 06:15:52 +0000 | [diff] [blame] | 175 | uint8_t *FocusFunctionCounterPtr = nullptr; |
kcc | 3acbe07 | 2018-05-16 23:26:37 +0000 | [diff] [blame] | 176 | |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 177 | ValueBitMap ValueProfileMap; |
kcc | 1c0379f | 2017-08-22 01:28:32 +0000 | [diff] [blame] | 178 | uintptr_t InitialStack; |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 179 | }; |
| 180 | |
// Calls Handle8bitCounter(FirstFeature, Idx, Value) for every non-zero byte
// in [Begin, End), in increasing address order, where Idx is the byte's offset
// from Begin and Value is the byte itself. Returns End - Begin.
//
// Callback signature:
//   void Callback(size_t FirstFeature, size_t Idx, uint8_t Value);
//
// The scan runs in three phases: byte by byte up to the first word-aligned
// address, then one machine word at a time so that all-zero words are skipped
// with a single load, then byte by byte over whatever tail is left.
template <class Callback>
ATTRIBUTE_NO_SANITIZE_ALL
size_t ForEachNonZeroByte(const uint8_t *Begin, const uint8_t *End,
                          size_t FirstFeature, Callback Handle8bitCounter) {
  typedef uintptr_t LargeType;
  const size_t Step = sizeof(LargeType) / sizeof(uint8_t);
  const size_t StepMask = Step - 1;
  auto P = Begin;

  // Iterate by 1 byte until either the alignment boundary or the end.
  for (; P < End && (reinterpret_cast<uintptr_t>(P) & StepMask); P++)
    if (uint8_t V = *P)
      Handle8bitCounter(FirstFeature, P - Begin, V);

  // Iterate by Step bytes at a time, but only while a whole word still fits
  // before End: loading a partial trailing word would read past the buffer
  // and report indices that are outside [Begin, End).
  for (; End - P >= static_cast<ptrdiff_t>(Step); P += Step)
    if (*reinterpret_cast<const LargeType *>(P))
      // The word is only used as a cheap "anything set?" test. The bytes are
      // then read in memory order, so the reported indices do not depend on
      // the host byte order.
      for (size_t I = 0; I < Step; I++)
        if (uint8_t V = P[I])
          Handle8bitCounter(FirstFeature, P - Begin + I, V);

  // Iterate by 1 byte until the end.
  for (; P < End; P++)
    if (uint8_t V = *P)
      Handle8bitCounter(FirstFeature, P - Begin, V);
  return End - Begin;
}
| 208 | |
// Maps a non-zero Counter to a bucket number in the range [0,7].
//
// Counters are grouped into buckets as shown below:
//
//   Counter bucket: [1] [2] [3] [4-7] [8-15] [16-31] [32-127] [128+]
//   Feature number:  0   1   2    3     4       5       6       7
//
// This is a heuristic taken from AFL (see
// http://lcamtuf.coredump.cx/afl/technical_details.txt).
//
// This implementation may change in the future so clients should
// not rely on it.
template <class T>
unsigned CounterToFeature(T Counter) {
  assert(Counter);
  // Test the thresholds from the largest down and return on the first match.
  if (Counter >= 128)
    return 7;
  if (Counter >= 32)
    return 6;
  if (Counter >= 16)
    return 5;
  if (Counter >= 8)
    return 4;
  if (Counter >= 4)
    return 3;
  if (Counter >= 3)
    return 2;
  if (Counter >= 2)
    return 1;
  return 0;
}
| 234 | |
kcc | c924e38 | 2017-09-15 22:10:36 +0000 | [diff] [blame] | 235 | template <class Callback> // void Callback(size_t Feature) |
kcc | 1c0379f | 2017-08-22 01:28:32 +0000 | [diff] [blame] | 236 | ATTRIBUTE_NO_SANITIZE_ADDRESS |
metzman | 2fe66e6 | 2019-01-17 16:36:05 +0000 | [diff] [blame] | 237 | ATTRIBUTE_NOINLINE |
kcc | 1c0379f | 2017-08-22 01:28:32 +0000 | [diff] [blame] | 238 | void TracePC::CollectFeatures(Callback HandleFeature) const { |
kcc | 1c0379f | 2017-08-22 01:28:32 +0000 | [diff] [blame] | 239 | auto Handle8bitCounter = [&](size_t FirstFeature, |
| 240 | size_t Idx, uint8_t Counter) { |
kcc | 1f5638d | 2017-12-08 22:21:42 +0000 | [diff] [blame] | 241 | if (UseCounters) |
| 242 | HandleFeature(FirstFeature + Idx * 8 + CounterToFeature(Counter)); |
| 243 | else |
| 244 | HandleFeature(FirstFeature + Idx); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 245 | }; |
| 246 | |
| 247 | size_t FirstFeature = 0; |
| 248 | |
kcc | e246920 | 2019-01-30 06:15:52 +0000 | [diff] [blame] | 249 | for (size_t i = 0; i < NumModules; i++) { |
| 250 | for (size_t r = 0; r < Modules[i].NumRegions; r++) { |
| 251 | if (!Modules[i].Regions[r].Enabled) continue; |
| 252 | FirstFeature += 8 * ForEachNonZeroByte(Modules[i].Regions[r].Start, |
| 253 | Modules[i].Regions[r].Stop, |
| 254 | FirstFeature, Handle8bitCounter); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 255 | } |
| 256 | } |
| 257 | |
kcc | e246920 | 2019-01-30 06:15:52 +0000 | [diff] [blame] | 258 | FirstFeature += |
| 259 | 8 * ForEachNonZeroByte(ExtraCountersBegin(), ExtraCountersEnd(), |
| 260 | FirstFeature, Handle8bitCounter); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 261 | |
kcc | 3850d06 | 2018-07-03 22:33:09 +0000 | [diff] [blame] | 262 | if (UseValueProfileMask) { |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 263 | ValueProfileMap.ForEach([&](size_t Idx) { |
| 264 | HandleFeature(FirstFeature + Idx); |
| 265 | }); |
| 266 | FirstFeature += ValueProfileMap.SizeInBits(); |
| 267 | } |
| 268 | |
kcc | d804ddb | 2017-12-09 19:18:10 +0000 | [diff] [blame] | 269 | // Step function, grows similar to 8 * Log_2(A). |
| 270 | auto StackDepthStepFunction = [](uint32_t A) -> uint32_t { |
dor1s | a66e776 | 2017-12-20 19:31:51 +0000 | [diff] [blame] | 271 | if (!A) return A; |
kcc | e29d7e3 | 2017-12-12 23:11:28 +0000 | [diff] [blame] | 272 | uint32_t Log2 = Log(A); |
kcc | d804ddb | 2017-12-09 19:18:10 +0000 | [diff] [blame] | 273 | if (Log2 < 3) return A; |
| 274 | Log2 -= 3; |
| 275 | return (Log2 + 1) * 8 + ((A >> Log2) & 7); |
| 276 | }; |
| 277 | assert(StackDepthStepFunction(1024) == 64); |
| 278 | assert(StackDepthStepFunction(1024 * 4) == 80); |
| 279 | assert(StackDepthStepFunction(1024 * 1024) == 144); |
| 280 | |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 281 | if (auto MaxStackOffset = GetMaxStackOffset()) |
kcc | d804ddb | 2017-12-09 19:18:10 +0000 | [diff] [blame] | 282 | HandleFeature(FirstFeature + StackDepthStepFunction(MaxStackOffset / 8)); |
george.karpenkov | 29efa6d | 2017-08-21 23:25:50 +0000 | [diff] [blame] | 283 | } |
| 284 | |
| 285 | extern TracePC TPC; |
| 286 | |
| 287 | } // namespace fuzzer |
| 288 | |
| 289 | #endif // LLVM_FUZZER_TRACE_PC |