//===- FuzzerDriver.cpp - FuzzerDriver function and flags -----------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
// FuzzerDriver and flag parsing.
//===----------------------------------------------------------------------===//

#include "FuzzerCommand.h"
#include "FuzzerCorpus.h"
#include "FuzzerFork.h"
#include "FuzzerIO.h"
#include "FuzzerInterface.h"
#include "FuzzerInternal.h"
#include "FuzzerMerge.h"
#include "FuzzerMutate.h"
#include "FuzzerPlatform.h"
#include "FuzzerRandom.h"
#include "FuzzerTracePC.h"
#include <algorithm>
#include <atomic>
#include <chrono>
#include <cstdlib>
#include <cstring>
#include <mutex>
#include <string>
#include <thread>
#include <fstream>

// This function should be present in the libFuzzer so that the client
// binary can test for its existence.
// The function body is intentionally empty: only the symbol matters.
#if LIBFUZZER_MSVC
extern "C" void __libfuzzer_is_present() {}
// Ask the linker to include the symbol. The 32-bit x86 spelling carries one
// extra leading underscore compared to the other targets.
#if defined(_M_IX86) || defined(__i386__)
#pragma comment(linker, "/include:___libfuzzer_is_present")
#else
#pragma comment(linker, "/include:__libfuzzer_is_present")
#endif
#else
// Non-MSVC toolchains: mark the symbol as used so that it is emitted even
// though nothing in this file references it.
extern "C" __attribute__((used)) void __libfuzzer_is_present() {}
#endif  // LIBFUZZER_MSVC

namespace fuzzer {

// Program arguments.
48 struct FlagDescription { 49 const char *Name; 50 const char *Description; 51 int Default; 52 int *IntFlag; 53 const char **StrFlag; 54 unsigned int *UIntFlag; 55 }; 56 57 struct { 58 #define FUZZER_DEPRECATED_FLAG(Name) 59 #define FUZZER_FLAG_INT(Name, Default, Description) int Name; 60 #define FUZZER_FLAG_UNSIGNED(Name, Default, Description) unsigned int Name; 61 #define FUZZER_FLAG_STRING(Name, Description) const char *Name; 62 #include "FuzzerFlags.def" 63 #undef FUZZER_DEPRECATED_FLAG 64 #undef FUZZER_FLAG_INT 65 #undef FUZZER_FLAG_UNSIGNED 66 #undef FUZZER_FLAG_STRING 67 } Flags; 68 69 static const FlagDescription FlagDescriptions [] { 70 #define FUZZER_DEPRECATED_FLAG(Name) \ 71 {#Name, "Deprecated; don't use", 0, nullptr, nullptr, nullptr}, 72 #define FUZZER_FLAG_INT(Name, Default, Description) \ 73 {#Name, Description, Default, &Flags.Name, nullptr, nullptr}, 74 #define FUZZER_FLAG_UNSIGNED(Name, Default, Description) \ 75 {#Name, Description, static_cast<int>(Default), \ 76 nullptr, nullptr, &Flags.Name}, 77 #define FUZZER_FLAG_STRING(Name, Description) \ 78 {#Name, Description, 0, nullptr, &Flags.Name, nullptr}, 79 #include "FuzzerFlags.def" 80 #undef FUZZER_DEPRECATED_FLAG 81 #undef FUZZER_FLAG_INT 82 #undef FUZZER_FLAG_UNSIGNED 83 #undef FUZZER_FLAG_STRING 84 }; 85 86 static const size_t kNumFlags = 87 sizeof(FlagDescriptions) / sizeof(FlagDescriptions[0]); 88 89 static std::vector<std::string> *Inputs; 90 static std::string *ProgName; 91 92 static void PrintHelp() { 93 Printf("Usage:\n"); 94 auto Prog = ProgName->c_str(); 95 Printf("\nTo run fuzzing pass 0 or more directories.\n"); 96 Printf("%s [-flag1=val1 [-flag2=val2 ...] ] [dir1 [dir2 ...] ]\n", Prog); 97 98 Printf("\nTo run individual tests without fuzzing pass 1 or more files:\n"); 99 Printf("%s [-flag1=val1 [-flag2=val2 ...] 
] file1 [file2 ...]\n", Prog); 100 101 Printf("\nFlags: (strictly in form -flag=value)\n"); 102 size_t MaxFlagLen = 0; 103 for (size_t F = 0; F < kNumFlags; F++) 104 MaxFlagLen = std::max(strlen(FlagDescriptions[F].Name), MaxFlagLen); 105 106 for (size_t F = 0; F < kNumFlags; F++) { 107 const auto &D = FlagDescriptions[F]; 108 if (strstr(D.Description, "internal flag") == D.Description) continue; 109 Printf(" %s", D.Name); 110 for (size_t i = 0, n = MaxFlagLen - strlen(D.Name); i < n; i++) 111 Printf(" "); 112 Printf("\t"); 113 Printf("%d\t%s\n", D.Default, D.Description); 114 } 115 Printf("\nFlags starting with '--' will be ignored and " 116 "will be passed verbatim to subprocesses.\n"); 117 } 118 119 static const char *FlagValue(const char *Param, const char *Name) { 120 size_t Len = strlen(Name); 121 if (Param[0] == '-' && strstr(Param + 1, Name) == Param + 1 && 122 Param[Len + 1] == '=') 123 return &Param[Len + 2]; 124 return nullptr; 125 } 126 127 // Avoid calling stol as it triggers a bug in clang/glibc build. 
128 static long MyStol(const char *Str) { 129 long Res = 0; 130 long Sign = 1; 131 if (*Str == '-') { 132 Str++; 133 Sign = -1; 134 } 135 for (size_t i = 0; Str[i]; i++) { 136 char Ch = Str[i]; 137 if (Ch < '0' || Ch > '9') 138 return Res; 139 Res = Res * 10 + (Ch - '0'); 140 } 141 return Res * Sign; 142 } 143 144 static bool ParseOneFlag(const char *Param) { 145 if (Param[0] != '-') return false; 146 if (Param[1] == '-') { 147 static bool PrintedWarning = false; 148 if (!PrintedWarning) { 149 PrintedWarning = true; 150 Printf("INFO: libFuzzer ignores flags that start with '--'\n"); 151 } 152 for (size_t F = 0; F < kNumFlags; F++) 153 if (FlagValue(Param + 1, FlagDescriptions[F].Name)) 154 Printf("WARNING: did you mean '%s' (single dash)?\n", Param + 1); 155 return true; 156 } 157 for (size_t F = 0; F < kNumFlags; F++) { 158 const char *Name = FlagDescriptions[F].Name; 159 const char *Str = FlagValue(Param, Name); 160 if (Str) { 161 if (FlagDescriptions[F].IntFlag) { 162 auto Val = MyStol(Str); 163 *FlagDescriptions[F].IntFlag = static_cast<int>(Val); 164 if (Flags.verbosity >= 2) 165 Printf("Flag: %s %d\n", Name, Val); 166 return true; 167 } else if (FlagDescriptions[F].UIntFlag) { 168 auto Val = std::stoul(Str); 169 *FlagDescriptions[F].UIntFlag = static_cast<unsigned int>(Val); 170 if (Flags.verbosity >= 2) 171 Printf("Flag: %s %u\n", Name, Val); 172 return true; 173 } else if (FlagDescriptions[F].StrFlag) { 174 *FlagDescriptions[F].StrFlag = Str; 175 if (Flags.verbosity >= 2) 176 Printf("Flag: %s %s\n", Name, Str); 177 return true; 178 } else { // Deprecated flag. 179 Printf("Flag: %s: deprecated, don't use\n", Name); 180 return true; 181 } 182 } 183 } 184 Printf("\n\nWARNING: unrecognized flag '%s'; " 185 "use -help=1 to list all flags\n\n", Param); 186 return true; 187 } 188 189 // We don't use any library to minimize dependencies. 
190 static void ParseFlags(const std::vector<std::string> &Args, 191 const ExternalFunctions *EF) { 192 for (size_t F = 0; F < kNumFlags; F++) { 193 if (FlagDescriptions[F].IntFlag) 194 *FlagDescriptions[F].IntFlag = FlagDescriptions[F].Default; 195 if (FlagDescriptions[F].UIntFlag) 196 *FlagDescriptions[F].UIntFlag = 197 static_cast<unsigned int>(FlagDescriptions[F].Default); 198 if (FlagDescriptions[F].StrFlag) 199 *FlagDescriptions[F].StrFlag = nullptr; 200 } 201 202 // Disable len_control by default, if LLVMFuzzerCustomMutator is used. 203 if (EF->LLVMFuzzerCustomMutator) { 204 Flags.len_control = 0; 205 Printf("INFO: found LLVMFuzzerCustomMutator (%p). " 206 "Disabling -len_control by default.\n", EF->LLVMFuzzerCustomMutator); 207 } 208 209 Inputs = new std::vector<std::string>; 210 for (size_t A = 1; A < Args.size(); A++) { 211 if (ParseOneFlag(Args[A].c_str())) { 212 if (Flags.ignore_remaining_args) 213 break; 214 continue; 215 } 216 Inputs->push_back(Args[A]); 217 } 218 } 219 220 static std::mutex Mu; 221 222 static void PulseThread() { 223 while (true) { 224 SleepSeconds(600); 225 std::lock_guard<std::mutex> Lock(Mu); 226 Printf("pulse...\n"); 227 } 228 } 229 230 static void WorkerThread(const Command &BaseCmd, std::atomic<unsigned> *Counter, 231 unsigned NumJobs, std::atomic<bool> *HasErrors) { 232 while (true) { 233 unsigned C = (*Counter)++; 234 if (C >= NumJobs) break; 235 std::string Log = "fuzz-" + std::to_string(C) + ".log"; 236 Command Cmd(BaseCmd); 237 Cmd.setOutputFile(Log); 238 Cmd.combineOutAndErr(); 239 if (Flags.verbosity) { 240 std::string CommandLine = Cmd.toString(); 241 Printf("%s\n", CommandLine.c_str()); 242 } 243 int ExitCode = ExecuteCommand(Cmd); 244 if (ExitCode != 0) 245 *HasErrors = true; 246 std::lock_guard<std::mutex> Lock(Mu); 247 Printf("================== Job %u exited with exit code %d ============\n", 248 C, ExitCode); 249 fuzzer::CopyFileToErr(Log); 250 } 251 } 252 253 static void ValidateDirectoryExists(const std::string 
&Path, 254 bool CreateDirectory) { 255 if (Path.empty()) { 256 Printf("ERROR: Provided directory path is an empty string\n"); 257 exit(1); 258 } 259 260 if (IsDirectory(Path)) 261 return; 262 263 if (CreateDirectory) { 264 if (!MkDirRecursive(Path)) { 265 Printf("ERROR: Failed to create directory \"%s\"\n", Path.c_str()); 266 exit(1); 267 } 268 return; 269 } 270 271 Printf("ERROR: The required directory \"%s\" does not exist\n", Path.c_str()); 272 exit(1); 273 } 274 275 std::string CloneArgsWithoutX(const std::vector<std::string> &Args, 276 const char *X1, const char *X2) { 277 std::string Cmd; 278 for (auto &S : Args) { 279 if (FlagValue(S.c_str(), X1) || FlagValue(S.c_str(), X2)) 280 continue; 281 Cmd += S + " "; 282 } 283 return Cmd; 284 } 285 286 static int RunInMultipleProcesses(const std::vector<std::string> &Args, 287 unsigned NumWorkers, unsigned NumJobs) { 288 std::atomic<unsigned> Counter(0); 289 std::atomic<bool> HasErrors(false); 290 Command Cmd(Args); 291 Cmd.removeFlag("jobs"); 292 Cmd.removeFlag("workers"); 293 std::vector<std::thread> V; 294 std::thread Pulse(PulseThread); 295 Pulse.detach(); 296 for (unsigned i = 0; i < NumWorkers; i++) 297 V.push_back(std::thread(WorkerThread, std::ref(Cmd), &Counter, NumJobs, 298 &HasErrors)); 299 for (auto &T : V) 300 T.join(); 301 return HasErrors ? 
1 : 0; 302 } 303 304 static void RssThread(Fuzzer *F, size_t RssLimitMb) { 305 while (true) { 306 SleepSeconds(1); 307 size_t Peak = GetPeakRSSMb(); 308 if (Peak > RssLimitMb) 309 F->RssLimitCallback(); 310 } 311 } 312 313 static void StartRssThread(Fuzzer *F, size_t RssLimitMb) { 314 if (!RssLimitMb) 315 return; 316 std::thread T(RssThread, F, RssLimitMb); 317 T.detach(); 318 } 319 320 int RunOneTest(Fuzzer *F, const char *InputFilePath, size_t MaxLen) { 321 Unit U = FileToVector(InputFilePath); 322 if (MaxLen && MaxLen < U.size()) 323 U.resize(MaxLen); 324 F->ExecuteCallback(U.data(), U.size()); 325 if (Flags.print_full_coverage) { 326 // Leak detection is not needed when collecting full coverage data. 327 F->TPCUpdateObservedPCs(); 328 } else { 329 F->TryDetectingAMemoryLeak(U.data(), U.size(), true); 330 } 331 return 0; 332 } 333 334 static bool AllInputsAreFiles() { 335 if (Inputs->empty()) return false; 336 for (auto &Path : *Inputs) 337 if (!IsFile(Path)) 338 return false; 339 return true; 340 } 341 342 static std::string GetDedupTokenFromCmdOutput(const std::string &S) { 343 auto Beg = S.find("DEDUP_TOKEN:"); 344 if (Beg == std::string::npos) 345 return ""; 346 auto End = S.find('\n', Beg); 347 if (End == std::string::npos) 348 return ""; 349 return S.substr(Beg, End - Beg); 350 } 351 352 int CleanseCrashInput(const std::vector<std::string> &Args, 353 const FuzzingOptions &Options) { 354 if (Inputs->size() != 1 || !Flags.exact_artifact_path) { 355 Printf("ERROR: -cleanse_crash should be given one input file and" 356 " -exact_artifact_path\n"); 357 exit(1); 358 } 359 std::string InputFilePath = Inputs->at(0); 360 std::string OutputFilePath = Flags.exact_artifact_path; 361 Command Cmd(Args); 362 Cmd.removeFlag("cleanse_crash"); 363 364 assert(Cmd.hasArgument(InputFilePath)); 365 Cmd.removeArgument(InputFilePath); 366 367 auto TmpFilePath = TempPath("CleanseCrashInput", ".repro"); 368 Cmd.addArgument(TmpFilePath); 369 Cmd.setOutputFile(getDevNull()); 370 
Cmd.combineOutAndErr(); 371 372 std::string CurrentFilePath = InputFilePath; 373 auto U = FileToVector(CurrentFilePath); 374 size_t Size = U.size(); 375 376 const std::vector<uint8_t> ReplacementBytes = {' ', 0xff}; 377 for (int NumAttempts = 0; NumAttempts < 5; NumAttempts++) { 378 bool Changed = false; 379 for (size_t Idx = 0; Idx < Size; Idx++) { 380 Printf("CLEANSE[%d]: Trying to replace byte %zd of %zd\n", NumAttempts, 381 Idx, Size); 382 uint8_t OriginalByte = U[Idx]; 383 if (ReplacementBytes.end() != std::find(ReplacementBytes.begin(), 384 ReplacementBytes.end(), 385 OriginalByte)) 386 continue; 387 for (auto NewByte : ReplacementBytes) { 388 U[Idx] = NewByte; 389 WriteToFile(U, TmpFilePath); 390 auto ExitCode = ExecuteCommand(Cmd); 391 RemoveFile(TmpFilePath); 392 if (!ExitCode) { 393 U[Idx] = OriginalByte; 394 } else { 395 Changed = true; 396 Printf("CLEANSE: Replaced byte %zd with 0x%x\n", Idx, NewByte); 397 WriteToFile(U, OutputFilePath); 398 break; 399 } 400 } 401 } 402 if (!Changed) break; 403 } 404 return 0; 405 } 406 407 int MinimizeCrashInput(const std::vector<std::string> &Args, 408 const FuzzingOptions &Options) { 409 if (Inputs->size() != 1) { 410 Printf("ERROR: -minimize_crash should be given one input file\n"); 411 exit(1); 412 } 413 std::string InputFilePath = Inputs->at(0); 414 Command BaseCmd(Args); 415 BaseCmd.removeFlag("minimize_crash"); 416 BaseCmd.removeFlag("exact_artifact_path"); 417 assert(BaseCmd.hasArgument(InputFilePath)); 418 BaseCmd.removeArgument(InputFilePath); 419 if (Flags.runs <= 0 && Flags.max_total_time == 0) { 420 Printf("INFO: you need to specify -runs=N or " 421 "-max_total_time=N with -minimize_crash=1\n" 422 "INFO: defaulting to -max_total_time=600\n"); 423 BaseCmd.addFlag("max_total_time", "600"); 424 } 425 426 BaseCmd.combineOutAndErr(); 427 428 std::string CurrentFilePath = InputFilePath; 429 while (true) { 430 Unit U = FileToVector(CurrentFilePath); 431 Printf("CRASH_MIN: minimizing crash input: '%s' (%zd 
bytes)\n", 432 CurrentFilePath.c_str(), U.size()); 433 434 Command Cmd(BaseCmd); 435 Cmd.addArgument(CurrentFilePath); 436 437 Printf("CRASH_MIN: executing: %s\n", Cmd.toString().c_str()); 438 std::string CmdOutput; 439 bool Success = ExecuteCommand(Cmd, &CmdOutput); 440 if (Success) { 441 Printf("ERROR: the input %s did not crash\n", CurrentFilePath.c_str()); 442 exit(1); 443 } 444 Printf("CRASH_MIN: '%s' (%zd bytes) caused a crash. Will try to minimize " 445 "it further\n", 446 CurrentFilePath.c_str(), U.size()); 447 auto DedupToken1 = GetDedupTokenFromCmdOutput(CmdOutput); 448 if (!DedupToken1.empty()) 449 Printf("CRASH_MIN: DedupToken1: %s\n", DedupToken1.c_str()); 450 451 std::string ArtifactPath = 452 Flags.exact_artifact_path 453 ? Flags.exact_artifact_path 454 : Options.ArtifactPrefix + "minimized-from-" + Hash(U); 455 Cmd.addFlag("minimize_crash_internal_step", "1"); 456 Cmd.addFlag("exact_artifact_path", ArtifactPath); 457 Printf("CRASH_MIN: executing: %s\n", Cmd.toString().c_str()); 458 CmdOutput.clear(); 459 Success = ExecuteCommand(Cmd, &CmdOutput); 460 Printf("%s", CmdOutput.c_str()); 461 if (Success) { 462 if (Flags.exact_artifact_path) { 463 CurrentFilePath = Flags.exact_artifact_path; 464 WriteToFile(U, CurrentFilePath); 465 } 466 Printf("CRASH_MIN: failed to minimize beyond %s (%zu bytes), exiting\n", 467 CurrentFilePath.c_str(), U.size()); 468 break; 469 } 470 auto DedupToken2 = GetDedupTokenFromCmdOutput(CmdOutput); 471 if (!DedupToken2.empty()) 472 Printf("CRASH_MIN: DedupToken2: %s\n", DedupToken2.c_str()); 473 474 if (DedupToken1 != DedupToken2) { 475 if (Flags.exact_artifact_path) { 476 CurrentFilePath = Flags.exact_artifact_path; 477 WriteToFile(U, CurrentFilePath); 478 } 479 Printf("CRASH_MIN: mismatch in dedup tokens" 480 " (looks like a different bug). 
Won't minimize further\n"); 481 break; 482 } 483 484 CurrentFilePath = ArtifactPath; 485 Printf("*********************************\n"); 486 } 487 return 0; 488 } 489 490 int MinimizeCrashInputInternalStep(Fuzzer *F, InputCorpus *Corpus) { 491 assert(Inputs->size() == 1); 492 std::string InputFilePath = Inputs->at(0); 493 Unit U = FileToVector(InputFilePath); 494 Printf("INFO: Starting MinimizeCrashInputInternalStep: %zd\n", U.size()); 495 if (U.size() < 2) { 496 Printf("INFO: The input is small enough, exiting\n"); 497 exit(0); 498 } 499 F->SetMaxInputLen(U.size()); 500 F->SetMaxMutationLen(U.size() - 1); 501 F->MinimizeCrashLoop(U); 502 Printf("INFO: Done MinimizeCrashInputInternalStep, no crashes found\n"); 503 exit(0); 504 } 505 506 void Merge(Fuzzer *F, FuzzingOptions &Options, 507 const std::vector<std::string> &Args, 508 const std::vector<std::string> &Corpora, const char *CFPathOrNull) { 509 if (Corpora.size() < 2) { 510 Printf("INFO: Merge requires two or more corpus dirs\n"); 511 exit(0); 512 } 513 514 std::vector<SizedFile> OldCorpus, NewCorpus; 515 GetSizedFilesFromDir(Corpora[0], &OldCorpus); 516 for (size_t i = 1; i < Corpora.size(); i++) 517 GetSizedFilesFromDir(Corpora[i], &NewCorpus); 518 std::sort(OldCorpus.begin(), OldCorpus.end()); 519 std::sort(NewCorpus.begin(), NewCorpus.end()); 520 521 std::string CFPath = CFPathOrNull ? CFPathOrNull : TempPath("Merge", ".txt"); 522 std::vector<std::string> NewFiles; 523 std::set<uint32_t> NewFeatures, NewCov; 524 CrashResistantMerge(Args, OldCorpus, NewCorpus, &NewFiles, {}, &NewFeatures, 525 {}, &NewCov, CFPath, true, Flags.set_cover_merge); 526 for (auto &Path : NewFiles) 527 F->WriteToOutputCorpus(FileToVector(Path, Options.MaxLen)); 528 // We are done, delete the control file if it was a temporary one. 
529 if (!Flags.merge_control_file) 530 RemoveFile(CFPath); 531 532 exit(0); 533 } 534 535 int AnalyzeDictionary(Fuzzer *F, const std::vector<Unit> &Dict, 536 UnitVector &Corpus) { 537 Printf("Started dictionary minimization (up to %zu tests)\n", 538 Dict.size() * Corpus.size() * 2); 539 540 // Scores and usage count for each dictionary unit. 541 std::vector<int> Scores(Dict.size()); 542 std::vector<int> Usages(Dict.size()); 543 544 std::vector<size_t> InitialFeatures; 545 std::vector<size_t> ModifiedFeatures; 546 for (auto &C : Corpus) { 547 // Get coverage for the testcase without modifications. 548 F->ExecuteCallback(C.data(), C.size()); 549 InitialFeatures.clear(); 550 TPC.CollectFeatures([&](size_t Feature) { 551 InitialFeatures.push_back(Feature); 552 }); 553 554 for (size_t i = 0; i < Dict.size(); ++i) { 555 std::vector<uint8_t> Data = C; 556 auto StartPos = std::search(Data.begin(), Data.end(), 557 Dict[i].begin(), Dict[i].end()); 558 // Skip dictionary unit, if the testcase does not contain it. 559 if (StartPos == Data.end()) 560 continue; 561 562 ++Usages[i]; 563 while (StartPos != Data.end()) { 564 // Replace all occurrences of dictionary unit in the testcase. 565 auto EndPos = StartPos + Dict[i].size(); 566 for (auto It = StartPos; It != EndPos; ++It) 567 *It ^= 0xFF; 568 569 StartPos = std::search(EndPos, Data.end(), 570 Dict[i].begin(), Dict[i].end()); 571 } 572 573 // Get coverage for testcase with masked occurrences of dictionary unit. 574 F->ExecuteCallback(Data.data(), Data.size()); 575 ModifiedFeatures.clear(); 576 TPC.CollectFeatures([&](size_t Feature) { 577 ModifiedFeatures.push_back(Feature); 578 }); 579 580 if (InitialFeatures == ModifiedFeatures) 581 --Scores[i]; 582 else 583 Scores[i] += 2; 584 } 585 } 586 587 Printf("###### Useless dictionary elements. ######\n"); 588 for (size_t i = 0; i < Dict.size(); ++i) { 589 // Dictionary units with positive score are treated as useful ones. 
590 if (Scores[i] > 0) 591 continue; 592 593 Printf("\""); 594 PrintASCII(Dict[i].data(), Dict[i].size(), "\""); 595 Printf(" # Score: %d, Used: %d\n", Scores[i], Usages[i]); 596 } 597 Printf("###### End of useless dictionary elements. ######\n"); 598 return 0; 599 } 600 601 std::vector<std::string> ParseSeedInuts(const char *seed_inputs) { 602 // Parse -seed_inputs=file1,file2,... or -seed_inputs=@seed_inputs_file 603 std::vector<std::string> Files; 604 if (!seed_inputs) return Files; 605 std::string SeedInputs; 606 if (Flags.seed_inputs[0] == '@') 607 SeedInputs = FileToString(Flags.seed_inputs + 1); // File contains list. 608 else 609 SeedInputs = Flags.seed_inputs; // seed_inputs contains the list. 610 if (SeedInputs.empty()) { 611 Printf("seed_inputs is empty or @file does not exist.\n"); 612 exit(1); 613 } 614 // Parse SeedInputs. 615 size_t comma_pos = 0; 616 while ((comma_pos = SeedInputs.find_last_of(',')) != std::string::npos) { 617 Files.push_back(SeedInputs.substr(comma_pos + 1)); 618 SeedInputs = SeedInputs.substr(0, comma_pos); 619 } 620 Files.push_back(SeedInputs); 621 return Files; 622 } 623 624 static std::vector<SizedFile> 625 ReadCorpora(const std::vector<std::string> &CorpusDirs, 626 const std::vector<std::string> &ExtraSeedFiles) { 627 std::vector<SizedFile> SizedFiles; 628 size_t LastNumFiles = 0; 629 for (auto &Dir : CorpusDirs) { 630 GetSizedFilesFromDir(Dir, &SizedFiles); 631 Printf("INFO: % 8zd files found in %s\n", SizedFiles.size() - LastNumFiles, 632 Dir.c_str()); 633 LastNumFiles = SizedFiles.size(); 634 } 635 for (auto &File : ExtraSeedFiles) 636 if (auto Size = FileSize(File)) 637 SizedFiles.push_back({File, Size}); 638 return SizedFiles; 639 } 640 641 int FuzzerDriver(int *argc, char ***argv, UserCallback Callback) { 642 using namespace fuzzer; 643 assert(argc && argv && "Argument pointers cannot be nullptr"); 644 std::string Argv0((*argv)[0]); 645 EF = new ExternalFunctions(); 646 if (EF->LLVMFuzzerInitialize) 647 
EF->LLVMFuzzerInitialize(argc, argv); 648 if (EF->__msan_scoped_disable_interceptor_checks) 649 EF->__msan_scoped_disable_interceptor_checks(); 650 const std::vector<std::string> Args(*argv, *argv + *argc); 651 assert(!Args.empty()); 652 ProgName = new std::string(Args[0]); 653 if (Argv0 != *ProgName) { 654 Printf("ERROR: argv[0] has been modified in LLVMFuzzerInitialize\n"); 655 exit(1); 656 } 657 ParseFlags(Args, EF); 658 if (Flags.help) { 659 PrintHelp(); 660 return 0; 661 } 662 663 if (Flags.close_fd_mask & 2) 664 DupAndCloseStderr(); 665 if (Flags.close_fd_mask & 1) 666 CloseStdout(); 667 668 if (Flags.jobs > 0 && Flags.workers == 0) { 669 Flags.workers = std::min(NumberOfCpuCores() / 2, Flags.jobs); 670 if (Flags.workers > 1) 671 Printf("Running %u workers\n", Flags.workers); 672 } 673 674 if (Flags.workers > 0 && Flags.jobs > 0) 675 return RunInMultipleProcesses(Args, Flags.workers, Flags.jobs); 676 677 FuzzingOptions Options; 678 Options.Verbosity = Flags.verbosity; 679 Options.MaxLen = Flags.max_len; 680 Options.LenControl = Flags.len_control; 681 Options.KeepSeed = Flags.keep_seed; 682 Options.UnitTimeoutSec = Flags.timeout; 683 Options.ErrorExitCode = Flags.error_exitcode; 684 Options.TimeoutExitCode = Flags.timeout_exitcode; 685 Options.IgnoreTimeouts = Flags.ignore_timeouts; 686 Options.IgnoreOOMs = Flags.ignore_ooms; 687 Options.IgnoreCrashes = Flags.ignore_crashes; 688 Options.MaxTotalTimeSec = Flags.max_total_time; 689 Options.DoCrossOver = Flags.cross_over; 690 Options.CrossOverUniformDist = Flags.cross_over_uniform_dist; 691 Options.MutateDepth = Flags.mutate_depth; 692 Options.ReduceDepth = Flags.reduce_depth; 693 Options.UseCounters = Flags.use_counters; 694 Options.UseMemmem = Flags.use_memmem; 695 Options.UseCmp = Flags.use_cmp; 696 Options.UseValueProfile = Flags.use_value_profile; 697 Options.Shrink = Flags.shrink; 698 Options.ReduceInputs = Flags.reduce_inputs; 699 Options.ShuffleAtStartUp = Flags.shuffle; 700 Options.PreferSmall = 
Flags.prefer_small; 701 Options.ReloadIntervalSec = Flags.reload; 702 Options.OnlyASCII = Flags.only_ascii; 703 Options.DetectLeaks = Flags.detect_leaks; 704 Options.PurgeAllocatorIntervalSec = Flags.purge_allocator_interval; 705 Options.TraceMalloc = Flags.trace_malloc; 706 Options.RssLimitMb = Flags.rss_limit_mb; 707 Options.MallocLimitMb = Flags.malloc_limit_mb; 708 if (!Options.MallocLimitMb) 709 Options.MallocLimitMb = Options.RssLimitMb; 710 if (Flags.runs >= 0) 711 Options.MaxNumberOfRuns = Flags.runs; 712 if (!Inputs->empty() && !Flags.minimize_crash_internal_step) { 713 // Ensure output corpus assumed to be the first arbitrary argument input 714 // is not a path to an existing file. 715 std::string OutputCorpusDir = (*Inputs)[0]; 716 if (!IsFile(OutputCorpusDir)) { 717 Options.OutputCorpus = OutputCorpusDir; 718 ValidateDirectoryExists(Options.OutputCorpus, Flags.create_missing_dirs); 719 } 720 } 721 Options.ReportSlowUnits = Flags.report_slow_units; 722 if (Flags.artifact_prefix) { 723 Options.ArtifactPrefix = Flags.artifact_prefix; 724 725 // Since the prefix could be a full path to a file name prefix, assume 726 // that if the path ends with the platform's separator that a directory 727 // is desired 728 std::string ArtifactPathDir = Options.ArtifactPrefix; 729 if (!IsSeparator(ArtifactPathDir[ArtifactPathDir.length() - 1])) { 730 ArtifactPathDir = DirName(ArtifactPathDir); 731 } 732 ValidateDirectoryExists(ArtifactPathDir, Flags.create_missing_dirs); 733 } 734 if (Flags.exact_artifact_path) { 735 Options.ExactArtifactPath = Flags.exact_artifact_path; 736 ValidateDirectoryExists(DirName(Options.ExactArtifactPath), 737 Flags.create_missing_dirs); 738 } 739 std::vector<Unit> Dictionary; 740 if (Flags.dict) 741 if (!ParseDictionaryFile(FileToString(Flags.dict), &Dictionary)) 742 return 1; 743 if (Flags.verbosity > 0 && !Dictionary.empty()) 744 Printf("Dictionary: %zd entries\n", Dictionary.size()); 745 bool RunIndividualFiles = AllInputsAreFiles(); 746 
Options.SaveArtifacts = 747 !RunIndividualFiles || Flags.minimize_crash_internal_step; 748 Options.PrintNewCovPcs = Flags.print_pcs; 749 Options.PrintNewCovFuncs = Flags.print_funcs; 750 Options.PrintFinalStats = Flags.print_final_stats; 751 Options.PrintCorpusStats = Flags.print_corpus_stats; 752 Options.PrintCoverage = Flags.print_coverage; 753 Options.PrintFullCoverage = Flags.print_full_coverage; 754 if (Flags.exit_on_src_pos) 755 Options.ExitOnSrcPos = Flags.exit_on_src_pos; 756 if (Flags.exit_on_item) 757 Options.ExitOnItem = Flags.exit_on_item; 758 if (Flags.focus_function) 759 Options.FocusFunction = Flags.focus_function; 760 if (Flags.data_flow_trace) 761 Options.DataFlowTrace = Flags.data_flow_trace; 762 if (Flags.features_dir) { 763 Options.FeaturesDir = Flags.features_dir; 764 ValidateDirectoryExists(Options.FeaturesDir, Flags.create_missing_dirs); 765 } 766 if (Flags.mutation_graph_file) 767 Options.MutationGraphFile = Flags.mutation_graph_file; 768 if (Flags.collect_data_flow) 769 Options.CollectDataFlow = Flags.collect_data_flow; 770 if (Flags.stop_file) 771 Options.StopFile = Flags.stop_file; 772 Options.Entropic = Flags.entropic; 773 Options.EntropicFeatureFrequencyThreshold = 774 (size_t)Flags.entropic_feature_frequency_threshold; 775 Options.EntropicNumberOfRarestFeatures = 776 (size_t)Flags.entropic_number_of_rarest_features; 777 Options.EntropicScalePerExecTime = Flags.entropic_scale_per_exec_time; 778 if (!Options.FocusFunction.empty()) 779 Options.Entropic = false; // FocusFunction overrides entropic scheduling. 
780 if (Options.Entropic) 781 Printf("INFO: Running with entropic power schedule (0x%zX, %zu).\n", 782 Options.EntropicFeatureFrequencyThreshold, 783 Options.EntropicNumberOfRarestFeatures); 784 struct EntropicOptions Entropic; 785 Entropic.Enabled = Options.Entropic; 786 Entropic.FeatureFrequencyThreshold = 787 Options.EntropicFeatureFrequencyThreshold; 788 Entropic.NumberOfRarestFeatures = Options.EntropicNumberOfRarestFeatures; 789 Entropic.ScalePerExecTime = Options.EntropicScalePerExecTime; 790 791 unsigned Seed = Flags.seed; 792 // Initialize Seed. 793 if (Seed == 0) 794 Seed = static_cast<unsigned>( 795 std::chrono::system_clock::now().time_since_epoch().count() + GetPid()); 796 if (Flags.verbosity) 797 Printf("INFO: Seed: %u\n", Seed); 798 799 if (Flags.collect_data_flow && Flags.data_flow_trace && !Flags.fork && 800 !(Flags.merge || Flags.set_cover_merge)) { 801 if (RunIndividualFiles) 802 return CollectDataFlow(Flags.collect_data_flow, Flags.data_flow_trace, 803 ReadCorpora({}, *Inputs)); 804 else 805 return CollectDataFlow(Flags.collect_data_flow, Flags.data_flow_trace, 806 ReadCorpora(*Inputs, {})); 807 } 808 809 Random Rand(Seed); 810 auto *MD = new MutationDispatcher(Rand, Options); 811 auto *Corpus = new InputCorpus(Options.OutputCorpus, Entropic); 812 auto *F = new Fuzzer(Callback, *Corpus, *MD, Options); 813 814 for (auto &U: Dictionary) 815 if (U.size() <= Word::GetMaxSize()) 816 MD->AddWordToManualDictionary(Word(U.data(), U.size())); 817 818 // Threads are only supported by Chrome. Don't use them with emscripten 819 // for now. 
820 #if !LIBFUZZER_EMSCRIPTEN 821 StartRssThread(F, Flags.rss_limit_mb); 822 #endif // LIBFUZZER_EMSCRIPTEN 823 824 Options.HandleAbrt = Flags.handle_abrt; 825 Options.HandleAlrm = !Flags.minimize_crash; 826 Options.HandleBus = Flags.handle_bus; 827 Options.HandleFpe = Flags.handle_fpe; 828 Options.HandleIll = Flags.handle_ill; 829 Options.HandleInt = Flags.handle_int; 830 Options.HandleSegv = Flags.handle_segv; 831 Options.HandleTerm = Flags.handle_term; 832 Options.HandleXfsz = Flags.handle_xfsz; 833 Options.HandleUsr1 = Flags.handle_usr1; 834 Options.HandleUsr2 = Flags.handle_usr2; 835 Options.HandleWinExcept = Flags.handle_winexcept; 836 837 SetSignalHandler(Options); 838 839 std::atexit(Fuzzer::StaticExitCallback); 840 841 if (Flags.minimize_crash) 842 return MinimizeCrashInput(Args, Options); 843 844 if (Flags.minimize_crash_internal_step) 845 return MinimizeCrashInputInternalStep(F, Corpus); 846 847 if (Flags.cleanse_crash) 848 return CleanseCrashInput(Args, Options); 849 850 if (RunIndividualFiles) { 851 Options.SaveArtifacts = false; 852 int Runs = std::max(1, Flags.runs); 853 Printf("%s: Running %zd inputs %d time(s) each.\n", ProgName->c_str(), 854 Inputs->size(), Runs); 855 for (auto &Path : *Inputs) { 856 auto StartTime = system_clock::now(); 857 Printf("Running: %s\n", Path.c_str()); 858 for (int Iter = 0; Iter < Runs; Iter++) 859 RunOneTest(F, Path.c_str(), Options.MaxLen); 860 auto StopTime = system_clock::now(); 861 auto MS = duration_cast<milliseconds>(StopTime - StartTime).count(); 862 Printf("Executed %s in %ld ms\n", Path.c_str(), (long)MS); 863 } 864 Printf("***\n" 865 "*** NOTE: fuzzing was not performed, you have only\n" 866 "*** executed the target code on a fixed set of inputs.\n" 867 "***\n"); 868 F->PrintFinalStats(); 869 exit(0); 870 } 871 872 Options.ForkCorpusGroups = Flags.fork_corpus_groups; 873 if (Flags.fork) 874 FuzzWithFork(F->GetMD().GetRand(), Options, Args, *Inputs, Flags.fork); 875 876 if (Flags.merge || 
Flags.set_cover_merge) 877 Merge(F, Options, Args, *Inputs, Flags.merge_control_file); 878 879 if (Flags.merge_inner) { 880 const size_t kDefaultMaxMergeLen = 1 << 20; 881 if (Options.MaxLen == 0) 882 F->SetMaxInputLen(kDefaultMaxMergeLen); 883 assert(Flags.merge_control_file); 884 F->CrashResistantMergeInternalStep(Flags.merge_control_file, 885 !strncmp(Flags.merge_inner, "2", 1)); 886 exit(0); 887 } 888 889 if (Flags.analyze_dict) { 890 size_t MaxLen = INT_MAX; // Large max length. 891 UnitVector InitialCorpus; 892 for (auto &Inp : *Inputs) { 893 Printf("Loading corpus dir: %s\n", Inp.c_str()); 894 ReadDirToVectorOfUnits(Inp.c_str(), &InitialCorpus, nullptr, 895 MaxLen, /*ExitOnError=*/false); 896 } 897 898 if (Dictionary.empty() || Inputs->empty()) { 899 Printf("ERROR: can't analyze dict without dict and corpus provided\n"); 900 return 1; 901 } 902 if (AnalyzeDictionary(F, Dictionary, InitialCorpus)) { 903 Printf("Dictionary analysis failed\n"); 904 exit(1); 905 } 906 Printf("Dictionary analysis succeeded\n"); 907 exit(0); 908 } 909 910 auto CorporaFiles = ReadCorpora(*Inputs, ParseSeedInuts(Flags.seed_inputs)); 911 F->Loop(CorporaFiles); 912 913 if (Flags.verbosity) 914 Printf("Done %zd runs in %zd second(s)\n", F->getTotalNumberOfRuns(), 915 F->secondsSinceProcessStartUp()); 916 F->PrintFinalStats(); 917 918 exit(0); // Don't let F destroy itself. 919 } 920 921 extern "C" ATTRIBUTE_INTERFACE int 922 LLVMFuzzerRunDriver(int *argc, char ***argv, 923 int (*UserCb)(const uint8_t *Data, size_t Size)) { 924 return FuzzerDriver(argc, argv, UserCb); 925 } 926 927 // Storage for global ExternalFunctions object. 928 ExternalFunctions *EF = nullptr; 929 930 } // namespace fuzzer 931