//===- FuzzerDriver.cpp - FuzzerDriver function and flags -----------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
// FuzzerDriver and flag parsing.
//===----------------------------------------------------------------------===//

#include "FuzzerCommand.h"
#include "FuzzerCorpus.h"
#include "FuzzerFork.h"
#include "FuzzerIO.h"
#include "FuzzerInterface.h"
#include "FuzzerInternal.h"
#include "FuzzerMerge.h"
#include "FuzzerMutate.h"
#include "FuzzerPlatform.h"
#include "FuzzerRandom.h"
#include "FuzzerTracePC.h"
#include <algorithm>
#include <atomic>
#include <chrono>
#include <cstdlib>
#include <cstring>
#include <mutex>
#include <string>
#include <thread>
#include <fstream>

// This function should be present in the libFuzzer so that the client
// binary can test for its existence.
//
// The function body is intentionally empty: only the presence of the symbol
// matters. Two build variants are provided:
//  * MSVC: a linker "/include:" directive names the symbol explicitly. The
//    32-bit x86 variant spells the symbol with one extra leading underscore
//    (presumably the C name decoration on that target -- confirm against the
//    toolchain documentation).
//  * everything else: __attribute__((used)) is applied to the definition so
//    that it is emitted even though nothing in this file references it.
#if LIBFUZZER_MSVC
extern "C" void __libfuzzer_is_present() {}
#if defined(_M_IX86) || defined(__i386__)
#pragma comment(linker, "/include:___libfuzzer_is_present")
#else
#pragma comment(linker, "/include:__libfuzzer_is_present")
#endif
#else
extern "C" __attribute__((used)) void __libfuzzer_is_present() {}
#endif  // LIBFUZZER_MSVC

namespace fuzzer {

// Program arguments.
48 struct FlagDescription { 49 const char *Name; 50 const char *Description; 51 int Default; 52 int *IntFlag; 53 const char **StrFlag; 54 unsigned int *UIntFlag; 55 }; 56 57 struct { 58 #define FUZZER_DEPRECATED_FLAG(Name) 59 #define FUZZER_FLAG_INT(Name, Default, Description) int Name; 60 #define FUZZER_FLAG_UNSIGNED(Name, Default, Description) unsigned int Name; 61 #define FUZZER_FLAG_STRING(Name, Description) const char *Name; 62 #include "FuzzerFlags.def" 63 #undef FUZZER_DEPRECATED_FLAG 64 #undef FUZZER_FLAG_INT 65 #undef FUZZER_FLAG_UNSIGNED 66 #undef FUZZER_FLAG_STRING 67 } Flags; 68 69 static const FlagDescription FlagDescriptions [] { 70 #define FUZZER_DEPRECATED_FLAG(Name) \ 71 {#Name, "Deprecated; don't use", 0, nullptr, nullptr, nullptr}, 72 #define FUZZER_FLAG_INT(Name, Default, Description) \ 73 {#Name, Description, Default, &Flags.Name, nullptr, nullptr}, 74 #define FUZZER_FLAG_UNSIGNED(Name, Default, Description) \ 75 {#Name, Description, static_cast<int>(Default), \ 76 nullptr, nullptr, &Flags.Name}, 77 #define FUZZER_FLAG_STRING(Name, Description) \ 78 {#Name, Description, 0, nullptr, &Flags.Name, nullptr}, 79 #include "FuzzerFlags.def" 80 #undef FUZZER_DEPRECATED_FLAG 81 #undef FUZZER_FLAG_INT 82 #undef FUZZER_FLAG_UNSIGNED 83 #undef FUZZER_FLAG_STRING 84 }; 85 86 static const size_t kNumFlags = 87 sizeof(FlagDescriptions) / sizeof(FlagDescriptions[0]); 88 89 static std::vector<std::string> *Inputs; 90 static std::string *ProgName; 91 92 static void PrintHelp() { 93 Printf("Usage:\n"); 94 auto Prog = ProgName->c_str(); 95 Printf("\nTo run fuzzing pass 0 or more directories.\n"); 96 Printf("%s [-flag1=val1 [-flag2=val2 ...] ] [dir1 [dir2 ...] ]\n", Prog); 97 98 Printf("\nTo run individual tests without fuzzing pass 1 or more files:\n"); 99 Printf("%s [-flag1=val1 [-flag2=val2 ...] 
] file1 [file2 ...]\n", Prog); 100 101 Printf("\nFlags: (strictly in form -flag=value)\n"); 102 size_t MaxFlagLen = 0; 103 for (size_t F = 0; F < kNumFlags; F++) 104 MaxFlagLen = std::max(strlen(FlagDescriptions[F].Name), MaxFlagLen); 105 106 for (size_t F = 0; F < kNumFlags; F++) { 107 const auto &D = FlagDescriptions[F]; 108 if (strstr(D.Description, "internal flag") == D.Description) continue; 109 Printf(" %s", D.Name); 110 for (size_t i = 0, n = MaxFlagLen - strlen(D.Name); i < n; i++) 111 Printf(" "); 112 Printf("\t"); 113 Printf("%d\t%s\n", D.Default, D.Description); 114 } 115 Printf("\nFlags starting with '--' will be ignored and " 116 "will be passed verbatim to subprocesses.\n"); 117 } 118 119 static const char *FlagValue(const char *Param, const char *Name) { 120 size_t Len = strlen(Name); 121 if (Param[0] == '-' && strstr(Param + 1, Name) == Param + 1 && 122 Param[Len + 1] == '=') 123 return &Param[Len + 2]; 124 return nullptr; 125 } 126 127 // Avoid calling stol as it triggers a bug in clang/glibc build. 
128 static long MyStol(const char *Str) { 129 long Res = 0; 130 long Sign = 1; 131 if (*Str == '-') { 132 Str++; 133 Sign = -1; 134 } 135 for (size_t i = 0; Str[i]; i++) { 136 char Ch = Str[i]; 137 if (Ch < '0' || Ch > '9') 138 return Res; 139 Res = Res * 10 + (Ch - '0'); 140 } 141 return Res * Sign; 142 } 143 144 static bool ParseOneFlag(const char *Param) { 145 if (Param[0] != '-') return false; 146 if (Param[1] == '-') { 147 static bool PrintedWarning = false; 148 if (!PrintedWarning) { 149 PrintedWarning = true; 150 Printf("INFO: libFuzzer ignores flags that start with '--'\n"); 151 } 152 for (size_t F = 0; F < kNumFlags; F++) 153 if (FlagValue(Param + 1, FlagDescriptions[F].Name)) 154 Printf("WARNING: did you mean '%s' (single dash)?\n", Param + 1); 155 return true; 156 } 157 for (size_t F = 0; F < kNumFlags; F++) { 158 const char *Name = FlagDescriptions[F].Name; 159 const char *Str = FlagValue(Param, Name); 160 if (Str) { 161 if (FlagDescriptions[F].IntFlag) { 162 auto Val = MyStol(Str); 163 *FlagDescriptions[F].IntFlag = static_cast<int>(Val); 164 if (Flags.verbosity >= 2) 165 Printf("Flag: %s %d\n", Name, Val); 166 return true; 167 } else if (FlagDescriptions[F].UIntFlag) { 168 auto Val = std::stoul(Str); 169 *FlagDescriptions[F].UIntFlag = static_cast<unsigned int>(Val); 170 if (Flags.verbosity >= 2) 171 Printf("Flag: %s %u\n", Name, Val); 172 return true; 173 } else if (FlagDescriptions[F].StrFlag) { 174 *FlagDescriptions[F].StrFlag = Str; 175 if (Flags.verbosity >= 2) 176 Printf("Flag: %s %s\n", Name, Str); 177 return true; 178 } else { // Deprecated flag. 179 Printf("Flag: %s: deprecated, don't use\n", Name); 180 return true; 181 } 182 } 183 } 184 Printf("\n\nWARNING: unrecognized flag '%s'; " 185 "use -help=1 to list all flags\n\n", Param); 186 return true; 187 } 188 189 // We don't use any library to minimize dependencies. 
190 static void ParseFlags(const std::vector<std::string> &Args, 191 const ExternalFunctions *EF) { 192 for (size_t F = 0; F < kNumFlags; F++) { 193 if (FlagDescriptions[F].IntFlag) 194 *FlagDescriptions[F].IntFlag = FlagDescriptions[F].Default; 195 if (FlagDescriptions[F].UIntFlag) 196 *FlagDescriptions[F].UIntFlag = 197 static_cast<unsigned int>(FlagDescriptions[F].Default); 198 if (FlagDescriptions[F].StrFlag) 199 *FlagDescriptions[F].StrFlag = nullptr; 200 } 201 202 // Disable len_control by default, if LLVMFuzzerCustomMutator is used. 203 if (EF->LLVMFuzzerCustomMutator) { 204 Flags.len_control = 0; 205 Printf("INFO: found LLVMFuzzerCustomMutator (%p). " 206 "Disabling -len_control by default.\n", EF->LLVMFuzzerCustomMutator); 207 } 208 209 Inputs = new std::vector<std::string>; 210 for (size_t A = 1; A < Args.size(); A++) { 211 if (ParseOneFlag(Args[A].c_str())) { 212 if (Flags.ignore_remaining_args) 213 break; 214 continue; 215 } 216 Inputs->push_back(Args[A]); 217 } 218 } 219 220 static std::mutex Mu; 221 222 static void PulseThread() { 223 while (true) { 224 SleepSeconds(600); 225 std::lock_guard<std::mutex> Lock(Mu); 226 Printf("pulse...\n"); 227 } 228 } 229 230 static void WorkerThread(const Command &BaseCmd, std::atomic<unsigned> *Counter, 231 unsigned NumJobs, std::atomic<bool> *HasErrors) { 232 while (true) { 233 unsigned C = (*Counter)++; 234 if (C >= NumJobs) break; 235 std::string Log = "fuzz-" + std::to_string(C) + ".log"; 236 Command Cmd(BaseCmd); 237 Cmd.setOutputFile(Log); 238 Cmd.combineOutAndErr(); 239 if (Flags.verbosity) { 240 std::string CommandLine = Cmd.toString(); 241 Printf("%s\n", CommandLine.c_str()); 242 } 243 int ExitCode = ExecuteCommand(Cmd); 244 if (ExitCode != 0) 245 *HasErrors = true; 246 std::lock_guard<std::mutex> Lock(Mu); 247 Printf("================== Job %u exited with exit code %d ============\n", 248 C, ExitCode); 249 fuzzer::CopyFileToErr(Log); 250 } 251 } 252 253 static void ValidateDirectoryExists(const std::string 
&Path, 254 bool CreateDirectory) { 255 if (Path.empty()) { 256 Printf("ERROR: Provided directory path is an empty string\n"); 257 exit(1); 258 } 259 260 if (IsDirectory(Path)) 261 return; 262 263 if (CreateDirectory) { 264 if (!MkDirRecursive(Path)) { 265 Printf("ERROR: Failed to create directory \"%s\"\n", Path.c_str()); 266 exit(1); 267 } 268 return; 269 } 270 271 Printf("ERROR: The required directory \"%s\" does not exist\n", Path.c_str()); 272 exit(1); 273 } 274 275 std::string CloneArgsWithoutX(const std::vector<std::string> &Args, 276 const char *X1, const char *X2) { 277 std::string Cmd; 278 for (auto &S : Args) { 279 if (FlagValue(S.c_str(), X1) || FlagValue(S.c_str(), X2)) 280 continue; 281 Cmd += S + " "; 282 } 283 return Cmd; 284 } 285 286 static int RunInMultipleProcesses(const std::vector<std::string> &Args, 287 unsigned NumWorkers, unsigned NumJobs) { 288 std::atomic<unsigned> Counter(0); 289 std::atomic<bool> HasErrors(false); 290 Command Cmd(Args); 291 Cmd.removeFlag("jobs"); 292 Cmd.removeFlag("workers"); 293 std::vector<std::thread> V; 294 std::thread Pulse(PulseThread); 295 Pulse.detach(); 296 for (unsigned i = 0; i < NumWorkers; i++) 297 V.push_back(std::thread(WorkerThread, std::ref(Cmd), &Counter, NumJobs, 298 &HasErrors)); 299 for (auto &T : V) 300 T.join(); 301 return HasErrors ? 
1 : 0; 302 } 303 304 static void RssThread(Fuzzer *F, size_t RssLimitMb) { 305 while (true) { 306 SleepSeconds(1); 307 size_t Peak = GetPeakRSSMb(); 308 if (Peak > RssLimitMb) 309 F->RssLimitCallback(); 310 } 311 } 312 313 static void StartRssThread(Fuzzer *F, size_t RssLimitMb) { 314 if (!RssLimitMb) 315 return; 316 std::thread T(RssThread, F, RssLimitMb); 317 T.detach(); 318 } 319 320 int RunOneTest(Fuzzer *F, const char *InputFilePath, size_t MaxLen) { 321 Unit U = FileToVector(InputFilePath); 322 if (MaxLen && MaxLen < U.size()) 323 U.resize(MaxLen); 324 F->ExecuteCallback(U.data(), U.size()); 325 if (Flags.print_full_coverage) { 326 // Leak detection is not needed when collecting full coverage data. 327 F->TPCUpdateObservedPCs(); 328 } else { 329 F->TryDetectingAMemoryLeak(U.data(), U.size(), true); 330 } 331 return 0; 332 } 333 334 static bool AllInputsAreFiles() { 335 if (Inputs->empty()) return false; 336 for (auto &Path : *Inputs) 337 if (!IsFile(Path)) 338 return false; 339 return true; 340 } 341 342 static std::string GetDedupTokenFromCmdOutput(const std::string &S) { 343 auto Beg = S.find("DEDUP_TOKEN:"); 344 if (Beg == std::string::npos) 345 return ""; 346 auto End = S.find('\n', Beg); 347 if (End == std::string::npos) 348 return ""; 349 return S.substr(Beg, End - Beg); 350 } 351 352 int CleanseCrashInput(const std::vector<std::string> &Args, 353 const FuzzingOptions &Options) { 354 if (Inputs->size() != 1 || !Flags.exact_artifact_path) { 355 Printf("ERROR: -cleanse_crash should be given one input file and" 356 " -exact_artifact_path\n"); 357 exit(1); 358 } 359 std::string InputFilePath = Inputs->at(0); 360 std::string OutputFilePath = Flags.exact_artifact_path; 361 Command Cmd(Args); 362 Cmd.removeFlag("cleanse_crash"); 363 364 assert(Cmd.hasArgument(InputFilePath)); 365 Cmd.removeArgument(InputFilePath); 366 367 auto TmpFilePath = TempPath("CleanseCrashInput", ".repro"); 368 Cmd.addArgument(TmpFilePath); 369 Cmd.setOutputFile(getDevNull()); 370 
Cmd.combineOutAndErr(); 371 372 std::string CurrentFilePath = InputFilePath; 373 auto U = FileToVector(CurrentFilePath); 374 size_t Size = U.size(); 375 376 const std::vector<uint8_t> ReplacementBytes = {' ', 0xff}; 377 for (int NumAttempts = 0; NumAttempts < 5; NumAttempts++) { 378 bool Changed = false; 379 for (size_t Idx = 0; Idx < Size; Idx++) { 380 Printf("CLEANSE[%d]: Trying to replace byte %zd of %zd\n", NumAttempts, 381 Idx, Size); 382 uint8_t OriginalByte = U[Idx]; 383 if (ReplacementBytes.end() != std::find(ReplacementBytes.begin(), 384 ReplacementBytes.end(), 385 OriginalByte)) 386 continue; 387 for (auto NewByte : ReplacementBytes) { 388 U[Idx] = NewByte; 389 WriteToFile(U, TmpFilePath); 390 auto ExitCode = ExecuteCommand(Cmd); 391 RemoveFile(TmpFilePath); 392 if (!ExitCode) { 393 U[Idx] = OriginalByte; 394 } else { 395 Changed = true; 396 Printf("CLEANSE: Replaced byte %zd with 0x%x\n", Idx, NewByte); 397 WriteToFile(U, OutputFilePath); 398 break; 399 } 400 } 401 } 402 if (!Changed) break; 403 } 404 return 0; 405 } 406 407 int MinimizeCrashInput(const std::vector<std::string> &Args, 408 const FuzzingOptions &Options) { 409 if (Inputs->size() != 1) { 410 Printf("ERROR: -minimize_crash should be given one input file\n"); 411 exit(1); 412 } 413 std::string InputFilePath = Inputs->at(0); 414 Command BaseCmd(Args); 415 BaseCmd.removeFlag("minimize_crash"); 416 BaseCmd.removeFlag("exact_artifact_path"); 417 assert(BaseCmd.hasArgument(InputFilePath)); 418 BaseCmd.removeArgument(InputFilePath); 419 if (Flags.runs <= 0 && Flags.max_total_time == 0) { 420 Printf("INFO: you need to specify -runs=N or " 421 "-max_total_time=N with -minimize_crash=1\n" 422 "INFO: defaulting to -max_total_time=600\n"); 423 BaseCmd.addFlag("max_total_time", "600"); 424 } 425 426 BaseCmd.combineOutAndErr(); 427 428 std::string CurrentFilePath = InputFilePath; 429 while (true) { 430 Unit U = FileToVector(CurrentFilePath); 431 Printf("CRASH_MIN: minimizing crash input: '%s' (%zd 
bytes)\n", 432 CurrentFilePath.c_str(), U.size()); 433 434 Command Cmd(BaseCmd); 435 Cmd.addArgument(CurrentFilePath); 436 437 Printf("CRASH_MIN: executing: %s\n", Cmd.toString().c_str()); 438 std::string CmdOutput; 439 bool Success = ExecuteCommand(Cmd, &CmdOutput); 440 if (Success) { 441 Printf("ERROR: the input %s did not crash\n", CurrentFilePath.c_str()); 442 exit(1); 443 } 444 Printf("CRASH_MIN: '%s' (%zd bytes) caused a crash. Will try to minimize " 445 "it further\n", 446 CurrentFilePath.c_str(), U.size()); 447 auto DedupToken1 = GetDedupTokenFromCmdOutput(CmdOutput); 448 if (!DedupToken1.empty()) 449 Printf("CRASH_MIN: DedupToken1: %s\n", DedupToken1.c_str()); 450 451 std::string ArtifactPath = 452 Flags.exact_artifact_path 453 ? Flags.exact_artifact_path 454 : Options.ArtifactPrefix + "minimized-from-" + Hash(U); 455 Cmd.addFlag("minimize_crash_internal_step", "1"); 456 Cmd.addFlag("exact_artifact_path", ArtifactPath); 457 Printf("CRASH_MIN: executing: %s\n", Cmd.toString().c_str()); 458 CmdOutput.clear(); 459 Success = ExecuteCommand(Cmd, &CmdOutput); 460 Printf("%s", CmdOutput.c_str()); 461 if (Success) { 462 if (Flags.exact_artifact_path) { 463 CurrentFilePath = Flags.exact_artifact_path; 464 WriteToFile(U, CurrentFilePath); 465 } 466 Printf("CRASH_MIN: failed to minimize beyond %s (%d bytes), exiting\n", 467 CurrentFilePath.c_str(), U.size()); 468 break; 469 } 470 auto DedupToken2 = GetDedupTokenFromCmdOutput(CmdOutput); 471 if (!DedupToken2.empty()) 472 Printf("CRASH_MIN: DedupToken2: %s\n", DedupToken2.c_str()); 473 474 if (DedupToken1 != DedupToken2) { 475 if (Flags.exact_artifact_path) { 476 CurrentFilePath = Flags.exact_artifact_path; 477 WriteToFile(U, CurrentFilePath); 478 } 479 Printf("CRASH_MIN: mismatch in dedup tokens" 480 " (looks like a different bug). 
Won't minimize further\n"); 481 break; 482 } 483 484 CurrentFilePath = ArtifactPath; 485 Printf("*********************************\n"); 486 } 487 return 0; 488 } 489 490 int MinimizeCrashInputInternalStep(Fuzzer *F, InputCorpus *Corpus) { 491 assert(Inputs->size() == 1); 492 std::string InputFilePath = Inputs->at(0); 493 Unit U = FileToVector(InputFilePath); 494 Printf("INFO: Starting MinimizeCrashInputInternalStep: %zd\n", U.size()); 495 if (U.size() < 2) { 496 Printf("INFO: The input is small enough, exiting\n"); 497 exit(0); 498 } 499 F->SetMaxInputLen(U.size()); 500 F->SetMaxMutationLen(U.size() - 1); 501 F->MinimizeCrashLoop(U); 502 Printf("INFO: Done MinimizeCrashInputInternalStep, no crashes found\n"); 503 exit(0); 504 return 0; 505 } 506 507 void Merge(Fuzzer *F, FuzzingOptions &Options, 508 const std::vector<std::string> &Args, 509 const std::vector<std::string> &Corpora, const char *CFPathOrNull) { 510 if (Corpora.size() < 2) { 511 Printf("INFO: Merge requires two or more corpus dirs\n"); 512 exit(0); 513 } 514 515 std::vector<SizedFile> OldCorpus, NewCorpus; 516 GetSizedFilesFromDir(Corpora[0], &OldCorpus); 517 for (size_t i = 1; i < Corpora.size(); i++) 518 GetSizedFilesFromDir(Corpora[i], &NewCorpus); 519 std::sort(OldCorpus.begin(), OldCorpus.end()); 520 std::sort(NewCorpus.begin(), NewCorpus.end()); 521 522 std::string CFPath = CFPathOrNull ? CFPathOrNull : TempPath("Merge", ".txt"); 523 std::vector<std::string> NewFiles; 524 std::set<uint32_t> NewFeatures, NewCov; 525 CrashResistantMerge(Args, OldCorpus, NewCorpus, &NewFiles, {}, &NewFeatures, 526 {}, &NewCov, CFPath, true, Flags.set_cover_merge); 527 for (auto &Path : NewFiles) 528 F->WriteToOutputCorpus(FileToVector(Path, Options.MaxLen)); 529 // We are done, delete the control file if it was a temporary one. 
530 if (!Flags.merge_control_file) 531 RemoveFile(CFPath); 532 533 exit(0); 534 } 535 536 int AnalyzeDictionary(Fuzzer *F, const std::vector<Unit> &Dict, 537 UnitVector &Corpus) { 538 Printf("Started dictionary minimization (up to %d tests)\n", 539 Dict.size() * Corpus.size() * 2); 540 541 // Scores and usage count for each dictionary unit. 542 std::vector<int> Scores(Dict.size()); 543 std::vector<int> Usages(Dict.size()); 544 545 std::vector<size_t> InitialFeatures; 546 std::vector<size_t> ModifiedFeatures; 547 for (auto &C : Corpus) { 548 // Get coverage for the testcase without modifications. 549 F->ExecuteCallback(C.data(), C.size()); 550 InitialFeatures.clear(); 551 TPC.CollectFeatures([&](size_t Feature) { 552 InitialFeatures.push_back(Feature); 553 }); 554 555 for (size_t i = 0; i < Dict.size(); ++i) { 556 std::vector<uint8_t> Data = C; 557 auto StartPos = std::search(Data.begin(), Data.end(), 558 Dict[i].begin(), Dict[i].end()); 559 // Skip dictionary unit, if the testcase does not contain it. 560 if (StartPos == Data.end()) 561 continue; 562 563 ++Usages[i]; 564 while (StartPos != Data.end()) { 565 // Replace all occurrences of dictionary unit in the testcase. 566 auto EndPos = StartPos + Dict[i].size(); 567 for (auto It = StartPos; It != EndPos; ++It) 568 *It ^= 0xFF; 569 570 StartPos = std::search(EndPos, Data.end(), 571 Dict[i].begin(), Dict[i].end()); 572 } 573 574 // Get coverage for testcase with masked occurrences of dictionary unit. 575 F->ExecuteCallback(Data.data(), Data.size()); 576 ModifiedFeatures.clear(); 577 TPC.CollectFeatures([&](size_t Feature) { 578 ModifiedFeatures.push_back(Feature); 579 }); 580 581 if (InitialFeatures == ModifiedFeatures) 582 --Scores[i]; 583 else 584 Scores[i] += 2; 585 } 586 } 587 588 Printf("###### Useless dictionary elements. ######\n"); 589 for (size_t i = 0; i < Dict.size(); ++i) { 590 // Dictionary units with positive score are treated as useful ones. 
591 if (Scores[i] > 0) 592 continue; 593 594 Printf("\""); 595 PrintASCII(Dict[i].data(), Dict[i].size(), "\""); 596 Printf(" # Score: %d, Used: %d\n", Scores[i], Usages[i]); 597 } 598 Printf("###### End of useless dictionary elements. ######\n"); 599 return 0; 600 } 601 602 std::vector<std::string> ParseSeedInuts(const char *seed_inputs) { 603 // Parse -seed_inputs=file1,file2,... or -seed_inputs=@seed_inputs_file 604 std::vector<std::string> Files; 605 if (!seed_inputs) return Files; 606 std::string SeedInputs; 607 if (Flags.seed_inputs[0] == '@') 608 SeedInputs = FileToString(Flags.seed_inputs + 1); // File contains list. 609 else 610 SeedInputs = Flags.seed_inputs; // seed_inputs contains the list. 611 if (SeedInputs.empty()) { 612 Printf("seed_inputs is empty or @file does not exist.\n"); 613 exit(1); 614 } 615 // Parse SeedInputs. 616 size_t comma_pos = 0; 617 while ((comma_pos = SeedInputs.find_last_of(',')) != std::string::npos) { 618 Files.push_back(SeedInputs.substr(comma_pos + 1)); 619 SeedInputs = SeedInputs.substr(0, comma_pos); 620 } 621 Files.push_back(SeedInputs); 622 return Files; 623 } 624 625 static std::vector<SizedFile> 626 ReadCorpora(const std::vector<std::string> &CorpusDirs, 627 const std::vector<std::string> &ExtraSeedFiles) { 628 std::vector<SizedFile> SizedFiles; 629 size_t LastNumFiles = 0; 630 for (auto &Dir : CorpusDirs) { 631 GetSizedFilesFromDir(Dir, &SizedFiles); 632 Printf("INFO: % 8zd files found in %s\n", SizedFiles.size() - LastNumFiles, 633 Dir.c_str()); 634 LastNumFiles = SizedFiles.size(); 635 } 636 for (auto &File : ExtraSeedFiles) 637 if (auto Size = FileSize(File)) 638 SizedFiles.push_back({File, Size}); 639 return SizedFiles; 640 } 641 642 int FuzzerDriver(int *argc, char ***argv, UserCallback Callback) { 643 using namespace fuzzer; 644 assert(argc && argv && "Argument pointers cannot be nullptr"); 645 std::string Argv0((*argv)[0]); 646 EF = new ExternalFunctions(); 647 if (EF->LLVMFuzzerInitialize) 648 
EF->LLVMFuzzerInitialize(argc, argv); 649 if (EF->__msan_scoped_disable_interceptor_checks) 650 EF->__msan_scoped_disable_interceptor_checks(); 651 const std::vector<std::string> Args(*argv, *argv + *argc); 652 assert(!Args.empty()); 653 ProgName = new std::string(Args[0]); 654 if (Argv0 != *ProgName) { 655 Printf("ERROR: argv[0] has been modified in LLVMFuzzerInitialize\n"); 656 exit(1); 657 } 658 ParseFlags(Args, EF); 659 if (Flags.help) { 660 PrintHelp(); 661 return 0; 662 } 663 664 if (Flags.close_fd_mask & 2) 665 DupAndCloseStderr(); 666 if (Flags.close_fd_mask & 1) 667 CloseStdout(); 668 669 if (Flags.jobs > 0 && Flags.workers == 0) { 670 Flags.workers = std::min(NumberOfCpuCores() / 2, Flags.jobs); 671 if (Flags.workers > 1) 672 Printf("Running %u workers\n", Flags.workers); 673 } 674 675 if (Flags.workers > 0 && Flags.jobs > 0) 676 return RunInMultipleProcesses(Args, Flags.workers, Flags.jobs); 677 678 FuzzingOptions Options; 679 Options.Verbosity = Flags.verbosity; 680 Options.MaxLen = Flags.max_len; 681 Options.LenControl = Flags.len_control; 682 Options.KeepSeed = Flags.keep_seed; 683 Options.UnitTimeoutSec = Flags.timeout; 684 Options.ErrorExitCode = Flags.error_exitcode; 685 Options.TimeoutExitCode = Flags.timeout_exitcode; 686 Options.IgnoreTimeouts = Flags.ignore_timeouts; 687 Options.IgnoreOOMs = Flags.ignore_ooms; 688 Options.IgnoreCrashes = Flags.ignore_crashes; 689 Options.MaxTotalTimeSec = Flags.max_total_time; 690 Options.DoCrossOver = Flags.cross_over; 691 Options.CrossOverUniformDist = Flags.cross_over_uniform_dist; 692 Options.MutateDepth = Flags.mutate_depth; 693 Options.ReduceDepth = Flags.reduce_depth; 694 Options.UseCounters = Flags.use_counters; 695 Options.UseMemmem = Flags.use_memmem; 696 Options.UseCmp = Flags.use_cmp; 697 Options.UseValueProfile = Flags.use_value_profile; 698 Options.Shrink = Flags.shrink; 699 Options.ReduceInputs = Flags.reduce_inputs; 700 Options.ShuffleAtStartUp = Flags.shuffle; 701 Options.PreferSmall = 
Flags.prefer_small; 702 Options.ReloadIntervalSec = Flags.reload; 703 Options.OnlyASCII = Flags.only_ascii; 704 Options.DetectLeaks = Flags.detect_leaks; 705 Options.PurgeAllocatorIntervalSec = Flags.purge_allocator_interval; 706 Options.TraceMalloc = Flags.trace_malloc; 707 Options.RssLimitMb = Flags.rss_limit_mb; 708 Options.MallocLimitMb = Flags.malloc_limit_mb; 709 if (!Options.MallocLimitMb) 710 Options.MallocLimitMb = Options.RssLimitMb; 711 if (Flags.runs >= 0) 712 Options.MaxNumberOfRuns = Flags.runs; 713 if (!Inputs->empty() && !Flags.minimize_crash_internal_step) { 714 // Ensure output corpus assumed to be the first arbitrary argument input 715 // is not a path to an existing file. 716 std::string OutputCorpusDir = (*Inputs)[0]; 717 if (!IsFile(OutputCorpusDir)) { 718 Options.OutputCorpus = OutputCorpusDir; 719 ValidateDirectoryExists(Options.OutputCorpus, Flags.create_missing_dirs); 720 } 721 } 722 Options.ReportSlowUnits = Flags.report_slow_units; 723 if (Flags.artifact_prefix) { 724 Options.ArtifactPrefix = Flags.artifact_prefix; 725 726 // Since the prefix could be a full path to a file name prefix, assume 727 // that if the path ends with the platform's separator that a directory 728 // is desired 729 std::string ArtifactPathDir = Options.ArtifactPrefix; 730 if (!IsSeparator(ArtifactPathDir[ArtifactPathDir.length() - 1])) { 731 ArtifactPathDir = DirName(ArtifactPathDir); 732 } 733 ValidateDirectoryExists(ArtifactPathDir, Flags.create_missing_dirs); 734 } 735 if (Flags.exact_artifact_path) { 736 Options.ExactArtifactPath = Flags.exact_artifact_path; 737 ValidateDirectoryExists(DirName(Options.ExactArtifactPath), 738 Flags.create_missing_dirs); 739 } 740 std::vector<Unit> Dictionary; 741 if (Flags.dict) 742 if (!ParseDictionaryFile(FileToString(Flags.dict), &Dictionary)) 743 return 1; 744 if (Flags.verbosity > 0 && !Dictionary.empty()) 745 Printf("Dictionary: %zd entries\n", Dictionary.size()); 746 bool RunIndividualFiles = AllInputsAreFiles(); 747 
Options.SaveArtifacts = 748 !RunIndividualFiles || Flags.minimize_crash_internal_step; 749 Options.PrintNewCovPcs = Flags.print_pcs; 750 Options.PrintNewCovFuncs = Flags.print_funcs; 751 Options.PrintFinalStats = Flags.print_final_stats; 752 Options.PrintCorpusStats = Flags.print_corpus_stats; 753 Options.PrintCoverage = Flags.print_coverage; 754 Options.PrintFullCoverage = Flags.print_full_coverage; 755 if (Flags.exit_on_src_pos) 756 Options.ExitOnSrcPos = Flags.exit_on_src_pos; 757 if (Flags.exit_on_item) 758 Options.ExitOnItem = Flags.exit_on_item; 759 if (Flags.focus_function) 760 Options.FocusFunction = Flags.focus_function; 761 if (Flags.data_flow_trace) 762 Options.DataFlowTrace = Flags.data_flow_trace; 763 if (Flags.features_dir) { 764 Options.FeaturesDir = Flags.features_dir; 765 ValidateDirectoryExists(Options.FeaturesDir, Flags.create_missing_dirs); 766 } 767 if (Flags.mutation_graph_file) 768 Options.MutationGraphFile = Flags.mutation_graph_file; 769 if (Flags.collect_data_flow) 770 Options.CollectDataFlow = Flags.collect_data_flow; 771 if (Flags.stop_file) 772 Options.StopFile = Flags.stop_file; 773 Options.Entropic = Flags.entropic; 774 Options.EntropicFeatureFrequencyThreshold = 775 (size_t)Flags.entropic_feature_frequency_threshold; 776 Options.EntropicNumberOfRarestFeatures = 777 (size_t)Flags.entropic_number_of_rarest_features; 778 Options.EntropicScalePerExecTime = Flags.entropic_scale_per_exec_time; 779 if (!Options.FocusFunction.empty()) 780 Options.Entropic = false; // FocusFunction overrides entropic scheduling. 
781 if (Options.Entropic) 782 Printf("INFO: Running with entropic power schedule (0x%X, %d).\n", 783 Options.EntropicFeatureFrequencyThreshold, 784 Options.EntropicNumberOfRarestFeatures); 785 struct EntropicOptions Entropic; 786 Entropic.Enabled = Options.Entropic; 787 Entropic.FeatureFrequencyThreshold = 788 Options.EntropicFeatureFrequencyThreshold; 789 Entropic.NumberOfRarestFeatures = Options.EntropicNumberOfRarestFeatures; 790 Entropic.ScalePerExecTime = Options.EntropicScalePerExecTime; 791 792 unsigned Seed = Flags.seed; 793 // Initialize Seed. 794 if (Seed == 0) 795 Seed = static_cast<unsigned>( 796 std::chrono::system_clock::now().time_since_epoch().count() + GetPid()); 797 if (Flags.verbosity) 798 Printf("INFO: Seed: %u\n", Seed); 799 800 if (Flags.collect_data_flow && !Flags.fork && 801 !(Flags.merge || Flags.set_cover_merge)) { 802 if (RunIndividualFiles) 803 return CollectDataFlow(Flags.collect_data_flow, Flags.data_flow_trace, 804 ReadCorpora({}, *Inputs)); 805 else 806 return CollectDataFlow(Flags.collect_data_flow, Flags.data_flow_trace, 807 ReadCorpora(*Inputs, {})); 808 } 809 810 Random Rand(Seed); 811 auto *MD = new MutationDispatcher(Rand, Options); 812 auto *Corpus = new InputCorpus(Options.OutputCorpus, Entropic); 813 auto *F = new Fuzzer(Callback, *Corpus, *MD, Options); 814 815 for (auto &U: Dictionary) 816 if (U.size() <= Word::GetMaxSize()) 817 MD->AddWordToManualDictionary(Word(U.data(), U.size())); 818 819 // Threads are only supported by Chrome. Don't use them with emscripten 820 // for now. 
821 #if !LIBFUZZER_EMSCRIPTEN 822 StartRssThread(F, Flags.rss_limit_mb); 823 #endif // LIBFUZZER_EMSCRIPTEN 824 825 Options.HandleAbrt = Flags.handle_abrt; 826 Options.HandleAlrm = !Flags.minimize_crash; 827 Options.HandleBus = Flags.handle_bus; 828 Options.HandleFpe = Flags.handle_fpe; 829 Options.HandleIll = Flags.handle_ill; 830 Options.HandleInt = Flags.handle_int; 831 Options.HandleSegv = Flags.handle_segv; 832 Options.HandleTerm = Flags.handle_term; 833 Options.HandleXfsz = Flags.handle_xfsz; 834 Options.HandleUsr1 = Flags.handle_usr1; 835 Options.HandleUsr2 = Flags.handle_usr2; 836 Options.HandleWinExcept = Flags.handle_winexcept; 837 838 SetSignalHandler(Options); 839 840 std::atexit(Fuzzer::StaticExitCallback); 841 842 if (Flags.minimize_crash) 843 return MinimizeCrashInput(Args, Options); 844 845 if (Flags.minimize_crash_internal_step) 846 return MinimizeCrashInputInternalStep(F, Corpus); 847 848 if (Flags.cleanse_crash) 849 return CleanseCrashInput(Args, Options); 850 851 if (RunIndividualFiles) { 852 Options.SaveArtifacts = false; 853 int Runs = std::max(1, Flags.runs); 854 Printf("%s: Running %zd inputs %d time(s) each.\n", ProgName->c_str(), 855 Inputs->size(), Runs); 856 for (auto &Path : *Inputs) { 857 auto StartTime = system_clock::now(); 858 Printf("Running: %s\n", Path.c_str()); 859 for (int Iter = 0; Iter < Runs; Iter++) 860 RunOneTest(F, Path.c_str(), Options.MaxLen); 861 auto StopTime = system_clock::now(); 862 auto MS = duration_cast<milliseconds>(StopTime - StartTime).count(); 863 Printf("Executed %s in %zd ms\n", Path.c_str(), (long)MS); 864 } 865 Printf("***\n" 866 "*** NOTE: fuzzing was not performed, you have only\n" 867 "*** executed the target code on a fixed set of inputs.\n" 868 "***\n"); 869 F->PrintFinalStats(); 870 exit(0); 871 } 872 873 Options.ForkCorpusGroups = Flags.fork_corpus_groups; 874 if (Flags.fork) 875 FuzzWithFork(F->GetMD().GetRand(), Options, Args, *Inputs, Flags.fork); 876 877 if (Flags.merge || 
Flags.set_cover_merge) 878 Merge(F, Options, Args, *Inputs, Flags.merge_control_file); 879 880 if (Flags.merge_inner) { 881 const size_t kDefaultMaxMergeLen = 1 << 20; 882 if (Options.MaxLen == 0) 883 F->SetMaxInputLen(kDefaultMaxMergeLen); 884 assert(Flags.merge_control_file); 885 F->CrashResistantMergeInternalStep(Flags.merge_control_file, 886 !strncmp(Flags.merge_inner, "2", 1)); 887 exit(0); 888 } 889 890 if (Flags.analyze_dict) { 891 size_t MaxLen = INT_MAX; // Large max length. 892 UnitVector InitialCorpus; 893 for (auto &Inp : *Inputs) { 894 Printf("Loading corpus dir: %s\n", Inp.c_str()); 895 ReadDirToVectorOfUnits(Inp.c_str(), &InitialCorpus, nullptr, 896 MaxLen, /*ExitOnError=*/false); 897 } 898 899 if (Dictionary.empty() || Inputs->empty()) { 900 Printf("ERROR: can't analyze dict without dict and corpus provided\n"); 901 return 1; 902 } 903 if (AnalyzeDictionary(F, Dictionary, InitialCorpus)) { 904 Printf("Dictionary analysis failed\n"); 905 exit(1); 906 } 907 Printf("Dictionary analysis succeeded\n"); 908 exit(0); 909 } 910 911 auto CorporaFiles = ReadCorpora(*Inputs, ParseSeedInuts(Flags.seed_inputs)); 912 F->Loop(CorporaFiles); 913 914 if (Flags.verbosity) 915 Printf("Done %zd runs in %zd second(s)\n", F->getTotalNumberOfRuns(), 916 F->secondsSinceProcessStartUp()); 917 F->PrintFinalStats(); 918 919 exit(0); // Don't let F destroy itself. 920 } 921 922 extern "C" ATTRIBUTE_INTERFACE int 923 LLVMFuzzerRunDriver(int *argc, char ***argv, 924 int (*UserCb)(const uint8_t *Data, size_t Size)) { 925 return FuzzerDriver(argc, argv, UserCb); 926 } 927 928 // Storage for global ExternalFunctions object. 929 ExternalFunctions *EF = nullptr; 930 931 } // namespace fuzzer 932