//===- opt.cpp - The LLVM Modular Optimizer -------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // Optimizations may be specified an arbitrary number of times on the command // line, They are run in the order specified. // //===----------------------------------------------------------------------===// #include "BreakpointPrinter.h" #include "NewPMDriver.h" #include "llvm/ADT/Triple.h" #include "llvm/Analysis/CallGraph.h" #include "llvm/Analysis/CallGraphSCCPass.h" #include "llvm/Analysis/LoopPass.h" #include "llvm/Analysis/RegionPass.h" #include "llvm/Analysis/TargetLibraryInfo.h" #include "llvm/Analysis/TargetTransformInfo.h" #include "llvm/AsmParser/Parser.h" #include "llvm/CodeGen/CommandFlags.h" #include "llvm/CodeGen/TargetPassConfig.h" #include "llvm/Config/llvm-config.h" #include "llvm/IR/DataLayout.h" #include "llvm/IR/DebugInfo.h" #include "llvm/IR/LLVMContext.h" #include "llvm/IR/LLVMRemarkStreamer.h" #include "llvm/IR/LegacyPassManager.h" #include "llvm/IR/LegacyPassNameParser.h" #include "llvm/IR/Module.h" #include "llvm/IR/ModuleSummaryIndex.h" #include "llvm/IR/Verifier.h" #include "llvm/IRReader/IRReader.h" #include "llvm/InitializePasses.h" #include "llvm/LinkAllIR.h" #include "llvm/LinkAllPasses.h" #include "llvm/MC/SubtargetFeature.h" #include "llvm/MC/TargetRegistry.h" #include "llvm/Passes/PassPlugin.h" #include "llvm/Remarks/HotnessThresholdParser.h" #include "llvm/Support/Debug.h" #include "llvm/Support/FileSystem.h" #include "llvm/Support/Host.h" #include "llvm/Support/InitLLVM.h" #include "llvm/Support/PluginLoader.h" #include "llvm/Support/SourceMgr.h" #include "llvm/Support/SystemUtils.h" #include "llvm/Support/TargetSelect.h" #include "llvm/Support/ToolOutputFile.h" #include "llvm/Support/YAMLTraits.h" #include "llvm/Target/TargetMachine.h" #include "llvm/Transforms/IPO/WholeProgramDevirt.h" #include "llvm/Transforms/Utils/Cloning.h" #include "llvm/Transforms/Utils/Debugify.h" #include #include #include using namespace llvm; using namespace opt_tool; static codegen::RegisterCodeGenFlags CFG; // The OptimizationList is automatically populated with registered Passes by the // PassNameParser. static cl::list PassList(cl::desc( "Optimizations available (use '-passes=' for the new pass manager)")); static cl::opt EnableNewPassManager( "enable-new-pm", cl::desc("Enable the new pass manager, translating " "'opt -foo' to 'opt -passes=foo'. This is strictly for the new PM " "migration, use '-passes=' when possible."), cl::init(true)); // This flag specifies a textual description of the optimization pass pipeline // to run over the module. This flag switches opt to use the new pass manager // infrastructure, completely disabling all of the flags specific to the old // pass management. static cl::opt PassPipeline( "passes", cl::desc( "A textual description of the pass pipeline. To have analysis passes " "available before a certain pass, add 'require'.")); static cl::alias PassPipeline2("p", cl::aliasopt(PassPipeline), cl::desc("Alias for -passes")); static cl::opt PrintPasses("print-passes", cl::desc("Print available passes that can be " "specified in -passes=foo and exit")); static cl::opt InputFilename(cl::Positional, cl::desc(""), cl::init("-"), cl::value_desc("filename")); static cl::opt OutputFilename("o", cl::desc("Override output filename"), cl::value_desc("filename")); static cl::opt Force("f", cl::desc("Enable binary output on terminals")); static cl::opt NoOutput("disable-output", cl::desc("Do not write result bitcode file"), cl::Hidden); static cl::opt OutputAssembly("S", cl::desc("Write output as LLVM assembly")); static cl::opt OutputThinLTOBC("thinlto-bc", cl::desc("Write output as ThinLTO-ready bitcode")); static cl::opt SplitLTOUnit("thinlto-split-lto-unit", cl::desc("Enable splitting of a ThinLTO LTOUnit")); static cl::opt ThinLinkBitcodeFile( "thin-link-bitcode-file", cl::value_desc("filename"), cl::desc( "A file in which to write minimized bitcode for the thin link only")); static cl::opt NoVerify("disable-verify", cl::desc("Do not run the verifier"), cl::Hidden); static cl::opt NoUpgradeDebugInfo("disable-upgrade-debug-info", cl::desc("Generate invalid output"), cl::ReallyHidden); static cl::opt VerifyEach("verify-each", cl::desc("Verify after each transform")); static cl::opt DisableDITypeMap("disable-debug-info-type-map", cl::desc("Don't use a uniquing type map for debug info")); static cl::opt StripDebug("strip-debug", cl::desc("Strip debugger symbol info from translation unit")); static cl::opt StripNamedMetadata("strip-named-metadata", cl::desc("Strip module-level named metadata")); static cl::opt OptLevelO0("O0", cl::desc("Optimization level 0. Similar to clang -O0. " "Use -passes='default' for the new PM")); static cl::opt OptLevelO1("O1", cl::desc("Optimization level 1. Similar to clang -O1. " "Use -passes='default' for the new PM")); static cl::opt OptLevelO2("O2", cl::desc("Optimization level 2. Similar to clang -O2. " "Use -passes='default' for the new PM")); static cl::opt OptLevelOs("Os", cl::desc("Like -O2 but size-conscious. Similar to clang " "-Os. Use -passes='default' for the new PM")); static cl::opt OptLevelOz( "Oz", cl::desc("Like -O2 but optimize for code size above all else. Similar to " "clang -Oz. Use -passes='default' for the new PM")); static cl::opt OptLevelO3("O3", cl::desc("Optimization level 3. Similar to clang -O3. " "Use -passes='default' for the new PM")); static cl::opt CodeGenOptLevel( "codegen-opt-level", cl::desc("Override optimization level for codegen hooks, legacy PM only")); static cl::opt TargetTriple("mtriple", cl::desc("Override target triple for module")); static cl::opt EmitSummaryIndex("module-summary", cl::desc("Emit module summary index"), cl::init(false)); static cl::opt EmitModuleHash("module-hash", cl::desc("Emit module hash"), cl::init(false)); static cl::opt DisableSimplifyLibCalls("disable-simplify-libcalls", cl::desc("Disable simplify-libcalls")); static cl::list DisableBuiltins( "disable-builtin", cl::desc("Disable specific target library builtin function")); static cl::opt EnableDebugify( "enable-debugify", cl::desc( "Start the pipeline with debugify and end it with check-debugify")); static cl::opt VerifyDebugInfoPreserve( "verify-debuginfo-preserve", cl::desc("Start the pipeline with collecting and end it with checking of " "debug info preservation.")); static cl::opt PrintBreakpoints("print-breakpoints-for-testing", cl::desc("Print select breakpoints location for testing")); static cl::opt ClDataLayout("data-layout", cl::desc("data layout string to use"), cl::value_desc("layout-string"), cl::init("")); static cl::opt PreserveBitcodeUseListOrder( "preserve-bc-uselistorder", cl::desc("Preserve use-list order when writing LLVM bitcode."), cl::init(true), cl::Hidden); static cl::opt PreserveAssemblyUseListOrder( "preserve-ll-uselistorder", cl::desc("Preserve use-list order when writing LLVM assembly."), cl::init(false), cl::Hidden); static cl::opt RunTwice("run-twice", cl::desc("Run all passes twice, re-using the " "same pass manager (legacy PM only)."), cl::init(false), cl::Hidden); static cl::opt DiscardValueNames( "discard-value-names", cl::desc("Discard names from Value (other than GlobalValue)."), cl::init(false), cl::Hidden); static cl::opt TimeTrace( "time-trace", cl::desc("Record time trace")); static cl::opt TimeTraceGranularity( "time-trace-granularity", cl::desc("Minimum time granularity (in microseconds) traced by time profiler"), cl::init(500), cl::Hidden); static cl::opt TimeTraceFile("time-trace-file", cl::desc("Specify time trace file destination"), cl::value_desc("filename")); static cl::opt RemarksWithHotness( "pass-remarks-with-hotness", cl::desc("With PGO, include profile count in optimization remarks"), cl::Hidden); static cl::opt, false, remarks::HotnessThresholdParser> RemarksHotnessThreshold( "pass-remarks-hotness-threshold", cl::desc("Minimum profile count required for " "an optimization remark to be output. " "Use 'auto' to apply the threshold from profile summary"), cl::value_desc("N or 'auto'"), cl::init(0), cl::Hidden); static cl::opt RemarksFilename("pass-remarks-output", cl::desc("Output filename for pass remarks"), cl::value_desc("filename")); static cl::opt RemarksPasses("pass-remarks-filter", cl::desc("Only record optimization remarks from passes whose " "names match the given regular expression"), cl::value_desc("regex")); static cl::opt RemarksFormat( "pass-remarks-format", cl::desc("The format used for serializing remarks (default: YAML)"), cl::value_desc("format"), cl::init("yaml")); static cl::list PassPlugins("load-pass-plugin", cl::desc("Load passes from plugin library")); static inline void addPass(legacy::PassManagerBase &PM, Pass *P) { // Add the pass to the pass manager... PM.add(P); // If we are verifying all of the intermediate steps, add the verifier... if (VerifyEach) PM.add(createVerifierPass()); } //===----------------------------------------------------------------------===// // CodeGen-related helper functions. // static CodeGenOpt::Level GetCodeGenOptLevel() { return static_cast(unsigned(CodeGenOptLevel)); } // Returns the TargetMachine instance or zero if no triple is provided. static TargetMachine* GetTargetMachine(Triple TheTriple, StringRef CPUStr, StringRef FeaturesStr, const TargetOptions &Options) { std::string Error; const Target *TheTarget = TargetRegistry::lookupTarget(codegen::getMArch(), TheTriple, Error); // Some modules don't specify a triple, and this is okay. if (!TheTarget) { return nullptr; } return TheTarget->createTargetMachine( TheTriple.getTriple(), codegen::getCPUStr(), codegen::getFeaturesStr(), Options, codegen::getExplicitRelocModel(), codegen::getExplicitCodeModel(), GetCodeGenOptLevel()); } struct TimeTracerRAII { TimeTracerRAII(StringRef ProgramName) { if (TimeTrace) timeTraceProfilerInitialize(TimeTraceGranularity, ProgramName); } ~TimeTracerRAII() { if (TimeTrace) { if (auto E = timeTraceProfilerWrite(TimeTraceFile, OutputFilename)) { handleAllErrors(std::move(E), [&](const StringError &SE) { errs() << SE.getMessage() << "\n"; }); return; } timeTraceProfilerCleanup(); } } }; // For use in NPM transition. Currently this contains most codegen-specific // passes. Remove passes from here when porting to the NPM. // TODO: use a codegen version of PassRegistry.def/PassBuilder::is*Pass() once // it exists. static bool shouldPinPassToLegacyPM(StringRef Pass) { std::vector PassNameExactToIgnore = { "nvvm-reflect", "nvvm-intr-range", "amdgpu-simplifylib", "amdgpu-usenative", "amdgpu-promote-alloca", "amdgpu-promote-alloca-to-vector", "amdgpu-lower-kernel-attributes", "amdgpu-propagate-attributes-early", "amdgpu-propagate-attributes-late", "amdgpu-unify-metadata", "amdgpu-printf-runtime-binding", "amdgpu-always-inline"}; if (llvm::is_contained(PassNameExactToIgnore, Pass)) return false; std::vector PassNamePrefix = { "x86-", "xcore-", "wasm-", "systemz-", "ppc-", "nvvm-", "nvptx-", "mips-", "lanai-", "hexagon-", "bpf-", "avr-", "thumb2-", "arm-", "si-", "gcn-", "amdgpu-", "aarch64-", "amdgcn-", "polly-", "riscv-", "dxil-"}; std::vector PassNameContain = {"ehprepare"}; std::vector PassNameExact = { "safe-stack", "cost-model", "codegenprepare", "interleaved-load-combine", "unreachableblockelim", "verify-safepoint-ir", "atomic-expand", "expandvp", "hardware-loops", "mve-tail-predication", "interleaved-access", "global-merge", "pre-isel-intrinsic-lowering", "expand-reductions", "indirectbr-expand", "generic-to-nvvm", "expandmemcmp", "loop-reduce", "lower-amx-type", "pre-amx-config", "lower-amx-intrinsics", "polyhedral-info", "print-polyhedral-info", "replace-with-veclib", "jmc-instrument", "dot-regions", "dot-regions-only", "view-regions", "view-regions-only", "select-optimize", "expand-large-div-rem", "structurizecfg", "fix-irreducible", "expand-large-fp-convert" }; for (const auto &P : PassNamePrefix) if (Pass.startswith(P)) return true; for (const auto &P : PassNameContain) if (Pass.contains(P)) return true; return llvm::is_contained(PassNameExact, Pass); } // For use in NPM transition. static bool shouldForceLegacyPM() { for (const auto &P : PassList) { StringRef Arg = P->getPassArgument(); if (shouldPinPassToLegacyPM(Arg)) return true; } return false; } //===----------------------------------------------------------------------===// // main for opt // int main(int argc, char **argv) { InitLLVM X(argc, argv); // Enable debug stream buffering. EnableDebugBuffering = true; InitializeAllTargets(); InitializeAllTargetMCs(); InitializeAllAsmPrinters(); InitializeAllAsmParsers(); // Initialize passes PassRegistry &Registry = *PassRegistry::getPassRegistry(); initializeCore(Registry); initializeScalarOpts(Registry); initializeVectorization(Registry); initializeIPO(Registry); initializeAnalysis(Registry); initializeTransformUtils(Registry); initializeInstCombine(Registry); initializeTarget(Registry); // For codegen passes, only passes that do IR to IR transformation are // supported. initializeExpandLargeDivRemLegacyPassPass(Registry); initializeExpandLargeFpConvertLegacyPassPass(Registry); initializeExpandMemCmpPassPass(Registry); initializeScalarizeMaskedMemIntrinLegacyPassPass(Registry); initializeSelectOptimizePass(Registry); initializeCodeGenPreparePass(Registry); initializeAtomicExpandPass(Registry); initializeRewriteSymbolsLegacyPassPass(Registry); initializeWinEHPreparePass(Registry); initializeDwarfEHPrepareLegacyPassPass(Registry); initializeSafeStackLegacyPassPass(Registry); initializeSjLjEHPreparePass(Registry); initializePreISelIntrinsicLoweringLegacyPassPass(Registry); initializeGlobalMergePass(Registry); initializeIndirectBrExpandPassPass(Registry); initializeInterleavedLoadCombinePass(Registry); initializeInterleavedAccessPass(Registry); initializeUnreachableBlockElimLegacyPassPass(Registry); initializeExpandReductionsPass(Registry); initializeExpandVectorPredicationPass(Registry); initializeWasmEHPreparePass(Registry); initializeWriteBitcodePassPass(Registry); initializeHardwareLoopsPass(Registry); initializeReplaceWithVeclibLegacyPass(Registry); initializeJMCInstrumenterPass(Registry); SmallVector PluginList; PassPlugins.setCallback([&](const std::string &PluginPath) { auto Plugin = PassPlugin::Load(PluginPath); if (!Plugin) { errs() << "Failed to load passes from '" << PluginPath << "'. Request ignored.\n"; return; } PluginList.emplace_back(Plugin.get()); }); // Register the Target and CPU printer for --version. cl::AddExtraVersionPrinter(sys::printDefaultTargetAndDetectedCPU); cl::ParseCommandLineOptions(argc, argv, "llvm .bc -> .bc modular optimizer and analysis printer\n"); LLVMContext Context; // If `-passes=` is specified, use NPM. // If `-enable-new-pm` is specified and there are no codegen passes, use NPM. // e.g. `-enable-new-pm -sroa` will use NPM. // but `-enable-new-pm -codegenprepare` will still revert to legacy PM. const bool UseNPM = (EnableNewPassManager && !shouldForceLegacyPM()) || PassPipeline.getNumOccurrences() > 0; if (UseNPM && !PassList.empty()) { errs() << "The `opt -passname` syntax for the new pass manager is " "not supported, please use `opt -passes=` (or the `-p` " "alias for a more concise version).\n"; errs() << "See https://llvm.org/docs/NewPassManager.html#invoking-opt " "for more details on the pass pipeline syntax.\n\n"; return 1; } if (!UseNPM && PluginList.size()) { errs() << argv[0] << ": " << PassPlugins.ArgStr << " specified with legacy PM.\n"; return 1; } // FIXME: once the legacy PM code is deleted, move runPassPipeline() here and // construct the PassBuilder before parsing IR so we can reuse the same // PassBuilder for print passes. if (PrintPasses) { printPasses(outs()); return 0; } TimeTracerRAII TimeTracer(argv[0]); SMDiagnostic Err; Context.setDiscardValueNames(DiscardValueNames); if (!DisableDITypeMap) Context.enableDebugTypeODRUniquing(); Expected> RemarksFileOrErr = setupLLVMOptimizationRemarks(Context, RemarksFilename, RemarksPasses, RemarksFormat, RemarksWithHotness, RemarksHotnessThreshold); if (Error E = RemarksFileOrErr.takeError()) { errs() << toString(std::move(E)) << '\n'; return 1; } std::unique_ptr RemarksFile = std::move(*RemarksFileOrErr); // Load the input module... auto SetDataLayout = [](StringRef, StringRef) -> std::optional { if (ClDataLayout.empty()) return std::nullopt; return ClDataLayout; }; std::unique_ptr M; if (NoUpgradeDebugInfo) M = parseAssemblyFileWithIndexNoUpgradeDebugInfo( InputFilename, Err, Context, nullptr, SetDataLayout) .Mod; else M = parseIRFile(InputFilename, Err, Context, ParserCallbacks(SetDataLayout)); if (!M) { Err.print(argv[0], errs()); return 1; } // Strip debug info before running the verifier. if (StripDebug) StripDebugInfo(*M); // Erase module-level named metadata, if requested. if (StripNamedMetadata) { while (!M->named_metadata_empty()) { NamedMDNode *NMD = &*M->named_metadata_begin(); M->eraseNamedMetadata(NMD); } } // If we are supposed to override the target triple or data layout, do so now. if (!TargetTriple.empty()) M->setTargetTriple(Triple::normalize(TargetTriple)); // Immediately run the verifier to catch any problems before starting up the // pass pipelines. Otherwise we can crash on broken code during // doInitialization(). if (!NoVerify && verifyModule(*M, &errs())) { errs() << argv[0] << ": " << InputFilename << ": error: input module is broken!\n"; return 1; } // Enable testing of whole program devirtualization on this module by invoking // the facility for updating public visibility to linkage unit visibility when // specified by an internal option. This is normally done during LTO which is // not performed via opt. updateVCallVisibilityInModule(*M, /* WholeProgramVisibilityEnabledInLTO */ false, /* DynamicExportSymbols */ {}); // Figure out what stream we are supposed to write to... std::unique_ptr Out; std::unique_ptr ThinLinkOut; if (NoOutput) { if (!OutputFilename.empty()) errs() << "WARNING: The -o (output filename) option is ignored when\n" "the --disable-output option is used.\n"; } else { // Default to standard output. if (OutputFilename.empty()) OutputFilename = "-"; std::error_code EC; sys::fs::OpenFlags Flags = OutputAssembly ? sys::fs::OF_TextWithCRLF : sys::fs::OF_None; Out.reset(new ToolOutputFile(OutputFilename, EC, Flags)); if (EC) { errs() << EC.message() << '\n'; return 1; } if (!ThinLinkBitcodeFile.empty()) { ThinLinkOut.reset( new ToolOutputFile(ThinLinkBitcodeFile, EC, sys::fs::OF_None)); if (EC) { errs() << EC.message() << '\n'; return 1; } } } Triple ModuleTriple(M->getTargetTriple()); std::string CPUStr, FeaturesStr; TargetMachine *Machine = nullptr; const TargetOptions Options = codegen::InitTargetOptionsFromCodeGenFlags(ModuleTriple); if (ModuleTriple.getArch()) { CPUStr = codegen::getCPUStr(); FeaturesStr = codegen::getFeaturesStr(); Machine = GetTargetMachine(ModuleTriple, CPUStr, FeaturesStr, Options); } else if (ModuleTriple.getArchName() != "unknown" && ModuleTriple.getArchName() != "") { errs() << argv[0] << ": unrecognized architecture '" << ModuleTriple.getArchName() << "' provided.\n"; return 1; } std::unique_ptr TM(Machine); // Override function attributes based on CPUStr, FeaturesStr, and command line // flags. codegen::setFunctionAttributes(CPUStr, FeaturesStr, *M); // If the output is set to be emitted to standard out, and standard out is a // console, print out a warning message and refuse to do it. We don't // impress anyone by spewing tons of binary goo to a terminal. if (!Force && !NoOutput && !OutputAssembly) if (CheckBitcodeOutputToConsole(Out->os())) NoOutput = true; if (OutputThinLTOBC) M->addModuleFlag(Module::Error, "EnableSplitLTOUnit", SplitLTOUnit); // Add an appropriate TargetLibraryInfo pass for the module's triple. TargetLibraryInfoImpl TLII(ModuleTriple); // The -disable-simplify-libcalls flag actually disables all builtin optzns. if (DisableSimplifyLibCalls) TLII.disableAllFunctions(); else { // Disable individual builtin functions in TargetLibraryInfo. LibFunc F; for (auto &FuncName : DisableBuiltins) if (TLII.getLibFunc(FuncName, F)) TLII.setUnavailable(F); else { errs() << argv[0] << ": cannot disable nonexistent builtin function " << FuncName << '\n'; return 1; } } if (UseNPM) { if (legacy::debugPassSpecified()) { errs() << "-debug-pass does not work with the new PM, either use " "-debug-pass-manager, or use the legacy PM (-enable-new-pm=0)\n"; return 1; } auto NumOLevel = OptLevelO0 + OptLevelO1 + OptLevelO2 + OptLevelO3 + OptLevelOs + OptLevelOz; if (NumOLevel > 1) { errs() << "Cannot specify multiple -O#\n"; return 1; } if (NumOLevel > 0 && (PassPipeline.getNumOccurrences() > 0)) { errs() << "Cannot specify -O# and --passes=/--foo-pass, use " "-passes='default,other-pass'\n"; return 1; } std::string Pipeline = PassPipeline; if (OptLevelO0) Pipeline = "default"; if (OptLevelO1) Pipeline = "default"; if (OptLevelO2) Pipeline = "default"; if (OptLevelO3) Pipeline = "default"; if (OptLevelOs) Pipeline = "default"; if (OptLevelOz) Pipeline = "default"; OutputKind OK = OK_NoOutput; if (!NoOutput) OK = OutputAssembly ? OK_OutputAssembly : (OutputThinLTOBC ? OK_OutputThinLTOBitcode : OK_OutputBitcode); VerifierKind VK = VK_VerifyOut; if (NoVerify) VK = VK_NoVerifier; else if (VerifyEach) VK = VK_VerifyEachPass; // The user has asked to use the new pass manager and provided a pipeline // string. Hand off the rest of the functionality to the new code for that // layer. return runPassPipeline(argv[0], *M, TM.get(), &TLII, Out.get(), ThinLinkOut.get(), RemarksFile.get(), Pipeline, PluginList, OK, VK, PreserveAssemblyUseListOrder, PreserveBitcodeUseListOrder, EmitSummaryIndex, EmitModuleHash, EnableDebugify, VerifyDebugInfoPreserve) ? 0 : 1; } if (OptLevelO0 || OptLevelO1 || OptLevelO2 || OptLevelOs || OptLevelOz || OptLevelO3) { errs() << "Cannot use -O# with legacy PM.\n"; return 1; } if (EmitSummaryIndex) { errs() << "Cannot use -module-summary with legacy PM.\n"; return 1; } if (EmitModuleHash) { errs() << "Cannot use -module-hash with legacy PM.\n"; return 1; } if (OutputThinLTOBC) { errs() << "Cannot use -thinlto-bc with legacy PM.\n"; return 1; } // Create a PassManager to hold and optimize the collection of passes we are // about to build. If the -debugify-each option is set, wrap each pass with // the (-check)-debugify passes. DebugifyCustomPassManager Passes; DebugifyStatsMap DIStatsMap; DebugInfoPerPass DebugInfoBeforePass; if (DebugifyEach) { Passes.setDebugifyMode(DebugifyMode::SyntheticDebugInfo); Passes.setDIStatsMap(DIStatsMap); } else if (VerifyEachDebugInfoPreserve) { Passes.setDebugifyMode(DebugifyMode::OriginalDebugInfo); Passes.setDebugInfoBeforePass(DebugInfoBeforePass); if (!VerifyDIPreserveExport.empty()) Passes.setOrigDIVerifyBugsReportFilePath(VerifyDIPreserveExport); } bool AddOneTimeDebugifyPasses = (EnableDebugify && !DebugifyEach) || (VerifyDebugInfoPreserve && !VerifyEachDebugInfoPreserve); Passes.add(new TargetLibraryInfoWrapperPass(TLII)); // Add internal analysis passes from the target machine. Passes.add(createTargetTransformInfoWrapperPass(TM ? TM->getTargetIRAnalysis() : TargetIRAnalysis())); if (AddOneTimeDebugifyPasses) { if (EnableDebugify) { Passes.setDIStatsMap(DIStatsMap); Passes.add(createDebugifyModulePass()); } else if (VerifyDebugInfoPreserve) { Passes.setDebugInfoBeforePass(DebugInfoBeforePass); Passes.add(createDebugifyModulePass( DebugifyMode::OriginalDebugInfo, "", &(Passes.getDebugInfoPerPass()))); } } std::unique_ptr FPasses; if (PrintBreakpoints) { // Default to standard output. if (!Out) { if (OutputFilename.empty()) OutputFilename = "-"; std::error_code EC; Out = std::make_unique(OutputFilename, EC, sys::fs::OF_None); if (EC) { errs() << EC.message() << '\n'; return 1; } } Passes.add(createBreakpointPrinter(Out->os())); NoOutput = true; } if (TM) { // FIXME: We should dyn_cast this when supported. auto <M = static_cast(*TM); Pass *TPC = LTM.createPassConfig(Passes); Passes.add(TPC); } // Create a new optimization pass for each one specified on the command line for (unsigned i = 0; i < PassList.size(); ++i) { const PassInfo *PassInf = PassList[i]; Pass *P = nullptr; if (PassInf->getNormalCtor()) P = PassInf->getNormalCtor()(); else errs() << argv[0] << ": cannot create pass: " << PassInf->getPassName() << "\n"; if (P) addPass(Passes, P); } if (FPasses) { FPasses->doInitialization(); for (Function &F : *M) FPasses->run(F); FPasses->doFinalization(); } // Check that the module is well formed on completion of optimization if (!NoVerify && !VerifyEach) Passes.add(createVerifierPass()); if (AddOneTimeDebugifyPasses) { if (EnableDebugify) Passes.add(createCheckDebugifyModulePass(false)); else if (VerifyDebugInfoPreserve) { if (!VerifyDIPreserveExport.empty()) Passes.setOrigDIVerifyBugsReportFilePath(VerifyDIPreserveExport); Passes.add(createCheckDebugifyModulePass( false, "", nullptr, DebugifyMode::OriginalDebugInfo, &(Passes.getDebugInfoPerPass()), VerifyDIPreserveExport)); } } // In run twice mode, we want to make sure the output is bit-by-bit // equivalent if we run the pass manager again, so setup two buffers and // a stream to write to them. Note that llc does something similar and it // may be worth to abstract this out in the future. SmallVector Buffer; SmallVector FirstRunBuffer; std::unique_ptr BOS; raw_ostream *OS = nullptr; const bool ShouldEmitOutput = !NoOutput; // Write bitcode or assembly to the output as the last step... if (ShouldEmitOutput || RunTwice) { assert(Out); OS = &Out->os(); if (RunTwice) { BOS = std::make_unique(Buffer); OS = BOS.get(); } if (OutputAssembly) Passes.add(createPrintModulePass(*OS, "", PreserveAssemblyUseListOrder)); else Passes.add(createBitcodeWriterPass(*OS, PreserveBitcodeUseListOrder)); } // Before executing passes, print the final values of the LLVM options. cl::PrintOptionValues(); if (!RunTwice) { // Now that we have all of the passes ready, run them. Passes.run(*M); } else { // If requested, run all passes twice with the same pass manager to catch // bugs caused by persistent state in the passes. std::unique_ptr M2(CloneModule(*M)); // Run all passes on the original module first, so the second run processes // the clone to catch CloneModule bugs. Passes.run(*M); FirstRunBuffer = Buffer; Buffer.clear(); Passes.run(*M2); // Compare the two outputs and make sure they're the same assert(Out); if (Buffer.size() != FirstRunBuffer.size() || (memcmp(Buffer.data(), FirstRunBuffer.data(), Buffer.size()) != 0)) { errs() << "Running the pass manager twice changed the output.\n" "Writing the result of the second run to the specified output.\n" "To generate the one-run comparison binary, just run without\n" "the compile-twice option\n"; if (ShouldEmitOutput) { Out->os() << BOS->str(); Out->keep(); } if (RemarksFile) RemarksFile->keep(); return 1; } if (ShouldEmitOutput) Out->os() << BOS->str(); } if (DebugifyEach && !DebugifyExport.empty()) exportDebugifyStats(DebugifyExport, Passes.getDebugifyStatsMap()); // Declare success. if (!NoOutput || PrintBreakpoints) Out->keep(); if (RemarksFile) RemarksFile->keep(); if (ThinLinkOut) ThinLinkOut->keep(); return 0; }