//===- Construction of codegen pass pipelines ------------------*- C++ -*--===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// /// \file /// /// Interfaces for producing common pass manager configurations. /// //===----------------------------------------------------------------------===// #ifndef LLVM_PASSES_CODEGENPASSBUILDER_H #define LLVM_PASSES_CODEGENPASSBUILDER_H #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/StringRef.h" #include "llvm/Analysis/AliasAnalysis.h" #include "llvm/Analysis/BasicAliasAnalysis.h" #include "llvm/Analysis/ProfileSummaryInfo.h" #include "llvm/Analysis/ScopedNoAliasAA.h" #include "llvm/Analysis/TargetTransformInfo.h" #include "llvm/Analysis/TypeBasedAliasAnalysis.h" #include "llvm/CodeGen/AssignmentTrackingAnalysis.h" #include "llvm/CodeGen/CallBrPrepare.h" #include "llvm/CodeGen/CodeGenPrepare.h" #include "llvm/CodeGen/DeadMachineInstructionElim.h" #include "llvm/CodeGen/DwarfEHPrepare.h" #include "llvm/CodeGen/ExpandMemCmp.h" #include "llvm/CodeGen/ExpandReductions.h" #include "llvm/CodeGen/FinalizeISel.h" #include "llvm/CodeGen/GCMetadata.h" #include "llvm/CodeGen/GlobalMerge.h" #include "llvm/CodeGen/IndirectBrExpand.h" #include "llvm/CodeGen/InterleavedAccess.h" #include "llvm/CodeGen/InterleavedLoadCombine.h" #include "llvm/CodeGen/JMCInstrumenter.h" #include "llvm/CodeGen/LiveIntervals.h" #include "llvm/CodeGen/LocalStackSlotAllocation.h" #include "llvm/CodeGen/LowerEmuTLS.h" #include "llvm/CodeGen/MIRPrinter.h" #include "llvm/CodeGen/MachineFunctionAnalysis.h" #include "llvm/CodeGen/MachineModuleInfo.h" #include "llvm/CodeGen/MachinePassManager.h" #include "llvm/CodeGen/PHIElimination.h" #include "llvm/CodeGen/PreISelIntrinsicLowering.h" #include "llvm/CodeGen/RegAllocFast.h" #include "llvm/CodeGen/ReplaceWithVeclib.h" #include "llvm/CodeGen/SafeStack.h" #include "llvm/CodeGen/SelectOptimize.h" #include "llvm/CodeGen/ShadowStackGCLowering.h" #include "llvm/CodeGen/SjLjEHPrepare.h" #include "llvm/CodeGen/StackProtector.h" #include "llvm/CodeGen/TargetPassConfig.h" #include "llvm/CodeGen/TwoAddressInstructionPass.h" #include "llvm/CodeGen/UnreachableBlockElim.h" #include "llvm/CodeGen/WasmEHPrepare.h" #include "llvm/CodeGen/WinEHPrepare.h" #include "llvm/IR/PassManager.h" #include "llvm/IR/Verifier.h" #include "llvm/IRPrinter/IRPrintingPasses.h" #include "llvm/MC/MCAsmInfo.h" #include "llvm/MC/MCTargetOptions.h" #include "llvm/Support/CodeGen.h" #include "llvm/Support/Debug.h" #include "llvm/Support/Error.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Target/CGPassBuilderOption.h" #include "llvm/Target/TargetMachine.h" #include "llvm/Transforms/CFGuard.h" #include "llvm/Transforms/Scalar/ConstantHoisting.h" #include "llvm/Transforms/Scalar/LoopPassManager.h" #include "llvm/Transforms/Scalar/LoopStrengthReduce.h" #include "llvm/Transforms/Scalar/LowerConstantIntrinsics.h" #include "llvm/Transforms/Scalar/MergeICmps.h" #include "llvm/Transforms/Scalar/PartiallyInlineLibCalls.h" #include "llvm/Transforms/Scalar/ScalarizeMaskedMemIntrin.h" #include "llvm/Transforms/Utils/EntryExitInstrumenter.h" #include "llvm/Transforms/Utils/LowerInvoke.h" #include #include #include namespace llvm { // FIXME: Dummy target independent passes definitions that have not yet been // ported to new pass manager. Once they do, remove these. #define DUMMY_FUNCTION_PASS(NAME, PASS_NAME) \ struct PASS_NAME : public PassInfoMixin { \ template PASS_NAME(Ts &&...) {} \ PreservedAnalyses run(Function &, FunctionAnalysisManager &) { \ return PreservedAnalyses::all(); \ } \ }; #define DUMMY_MACHINE_MODULE_PASS(NAME, PASS_NAME) \ struct PASS_NAME : public PassInfoMixin { \ template PASS_NAME(Ts &&...) {} \ PreservedAnalyses run(Module &, ModuleAnalysisManager &) { \ return PreservedAnalyses::all(); \ } \ }; #define DUMMY_MACHINE_FUNCTION_PASS(NAME, PASS_NAME) \ struct PASS_NAME : public PassInfoMixin { \ template PASS_NAME(Ts &&...) {} \ PreservedAnalyses run(MachineFunction &, \ MachineFunctionAnalysisManager &) { \ return PreservedAnalyses::all(); \ } \ }; #include "llvm/Passes/MachinePassRegistry.def" /// This class provides access to building LLVM's passes. /// /// Its members provide the baseline state available to passes during their /// construction. The \c MachinePassRegistry.def file specifies how to construct /// all of the built-in passes, and those may reference these members during /// construction. template class CodeGenPassBuilder { public: explicit CodeGenPassBuilder(TargetMachineT &TM, const CGPassBuilderOption &Opts, PassInstrumentationCallbacks *PIC) : TM(TM), Opt(Opts), PIC(PIC) { // Target could set CGPassBuilderOption::MISchedPostRA to true to achieve // substitutePass(&PostRASchedulerID, &PostMachineSchedulerID) // Target should override TM.Options.EnableIPRA in their target-specific // LLVMTM ctor. See TargetMachine::setGlobalISel for example. if (Opt.EnableIPRA) TM.Options.EnableIPRA = *Opt.EnableIPRA; if (Opt.EnableGlobalISelAbort) TM.Options.GlobalISelAbort = *Opt.EnableGlobalISelAbort; if (!Opt.OptimizeRegAlloc) Opt.OptimizeRegAlloc = getOptLevel() != CodeGenOptLevel::None; } Error buildPipeline(ModulePassManager &MPM, raw_pwrite_stream &Out, raw_pwrite_stream *DwoOut, CodeGenFileType FileType) const; PassInstrumentationCallbacks *getPassInstrumentationCallbacks() const { return PIC; } protected: template using has_required_t = decltype(std::declval().isRequired()); template using is_module_pass_t = decltype(std::declval().run( std::declval(), std::declval())); template using is_function_pass_t = decltype(std::declval().run( std::declval(), std::declval())); template using is_machine_function_pass_t = decltype(std::declval().run( std::declval(), std::declval())); // Function object to maintain state while adding codegen IR passes. // TODO: add a Function -> MachineFunction adaptor and merge // AddIRPass/AddMachinePass so we can have a function pipeline that runs both // function passes and machine function passes. class AddIRPass { public: AddIRPass(ModulePassManager &MPM, const DerivedT &PB) : MPM(MPM), PB(PB) {} ~AddIRPass() { if (!FPM.isEmpty()) MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM))); } template void operator()(PassT &&Pass, StringRef Name = PassT::name()) { static_assert((is_detected::value || is_detected::value) && "Only module pass and function pass are supported."); bool Required = false; if constexpr (is_detected::value) Required = PassT::isRequired(); if (!PB.runBeforeAdding(Name) && !Required) return; // Add Function Pass if constexpr (is_detected::value) { FPM.addPass(std::forward(Pass)); } else { // Add Module Pass if (!FPM.isEmpty()) { MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM))); FPM = FunctionPassManager(); } MPM.addPass(std::forward(Pass)); } } private: ModulePassManager &MPM; FunctionPassManager FPM; const DerivedT &PB; }; // Function object to maintain state while adding codegen machine passes. class AddMachinePass { public: AddMachinePass(ModulePassManager &MPM, const DerivedT &PB) : MPM(MPM), PB(PB) {} ~AddMachinePass() { if (!MFPM.isEmpty()) { FunctionPassManager FPM; FPM.addPass( createFunctionToMachineFunctionPassAdaptor(std::move(MFPM))); FPM.addPass(InvalidateAnalysisPass()); MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM))); } } template void operator()(PassT &&Pass, bool Force = false, StringRef Name = PassT::name()) { static_assert((is_detected::value || is_detected::value) && "Only module pass and function pass are supported."); if (!Force && !PB.runBeforeAdding(Name)) return; // Add Function Pass if constexpr (is_detected::value) { MFPM.addPass(std::forward(Pass)); } else { // Add Module Pass if (!MFPM.isEmpty()) { MPM.addPass(createModuleToFunctionPassAdaptor( createFunctionToMachineFunctionPassAdaptor(std::move(MFPM)))); MFPM = MachineFunctionPassManager(); } MPM.addPass(std::forward(Pass)); } for (auto &C : PB.AfterCallbacks) C(Name, MFPM); } private: ModulePassManager &MPM; MachineFunctionPassManager MFPM; const DerivedT &PB; }; TargetMachineT &TM; CGPassBuilderOption Opt; PassInstrumentationCallbacks *PIC; template TMC &getTM() const { return static_cast(TM); } CodeGenOptLevel getOptLevel() const { return TM.getOptLevel(); } /// Check whether or not GlobalISel should abort on error. /// When this is disabled, GlobalISel will fall back on SDISel instead of /// erroring out. bool isGlobalISelAbortEnabled() const { return TM.Options.GlobalISelAbort == GlobalISelAbortMode::Enable; } /// Check whether or not a diagnostic should be emitted when GlobalISel /// uses the fallback path. In other words, it will emit a diagnostic /// when GlobalISel failed and isGlobalISelAbortEnabled is false. bool reportDiagnosticWhenGlobalISelFallback() const { return TM.Options.GlobalISelAbort == GlobalISelAbortMode::DisableWithDiag; } /// addInstSelector - This method should install an instruction selector pass, /// which converts from LLVM code to machine instructions. Error addInstSelector(AddMachinePass &) const { return make_error("addInstSelector is not overridden", inconvertibleErrorCode()); } /// Target can override this to add GlobalMergePass before all IR passes. void addGlobalMergePass(AddIRPass &) const {} /// Add passes that optimize instruction level parallelism for out-of-order /// targets. These passes are run while the machine code is still in SSA /// form, so they can use MachineTraceMetrics to control their heuristics. /// /// All passes added here should preserve the MachineDominatorTree, /// MachineLoopInfo, and MachineTraceMetrics analyses. void addILPOpts(AddMachinePass &) const {} /// This method may be implemented by targets that want to run passes /// immediately before register allocation. void addPreRegAlloc(AddMachinePass &) const {} /// addPreRewrite - Add passes to the optimized register allocation pipeline /// after register allocation is complete, but before virtual registers are /// rewritten to physical registers. /// /// These passes must preserve VirtRegMap and LiveIntervals, and when running /// after RABasic or RAGreedy, they should take advantage of LiveRegMatrix. /// When these passes run, VirtRegMap contains legal physreg assignments for /// all virtual registers. /// /// Note if the target overloads addRegAssignAndRewriteOptimized, this may not /// be honored. This is also not generally used for the fast variant, /// where the allocation and rewriting are done in one pass. void addPreRewrite(AddMachinePass &) const {} /// Add passes to be run immediately after virtual registers are rewritten /// to physical registers. void addPostRewrite(AddMachinePass &) const {} /// This method may be implemented by targets that want to run passes after /// register allocation pass pipeline but before prolog-epilog insertion. void addPostRegAlloc(AddMachinePass &) const {} /// This method may be implemented by targets that want to run passes after /// prolog-epilog insertion and before the second instruction scheduling pass. void addPreSched2(AddMachinePass &) const {} /// This pass may be implemented by targets that want to run passes /// immediately before machine code is emitted. void addPreEmitPass(AddMachinePass &) const {} /// Targets may add passes immediately before machine code is emitted in this /// callback. This is called even later than `addPreEmitPass`. // FIXME: Rename `addPreEmitPass` to something more sensible given its actual // position and remove the `2` suffix here as this callback is what // `addPreEmitPass` *should* be but in reality isn't. void addPreEmitPass2(AddMachinePass &) const {} /// {{@ For GlobalISel /// /// addPreISel - This method should add any "last minute" LLVM->LLVM /// passes (which are run just before instruction selector). void addPreISel(AddIRPass &) const { llvm_unreachable("addPreISel is not overridden"); } /// This method should install an IR translator pass, which converts from /// LLVM code to machine instructions with possibly generic opcodes. Error addIRTranslator(AddMachinePass &) const { return make_error("addIRTranslator is not overridden", inconvertibleErrorCode()); } /// This method may be implemented by targets that want to run passes /// immediately before legalization. void addPreLegalizeMachineIR(AddMachinePass &) const {} /// This method should install a legalize pass, which converts the instruction /// sequence into one that can be selected by the target. Error addLegalizeMachineIR(AddMachinePass &) const { return make_error("addLegalizeMachineIR is not overridden", inconvertibleErrorCode()); } /// This method may be implemented by targets that want to run passes /// immediately before the register bank selection. void addPreRegBankSelect(AddMachinePass &) const {} /// This method should install a register bank selector pass, which /// assigns register banks to virtual registers without a register /// class or register banks. Error addRegBankSelect(AddMachinePass &) const { return make_error("addRegBankSelect is not overridden", inconvertibleErrorCode()); } /// This method may be implemented by targets that want to run passes /// immediately before the (global) instruction selection. void addPreGlobalInstructionSelect(AddMachinePass &) const {} /// This method should install a (global) instruction selector pass, which /// converts possibly generic instructions to fully target-specific /// instructions, thereby constraining all generic virtual registers to /// register classes. Error addGlobalInstructionSelect(AddMachinePass &) const { return make_error( "addGlobalInstructionSelect is not overridden", inconvertibleErrorCode()); } /// @}} /// High level function that adds all passes necessary to go from llvm IR /// representation to the MI representation. /// Adds IR based lowering and target specific optimization passes and finally /// the core instruction selection passes. void addISelPasses(AddIRPass &) const; /// Add the actual instruction selection passes. This does not include /// preparation passes on IR. Error addCoreISelPasses(AddMachinePass &) const; /// Add the complete, standard set of LLVM CodeGen passes. /// Fully developed targets will not generally override this. Error addMachinePasses(AddMachinePass &) const; /// Add passes to lower exception handling for the code generator. void addPassesToHandleExceptions(AddIRPass &) const; /// Add common target configurable passes that perform LLVM IR to IR /// transforms following machine independent optimization. void addIRPasses(AddIRPass &) const; /// Add pass to prepare the LLVM IR for code generation. This should be done /// before exception handling preparation passes. void addCodeGenPrepare(AddIRPass &) const; /// Add common passes that perform LLVM IR to IR transforms in preparation for /// instruction selection. void addISelPrepare(AddIRPass &) const; /// Methods with trivial inline returns are convenient points in the common /// codegen pass pipeline where targets may insert passes. Methods with /// out-of-line standard implementations are major CodeGen stages called by /// addMachinePasses. Some targets may override major stages when inserting /// passes is insufficient, but maintaining overriden stages is more work. /// /// addMachineSSAOptimization - Add standard passes that optimize machine /// instructions in SSA form. void addMachineSSAOptimization(AddMachinePass &) const; /// addFastRegAlloc - Add the minimum set of target-independent passes that /// are required for fast register allocation. Error addFastRegAlloc(AddMachinePass &) const; /// addOptimizedRegAlloc - Add passes related to register allocation. /// LLVMTargetMachine provides standard regalloc passes for most targets. void addOptimizedRegAlloc(AddMachinePass &) const; /// Add passes that optimize machine instructions after register allocation. void addMachineLateOptimization(AddMachinePass &) const; /// addGCPasses - Add late codegen passes that analyze code for garbage /// collection. This should return true if GC info should be printed after /// these passes. void addGCPasses(AddMachinePass &) const {} /// Add standard basic block placement passes. void addBlockPlacement(AddMachinePass &) const; using CreateMCStreamer = std::function>(MCContext &)>; void addAsmPrinter(AddMachinePass &, CreateMCStreamer) const { llvm_unreachable("addAsmPrinter is not overridden"); } /// Utilities for targets to add passes to the pass manager. /// /// createTargetRegisterAllocator - Create the register allocator pass for /// this target at the current optimization level. void addTargetRegisterAllocator(AddMachinePass &, bool Optimized) const; /// addMachinePasses helper to create the target-selected or overriden /// regalloc pass. void addRegAllocPass(AddMachinePass &, bool Optimized) const; /// Add core register alloator passes which do the actual register assignment /// and rewriting. \returns true if any passes were added. Error addRegAssignmentFast(AddMachinePass &) const; Error addRegAssignmentOptimized(AddMachinePass &) const; /// Allow the target to disable a specific pass by default. /// Backend can declare unwanted passes in constructor. template void disablePass() { BeforeCallbacks.emplace_back( [](StringRef Name) { return ((Name != PassTs::name()) && ...); }); } /// Insert InsertedPass pass after TargetPass pass. /// Only machine function passes are supported. template void insertPass(InsertedPassT &&Pass) { AfterCallbacks.emplace_back( [&](StringRef Name, MachineFunctionPassManager &MFPM) mutable { if (Name == TargetPassT::name()) MFPM.addPass(std::forward(Pass)); }); } private: DerivedT &derived() { return static_cast(*this); } const DerivedT &derived() const { return static_cast(*this); } bool runBeforeAdding(StringRef Name) const { bool ShouldAdd = true; for (auto &C : BeforeCallbacks) ShouldAdd &= C(Name); return ShouldAdd; } void setStartStopPasses(const TargetPassConfig::StartStopInfo &Info) const; Error verifyStartStop(const TargetPassConfig::StartStopInfo &Info) const; mutable SmallVector, 4> BeforeCallbacks; mutable SmallVector< llvm::unique_function, 4> AfterCallbacks; /// Helper variable for `-start-before/-start-after/-stop-before/-stop-after` mutable bool Started = true; mutable bool Stopped = true; }; template Error CodeGenPassBuilder::buildPipeline( ModulePassManager &MPM, raw_pwrite_stream &Out, raw_pwrite_stream *DwoOut, CodeGenFileType FileType) const { auto StartStopInfo = TargetPassConfig::getStartStopInfo(*PIC); if (!StartStopInfo) return StartStopInfo.takeError(); setStartStopPasses(*StartStopInfo); bool PrintAsm = TargetPassConfig::willCompleteCodeGenPipeline(); bool PrintMIR = !PrintAsm && FileType != CodeGenFileType::Null; { AddIRPass addIRPass(MPM, derived()); addIRPass(RequireAnalysisPass()); addIRPass(RequireAnalysisPass()); addIRPass(RequireAnalysisPass()); addISelPasses(addIRPass); } AddMachinePass addPass(MPM, derived()); if (PrintMIR) addPass(PrintMIRPreparePass(Out), /*Force=*/true); if (auto Err = addCoreISelPasses(addPass)) return std::move(Err); if (auto Err = derived().addMachinePasses(addPass)) return std::move(Err); if (PrintAsm) { derived().addAsmPrinter( addPass, [this, &Out, DwoOut, FileType](MCContext &Ctx) { return this->TM.createMCStreamer(Out, DwoOut, FileType, Ctx); }); } if (PrintMIR) addPass(PrintMIRPass(Out), /*Force=*/true); return verifyStartStop(*StartStopInfo); } template void CodeGenPassBuilder::setStartStopPasses( const TargetPassConfig::StartStopInfo &Info) const { if (!Info.StartPass.empty()) { Started = false; BeforeCallbacks.emplace_back([this, &Info, AfterFlag = Info.StartAfter, Count = 0u](StringRef ClassName) mutable { if (Count == Info.StartInstanceNum) { if (AfterFlag) { AfterFlag = false; Started = true; } return Started; } auto PassName = PIC->getPassNameForClassName(ClassName); if (Info.StartPass == PassName && ++Count == Info.StartInstanceNum) Started = !Info.StartAfter; return Started; }); } if (!Info.StopPass.empty()) { Stopped = false; BeforeCallbacks.emplace_back([this, &Info, AfterFlag = Info.StopAfter, Count = 0u](StringRef ClassName) mutable { if (Count == Info.StopInstanceNum) { if (AfterFlag) { AfterFlag = false; Stopped = true; } return !Stopped; } auto PassName = PIC->getPassNameForClassName(ClassName); if (Info.StopPass == PassName && ++Count == Info.StopInstanceNum) Stopped = !Info.StopAfter; return !Stopped; }); } } template Error CodeGenPassBuilder::verifyStartStop( const TargetPassConfig::StartStopInfo &Info) const { if (Started && Stopped) return Error::success(); if (!Started) return make_error( "Can't find start pass \"" + PIC->getPassNameForClassName(Info.StartPass) + "\".", std::make_error_code(std::errc::invalid_argument)); if (!Stopped) return make_error( "Can't find stop pass \"" + PIC->getPassNameForClassName(Info.StopPass) + "\".", std::make_error_code(std::errc::invalid_argument)); return Error::success(); } template void CodeGenPassBuilder::addISelPasses( AddIRPass &addPass) const { derived().addGlobalMergePass(addPass); if (TM.useEmulatedTLS()) addPass(LowerEmuTLSPass()); addPass(PreISelIntrinsicLoweringPass(TM)); derived().addIRPasses(addPass); derived().addCodeGenPrepare(addPass); addPassesToHandleExceptions(addPass); derived().addISelPrepare(addPass); } /// Add common target configurable passes that perform LLVM IR to IR transforms /// following machine independent optimization. template void CodeGenPassBuilder::addIRPasses( AddIRPass &addPass) const { // Before running any passes, run the verifier to determine if the input // coming from the front-end and/or optimizer is valid. if (!Opt.DisableVerify) addPass(VerifierPass()); // Run loop strength reduction before anything else. if (getOptLevel() != CodeGenOptLevel::None && !Opt.DisableLSR) { addPass(createFunctionToLoopPassAdaptor(LoopStrengthReducePass(), /*UseMemorySSA=*/true)); // FIXME: use -stop-after so we could remove PrintLSR if (Opt.PrintLSR) addPass(PrintFunctionPass(dbgs(), "\n\n*** Code after LSR ***\n")); } if (getOptLevel() != CodeGenOptLevel::None) { // The MergeICmpsPass tries to create memcmp calls by grouping sequences of // loads and compares. ExpandMemCmpPass then tries to expand those calls // into optimally-sized loads and compares. The transforms are enabled by a // target lowering hook. if (!Opt.DisableMergeICmps) addPass(MergeICmpsPass()); addPass(ExpandMemCmpPass(&TM)); } // Run GC lowering passes for builtin collectors // TODO: add a pass insertion point here addPass(GCLoweringPass()); addPass(ShadowStackGCLoweringPass()); addPass(LowerConstantIntrinsicsPass()); // Make sure that no unreachable blocks are instruction selected. addPass(UnreachableBlockElimPass()); // Prepare expensive constants for SelectionDAG. if (getOptLevel() != CodeGenOptLevel::None && !Opt.DisableConstantHoisting) addPass(ConstantHoistingPass()); // Replace calls to LLVM intrinsics (e.g., exp, log) operating on vector // operands with calls to the corresponding functions in a vector library. if (getOptLevel() != CodeGenOptLevel::None) addPass(ReplaceWithVeclib()); if (getOptLevel() != CodeGenOptLevel::None && !Opt.DisablePartialLibcallInlining) addPass(PartiallyInlineLibCallsPass()); // Instrument function entry and exit, e.g. with calls to mcount(). addPass(EntryExitInstrumenterPass(/*PostInlining=*/true)); // Add scalarization of target's unsupported masked memory intrinsics pass. // the unsupported intrinsic will be replaced with a chain of basic blocks, // that stores/loads element one-by-one if the appropriate mask bit is set. addPass(ScalarizeMaskedMemIntrinPass()); // Expand reduction intrinsics into shuffle sequences if the target wants to. addPass(ExpandReductionsPass()); // Convert conditional moves to conditional jumps when profitable. if (getOptLevel() != CodeGenOptLevel::None && !Opt.DisableSelectOptimize) addPass(SelectOptimizePass(&TM)); } /// Turn exception handling constructs into something the code generators can /// handle. template void CodeGenPassBuilder::addPassesToHandleExceptions( AddIRPass &addPass) const { const MCAsmInfo *MCAI = TM.getMCAsmInfo(); assert(MCAI && "No MCAsmInfo"); switch (MCAI->getExceptionHandlingType()) { case ExceptionHandling::SjLj: // SjLj piggy-backs on dwarf for this bit. The cleanups done apply to both // Dwarf EH prepare needs to be run after SjLj prepare. Otherwise, // catch info can get misplaced when a selector ends up more than one block // removed from the parent invoke(s). This could happen when a landing // pad is shared by multiple invokes and is also a target of a normal // edge from elsewhere. addPass(SjLjEHPreparePass(&TM)); [[fallthrough]]; case ExceptionHandling::DwarfCFI: case ExceptionHandling::ARM: case ExceptionHandling::AIX: case ExceptionHandling::ZOS: addPass(DwarfEHPreparePass(&TM)); break; case ExceptionHandling::WinEH: // We support using both GCC-style and MSVC-style exceptions on Windows, so // add both preparation passes. Each pass will only actually run if it // recognizes the personality function. addPass(WinEHPreparePass()); addPass(DwarfEHPreparePass(&TM)); break; case ExceptionHandling::Wasm: // Wasm EH uses Windows EH instructions, but it does not need to demote PHIs // on catchpads and cleanuppads because it does not outline them into // funclets. Catchswitch blocks are not lowered in SelectionDAG, so we // should remove PHIs there. addPass(WinEHPreparePass(/*DemoteCatchSwitchPHIOnly=*/false)); addPass(WasmEHPreparePass()); break; case ExceptionHandling::None: addPass(LowerInvokePass()); // The lower invoke pass may create unreachable code. Remove it. addPass(UnreachableBlockElimPass()); break; } } /// Add pass to prepare the LLVM IR for code generation. This should be done /// before exception handling preparation passes. template void CodeGenPassBuilder::addCodeGenPrepare( AddIRPass &addPass) const { if (getOptLevel() != CodeGenOptLevel::None && !Opt.DisableCGP) addPass(CodeGenPreparePass(&TM)); // TODO: Default ctor'd RewriteSymbolPass is no-op. // addPass(RewriteSymbolPass()); } /// Add common passes that perform LLVM IR to IR transforms in preparation for /// instruction selection. template void CodeGenPassBuilder::addISelPrepare( AddIRPass &addPass) const { derived().addPreISel(addPass); addPass(CallBrPreparePass()); // Add both the safe stack and the stack protection passes: each of them will // only protect functions that have corresponding attributes. addPass(SafeStackPass(&TM)); addPass(StackProtectorPass(&TM)); if (Opt.PrintISelInput) addPass(PrintFunctionPass(dbgs(), "\n\n*** Final LLVM Code input to ISel ***\n")); // All passes which modify the LLVM IR are now complete; run the verifier // to ensure that the IR is valid. if (!Opt.DisableVerify) addPass(VerifierPass()); } template Error CodeGenPassBuilder::addCoreISelPasses( AddMachinePass &addPass) const { // Enable FastISel with -fast-isel, but allow that to be overridden. TM.setO0WantsFastISel(Opt.EnableFastISelOption.value_or(true)); // Determine an instruction selector. enum class SelectorType { SelectionDAG, FastISel, GlobalISel }; SelectorType Selector; if (Opt.EnableFastISelOption && *Opt.EnableFastISelOption == true) Selector = SelectorType::FastISel; else if ((Opt.EnableGlobalISelOption && *Opt.EnableGlobalISelOption == true) || (TM.Options.EnableGlobalISel && (!Opt.EnableGlobalISelOption || *Opt.EnableGlobalISelOption == false))) Selector = SelectorType::GlobalISel; else if (TM.getOptLevel() == CodeGenOptLevel::None && TM.getO0WantsFastISel()) Selector = SelectorType::FastISel; else Selector = SelectorType::SelectionDAG; // Set consistently TM.Options.EnableFastISel and EnableGlobalISel. if (Selector == SelectorType::FastISel) { TM.setFastISel(true); TM.setGlobalISel(false); } else if (Selector == SelectorType::GlobalISel) { TM.setFastISel(false); TM.setGlobalISel(true); } // Add instruction selector passes. if (Selector == SelectorType::GlobalISel) { if (auto Err = derived().addIRTranslator(addPass)) return std::move(Err); derived().addPreLegalizeMachineIR(addPass); if (auto Err = derived().addLegalizeMachineIR(addPass)) return std::move(Err); // Before running the register bank selector, ask the target if it // wants to run some passes. derived().addPreRegBankSelect(addPass); if (auto Err = derived().addRegBankSelect(addPass)) return std::move(Err); derived().addPreGlobalInstructionSelect(addPass); if (auto Err = derived().addGlobalInstructionSelect(addPass)) return std::move(Err); // Pass to reset the MachineFunction if the ISel failed. addPass(ResetMachineFunctionPass(reportDiagnosticWhenGlobalISelFallback(), isGlobalISelAbortEnabled())); // Provide a fallback path when we do not want to abort on // not-yet-supported input. if (!isGlobalISelAbortEnabled()) if (auto Err = derived().addInstSelector(addPass)) return std::move(Err); } else if (auto Err = derived().addInstSelector(addPass)) return std::move(Err); // Expand pseudo-instructions emitted by ISel. Don't run the verifier before // FinalizeISel. addPass(FinalizeISelPass()); // // Print the instruction selected machine code... // printAndVerify("After Instruction Selection"); return Error::success(); } /// Add the complete set of target-independent postISel code generator passes. /// /// This can be read as the standard order of major LLVM CodeGen stages. Stages /// with nontrivial configuration or multiple passes are broken out below in /// add%Stage routines. /// /// Any CodeGenPassBuilder::addXX routine may be /// overriden by the Target. The addPre/Post methods with empty header /// implementations allow injecting target-specific fixups just before or after /// major stages. Additionally, targets have the flexibility to change pass /// order within a stage by overriding default implementation of add%Stage /// routines below. Each technique has maintainability tradeoffs because /// alternate pass orders are not well supported. addPre/Post works better if /// the target pass is easily tied to a common pass. But if it has subtle /// dependencies on multiple passes, the target should override the stage /// instead. template Error CodeGenPassBuilder::addMachinePasses( AddMachinePass &addPass) const { // Add passes that optimize machine instructions in SSA form. if (getOptLevel() != CodeGenOptLevel::None) { derived().addMachineSSAOptimization(addPass); } else { // If the target requests it, assign local variables to stack slots relative // to one another and simplify frame index references where possible. addPass(LocalStackSlotAllocationPass()); } if (TM.Options.EnableIPRA) addPass(RegUsageInfoPropagationPass()); // Run pre-ra passes. derived().addPreRegAlloc(addPass); // Run register allocation and passes that are tightly coupled with it, // including phi elimination and scheduling. if (*Opt.OptimizeRegAlloc) { derived().addOptimizedRegAlloc(addPass); } else { if (auto Err = derived().addFastRegAlloc(addPass)) return Err; } // Run post-ra passes. derived().addPostRegAlloc(addPass); addPass(RemoveRedundantDebugValuesPass()); // Insert prolog/epilog code. Eliminate abstract frame index references... if (getOptLevel() != CodeGenOptLevel::None) { addPass(PostRAMachineSinkingPass()); addPass(ShrinkWrapPass()); } addPass(PrologEpilogInserterPass()); /// Add passes that optimize machine instructions after register allocation. if (getOptLevel() != CodeGenOptLevel::None) derived().addMachineLateOptimization(addPass); // Expand pseudo instructions before second scheduling pass. addPass(ExpandPostRAPseudosPass()); // Run pre-sched2 passes. derived().addPreSched2(addPass); if (Opt.EnableImplicitNullChecks) addPass(ImplicitNullChecksPass()); // Second pass scheduler. // Let Target optionally insert this pass by itself at some other // point. if (getOptLevel() != CodeGenOptLevel::None && !TM.targetSchedulesPostRAScheduling()) { if (Opt.MISchedPostRA) addPass(PostMachineSchedulerPass()); else addPass(PostRASchedulerPass()); } // GC derived().addGCPasses(addPass); // Basic block placement. if (getOptLevel() != CodeGenOptLevel::None) derived().addBlockPlacement(addPass); // Insert before XRay Instrumentation. addPass(FEntryInserterPass()); addPass(XRayInstrumentationPass()); addPass(PatchableFunctionPass()); derived().addPreEmitPass(addPass); if (TM.Options.EnableIPRA) // Collect register usage information and produce a register mask of // clobbered registers, to be used to optimize call sites. addPass(RegUsageInfoCollectorPass()); addPass(FuncletLayoutPass()); addPass(StackMapLivenessPass()); addPass(LiveDebugValuesPass()); addPass(MachineSanitizerBinaryMetadata()); if (TM.Options.EnableMachineOutliner && getOptLevel() != CodeGenOptLevel::None && Opt.EnableMachineOutliner != RunOutliner::NeverOutline) { bool RunOnAllFunctions = (Opt.EnableMachineOutliner == RunOutliner::AlwaysOutline); bool AddOutliner = RunOnAllFunctions || TM.Options.SupportsDefaultOutlining; if (AddOutliner) addPass(MachineOutlinerPass(RunOnAllFunctions)); } // Add passes that directly emit MI after all other MI passes. derived().addPreEmitPass2(addPass); return Error::success(); } /// Add passes that optimize machine instructions in SSA form. template void CodeGenPassBuilder::addMachineSSAOptimization( AddMachinePass &addPass) const { // Pre-ra tail duplication. addPass(EarlyTailDuplicatePass()); // Optimize PHIs before DCE: removing dead PHI cycles may make more // instructions dead. addPass(OptimizePHIsPass()); // This pass merges large allocas. StackSlotColoring is a different pass // which merges spill slots. addPass(StackColoringPass()); // If the target requests it, assign local variables to stack slots relative // to one another and simplify frame index references where possible. addPass(LocalStackSlotAllocationPass()); // With optimization, dead code should already be eliminated. However // there is one known exception: lowered code for arguments that are only // used by tail calls, where the tail calls reuse the incoming stack // arguments directly (see t11 in test/CodeGen/X86/sibcall.ll). addPass(DeadMachineInstructionElimPass()); // Allow targets to insert passes that improve instruction level parallelism, // like if-conversion. Such passes will typically need dominator trees and // loop info, just like LICM and CSE below. derived().addILPOpts(addPass); addPass(EarlyMachineLICMPass()); addPass(MachineCSEPass()); addPass(MachineSinkingPass()); addPass(PeepholeOptimizerPass()); // Clean-up the dead code that may have been generated by peephole // rewriting. addPass(DeadMachineInstructionElimPass()); } //===---------------------------------------------------------------------===// /// Register Allocation Pass Configuration //===---------------------------------------------------------------------===// /// Instantiate the default register allocator pass for this target for either /// the optimized or unoptimized allocation path. This will be added to the pass /// manager by addFastRegAlloc in the unoptimized case or addOptimizedRegAlloc /// in the optimized case. /// /// A target that uses the standard regalloc pass order for fast or optimized /// allocation may still override this for per-target regalloc /// selection. But -regalloc=... always takes precedence. template void CodeGenPassBuilder::addTargetRegisterAllocator( AddMachinePass &addPass, bool Optimized) const { if (Optimized) addPass(RAGreedyPass()); else addPass(RegAllocFastPass()); } /// Find and instantiate the register allocation pass requested by this target /// at the current optimization level. Different register allocators are /// defined as separate passes because they may require different analysis. template void CodeGenPassBuilder::addRegAllocPass( AddMachinePass &addPass, bool Optimized) const { // TODO: Parse Opt.RegAlloc to add register allocator. } template Error CodeGenPassBuilder::addRegAssignmentFast( AddMachinePass &addPass) const { // TODO: Ensure allocator is default or fast. addRegAllocPass(addPass, false); return Error::success(); } template Error CodeGenPassBuilder::addRegAssignmentOptimized( AddMachinePass &addPass) const { // Add the selected register allocation pass. addRegAllocPass(addPass, true); // Allow targets to change the register assignments before rewriting. derived().addPreRewrite(addPass); // Finally rewrite virtual registers. addPass(VirtRegRewriterPass()); // Perform stack slot coloring and post-ra machine LICM. // // FIXME: Re-enable coloring with register when it's capable of adding // kill markers. addPass(StackSlotColoringPass()); return Error::success(); } /// Add the minimum set of target-independent passes that are required for /// register allocation. No coalescing or scheduling. template Error CodeGenPassBuilder::addFastRegAlloc( AddMachinePass &addPass) const { addPass(PHIEliminationPass()); addPass(TwoAddressInstructionPass()); return derived().addRegAssignmentFast(addPass); } /// Add standard target-independent passes that are tightly coupled with /// optimized register allocation, including coalescing, machine instruction /// scheduling, and register allocation itself. template void CodeGenPassBuilder::addOptimizedRegAlloc( AddMachinePass &addPass) const { addPass(DetectDeadLanesPass()); addPass(InitUndefPass()); addPass(ProcessImplicitDefsPass()); // Edge splitting is smarter with machine loop info. addPass(PHIEliminationPass()); // Eventually, we want to run LiveIntervals before PHI elimination. if (Opt.EarlyLiveIntervals) addPass(RequireAnalysisPass()); addPass(TwoAddressInstructionPass()); addPass(RegisterCoalescerPass()); // The machine scheduler may accidentally create disconnected components // when moving subregister definitions around, avoid this by splitting them to // separate vregs before. Splitting can also improve reg. allocation quality. addPass(RenameIndependentSubregsPass()); // PreRA instruction scheduling. addPass(MachineSchedulerPass()); if (derived().addRegAssignmentOptimized(addPass)) { // Allow targets to expand pseudo instructions depending on the choice of // registers before MachineCopyPropagation. derived().addPostRewrite(addPass); // Copy propagate to forward register uses and try to eliminate COPYs that // were not coalesced. addPass(MachineCopyPropagationPass()); // Run post-ra machine LICM to hoist reloads / remats. // // FIXME: can this move into MachineLateOptimization? addPass(MachineLICMPass()); } } //===---------------------------------------------------------------------===// /// Post RegAlloc Pass Configuration //===---------------------------------------------------------------------===// /// Add passes that optimize machine instructions after register allocation. template void CodeGenPassBuilder::addMachineLateOptimization( AddMachinePass &addPass) const { // Branch folding must be run after regalloc and prolog/epilog insertion. addPass(BranchFolderPass()); // Tail duplication. // Note that duplicating tail just increases code size and degrades // performance for targets that require Structured Control Flow. // In addition it can also make CFG irreducible. Thus we disable it. if (!TM.requiresStructuredCFG()) addPass(TailDuplicatePass()); // Cleanup of redundant (identical) address/immediate loads. addPass(MachineLateInstrsCleanupPass()); // Copy propagation. addPass(MachineCopyPropagationPass()); } /// Add standard basic block placement passes. template void CodeGenPassBuilder::addBlockPlacement( AddMachinePass &addPass) const { addPass(MachineBlockPlacementPass()); // Run a separate pass to collect block placement statistics. if (Opt.EnableBlockPlacementStats) addPass(MachineBlockPlacementStatsPass()); } } // namespace llvm #endif // LLVM_PASSES_CODEGENPASSBUILDER_H