LLVM: lib/Passes/PassBuilderPipelines.cpp Source File

//===- Construction of pass pipelines -------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

///

/// This file provides the implementation of the PassBuilder based on our

/// static pass registry as well as related functionality. It also provides

/// helpers to aid in analyzing, debugging, and testing passes and pass

/// pipelines.

///

//===----------------------------------------------------------------------===//


#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/BasicAliasAnalysis.h"

#include "llvm/Analysis/CGSCCPassManager.h"

#include "llvm/Analysis/CtxProfAnalysis.h"

#include "llvm/Analysis/GlobalsModRef.h"

#include "llvm/Analysis/InlineAdvisor.h"

#include "llvm/Analysis/ProfileSummaryInfo.h"

#include "llvm/Analysis/ScopedNoAliasAA.h"

#include "llvm/Analysis/TypeBasedAliasAnalysis.h"

#include "llvm/IR/PassManager.h"

#include "llvm/Pass.h"

#include "llvm/Passes/OptimizationLevel.h"

#include "llvm/Passes/PassBuilder.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/PGOOptions.h"

#include "llvm/Support/VirtualFileSystem.h"

#include "llvm/Target/TargetMachine.h"

#include "llvm/Transforms/AggressiveInstCombine/AggressiveInstCombine.h"

#include "llvm/Transforms/Coroutines/CoroAnnotationElide.h"

#include "llvm/Transforms/Coroutines/CoroCleanup.h"

#include "llvm/Transforms/Coroutines/CoroConditionalWrapper.h"

#include "llvm/Transforms/Coroutines/CoroEarly.h"

#include "llvm/Transforms/Coroutines/CoroElide.h"

#include "llvm/Transforms/Coroutines/CoroSplit.h"

#include "llvm/Transforms/HipStdPar/HipStdPar.h"

#include "llvm/Transforms/IPO/AlwaysInliner.h"

#include "llvm/Transforms/IPO/Annotation2Metadata.h"

#include "llvm/Transforms/IPO/ArgumentPromotion.h"

#include "llvm/Transforms/IPO/Attributor.h"

#include "llvm/Transforms/IPO/CalledValuePropagation.h"

#include "llvm/Transforms/IPO/ConstantMerge.h"

#include "llvm/Transforms/IPO/CrossDSOCFI.h"

#include "llvm/Transforms/IPO/DeadArgumentElimination.h"

#include "llvm/Transforms/IPO/ElimAvailExtern.h"

#include "llvm/Transforms/IPO/EmbedBitcodePass.h"

#include "llvm/Transforms/IPO/ExpandVariadics.h"

#include "llvm/Transforms/IPO/FatLTOCleanup.h"

#include "llvm/Transforms/IPO/ForceFunctionAttrs.h"

#include "llvm/Transforms/IPO/FunctionAttrs.h"

#include "llvm/Transforms/IPO/GlobalDCE.h"

#include "llvm/Transforms/IPO/GlobalOpt.h"

#include "llvm/Transforms/IPO/GlobalSplit.h"

#include "llvm/Transforms/IPO/HotColdSplitting.h"

#include "llvm/Transforms/IPO/IROutliner.h"

#include "llvm/Transforms/IPO/InferFunctionAttrs.h"

#include "llvm/Transforms/IPO/Inliner.h"

#include "llvm/Transforms/IPO/LowerTypeTests.h"

#include "llvm/Transforms/IPO/MemProfContextDisambiguation.h"

#include "llvm/Transforms/IPO/MergeFunctions.h"

#include "llvm/Transforms/IPO/ModuleInliner.h"

#include "llvm/Transforms/IPO/OpenMPOpt.h"

#include "llvm/Transforms/IPO/PartialInlining.h"

#include "llvm/Transforms/IPO/SCCP.h"

#include "llvm/Transforms/IPO/SampleProfile.h"

#include "llvm/Transforms/IPO/SampleProfileProbe.h"

#include "llvm/Transforms/IPO/WholeProgramDevirt.h"

#include "llvm/Transforms/InstCombine/InstCombine.h"

#include "llvm/Transforms/Instrumentation/CGProfile.h"

#include "llvm/Transforms/Instrumentation/ControlHeightReduction.h"

#include "llvm/Transforms/Instrumentation/InstrProfiling.h"

#include "llvm/Transforms/Instrumentation/MemProfInstrumentation.h"

#include "llvm/Transforms/Instrumentation/MemProfUse.h"

#include "llvm/Transforms/Instrumentation/PGOCtxProfFlattening.h"

#include "llvm/Transforms/Instrumentation/PGOCtxProfLowering.h"

#include "llvm/Transforms/Instrumentation/PGOForceFunctionAttrs.h"

#include "llvm/Transforms/Instrumentation/PGOInstrumentation.h"

#include "llvm/Transforms/Scalar/ADCE.h"

#include "llvm/Transforms/Scalar/AlignmentFromAssumptions.h"

#include "llvm/Transforms/Scalar/AnnotationRemarks.h"

#include "llvm/Transforms/Scalar/BDCE.h"

#include "llvm/Transforms/Scalar/CallSiteSplitting.h"

#include "llvm/Transforms/Scalar/ConstraintElimination.h"

#include "llvm/Transforms/Scalar/CorrelatedValuePropagation.h"

#include "llvm/Transforms/Scalar/DFAJumpThreading.h"

#include "llvm/Transforms/Scalar/DeadStoreElimination.h"

#include "llvm/Transforms/Scalar/DivRemPairs.h"

#include "llvm/Transforms/Scalar/DropUnnecessaryAssumes.h"

#include "llvm/Transforms/Scalar/EarlyCSE.h"

#include "llvm/Transforms/Scalar/Float2Int.h"

#include "llvm/Transforms/Scalar/GVN.h"

#include "llvm/Transforms/Scalar/IndVarSimplify.h"

#include "llvm/Transforms/Scalar/InferAlignment.h"

#include "llvm/Transforms/Scalar/InstSimplifyPass.h"

#include "llvm/Transforms/Scalar/JumpTableToSwitch.h"

#include "llvm/Transforms/Scalar/JumpThreading.h"

#include "llvm/Transforms/Scalar/LICM.h"

#include "llvm/Transforms/Scalar/LoopDeletion.h"

#include "llvm/Transforms/Scalar/LoopDistribute.h"

#include "llvm/Transforms/Scalar/LoopFlatten.h"

#include "llvm/Transforms/Scalar/LoopFuse.h"

#include "llvm/Transforms/Scalar/LoopIdiomRecognize.h"

#include "llvm/Transforms/Scalar/LoopInstSimplify.h"

#include "llvm/Transforms/Scalar/LoopInterchange.h"

#include "llvm/Transforms/Scalar/LoopLoadElimination.h"

#include "llvm/Transforms/Scalar/LoopPassManager.h"

#include "llvm/Transforms/Scalar/LoopRotation.h"

#include "llvm/Transforms/Scalar/LoopSimplifyCFG.h"

#include "llvm/Transforms/Scalar/LoopSink.h"

#include "llvm/Transforms/Scalar/LoopUnrollAndJamPass.h"

#include "llvm/Transforms/Scalar/LoopUnrollPass.h"

#include "llvm/Transforms/Scalar/LoopVersioningLICM.h"

#include "llvm/Transforms/Scalar/LowerConstantIntrinsics.h"

#include "llvm/Transforms/Scalar/LowerExpectIntrinsic.h"

#include "llvm/Transforms/Scalar/LowerMatrixIntrinsics.h"

#include "llvm/Transforms/Scalar/MemCpyOptimizer.h"

#include "llvm/Transforms/Scalar/MergedLoadStoreMotion.h"

#include "llvm/Transforms/Scalar/NewGVN.h"

#include "llvm/Transforms/Scalar/Reassociate.h"

#include "llvm/Transforms/Scalar/SCCP.h"

#include "llvm/Transforms/Scalar/SROA.h"

#include "llvm/Transforms/Scalar/SimpleLoopUnswitch.h"

#include "llvm/Transforms/Scalar/SimplifyCFG.h"

#include "llvm/Transforms/Scalar/SpeculativeExecution.h"

#include "llvm/Transforms/Scalar/TailRecursionElimination.h"

#include "llvm/Transforms/Scalar/WarnMissedTransforms.h"

#include "llvm/Transforms/Utils/AddDiscriminators.h"

#include "llvm/Transforms/Utils/AssumeBundleBuilder.h"

#include "llvm/Transforms/Utils/CanonicalizeAliases.h"

#include "llvm/Transforms/Utils/CountVisits.h"

#include "llvm/Transforms/Utils/EntryExitInstrumenter.h"

#include "llvm/Transforms/Utils/ExtraPassManager.h"

#include "llvm/Transforms/Utils/InjectTLIMappings.h"

#include "llvm/Transforms/Utils/LibCallsShrinkWrap.h"

#include "llvm/Transforms/Utils/Mem2Reg.h"

#include "llvm/Transforms/Utils/MoveAutoInit.h"

#include "llvm/Transforms/Utils/NameAnonGlobals.h"

#include "llvm/Transforms/Utils/RelLookupTableConverter.h"

#include "llvm/Transforms/Utils/SimplifyCFGOptions.h"

#include "llvm/Transforms/Vectorize/LoopVectorize.h"

#include "llvm/Transforms/Vectorize/SLPVectorizer.h"

#include "llvm/Transforms/Vectorize/VectorCombine.h"


using namespace llvm;


static cl::opt<InliningAdvisorMode> UseInlineAdvisor(

    "enable-ml-inliner", cl::init(InliningAdvisorMode::Default), cl::Hidden,

    cl::desc("Enable ML policy for inliner. Currently trained for -Oz only"),

    cl::values(clEnumValN(InliningAdvisorMode::Default, "default",

                          "Heuristics-based inliner version"),

               clEnumValN(InliningAdvisorMode::Development, "development",

                          "Use development mode (runtime-loadable model)"),

               clEnumValN(InliningAdvisorMode::Release, "release",

                          "Use release mode (AOT-compiled model)")));


/// Flag to enable inline deferral during PGO.

static cl::opt<bool>

    EnablePGOInlineDeferral("enable-npm-pgo-inline-deferral", cl::init(true),

                            cl::Hidden,

                            cl::desc("Enable inline deferral during PGO"));


static cl::opt<bool> EnableModuleInliner("enable-module-inliner",

                                         cl::init(false), cl::Hidden,

                                         cl::desc("Enable module inliner"));


static cl::opt<bool> PerformMandatoryInliningsFirst(

    "mandatory-inlining-first", cl::init(false), cl::Hidden,

    cl::desc("Perform mandatory inlinings module-wide, before performing "

             "inlining"));


static cl::opt<bool> EnableEagerlyInvalidateAnalyses(

    "eagerly-invalidate-analyses", cl::init(true), cl::Hidden,

    cl::desc("Eagerly invalidate more analyses in default pipelines"));


static cl::opt<bool> EnableMergeFunctions(

    "enable-merge-functions", cl::init(false), cl::Hidden,

    cl::desc("Enable function merging as part of the optimization pipeline"));


static cl::opt<bool> EnablePostPGOLoopRotation(

    "enable-post-pgo-loop-rotation", cl::init(true), cl::Hidden,

    cl::desc("Run the loop rotation transformation after PGO instrumentation"));


static cl::opt<bool> EnableGlobalAnalyses(

    "enable-global-analyses", cl::init(true), cl::Hidden,

    cl::desc("Enable inter-procedural analyses"));


static cl::opt<bool> RunPartialInlining("enable-partial-inlining",

                                        cl::init(false), cl::Hidden,

                                        cl::desc("Run Partial inlining pass"));


static cl::opt<bool> ExtraVectorizerPasses(

    "extra-vectorizer-passes", cl::init(false), cl::Hidden,

    cl::desc("Run cleanup optimization passes after vectorization"));


static cl::opt<bool> RunNewGVN("enable-newgvn", cl::init(false), cl::Hidden,

                               cl::desc("Run the NewGVN pass"));


static cl::opt<bool>

    EnableLoopInterchange("enable-loopinterchange", cl::init(false), cl::Hidden,

                          cl::desc("Enable the LoopInterchange Pass"));


static cl::opt<bool> EnableUnrollAndJam("enable-unroll-and-jam",

                                        cl::init(false), cl::Hidden,

                                        cl::desc("Enable Unroll And Jam Pass"));


static cl::opt<bool> EnableLoopFlatten("enable-loop-flatten", cl::init(false),

                                       cl::Hidden,

                                       cl::desc("Enable the LoopFlatten Pass"));


// Experimentally allow loop header duplication. This should allow for better

// optimization at Oz, since loop-idiom recognition can then recognize things

// like memcpy. If this ends up being useful for many targets, we should drop

// this flag and make a code generation option that can be controlled

// independent of the opt level and exposed through the frontend.

static cl::opt<bool> EnableLoopHeaderDuplication(

    "enable-loop-header-duplication", cl::init(false), cl::Hidden,

    cl::desc("Enable loop header duplication at any optimization level"));


static cl::opt<bool>

    EnableDFAJumpThreading("enable-dfa-jump-thread",

                           cl::desc("Enable DFA jump threading"),

                           cl::init(false), cl::Hidden);


static cl::opt<bool>

    EnableHotColdSplit("hot-cold-split",

                       cl::desc("Enable hot-cold splitting pass"));


static cl::opt<bool> EnableIROutliner("ir-outliner", cl::init(false),

                                      cl::Hidden,

                                      cl::desc("Enable ir outliner pass"));


static cl::opt<bool>

    DisablePreInliner("disable-preinline", cl::init(false), cl::Hidden,

                      cl::desc("Disable pre-instrumentation inliner"));


static cl::opt<int> PreInlineThreshold(

    "preinline-threshold", cl::Hidden, cl::init(75),

    cl::desc("Control the amount of inlining in pre-instrumentation inliner "

             "(default = 75)"));


static cl::opt<bool>

    EnableGVNHoist("enable-gvn-hoist",

                   cl::desc("Enable the GVN hoisting pass (default = off)"));


static cl::opt<bool>

    EnableGVNSink("enable-gvn-sink",

                  cl::desc("Enable the GVN sinking pass (default = off)"));


static cl::opt<bool> EnableJumpTableToSwitch(

    "enable-jump-table-to-switch",

    cl::desc("Enable JumpTableToSwitch pass (default = off)"));


// This option is used in simplifying testing SampleFDO optimizations for

// profile loading.

static cl::opt<bool>

    EnableCHR("enable-chr", cl::init(true), cl::Hidden,

              cl::desc("Enable control height reduction optimization (CHR)"));


static cl::opt<bool> FlattenedProfileUsed(

    "flattened-profile-used", cl::init(false), cl::Hidden,

    cl::desc("Indicate the sample profile being used is flattened, i.e., "

             "no inline hierarchy exists in the profile"));


static cl::opt<bool>

    EnableMatrix("enable-matrix", cl::init(false), cl::Hidden,

                 cl::desc("Enable lowering of the matrix intrinsics"));


static cl::opt<bool> EnableConstraintElimination(

    "enable-constraint-elimination", cl::init(true), cl::Hidden,

    cl::desc(

        "Enable pass to eliminate conditions based on linear constraints"));


static cl::opt<AttributorRunOption> AttributorRun(

    "attributor-enable", cl::Hidden, cl::init(AttributorRunOption::NONE),

    cl::desc("Enable the attributor inter-procedural deduction pass"),

    cl::values(clEnumValN(AttributorRunOption::ALL, "all",

                          "enable all attributor runs"),

               clEnumValN(AttributorRunOption::MODULE, "module",

                          "enable module-wide attributor runs"),

               clEnumValN(AttributorRunOption::CGSCC, "cgscc",

                          "enable call graph SCC attributor runs"),

               clEnumValN(AttributorRunOption::NONE, "none",

                          "disable attributor runs")));


static cl::opt<bool> EnableSampledInstr(

    "enable-sampled-instrumentation", cl::init(false), cl::Hidden,

    cl::desc("Enable profile instrumentation sampling (default = off)"));

static cl::opt<bool> UseLoopVersioningLICM(

    "enable-loop-versioning-licm", cl::init(false), cl::Hidden,

    cl::desc("Enable the experimental Loop Versioning LICM pass"));


static cl::opt<std::string> InstrumentColdFuncOnlyPath(

    "instrument-cold-function-only-path", cl::init(""),

    cl::desc("File path for cold function only instrumentation(requires use "

             "with --pgo-instrument-cold-function-only)"),

    cl::Hidden);


extern cl::opt<std::string> UseCtxProfile;

extern cl::opt<bool> PGOInstrumentColdFunctionOnly;


namespace llvm {

extern cl::opt<bool> EnableMemProfContextDisambiguation;

} // namespace llvm


PipelineTuningOptions::PipelineTuningOptions() {

  LoopInterleaving = true;

  LoopVectorization = true;

  SLPVectorization = false;

  LoopUnrolling = true;

  LoopInterchange = EnableLoopInterchange;

  LoopFusion = false;

  ForgetAllSCEVInLoopUnroll = ForgetSCEVInLoopUnroll;

  LicmMssaOptCap = SetLicmMssaOptCap;

  LicmMssaNoAccForPromotionCap = SetLicmMssaNoAccForPromotionCap;

  CallGraphProfile = true;

  UnifiedLTO = false;

  MergeFunctions = EnableMergeFunctions;

  InlinerThreshold = -1;

  EagerlyInvalidateAnalyses = EnableEagerlyInvalidateAnalyses;

}


namespace llvm {

extern cl::opt<unsigned> MaxDevirtIterations;

} // namespace llvm


void PassBuilder::invokePeepholeEPCallbacks(FunctionPassManager &FPM,

                                            OptimizationLevel Level) {

  for (auto &C : PeepholeEPCallbacks)

    C(FPM, Level);

}


void PassBuilder::invokeLateLoopOptimizationsEPCallbacks(

    LoopPassManager &LPM, OptimizationLevel Level) {

  for (auto &C : LateLoopOptimizationsEPCallbacks)

    C(LPM, Level);

}


void PassBuilder::invokeLoopOptimizerEndEPCallbacks(LoopPassManager &LPM,

                                                    OptimizationLevel Level) {

  for (auto &C : LoopOptimizerEndEPCallbacks)

    C(LPM, Level);

}


void PassBuilder::invokeScalarOptimizerLateEPCallbacks(

    FunctionPassManager &FPM, OptimizationLevel Level) {

  for (auto &C : ScalarOptimizerLateEPCallbacks)

    C(FPM, Level);

}


void PassBuilder::invokeCGSCCOptimizerLateEPCallbacks(CGSCCPassManager &CGPM,

                                                      OptimizationLevel Level) {

  for (auto &C : CGSCCOptimizerLateEPCallbacks)

    C(CGPM, Level);

}


void PassBuilder::invokeVectorizerStartEPCallbacks(FunctionPassManager &FPM,

                                                   OptimizationLevel Level) {

  for (auto &C : VectorizerStartEPCallbacks)

    C(FPM, Level);

}


void PassBuilder::invokeVectorizerEndEPCallbacks(FunctionPassManager &FPM,

                                                 OptimizationLevel Level) {

  for (auto &C : VectorizerEndEPCallbacks)

    C(FPM, Level);

}


void PassBuilder::invokeOptimizerEarlyEPCallbacks(ModulePassManager &MPM,

                                                  OptimizationLevel Level,

                                                  ThinOrFullLTOPhase Phase) {

  for (auto &C : OptimizerEarlyEPCallbacks)

    C(MPM, Level, Phase);

}


void PassBuilder::invokeOptimizerLastEPCallbacks(ModulePassManager &MPM,

                                                 OptimizationLevel Level,

                                                 ThinOrFullLTOPhase Phase) {

  for (auto &C : OptimizerLastEPCallbacks)

    C(MPM, Level, Phase);

}


void PassBuilder::invokeFullLinkTimeOptimizationEarlyEPCallbacks(

    ModulePassManager &MPM, OptimizationLevel Level) {

  for (auto &C : FullLinkTimeOptimizationEarlyEPCallbacks)

    C(MPM, Level);

}


void PassBuilder::invokeFullLinkTimeOptimizationLastEPCallbacks(

    ModulePassManager &MPM, OptimizationLevel Level) {

  for (auto &C : FullLinkTimeOptimizationLastEPCallbacks)

    C(MPM, Level);

}


void PassBuilder::invokePipelineStartEPCallbacks(ModulePassManager &MPM,

                                                 OptimizationLevel Level) {

  for (auto &C : PipelineStartEPCallbacks)

    C(MPM, Level);

}


void PassBuilder::invokePipelineEarlySimplificationEPCallbacks(

    ModulePassManager &MPM, OptimizationLevel Level, ThinOrFullLTOPhase Phase) {

  for (auto &C : PipelineEarlySimplificationEPCallbacks)

    C(MPM, Level, Phase);

}


// Helper to add AnnotationRemarksPass.


static void addAnnotationRemarksPass(ModulePassManager &MPM) {

  MPM.addPass(createModuleToFunctionPassAdaptor(AnnotationRemarksPass()));

}


// Helper to check if the current compilation phase is preparing for LTO


static bool isLTOPreLink(ThinOrFullLTOPhase Phase) {

  return Phase == ThinOrFullLTOPhase::ThinLTOPreLink ||

         Phase == ThinOrFullLTOPhase::FullLTOPreLink;

}


// Helper to check if the current compilation phase is LTO backend


static bool isLTOPostLink(ThinOrFullLTOPhase Phase) {

  return Phase == ThinOrFullLTOPhase::ThinLTOPostLink ||

         Phase == ThinOrFullLTOPhase::FullLTOPostLink;

}


// Helper to wrap conditionally Coro passes.


static CoroConditionalWrapper buildCoroWrapper(ThinOrFullLTOPhase Phase) {

  // TODO: Skip passes according to Phase.

  ModulePassManager CoroPM;

  CoroPM.addPass(CoroEarlyPass());

  CGSCCPassManager CGPM;

  CGPM.addPass(CoroSplitPass());

  CoroPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(std::move(CGPM)));

  CoroPM.addPass(CoroCleanupPass());

  CoroPM.addPass(GlobalDCEPass());

  return CoroConditionalWrapper(std::move(CoroPM));

}


// TODO: Investigate the cost/benefit of tail call elimination on debugging.

FunctionPassManager

PassBuilder::buildO1FunctionSimplificationPipeline(OptimizationLevel Level,

                                                   ThinOrFullLTOPhase Phase) {


  FunctionPassManager FPM;


  if (AreStatisticsEnabled())

    FPM.addPass(CountVisitsPass());


  // Form SSA out of local memory accesses after breaking apart aggregates into

  // scalars.

  FPM.addPass(SROAPass(SROAOptions::ModifyCFG));


  // Catch trivial redundancies

  FPM.addPass(EarlyCSEPass(true /* Enable mem-ssa. */));


  // Hoisting of scalars and load expressions.

  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  FPM.addPass(InstCombinePass());


  FPM.addPass(LibCallsShrinkWrapPass());


  invokePeepholeEPCallbacks(FPM, Level);


  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));


  // Form canonically associated expression trees, and simplify the trees using

  // basic mathematical properties. For example, this will form (nearly)

  // minimal multiplication trees.

  FPM.addPass(ReassociatePass());


  // Add the primary loop simplification pipeline.

  // FIXME: Currently this is split into two loop pass pipelines because we run

  // some function passes in between them. These can and should be removed

  // and/or replaced by scheduling the loop pass equivalents in the correct

  // positions. But those equivalent passes aren't powerful enough yet.

  // Specifically, `SimplifyCFGPass` and `InstCombinePass` are currently still

  // used. We have `LoopSimplifyCFGPass` which isn't yet powerful enough yet to

  // fully replace `SimplifyCFGPass`, and the closest to the other we have is

  // `LoopInstSimplify`.

  LoopPassManager LPM1, LPM2;


  // Simplify the loop body. We do this initially to clean up after other loop

  // passes run, either when iterating on a loop or on inner loops with

  // implications on the outer loop.

  LPM1.addPass(LoopInstSimplifyPass());

  LPM1.addPass(LoopSimplifyCFGPass());


  // Try to remove as much code from the loop header as possible,

  // to reduce amount of IR that will have to be duplicated. However,

  // do not perform speculative hoisting the first time as LICM

  // will destroy metadata that may not need to be destroyed if run

  // after loop rotation.

  // TODO: Investigate promotion cap for O1.

  LPM1.addPass(LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

                        /*AllowSpeculation=*/false));


  LPM1.addPass(LoopRotatePass(/* Disable header duplication */ true,

                              isLTOPreLink(Phase)));

  // TODO: Investigate promotion cap for O1.

  LPM1.addPass(LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

                        /*AllowSpeculation=*/true));

  LPM1.addPass(SimpleLoopUnswitchPass());

  if (EnableLoopFlatten)

    LPM1.addPass(LoopFlattenPass());


  LPM2.addPass(LoopIdiomRecognizePass());

  LPM2.addPass(IndVarSimplifyPass());


  invokeLateLoopOptimizationsEPCallbacks(LPM2, Level);


  LPM2.addPass(LoopDeletionPass());


  // Do not enable unrolling in PreLinkThinLTO phase during sample PGO

  // because it changes IR to makes profile annotation in back compile

  // inaccurate. The normal unroller doesn't pay attention to forced full unroll

  // attributes so we need to make sure and allow the full unroll pass to pay

  // attention to it.

  if (Phase != ThinOrFullLTOPhase::ThinLTOPreLink || !PGOOpt ||

      PGOOpt->Action != PGOOptions::SampleUse)

    LPM2.addPass(LoopFullUnrollPass(Level.getSpeedupLevel(),

                                    /* OnlyWhenForced= */ !PTO.LoopUnrolling,

                                    PTO.ForgetAllSCEVInLoopUnroll));


  invokeLoopOptimizerEndEPCallbacks(LPM2, Level);


  FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM1),

                                              /*UseMemorySSA=*/true,

                                              /*UseBlockFrequencyInfo=*/true));

  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  FPM.addPass(InstCombinePass());

  // The loop passes in LPM2 (LoopFullUnrollPass) do not preserve MemorySSA.

  // *All* loop passes must preserve it, in order to be able to use it.

  FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM2),

                                              /*UseMemorySSA=*/false,

                                              /*UseBlockFrequencyInfo=*/false));


  // Delete small array after loop unroll.

  FPM.addPass(SROAPass(SROAOptions::ModifyCFG));


  // Specially optimize memory movement as it doesn't look like dataflow in SSA.

  FPM.addPass(MemCpyOptPass());


  // Sparse conditional constant propagation.

  // FIXME: It isn't clear why we do this *after* loop passes rather than

  // before...

  FPM.addPass(SCCPPass());


  // Delete dead bit computations (instcombine runs after to fold away the dead

  // computations, and then ADCE will run later to exploit any new DCE

  // opportunities that creates).

  FPM.addPass(BDCEPass());


  // Run instcombine after redundancy and dead bit elimination to exploit

  // opportunities opened up by them.

  FPM.addPass(InstCombinePass());

  invokePeepholeEPCallbacks(FPM, Level);


  FPM.addPass(CoroElidePass());


  invokeScalarOptimizerLateEPCallbacks(FPM, Level);


  // Finally, do an expensive DCE pass to catch all the dead code exposed by

  // the simplifications and basic cleanup after all the simplifications.

  // TODO: Investigate if this is too expensive.

  FPM.addPass(ADCEPass());

  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  FPM.addPass(InstCombinePass());

  invokePeepholeEPCallbacks(FPM, Level);


  return FPM;

}


FunctionPassManager


PassBuilder::buildFunctionSimplificationPipeline(OptimizationLevel Level,

                                                 ThinOrFullLTOPhase Phase) {

  assert(Level != OptimizationLevel::O0 && "Must request optimizations!");


  // The O1 pipeline has a separate pipeline creation function to simplify

  // construction readability.

  if (Level.getSpeedupLevel() == 1)

    return buildO1FunctionSimplificationPipeline(Level, Phase);


  FunctionPassManager FPM;


  if (AreStatisticsEnabled())

    FPM.addPass(CountVisitsPass());


  // Form SSA out of local memory accesses after breaking apart aggregates into

  // scalars.

  FPM.addPass(SROAPass(SROAOptions::ModifyCFG));


  // Catch trivial redundancies

  FPM.addPass(EarlyCSEPass(true /* Enable mem-ssa. */));

  if (EnableKnowledgeRetention)

    FPM.addPass(AssumeSimplifyPass());


  // Hoisting of scalars and load expressions.

  if (EnableGVNHoist)

    FPM.addPass(GVNHoistPass());


  // Global value numbering based sinking.

  if (EnableGVNSink) {

    FPM.addPass(GVNSinkPass());

    FPM.addPass(

        SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  }


  // Speculative execution if the target has divergent branches; otherwise nop.

  FPM.addPass(SpeculativeExecutionPass(/* OnlyIfDivergentTarget =*/true));


  // Optimize based on known information about branches, and cleanup afterward.

  FPM.addPass(JumpThreadingPass());

  FPM.addPass(CorrelatedValuePropagationPass());


  // Jump table to switch conversion.

  if (EnableJumpTableToSwitch)

    FPM.addPass(JumpTableToSwitchPass());


  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  FPM.addPass(InstCombinePass());

  FPM.addPass(AggressiveInstCombinePass());


  if (!Level.isOptimizingForSize())

    FPM.addPass(LibCallsShrinkWrapPass());


  invokePeepholeEPCallbacks(FPM, Level);


  // For PGO use pipeline, try to optimize memory intrinsics such as memcpy

  // using the size value profile. Don't perform this when optimizing for size.

  if (PGOOpt && PGOOpt->Action == PGOOptions::IRUse &&

      !Level.isOptimizingForSize())

    FPM.addPass(PGOMemOPSizeOpt());


  FPM.addPass(TailCallElimPass(/*UpdateFunctionEntryCount=*/

                               isInstrumentedPGOUse()));

  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));


  // Form canonically associated expression trees, and simplify the trees using

  // basic mathematical properties. For example, this will form (nearly)

  // minimal multiplication trees.

  FPM.addPass(ReassociatePass());


  if (EnableConstraintElimination)

    FPM.addPass(ConstraintEliminationPass());


  // Add the primary loop simplification pipeline.

  // FIXME: Currently this is split into two loop pass pipelines because we run

  // some function passes in between them. These can and should be removed

  // and/or replaced by scheduling the loop pass equivalents in the correct

  // positions. But those equivalent passes aren't powerful enough yet.

  // Specifically, `SimplifyCFGPass` and `InstCombinePass` are currently still

  // used. We have `LoopSimplifyCFGPass` which isn't yet powerful enough yet to

  // fully replace `SimplifyCFGPass`, and the closest to the other we have is

  // `LoopInstSimplify`.

  LoopPassManager LPM1, LPM2;


  // Simplify the loop body. We do this initially to clean up after other loop

  // passes run, either when iterating on a loop or on inner loops with

  // implications on the outer loop.

  LPM1.addPass(LoopInstSimplifyPass());

  LPM1.addPass(LoopSimplifyCFGPass());


  // Try to remove as much code from the loop header as possible,

  // to reduce amount of IR that will have to be duplicated. However,

  // do not perform speculative hoisting the first time as LICM

  // will destroy metadata that may not need to be destroyed if run

  // after loop rotation.

  // TODO: Investigate promotion cap for O1.

  LPM1.addPass(LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

                        /*AllowSpeculation=*/false));


  // Disable header duplication in loop rotation at -Oz.

  LPM1.addPass(LoopRotatePass(EnableLoopHeaderDuplication ||

                                  Level != OptimizationLevel::Oz,

                              isLTOPreLink(Phase)));

  // TODO: Investigate promotion cap for O1.

  LPM1.addPass(LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

                        /*AllowSpeculation=*/true));

  LPM1.addPass(

      SimpleLoopUnswitchPass(/* NonTrivial */ Level == OptimizationLevel::O3));

  if (EnableLoopFlatten)

    LPM1.addPass(LoopFlattenPass());


  LPM2.addPass(LoopIdiomRecognizePass());

  LPM2.addPass(IndVarSimplifyPass());


  {

    ExtraLoopPassManager<ShouldRunExtraSimpleLoopUnswitch> ExtraPasses;

    ExtraPasses.addPass(SimpleLoopUnswitchPass(/* NonTrivial */ Level ==

                                               OptimizationLevel::O3));

    LPM2.addPass(std::move(ExtraPasses));

  }


  invokeLateLoopOptimizationsEPCallbacks(LPM2, Level);


  LPM2.addPass(LoopDeletionPass());


  // Do not enable unrolling in PreLinkThinLTO phase during sample PGO

  // because it changes IR to makes profile annotation in back compile

  // inaccurate. The normal unroller doesn't pay attention to forced full unroll

  // attributes so we need to make sure and allow the full unroll pass to pay

  // attention to it.

  if (Phase != ThinOrFullLTOPhase::ThinLTOPreLink || !PGOOpt ||

      PGOOpt->Action != PGOOptions::SampleUse)

    LPM2.addPass(LoopFullUnrollPass(Level.getSpeedupLevel(),

                                    /* OnlyWhenForced= */ !PTO.LoopUnrolling,

                                    PTO.ForgetAllSCEVInLoopUnroll));


  invokeLoopOptimizerEndEPCallbacks(LPM2, Level);


  FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM1),

                                              /*UseMemorySSA=*/true,

                                              /*UseBlockFrequencyInfo=*/true));

  FPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  FPM.addPass(InstCombinePass());

  // The loop passes in LPM2 (LoopIdiomRecognizePass, IndVarSimplifyPass,

  // LoopDeletionPass and LoopFullUnrollPass) do not preserve MemorySSA.

  // *All* loop passes must preserve it, in order to be able to use it.

  FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM2),

                                              /*UseMemorySSA=*/false,

                                              /*UseBlockFrequencyInfo=*/false));


  // Delete small array after loop unroll.

  FPM.addPass(SROAPass(SROAOptions::ModifyCFG));


  // Try vectorization/scalarization transforms that are both improvements

  // themselves and can allow further folds with GVN and InstCombine.

  FPM.addPass(VectorCombinePass(/*TryEarlyFoldsOnly=*/true));


  // Eliminate redundancies.

  FPM.addPass(MergedLoadStoreMotionPass());

  if (RunNewGVN)

    FPM.addPass(NewGVNPass());

  else

    FPM.addPass(GVNPass());


  // Sparse conditional constant propagation.

  // FIXME: It isn't clear why we do this *after* loop passes rather than

  // before...

  FPM.addPass(SCCPPass());


  // Delete dead bit computations (instcombine runs after to fold away the dead

  // computations, and then ADCE will run later to exploit any new DCE

  // opportunities that creates).

  FPM.addPass(BDCEPass());


  // Run instcombine after redundancy and dead bit elimination to exploit

  // opportunities opened up by them.

  FPM.addPass(InstCombinePass());

  invokePeepholeEPCallbacks(FPM, Level);


  // Re-consider control flow based optimizations after redundancy elimination,

  // redo DCE, etc.

  if (EnableDFAJumpThreading)

    FPM.addPass(DFAJumpThreadingPass());


  FPM.addPass(JumpThreadingPass());

  FPM.addPass(CorrelatedValuePropagationPass());


  // Finally, do an expensive DCE pass to catch all the dead code exposed by

  // the simplifications and basic cleanup after all the simplifications.

  // TODO: Investigate if this is too expensive.

  FPM.addPass(ADCEPass());


  // Specially optimize memory movement as it doesn't look like dataflow in SSA.

  FPM.addPass(MemCpyOptPass());


  FPM.addPass(DSEPass());

  FPM.addPass(MoveAutoInitPass());


  FPM.addPass(createFunctionToLoopPassAdaptor(

      LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

               /*AllowSpeculation=*/true),

      /*UseMemorySSA=*/true, /*UseBlockFrequencyInfo=*/false));


  FPM.addPass(CoroElidePass());


  invokeScalarOptimizerLateEPCallbacks(FPM, Level);


  FPM.addPass(SimplifyCFGPass(SimplifyCFGOptions()

                                  .convertSwitchRangeToICmp(true)

                                  .hoistCommonInsts(true)

                                  .sinkCommonInsts(true)));

  FPM.addPass(InstCombinePass());

  invokePeepholeEPCallbacks(FPM, Level);


  return FPM;

}


void PassBuilder::addRequiredLTOPreLinkPasses(ModulePassManager &MPM) {

  MPM.addPass(CanonicalizeAliasesPass());

  MPM.addPass(NameAnonGlobalPass());

}


void PassBuilder::addPreInlinerPasses(ModulePassManager &MPM,

                                      OptimizationLevel Level,

                                      ThinOrFullLTOPhase LTOPhase) {

  assert(Level != OptimizationLevel::O0 && "Not expecting O0 here!");

  if (DisablePreInliner)

    return;

  InlineParams IP;


  IP.DefaultThreshold = PreInlineThreshold;


  // FIXME: The hint threshold has the same value used by the regular inliner

  // when not optimzing for size. This should probably be lowered after

  // performance testing.

  // FIXME: this comment is cargo culted from the old pass manager, revisit).

  IP.HintThreshold = Level.isOptimizingForSize() ? PreInlineThreshold : 325;

  ModuleInlinerWrapperPass MIWP(

      IP, /* MandatoryFirst */ true,

      InlineContext{LTOPhase, InlinePass::EarlyInliner});

  CGSCCPassManager &CGPipeline = MIWP.getPM();


  FunctionPassManager FPM;

  FPM.addPass(SROAPass(SROAOptions::ModifyCFG));

  FPM.addPass(EarlyCSEPass()); // Catch trivial redundancies.

  FPM.addPass(SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(

      true)));                    // Merge & remove basic blocks.

  FPM.addPass(InstCombinePass()); // Combine silly sequences.

  invokePeepholeEPCallbacks(FPM, Level);


  CGPipeline.addPass(createCGSCCToFunctionPassAdaptor(

      std::move(FPM), PTO.EagerlyInvalidateAnalyses));


  MPM.addPass(std::move(MIWP));


  // Delete anything that is now dead to make sure that we don't instrument

  // dead code. Instrumentation can end up keeping dead code around and

  // dramatically increase code size.

  MPM.addPass(GlobalDCEPass());

}


void PassBuilder::addPostPGOLoopRotation(ModulePassManager &MPM,

                                         OptimizationLevel Level) {

  if (EnablePostPGOLoopRotation) {

    // Disable header duplication in loop rotation at -Oz.

    MPM.addPass(createModuleToFunctionPassAdaptor(

        createFunctionToLoopPassAdaptor(

            LoopRotatePass(EnableLoopHeaderDuplication ||

                           Level != OptimizationLevel::Oz),

            /*UseMemorySSA=*/false,

            /*UseBlockFrequencyInfo=*/false),

        PTO.EagerlyInvalidateAnalyses));

  }

}


void PassBuilder::addPGOInstrPasses(ModulePassManager &MPM,

                                    OptimizationLevel Level, bool RunProfileGen,

                                    bool IsCS, bool AtomicCounterUpdate,

                                    std::string ProfileFile,

                                    std::string ProfileRemappingFile,

                                    IntrusiveRefCntPtr<vfs::FileSystem> FS) {

  assert(Level != OptimizationLevel::O0 && "Not expecting O0 here!");


  if (!RunProfileGen) {

    assert(!ProfileFile.empty() && "Profile use expecting a profile file!");

    MPM.addPass(

        PGOInstrumentationUse(ProfileFile, ProfileRemappingFile, IsCS, FS));

    // Cache ProfileSummaryAnalysis once to avoid the potential need to insert

    // RequireAnalysisPass for PSI before subsequent non-module passes.

    MPM.addPass(RequireAnalysisPass<ProfileSummaryAnalysis, Module>());

    return;

  }


  // Perform PGO instrumentation.

  MPM.addPass(PGOInstrumentationGen(IsCS ? PGOInstrumentationType::CSFDO

                                         : PGOInstrumentationType::FDO));


  addPostPGOLoopRotation(MPM, Level);

  // Add the profile lowering pass.

  InstrProfOptions Options;

  if (!ProfileFile.empty())

    Options.InstrProfileOutput = ProfileFile;

  // Do counter promotion at Level greater than O0.

  Options.DoCounterPromotion = true;

  Options.UseBFIInPromotion = IsCS;

  if (EnableSampledInstr) {

    Options.Sampling = true;

    // With sampling, there is little beneifit to enable counter promotion.

    // But note that sampling does work with counter promotion.

    Options.DoCounterPromotion = false;

  }

  Options.Atomic = AtomicCounterUpdate;

  MPM.addPass(InstrProfilingLoweringPass(Options, IsCS));

}


void PassBuilder::addPGOInstrPassesForO0(

    ModulePassManager &MPM, bool RunProfileGen, bool IsCS,

    bool AtomicCounterUpdate, std::string ProfileFile,

    std::string ProfileRemappingFile, IntrusiveRefCntPtr<vfs::FileSystem> FS) {

  if (!RunProfileGen) {

    assert(!ProfileFile.empty() && "Profile use expecting a profile file!");

    MPM.addPass(

        PGOInstrumentationUse(ProfileFile, ProfileRemappingFile, IsCS, FS));

    // Cache ProfileSummaryAnalysis once to avoid the potential need to insert

    // RequireAnalysisPass for PSI before subsequent non-module passes.

    MPM.addPass(RequireAnalysisPass<ProfileSummaryAnalysis, Module>());

    return;

  }


  // Perform PGO instrumentation.

  MPM.addPass(PGOInstrumentationGen(IsCS ? PGOInstrumentationType::CSFDO

                                         : PGOInstrumentationType::FDO));

  // Add the profile lowering pass.

  InstrProfOptions Options;

  if (!ProfileFile.empty())

    Options.InstrProfileOutput = ProfileFile;

  // Do not do counter promotion at O0.

  Options.DoCounterPromotion = false;

  Options.UseBFIInPromotion = IsCS;

  Options.Atomic = AtomicCounterUpdate;

  MPM.addPass(InstrProfilingLoweringPass(Options, IsCS));

}


static InlineParams getInlineParamsFromOptLevel(OptimizationLevel Level) {

  return getInlineParams(Level.getSpeedupLevel(), Level.getSizeLevel());

}


ModuleInlinerWrapperPass


PassBuilder::buildInlinerPipeline(OptimizationLevel Level,

                                  ThinOrFullLTOPhase Phase) {

  InlineParams IP;

  if (PTO.InlinerThreshold == -1)

    IP = getInlineParamsFromOptLevel(Level);

  else

    IP = getInlineParams(PTO.InlinerThreshold);

  // For PreLinkThinLTO + SamplePGO or PreLinkFullLTO + SamplePGO,

  // set hot-caller threshold to 0 to disable hot

  // callsite inline (as much as possible [1]) because it makes

  // profile annotation in the backend inaccurate.

  //

  // [1] Note the cost of a function could be below zero due to erased

  // prologue / epilogue.

  if (isLTOPreLink(Phase) && PGOOpt && PGOOpt->Action == PGOOptions::SampleUse)

    IP.HotCallSiteThreshold = 0;


  if (PGOOpt)

    IP.EnableDeferral = EnablePGOInlineDeferral;


  ModuleInlinerWrapperPass MIWP(IP, PerformMandatoryInliningsFirst,

                                InlineContext{Phase, InlinePass::CGSCCInliner},

                                UseInlineAdvisor, MaxDevirtIterations);


  // Require the GlobalsAA analysis for the module so we can query it within

  // the CGSCC pipeline.

  if (EnableGlobalAnalyses) {

    MIWP.addModulePass(RequireAnalysisPass<GlobalsAA, Module>());

    // Invalidate AAManager so it can be recreated and pick up the newly

    // available GlobalsAA.

    MIWP.addModulePass(

        createModuleToFunctionPassAdaptor(InvalidateAnalysisPass<AAManager>()));

  }


  // Require the ProfileSummaryAnalysis for the module so we can query it within

  // the inliner pass.

  MIWP.addModulePass(RequireAnalysisPass<ProfileSummaryAnalysis, Module>());


  // Now begin the main postorder CGSCC pipeline.

  // FIXME: The current CGSCC pipeline has its origins in the legacy pass

  // manager and trying to emulate its precise behavior. Much of this doesn't

  // make a lot of sense and we should revisit the core CGSCC structure.

  CGSCCPassManager &MainCGPipeline = MIWP.getPM();


  // Note: historically, the PruneEH pass was run first to deduce nounwind and

  // generally clean up exception handling overhead. It isn't clear this is

  // valuable as the inliner doesn't currently care whether it is inlining an

  // invoke or a call.


  if (AttributorRun & AttributorRunOption::CGSCC)

    MainCGPipeline.addPass(AttributorCGSCCPass());


  // Deduce function attributes. We do another run of this after the function

  // simplification pipeline, so this only needs to run when it could affect the

  // function simplification pipeline, which is only the case with recursive

  // functions.

  MainCGPipeline.addPass(PostOrderFunctionAttrsPass(/*SkipNonRecursive*/ true));


  // When at O3 add argument promotion to the pass pipeline.

  // FIXME: It isn't at all clear why this should be limited to O3.

  if (Level == OptimizationLevel::O3)

    MainCGPipeline.addPass(ArgumentPromotionPass());


  // Try to perform OpenMP specific optimizations. This is a (quick!) no-op if

  // there are no OpenMP runtime calls present in the module.

  if (Level == OptimizationLevel::O2 || Level == OptimizationLevel::O3)

    MainCGPipeline.addPass(OpenMPOptCGSCCPass(Phase));


  invokeCGSCCOptimizerLateEPCallbacks(MainCGPipeline, Level);


  // Add the core function simplification pipeline nested inside the

  // CGSCC walk.

  MainCGPipeline.addPass(createCGSCCToFunctionPassAdaptor(

      buildFunctionSimplificationPipeline(Level, Phase),

      PTO.EagerlyInvalidateAnalyses, /*NoRerun=*/true));


  // Finally, deduce any function attributes based on the fully simplified

  // function.

  MainCGPipeline.addPass(PostOrderFunctionAttrsPass());


  // Mark that the function is fully simplified and that it shouldn't be

  // simplified again if we somehow revisit it due to CGSCC mutations unless

  // it's been modified since.

  MainCGPipeline.addPass(createCGSCCToFunctionPassAdaptor(

      RequireAnalysisPass<ShouldNotRunFunctionPassesAnalysis, Function>()));


  if (Phase != ThinOrFullLTOPhase::ThinLTOPreLink) {

    MainCGPipeline.addPass(CoroSplitPass(Level != OptimizationLevel::O0));

    MainCGPipeline.addPass(CoroAnnotationElidePass());

  }


  // Make sure we don't affect potential future NoRerun CGSCC adaptors.

  MIWP.addLateModulePass(createModuleToFunctionPassAdaptor(

      InvalidateAnalysisPass<ShouldNotRunFunctionPassesAnalysis>()));


  return MIWP;

}


ModulePassManager


PassBuilder::buildModuleInlinerPipeline(OptimizationLevel Level,

                                        ThinOrFullLTOPhase Phase) {

  ModulePassManager MPM;


  InlineParams IP = getInlineParamsFromOptLevel(Level);

  // For PreLinkThinLTO + SamplePGO or PreLinkFullLTO + SamplePGO,

  // set hot-caller threshold to 0 to disable hot

  // callsite inline (as much as possible [1]) because it makes

  // profile annotation in the backend inaccurate.

  //

  // [1] Note the cost of a function could be below zero due to erased

  // prologue / epilogue.

  if (isLTOPreLink(Phase) && PGOOpt && PGOOpt->Action == PGOOptions::SampleUse)

    IP.HotCallSiteThreshold = 0;


  if (PGOOpt)

    IP.EnableDeferral = EnablePGOInlineDeferral;


  // The inline deferral logic is used to avoid losing some

  // inlining chance in future. It is helpful in SCC inliner, in which

  // inlining is processed in bottom-up order.

  // While in module inliner, the inlining order is a priority-based order

  // by default. The inline deferral is unnecessary there. So we disable the

  // inline deferral logic in module inliner.

  IP.EnableDeferral = false;


  MPM.addPass(ModuleInlinerPass(IP, UseInlineAdvisor, Phase));

  if (!UseCtxProfile.empty() && Phase == ThinOrFullLTOPhase::ThinLTOPostLink) {

    MPM.addPass(GlobalOptPass());

    MPM.addPass(GlobalDCEPass());

    MPM.addPass(PGOCtxProfFlatteningPass(/*IsPreThinlink=*/false));

  }


  MPM.addPass(createModuleToFunctionPassAdaptor(

      buildFunctionSimplificationPipeline(Level, Phase),

      PTO.EagerlyInvalidateAnalyses));


  if (Phase != ThinOrFullLTOPhase::ThinLTOPreLink) {

    MPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(

        CoroSplitPass(Level != OptimizationLevel::O0)));

    MPM.addPass(

        createModuleToPostOrderCGSCCPassAdaptor(CoroAnnotationElidePass()));

  }


  return MPM;

}


ModulePassManager


PassBuilder::buildModuleSimplificationPipeline(OptimizationLevel Level,

                                               ThinOrFullLTOPhase Phase) {

  assert(Level != OptimizationLevel::O0 &&

         "Should not be used for O0 pipeline");


  assert(Phase != ThinOrFullLTOPhase::FullLTOPostLink &&

         "FullLTOPostLink shouldn't call buildModuleSimplificationPipeline!");


  ModulePassManager MPM;


  // Place pseudo probe instrumentation as the first pass of the pipeline to

  // minimize the impact of optimization changes.

  if (PGOOpt && PGOOpt->PseudoProbeForProfiling &&

      Phase != ThinOrFullLTOPhase::ThinLTOPostLink)

    MPM.addPass(SampleProfileProbePass(TM));


  bool HasSampleProfile = PGOOpt && (PGOOpt->Action == PGOOptions::SampleUse);


  // In ThinLTO mode, when flattened profile is used, all the available

  // profile information will be annotated in PreLink phase so there is

  // no need to load the profile again in PostLink.

  bool LoadSampleProfile =

      HasSampleProfile &&

      !(FlattenedProfileUsed && Phase == ThinOrFullLTOPhase::ThinLTOPostLink);


  // During the ThinLTO backend phase we perform early indirect call promotion

  // here, before globalopt. Otherwise imported available_externally functions

  // look unreferenced and are removed. If we are going to load the sample

  // profile then defer until later.

  // TODO: See if we can move later and consolidate with the location where

  // we perform ICP when we are loading a sample profile.

  // TODO: We pass HasSampleProfile (whether there was a sample profile file

  // passed to the compile) to the SamplePGO flag of ICP. This is used to

  // determine whether the new direct calls are annotated with prof metadata.

  // Ideally this should be determined from whether the IR is annotated with

  // sample profile, and not whether the a sample profile was provided on the

  // command line. E.g. for flattened profiles where we will not be reloading

  // the sample profile in the ThinLTO backend, we ideally shouldn't have to

  // provide the sample profile file.

  if (Phase == ThinOrFullLTOPhase::ThinLTOPostLink && !LoadSampleProfile)

    MPM.addPass(PGOIndirectCallPromotion(true /* InLTO */, HasSampleProfile));


  // Create an early function pass manager to cleanup the output of the

  // frontend. Not necessary with LTO post link pipelines since the pre link

  // pipeline already cleaned up the frontend output.

  if (Phase != ThinOrFullLTOPhase::ThinLTOPostLink) {

    // Do basic inference of function attributes from known properties of system

    // libraries and other oracles.

    MPM.addPass(InferFunctionAttrsPass());

    MPM.addPass(CoroEarlyPass());


    FunctionPassManager EarlyFPM;

    EarlyFPM.addPass(EntryExitInstrumenterPass(/*PostInlining=*/false));

    // Lower llvm.expect to metadata before attempting transforms.

    // Compare/branch metadata may alter the behavior of passes like

    // SimplifyCFG.

    EarlyFPM.addPass(LowerExpectIntrinsicPass());

    EarlyFPM.addPass(SimplifyCFGPass());

    EarlyFPM.addPass(SROAPass(SROAOptions::ModifyCFG));

    EarlyFPM.addPass(EarlyCSEPass());

    if (Level == OptimizationLevel::O3)

      EarlyFPM.addPass(CallSiteSplittingPass());

    MPM.addPass(createModuleToFunctionPassAdaptor(

        std::move(EarlyFPM), PTO.EagerlyInvalidateAnalyses));

  }


  if (LoadSampleProfile) {

    // Annotate sample profile right after early FPM to ensure freshness of

    // the debug info.

    MPM.addPass(SampleProfileLoaderPass(PGOOpt->ProfileFile,

                                        PGOOpt->ProfileRemappingFile, Phase));

    // Cache ProfileSummaryAnalysis once to avoid the potential need to insert

    // RequireAnalysisPass for PSI before subsequent non-module passes.

    MPM.addPass(RequireAnalysisPass<ProfileSummaryAnalysis, Module>());

    // Do not invoke ICP in the LTOPrelink phase as it makes it hard

    // for the profile annotation to be accurate in the LTO backend.

    if (!isLTOPreLink(Phase))

      // We perform early indirect call promotion here, before globalopt.

      // This is important for the ThinLTO backend phase because otherwise

      // imported available_externally functions look unreferenced and are

      // removed.

      MPM.addPass(

          PGOIndirectCallPromotion(true /* IsInLTO */, true /* SamplePGO */));

  }


  // Try to perform OpenMP specific optimizations on the module. This is a

  // (quick!) no-op if there are no OpenMP runtime calls present in the module.

  MPM.addPass(OpenMPOptPass(Phase));


  if (AttributorRun & AttributorRunOption::MODULE)

    MPM.addPass(AttributorPass());


  // Lower type metadata and the type.test intrinsic in the ThinLTO

  // post link pipeline after ICP. This is to enable usage of the type

  // tests in ICP sequences.

  if (Phase == ThinOrFullLTOPhase::ThinLTOPostLink)

    MPM.addPass(LowerTypeTestsPass(nullptr, nullptr,

                                   lowertypetests::DropTestKind::Assume));


  invokePipelineEarlySimplificationEPCallbacks(MPM, Level, Phase);


  // Interprocedural constant propagation now that basic cleanup has occurred

  // and prior to optimizing globals.

  // FIXME: This position in the pipeline hasn't been carefully considered in

  // years, it should be re-analyzed.

  MPM.addPass(IPSCCPPass(

              IPSCCPOptions(/*AllowFuncSpec=*/

                            Level != OptimizationLevel::Os &&

                            Level != OptimizationLevel::Oz &&

                            !isLTOPreLink(Phase))));


  // Attach metadata to indirect call sites indicating the set of functions

  // they may target at run-time. This should follow IPSCCP.

  MPM.addPass(CalledValuePropagationPass());


  // Optimize globals to try and fold them into constants.

  MPM.addPass(GlobalOptPass());


  // Create a small function pass pipeline to cleanup after all the global

  // optimizations.

  FunctionPassManager GlobalCleanupPM;

  // FIXME: Should this instead by a run of SROA?

  GlobalCleanupPM.addPass(PromotePass());

  GlobalCleanupPM.addPass(InstCombinePass());

  invokePeepholeEPCallbacks(GlobalCleanupPM, Level);

  GlobalCleanupPM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

  MPM.addPass(createModuleToFunctionPassAdaptor(std::move(GlobalCleanupPM),

                                                PTO.EagerlyInvalidateAnalyses));


  // We already asserted this happens in non-FullLTOPostLink earlier.

  const bool IsPreLink = Phase != ThinOrFullLTOPhase::ThinLTOPostLink;

  // Enable contextual profiling instrumentation.

  const bool IsCtxProfGen =

      IsPreLink && PGOCtxProfLoweringPass::isCtxIRPGOInstrEnabled();

  const bool IsPGOPreLink = !IsCtxProfGen && PGOOpt && IsPreLink;

  const bool IsPGOInstrGen =

      IsPGOPreLink && PGOOpt->Action == PGOOptions::IRInstr;

  const bool IsPGOInstrUse =

      IsPGOPreLink && PGOOpt->Action == PGOOptions::IRUse;

  const bool IsMemprofUse = IsPGOPreLink && !PGOOpt->MemoryProfile.empty();

  // We don't want to mix pgo ctx gen and pgo gen; we also don't currently

  // enable ctx profiling from the frontend.

  assert(!(IsPGOInstrGen && PGOCtxProfLoweringPass::isCtxIRPGOInstrEnabled()) &&

         "Enabling both instrumented PGO and contextual instrumentation is not "

         "supported.");

  const bool IsCtxProfUse =

      !UseCtxProfile.empty() && Phase == ThinOrFullLTOPhase::ThinLTOPreLink;


  assert(

      (InstrumentColdFuncOnlyPath.empty() || PGOInstrumentColdFunctionOnly) &&

      "--instrument-cold-function-only-path is provided but "

      "--pgo-instrument-cold-function-only is not enabled");

  const bool IsColdFuncOnlyInstrGen = PGOInstrumentColdFunctionOnly &&

                                      IsPGOPreLink &&

                                      !InstrumentColdFuncOnlyPath.empty();


  if (IsPGOInstrGen || IsPGOInstrUse || IsMemprofUse || IsCtxProfGen ||

      IsCtxProfUse || IsColdFuncOnlyInstrGen)

    addPreInlinerPasses(MPM, Level, Phase);


  // Add all the requested passes for instrumentation PGO, if requested.

  if (IsPGOInstrGen || IsPGOInstrUse) {

    addPGOInstrPasses(MPM, Level,

                      /*RunProfileGen=*/IsPGOInstrGen,

                      /*IsCS=*/false, PGOOpt->AtomicCounterUpdate,

                      PGOOpt->ProfileFile, PGOOpt->ProfileRemappingFile,

                      PGOOpt->FS);

  } else if (IsCtxProfGen || IsCtxProfUse) {

    MPM.addPass(PGOInstrumentationGen(PGOInstrumentationType::CTXPROF));

    // In pre-link, we just want the instrumented IR. We use the contextual

    // profile in the post-thinlink phase.

    // The instrumentation will be removed in post-thinlink after IPO.

    // FIXME(mtrofin): move AssignGUIDPass if there is agreement to use this

    // mechanism for GUIDs.

    MPM.addPass(AssignGUIDPass());

    if (IsCtxProfUse) {

      MPM.addPass(PGOCtxProfFlatteningPass(/*IsPreThinlink=*/true));

      return MPM;

    }

    // Block further inlining in the instrumented ctxprof case. This avoids

    // confusingly collecting profiles for the same GUID corresponding to

    // different variants of the function. We could do like PGO and identify

    // functions by a (GUID, Hash) tuple, but since the ctxprof "use" waits for

    // thinlto to happen before performing any further optimizations, it's

    // unnecessary to collect profiles for non-prevailing copies.

    MPM.addPass(NoinlineNonPrevailing());

    addPostPGOLoopRotation(MPM, Level);

    MPM.addPass(PGOCtxProfLoweringPass());

  } else if (IsColdFuncOnlyInstrGen) {

    addPGOInstrPasses(

        MPM, Level, /* RunProfileGen */ true, /* IsCS */ false,

        /* AtomicCounterUpdate */ false, InstrumentColdFuncOnlyPath,

        /* ProfileRemappingFile */ "", IntrusiveRefCntPtr<vfs::FileSystem>());

  }


  if (IsPGOInstrGen || IsPGOInstrUse || IsCtxProfGen)

    MPM.addPass(PGOIndirectCallPromotion(false, false));


  if (IsPGOPreLink && PGOOpt->CSAction == PGOOptions::CSIRInstr)

    MPM.addPass(PGOInstrumentationGenCreateVar(PGOOpt->CSProfileGenFile,

                                               EnableSampledInstr));


  if (IsMemprofUse)

    MPM.addPass(MemProfUsePass(PGOOpt->MemoryProfile, PGOOpt->FS));


  if (PGOOpt && (PGOOpt->Action == PGOOptions::IRUse ||

                 PGOOpt->Action == PGOOptions::SampleUse))

    MPM.addPass(PGOForceFunctionAttrsPass(PGOOpt->ColdOptType));


  MPM.addPass(AlwaysInlinerPass(/*InsertLifetimeIntrinsics=*/true));


  if (EnableModuleInliner)

    MPM.addPass(buildModuleInlinerPipeline(Level, Phase));

  else

    MPM.addPass(buildInlinerPipeline(Level, Phase));


  // Remove any dead arguments exposed by cleanups, constant folding globals,

  // and argument promotion.

  MPM.addPass(DeadArgumentEliminationPass());


  if (Phase == ThinOrFullLTOPhase::ThinLTOPostLink)

    MPM.addPass(SimplifyTypeTestsPass());


  if (Phase != ThinOrFullLTOPhase::ThinLTOPreLink)

    MPM.addPass(CoroCleanupPass());


  // Optimize globals now that functions are fully simplified.

  MPM.addPass(GlobalOptPass());

  MPM.addPass(GlobalDCEPass());


  return MPM;

}


/// TODO: Should LTO cause any differences to this set of passes?

void PassBuilder::addVectorPasses(OptimizationLevel Level,

                                  FunctionPassManager &FPM, bool IsFullLTO) {

  FPM.addPass(LoopVectorizePass(

      LoopVectorizeOptions(!PTO.LoopInterleaving, !PTO.LoopVectorization)));


  FPM.addPass(InferAlignmentPass());

  if (IsFullLTO) {

    // The vectorizer may have significantly shortened a loop body; unroll

    // again. Unroll small loops to hide loop backedge latency and saturate any

    // parallel execution resources of an out-of-order processor. We also then

    // need to clean up redundancies and loop invariant code.

    // FIXME: It would be really good to use a loop-integrated instruction

    // combiner for cleanup here so that the unrolling and LICM can be pipelined

    // across the loop nests.

    // We do UnrollAndJam in a separate LPM to ensure it happens before unroll

    if (EnableUnrollAndJam && PTO.LoopUnrolling)

      FPM.addPass(createFunctionToLoopPassAdaptor(

          LoopUnrollAndJamPass(Level.getSpeedupLevel())));

    FPM.addPass(LoopUnrollPass(LoopUnrollOptions(

        Level.getSpeedupLevel(), /*OnlyWhenForced=*/!PTO.LoopUnrolling,

        PTO.ForgetAllSCEVInLoopUnroll)));

    FPM.addPass(WarnMissedTransformationsPass());

    // Now that we are done with loop unrolling, be it either by LoopVectorizer,

    // or LoopUnroll passes, some variable-offset GEP's into alloca's could have

    // become constant-offset, thus enabling SROA and alloca promotion. Do so.

    // NOTE: we are very late in the pipeline, and we don't have any LICM

    // or SimplifyCFG passes scheduled after us, that would cleanup

    // the CFG mess this may created if allowed to modify CFG, so forbid that.

    FPM.addPass(SROAPass(SROAOptions::PreserveCFG));

  }


  if (!IsFullLTO) {

    // Eliminate loads by forwarding stores from the previous iteration to loads

    // of the current iteration.

    FPM.addPass(LoopLoadEliminationPass());

  }

  // Cleanup after the loop optimization passes.

  FPM.addPass(InstCombinePass());


  if (Level.getSpeedupLevel() > 1 && ExtraVectorizerPasses) {

    ExtraFunctionPassManager<ShouldRunExtraVectorPasses> ExtraPasses;

    // At higher optimization levels, try to clean up any runtime overlap and

    // alignment checks inserted by the vectorizer. We want to track correlated

    // runtime checks for two inner loops in the same outer loop, fold any

    // common computations, hoist loop-invariant aspects out of any outer loop,

    // and unswitch the runtime checks if possible. Once hoisted, we may have

    // dead (or speculatable) control flows or more combining opportunities.

    ExtraPasses.addPass(EarlyCSEPass());

    ExtraPasses.addPass(CorrelatedValuePropagationPass());

    ExtraPasses.addPass(InstCombinePass());

    LoopPassManager LPM;

    LPM.addPass(LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

                         /*AllowSpeculation=*/true));

    LPM.addPass(SimpleLoopUnswitchPass(/* NonTrivial */ Level ==

                                       OptimizationLevel::O3));

    ExtraPasses.addPass(

        createFunctionToLoopPassAdaptor(std::move(LPM), /*UseMemorySSA=*/true,

                                        /*UseBlockFrequencyInfo=*/true));

    ExtraPasses.addPass(

        SimplifyCFGPass(SimplifyCFGOptions().convertSwitchRangeToICmp(true)));

    ExtraPasses.addPass(InstCombinePass());

    FPM.addPass(std::move(ExtraPasses));

  }


  // Now that we've formed fast to execute loop structures, we do further

  // optimizations. These are run afterward as they might block doing complex

  // analyses and transforms such as what are needed for loop vectorization.


  // Cleanup after loop vectorization, etc. Simplification passes like CVP and

  // GVN, loop transforms, and others have already run, so it's now better to

  // convert to more optimized IR using more aggressive simplify CFG options.

  // The extra sinking transform can create larger basic blocks, so do this

  // before SLP vectorization.

  FPM.addPass(SimplifyCFGPass(SimplifyCFGOptions()

                                  .forwardSwitchCondToPhi(true)

                                  .convertSwitchRangeToICmp(true)

                                  .convertSwitchToLookupTable(true)

                                  .needCanonicalLoops(false)

                                  .hoistCommonInsts(true)

                                  .sinkCommonInsts(true)));


  if (IsFullLTO) {

    FPM.addPass(SCCPPass());

    FPM.addPass(InstCombinePass());

    FPM.addPass(BDCEPass());

  }


  // Optimize parallel scalar instruction chains into SIMD instructions.

  if (PTO.SLPVectorization) {

    FPM.addPass(SLPVectorizerPass());

    if (Level.getSpeedupLevel() > 1 && ExtraVectorizerPasses) {

      FPM.addPass(EarlyCSEPass());

    }

  }

  // Enhance/cleanup vector code.

  FPM.addPass(VectorCombinePass());


  if (!IsFullLTO) {

    FPM.addPass(InstCombinePass());

    // Unroll small loops to hide loop backedge latency and saturate any

    // parallel execution resources of an out-of-order processor. We also then

    // need to clean up redundancies and loop invariant code.

    // FIXME: It would be really good to use a loop-integrated instruction

    // combiner for cleanup here so that the unrolling and LICM can be pipelined

    // across the loop nests.

    // We do UnrollAndJam in a separate LPM to ensure it happens before unroll

    if (EnableUnrollAndJam && PTO.LoopUnrolling) {

      FPM.addPass(createFunctionToLoopPassAdaptor(

          LoopUnrollAndJamPass(Level.getSpeedupLevel())));

    }

    FPM.addPass(LoopUnrollPass(LoopUnrollOptions(

        Level.getSpeedupLevel(), /*OnlyWhenForced=*/!PTO.LoopUnrolling,

        PTO.ForgetAllSCEVInLoopUnroll)));

    FPM.addPass(WarnMissedTransformationsPass());

    // Now that we are done with loop unrolling, be it either by LoopVectorizer,

    // or LoopUnroll passes, some variable-offset GEP's into alloca's could have

    // become constant-offset, thus enabling SROA and alloca promotion. Do so.

    // NOTE: we are very late in the pipeline, and we don't have any LICM

    // or SimplifyCFG passes scheduled after us, that would cleanup

    // the CFG mess this may created if allowed to modify CFG, so forbid that.

    FPM.addPass(SROAPass(SROAOptions::PreserveCFG));

  }


  FPM.addPass(InferAlignmentPass());

  FPM.addPass(InstCombinePass());


  // This is needed for two reasons:

  //   1. It works around problems that instcombine introduces, such as sinking

  //      expensive FP divides into loops containing multiplications using the

  //      divide result.

  //   2. It helps to clean up some loop-invariant code created by the loop

  //      unroll pass when IsFullLTO=false.

  FPM.addPass(createFunctionToLoopPassAdaptor(

      LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

               /*AllowSpeculation=*/true),

      /*UseMemorySSA=*/true, /*UseBlockFrequencyInfo=*/false));


  // Now that we've vectorized and unrolled loops, we may have more refined

  // alignment information, try to re-derive it here.

  FPM.addPass(AlignmentFromAssumptionsPass());

}


ModulePassManager


PassBuilder::buildModuleOptimizationPipeline(OptimizationLevel Level,

                                             ThinOrFullLTOPhase LTOPhase) {

  const bool LTOPreLink = isLTOPreLink(LTOPhase);

  ModulePassManager MPM;


  // Run partial inlining pass to partially inline functions that have

  // large bodies.

  if (RunPartialInlining)

    MPM.addPass(PartialInlinerPass());


  // Remove avail extern fns and globals definitions since we aren't compiling

  // an object file for later LTO. For LTO we want to preserve these so they

  // are eligible for inlining at link-time. Note if they are unreferenced they

  // will be removed by GlobalDCE later, so this only impacts referenced

  // available externally globals. Eventually they will be suppressed during

  // codegen, but eliminating here enables more opportunity for GlobalDCE as it

  // may make globals referenced by available external functions dead and saves

  // running remaining passes on the eliminated functions. These should be

  // preserved during prelinking for link-time inlining decisions.

  if (!LTOPreLink)

    MPM.addPass(EliminateAvailableExternallyPass());


  // Do RPO function attribute inference across the module to forward-propagate

  // attributes where applicable.

  // FIXME: Is this really an optimization rather than a canonicalization?

  MPM.addPass(ReversePostOrderFunctionAttrsPass());


  // Do a post inline PGO instrumentation and use pass. This is a context

  // sensitive PGO pass. We don't want to do this in LTOPreLink phrase as

  // cross-module inline has not been done yet. The context sensitive

  // instrumentation is after all the inlines are done.

  if (!LTOPreLink && PGOOpt) {

    if (PGOOpt->CSAction == PGOOptions::CSIRInstr)

      addPGOInstrPasses(MPM, Level, /*RunProfileGen=*/true,

                        /*IsCS=*/true, PGOOpt->AtomicCounterUpdate,

                        PGOOpt->CSProfileGenFile, PGOOpt->ProfileRemappingFile,

                        PGOOpt->FS);

    else if (PGOOpt->CSAction == PGOOptions::CSIRUse)

      addPGOInstrPasses(MPM, Level, /*RunProfileGen=*/false,

                        /*IsCS=*/true, PGOOpt->AtomicCounterUpdate,

                        PGOOpt->ProfileFile, PGOOpt->ProfileRemappingFile,

                        PGOOpt->FS);

  }


  // Re-compute GlobalsAA here prior to function passes. This is particularly

  // useful as the above will have inlined, DCE'ed, and function-attr

  // propagated everything. We should at this point have a reasonably minimal

  // and richly annotated call graph. By computing aliasing and mod/ref

  // information for all local globals here, the late loop passes and notably

  // the vectorizer will be able to use them to help recognize vectorizable

  // memory operations.

  if (EnableGlobalAnalyses)

    MPM.addPass(RecomputeGlobalsAAPass());


  invokeOptimizerEarlyEPCallbacks(MPM, Level, LTOPhase);


  FunctionPassManager OptimizePM;


  // Only drop unnecessary assumes post-inline and post-link, as otherwise

  // additional uses of the affected value may be introduced through inlining

  // and CSE.

  if (!isLTOPreLink(LTOPhase))

    OptimizePM.addPass(DropUnnecessaryAssumesPass());


  // Scheduling LoopVersioningLICM when inlining is over, because after that

  // we may see more accurate aliasing. Reason to run this late is that too

  // early versioning may prevent further inlining due to increase of code

  // size. Other optimizations which runs later might get benefit of no-alias

  // assumption in clone loop.

  if (UseLoopVersioningLICM) {

    OptimizePM.addPass(

        createFunctionToLoopPassAdaptor(LoopVersioningLICMPass()));

    // LoopVersioningLICM pass might increase new LICM opportunities.

    OptimizePM.addPass(createFunctionToLoopPassAdaptor(

        LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

                 /*AllowSpeculation=*/true),

        /*USeMemorySSA=*/true, /*UseBlockFrequencyInfo=*/false));

  }


  OptimizePM.addPass(Float2IntPass());

  OptimizePM.addPass(LowerConstantIntrinsicsPass());


  if (EnableMatrix) {

    OptimizePM.addPass(LowerMatrixIntrinsicsPass());

    OptimizePM.addPass(EarlyCSEPass());

  }


  // CHR pass should only be applied with the profile information.

  // The check is to check the profile summary information in CHR.

  if (EnableCHR && Level == OptimizationLevel::O3)

    OptimizePM.addPass(ControlHeightReductionPass());


  // FIXME: We need to run some loop optimizations to re-rotate loops after

  // simplifycfg and others undo their rotation.


  // Optimize the loop execution. These passes operate on entire loop nests

  // rather than on each loop in an inside-out manner, and so they are actually

  // function passes.


  invokeVectorizerStartEPCallbacks(OptimizePM, Level);


  LoopPassManager LPM;

  // First rotate loops that may have been un-rotated by prior passes.

  // Disable header duplication at -Oz.

  LPM.addPass(LoopRotatePass(EnableLoopHeaderDuplication ||

                                 Level != OptimizationLevel::Oz,

                             LTOPreLink));

  // Some loops may have become dead by now. Try to delete them.

  // FIXME: see discussion in https://reviews.llvm.org/D112851,

  //        this may need to be revisited once we run GVN before loop deletion

  //        in the simplification pipeline.

  LPM.addPass(LoopDeletionPass());


  if (PTO.LoopInterchange)

    LPM.addPass(LoopInterchangePass());


  OptimizePM.addPass(createFunctionToLoopPassAdaptor(

      std::move(LPM), /*UseMemorySSA=*/false, /*UseBlockFrequencyInfo=*/false));


  // FIXME: This may not be the right place in the pipeline.

  // We need to have the data to support the right place.

  if (PTO.LoopFusion)

    OptimizePM.addPass(LoopFusePass());


  // Distribute loops to allow partial vectorization.  I.e. isolate dependences

  // into separate loop that would otherwise inhibit vectorization.  This is

  // currently only performed for loops marked with the metadata

  // llvm.loop.distribute=true or when -enable-loop-distribute is specified.

  OptimizePM.addPass(LoopDistributePass());


  // Populates the VFABI attribute with the scalar-to-vector mappings

  // from the TargetLibraryInfo.

  OptimizePM.addPass(InjectTLIMappings());


  addVectorPasses(Level, OptimizePM, /* IsFullLTO */ false);


  invokeVectorizerEndEPCallbacks(OptimizePM, Level);


  // LoopSink pass sinks instructions hoisted by LICM, which serves as a

  // canonicalization pass that enables other optimizations. As a result,

  // LoopSink pass needs to be a very late IR pass to avoid undoing LICM

  // result too early.

  OptimizePM.addPass(LoopSinkPass());


  // And finally clean up LCSSA form before generating code.

  OptimizePM.addPass(InstSimplifyPass());


  // This hoists/decomposes div/rem ops. It should run after other sink/hoist

  // passes to avoid re-sinking, but before SimplifyCFG because it can allow

  // flattening of blocks.

  OptimizePM.addPass(DivRemPairsPass());


  // Try to annotate calls that were created during optimization.

  OptimizePM.addPass(

      TailCallElimPass(/*UpdateFunctionEntryCount=*/isInstrumentedPGOUse()));


  // LoopSink (and other loop passes since the last simplifyCFG) might have

  // resulted in single-entry-single-exit or empty blocks. Clean up the CFG.

  OptimizePM.addPass(

      SimplifyCFGPass(SimplifyCFGOptions()

                          .convertSwitchRangeToICmp(true)

                          .speculateUnpredictables(true)

                          .hoistLoadsStoresWithCondFaulting(true)));


  // Add the core optimizing pipeline.

  MPM.addPass(createModuleToFunctionPassAdaptor(std::move(OptimizePM),

                                                PTO.EagerlyInvalidateAnalyses));


  invokeOptimizerLastEPCallbacks(MPM, Level, LTOPhase);


  // Split out cold code. Splitting is done late to avoid hiding context from

  // other optimizations and inadvertently regressing performance. The tradeoff

  // is that this has a higher code size cost than splitting early.

  if (EnableHotColdSplit && !LTOPreLink)

    MPM.addPass(HotColdSplittingPass());


  // Search the code for similar regions of code. If enough similar regions can

  // be found where extracting the regions into their own function will decrease

  // the size of the program, we extract the regions, a deduplicate the

  // structurally similar regions.

  if (EnableIROutliner)

    MPM.addPass(IROutlinerPass());


  // Now we need to do some global optimization transforms.

  // FIXME: It would seem like these should come first in the optimization

  // pipeline and maybe be the bottom of the canonicalization pipeline? Weird

  // ordering here.

  MPM.addPass(GlobalDCEPass());

  MPM.addPass(ConstantMergePass());


  // Merge functions if requested. It has a better chance to merge functions

  // after ConstantMerge folded jump tables.

  if (PTO.MergeFunctions)

    MPM.addPass(MergeFunctionsPass());


  if (PTO.CallGraphProfile && !LTOPreLink)

    MPM.addPass(CGProfilePass(isLTOPostLink(LTOPhase)));


  // RelLookupTableConverterPass runs later in LTO post-link pipeline.

  if (!LTOPreLink)

    MPM.addPass(RelLookupTableConverterPass());


  return MPM;

}


ModulePassManager


PassBuilder::buildPerModuleDefaultPipeline(OptimizationLevel Level,

                                           ThinOrFullLTOPhase Phase) {

  if (Level == OptimizationLevel::O0)

    return buildO0DefaultPipeline(Level, Phase);


  ModulePassManager MPM;


  // Convert @llvm.global.annotations to !annotation metadata.

  MPM.addPass(Annotation2MetadataPass());


  // Force any function attributes we want the rest of the pipeline to observe.

  MPM.addPass(ForceFunctionAttrsPass());


  if (PGOOpt && PGOOpt->DebugInfoForProfiling)

    MPM.addPass(createModuleToFunctionPassAdaptor(AddDiscriminatorsPass()));


  // Apply module pipeline start EP callback.

  invokePipelineStartEPCallbacks(MPM, Level);


  // Add the core simplification pipeline.

  MPM.addPass(buildModuleSimplificationPipeline(Level, Phase));


  // Now add the optimization pipeline.

  MPM.addPass(buildModuleOptimizationPipeline(Level, Phase));


  if (PGOOpt && PGOOpt->PseudoProbeForProfiling &&

      PGOOpt->Action == PGOOptions::SampleUse)

    MPM.addPass(PseudoProbeUpdatePass());


  // Emit annotation remarks.

  addAnnotationRemarksPass(MPM);


  if (isLTOPreLink(Phase))

    addRequiredLTOPreLinkPasses(MPM);

  return MPM;

}


ModulePassManager


PassBuilder::buildFatLTODefaultPipeline(OptimizationLevel Level, bool ThinLTO,

                                        bool EmitSummary) {

  ModulePassManager MPM;

  if (ThinLTO)

    MPM.addPass(buildThinLTOPreLinkDefaultPipeline(Level));

  else

    MPM.addPass(buildLTOPreLinkDefaultPipeline(Level));

  MPM.addPass(EmbedBitcodePass(ThinLTO, EmitSummary));


  // Perform any cleanups to the IR that aren't suitable for per TU compilation,

  // like removing CFI/WPD related instructions. Note, we reuse

  // LowerTypeTestsPass to clean up type tests rather than duplicate that logic

  // in FatLtoCleanup.

  MPM.addPass(FatLtoCleanup());


  // If we're doing FatLTO w/ CFI enabled, we don't want the type tests in the

  // object code, only in the bitcode section, so drop it before we run

  // module optimization and generate machine code. If llvm.type.test() isn't in

  // the IR, this won't do anything.

  MPM.addPass(

      LowerTypeTestsPass(nullptr, nullptr, lowertypetests::DropTestKind::All));


  // Use the ThinLTO post-link pipeline with sample profiling

  if (ThinLTO && PGOOpt && PGOOpt->Action == PGOOptions::SampleUse)

    MPM.addPass(buildThinLTODefaultPipeline(Level, /*ImportSummary=*/nullptr));

  else {

    // ModuleSimplification does not run the coroutine passes for

    // ThinLTOPreLink, so we need the coroutine passes to run for ThinLTO

    // builds, otherwise they will miscompile.

    if (ThinLTO) {

      // TODO: replace w/ buildCoroWrapper() when it takes phase and level into

      // consideration.

      CGSCCPassManager CGPM;

      CGPM.addPass(CoroSplitPass(Level != OptimizationLevel::O0));

      CGPM.addPass(CoroAnnotationElidePass());

      MPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(std::move(CGPM)));

      MPM.addPass(CoroCleanupPass());

    }


    // otherwise, just use module optimization

    MPM.addPass(

        buildModuleOptimizationPipeline(Level, ThinOrFullLTOPhase::None));

    // Emit annotation remarks.

    addAnnotationRemarksPass(MPM);

  }

  return MPM;

}


ModulePassManager


PassBuilder::buildThinLTOPreLinkDefaultPipeline(OptimizationLevel Level) {

  if (Level == OptimizationLevel::O0)

    return buildO0DefaultPipeline(Level, ThinOrFullLTOPhase::ThinLTOPreLink);


  ModulePassManager MPM;


  // Convert @llvm.global.annotations to !annotation metadata.

  MPM.addPass(Annotation2MetadataPass());


  // Force any function attributes we want the rest of the pipeline to observe.

  MPM.addPass(ForceFunctionAttrsPass());


  if (PGOOpt && PGOOpt->DebugInfoForProfiling)

    MPM.addPass(createModuleToFunctionPassAdaptor(AddDiscriminatorsPass()));


  // Apply module pipeline start EP callback.

  invokePipelineStartEPCallbacks(MPM, Level);


  // If we are planning to perform ThinLTO later, we don't bloat the code with

  // unrolling/vectorization/... now. Just simplify the module as much as we

  // can.

  MPM.addPass(buildModuleSimplificationPipeline(

      Level, ThinOrFullLTOPhase::ThinLTOPreLink));

  // In pre-link, for ctx prof use, we stop here with an instrumented IR. We let

  // thinlto use the contextual info to perform imports; then use the contextual

  // profile in the post-thinlink phase.

  if (!UseCtxProfile.empty()) {

    addRequiredLTOPreLinkPasses(MPM);

    return MPM;

  }


  // Run partial inlining pass to partially inline functions that have

  // large bodies.

  // FIXME: It isn't clear whether this is really the right place to run this

  // in ThinLTO. Because there is another canonicalization and simplification

  // phase that will run after the thin link, running this here ends up with

  // less information than will be available later and it may grow functions in

  // ways that aren't beneficial.

  if (RunPartialInlining)

    MPM.addPass(PartialInlinerPass());


  if (PGOOpt && PGOOpt->PseudoProbeForProfiling &&

      PGOOpt->Action == PGOOptions::SampleUse)

    MPM.addPass(PseudoProbeUpdatePass());


  // Handle Optimizer{Early,Last}EPCallbacks added by clang on PreLink. Actual

  // optimization is going to be done in PostLink stage, but clang can't add

  // callbacks there in case of in-process ThinLTO called by linker.

  invokeOptimizerEarlyEPCallbacks(MPM, Level,

                                  /*Phase=*/ThinOrFullLTOPhase::ThinLTOPreLink);

  invokeOptimizerLastEPCallbacks(MPM, Level,

                                 /*Phase=*/ThinOrFullLTOPhase::ThinLTOPreLink);


  // Emit annotation remarks.

  addAnnotationRemarksPass(MPM);


  addRequiredLTOPreLinkPasses(MPM);


  return MPM;

}


ModulePassManager PassBuilder::buildThinLTODefaultPipeline(

    OptimizationLevel Level, const ModuleSummaryIndex *ImportSummary) {

  ModulePassManager MPM;


  if (ImportSummary) {

    // For ThinLTO we must apply the context disambiguation decisions early, to

    // ensure we can correctly match the callsites to summary data.

    if (EnableMemProfContextDisambiguation)

      MPM.addPass(MemProfContextDisambiguation(

          ImportSummary, PGOOpt && PGOOpt->Action == PGOOptions::SampleUse));


    // These passes import type identifier resolutions for whole-program

    // devirtualization and CFI. They must run early because other passes may

    // disturb the specific instruction patterns that these passes look for,

    // creating dependencies on resolutions that may not appear in the summary.

    //

    // For example, GVN may transform the pattern assume(type.test) appearing in

    // two basic blocks into assume(phi(type.test, type.test)), which would

    // transform a dependency on a WPD resolution into a dependency on a type

    // identifier resolution for CFI.

    //

    // Also, WPD has access to more precise information than ICP and can

    // devirtualize more effectively, so it should operate on the IR first.

    //

    // The WPD and LowerTypeTest passes need to run at -O0 to lower type

    // metadata and intrinsics.

    MPM.addPass(WholeProgramDevirtPass(nullptr, ImportSummary));

    MPM.addPass(LowerTypeTestsPass(nullptr, ImportSummary));

  }


  if (Level == OptimizationLevel::O0) {

    // Run a second time to clean up any type tests left behind by WPD for use

    // in ICP.

    MPM.addPass(LowerTypeTestsPass(nullptr, nullptr,

                                   lowertypetests::DropTestKind::Assume));

    // Drop available_externally and unreferenced globals. This is necessary

    // with ThinLTO in order to avoid leaving undefined references to dead

    // globals in the object file.

    MPM.addPass(EliminateAvailableExternallyPass());

    MPM.addPass(GlobalDCEPass());

    return MPM;

  }

  if (!UseCtxProfile.empty()) {

    MPM.addPass(

        buildModuleInlinerPipeline(Level, ThinOrFullLTOPhase::ThinLTOPostLink));

  } else {

    // Add the core simplification pipeline.

    MPM.addPass(buildModuleSimplificationPipeline(

        Level, ThinOrFullLTOPhase::ThinLTOPostLink));

  }

  // Now add the optimization pipeline.

  MPM.addPass(buildModuleOptimizationPipeline(

      Level, ThinOrFullLTOPhase::ThinLTOPostLink));


  // Emit annotation remarks.

  addAnnotationRemarksPass(MPM);


  return MPM;

}


ModulePassManager


PassBuilder::buildLTOPreLinkDefaultPipeline(OptimizationLevel Level) {

  // FIXME: We should use a customized pre-link pipeline!

  return buildPerModuleDefaultPipeline(Level,

                                       ThinOrFullLTOPhase::FullLTOPreLink);

}


ModulePassManager


PassBuilder::buildLTODefaultPipeline(OptimizationLevel Level,

                                     ModuleSummaryIndex *ExportSummary) {

  ModulePassManager MPM;


  invokeFullLinkTimeOptimizationEarlyEPCallbacks(MPM, Level);


  // Create a function that performs CFI checks for cross-DSO calls with targets

  // in the current module.

  MPM.addPass(CrossDSOCFIPass());


  if (Level == OptimizationLevel::O0) {

    // The WPD and LowerTypeTest passes need to run at -O0 to lower type

    // metadata and intrinsics.

    MPM.addPass(WholeProgramDevirtPass(ExportSummary, nullptr));

    MPM.addPass(LowerTypeTestsPass(ExportSummary, nullptr));

    // Run a second time to clean up any type tests left behind by WPD for use

    // in ICP.

    MPM.addPass(LowerTypeTestsPass(nullptr, nullptr,

                                   lowertypetests::DropTestKind::Assume));


    MPM.addPass(buildCoroWrapper(ThinOrFullLTOPhase::FullLTOPostLink));


    invokeFullLinkTimeOptimizationLastEPCallbacks(MPM, Level);


    // Emit annotation remarks.

    addAnnotationRemarksPass(MPM);


    return MPM;

  }


  if (PGOOpt && PGOOpt->Action == PGOOptions::SampleUse) {

    // Load sample profile before running the LTO optimization pipeline.

    MPM.addPass(SampleProfileLoaderPass(PGOOpt->ProfileFile,

                                        PGOOpt->ProfileRemappingFile,

                                        ThinOrFullLTOPhase::FullLTOPostLink));

    // Cache ProfileSummaryAnalysis once to avoid the potential need to insert

    // RequireAnalysisPass for PSI before subsequent non-module passes.

    MPM.addPass(RequireAnalysisPass<ProfileSummaryAnalysis, Module>());

  }


  // Try to run OpenMP optimizations, quick no-op if no OpenMP metadata present.

  MPM.addPass(OpenMPOptPass(ThinOrFullLTOPhase::FullLTOPostLink));


  // Remove unused virtual tables to improve the quality of code generated by

  // whole-program devirtualization and bitset lowering.

  MPM.addPass(GlobalDCEPass(/*InLTOPostLink=*/true));


  // Do basic inference of function attributes from known properties of system

  // libraries and other oracles.

  MPM.addPass(InferFunctionAttrsPass());


  if (Level.getSpeedupLevel() > 1) {

    MPM.addPass(createModuleToFunctionPassAdaptor(

        CallSiteSplittingPass(), PTO.EagerlyInvalidateAnalyses));


    // Indirect call promotion. This should promote all the targets that are

    // left by the earlier promotion pass that promotes intra-module targets.

    // This two-step promotion is to save the compile time. For LTO, it should

    // produce the same result as if we only do promotion here.

    MPM.addPass(PGOIndirectCallPromotion(

        true /* InLTO */, PGOOpt && PGOOpt->Action == PGOOptions::SampleUse));


    // Promoting by-reference arguments to by-value exposes more constants to

    // IPSCCP.

    CGSCCPassManager CGPM;

    CGPM.addPass(PostOrderFunctionAttrsPass());

    CGPM.addPass(ArgumentPromotionPass());

    CGPM.addPass(

        createCGSCCToFunctionPassAdaptor(SROAPass(SROAOptions::ModifyCFG)));

    MPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(std::move(CGPM)));


    // Propagate constants at call sites into the functions they call.  This

    // opens opportunities for globalopt (and inlining) by substituting function

    // pointers passed as arguments to direct uses of functions.

    MPM.addPass(IPSCCPPass(IPSCCPOptions(/*AllowFuncSpec=*/

                                         Level != OptimizationLevel::Os &&

                                         Level != OptimizationLevel::Oz)));


    // Attach metadata to indirect call sites indicating the set of functions

    // they may target at run-time. This should follow IPSCCP.

    MPM.addPass(CalledValuePropagationPass());

  }


  // Do RPO function attribute inference across the module to forward-propagate

  // attributes where applicable.

  // FIXME: Is this really an optimization rather than a canonicalization?

  MPM.addPass(ReversePostOrderFunctionAttrsPass());


  // Use in-range annotations on GEP indices to split globals where beneficial.

  MPM.addPass(GlobalSplitPass());


  // Run whole program optimization of virtual call when the list of callees

  // is fixed.

  MPM.addPass(WholeProgramDevirtPass(ExportSummary, nullptr));


  // Stop here at -O1.

  if (Level == OptimizationLevel::O1) {

    // The LowerTypeTestsPass needs to run to lower type metadata and the

    // type.test intrinsics. The pass does nothing if CFI is disabled.

    MPM.addPass(LowerTypeTestsPass(ExportSummary, nullptr));

    // Run a second time to clean up any type tests left behind by WPD for use

    // in ICP (which is performed earlier than this in the regular LTO

    // pipeline).

    MPM.addPass(LowerTypeTestsPass(nullptr, nullptr,

                                   lowertypetests::DropTestKind::Assume));


    MPM.addPass(buildCoroWrapper(ThinOrFullLTOPhase::FullLTOPostLink));


    invokeFullLinkTimeOptimizationLastEPCallbacks(MPM, Level);


    // Emit annotation remarks.

    addAnnotationRemarksPass(MPM);


    return MPM;

  }


  // TODO: Skip to match buildCoroWrapper.

  MPM.addPass(CoroEarlyPass());


  // Optimize globals to try and fold them into constants.

  MPM.addPass(GlobalOptPass());


  // Promote any localized globals to SSA registers.

  MPM.addPass(createModuleToFunctionPassAdaptor(PromotePass()));


  // Linking modules together can lead to duplicate global constant, only

  // keep one copy of each constant.

  MPM.addPass(ConstantMergePass());


  // Remove unused arguments from functions.

  MPM.addPass(DeadArgumentEliminationPass());


  // Reduce the code after globalopt and ipsccp.  Both can open up significant

  // simplification opportunities, and both can propagate functions through

  // function pointers.  When this happens, we often have to resolve varargs

  // calls, etc, so let instcombine do this.

  FunctionPassManager PeepholeFPM;

  PeepholeFPM.addPass(InstCombinePass());

  if (Level.getSpeedupLevel() > 1)

    PeepholeFPM.addPass(AggressiveInstCombinePass());

  invokePeepholeEPCallbacks(PeepholeFPM, Level);


  MPM.addPass(createModuleToFunctionPassAdaptor(std::move(PeepholeFPM),

                                                PTO.EagerlyInvalidateAnalyses));


  // Lower variadic functions for supported targets prior to inlining.

  MPM.addPass(ExpandVariadicsPass(ExpandVariadicsMode::Optimize));


  // Note: historically, the PruneEH pass was run first to deduce nounwind and

  // generally clean up exception handling overhead. It isn't clear this is

  // valuable as the inliner doesn't currently care whether it is inlining an

  // invoke or a call.

  // Run the inliner now.

  if (EnableModuleInliner) {

    MPM.addPass(ModuleInlinerPass(getInlineParamsFromOptLevel(Level),

                                  UseInlineAdvisor,

                                  ThinOrFullLTOPhase::FullLTOPostLink));

  } else {

    MPM.addPass(ModuleInlinerWrapperPass(

        getInlineParamsFromOptLevel(Level),

        /* MandatoryFirst */ true,

        InlineContext{ThinOrFullLTOPhase::FullLTOPostLink,

                      InlinePass::CGSCCInliner}));

  }


  // Perform context disambiguation after inlining, since that would reduce the

  // amount of additional cloning required to distinguish the allocation

  // contexts.

  if (EnableMemProfContextDisambiguation)

    MPM.addPass(MemProfContextDisambiguation(

        /*Summary=*/nullptr,

        PGOOpt && PGOOpt->Action == PGOOptions::SampleUse));


  // Optimize globals again after we ran the inliner.

  MPM.addPass(GlobalOptPass());


  // Run the OpenMPOpt pass again after global optimizations.

  MPM.addPass(OpenMPOptPass(ThinOrFullLTOPhase::FullLTOPostLink));


  // Garbage collect dead functions.

  MPM.addPass(GlobalDCEPass(/*InLTOPostLink=*/true));


  // If we didn't decide to inline a function, check to see if we can

  // transform it to pass arguments by value instead of by reference.

  CGSCCPassManager CGPM;

  CGPM.addPass(ArgumentPromotionPass());

  CGPM.addPass(CoroSplitPass(Level != OptimizationLevel::O0));

  CGPM.addPass(CoroAnnotationElidePass());

  MPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(std::move(CGPM)));


  FunctionPassManager FPM;

  // The IPO Passes may leave cruft around. Clean up after them.

  FPM.addPass(InstCombinePass());

  invokePeepholeEPCallbacks(FPM, Level);


  if (EnableConstraintElimination)

    FPM.addPass(ConstraintEliminationPass());


  FPM.addPass(JumpThreadingPass());


  // Do a post inline PGO instrumentation and use pass. This is a context

  // sensitive PGO pass.

  if (PGOOpt) {

    if (PGOOpt->CSAction == PGOOptions::CSIRInstr)

      addPGOInstrPasses(MPM, Level, /*RunProfileGen=*/true,

                        /*IsCS=*/true, PGOOpt->AtomicCounterUpdate,

                        PGOOpt->CSProfileGenFile, PGOOpt->ProfileRemappingFile,

                        PGOOpt->FS);

    else if (PGOOpt->CSAction == PGOOptions::CSIRUse)

      addPGOInstrPasses(MPM, Level, /*RunProfileGen=*/false,

                        /*IsCS=*/true, PGOOpt->AtomicCounterUpdate,

                        PGOOpt->ProfileFile, PGOOpt->ProfileRemappingFile,

                        PGOOpt->FS);

  }


  // Break up allocas

  FPM.addPass(SROAPass(SROAOptions::ModifyCFG));


  // LTO provides additional opportunities for tailcall elimination due to

  // link-time inlining, and visibility of nocapture attribute.

  FPM.addPass(

      TailCallElimPass(/*UpdateFunctionEntryCount=*/isInstrumentedPGOUse()));


  // Run a few AA driver optimizations here and now to cleanup the code.

  MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM),

                                                PTO.EagerlyInvalidateAnalyses));


  MPM.addPass(

      createModuleToPostOrderCGSCCPassAdaptor(PostOrderFunctionAttrsPass()));


  // Require the GlobalsAA analysis for the module so we can query it within

  // MainFPM.

  if (EnableGlobalAnalyses) {

    MPM.addPass(RequireAnalysisPass<GlobalsAA, Module>());

    // Invalidate AAManager so it can be recreated and pick up the newly

    // available GlobalsAA.

    MPM.addPass(

        createModuleToFunctionPassAdaptor(InvalidateAnalysisPass<AAManager>()));

  }


  FunctionPassManager MainFPM;

  MainFPM.addPass(createFunctionToLoopPassAdaptor(

      LICMPass(PTO.LicmMssaOptCap, PTO.LicmMssaNoAccForPromotionCap,

               /*AllowSpeculation=*/true),

      /*USeMemorySSA=*/true, /*UseBlockFrequencyInfo=*/false));


  if (RunNewGVN)

    MainFPM.addPass(NewGVNPass());

  else

    MainFPM.addPass(GVNPass());


  // Remove dead memcpy()'s.

  MainFPM.addPass(MemCpyOptPass());


  // Nuke dead stores.

  MainFPM.addPass(DSEPass());

  MainFPM.addPass(MoveAutoInitPass());

  MainFPM.addPass(MergedLoadStoreMotionPass());


  invokeVectorizerStartEPCallbacks(MainFPM, Level);


  LoopPassManager LPM;

  if (EnableLoopFlatten && Level.getSpeedupLevel() > 1)

    LPM.addPass(LoopFlattenPass());

  LPM.addPass(IndVarSimplifyPass());

  LPM.addPass(LoopDeletionPass());

  // FIXME: Add loop interchange.


  // Unroll small loops and perform peeling.

  LPM.addPass(LoopFullUnrollPass(Level.getSpeedupLevel(),

                                 /* OnlyWhenForced= */ !PTO.LoopUnrolling,

                                 PTO.ForgetAllSCEVInLoopUnroll));

  // The loop passes in LPM (LoopFullUnrollPass) do not preserve MemorySSA.

  // *All* loop passes must preserve it, in order to be able to use it.

  MainFPM.addPass(createFunctionToLoopPassAdaptor(

      std::move(LPM), /*UseMemorySSA=*/false, /*UseBlockFrequencyInfo=*/true));


  MainFPM.addPass(LoopDistributePass());


  addVectorPasses(Level, MainFPM, /* IsFullLTO */ true);


  invokeVectorizerEndEPCallbacks(MainFPM, Level);


  // Run the OpenMPOpt CGSCC pass again late.

  MPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(

      OpenMPOptCGSCCPass(ThinOrFullLTOPhase::FullLTOPostLink)));


  invokePeepholeEPCallbacks(MainFPM, Level);

  MainFPM.addPass(JumpThreadingPass());

  MPM.addPass(createModuleToFunctionPassAdaptor(std::move(MainFPM),

                                                PTO.EagerlyInvalidateAnalyses));


  // Lower type metadata and the type.test intrinsic. This pass supports

  // clang's control flow integrity mechanisms (-fsanitize=cfi*) and needs

  // to be run at link time if CFI is enabled. This pass does nothing if

  // CFI is disabled.

  MPM.addPass(LowerTypeTestsPass(ExportSummary, nullptr));

  // Run a second time to clean up any type tests left behind by WPD for use

  // in ICP (which is performed earlier than this in the regular LTO pipeline).

  MPM.addPass(LowerTypeTestsPass(nullptr, nullptr,

                                 lowertypetests::DropTestKind::Assume));


  // Enable splitting late in the FullLTO post-link pipeline.

  if (EnableHotColdSplit)

    MPM.addPass(HotColdSplittingPass());


  // Add late LTO optimization passes.

  FunctionPassManager LateFPM;


  // LoopSink pass sinks instructions hoisted by LICM, which serves as a

  // canonicalization pass that enables other optimizations. As a result,

  // LoopSink pass needs to be a very late IR pass to avoid undoing LICM

  // result too early.

  LateFPM.addPass(LoopSinkPass());


  // This hoists/decomposes div/rem ops. It should run after other sink/hoist

  // passes to avoid re-sinking, but before SimplifyCFG because it can allow

  // flattening of blocks.

  LateFPM.addPass(DivRemPairsPass());


  // Delete basic blocks, which optimization passes may have killed.

  LateFPM.addPass(SimplifyCFGPass(SimplifyCFGOptions()

                                      .convertSwitchRangeToICmp(true)

                                      .hoistCommonInsts(true)

                                      .speculateUnpredictables(true)));

  MPM.addPass(createModuleToFunctionPassAdaptor(std::move(LateFPM)));


  // Drop bodies of available eternally objects to improve GlobalDCE.

  MPM.addPass(EliminateAvailableExternallyPass());


  // Now that we have optimized the program, discard unreachable functions.

  MPM.addPass(GlobalDCEPass(/*InLTOPostLink=*/true));


  if (PTO.MergeFunctions)

    MPM.addPass(MergeFunctionsPass());


  MPM.addPass(RelLookupTableConverterPass());


  if (PTO.CallGraphProfile)

    MPM.addPass(CGProfilePass(/*InLTOPostLink=*/true));


  MPM.addPass(CoroCleanupPass());


  invokeFullLinkTimeOptimizationLastEPCallbacks(MPM, Level);


  // Emit annotation remarks.

  addAnnotationRemarksPass(MPM);


  return MPM;

}


ModulePassManager


PassBuilder::buildO0DefaultPipeline(OptimizationLevel Level,

                                    ThinOrFullLTOPhase Phase) {

  assert(Level == OptimizationLevel::O0 &&

         "buildO0DefaultPipeline should only be used with O0");


  ModulePassManager MPM;


  // Perform pseudo probe instrumentation in O0 mode. This is for the

  // consistency between different build modes. For example, a LTO build can be

  // mixed with an O0 prelink and an O2 postlink. Loading a sample profile in

  // the postlink will require pseudo probe instrumentation in the prelink.

  if (PGOOpt && PGOOpt->PseudoProbeForProfiling)

    MPM.addPass(SampleProfileProbePass(TM));


  if (PGOOpt && (PGOOpt->Action == PGOOptions::IRInstr ||

                 PGOOpt->Action == PGOOptions::IRUse))

    addPGOInstrPassesForO0(

        MPM,

        /*RunProfileGen=*/(PGOOpt->Action == PGOOptions::IRInstr),

        /*IsCS=*/false, PGOOpt->AtomicCounterUpdate, PGOOpt->ProfileFile,

        PGOOpt->ProfileRemappingFile, PGOOpt->FS);


  // Instrument function entry and exit before all inlining.

  MPM.addPass(createModuleToFunctionPassAdaptor(

      EntryExitInstrumenterPass(/*PostInlining=*/false)));


  invokePipelineStartEPCallbacks(MPM, Level);


  if (PGOOpt && PGOOpt->DebugInfoForProfiling)

    MPM.addPass(createModuleToFunctionPassAdaptor(AddDiscriminatorsPass()));


  if (PGOOpt && PGOOpt->Action == PGOOptions::SampleUse) {

    // Explicitly disable sample loader inlining and use flattened profile in O0

    // pipeline.

    MPM.addPass(SampleProfileLoaderPass(PGOOpt->ProfileFile,

                                        PGOOpt->ProfileRemappingFile,

                                        ThinOrFullLTOPhase::None, nullptr,

                                        /*DisableSampleProfileInlining=*/true,

                                        /*UseFlattenedProfile=*/true));

    // Cache ProfileSummaryAnalysis once to avoid the potential need to insert

    // RequireAnalysisPass for PSI before subsequent non-module passes.

    MPM.addPass(RequireAnalysisPass<ProfileSummaryAnalysis, Module>());

  }


  invokePipelineEarlySimplificationEPCallbacks(MPM, Level, Phase);


  // Build a minimal pipeline based on the semantics required by LLVM,

  // which is just that always inlining occurs. Further, disable generating

  // lifetime intrinsics to avoid enabling further optimizations during

  // code generation.

  MPM.addPass(AlwaysInlinerPass(

      /*InsertLifetimeIntrinsics=*/false));


  if (PTO.MergeFunctions)

    MPM.addPass(MergeFunctionsPass());


  if (EnableMatrix)

    MPM.addPass(

        createModuleToFunctionPassAdaptor(LowerMatrixIntrinsicsPass(true)));


  if (!CGSCCOptimizerLateEPCallbacks.empty()) {

    CGSCCPassManager CGPM;

    invokeCGSCCOptimizerLateEPCallbacks(CGPM, Level);

    if (!CGPM.isEmpty())

      MPM.addPass(createModuleToPostOrderCGSCCPassAdaptor(std::move(CGPM)));

  }

  if (!LateLoopOptimizationsEPCallbacks.empty()) {

    LoopPassManager LPM;

    invokeLateLoopOptimizationsEPCallbacks(LPM, Level);

    if (!LPM.isEmpty()) {

      MPM.addPass(createModuleToFunctionPassAdaptor(

          createFunctionToLoopPassAdaptor(std::move(LPM))));

    }

  }

  if (!LoopOptimizerEndEPCallbacks.empty()) {

    LoopPassManager LPM;

    invokeLoopOptimizerEndEPCallbacks(LPM, Level);

    if (!LPM.isEmpty()) {

      MPM.addPass(createModuleToFunctionPassAdaptor(

          createFunctionToLoopPassAdaptor(std::move(LPM))));

    }

  }

  if (!ScalarOptimizerLateEPCallbacks.empty()) {

    FunctionPassManager FPM;

    invokeScalarOptimizerLateEPCallbacks(FPM, Level);

    if (!FPM.isEmpty())

      MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));

  }


  invokeOptimizerEarlyEPCallbacks(MPM, Level, Phase);


  if (!VectorizerStartEPCallbacks.empty()) {

    FunctionPassManager FPM;

    invokeVectorizerStartEPCallbacks(FPM, Level);

    if (!FPM.isEmpty())

      MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));

  }


  if (!VectorizerEndEPCallbacks.empty()) {

    FunctionPassManager FPM;

    invokeVectorizerEndEPCallbacks(FPM, Level);

    if (!FPM.isEmpty())

      MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));

  }


  MPM.addPass(buildCoroWrapper(Phase));


  invokeOptimizerLastEPCallbacks(MPM, Level, Phase);


  if (isLTOPreLink(Phase))

    addRequiredLTOPreLinkPasses(MPM);


  MPM.addPass(createModuleToFunctionPassAdaptor(AnnotationRemarksPass()));


  return MPM;

}


AAManager PassBuilder::buildDefaultAAPipeline() {

  AAManager AA;


  // The order in which these are registered determines their priority when

  // being queried.


  // Add any target-specific alias analyses that should be run early.

  if (TM)

    TM->registerEarlyDefaultAliasAnalyses(AA);


  // First we register the basic alias analysis that provides the majority of

  // per-function local AA logic. This is a stateless, on-demand local set of

  // AA techniques.

  AA.registerFunctionAnalysis<BasicAA>();


  // Next we query fast, specialized alias analyses that wrap IR-embedded

  // information about aliasing.

  AA.registerFunctionAnalysis<ScopedNoAliasAA>();

  AA.registerFunctionAnalysis<TypeBasedAA>();


  // Add support for querying global aliasing information when available.

  // Because the `AAManager` is a function analysis and `GlobalsAA` is a module

  // analysis, all that the `AAManager` can do is query for any *cached*

  // results from `GlobalsAA` through a readonly proxy.

  if (EnableGlobalAnalyses)

    AA.registerModuleAnalysis<GlobalsAA>();


  // Add target-specific alias analyses.

  if (TM)

    TM->registerDefaultAliasAnalyses(AA);


  return AA;

}


bool PassBuilder::isInstrumentedPGOUse() const {

  return (PGOOpt && PGOOpt->Action == PGOOptions::IRUse) ||

         !UseCtxProfile.empty();

}

Phase
aarch64 falkor hwpf fix Falkor HW Prefetch Fix Late Phase
Definition AArch64FalkorHWPFFix.cpp:222

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

ADCE.h

AddDiscriminators.h

AggressiveInstCombine.h
AggressiveInstCombiner - Combine expression patterns to form expressions with fewer,...

AliasAnalysis.h

AlignmentFromAssumptions.h

AlwaysInliner.h
Provides passes to inlining "always_inline" functions.

Annotation2Metadata.h

AnnotationRemarks.h

ArgumentPromotion.h

AssumeBundleBuilder.h

Attributor.h

BDCE.h

BasicAliasAnalysis.h
This is the interface for LLVM's primary stateless and local alias analysis.

CGProfile.h
This file provides the interface for LLVM's Call Graph Profile pass.

CGSCCPassManager.h
This header provides classes for managing passes over SCCs of the call graph.

CallSiteSplitting.h

CalledValuePropagation.h

CanonicalizeAliases.h

CommandLine.h

clEnumValN
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
Definition CommandLine.h:687

ConstantMerge.h

ConstraintElimination.h

ControlHeightReduction.h

CoroAnnotationElide.h

CoroCleanup.h

CoroConditionalWrapper.h

CoroEarly.h

CoroElide.h

CoroSplit.h

CorrelatedValuePropagation.h

CountVisits.h

CrossDSOCFI.h

UseCtxProfile
cl::opt< std::string > UseCtxProfile("use-ctx-profile", cl::init(""), cl::Hidden, cl::desc("Use the specified contextual profile file"))

CtxProfAnalysis.h

DFAJumpThreading.h

DeadArgumentElimination.h

DeadStoreElimination.h

DivRemPairs.h

DropUnnecessaryAssumes.h

EarlyCSE.h
This file provides the interface for a simple, fast CSE pass.

ElimAvailExtern.h

EmbedBitcodePass.h
This file provides a pass which clones the current module and runs the provided pass pipeline on the ...

EntryExitInstrumenter.h

ExpandVariadics.h

ExtraPassManager.h
This file provides a pass manager that only runs its passes if the provided marker analysis has been ...

FatLTOCleanup.h

Float2Int.h

ForceFunctionAttrs.h
Super simple passes to force specific function attrs from the commandline into the IR for debugging p...

FunctionAttrs.h
Provides passes for computing function attributes based on interprocedural analyses.

GVN.h
This file provides the interface for LLVM's Global Value Numbering pass which eliminates fully redund...

GlobalDCE.h

GlobalOpt.h

GlobalSplit.h

GlobalsModRef.h
This is the interface for a simple mod/ref and alias analysis over globals.

HipStdPar.h
AcceleratorCodeSelection - Identify all functions reachable from a kernel, removing those that are un...

HotColdSplitting.h

SCCP.h

IROutliner.h

PassManager.h
This header defines various interfaces for pass management in LLVM.

IndVarSimplify.h

InferAlignment.h

InferFunctionAttrs.h
Interfaces for passes which infer implicit function attributes from the name and signature of functio...

InjectTLIMappings.h

InlineAdvisor.h

Inliner.h

InstCombine.h
This file provides the primary interface to the instcombine pass.

InstSimplifyPass.h
Defines passes for running instruction simplification across chunks of IR.

InstrProfiling.h
This file provides the interface for LLVM's PGO Instrumentation lowering pass.

JumpTableToSwitch.h

JumpThreading.h
See the comments on JumpThreadingPass.

LICM.h

Options
static LVOptions Options
Definition LVOptions.cpp:25

LibCallsShrinkWrap.h

LoopDeletion.h

LoopDistribute.h

LoopFlatten.h

LoopFuse.h
This file implements the Loop Fusion pass.

LoopIdiomRecognize.h

LoopInstSimplify.h

LoopInterchange.h

LoopLoadElimination.h
This header defines the LoopLoadEliminationPass object.

LoopPassManager.h
This header provides classes for managing a pipeline of passes over loops in LLVM IR.

LoopRotation.h

LoopSimplifyCFG.h

LoopSink.h

LoopUnrollAndJamPass.h

LoopUnrollPass.h

LoopVectorize.h

LoopVersioningLICM.h

LowerConstantIntrinsics.h
The header file for the LowerConstantIntrinsics pass as used by the new pass manager.

LowerExpectIntrinsic.h
The header file for the LowerExpectIntrinsic pass as used by the new pass manager.

LowerMatrixIntrinsics.h

LowerTypeTests.h

Mem2Reg.h

MemCpyOptimizer.h

MemProfContextDisambiguation.h

MemProfInstrumentation.h

MemProfUse.h

MergeFunctions.h

MergedLoadStoreMotion.h
This pass performs merges of loads and stores on both sides of a.

ModuleInliner.h

MoveAutoInit.h

NameAnonGlobals.h

NewGVN.h
This file provides the interface for LLVM's Global Value Numbering pass.

OpenMPOpt.h

OptimizationLevel.h
This header enumerates the LLVM-provided high-level optimization levels.

PGOCtxProfFlattening.h

PGOCtxProfLowering.h

PGOForceFunctionAttrs.h

PGOInstrumentation.h
This file provides the interface for IR based instrumentation passes ( (profile-gen,...

PGOOptions.h
Define option tunables for PGO.

PartialInlining.h

EnableMergeFunctions
static cl::opt< bool > EnableMergeFunctions("enable-merge-functions", cl::init(false), cl::Hidden, cl::desc("Enable function merging as part of the optimization pipeline"))

EnableGlobalAnalyses
static cl::opt< bool > EnableGlobalAnalyses("enable-global-analyses", cl::init(true), cl::Hidden, cl::desc("Enable inter-procedural analyses"))

EnableIROutliner
static cl::opt< bool > EnableIROutliner("ir-outliner", cl::init(false), cl::Hidden, cl::desc("Enable ir outliner pass"))

RunNewGVN
static cl::opt< bool > RunNewGVN("enable-newgvn", cl::init(false), cl::Hidden, cl::desc("Run the NewGVN pass"))

DisablePreInliner
static cl::opt< bool > DisablePreInliner("disable-preinline", cl::init(false), cl::Hidden, cl::desc("Disable pre-instrumentation inliner"))

EnableEagerlyInvalidateAnalyses
static cl::opt< bool > EnableEagerlyInvalidateAnalyses("eagerly-invalidate-analyses", cl::init(true), cl::Hidden, cl::desc("Eagerly invalidate more analyses in default pipelines"))

ExtraVectorizerPasses
static cl::opt< bool > ExtraVectorizerPasses("extra-vectorizer-passes", cl::init(false), cl::Hidden, cl::desc("Run cleanup optimization passes after vectorization"))

addAnnotationRemarksPass
static void addAnnotationRemarksPass(ModulePassManager &MPM)
Definition PassBuilderPipelines.cpp:402

EnablePostPGOLoopRotation
static cl::opt< bool > EnablePostPGOLoopRotation("enable-post-pgo-loop-rotation", cl::init(true), cl::Hidden, cl::desc("Run the loop rotation transformation after PGO instrumentation"))

getInlineParamsFromOptLevel
static InlineParams getInlineParamsFromOptLevel(OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:915

EnableGVNSink
static cl::opt< bool > EnableGVNSink("enable-gvn-sink", cl::desc("Enable the GVN sinking pass (default = off)"))

PerformMandatoryInliningsFirst
static cl::opt< bool > PerformMandatoryInliningsFirst("mandatory-inlining-first", cl::init(false), cl::Hidden, cl::desc("Perform mandatory inlinings module-wide, before performing " "inlining"))

EnableLoopInterchange
static cl::opt< bool > EnableLoopInterchange("enable-loopinterchange", cl::init(false), cl::Hidden, cl::desc("Enable the LoopInterchange Pass"))

EnableGVNHoist
static cl::opt< bool > EnableGVNHoist("enable-gvn-hoist", cl::desc("Enable the GVN hoisting pass (default = off)"))

RunPartialInlining
static cl::opt< bool > RunPartialInlining("enable-partial-inlining", cl::init(false), cl::Hidden, cl::desc("Run Partial inlining pass"))

EnableDFAJumpThreading
static cl::opt< bool > EnableDFAJumpThreading("enable-dfa-jump-thread", cl::desc("Enable DFA jump threading"), cl::init(false), cl::Hidden)

EnableCHR
static cl::opt< bool > EnableCHR("enable-chr", cl::init(true), cl::Hidden, cl::desc("Enable control height reduction optimization (CHR)"))

buildCoroWrapper
static CoroConditionalWrapper buildCoroWrapper(ThinOrFullLTOPhase Phase)
Definition PassBuilderPipelines.cpp:419

EnableHotColdSplit
static cl::opt< bool > EnableHotColdSplit("hot-cold-split", cl::desc("Enable hot-cold splitting pass"))

EnableSampledInstr
static cl::opt< bool > EnableSampledInstr("enable-sampled-instrumentation", cl::init(false), cl::Hidden, cl::desc("Enable profile instrumentation sampling (default = off)"))

PreInlineThreshold
static cl::opt< int > PreInlineThreshold("preinline-threshold", cl::Hidden, cl::init(75), cl::desc("Control the amount of inlining in pre-instrumentation inliner " "(default = 75)"))

FlattenedProfileUsed
static cl::opt< bool > FlattenedProfileUsed("flattened-profile-used", cl::init(false), cl::Hidden, cl::desc("Indicate the sample profile being used is flattened, i.e., " "no inline hierarchy exists in the profile"))

EnableLoopHeaderDuplication
static cl::opt< bool > EnableLoopHeaderDuplication("enable-loop-header-duplication", cl::init(false), cl::Hidden, cl::desc("Enable loop header duplication at any optimization level"))

EnableUnrollAndJam
static cl::opt< bool > EnableUnrollAndJam("enable-unroll-and-jam", cl::init(false), cl::Hidden, cl::desc("Enable Unroll And Jam Pass"))

InstrumentColdFuncOnlyPath
static cl::opt< std::string > InstrumentColdFuncOnlyPath("instrument-cold-function-only-path", cl::init(""), cl::desc("File path for cold function only instrumentation(requires use " "with --pgo-instrument-cold-function-only)"), cl::Hidden)

PGOInstrumentColdFunctionOnly
cl::opt< bool > PGOInstrumentColdFunctionOnly

EnableModuleInliner
static cl::opt< bool > EnableModuleInliner("enable-module-inliner", cl::init(false), cl::Hidden, cl::desc("Enable module inliner"))

EnableMatrix
static cl::opt< bool > EnableMatrix("enable-matrix", cl::init(false), cl::Hidden, cl::desc("Enable lowering of the matrix intrinsics"))

AttributorRun
static cl::opt< AttributorRunOption > AttributorRun("attributor-enable", cl::Hidden, cl::init(AttributorRunOption::NONE), cl::desc("Enable the attributor inter-procedural deduction pass"), cl::values(clEnumValN(AttributorRunOption::ALL, "all", "enable all attributor runs"), clEnumValN(AttributorRunOption::MODULE, "module", "enable module-wide attributor runs"), clEnumValN(AttributorRunOption::CGSCC, "cgscc", "enable call graph SCC attributor runs"), clEnumValN(AttributorRunOption::NONE, "none", "disable attributor runs")))

UseLoopVersioningLICM
static cl::opt< bool > UseLoopVersioningLICM("enable-loop-versioning-licm", cl::init(false), cl::Hidden, cl::desc("Enable the experimental Loop Versioning LICM pass"))

isLTOPreLink
static bool isLTOPreLink(ThinOrFullLTOPhase Phase)
Definition PassBuilderPipelines.cpp:407

EnablePGOInlineDeferral
static cl::opt< bool > EnablePGOInlineDeferral("enable-npm-pgo-inline-deferral", cl::init(true), cl::Hidden, cl::desc("Enable inline deferral during PGO"))
Flag to enable inline deferral during PGO.

EnableJumpTableToSwitch
static cl::opt< bool > EnableJumpTableToSwitch("enable-jump-table-to-switch", cl::desc("Enable JumpTableToSwitch pass (default = off)"))

UseInlineAdvisor
static cl::opt< InliningAdvisorMode > UseInlineAdvisor("enable-ml-inliner", cl::init(InliningAdvisorMode::Default), cl::Hidden, cl::desc("Enable ML policy for inliner. Currently trained for -Oz only"), cl::values(clEnumValN(InliningAdvisorMode::Default, "default", "Heuristics-based inliner version"), clEnumValN(InliningAdvisorMode::Development, "development", "Use development mode (runtime-loadable model)"), clEnumValN(InliningAdvisorMode::Release, "release", "Use release mode (AOT-compiled model)")))

isLTOPostLink
static bool isLTOPostLink(ThinOrFullLTOPhase Phase)
Definition PassBuilderPipelines.cpp:413

EnableConstraintElimination
static cl::opt< bool > EnableConstraintElimination("enable-constraint-elimination", cl::init(true), cl::Hidden, cl::desc("Enable pass to eliminate conditions based on linear constraints"))

EnableLoopFlatten
static cl::opt< bool > EnableLoopFlatten("enable-loop-flatten", cl::init(false), cl::Hidden, cl::desc("Enable the LoopFlatten Pass"))

Pass.h

ProfileSummaryInfo.h

Reassociate.h

RelLookupTableConverter.h
This file implements relative lookup table converter that converts lookup tables to relative lookup t...

SLPVectorizer.h

SROA.h
This file provides the interface for LLVM's Scalar Replacement of Aggregates pass.

SampleProfileProbe.h
This file provides the interface for the pseudo probe implementation for AutoFDO.

SampleProfile.h
This file provides the interface for the sampled PGO loader pass.

SCCP.h

ScopedNoAliasAA.h
This is the interface for a metadata-based scoped no-alias analysis.

SimpleLoopUnswitch.h

SimplifyCFGOptions.h

SimplifyCFG.h
This file provides the interface for the pass responsible for both simplifying and canonicalizing the...

SpeculativeExecution.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

TailRecursionElimination.h

TypeBasedAliasAnalysis.h
This is the interface for a metadata-based TBAA.

VectorCombine.h

VirtualFileSystem.h
Defines the virtual file system interface vfs::FileSystem.

WarnMissedTransforms.h

WholeProgramDevirt.h

llvm::AAManager
A manager for alias analyses.
Definition AliasAnalysis.h:974

llvm::AddDiscriminatorsPass
Definition AddDiscriminators.h:24

llvm::AggressiveInstCombinePass
Definition AggressiveInstCombine.h:23

llvm::AlwaysInlinerPass
Inlines functions marked as "always_inline".
Definition AlwaysInliner.h:33

llvm::ArgumentPromotionPass
Argument promotion pass.
Definition ArgumentPromotion.h:23

llvm::AssignGUIDPass
Assign a GUID to functions as metadata.
Definition CtxProfAnalysis.h:200

llvm::BasicAA
Analysis pass providing a never-invalidated alias analysis result.
Definition BasicAliasAnalysis.h:159

llvm::CGProfilePass
Definition CGProfile.h:19

llvm::CalledValuePropagationPass
Definition CalledValuePropagation.h:27

llvm::CanonicalizeAliasesPass
Simple pass that canonicalizes aliases.
Definition CanonicalizeAliases.h:23

llvm::ConstantMergePass
A pass that merges duplicate global constants into a single constant.
Definition ConstantMerge.h:29

llvm::ConstraintEliminationPass
Definition ConstraintElimination.h:17

llvm::ControlHeightReductionPass
Definition ControlHeightReduction.h:22

llvm::CrossDSOCFIPass
Definition CrossDSOCFI.h:20

llvm::DSEPass
This class implements a trivial dead store elimination.
Definition DeadStoreElimination.h:28

llvm::DeadArgumentEliminationPass
Eliminate dead arguments (and return values) from functions.
Definition DeadArgumentElimination.h:39

llvm::EliminateAvailableExternallyPass
A pass that transforms external global definitions into declarations.
Definition ElimAvailExtern.h:25

llvm::EmbedBitcodePass
Pass embeds a copy of the module optimized with the provided pass pipeline into a global variable.
Definition EmbedBitcodePass.h:38

llvm::ExpandVariadicsPass
Definition ExpandVariadics.h:26

llvm::ExtraFunctionPassManager::addPass
void addPass(PassT &&Pass)
Definition ExtraPassManager.h:63

llvm::ExtraLoopPassManager
A pass manager to run a set of extra loop passes if the MarkerTy analysis is present.
Definition ExtraPassManager.h:83

llvm::ExtraLoopPassManager::addPass
void addPass(PassT &&Pass)
Definition ExtraPassManager.h:87

llvm::FatLtoCleanup
Definition FatLTOCleanup.h:27

llvm::Float2IntPass
Definition Float2Int.h:31

llvm::GVNPass
The core GVN pass object.
Definition GVN.h:126

llvm::GlobalDCEPass
Pass to remove unused function declarations.
Definition GlobalDCE.h:38

llvm::GlobalOptPass
Optimize globals that never have their address taken.
Definition GlobalOpt.h:25

llvm::GlobalSplitPass
Pass to perform split of global variables.
Definition GlobalSplit.h:26

llvm::GlobalsAA
Analysis pass providing a never-invalidated alias analysis result.
Definition GlobalsModRef.h:131

llvm::HotColdSplittingPass
Pass to outline cold regions.
Definition HotColdSplitting.h:67

llvm::IPSCCPPass
Pass to perform interprocedural constant propagation.
Definition SCCP.h:48

llvm::IROutlinerPass
Pass to outline similar regions.
Definition IROutliner.h:444

llvm::IndVarSimplifyPass
Definition IndVarSimplify.h:25

llvm::InjectTLIMappings
Definition InjectTLIMappings.h:20

llvm::InstCombinePass
Definition InstCombine.h:49

llvm::InstSimplifyPass
Run instruction simplification across each instruction in the function.
Definition InstSimplifyPass.h:32

llvm::InstrProfilingLoweringPass
Instrumentation based profiling lowering pass.
Definition InstrProfiling.h:27

llvm::IntrusiveRefCntPtr
A smart pointer to a reference-counted object that inherits from RefCountedBase or ThreadSafeRefCount...
Definition IntrusiveRefCntPtr.h:173

llvm::JumpThreadingPass
This pass performs 'jump threading', which looks at blocks that have multiple predecessors and multip...
Definition JumpThreading.h:80

llvm::LICMPass
Performs Loop Invariant Code Motion Pass.
Definition LICM.h:66

llvm::LibCallsShrinkWrapPass
Definition LibCallsShrinkWrap.h:18

llvm::LoopDeletionPass
Definition LoopDeletion.h:24

llvm::LoopDistributePass
Definition LoopDistribute.h:25

llvm::LoopFlattenPass
Definition LoopFlatten.h:23

llvm::LoopFullUnrollPass
Loop unroll pass that only does full loop unrolling and peeling.
Definition LoopUnrollPass.h:26

llvm::LoopFusePass
Definition LoopFuse.h:23

llvm::LoopIdiomRecognizePass
Performs Loop Idiom Recognize Pass.
Definition LoopIdiomRecognize.h:49

llvm::LoopInstSimplifyPass
Performs Loop Inst Simplify Pass.
Definition LoopInstSimplify.h:25

llvm::LoopRotatePass
A simple loop rotation transformation.
Definition LoopRotation.h:24

llvm::LoopSimplifyCFGPass
Performs basic CFG simplifications to assist other loop passes.
Definition LoopSimplifyCFG.h:28

llvm::LoopSinkPass
A pass that does profile-guided sinking of instructions into loops.
Definition LoopSink.h:33

llvm::LoopUnrollAndJamPass
A simple loop rotation transformation.
Definition LoopUnrollAndJamPass.h:20

llvm::LoopUnrollPass
Loop unroll pass that will support both full and partial unrolling.
Definition LoopUnrollPass.h:133

llvm::LoopVersioningLICMPass
Definition LoopVersioningLICM.h:19

llvm::LowerMatrixIntrinsicsPass
Definition LowerMatrixIntrinsics.h:20

llvm::LowerTypeTestsPass
Definition LowerTypeTests.h:205

llvm::MemCpyOptPass
Definition MemCpyOptimizer.h:44

llvm::MemProfContextDisambiguation
Definition MemProfContextDisambiguation.h:31

llvm::MemProfUsePass
Definition MemProfUse.h:32

llvm::MergeFunctionsPass
Merge identical functions.
Definition MergeFunctions.h:27

llvm::MergedLoadStoreMotionPass
Definition MergedLoadStoreMotion.h:43

llvm::ModuleInlinerPass
The module inliner pass for the new pass manager.
Definition ModuleInliner.h:28

llvm::ModuleInlinerWrapperPass
Module pass, wrapping the inliner pass.
Definition Inliner.h:65

llvm::ModuleInlinerWrapperPass::addModulePass
void addModulePass(T Pass)
Add a module pass that runs before the CGSCC passes.
Definition Inliner.h:81

llvm::ModuleSummaryIndex
Class to hold module path string table and global value map, and encapsulate methods for operating on...
Definition ModuleSummaryIndex.h:1396

llvm::MoveAutoInitPass
Definition MoveAutoInit.h:23

llvm::NameAnonGlobalPass
Simple pass that provides a name to every anonymous globals.
Definition NameAnonGlobals.h:22

llvm::NewGVNPass
Definition NewGVN.h:23

llvm::NoinlineNonPrevailing
Definition PGOCtxProfLowering.h:35

llvm::OpenMPOptCGSCCPass
Definition OpenMPOpt.h:53

llvm::OpenMPOptPass
OpenMP optimizations pass.
Definition OpenMPOpt.h:42

llvm::OptimizationLevel
Definition OptimizationLevel.h:23

llvm::OptimizationLevel::O3
static LLVM_ABI const OptimizationLevel O3
Optimize for fast execution as much as possible.
Definition OptimizationLevel.h:90

llvm::OptimizationLevel::Oz
static LLVM_ABI const OptimizationLevel Oz
A very specialized mode that will optimize for code size at any and all costs.
Definition OptimizationLevel.h:109

llvm::OptimizationLevel::O0
static LLVM_ABI const OptimizationLevel O0
Disable as many optimizations as possible.
Definition OptimizationLevel.h:42

llvm::OptimizationLevel::Os
static LLVM_ABI const OptimizationLevel Os
Similar to O2 but tries to optimize for small code size instead of fast execution without triggering ...
Definition OptimizationLevel.h:101

llvm::OptimizationLevel::O2
static LLVM_ABI const OptimizationLevel O2
Optimize for fast execution as much as possible without triggering significant incremental compile ti...
Definition OptimizationLevel.h:75

llvm::OptimizationLevel::O1
static LLVM_ABI const OptimizationLevel O1
Optimize quickly without destroying debuggability.
Definition OptimizationLevel.h:58

llvm::PGOCtxProfFlatteningPass
Definition PGOCtxProfFlattening.h:19

llvm::PGOCtxProfLoweringPass
Definition PGOCtxProfLowering.h:19

llvm::PGOCtxProfLoweringPass::isCtxIRPGOInstrEnabled
static bool isCtxIRPGOInstrEnabled()
Definition PGOCtxProfLowering.cpp:41

llvm::PGOIndirectCallPromotion
The indirect function call promotion pass.
Definition PGOInstrumentation.h:87

llvm::PGOInstrumentationGenCreateVar
The instrumentation (profile-instr-gen) pass for IR based PGO.
Definition PGOInstrumentation.h:42

llvm::PGOInstrumentationGen
The instrumentation (profile-instr-gen) pass for IR based PGO.
Definition PGOInstrumentation.h:56

llvm::PGOInstrumentationUse
The profile annotation (profile-instr-use) pass for IR based PGO.
Definition PGOInstrumentation.h:69

llvm::PGOMemOPSizeOpt
The profile size based optimization pass for memory intrinsics.
Definition PGOInstrumentation.h:100

llvm::PartialInlinerPass
Pass to remove unused function declarations.
Definition PartialInlining.h:24

llvm::PassBuilder::invokeFullLinkTimeOptimizationLastEPCallbacks
LLVM_ABI void invokeFullLinkTimeOptimizationLastEPCallbacks(ModulePassManager &MPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:385

llvm::PassBuilder::buildInlinerPipeline
LLVM_ABI ModuleInlinerWrapperPass buildInlinerPipeline(OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Construct the module pipeline that performs inlining as well as the inlining-driven cleanups.
Definition PassBuilderPipelines.cpp:920

llvm::PassBuilder::invokeOptimizerEarlyEPCallbacks
LLVM_ABI void invokeOptimizerEarlyEPCallbacks(ModulePassManager &MPM, OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Definition PassBuilderPipelines.cpp:368

llvm::PassBuilder::invokeVectorizerStartEPCallbacks
LLVM_ABI void invokeVectorizerStartEPCallbacks(FunctionPassManager &FPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:358

llvm::PassBuilder::buildDefaultAAPipeline
LLVM_ABI AAManager buildDefaultAAPipeline()
Build the default AAManager with the default alias analysis pipeline registered.
Definition PassBuilderPipelines.cpp:2336

llvm::PassBuilder::invokeCGSCCOptimizerLateEPCallbacks
LLVM_ABI void invokeCGSCCOptimizerLateEPCallbacks(CGSCCPassManager &CGPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:353

llvm::PassBuilder::buildThinLTOPreLinkDefaultPipeline
LLVM_ABI ModulePassManager buildThinLTOPreLinkDefaultPipeline(OptimizationLevel Level)
Build a pre-link, ThinLTO-targeting default optimization pipeline to a pass manager.
Definition PassBuilderPipelines.cpp:1738

llvm::PassBuilder::invokeScalarOptimizerLateEPCallbacks
LLVM_ABI void invokeScalarOptimizerLateEPCallbacks(FunctionPassManager &FPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:348

llvm::PassBuilder::buildPerModuleDefaultPipeline
LLVM_ABI ModulePassManager buildPerModuleDefaultPipeline(OptimizationLevel Level, ThinOrFullLTOPhase Phase=ThinOrFullLTOPhase::None)
Build a per-module default optimization pipeline.
Definition PassBuilderPipelines.cpp:1651

llvm::PassBuilder::invokePipelineStartEPCallbacks
LLVM_ABI void invokePipelineStartEPCallbacks(ModulePassManager &MPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:390

llvm::PassBuilder::invokeVectorizerEndEPCallbacks
LLVM_ABI void invokeVectorizerEndEPCallbacks(FunctionPassManager &FPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:363

llvm::PassBuilder::buildO0DefaultPipeline
LLVM_ABI ModulePassManager buildO0DefaultPipeline(OptimizationLevel Level, ThinOrFullLTOPhase Phase=ThinOrFullLTOPhase::None)
Build an O0 pipeline with the minimal semantically required passes.
Definition PassBuilderPipelines.cpp:2219

llvm::PassBuilder::buildFunctionSimplificationPipeline
LLVM_ABI FunctionPassManager buildFunctionSimplificationPipeline(OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Construct the core LLVM function canonicalization and simplification pipeline.
Definition PassBuilderPipelines.cpp:570

llvm::PassBuilder::invokePeepholeEPCallbacks
LLVM_ABI void invokePeepholeEPCallbacks(FunctionPassManager &FPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:333

llvm::PassBuilder::invokePipelineEarlySimplificationEPCallbacks
LLVM_ABI void invokePipelineEarlySimplificationEPCallbacks(ModulePassManager &MPM, OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Definition PassBuilderPipelines.cpp:395

llvm::PassBuilder::invokeLoopOptimizerEndEPCallbacks
LLVM_ABI void invokeLoopOptimizerEndEPCallbacks(LoopPassManager &LPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:343

llvm::PassBuilder::buildLTODefaultPipeline
LLVM_ABI ModulePassManager buildLTODefaultPipeline(OptimizationLevel Level, ModuleSummaryIndex *ExportSummary)
Build an LTO default optimization pipeline to a pass manager.
Definition PassBuilderPipelines.cpp:1867

llvm::PassBuilder::buildModuleInlinerPipeline
LLVM_ABI ModulePassManager buildModuleInlinerPipeline(OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Construct the module pipeline that performs inlining with module inliner pass.
Definition PassBuilderPipelines.cpp:1019

llvm::PassBuilder::buildThinLTODefaultPipeline
LLVM_ABI ModulePassManager buildThinLTODefaultPipeline(OptimizationLevel Level, const ModuleSummaryIndex *ImportSummary)
Build a ThinLTO default optimization pipeline to a pass manager.
Definition PassBuilderPipelines.cpp:1799

llvm::PassBuilder::invokeLateLoopOptimizationsEPCallbacks
LLVM_ABI void invokeLateLoopOptimizationsEPCallbacks(LoopPassManager &LPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:338

llvm::PassBuilder::invokeFullLinkTimeOptimizationEarlyEPCallbacks
LLVM_ABI void invokeFullLinkTimeOptimizationEarlyEPCallbacks(ModulePassManager &MPM, OptimizationLevel Level)
Definition PassBuilderPipelines.cpp:380

llvm::PassBuilder::buildFatLTODefaultPipeline
LLVM_ABI ModulePassManager buildFatLTODefaultPipeline(OptimizationLevel Level, bool ThinLTO, bool EmitSummary)
Build a fat object default optimization pipeline.
Definition PassBuilderPipelines.cpp:1689

llvm::PassBuilder::buildModuleSimplificationPipeline
LLVM_ABI ModulePassManager buildModuleSimplificationPipeline(OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Construct the core LLVM module canonicalization and simplification pipeline.
Definition PassBuilderPipelines.cpp:1067

llvm::PassBuilder::buildModuleOptimizationPipeline
LLVM_ABI ModulePassManager buildModuleOptimizationPipeline(OptimizationLevel Level, ThinOrFullLTOPhase LTOPhase)
Construct the core LLVM module optimization pipeline.
Definition PassBuilderPipelines.cpp:1445

llvm::PassBuilder::addPGOInstrPassesForO0
LLVM_ABI void addPGOInstrPassesForO0(ModulePassManager &MPM, bool RunProfileGen, bool IsCS, bool AtomicCounterUpdate, std::string ProfileFile, std::string ProfileRemappingFile, IntrusiveRefCntPtr< vfs::FileSystem > FS)
Add PGOInstrumenation passes for O0 only.
Definition PassBuilderPipelines.cpp:887

llvm::PassBuilder::invokeOptimizerLastEPCallbacks
LLVM_ABI void invokeOptimizerLastEPCallbacks(ModulePassManager &MPM, OptimizationLevel Level, ThinOrFullLTOPhase Phase)
Definition PassBuilderPipelines.cpp:374

llvm::PassBuilder::buildLTOPreLinkDefaultPipeline
LLVM_ABI ModulePassManager buildLTOPreLinkDefaultPipeline(OptimizationLevel Level)
Build a pre-link, LTO-targeting default optimization pipeline to a pass manager.
Definition PassBuilderPipelines.cpp:1860

llvm::PassManager::addPass
LLVM_ATTRIBUTE_MINSIZE std::enable_if_t<!std::is_same_v< PassT, PassManager > > addPass(PassT &&Pass)
Definition PassManager.h:196

llvm::PassManager::isEmpty
bool isEmpty() const
Returns if the pass manager contains any passes.
Definition PassManager.h:218

llvm::PipelineTuningOptions::LicmMssaNoAccForPromotionCap
unsigned LicmMssaNoAccForPromotionCap
Tuning option to disable promotion to scalars in LICM with MemorySSA, if the number of access is too ...
Definition PassBuilder.h:81

llvm::PipelineTuningOptions::SLPVectorization
bool SLPVectorization
Tuning option to enable/disable slp loop vectorization, set based on opt level.
Definition PassBuilder.h:59

llvm::PipelineTuningOptions::InlinerThreshold
int InlinerThreshold
Tuning option to override the default inliner threshold.
Definition PassBuilder.h:95

llvm::PipelineTuningOptions::LoopFusion
bool LoopFusion
Tuning option to enable/disable loop fusion. Its default value is false.
Definition PassBuilder.h:69

llvm::PipelineTuningOptions::EagerlyInvalidateAnalyses
bool EagerlyInvalidateAnalyses
Definition PassBuilder.h:104

llvm::PipelineTuningOptions::CallGraphProfile
bool CallGraphProfile
Tuning option to enable/disable call graph profile.
Definition PassBuilder.h:85

llvm::PipelineTuningOptions::MergeFunctions
bool MergeFunctions
Tuning option to enable/disable function merging.
Definition PassBuilder.h:92

llvm::PipelineTuningOptions::ForgetAllSCEVInLoopUnroll
bool ForgetAllSCEVInLoopUnroll
Tuning option to forget all SCEV loops in LoopUnroll.
Definition PassBuilder.h:73

llvm::PipelineTuningOptions::LicmMssaOptCap
unsigned LicmMssaOptCap
Tuning option to cap the number of calls to retrive clobbering accesses in MemorySSA,...
Definition PassBuilder.h:77

llvm::PipelineTuningOptions::LoopInterleaving
bool LoopInterleaving
Tuning option to set loop interleaving on/off, set based on opt level.
Definition PassBuilder.h:51

llvm::PipelineTuningOptions::PipelineTuningOptions
LLVM_ABI PipelineTuningOptions()
Constructor sets pipeline tuning defaults based on cl::opts.
Definition PassBuilderPipelines.cpp:312

llvm::PipelineTuningOptions::LoopUnrolling
bool LoopUnrolling
Tuning option to enable/disable loop unrolling. Its default value is true.
Definition PassBuilder.h:62

llvm::PipelineTuningOptions::LoopInterchange
bool LoopInterchange
Tuning option to enable/disable loop interchange.
Definition PassBuilder.h:66

llvm::PipelineTuningOptions::LoopVectorization
bool LoopVectorization
Tuning option to enable/disable loop vectorization, set based on opt level.
Definition PassBuilder.h:55

llvm::PipelineTuningOptions::UnifiedLTO
bool UnifiedLTO
Definition PassBuilder.h:88

llvm::PromotePass
Definition Mem2Reg.h:24

llvm::PseudoProbeUpdatePass
Definition SampleProfileProbe.h:136

llvm::ReassociatePass
Reassociate commutative expressions.
Definition Reassociate.h:74

llvm::RelLookupTableConverterPass
Definition RelLookupTableConverter.h:62

llvm::ReversePostOrderFunctionAttrsPass
A pass to do RPO deduction and propagation of function attributes.
Definition FunctionAttrs.h:77

llvm::SCCPPass
This pass performs function-level constant propagation and merging.
Definition SCCP.h:30

llvm::SROAPass
Definition SROA.h:26

llvm::SampleProfileLoaderPass
The sample profiler data loader pass.
Definition SampleProfile.h:40

llvm::SampleProfileProbePass
Definition SampleProfileProbe.h:116

llvm::ScopedNoAliasAA
Analysis pass providing a never-invalidated alias analysis result.
Definition ScopedNoAliasAA.h:58

llvm::SimpleLoopUnswitchPass
This pass transforms loops that contain branches or switches on loop- invariant conditions to have mu...
Definition SimpleLoopUnswitch.h:68

llvm::SimplifyCFGPass
A pass to simplify and canonicalize the CFG of a function.
Definition SimplifyCFG.h:30

llvm::SimplifyTypeTestsPass
Definition LowerTypeTests.h:224

llvm::SpeculativeExecutionPass
Definition SpeculativeExecution.h:72

llvm::TailCallElimPass
Definition TailRecursionElimination.h:61

llvm::TypeBasedAA
Analysis pass providing a never-invalidated alias analysis result.
Definition TypeBasedAliasAnalysis.h:75

llvm::VectorCombinePass
Optimize scalar/vector interactions in IR using target cost models.
Definition VectorCombine.h:23

llvm::WarnMissedTransformationsPass
Definition WarnMissedTransforms.h:21

llvm::cl::opt
Definition CommandLine.h:1429

PassBuilder.h
Interfaces for registering analysis passes, producing common pass manager configurations,...

ErrorHandling.h

TargetMachine.h

llvm::AA
Abstract Attribute helper functions.
Definition Attributor.h:165

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::PICLevel::Level
Level
Definition CodeGen.h:36

llvm::cl::Hidden
@ Hidden
Definition CommandLine.h:138

llvm::cl::values
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to ...
Definition CommandLine.h:712

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition CommandLine.h:444

llvm::lowertypetests::DropTestKind::Assume
@ Assume
Do not drop type tests (default).
Definition LowerTypeTests.h:199

llvm::lowertypetests::DropTestKind::All
@ All
Drop only llvm.assumes using type test value.
Definition LowerTypeTests.h:200

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::EnableKnowledgeRetention
LLVM_ABI cl::opt< bool > EnableKnowledgeRetention

llvm::InlinePass::CGSCCInliner
@ CGSCCInliner
Definition InlineAdvisor.h:48

llvm::InlinePass::EarlyInliner
@ EarlyInliner
Definition InlineAdvisor.h:49

llvm::createModuleToFunctionPassAdaptor
ModuleToFunctionPassAdaptor createModuleToFunctionPassAdaptor(FunctionPassT &&Pass, bool EagerlyInvalidate=false)
A function to deduce a function pass type and wrap it in the templated adaptor.
Definition PassManager.h:877

llvm::InliningAdvisorMode::Development
@ Development
Definition InlineAdvisor.h:43

llvm::InliningAdvisorMode::Default
@ Default
Definition InlineAdvisor.h:43

llvm::InliningAdvisorMode::Release
@ Release
Definition InlineAdvisor.h:43

llvm::PGOInstrumentationType::CTXPROF
@ CTXPROF
Definition PGOInstrumentation.h:54

llvm::PGOInstrumentationType::CSFDO
@ CSFDO
Definition PGOInstrumentation.h:54

llvm::PGOInstrumentationType::FDO
@ FDO
Definition PGOInstrumentation.h:54

llvm::ExpandVariadicsMode::Optimize
@ Optimize
Definition ExpandVariadics.h:22

llvm::CGSCCPassManager
PassManager< LazyCallGraph::SCC, CGSCCAnalysisManager, LazyCallGraph &, CGSCCUpdateResult & > CGSCCPassManager
The CGSCC pass manager.
Definition CGSCCPassManager.h:143

llvm::MODULE
@ MODULE
Definition Attributor.h:6613

llvm::ALL
@ ALL
Definition Attributor.h:6615

llvm::CGSCC
@ CGSCC
Definition Attributor.h:6614

llvm::ThinOrFullLTOPhase
ThinOrFullLTOPhase
This enumerates the LLVM full LTO or ThinLTO optimization phases.
Definition Pass.h:77

llvm::ThinOrFullLTOPhase::FullLTOPreLink
@ FullLTOPreLink
Full LTO prelink phase.
Definition Pass.h:85

llvm::ThinOrFullLTOPhase::ThinLTOPostLink
@ ThinLTOPostLink
ThinLTO postlink (backend compile) phase.
Definition Pass.h:83

llvm::ThinOrFullLTOPhase::None
@ None
No LTO/ThinLTO behavior needed.
Definition Pass.h:79

llvm::ThinOrFullLTOPhase::FullLTOPostLink
@ FullLTOPostLink
Full LTO postlink (backend compile) phase.
Definition Pass.h:87

llvm::ThinOrFullLTOPhase::ThinLTOPreLink
@ ThinLTOPreLink
ThinLTO prelink (summary) phase.
Definition Pass.h:81

llvm::LoopPassManager
PassManager< Loop, LoopAnalysisManager, LoopStandardAnalysisResults &, LPMUpdater & > LoopPassManager
The Loop pass manager.
Definition LoopPassManager.h:181

llvm::createModuleToPostOrderCGSCCPassAdaptor
ModuleToPostOrderCGSCCPassAdaptor createModuleToPostOrderCGSCCPassAdaptor(CGSCCPassT &&Pass)
A function to deduce a function pass type and wrap it in the templated adaptor.
Definition CGSCCPassManager.h:359

llvm::createFunctionToLoopPassAdaptor
FunctionToLoopPassAdaptor createFunctionToLoopPassAdaptor(LoopPassT &&Pass, bool UseMemorySSA=false, bool UseBlockFrequencyInfo=false)
A function to deduce a loop pass type and wrap it in the templated adaptor.
Definition LoopPassManager.h:445

llvm::createCGSCCToFunctionPassAdaptor
CGSCCToFunctionPassAdaptor createCGSCCToFunctionPassAdaptor(FunctionPassT &&Pass, bool EagerlyInvalidate=false, bool NoRerun=false)
A function to deduce a function pass type and wrap it in the templated adaptor.
Definition CGSCCPassManager.h:506

llvm::ForgetSCEVInLoopUnroll
cl::opt< bool > ForgetSCEVInLoopUnroll

llvm::ModulePassManager
PassManager< Module > ModulePassManager
Convenience typedef for a pass manager over modules.
Definition PassManager.h:239

llvm::AreStatisticsEnabled
LLVM_ABI bool AreStatisticsEnabled()
Check if statistics are enabled.
Definition Statistic.cpp:139

llvm::EnableMemProfContextDisambiguation
cl::opt< bool > EnableMemProfContextDisambiguation
Enable MemProf context disambiguation for thin link.
Definition PassBuilderPipelines.cpp:309

llvm::FunctionPassManager
PassManager< Function > FunctionPassManager
Convenience typedef for a pass manager over functions.
Definition PassManager.h:248

llvm::getInlineParams
LLVM_ABI InlineParams getInlineParams()
Generate the parameters to tune the inline cost analysis based only on the commandline options.
Definition InlineCost.cpp:3428

llvm::SetLicmMssaNoAccForPromotionCap
cl::opt< unsigned > SetLicmMssaNoAccForPromotionCap

llvm::MaxDevirtIterations
cl::opt< unsigned > MaxDevirtIterations("max-devirt-iterations", cl::ReallyHidden, cl::init(4))
Definition PassBuilderPipelines.cpp:330

llvm::SetLicmMssaOptCap
cl::opt< unsigned > SetLicmMssaOptCap

llvm::SROAOptions::PreserveCFG
@ PreserveCFG
Definition SROA.h:24

llvm::SROAOptions::ModifyCFG
@ ModifyCFG
Definition SROA.h:24

llvm::ADCEPass
A DCE pass that assumes instructions are dead until proven otherwise.
Definition ADCE.h:31

llvm::Annotation2MetadataPass
Pass to convert @llvm.global.annotations to !annotation metadata.
Definition Annotation2Metadata.h:24

llvm::AnnotationRemarksPass
Definition AnnotationRemarks.h:23

llvm::AssumeSimplifyPass
This pass attempts to minimize the number of assume without loosing any information.
Definition AssumeBundleBuilder.h:59

llvm::AttributorCGSCCPass
Definition Attributor.h:3480

llvm::AttributorPass
}
Definition Attributor.h:3477

llvm::BDCEPass
Definition BDCE.h:26

llvm::CallSiteSplittingPass
Definition CallSiteSplitting.h:18

llvm::CoroAnnotationElidePass
Definition CoroAnnotationElide.h:26

llvm::CoroCleanupPass
Definition CoroCleanup.h:23

llvm::CoroConditionalWrapper
Definition CoroConditionalWrapper.h:20

llvm::CoroEarlyPass
Definition CoroEarly.h:26

llvm::CoroElidePass
Definition CoroElide.h:25

llvm::CoroSplitPass
Definition CoroSplit.h:31

llvm::CorrelatedValuePropagationPass
Definition CorrelatedValuePropagation.h:19

llvm::CountVisitsPass
Definition CountVisits.h:19

llvm::DFAJumpThreadingPass
Definition DFAJumpThreading.h:22

llvm::DivRemPairsPass
Hoist/decompose integer division and remainder instructions to enable CFG improvements and better cod...
Definition DivRemPairs.h:23

llvm::DropUnnecessaryAssumesPass
Definition DropUnnecessaryAssumes.h:21

llvm::EarlyCSEPass
A simple and fast domtree-based CSE pass.
Definition EarlyCSE.h:31

llvm::EntryExitInstrumenterPass
Definition EntryExitInstrumenter.h:25

llvm::ForceFunctionAttrsPass
Pass which forces specific function attributes into the IR, primarily as a debugging tool.
Definition ForceFunctionAttrs.h:23

llvm::GVNHoistPass
A simple and fast domtree-based GVN pass to hoist common expressions from sibling branches.
Definition GVN.h:417

llvm::GVNSinkPass
Uses an "inverted" value numbering to decide the similarity of expressions and sinks similar expressi...
Definition GVN.h:424

llvm::IPSCCPOptions
A set of parameters to control various transforms performed by IPSCCP pass.
Definition SCCP.h:35

llvm::InferAlignmentPass
Definition InferAlignment.h:21

llvm::InferFunctionAttrsPass
A pass which infers function attributes from the names and signatures of function declarations in a m...
Definition InferFunctionAttrs.h:25

llvm::InlineContext
Provides context on when an inline advisor is constructed in the pipeline (e.g., link phase,...
Definition InlineAdvisor.h:59

llvm::InlineParams
Thresholds to tune inline cost analysis.
Definition InlineCost.h:207

llvm::InlineParams::HotCallSiteThreshold
std::optional< int > HotCallSiteThreshold
Threshold to use when the callsite is considered hot.
Definition InlineCost.h:224

llvm::InlineParams::DefaultThreshold
int DefaultThreshold
The default threshold to start with for a callee.
Definition InlineCost.h:209

llvm::InlineParams::EnableDeferral
std::optional< bool > EnableDeferral
Indicate whether we should allow inline deferral.
Definition InlineCost.h:237

llvm::InlineParams::HintThreshold
std::optional< int > HintThreshold
Threshold to use for callees with inline hint.
Definition InlineCost.h:212

llvm::InstrProfOptions
Options for the frontend instrumentation based profiling pass.
Definition Instrumentation.h:117

llvm::InvalidateAnalysisPass
A no-op pass template which simply forces a specific analysis result to be invalidated.
Definition PassManager.h:930

llvm::JumpTableToSwitchPass
Definition JumpTableToSwitch.h:18

llvm::LoopInterchangePass
Definition LoopInterchange.h:20

llvm::LoopLoadEliminationPass
Pass to forward loads in a loop around the backedge to subsequent iterations.
Definition LoopLoadElimination.h:27

llvm::LoopUnrollOptions
A set of parameters used to control various transforms performed by the LoopUnroll pass.
Definition LoopUnrollPass.h:61

llvm::LoopVectorizeOptions
Definition LoopVectorize.h:85

llvm::LoopVectorizePass
The LoopVectorize Pass.
Definition LoopVectorize.h:131

llvm::LowerConstantIntrinsicsPass
Definition LowerConstantIntrinsics.h:30

llvm::LowerExpectIntrinsicPass
Definition LowerExpectIntrinsic.h:25

llvm::PGOForceFunctionAttrsPass
Definition PGOForceFunctionAttrs.h:18

llvm::PGOOptions::IRUse
@ IRUse
Definition PGOOptions.h:29

llvm::PGOOptions::IRInstr
@ IRInstr
Definition PGOOptions.h:29

llvm::PGOOptions::SampleUse
@ SampleUse
Definition PGOOptions.h:29

llvm::PGOOptions::CSIRUse
@ CSIRUse
Definition PGOOptions.h:30

llvm::PGOOptions::CSIRInstr
@ CSIRInstr
Definition PGOOptions.h:30

llvm::PostOrderFunctionAttrsPass
Computes function attributes in post-order over the call graph.
Definition FunctionAttrs.h:51

llvm::RecomputeGlobalsAAPass
Definition GlobalsModRef.h:141

llvm::RequireAnalysisPass
A utility pass template to force an analysis result to be available.
Definition PassManager.h:903

llvm::SimplifyCFGOptions
Definition SimplifyCFGOptions.h:23

llvm::WholeProgramDevirtPass
Definition WholeProgramDevirt.h:225

llvm::cl::desc
Definition CommandLine.h:410