CbC/CbC_llvm: lib/Passes/PassBuilder.cpp comparison

comparison lib/Passes/PassBuilder.cpp @ 134:3a76565eade5 LLVM5.0.1

update 5.0.1

author	mir3636
date	Sat, 17 Feb 2018 09:57:20 +0900
parents	803732b1fca8
children	c2174574ed3a

comparison

equal deleted inserted replaced

-:c60214abe0e8
+:3a76565eade5
 #include "llvm/Analysis/AliasAnalysis.h"
 #include "llvm/Analysis/AliasAnalysisEvaluator.h"
 #include "llvm/Analysis/AssumptionCache.h"
 #include "llvm/Analysis/BasicAliasAnalysis.h"
 #include "llvm/Analysis/BlockFrequencyInfo.h"
-#include "llvm/Analysis/BlockFrequencyInfoImpl.h"
 #include "llvm/Analysis/BranchProbabilityInfo.h"
 #include "llvm/Analysis/CFGPrinter.h"
 #include "llvm/Analysis/CFLAndersAliasAnalysis.h"
 #include "llvm/Analysis/CFLSteensAliasAnalysis.h"
 #include "llvm/Analysis/CGSCCPassManager.h"
 #include "llvm/IR/PassManager.h"
 #include "llvm/IR/Verifier.h"
 #include "llvm/Support/Debug.h"
 #include "llvm/Support/Regex.h"
 #include "llvm/Target/TargetMachine.h"
+#include "llvm/Transforms/AggressiveInstCombine/AggressiveInstCombine.h"
 #include "llvm/Transforms/GCOVProfiler.h"
 #include "llvm/Transforms/IPO/AlwaysInliner.h"
 #include "llvm/Transforms/IPO/ArgumentPromotion.h"
 #include "llvm/Transforms/IPO/CalledValuePropagation.h"
 #include "llvm/Transforms/IPO/ConstantMerge.h"
 #include "llvm/Transforms/IPO/Internalize.h"
 #include "llvm/Transforms/IPO/LowerTypeTests.h"
 #include "llvm/Transforms/IPO/PartialInlining.h"
 #include "llvm/Transforms/IPO/SCCP.h"
 #include "llvm/Transforms/IPO/StripDeadPrototypes.h"
+#include "llvm/Transforms/IPO/SyntheticCountsPropagation.h"
 #include "llvm/Transforms/IPO/WholeProgramDevirt.h"
 #include "llvm/Transforms/InstCombine/InstCombine.h"
 #include "llvm/Transforms/InstrProfiling.h"
+#include "llvm/Transforms/Instrumentation/BoundsChecking.h"
 #include "llvm/Transforms/PGOInstrumentation.h"
 #include "llvm/Transforms/SampleProfile.h"
 #include "llvm/Transforms/Scalar/ADCE.h"
 #include "llvm/Transforms/Scalar/AlignmentFromAssumptions.h"
 #include "llvm/Transforms/Scalar/BDCE.h"
+#include "llvm/Transforms/Scalar/CallSiteSplitting.h"
 #include "llvm/Transforms/Scalar/ConstantHoisting.h"
 #include "llvm/Transforms/Scalar/CorrelatedValuePropagation.h"
 #include "llvm/Transforms/Scalar/DCE.h"
 #include "llvm/Transforms/Scalar/DeadStoreElimination.h"
 #include "llvm/Transforms/Scalar/DivRemPairs.h"
 #include "llvm/Transforms/Scalar/MergedLoadStoreMotion.h"
 #include "llvm/Transforms/Scalar/NaryReassociate.h"
 #include "llvm/Transforms/Scalar/NewGVN.h"
 #include "llvm/Transforms/Scalar/PartiallyInlineLibCalls.h"
 #include "llvm/Transforms/Scalar/Reassociate.h"
+#include "llvm/Transforms/Scalar/RewriteStatepointsForGC.h"
 #include "llvm/Transforms/Scalar/SCCP.h"
 #include "llvm/Transforms/Scalar/SROA.h"
 #include "llvm/Transforms/Scalar/SimpleLoopUnswitch.h"
 #include "llvm/Transforms/Scalar/SimplifyCFG.h"
 #include "llvm/Transforms/Scalar/Sink.h"
+#include "llvm/Transforms/Scalar/SpeculateAroundPHIs.h"
 #include "llvm/Transforms/Scalar/SpeculativeExecution.h"
 #include "llvm/Transforms/Scalar/TailRecursionElimination.h"
 #include "llvm/Transforms/Utils/AddDiscriminators.h"
 #include "llvm/Transforms/Utils/BreakCriticalEdges.h"
+#include "llvm/Transforms/Utils/EntryExitInstrumenter.h"
 #include "llvm/Transforms/Utils/LCSSA.h"
 #include "llvm/Transforms/Utils/LibCallsShrinkWrap.h"
 #include "llvm/Transforms/Utils/LoopSimplify.h"
 #include "llvm/Transforms/Utils/LowerInvoke.h"
 #include "llvm/Transforms/Utils/Mem2Reg.h"
 #include "llvm/Transforms/Utils/NameAnonGlobals.h"
-#include "llvm/Transforms/Utils/PredicateInfo.h"
 #include "llvm/Transforms/Utils/SimplifyInstructions.h"
 #include "llvm/Transforms/Utils/SymbolRewriter.h"
 #include "llvm/Transforms/Vectorize/LoopVectorize.h"
 #include "llvm/Transforms/Vectorize/SLPVectorizer.h"
-#include <type_traits>
 using namespace llvm;
 static cl::opt<unsigned> MaxDevirtIterations("pm-max-devirt-iterations",
 cl::ReallyHidden, cl::init(4));
 cl::desc("Enable the GVN hoisting pass for the new PM (default = off)"));
 static cl::opt<bool> EnableGVNSink(
 "enable-npm-gvn-sink", cl::init(false), cl::Hidden,
 cl::desc("Enable the GVN hoisting pass for the new PM (default = off)"));
+static cl::opt<bool> EnableSyntheticCounts(
+"enable-npm-synthetic-counts", cl::init(false), cl::Hidden, cl::ZeroOrMore,
+cl::desc("Run synthetic function entry count generation "
+"pass"));
 static Regex DefaultAliasRegex(
 "^(default|thinlto-pre-link|thinlto|lto-pre-link|lto)<(O[0123sz])>$");
 static bool isOptimizingForSize(PassBuilder::OptimizationLevel Level) {
 // Optimize based on known information about branches, and cleanup afterward.
 FPM.addPass(JumpThreadingPass());
 FPM.addPass(CorrelatedValuePropagationPass());
 FPM.addPass(SimplifyCFGPass());
+if (Level == O3)
+FPM.addPass(AggressiveInstCombinePass());
 FPM.addPass(InstCombinePass());
 if (!isOptimizingForSize(Level))
 FPM.addPass(LibCallsShrinkWrapPass());
 C(LPM2, Level);
 // We provide the opt remark emitter pass for LICM to use. We only need to do
 // this once as it is immutable.
 FPM.addPass(RequireAnalysisPass<OptimizationRemarkEmitterAnalysis, Function>());
-FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM1)));
+FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM1), DebugLogging));
 FPM.addPass(SimplifyCFGPass());
 FPM.addPass(InstCombinePass());
-FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM2)));
+FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM2), DebugLogging));
 // Eliminate redundancies.
 if (Level != O1) {
 // These passes add substantial compile time so skip them at O1.
 FPM.addPass(MergedLoadStoreMotionPass());
 // Re-consider control flow based optimizations after redundancy elimination,
 // redo DCE, etc.
 FPM.addPass(JumpThreadingPass());
 FPM.addPass(CorrelatedValuePropagationPass());
 FPM.addPass(DSEPass());
-FPM.addPass(createFunctionToLoopPassAdaptor(LICMPass()));
+FPM.addPass(createFunctionToLoopPassAdaptor(LICMPass(), DebugLogging));
 for (auto &C : ScalarOptimizerLateEPCallbacks)
 C(FPM, Level);
 // Finally, do an expensive DCE pass to catch all the dead code exposed by
 if (RunProfileGen) {
 MPM.addPass(PGOInstrumentationGen());
 FunctionPassManager FPM;
-FPM.addPass(createFunctionToLoopPassAdaptor(LoopRotatePass()));
+FPM.addPass(
+createFunctionToLoopPassAdaptor(LoopRotatePass(), DebugLogging));
 MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));
 // Add the profile lowering pass.
 InstrProfOptions Options;
 if (!ProfileGenFile.empty())
 FunctionPassManager EarlyFPM(DebugLogging);
 EarlyFPM.addPass(SimplifyCFGPass());
 EarlyFPM.addPass(SROA());
 EarlyFPM.addPass(EarlyCSEPass());
 EarlyFPM.addPass(LowerExpectIntrinsicPass());
+if (Level == O3)
+EarlyFPM.addPass(CallSiteSplittingPass());
 // In SamplePGO ThinLTO backend, we need instcombine before profile annotation
 // to convert bitcast to direct calls so that they can be inlined during the
 // profile annotation preparation step.
 // More details about SamplePGO design can be found in:
 // https://research.google.com/pubs/pub45290.html
 // removed.
 MPM.addPass(PGOIndirectCallPromotion(Phase == ThinLTOPhase::PostLink,
 true));
 }
-// Interprocedural constant propagation now that basic cleanup has occured
+// Interprocedural constant propagation now that basic cleanup has occurred
 // and prior to optimizing globals.
 // FIXME: This position in the pipeline hasn't been carefully considered in
 // years, it should be re-analyzed.
 MPM.addPass(IPSCCPPass());
 (!PGOOpt->ProfileGenFile.empty() || !PGOOpt->ProfileUseFile.empty())) {
 addPGOInstrPasses(MPM, DebugLogging, Level, PGOOpt->RunProfileGen,
 PGOOpt->ProfileGenFile, PGOOpt->ProfileUseFile);
 MPM.addPass(PGOIndirectCallPromotion(false, false));
 }
+// Synthesize function entry counts for non-PGO compilation.
+if (EnableSyntheticCounts && !PGOOpt)
+MPM.addPass(SyntheticCountsPropagation());
 // Require the GlobalsAA analysis for the module so we can query it within
 // the CGSCC pipeline.
 MPM.addPass(RequireAnalysisPass<GlobalsAA, Module>());
 for (auto &C : VectorizerStartEPCallbacks)
 C(OptimizePM, Level);
 // First rotate loops that may have been un-rotated by prior passes.
-OptimizePM.addPass(createFunctionToLoopPassAdaptor(LoopRotatePass()));
+OptimizePM.addPass(
+createFunctionToLoopPassAdaptor(LoopRotatePass(), DebugLogging));
 // Distribute loops to allow partial vectorization.  I.e. isolate dependences
 // into a separate loop that would otherwise inhibit vectorization.  This is
 // currently only performed for loops marked with the metadata
 // llvm.loop.distribute=true or when -enable-loop-distribute is specified.
 OptimizePM.addPass(LoopLoadEliminationPass());
 // Cleanup after the loop optimization passes.
 OptimizePM.addPass(InstCombinePass());
 // Now that we've formed fast to execute loop structures, we do further
 // optimizations. These are run afterward as they might block doing complex
 // analyses and transforms such as what are needed for loop vectorization.
+// Cleanup after loop vectorization, etc. Simplification passes like CVP and
+// GVN, loop transforms, and others have already run, so it's now better to
+// convert to more optimized IR using more aggressive simplify CFG options.
+// The extra sinking transform can create larger basic blocks, so do this
+// before SLP vectorization.
+OptimizePM.addPass(SimplifyCFGPass(SimplifyCFGOptions().
+forwardSwitchCondToPhi(true).
+convertSwitchToLookupTable(true).
+needCanonicalLoops(false).
+sinkCommonInsts(true)));
 // Optimize parallel scalar instruction chains into SIMD instructions.
 OptimizePM.addPass(SLPVectorizerPass());
-// Cleanup after all of the vectorizers.
-OptimizePM.addPass(SimplifyCFGPass());
 OptimizePM.addPass(InstCombinePass());
 // Unroll small loops to hide loop backedge latency and saturate any parallel
 // execution resources of an out-of-order processor. We also then need to
 // clean up redundancies and loop invariant code.
 // combiner for cleanup here so that the unrolling and LICM can be pipelined
 // across the loop nests.
 OptimizePM.addPass(LoopUnrollPass(Level));
 OptimizePM.addPass(InstCombinePass());
 OptimizePM.addPass(RequireAnalysisPass<OptimizationRemarkEmitterAnalysis, Function>());
-OptimizePM.addPass(createFunctionToLoopPassAdaptor(LICMPass()));
+OptimizePM.addPass(createFunctionToLoopPassAdaptor(LICMPass(), DebugLogging));
 // Now that we've vectorized and unrolled loops, we may have more refined
 // alignment information, try to re-derive it here.
 OptimizePM.addPass(AlignmentFromAssumptionsPass());
 OptimizePM.addPass(DivRemPairsPass());
 // LoopSink (and other loop passes since the last simplifyCFG) might have
 // resulted in single-entry-single-exit or empty blocks. Clean up the CFG.
 OptimizePM.addPass(SimplifyCFGPass());
+// Optimize PHIs by speculating around them when profitable. Note that this
+// pass needs to be run after any PRE or similar pass as it is essentially
+// inserting redundancies into the program. This even includes SimplifyCFG.
+OptimizePM.addPass(SpeculateAroundPHIsPass());
 // Add the core optimizing pipeline.
 MPM.addPass(createModuleToFunctionPassAdaptor(std::move(OptimizePM)));
 // Now we need to do some global optimization transforms.
 ModulePassManager MPM(DebugLogging);
 // Force any function attributes we want the rest of the pipeline to observe.
 MPM.addPass(ForceFunctionAttrsPass());
+// Apply module pipeline start EP callback.
+for (auto &C : PipelineStartEPCallbacks)
+C(MPM);
 if (PGOOpt && PGOOpt->SamplePGOSupport)
 MPM.addPass(createModuleToFunctionPassAdaptor(AddDiscriminatorsPass()));
 // Add the core simplification pipeline.
 MPM.addPass(buildModuleSimplificationPipeline(Level, ThinLTOPhase::None,
 // Force any function attributes we want the rest of the pipeline to observe.
 MPM.addPass(ForceFunctionAttrsPass());
 if (PGOOpt && PGOOpt->SamplePGOSupport)
 MPM.addPass(createModuleToFunctionPassAdaptor(AddDiscriminatorsPass()));
+// Apply module pipeline start EP callback.
+for (auto &C : PipelineStartEPCallbacks)
+C(MPM);
 // If we are planning to perform ThinLTO later, we don't bloat the code with
 // unrolling/vectorization/... now. Just simplify the module as much as we
 // can.
 MPM.addPass(buildModuleSimplificationPipeline(Level, ThinLTOPhase::PreLink,
 // Do basic inference of function attributes from known properties of system
 // libraries and other oracles.
 MPM.addPass(InferFunctionAttrsPass());
 if (Level > 1) {
+FunctionPassManager EarlyFPM(DebugLogging);
+EarlyFPM.addPass(CallSiteSplittingPass());
+MPM.addPass(createModuleToFunctionPassAdaptor(std::move(EarlyFPM)));
 // Indirect call promotion. This should promote all the targets that are
 // left by the earlier promotion pass that promotes intra-module targets.
 // This two-step promotion is to save the compile time. For LTO, it should
 // produce the same result as if we only do promotion here.
 MPM.addPass(PGOIndirectCallPromotion(
 true /* InLTO */, PGOOpt && !PGOOpt->SampleProfileFile.empty()));
 // Propagate constants at call sites into the functions they call.  This
 // opens opportunities for globalopt (and inlining) by substituting function
 // pointers passed as arguments to direct uses of functions.
 MPM.addPass(IPSCCPPass());
 // Reduce the code after globalopt and ipsccp.  Both can open up significant
 // simplification opportunities, and both can propagate functions through
 // function pointers.  When this happens, we often have to resolve varargs
 // calls, etc, so let instcombine do this.
 FunctionPassManager PeepholeFPM(DebugLogging);
+if (Level == O3)
+PeepholeFPM.addPass(AggressiveInstCombinePass());
 PeepholeFPM.addPass(InstCombinePass());
 invokePeepholeEPCallbacks(PeepholeFPM, Level);
 MPM.addPass(createModuleToFunctionPassAdaptor(std::move(PeepholeFPM)));
 LoopPassManager LPM(DebugLogging);
 if (!parseLoopPassPipeline(LPM, InnerPipeline, VerifyEachPass,
 DebugLogging))
 return false;
 // Add the nested pass manager with the appropriate adaptor.
-FPM.addPass(createFunctionToLoopPassAdaptor(std::move(LPM)));
+FPM.addPass(
+createFunctionToLoopPassAdaptor(std::move(LPM), DebugLogging));
 return true;
 }
 if (auto Count = parseRepeatPassName(Name)) {
 FunctionPassManager NestedFPM(DebugLogging);
 if (!parseFunctionPassPipeline(NestedFPM, InnerPipeline, VerifyEachPass,

Mercurial > hg > CbC > CbC_llvm

comparison lib/Passes/PassBuilder.cpp @ 134:3a76565eade5 LLVM5.0.1