123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840 |
- //===------ RegisterPasses.cpp - Add the Polly Passes to default passes --===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // This file composes the individual LLVM-IR passes provided by Polly to a
- // functional polyhedral optimizer. The polyhedral optimizer is automatically
- // made available to LLVM based compilers by loading the Polly shared library
- // into such a compiler.
- //
- // The Polly optimizer is made available by executing a static constructor that
- // registers the individual Polly passes in the LLVM pass manager builder. The
- // passes are registered such that the default behaviour of the compiler is not
- // changed, but that the flag '-polly' provided at optimization level '-O3'
- // enables additional polyhedral optimizations.
- //===----------------------------------------------------------------------===//
- #include "polly/RegisterPasses.h"
- #include "polly/Canonicalization.h"
- #include "polly/CodeGen/CodeGeneration.h"
- #include "polly/CodeGen/CodegenCleanup.h"
- #include "polly/CodeGen/IslAst.h"
- #include "polly/CodePreparation.h"
- #include "polly/DeLICM.h"
- #include "polly/DeadCodeElimination.h"
- #include "polly/DependenceInfo.h"
- #include "polly/ForwardOpTree.h"
- #include "polly/JSONExporter.h"
- #include "polly/LinkAllPasses.h"
- #include "polly/PolyhedralInfo.h"
- #include "polly/PruneUnprofitable.h"
- #include "polly/ScheduleOptimizer.h"
- #include "polly/ScopDetection.h"
- #include "polly/ScopInfo.h"
- #include "polly/Simplify.h"
- #include "polly/Support/DumpFunctionPass.h"
- #include "polly/Support/DumpModulePass.h"
- #include "llvm/Analysis/CFGPrinter.h"
- #include "llvm/IR/LegacyPassManager.h"
- #include "llvm/IR/Verifier.h"
- #include "llvm/Passes/PassBuilder.h"
- #include "llvm/Passes/PassPlugin.h"
- #include "llvm/Support/CommandLine.h"
- #include "llvm/Support/TargetSelect.h"
- #include "llvm/Transforms/IPO.h"
- #include "llvm/Transforms/IPO/PassManagerBuilder.h"
- using namespace llvm;
- using namespace polly;
- cl::OptionCategory PollyCategory("Polly Options",
- "Configure the polly loop optimizer");
- static cl::opt<bool>
- PollyEnabled("polly",
- cl::desc("Enable the polly optimizer (with -O1, -O2 or -O3)"),
- cl::init(false), cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool> PollyDetectOnly(
- "polly-only-scop-detection",
- cl::desc("Only run scop detection, but no other optimizations"),
- cl::init(false), cl::ZeroOrMore, cl::cat(PollyCategory));
- enum PassPositionChoice {
- POSITION_EARLY,
- POSITION_AFTER_LOOPOPT,
- POSITION_BEFORE_VECTORIZER
- };
- enum OptimizerChoice { OPTIMIZER_NONE, OPTIMIZER_ISL };
- static cl::opt<PassPositionChoice> PassPosition(
- "polly-position", cl::desc("Where to run polly in the pass pipeline"),
- cl::values(
- clEnumValN(POSITION_EARLY, "early", "Before everything"),
- clEnumValN(POSITION_AFTER_LOOPOPT, "after-loopopt",
- "After the loop optimizer (but within the inline cycle)"),
- clEnumValN(POSITION_BEFORE_VECTORIZER, "before-vectorizer",
- "Right before the vectorizer")),
- cl::Hidden, cl::init(POSITION_BEFORE_VECTORIZER), cl::ZeroOrMore,
- cl::cat(PollyCategory));
- static cl::opt<OptimizerChoice>
- Optimizer("polly-optimizer", cl::desc("Select the scheduling optimizer"),
- cl::values(clEnumValN(OPTIMIZER_NONE, "none", "No optimizer"),
- clEnumValN(OPTIMIZER_ISL, "isl",
- "The isl scheduling optimizer")),
- cl::Hidden, cl::init(OPTIMIZER_ISL), cl::ZeroOrMore,
- cl::cat(PollyCategory));
- enum CodeGenChoice { CODEGEN_FULL, CODEGEN_AST, CODEGEN_NONE };
- static cl::opt<CodeGenChoice> CodeGeneration(
- "polly-code-generation", cl::desc("How much code-generation to perform"),
- cl::values(clEnumValN(CODEGEN_FULL, "full", "AST and IR generation"),
- clEnumValN(CODEGEN_AST, "ast", "Only AST generation"),
- clEnumValN(CODEGEN_NONE, "none", "No code generation")),
- cl::Hidden, cl::init(CODEGEN_FULL), cl::ZeroOrMore, cl::cat(PollyCategory));
- enum TargetChoice { TARGET_CPU, TARGET_GPU, TARGET_HYBRID };
- static cl::opt<TargetChoice>
- Target("polly-target", cl::desc("The hardware to target"),
- cl::values(clEnumValN(TARGET_CPU, "cpu", "generate CPU code")
- #ifdef GPU_CODEGEN
- ,
- clEnumValN(TARGET_GPU, "gpu", "generate GPU code"),
- clEnumValN(TARGET_HYBRID, "hybrid",
- "generate GPU code (preferably) or CPU code")
- #endif
- ),
- cl::init(TARGET_CPU), cl::ZeroOrMore, cl::cat(PollyCategory));
- VectorizerChoice polly::PollyVectorizerChoice;
- static cl::opt<polly::VectorizerChoice, true> Vectorizer(
- "polly-vectorizer", cl::desc("Select the vectorization strategy"),
- cl::values(
- clEnumValN(polly::VECTORIZER_NONE, "none", "No Vectorization"),
- clEnumValN(polly::VECTORIZER_POLLY, "polly",
- "Polly internal vectorizer"),
- clEnumValN(
- polly::VECTORIZER_STRIPMINE, "stripmine",
- "Strip-mine outer loops for the loop-vectorizer to trigger")),
- cl::location(PollyVectorizerChoice), cl::init(polly::VECTORIZER_NONE),
- cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool> ImportJScop(
- "polly-import",
- cl::desc("Import the polyhedral description of the detected Scops"),
- cl::Hidden, cl::init(false), cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool> FullyIndexedStaticExpansion(
- "polly-enable-mse",
- cl::desc("Fully expand the memory accesses of the detected Scops"),
- cl::Hidden, cl::init(false), cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool> ExportJScop(
- "polly-export",
- cl::desc("Export the polyhedral description of the detected Scops"),
- cl::Hidden, cl::init(false), cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool> DeadCodeElim("polly-run-dce",
- cl::desc("Run the dead code elimination"),
- cl::Hidden, cl::init(false), cl::ZeroOrMore,
- cl::cat(PollyCategory));
- static cl::opt<bool> PollyViewer(
- "polly-show",
- cl::desc("Highlight the code regions that will be optimized in a "
- "(CFG BBs and LLVM-IR instructions)"),
- cl::init(false), cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool> PollyOnlyViewer(
- "polly-show-only",
- cl::desc("Highlight the code regions that will be optimized in "
- "a (CFG only BBs)"),
- cl::init(false), cl::cat(PollyCategory));
- static cl::opt<bool>
- PollyPrinter("polly-dot", cl::desc("Enable the Polly DOT printer in -O3"),
- cl::Hidden, cl::value_desc("Run the Polly DOT printer at -O3"),
- cl::init(false), cl::cat(PollyCategory));
- static cl::opt<bool> PollyOnlyPrinter(
- "polly-dot-only",
- cl::desc("Enable the Polly DOT printer in -O3 (no BB content)"), cl::Hidden,
- cl::value_desc("Run the Polly DOT printer at -O3 (no BB content"),
- cl::init(false), cl::cat(PollyCategory));
- static cl::opt<bool>
- CFGPrinter("polly-view-cfg",
- cl::desc("Show the Polly CFG right after code generation"),
- cl::Hidden, cl::init(false), cl::cat(PollyCategory));
- static cl::opt<bool>
- EnablePolyhedralInfo("polly-enable-polyhedralinfo",
- cl::desc("Enable polyhedral interface of Polly"),
- cl::Hidden, cl::init(false), cl::cat(PollyCategory));
- static cl::opt<bool>
- EnableForwardOpTree("polly-enable-optree",
- cl::desc("Enable operand tree forwarding"), cl::Hidden,
- cl::init(true), cl::cat(PollyCategory));
- static cl::opt<bool>
- DumpBefore("polly-dump-before",
- cl::desc("Dump module before Polly transformations into a file "
- "suffixed with \"-before\""),
- cl::init(false), cl::cat(PollyCategory));
- static cl::list<std::string> DumpBeforeFile(
- "polly-dump-before-file",
- cl::desc("Dump module before Polly transformations to the given file"),
- cl::cat(PollyCategory));
- static cl::opt<bool>
- DumpAfter("polly-dump-after",
- cl::desc("Dump module after Polly transformations into a file "
- "suffixed with \"-after\""),
- cl::init(false), cl::cat(PollyCategory));
- static cl::list<std::string> DumpAfterFile(
- "polly-dump-after-file",
- cl::desc("Dump module after Polly transformations to the given file"),
- cl::ZeroOrMore, cl::cat(PollyCategory));
- static cl::opt<bool>
- EnableDeLICM("polly-enable-delicm",
- cl::desc("Eliminate scalar loop carried dependences"),
- cl::Hidden, cl::init(true), cl::cat(PollyCategory));
- static cl::opt<bool>
- EnableSimplify("polly-enable-simplify",
- cl::desc("Simplify SCoP after optimizations"),
- cl::init(true), cl::cat(PollyCategory));
- static cl::opt<bool> EnablePruneUnprofitable(
- "polly-enable-prune-unprofitable",
- cl::desc("Bail out on unprofitable SCoPs before rescheduling"), cl::Hidden,
- cl::init(true), cl::cat(PollyCategory));
- namespace {
- /// Initialize Polly passes when library is loaded.
- ///
- /// We use the constructor of a statically declared object to initialize the
- /// different Polly passes right after the Polly library is loaded. This ensures
- /// that the Polly passes are available e.g. in the 'opt' tool.
- class StaticInitializer {
- public:
- StaticInitializer() {
- llvm::PassRegistry &Registry = *llvm::PassRegistry::getPassRegistry();
- polly::initializePollyPasses(Registry);
- }
- };
- static StaticInitializer InitializeEverything;
- } // end of anonymous namespace.
- namespace polly {
- void initializePollyPasses(PassRegistry &Registry) {
- initializeCodeGenerationPass(Registry);
- #ifdef GPU_CODEGEN
- initializePPCGCodeGenerationPass(Registry);
- initializeManagedMemoryRewritePassPass(Registry);
- LLVMInitializeNVPTXTarget();
- LLVMInitializeNVPTXTargetInfo();
- LLVMInitializeNVPTXTargetMC();
- LLVMInitializeNVPTXAsmPrinter();
- #endif
- initializeCodePreparationPass(Registry);
- initializeDeadCodeElimWrapperPassPass(Registry);
- initializeDependenceInfoPass(Registry);
- initializeDependenceInfoWrapperPassPass(Registry);
- initializeJSONExporterPass(Registry);
- initializeJSONImporterPass(Registry);
- initializeMaximalStaticExpanderPass(Registry);
- initializeIslAstInfoWrapperPassPass(Registry);
- initializeIslScheduleOptimizerWrapperPassPass(Registry);
- initializePollyCanonicalizePass(Registry);
- initializePolyhedralInfoPass(Registry);
- initializeScopDetectionWrapperPassPass(Registry);
- initializeScopInlinerPass(Registry);
- initializeScopInfoRegionPassPass(Registry);
- initializeScopInfoWrapperPassPass(Registry);
- initializeCodegenCleanupPass(Registry);
- initializeFlattenSchedulePass(Registry);
- initializeForwardOpTreeWrapperPassPass(Registry);
- initializeDeLICMWrapperPassPass(Registry);
- initializeSimplifyWrapperPassPass(Registry);
- initializeDumpModuleWrapperPassPass(Registry);
- initializePruneUnprofitableWrapperPassPass(Registry);
- }
- /// Register Polly passes such that they form a polyhedral optimizer.
- ///
- /// The individual Polly passes are registered in the pass manager such that
- /// they form a full polyhedral optimizer. The flow of the optimizer starts with
- /// a set of preparing transformations that canonicalize the LLVM-IR such that
- /// the LLVM-IR is easier for us to understand and to optimizes. On the
- /// canonicalized LLVM-IR we first run the ScopDetection pass, which detects
- /// static control flow regions. Those regions are then translated by the
- /// ScopInfo pass into a polyhedral representation. As a next step, a scheduling
- /// optimizer is run on the polyhedral representation and finally the optimized
- /// polyhedral representation is code generated back to LLVM-IR.
- ///
- /// Besides this core functionality, we optionally schedule passes that provide
- /// a graphical view of the scops (Polly[Only]Viewer, Polly[Only]Printer), that
- /// allow the export/import of the polyhedral representation
- /// (JSCON[Exporter|Importer]) or that show the cfg after code generation.
- ///
- /// For certain parts of the Polly optimizer, several alternatives are provided:
- ///
- /// As scheduling optimizer we support the isl scheduling optimizer
- /// (http://freecode.com/projects/isl).
- /// It is also possible to run Polly with no optimizer. This mode is mainly
- /// provided to analyze the run and compile time changes caused by the
- /// scheduling optimizer.
- ///
- /// Polly supports the isl internal code generator.
- static void registerPollyPasses(llvm::legacy::PassManagerBase &PM,
- bool EnableForOpt) {
- if (DumpBefore)
- PM.add(polly::createDumpModuleWrapperPass("-before", true));
- for (auto &Filename : DumpBeforeFile)
- PM.add(polly::createDumpModuleWrapperPass(Filename, false));
- PM.add(polly::createCodePreparationPass());
- PM.add(polly::createScopDetectionWrapperPassPass());
- if (PollyDetectOnly)
- return;
- if (PollyViewer)
- PM.add(polly::createDOTViewerPass());
- if (PollyOnlyViewer)
- PM.add(polly::createDOTOnlyViewerPass());
- if (PollyPrinter)
- PM.add(polly::createDOTPrinterPass());
- if (PollyOnlyPrinter)
- PM.add(polly::createDOTOnlyPrinterPass());
- PM.add(polly::createScopInfoRegionPassPass());
- if (EnablePolyhedralInfo)
- PM.add(polly::createPolyhedralInfoPass());
- if (EnableSimplify)
- PM.add(polly::createSimplifyWrapperPass(0));
- if (EnableForwardOpTree)
- PM.add(polly::createForwardOpTreeWrapperPass());
- if (EnableDeLICM)
- PM.add(polly::createDeLICMWrapperPass());
- if (EnableSimplify)
- PM.add(polly::createSimplifyWrapperPass(1));
- if (ImportJScop)
- PM.add(polly::createJSONImporterPass());
- if (DeadCodeElim)
- PM.add(polly::createDeadCodeElimWrapperPass());
- if (FullyIndexedStaticExpansion)
- PM.add(polly::createMaximalStaticExpansionPass());
- if (EnablePruneUnprofitable)
- PM.add(polly::createPruneUnprofitableWrapperPass());
- #ifdef GPU_CODEGEN
- if (Target == TARGET_HYBRID)
- PM.add(
- polly::createPPCGCodeGenerationPass(GPUArchChoice, GPURuntimeChoice));
- #endif
- if (Target == TARGET_CPU || Target == TARGET_HYBRID)
- switch (Optimizer) {
- case OPTIMIZER_NONE:
- break; /* Do nothing */
- case OPTIMIZER_ISL:
- PM.add(polly::createIslScheduleOptimizerWrapperPass());
- break;
- }
- if (ExportJScop)
- PM.add(polly::createJSONExporterPass());
- if (!EnableForOpt)
- return;
- if (Target == TARGET_CPU || Target == TARGET_HYBRID)
- switch (CodeGeneration) {
- case CODEGEN_AST:
- PM.add(polly::createIslAstInfoWrapperPassPass());
- break;
- case CODEGEN_FULL:
- PM.add(polly::createCodeGenerationPass());
- break;
- case CODEGEN_NONE:
- break;
- }
- #ifdef GPU_CODEGEN
- else {
- PM.add(
- polly::createPPCGCodeGenerationPass(GPUArchChoice, GPURuntimeChoice));
- PM.add(polly::createManagedMemoryRewritePassPass());
- }
- #endif
- #ifdef GPU_CODEGEN
- if (Target == TARGET_HYBRID)
- PM.add(polly::createManagedMemoryRewritePassPass(GPUArchChoice,
- GPURuntimeChoice));
- #endif
- // FIXME: This dummy ModulePass keeps some programs from miscompiling,
- // probably some not correctly preserved analyses. It acts as a barrier to
- // force all analysis results to be recomputed.
- PM.add(createBarrierNoopPass());
- if (DumpAfter)
- PM.add(polly::createDumpModuleWrapperPass("-after", true));
- for (auto &Filename : DumpAfterFile)
- PM.add(polly::createDumpModuleWrapperPass(Filename, false));
- if (CFGPrinter)
- PM.add(llvm::createCFGPrinterLegacyPassPass());
- }
- static bool shouldEnablePollyForOptimization() { return PollyEnabled; }
- static bool shouldEnablePollyForDiagnostic() {
- // FIXME: PollyTrackFailures is user-controlled, should not be set
- // programmatically.
- if (PollyOnlyPrinter || PollyPrinter || PollyOnlyViewer || PollyViewer)
- PollyTrackFailures = true;
- return PollyOnlyPrinter || PollyPrinter || PollyOnlyViewer || PollyViewer ||
- ExportJScop;
- }
- static void
- registerPollyEarlyAsPossiblePasses(const llvm::PassManagerBuilder &Builder,
- llvm::legacy::PassManagerBase &PM) {
- if (PassPosition != POSITION_EARLY)
- return;
- bool EnableForOpt = shouldEnablePollyForOptimization() &&
- Builder.OptLevel >= 1 && Builder.SizeLevel == 0;
- if (!shouldEnablePollyForDiagnostic() && !EnableForOpt)
- return;
- registerCanonicalicationPasses(PM);
- registerPollyPasses(PM, EnableForOpt);
- }
- static void
- registerPollyLoopOptimizerEndPasses(const llvm::PassManagerBuilder &Builder,
- llvm::legacy::PassManagerBase &PM) {
- if (PassPosition != POSITION_AFTER_LOOPOPT)
- return;
- bool EnableForOpt = shouldEnablePollyForOptimization() &&
- Builder.OptLevel >= 1 && Builder.SizeLevel == 0;
- if (!shouldEnablePollyForDiagnostic() && !EnableForOpt)
- return;
- registerPollyPasses(PM, EnableForOpt);
- if (EnableForOpt)
- PM.add(createCodegenCleanupPass());
- }
- static void
- registerPollyScalarOptimizerLatePasses(const llvm::PassManagerBuilder &Builder,
- llvm::legacy::PassManagerBase &PM) {
- if (PassPosition != POSITION_BEFORE_VECTORIZER)
- return;
- bool EnableForOpt = shouldEnablePollyForOptimization() &&
- Builder.OptLevel >= 1 && Builder.SizeLevel == 0;
- if (!shouldEnablePollyForDiagnostic() && !EnableForOpt)
- return;
- polly::registerPollyPasses(PM, EnableForOpt);
- if (EnableForOpt)
- PM.add(createCodegenCleanupPass());
- }
- /// Add the pass sequence required for Polly to the New Pass Manager.
- ///
- /// @param PM The pass manager itself.
- /// @param Level The optimization level. Used for the cleanup of Polly's
- /// output.
- /// @param EnableForOpt Whether to add Polly IR transformations. If False, only
- /// the analysis passes are added, skipping Polly itself.
- /// The IR may still be modified.
- static void buildCommonPollyPipeline(FunctionPassManager &PM,
- OptimizationLevel Level,
- bool EnableForOpt) {
- PassBuilder PB;
- ScopPassManager SPM;
- PM.addPass(CodePreparationPass());
- // TODO add utility passes for the various command line options, once they're
- // ported
- if (PollyDetectOnly) {
- // Don't add more passes other than the ScopPassManager's detection passes.
- PM.addPass(createFunctionToScopPassAdaptor(std::move(SPM)));
- return;
- }
- if (PollyViewer)
- report_fatal_error("Option -polly-show not supported with NPM", false);
- if (PollyOnlyViewer)
- report_fatal_error("Option -polly-show-only not supported with NPM", false);
- if (PollyPrinter)
- report_fatal_error("Option -polly-dot not supported with NPM", false);
- if (PollyOnlyPrinter)
- report_fatal_error("Option -polly-dot-only not supported with NPM", false);
- if (EnablePolyhedralInfo)
- report_fatal_error(
- "Option -polly-enable-polyhedralinfo not supported with NPM", false);
- if (EnableSimplify)
- SPM.addPass(SimplifyPass(0));
- if (EnableForwardOpTree)
- SPM.addPass(ForwardOpTreePass());
- if (EnableDeLICM)
- SPM.addPass(DeLICMPass());
- if (EnableSimplify)
- SPM.addPass(SimplifyPass(1));
- if (ImportJScop)
- SPM.addPass(JSONImportPass());
- if (DeadCodeElim)
- SPM.addPass(DeadCodeElimPass());
- if (FullyIndexedStaticExpansion)
- report_fatal_error("Option -polly-enable-mse not supported with NPM",
- false);
- if (EnablePruneUnprofitable)
- SPM.addPass(PruneUnprofitablePass());
- if (Target == TARGET_CPU || Target == TARGET_HYBRID) {
- switch (Optimizer) {
- case OPTIMIZER_NONE:
- break; /* Do nothing */
- case OPTIMIZER_ISL:
- SPM.addPass(IslScheduleOptimizerPass());
- break;
- }
- }
- if (ExportJScop)
- report_fatal_error("Option -polly-export not supported with NPM", false);
- if (!EnableForOpt)
- return;
- if (Target == TARGET_CPU || Target == TARGET_HYBRID) {
- switch (CodeGeneration) {
- case CODEGEN_AST:
- SPM.addPass(
- RequireAnalysisPass<IslAstAnalysis, Scop, ScopAnalysisManager,
- ScopStandardAnalysisResults &, SPMUpdater &>());
- break;
- case CODEGEN_FULL:
- SPM.addPass(CodeGenerationPass());
- break;
- case CODEGEN_NONE:
- break;
- }
- }
- #ifdef GPU_CODEGEN
- else
- report_fatal_error("Option -polly-target=gpu not supported for NPM", false);
- #endif
- #ifdef GPU_CODEGEN
- if (Target == TARGET_HYBRID)
- report_fatal_error("Option -polly-target=hybrid not supported for NPM",
- false);
- #endif
- PM.addPass(createFunctionToScopPassAdaptor(std::move(SPM)));
- PM.addPass(PB.buildFunctionSimplificationPipeline(
- Level, ThinOrFullLTOPhase::None)); // Cleanup
- if (CFGPrinter)
- PM.addPass(llvm::CFGPrinterPass());
- }
- static void buildEarlyPollyPipeline(ModulePassManager &MPM,
- OptimizationLevel Level) {
- bool EnableForOpt =
- shouldEnablePollyForOptimization() && Level.isOptimizingForSpeed();
- if (!shouldEnablePollyForDiagnostic() && !EnableForOpt)
- return;
- FunctionPassManager FPM = buildCanonicalicationPassesForNPM(MPM, Level);
- if (DumpBefore || !DumpBeforeFile.empty()) {
- MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));
- if (DumpBefore)
- MPM.addPass(DumpModulePass("-before", true));
- for (auto &Filename : DumpBeforeFile)
- MPM.addPass(DumpModulePass(Filename, false));
- FPM = FunctionPassManager();
- }
- buildCommonPollyPipeline(FPM, Level, EnableForOpt);
- MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));
- if (DumpAfter)
- MPM.addPass(DumpModulePass("-after", true));
- for (auto &Filename : DumpAfterFile)
- MPM.addPass(DumpModulePass(Filename, false));
- }
- static void buildLatePollyPipeline(FunctionPassManager &PM,
- OptimizationLevel Level) {
- bool EnableForOpt =
- shouldEnablePollyForOptimization() && Level.isOptimizingForSpeed();
- if (!shouldEnablePollyForDiagnostic() && !EnableForOpt)
- return;
- if (DumpBefore)
- PM.addPass(DumpFunctionPass("-before"));
- if (!DumpBeforeFile.empty())
- report_fatal_error("Option -polly-dump-before-file at -polly-position=late "
- "not supported with NPM",
- false);
- buildCommonPollyPipeline(PM, Level, EnableForOpt);
- if (DumpAfter)
- PM.addPass(DumpFunctionPass("-after"));
- if (!DumpAfterFile.empty())
- report_fatal_error("Option -polly-dump-after-file at -polly-position=late "
- "not supported with NPM",
- false);
- }
- /// Register Polly to be available as an optimizer
- ///
- ///
- /// We can currently run Polly at three different points int the pass manager.
- /// a) very early, b) after the canonicalizing loop transformations and c) right
- /// before the vectorizer.
- ///
- /// The default is currently a), to register Polly such that it runs as early as
- /// possible. This has several implications:
- ///
- /// 1) We need to schedule more canonicalization passes
- ///
- /// As nothing is run before Polly, it is necessary to run a set of preparing
- /// transformations before Polly to canonicalize the LLVM-IR and to allow
- /// Polly to detect and understand the code.
- ///
- /// 2) LICM and LoopIdiom pass have not yet been run
- ///
- /// Loop invariant code motion as well as the loop idiom recognition pass make
- /// it more difficult for Polly to transform code. LICM may introduce
- /// additional data dependences that are hard to eliminate and the loop idiom
- /// recognition pass may introduce calls to memset that we currently do not
- /// understand. By running Polly early enough (meaning before these passes) we
- /// avoid difficulties that may be introduced by these passes.
- ///
- /// 3) We get the full -O3 optimization sequence after Polly
- ///
- /// The LLVM-IR that is generated by Polly has been optimized on a high level,
- /// but it may be rather inefficient on the lower/scalar level. By scheduling
- /// Polly before all other passes, we have the full sequence of -O3
- /// optimizations behind us, such that inefficiencies on the low level can
- /// be optimized away.
- ///
- /// We are currently evaluating the benefit or running Polly at position b) or
- /// c). b) is likely too early as it interacts with the inliner. c) is nice
- /// as everything is fully inlined and canonicalized, but we need to be able
- /// to handle LICMed code to make it useful.
- static llvm::RegisterStandardPasses RegisterPollyOptimizerEarly(
- llvm::PassManagerBuilder::EP_ModuleOptimizerEarly,
- registerPollyEarlyAsPossiblePasses);
- static llvm::RegisterStandardPasses
- RegisterPollyOptimizerLoopEnd(llvm::PassManagerBuilder::EP_LoopOptimizerEnd,
- registerPollyLoopOptimizerEndPasses);
- static llvm::RegisterStandardPasses RegisterPollyOptimizerScalarLate(
- llvm::PassManagerBuilder::EP_VectorizerStart,
- registerPollyScalarOptimizerLatePasses);
- static OwningScopAnalysisManagerFunctionProxy
- createScopAnalyses(FunctionAnalysisManager &FAM,
- PassInstrumentationCallbacks *PIC) {
- OwningScopAnalysisManagerFunctionProxy Proxy;
- #define SCOP_ANALYSIS(NAME, CREATE_PASS) \
- Proxy.getManager().registerPass([PIC] { \
- (void)PIC; \
- return CREATE_PASS; \
- });
- #include "PollyPasses.def"
- Proxy.getManager().registerPass(
- [&FAM] { return FunctionAnalysisManagerScopProxy(FAM); });
- return Proxy;
- }
- static void registerFunctionAnalyses(FunctionAnalysisManager &FAM,
- PassInstrumentationCallbacks *PIC) {
- #define FUNCTION_ANALYSIS(NAME, CREATE_PASS) \
- FAM.registerPass([] { return CREATE_PASS; });
- #include "PollyPasses.def"
- FAM.registerPass([&FAM, PIC] { return createScopAnalyses(FAM, PIC); });
- }
- static bool
- parseFunctionPipeline(StringRef Name, FunctionPassManager &FPM,
- ArrayRef<PassBuilder::PipelineElement> Pipeline) {
- if (parseAnalysisUtilityPasses<OwningScopAnalysisManagerFunctionProxy>(
- "polly-scop-analyses", Name, FPM))
- return true;
- #define FUNCTION_ANALYSIS(NAME, CREATE_PASS) \
- if (parseAnalysisUtilityPasses< \
- std::remove_reference<decltype(CREATE_PASS)>::type>(NAME, Name, \
- FPM)) \
- return true;
- #define FUNCTION_PASS(NAME, CREATE_PASS) \
- if (Name == NAME) { \
- FPM.addPass(CREATE_PASS); \
- return true; \
- }
- #include "PollyPasses.def"
- return false;
- }
- static bool parseScopPass(StringRef Name, ScopPassManager &SPM,
- PassInstrumentationCallbacks *PIC) {
- #define SCOP_ANALYSIS(NAME, CREATE_PASS) \
- if (parseAnalysisUtilityPasses< \
- std::remove_reference<decltype(CREATE_PASS)>::type>(NAME, Name, \
- SPM)) \
- return true;
- #define SCOP_PASS(NAME, CREATE_PASS) \
- if (Name == NAME) { \
- SPM.addPass(CREATE_PASS); \
- return true; \
- }
- #include "PollyPasses.def"
- return false;
- }
- static bool parseScopPipeline(StringRef Name, FunctionPassManager &FPM,
- PassInstrumentationCallbacks *PIC,
- ArrayRef<PassBuilder::PipelineElement> Pipeline) {
- if (Name != "scop")
- return false;
- if (!Pipeline.empty()) {
- ScopPassManager SPM;
- for (const auto &E : Pipeline)
- if (!parseScopPass(E.Name, SPM, PIC))
- return false;
- FPM.addPass(createFunctionToScopPassAdaptor(std::move(SPM)));
- }
- return true;
- }
- static bool isScopPassName(StringRef Name) {
- #define SCOP_ANALYSIS(NAME, CREATE_PASS) \
- if (Name == "require<" NAME ">") \
- return true; \
- if (Name == "invalidate<" NAME ">") \
- return true;
- #define SCOP_PASS(NAME, CREATE_PASS) \
- if (Name == NAME) \
- return true;
- #include "PollyPasses.def"
- return false;
- }
- static bool
- parseTopLevelPipeline(ModulePassManager &MPM, PassInstrumentationCallbacks *PIC,
- ArrayRef<PassBuilder::PipelineElement> Pipeline) {
- std::vector<PassBuilder::PipelineElement> FullPipeline;
- StringRef FirstName = Pipeline.front().Name;
- if (!isScopPassName(FirstName))
- return false;
- FunctionPassManager FPM;
- ScopPassManager SPM;
- for (auto &Element : Pipeline) {
- auto &Name = Element.Name;
- auto &InnerPipeline = Element.InnerPipeline;
- if (!InnerPipeline.empty()) // Scop passes don't have inner pipelines
- return false;
- if (!parseScopPass(Name, SPM, PIC))
- return false;
- }
- FPM.addPass(createFunctionToScopPassAdaptor(std::move(SPM)));
- MPM.addPass(createModuleToFunctionPassAdaptor(std::move(FPM)));
- return true;
- }
- void registerPollyPasses(PassBuilder &PB) {
- PassInstrumentationCallbacks *PIC = PB.getPassInstrumentationCallbacks();
- PB.registerAnalysisRegistrationCallback([PIC](FunctionAnalysisManager &FAM) {
- registerFunctionAnalyses(FAM, PIC);
- });
- PB.registerPipelineParsingCallback(parseFunctionPipeline);
- PB.registerPipelineParsingCallback(
- [PIC](StringRef Name, FunctionPassManager &FPM,
- ArrayRef<PassBuilder::PipelineElement> Pipeline) -> bool {
- return parseScopPipeline(Name, FPM, PIC, Pipeline);
- });
- PB.registerParseTopLevelPipelineCallback(
- [PIC](ModulePassManager &MPM,
- ArrayRef<PassBuilder::PipelineElement> Pipeline) -> bool {
- return parseTopLevelPipeline(MPM, PIC, Pipeline);
- });
- switch (PassPosition) {
- case POSITION_EARLY:
- PB.registerPipelineStartEPCallback(buildEarlyPollyPipeline);
- break;
- case POSITION_AFTER_LOOPOPT:
- report_fatal_error(
- "Option -polly-position=after-loopopt not supported with NPM", false);
- break;
- case POSITION_BEFORE_VECTORIZER:
- PB.registerVectorizerStartEPCallback(buildLatePollyPipeline);
- break;
- }
- }
- } // namespace polly
- llvm::PassPluginLibraryInfo getPollyPluginInfo() {
- return {LLVM_PLUGIN_API_VERSION, "Polly", LLVM_VERSION_STRING,
- polly::registerPollyPasses};
- }
|