mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 20:23:11 +01:00
[LoopUnrollAndJam] Change LoopUnrollAndJamPass to LoopNest pass
This patch changes LoopUnrollAndJamPass from a FunctionPass to a LoopNest pass. The next patch will utilize LoopNest to effectively handle loop nests.

Reviewed By: Whitney

Differential Revision: https://reviews.llvm.org/D99149
This commit is contained in:
parent
56f2b0fa7f
commit
45a93367af
@ -258,7 +258,7 @@ public:
|
|||||||
/// state, this routine will mark that the current loop should be skipped by
|
/// state, this routine will mark that the current loop should be skipped by
|
||||||
/// the rest of the pass management infrastructure.
|
/// the rest of the pass management infrastructure.
|
||||||
void markLoopAsDeleted(Loop &L, llvm::StringRef Name) {
|
void markLoopAsDeleted(Loop &L, llvm::StringRef Name) {
|
||||||
assert((!LoopNestMode || L.isOutermost()) &&
|
assert((!LoopNestMode || CurrentL == &L) &&
|
||||||
"L should be a top-level loop in loop-nest mode.");
|
"L should be a top-level loop in loop-nest mode.");
|
||||||
LAM.clear(L, Name);
|
LAM.clear(L, Name);
|
||||||
assert((&L == CurrentL || CurrentL->contains(&L)) &&
|
assert((&L == CurrentL || CurrentL->contains(&L)) &&
|
||||||
|
@ -10,6 +10,7 @@
|
|||||||
#define LLVM_TRANSFORMS_SCALAR_LOOPUNROLLANDJAMPASS_H
|
#define LLVM_TRANSFORMS_SCALAR_LOOPUNROLLANDJAMPASS_H
|
||||||
|
|
||||||
#include "llvm/IR/PassManager.h"
|
#include "llvm/IR/PassManager.h"
|
||||||
|
#include "llvm/Transforms/Scalar/LoopPassManager.h"
|
||||||
|
|
||||||
namespace llvm {
|
namespace llvm {
|
||||||
class Function;
|
class Function;
|
||||||
@ -20,7 +21,8 @@ class LoopUnrollAndJamPass : public PassInfoMixin<LoopUnrollAndJamPass> {
|
|||||||
|
|
||||||
public:
|
public:
|
||||||
explicit LoopUnrollAndJamPass(int OptLevel = 2) : OptLevel(OptLevel) {}
|
explicit LoopUnrollAndJamPass(int OptLevel = 2) : OptLevel(OptLevel) {}
|
||||||
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
|
PreservedAnalyses run(LoopNest &L, LoopAnalysisManager &AM,
|
||||||
|
LoopStandardAnalysisResults &AR, LPMUpdater &U);
|
||||||
};
|
};
|
||||||
|
|
||||||
} // end namespace llvm
|
} // end namespace llvm
|
||||||
|
@ -1207,7 +1207,8 @@ void PassBuilder::addVectorPasses(OptimizationLevel Level,
|
|||||||
// across the loop nests.
|
// across the loop nests.
|
||||||
// We do UnrollAndJam in a separate LPM to ensure it happens before unroll
|
// We do UnrollAndJam in a separate LPM to ensure it happens before unroll
|
||||||
if (EnableUnrollAndJam && PTO.LoopUnrolling)
|
if (EnableUnrollAndJam && PTO.LoopUnrolling)
|
||||||
FPM.addPass(LoopUnrollAndJamPass(Level.getSpeedupLevel()));
|
FPM.addPass(createFunctionToLoopPassAdaptor(
|
||||||
|
LoopUnrollAndJamPass(Level.getSpeedupLevel())));
|
||||||
FPM.addPass(LoopUnrollPass(LoopUnrollOptions(
|
FPM.addPass(LoopUnrollPass(LoopUnrollOptions(
|
||||||
Level.getSpeedupLevel(), /*OnlyWhenForced=*/!PTO.LoopUnrolling,
|
Level.getSpeedupLevel(), /*OnlyWhenForced=*/!PTO.LoopUnrolling,
|
||||||
PTO.ForgetAllSCEVInLoopUnroll)));
|
PTO.ForgetAllSCEVInLoopUnroll)));
|
||||||
@ -1290,7 +1291,8 @@ void PassBuilder::addVectorPasses(OptimizationLevel Level,
|
|||||||
// across the loop nests.
|
// across the loop nests.
|
||||||
// We do UnrollAndJam in a separate LPM to ensure it happens before unroll
|
// We do UnrollAndJam in a separate LPM to ensure it happens before unroll
|
||||||
if (EnableUnrollAndJam && PTO.LoopUnrolling) {
|
if (EnableUnrollAndJam && PTO.LoopUnrolling) {
|
||||||
FPM.addPass(LoopUnrollAndJamPass(Level.getSpeedupLevel()));
|
FPM.addPass(createFunctionToLoopPassAdaptor(
|
||||||
|
LoopUnrollAndJamPass(Level.getSpeedupLevel())));
|
||||||
}
|
}
|
||||||
FPM.addPass(LoopUnrollPass(LoopUnrollOptions(
|
FPM.addPass(LoopUnrollPass(LoopUnrollOptions(
|
||||||
Level.getSpeedupLevel(), /*OnlyWhenForced=*/!PTO.LoopUnrolling,
|
Level.getSpeedupLevel(), /*OnlyWhenForced=*/!PTO.LoopUnrolling,
|
||||||
|
@ -247,7 +247,6 @@ FUNCTION_PASS("guard-widening", GuardWideningPass())
|
|||||||
FUNCTION_PASS("load-store-vectorizer", LoadStoreVectorizerPass())
|
FUNCTION_PASS("load-store-vectorizer", LoadStoreVectorizerPass())
|
||||||
FUNCTION_PASS("loop-simplify", LoopSimplifyPass())
|
FUNCTION_PASS("loop-simplify", LoopSimplifyPass())
|
||||||
FUNCTION_PASS("loop-sink", LoopSinkPass())
|
FUNCTION_PASS("loop-sink", LoopSinkPass())
|
||||||
FUNCTION_PASS("loop-unroll-and-jam", LoopUnrollAndJamPass())
|
|
||||||
FUNCTION_PASS("loop-flatten", LoopFlattenPass())
|
FUNCTION_PASS("loop-flatten", LoopFlattenPass())
|
||||||
FUNCTION_PASS("lowerinvoke", LowerInvokePass())
|
FUNCTION_PASS("lowerinvoke", LowerInvokePass())
|
||||||
FUNCTION_PASS("lowerswitch", LowerSwitchPass())
|
FUNCTION_PASS("lowerswitch", LowerSwitchPass())
|
||||||
@ -399,6 +398,7 @@ LOOP_PASS("loop-deletion", LoopDeletionPass())
|
|||||||
LOOP_PASS("loop-simplifycfg", LoopSimplifyCFGPass())
|
LOOP_PASS("loop-simplifycfg", LoopSimplifyCFGPass())
|
||||||
LOOP_PASS("loop-reduce", LoopStrengthReducePass())
|
LOOP_PASS("loop-reduce", LoopStrengthReducePass())
|
||||||
LOOP_PASS("indvars", IndVarSimplifyPass())
|
LOOP_PASS("indvars", IndVarSimplifyPass())
|
||||||
|
LOOP_PASS("loop-unroll-and-jam", LoopUnrollAndJamPass())
|
||||||
LOOP_PASS("loop-unroll-full", LoopFullUnrollPass())
|
LOOP_PASS("loop-unroll-full", LoopFullUnrollPass())
|
||||||
LOOP_PASS("print-access-info", LoopAccessInfoPrinterPass(dbgs()))
|
LOOP_PASS("print-access-info", LoopAccessInfoPrinterPass(dbgs()))
|
||||||
LOOP_PASS("print<ddg>", DDGAnalysisPrinterPass(dbgs()))
|
LOOP_PASS("print<ddg>", DDGAnalysisPrinterPass(dbgs()))
|
||||||
|
@ -22,6 +22,7 @@
|
|||||||
#include "llvm/Analysis/DependenceAnalysis.h"
|
#include "llvm/Analysis/DependenceAnalysis.h"
|
||||||
#include "llvm/Analysis/LoopAnalysisManager.h"
|
#include "llvm/Analysis/LoopAnalysisManager.h"
|
||||||
#include "llvm/Analysis/LoopInfo.h"
|
#include "llvm/Analysis/LoopInfo.h"
|
||||||
|
#include "llvm/Analysis/LoopPass.h"
|
||||||
#include "llvm/Analysis/OptimizationRemarkEmitter.h"
|
#include "llvm/Analysis/OptimizationRemarkEmitter.h"
|
||||||
#include "llvm/Analysis/ScalarEvolution.h"
|
#include "llvm/Analysis/ScalarEvolution.h"
|
||||||
#include "llvm/Analysis/TargetTransformInfo.h"
|
#include "llvm/Analysis/TargetTransformInfo.h"
|
||||||
@ -424,35 +425,29 @@ tryToUnrollAndJamLoop(Loop *L, DominatorTree &DT, LoopInfo *LI,
|
|||||||
return UnrollResult;
|
return UnrollResult;
|
||||||
}
|
}
|
||||||
|
|
||||||
static bool tryToUnrollAndJamLoop(Function &F, DominatorTree &DT, LoopInfo &LI,
|
static bool tryToUnrollAndJamLoop(LoopNest &LN, DominatorTree &DT, LoopInfo &LI,
|
||||||
ScalarEvolution &SE,
|
ScalarEvolution &SE,
|
||||||
const TargetTransformInfo &TTI,
|
const TargetTransformInfo &TTI,
|
||||||
AssumptionCache &AC, DependenceInfo &DI,
|
AssumptionCache &AC, DependenceInfo &DI,
|
||||||
OptimizationRemarkEmitter &ORE,
|
OptimizationRemarkEmitter &ORE, int OptLevel,
|
||||||
int OptLevel) {
|
LPMUpdater &U) {
|
||||||
bool DidSomething = false;
|
bool DidSomething = false;
|
||||||
|
ArrayRef<Loop *> Loops = LN.getLoops();
|
||||||
|
Loop *OutmostLoop = &LN.getOutermostLoop();
|
||||||
|
|
||||||
// The loop unroll and jam pass requires loops to be in simplified form, and
|
// Add the loop nests in the reverse order of LN. See method
|
||||||
// also needs LCSSA. Since simplification may add new inner loops, it has to
|
|
||||||
// run before the legality and profitability checks. This means running the
|
|
||||||
// loop unroll and jam pass will simplify all loops, regardless of whether
|
|
||||||
// anything end up being unroll and jammed.
|
|
||||||
for (auto &L : LI) {
|
|
||||||
DidSomething |=
|
|
||||||
simplifyLoop(L, &DT, &LI, &SE, &AC, nullptr, false /* PreserveLCSSA */);
|
|
||||||
DidSomething |= formLCSSARecursively(*L, DT, &LI, &SE);
|
|
||||||
}
|
|
||||||
|
|
||||||
// Add the loop nests in the reverse order of LoopInfo. See method
|
|
||||||
// declaration.
|
// declaration.
|
||||||
SmallPriorityWorklist<Loop *, 4> Worklist;
|
SmallPriorityWorklist<Loop *, 4> Worklist;
|
||||||
appendLoopsToWorklist(LI, Worklist);
|
appendLoopsToWorklist(Loops, Worklist);
|
||||||
while (!Worklist.empty()) {
|
while (!Worklist.empty()) {
|
||||||
Loop *L = Worklist.pop_back_val();
|
Loop *L = Worklist.pop_back_val();
|
||||||
|
std::string LoopName = std::string(L->getName());
|
||||||
LoopUnrollResult Result =
|
LoopUnrollResult Result =
|
||||||
tryToUnrollAndJamLoop(L, DT, &LI, SE, TTI, AC, DI, ORE, OptLevel);
|
tryToUnrollAndJamLoop(L, DT, &LI, SE, TTI, AC, DI, ORE, OptLevel);
|
||||||
if (Result != LoopUnrollResult::Unmodified)
|
if (Result != LoopUnrollResult::Unmodified)
|
||||||
DidSomething = true;
|
DidSomething = true;
|
||||||
|
if (L == OutmostLoop && Result == LoopUnrollResult::FullyUnrolled)
|
||||||
|
U.markLoopAsDeleted(*L, LoopName);
|
||||||
}
|
}
|
||||||
|
|
||||||
return DidSomething;
|
return DidSomething;
|
||||||
@ -460,29 +455,35 @@ static bool tryToUnrollAndJamLoop(Function &F, DominatorTree &DT, LoopInfo &LI,
|
|||||||
|
|
||||||
namespace {
|
namespace {
|
||||||
|
|
||||||
class LoopUnrollAndJam : public FunctionPass {
|
class LoopUnrollAndJam : public LoopPass {
|
||||||
public:
|
public:
|
||||||
static char ID; // Pass ID, replacement for typeid
|
static char ID; // Pass ID, replacement for typeid
|
||||||
unsigned OptLevel;
|
unsigned OptLevel;
|
||||||
|
|
||||||
LoopUnrollAndJam(int OptLevel = 2) : FunctionPass(ID), OptLevel(OptLevel) {
|
LoopUnrollAndJam(int OptLevel = 2) : LoopPass(ID), OptLevel(OptLevel) {
|
||||||
initializeLoopUnrollAndJamPass(*PassRegistry::getPassRegistry());
|
initializeLoopUnrollAndJamPass(*PassRegistry::getPassRegistry());
|
||||||
}
|
}
|
||||||
|
|
||||||
bool runOnFunction(Function &F) override {
|
bool runOnLoop(Loop *L, LPPassManager &LPM) override {
|
||||||
if (skipFunction(F))
|
if (skipLoop(L))
|
||||||
return false;
|
return false;
|
||||||
|
|
||||||
auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
|
auto *F = L->getHeader()->getParent();
|
||||||
LoopInfo &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
|
auto &SE = getAnalysis<ScalarEvolutionWrapperPass>().getSE();
|
||||||
ScalarEvolution &SE = getAnalysis<ScalarEvolutionWrapperPass>().getSE();
|
auto *LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
|
||||||
const TargetTransformInfo &TTI =
|
|
||||||
getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
|
|
||||||
auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
|
|
||||||
auto &DI = getAnalysis<DependenceAnalysisWrapperPass>().getDI();
|
auto &DI = getAnalysis<DependenceAnalysisWrapperPass>().getDI();
|
||||||
|
auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
|
||||||
|
auto &TTI = getAnalysis<TargetTransformInfoWrapperPass>().getTTI(*F);
|
||||||
auto &ORE = getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE();
|
auto &ORE = getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE();
|
||||||
|
auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(*F);
|
||||||
|
|
||||||
return tryToUnrollAndJamLoop(F, DT, LI, SE, TTI, AC, DI, ORE, OptLevel);
|
LoopUnrollResult Result =
|
||||||
|
tryToUnrollAndJamLoop(L, DT, LI, SE, TTI, AC, DI, ORE, OptLevel);
|
||||||
|
|
||||||
|
if (Result == LoopUnrollResult::FullyUnrolled)
|
||||||
|
LPM.markLoopAsDeleted(*L);
|
||||||
|
|
||||||
|
return Result != LoopUnrollResult::Unmodified;
|
||||||
}
|
}
|
||||||
|
|
||||||
/// This transformation requires natural loop information & requires that
|
/// This transformation requires natural loop information & requires that
|
||||||
@ -505,7 +506,10 @@ char LoopUnrollAndJam::ID = 0;
|
|||||||
INITIALIZE_PASS_BEGIN(LoopUnrollAndJam, "loop-unroll-and-jam",
|
INITIALIZE_PASS_BEGIN(LoopUnrollAndJam, "loop-unroll-and-jam",
|
||||||
"Unroll and Jam loops", false, false)
|
"Unroll and Jam loops", false, false)
|
||||||
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
|
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
|
||||||
|
INITIALIZE_PASS_DEPENDENCY(LoopPass)
|
||||||
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
|
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
|
||||||
|
INITIALIZE_PASS_DEPENDENCY(LoopSimplify)
|
||||||
|
INITIALIZE_PASS_DEPENDENCY(LCSSAWrapperPass)
|
||||||
INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)
|
INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)
|
||||||
INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
|
INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
|
||||||
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
|
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
|
||||||
@ -518,19 +522,20 @@ Pass *llvm::createLoopUnrollAndJamPass(int OptLevel) {
|
|||||||
return new LoopUnrollAndJam(OptLevel);
|
return new LoopUnrollAndJam(OptLevel);
|
||||||
}
|
}
|
||||||
|
|
||||||
PreservedAnalyses LoopUnrollAndJamPass::run(Function &F,
|
PreservedAnalyses LoopUnrollAndJamPass::run(LoopNest &LN,
|
||||||
FunctionAnalysisManager &AM) {
|
LoopAnalysisManager &AM,
|
||||||
ScalarEvolution &SE = AM.getResult<ScalarEvolutionAnalysis>(F);
|
LoopStandardAnalysisResults &AR,
|
||||||
LoopInfo &LI = AM.getResult<LoopAnalysis>(F);
|
LPMUpdater &U) {
|
||||||
TargetTransformInfo &TTI = AM.getResult<TargetIRAnalysis>(F);
|
Function &F = *LN.getParent();
|
||||||
AssumptionCache &AC = AM.getResult<AssumptionAnalysis>(F);
|
|
||||||
DominatorTree &DT = AM.getResult<DominatorTreeAnalysis>(F);
|
|
||||||
DependenceInfo &DI = AM.getResult<DependenceAnalysis>(F);
|
|
||||||
OptimizationRemarkEmitter &ORE =
|
|
||||||
AM.getResult<OptimizationRemarkEmitterAnalysis>(F);
|
|
||||||
|
|
||||||
if (!tryToUnrollAndJamLoop(F, DT, LI, SE, TTI, AC, DI, ORE, OptLevel))
|
DependenceInfo DI(&F, &AR.AA, &AR.SE, &AR.LI);
|
||||||
|
OptimizationRemarkEmitter ORE(&F);
|
||||||
|
|
||||||
|
if (!tryToUnrollAndJamLoop(LN, AR.DT, AR.LI, AR.SE, AR.TTI, AR.AC, DI, ORE,
|
||||||
|
OptLevel, U))
|
||||||
return PreservedAnalyses::all();
|
return PreservedAnalyses::all();
|
||||||
|
|
||||||
return getLoopPassPreservedAnalyses();
|
auto PA = getLoopPassPreservedAnalyses();
|
||||||
|
PA.preserve<LoopNestAnalysis>();
|
||||||
|
return PA;
|
||||||
}
|
}
|
||||||
|
@ -1,5 +1,5 @@
|
|||||||
; RUN: opt -loop-unroll-and-jam -allow-unroll-and-jam -verify-loop-info < %s -S | FileCheck %s
|
; RUN: opt -loop-unroll-and-jam -allow-unroll-and-jam -verify-loop-info < %s -S | FileCheck %s
|
||||||
; RUN: opt -passes='loop-unroll-and-jam,verify<loops>' -allow-unroll-and-jam < %s -S | FileCheck %s
|
; RUN: opt -passes='loop(loop-unroll-and-jam),verify<loops>' -allow-unroll-and-jam < %s -S | FileCheck %s
|
||||||
|
|
||||||
; Check that the newly created loops do not fail to be added to LI
|
; Check that the newly created loops do not fail to be added to LI
|
||||||
; This test deliberately disables UnJ on the middle loop, performing it instead on the
|
; This test deliberately disables UnJ on the middle loop, performing it instead on the
|
||||||
|
Loading…
Reference in New Issue
Block a user