forked from OSchip/llvm-project
Disable loop peeling during full unrolling pass.
Summary: Peeling should not occur during the full unrolling invocation early in the pipeline, but rather later with partial and runtime loop unrolling. The later loop unrolling invocation will also eventually utilize profile summary and branch frequency information, which we would like to use to control peeling. And for ThinLTO we want to delay peeling until the backend (post thin link) phase, just as we do for most types of unrolling. Ensure peeling doesn't occur during the full unrolling invocation by adding a parameter to the shared implementation function, similar to the way partial and runtime loop unrolling are disabled. Performance results for ThinLTO suggest this has a neutral to positive effect on some internal benchmarks. Reviewers: chandlerc, davidxl Subscribers: mzolotukhin, llvm-commits, mehdi_amini Differential Revision: https://reviews.llvm.org/D36258 llvm-svn: 309966
This commit is contained in:
parent
f58df39529
commit
9a18a6f08b
|
@ -184,7 +184,7 @@ Pass *createLoopInstSimplifyPass();
|
|||
//
|
||||
Pass *createLoopUnrollPass(int OptLevel = 2, int Threshold = -1, int Count = -1,
|
||||
int AllowPartial = -1, int Runtime = -1,
|
||||
int UpperBound = -1);
|
||||
int UpperBound = -1, int AllowPeeling = -1);
|
||||
// Create an unrolling pass for full unrolling that uses exact trip count only.
|
||||
Pass *createSimpleLoopUnrollPass(int OptLevel = 2);
|
||||
|
||||
|
|
|
@ -134,7 +134,7 @@ static TargetTransformInfo::UnrollingPreferences gatherUnrollingPreferences(
|
|||
Loop *L, ScalarEvolution &SE, const TargetTransformInfo &TTI, int OptLevel,
|
||||
Optional<unsigned> UserThreshold, Optional<unsigned> UserCount,
|
||||
Optional<bool> UserAllowPartial, Optional<bool> UserRuntime,
|
||||
Optional<bool> UserUpperBound) {
|
||||
Optional<bool> UserUpperBound, Optional<bool> UserAllowPeeling) {
|
||||
TargetTransformInfo::UnrollingPreferences UP;
|
||||
|
||||
// Set up the defaults
|
||||
|
@ -201,6 +201,8 @@ static TargetTransformInfo::UnrollingPreferences gatherUnrollingPreferences(
|
|||
UP.Runtime = *UserRuntime;
|
||||
if (UserUpperBound.hasValue())
|
||||
UP.UpperBound = *UserUpperBound;
|
||||
if (UserAllowPeeling.hasValue())
|
||||
UP.AllowPeeling = *UserAllowPeeling;
|
||||
|
||||
return UP;
|
||||
}
|
||||
|
@ -927,15 +929,13 @@ static bool computeUnrollCount(
|
|||
return ExplicitUnroll;
|
||||
}
|
||||
|
||||
static bool tryToUnrollLoop(Loop *L, DominatorTree &DT, LoopInfo *LI,
|
||||
ScalarEvolution &SE, const TargetTransformInfo &TTI,
|
||||
AssumptionCache &AC, OptimizationRemarkEmitter &ORE,
|
||||
bool PreserveLCSSA, int OptLevel,
|
||||
Optional<unsigned> ProvidedCount,
|
||||
Optional<unsigned> ProvidedThreshold,
|
||||
Optional<bool> ProvidedAllowPartial,
|
||||
Optional<bool> ProvidedRuntime,
|
||||
Optional<bool> ProvidedUpperBound) {
|
||||
static bool tryToUnrollLoop(
|
||||
Loop *L, DominatorTree &DT, LoopInfo *LI, ScalarEvolution &SE,
|
||||
const TargetTransformInfo &TTI, AssumptionCache &AC,
|
||||
OptimizationRemarkEmitter &ORE, bool PreserveLCSSA, int OptLevel,
|
||||
Optional<unsigned> ProvidedCount, Optional<unsigned> ProvidedThreshold,
|
||||
Optional<bool> ProvidedAllowPartial, Optional<bool> ProvidedRuntime,
|
||||
Optional<bool> ProvidedUpperBound, Optional<bool> ProvidedAllowPeeling) {
|
||||
DEBUG(dbgs() << "Loop Unroll: F[" << L->getHeader()->getParent()->getName()
|
||||
<< "] Loop %" << L->getHeader()->getName() << "\n");
|
||||
if (HasUnrollDisablePragma(L))
|
||||
|
@ -951,7 +951,8 @@ static bool tryToUnrollLoop(Loop *L, DominatorTree &DT, LoopInfo *LI,
|
|||
bool Convergent;
|
||||
TargetTransformInfo::UnrollingPreferences UP = gatherUnrollingPreferences(
|
||||
L, SE, TTI, OptLevel, ProvidedThreshold, ProvidedCount,
|
||||
ProvidedAllowPartial, ProvidedRuntime, ProvidedUpperBound);
|
||||
ProvidedAllowPartial, ProvidedRuntime, ProvidedUpperBound,
|
||||
ProvidedAllowPeeling);
|
||||
// Exit early if unrolling is disabled.
|
||||
if (UP.Threshold == 0 && (!UP.Partial || UP.PartialThreshold == 0))
|
||||
return false;
|
||||
|
@ -1053,10 +1054,12 @@ public:
|
|||
LoopUnroll(int OptLevel = 2, Optional<unsigned> Threshold = None,
|
||||
Optional<unsigned> Count = None,
|
||||
Optional<bool> AllowPartial = None, Optional<bool> Runtime = None,
|
||||
Optional<bool> UpperBound = None)
|
||||
Optional<bool> UpperBound = None,
|
||||
Optional<bool> AllowPeeling = None)
|
||||
: LoopPass(ID), OptLevel(OptLevel), ProvidedCount(std::move(Count)),
|
||||
ProvidedThreshold(Threshold), ProvidedAllowPartial(AllowPartial),
|
||||
ProvidedRuntime(Runtime), ProvidedUpperBound(UpperBound) {
|
||||
ProvidedRuntime(Runtime), ProvidedUpperBound(UpperBound),
|
||||
ProvidedAllowPeeling(AllowPeeling) {
|
||||
initializeLoopUnrollPass(*PassRegistry::getPassRegistry());
|
||||
}
|
||||
|
||||
|
@ -1066,6 +1069,7 @@ public:
|
|||
Optional<bool> ProvidedAllowPartial;
|
||||
Optional<bool> ProvidedRuntime;
|
||||
Optional<bool> ProvidedUpperBound;
|
||||
Optional<bool> ProvidedAllowPeeling;
|
||||
|
||||
bool runOnLoop(Loop *L, LPPassManager &) override {
|
||||
if (skipLoop(L))
|
||||
|
@ -1088,7 +1092,7 @@ public:
|
|||
return tryToUnrollLoop(L, DT, LI, SE, TTI, AC, ORE, PreserveLCSSA, OptLevel,
|
||||
ProvidedCount, ProvidedThreshold,
|
||||
ProvidedAllowPartial, ProvidedRuntime,
|
||||
ProvidedUpperBound);
|
||||
ProvidedUpperBound, ProvidedAllowPeeling);
|
||||
}
|
||||
|
||||
/// This transformation requires natural loop information & requires that
|
||||
|
@ -1112,8 +1116,8 @@ INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
|
|||
INITIALIZE_PASS_END(LoopUnroll, "loop-unroll", "Unroll loops", false, false)
|
||||
|
||||
Pass *llvm::createLoopUnrollPass(int OptLevel, int Threshold, int Count,
|
||||
int AllowPartial, int Runtime,
|
||||
int UpperBound) {
|
||||
int AllowPartial, int Runtime, int UpperBound,
|
||||
int AllowPeeling) {
|
||||
// TODO: It would make more sense for this function to take the optionals
|
||||
// directly, but that's dangerous since it would silently break out of tree
|
||||
// callers.
|
||||
|
@ -1122,11 +1126,12 @@ Pass *llvm::createLoopUnrollPass(int OptLevel, int Threshold, int Count,
|
|||
Count == -1 ? None : Optional<unsigned>(Count),
|
||||
AllowPartial == -1 ? None : Optional<bool>(AllowPartial),
|
||||
Runtime == -1 ? None : Optional<bool>(Runtime),
|
||||
UpperBound == -1 ? None : Optional<bool>(UpperBound));
|
||||
UpperBound == -1 ? None : Optional<bool>(UpperBound),
|
||||
AllowPeeling == -1 ? None : Optional<bool>(AllowPeeling));
|
||||
}
|
||||
|
||||
Pass *llvm::createSimpleLoopUnrollPass(int OptLevel) {
|
||||
return llvm::createLoopUnrollPass(OptLevel, -1, -1, 0, 0, 0);
|
||||
return llvm::createLoopUnrollPass(OptLevel, -1, -1, 0, 0, 0, 0);
|
||||
}
|
||||
|
||||
PreservedAnalyses LoopFullUnrollPass::run(Loop &L, LoopAnalysisManager &AM,
|
||||
|
@ -1156,7 +1161,8 @@ PreservedAnalyses LoopFullUnrollPass::run(Loop &L, LoopAnalysisManager &AM,
|
|||
tryToUnrollLoop(&L, AR.DT, &AR.LI, AR.SE, AR.TTI, AR.AC, *ORE,
|
||||
/*PreserveLCSSA*/ true, OptLevel, /*Count*/ None,
|
||||
/*Threshold*/ None, /*AllowPartial*/ false,
|
||||
/*Runtime*/ false, /*UpperBound*/ false);
|
||||
/*Runtime*/ false, /*UpperBound*/ false,
|
||||
/*AllowPeeling*/ false);
|
||||
if (!Changed)
|
||||
return PreservedAnalyses::all();
|
||||
|
||||
|
@ -1278,7 +1284,8 @@ PreservedAnalyses LoopUnrollPass::run(Function &F,
|
|||
bool CurChanged = tryToUnrollLoop(
|
||||
&L, DT, &LI, SE, TTI, AC, ORE,
|
||||
/*PreserveLCSSA*/ true, OptLevel, /*Count*/ None,
|
||||
/*Threshold*/ None, AllowPartialParam, RuntimeParam, UpperBoundParam);
|
||||
/*Threshold*/ None, AllowPartialParam, RuntimeParam, UpperBoundParam,
|
||||
/*AllowPeeling*/ None);
|
||||
Changed |= CurChanged;
|
||||
|
||||
// The parent must not be damaged by unrolling!
|
||||
|
|
|
@ -1,4 +1,5 @@
|
|||
; RUN: opt < %s -S -debug-only=loop-unroll -loop-unroll 2>&1 | FileCheck %s
|
||||
; RUN: opt < %s -S -debug-only=loop-unroll -passes='require<opt-remark-emit>,unroll' 2>&1 | FileCheck %s
|
||||
; REQUIRES: asserts
|
||||
|
||||
; Make sure we use the profile information correctly to peel-off 3 iterations
|
||||
|
@ -9,6 +10,10 @@
|
|||
; CHECK: Loop Unroll: F[optsize]
|
||||
; CHECK-NOT: PEELING
|
||||
|
||||
; Confirm that no peeling occurs when we are performing full unrolling.
|
||||
; RUN: opt < %s -S -debug-only=loop-unroll -passes='require<opt-remark-emit>,loop(unroll-full)' 2>&1 | FileCheck %s --check-prefix=FULLUNROLL
|
||||
; FULLUNROLL-NOT: PEELING
|
||||
|
||||
; CHECK-LABEL: @basic
|
||||
; CHECK: br i1 %{{.*}}, label %[[NEXT0:.*]], label %for.cond.for.end_crit_edge, !prof !1
|
||||
; CHECK: [[NEXT0]]:
|
||||
|
|
Loading…
Reference in New Issue