Skip to content

Commit

Permalink
[SCEV] Try to reuse existing value during SCEV expansion
Browse files Browse the repository at this point in the history
Current SCEV expansion will expand SCEV as a sequence of operations
and doesn't utilize the value already existed. This will introduce
redundent computation which may not be cleaned up throughly by
following optimizations.

This patch introduces an ExprValueMap which is a map from SCEV to the
set of equal values with the same SCEV. When a SCEV is expanded, the
set of values is checked and reused whenever possible before generating
a sequence of operations.

Differential Revision: http://reviews.llvm.org/D12090

llvm-svn: 259662
  • Loading branch information
wmi-11 committed Feb 3, 2016
1 parent 38a36c4 commit ed13397
Show file tree
Hide file tree
Showing 12 changed files with 205 additions and 30 deletions.
29 changes: 29 additions & 0 deletions llvm/include/llvm/Analysis/ScalarEvolution.h
Expand Up @@ -23,6 +23,7 @@

#include "llvm/ADT/DenseSet.h"
#include "llvm/ADT/FoldingSet.h"
#include "llvm/ADT/SetVector.h"
#include "llvm/Analysis/LoopInfo.h"
#include "llvm/IR/ConstantRange.h"
#include "llvm/IR/Function.h"
Expand Down Expand Up @@ -382,6 +383,22 @@ namespace llvm {
/// This SCEV is used to represent unknown trip counts and things.
std::unique_ptr<SCEVCouldNotCompute> CouldNotCompute;

/// HasRecMapType - The typedef for HasRecMap.
///
typedef DenseMap<const SCEV *, bool> HasRecMapType;

/// HasRecMap -- This is a cache to record whether a SCEV contains
/// any scAddRecExpr.
HasRecMapType HasRecMap;

/// ExprValueMapType - The typedef for ExprValueMap.
///
typedef DenseMap<const SCEV *, SetVector<Value *>> ExprValueMapType;

/// ExprValueMap -- This map records the original values from which
/// the SCEV expr is generated from.
ExprValueMapType ExprValueMap;

/// The typedef for ValueExprMap.
///
typedef DenseMap<SCEVCallbackVH, const SCEV *, DenseMapInfo<Value *> >
Expand Down Expand Up @@ -821,6 +838,18 @@ namespace llvm {
/// return true. For pointer types, this is the pointer-sized integer type.
Type *getEffectiveSCEVType(Type *Ty) const;

/// containsAddRecurrence - Return true if the SCEV is a scAddRecExpr or
/// it contains scAddRecExpr. The result will be cached in HasRecMap.
///
bool containsAddRecurrence(const SCEV *S);

/// getSCEVValues - Return the Value set from which the SCEV expr is
/// generated.
SetVector<Value *> *getSCEVValues(const SCEV *S);

/// eraseValueFromMap - Erase Value from ValueExprMap and ExprValueMap.
void eraseValueFromMap(Value *V);

/// Return a SCEV expression for the full generality of the specified
/// expression.
const SCEV *getSCEV(Value *V);
Expand Down
90 changes: 86 additions & 4 deletions llvm/lib/Analysis/ScalarEvolution.cpp
Expand Up @@ -115,6 +115,10 @@ MaxBruteForceIterations("scalar-evolution-max-iterations", cl::ReallyHidden,
static cl::opt<bool>
VerifySCEV("verify-scev",
cl::desc("Verify ScalarEvolution's backedge taken counts (slow)"));
static cl::opt<bool>
VerifySCEVMap("verify-scev-maps",
cl::desc("Verify no dangling value in ScalarEvolution's"
"ExprValueMap (slow)"));

//===----------------------------------------------------------------------===//
// SCEV class definitions
Expand Down Expand Up @@ -3310,6 +3314,73 @@ bool ScalarEvolution::checkValidity(const SCEV *S) const {
return !F.FindOne;
}

namespace {
// Helper class working with SCEVTraversal to figure out if a SCEV contains
// a sub SCEV of scAddRecExpr type. FindInvalidSCEVUnknown::FoundOne is set
// iff if such sub scAddRecExpr type SCEV is found.
struct FindAddRecurrence {
bool FoundOne;
FindAddRecurrence() : FoundOne(false) {}

bool follow(const SCEV *S) {
switch (static_cast<SCEVTypes>(S->getSCEVType())) {
case scAddRecExpr:
FoundOne = true;
case scConstant:
case scUnknown:
case scCouldNotCompute:
return false;
default:
return true;
}
}
bool isDone() const { return FoundOne; }
};
}

bool ScalarEvolution::containsAddRecurrence(const SCEV *S) {
HasRecMapType::iterator I = HasRecMap.find_as(S);
if (I != HasRecMap.end())
return I->second;

FindAddRecurrence F;
SCEVTraversal<FindAddRecurrence> ST(F);
ST.visitAll(S);
HasRecMap.insert(std::make_pair(S, F.FoundOne));
return F.FoundOne;
}

/// getSCEVValues - Return the Value set from S.
SetVector<Value *> *ScalarEvolution::getSCEVValues(const SCEV *S) {
ExprValueMapType::iterator SI = ExprValueMap.find_as(S);
if (SI == ExprValueMap.end())
return nullptr;
#ifndef NDEBUG
if (VerifySCEVMap) {
// Check there is no dangling Value in the set returned.
for (const auto &VE : SI->second)
assert(ValueExprMap.count(VE));
}
#endif
return &SI->second;
}

/// eraseValueFromMap - Erase Value from ValueExprMap and ExprValueMap.
/// If ValueExprMap.erase(V) is not used together with forgetMemoizedResults(S),
/// eraseValueFromMap should be used instead to ensure whenever V->S is removed
/// from ValueExprMap, V is also removed from the set of ExprValueMap[S].
void ScalarEvolution::eraseValueFromMap(Value *V) {
ValueExprMapType::iterator I = ValueExprMap.find_as(V);
if (I != ValueExprMap.end()) {
const SCEV *S = I->second;
SetVector<Value *> *SV = getSCEVValues(S);
// Remove V from the set of ExprValueMap[S]
if (SV)
SV->remove(V);
ValueExprMap.erase(V);
}
}

/// getSCEV - Return an existing SCEV if it exists, otherwise analyze the
/// expression and create a new one.
const SCEV *ScalarEvolution::getSCEV(Value *V) {
Expand All @@ -3318,7 +3389,13 @@ const SCEV *ScalarEvolution::getSCEV(Value *V) {
const SCEV *S = getExistingSCEV(V);
if (S == nullptr) {
S = createSCEV(V);
ValueExprMap.insert(std::make_pair(SCEVCallbackVH(V, this), S));
// During PHI resolution, it is possible to create two SCEVs for the same
// V, so it is needed to double check whether V->S is inserted into
// ValueExprMap before insert S->V into ExprValueMap.
std::pair<ValueExprMapType::iterator, bool> Pair =
ValueExprMap.insert(std::make_pair(SCEVCallbackVH(V, this), S));
if (Pair.second)
ExprValueMap[S].insert(V);
}
return S;
}
Expand All @@ -3331,6 +3408,7 @@ const SCEV *ScalarEvolution::getExistingSCEV(Value *V) {
const SCEV *S = I->second;
if (checkValidity(S))
return S;
forgetMemoizedResults(S);
ValueExprMap.erase(I);
}
return nullptr;
Expand Down Expand Up @@ -8967,7 +9045,7 @@ void ScalarEvolution::SCEVCallbackVH::deleted() {
assert(SE && "SCEVCallbackVH called with a null ScalarEvolution!");
if (PHINode *PN = dyn_cast<PHINode>(getValPtr()))
SE->ConstantEvolutionLoopExitValue.erase(PN);
SE->ValueExprMap.erase(getValPtr());
SE->eraseValueFromMap(getValPtr());
// this now dangles!
}

Expand All @@ -8990,13 +9068,13 @@ void ScalarEvolution::SCEVCallbackVH::allUsesReplacedWith(Value *V) {
continue;
if (PHINode *PN = dyn_cast<PHINode>(U))
SE->ConstantEvolutionLoopExitValue.erase(PN);
SE->ValueExprMap.erase(U);
SE->eraseValueFromMap(U);
Worklist.insert(Worklist.end(), U->user_begin(), U->user_end());
}
// Delete the Old value.
if (PHINode *PN = dyn_cast<PHINode>(Old))
SE->ConstantEvolutionLoopExitValue.erase(PN);
SE->ValueExprMap.erase(Old);
SE->eraseValueFromMap(Old);
// this now dangles!
}

Expand Down Expand Up @@ -9046,7 +9124,9 @@ ScalarEvolution::~ScalarEvolution() {
}
FirstUnknown = nullptr;

ExprValueMap.clear();
ValueExprMap.clear();
HasRecMap.clear();

// Free any extra memory created for ExitNotTakenInfo in the unlikely event
// that a loop had multiple computable exits.
Expand Down Expand Up @@ -9375,6 +9455,8 @@ void ScalarEvolution::forgetMemoizedResults(const SCEV *S) {
BlockDispositions.erase(S);
UnsignedRanges.erase(S);
SignedRanges.erase(S);
ExprValueMap.erase(S);
HasRecMap.erase(S);

for (DenseMap<const Loop*, BackedgeTakenInfo>::iterator I =
BackedgeTakenCounts.begin(), E = BackedgeTakenCounts.end(); I != E; ) {
Expand Down
26 changes: 25 additions & 1 deletion llvm/lib/Analysis/ScalarEvolutionExpander.cpp
Expand Up @@ -1600,6 +1600,12 @@ Value *SCEVExpander::expandCodeFor(const SCEV *SH, Type *Ty) {
return V;
}

// The expansion of SCEV will either reuse a previous Value in ExprValueMap,
// or expand the SCEV literally. Specifically, if the expansion is in LSRMode,
// and the SCEV contains any sub scAddRecExpr type SCEV, it will be expanded
// literally, to prevent LSR's transformed SCEV from being reverted. Otherwise,
// the expansion will try to reuse Value from ExprValueMap, and only when it
// fails, expand the SCEV literally.
Value *SCEVExpander::expand(const SCEV *S) {
// Compute an insertion point for this SCEV object. Hoist the instructions
// as far out in the loop nest as possible.
Expand Down Expand Up @@ -1639,7 +1645,25 @@ Value *SCEVExpander::expand(const SCEV *S) {
Builder.SetInsertPoint(InsertPt);

// Expand the expression into instructions.
Value *V = visit(S);
SetVector<Value *> *Set = SE.getSCEVValues(S);
Value *V = nullptr;
// If the expansion is in LSRMode, and the SCEV contains any sub scAddRecExpr
// type SCEV, it will be expanded literally, to prevent LSR's transformed SCEV
// from being reverted.
if (!(LSRMode && SE.containsAddRecurrence(S))) {
if (Set) {
// Choose a Value from the set which dominates the insertPt.
for (auto const &Ent : *Set) {
if (Ent && isa<Instruction>(Ent) && S->getType() == Ent->getType() &&
SE.DT.dominates(cast<Instruction>(Ent), InsertPt)) {
V = Ent;
break;
}
}
}
}
if (!V)
V = visit(S);

// Remember the expanded value for this SCEV at this location.
//
Expand Down
20 changes: 16 additions & 4 deletions llvm/lib/Transforms/Vectorize/LoopVectorize.cpp
Expand Up @@ -2718,6 +2718,10 @@ void InnerLoopVectorizer::emitMinimumIterationCountCheck(Loop *L,

BasicBlock *NewBB = BB->splitBasicBlock(BB->getTerminator(),
"min.iters.checked");
// Update dominator tree immediately if the generated block is a
// LoopBypassBlock because SCEV expansions to generate loop bypass
// checks may query it before the current function is finished.
DT->addNewBlock(NewBB, BB);
if (L->getParentLoop())
L->getParentLoop()->addBasicBlockToLoop(NewBB, *LI);
ReplaceInstWithInst(BB->getTerminator(),
Expand All @@ -2740,6 +2744,10 @@ void InnerLoopVectorizer::emitVectorLoopEnteredCheck(Loop *L,
// adding one to the backedge-taken count will not overflow.
BasicBlock *NewBB = BB->splitBasicBlock(BB->getTerminator(),
"vector.ph");
// Update dominator tree immediately if the generated block is a
// LoopBypassBlock because SCEV expansions to generate loop bypass
// checks may query it before the current function is finished.
DT->addNewBlock(NewBB, BB);
if (L->getParentLoop())
L->getParentLoop()->addBasicBlockToLoop(NewBB, *LI);
ReplaceInstWithInst(BB->getTerminator(),
Expand All @@ -2765,6 +2773,10 @@ void InnerLoopVectorizer::emitSCEVChecks(Loop *L, BasicBlock *Bypass) {
// Create a new block containing the stride check.
BB->setName("vector.scevcheck");
auto *NewBB = BB->splitBasicBlock(BB->getTerminator(), "vector.ph");
// Update dominator tree immediately if the generated block is a
// LoopBypassBlock because SCEV expansions to generate loop bypass
// checks may query it before the current function is finished.
DT->addNewBlock(NewBB, BB);
if (L->getParentLoop())
L->getParentLoop()->addBasicBlockToLoop(NewBB, *LI);
ReplaceInstWithInst(BB->getTerminator(),
Expand All @@ -2790,6 +2802,10 @@ void InnerLoopVectorizer::emitMemRuntimeChecks(Loop *L,
// Create a new block containing the memory check.
BB->setName("vector.memcheck");
auto *NewBB = BB->splitBasicBlock(BB->getTerminator(), "vector.ph");
// Update dominator tree immediately if the generated block is a
// LoopBypassBlock because SCEV expansions to generate loop bypass
// checks may query it before the current function is finished.
DT->addNewBlock(NewBB, BB);
if (L->getParentLoop())
L->getParentLoop()->addBasicBlockToLoop(NewBB, *LI);
ReplaceInstWithInst(BB->getTerminator(),
Expand Down Expand Up @@ -3957,10 +3973,6 @@ void InnerLoopVectorizer::updateAnalysis() {
assert(DT->properlyDominates(LoopBypassBlocks.front(), LoopExitBlock) &&
"Entry does not dominate exit.");

for (unsigned I = 1, E = LoopBypassBlocks.size(); I != E; ++I)
DT->addNewBlock(LoopBypassBlocks[I], LoopBypassBlocks[I-1]);
DT->addNewBlock(LoopVectorPreHeader, LoopBypassBlocks.back());

// We don't predicate stores by this point, so the vector body should be a
// single loop.
assert(LoopVectorBody.size() == 1 && "Expected single block loop!");
Expand Down
38 changes: 38 additions & 0 deletions llvm/test/Analysis/ScalarEvolution/scev-expander-existing-value.ll
@@ -0,0 +1,38 @@
; RUN: opt < %s -loop-vectorize -force-vector-width=4 -verify-scev-maps -S |FileCheck %s

; SCEV expansion uses existing value when the SCEV has no AddRec expr.
; CHECK: select
; CHECK-NOT: select

@a = common global [1000 x i16] zeroinitializer, align 16

define i32 @foo(i32 %x, i32 %y) {
entry:
%cmp = icmp slt i32 %x, %y
%cond = select i1 %cmp, i32 %x, i32 %y
%cmp1.10 = icmp sgt i32 %cond, 0
br i1 %cmp1.10, label %for.body.lr.ph, label %for.end

for.body.lr.ph: ; preds = %entry
%tmp = sext i32 %cond to i64
br label %for.body

for.body: ; preds = %for.body, %for.body.lr.ph
%indvars.iv = phi i64 [ 0, %for.body.lr.ph ], [ %indvars.iv.next, %for.body ]
%total.011 = phi i32 [ 0, %for.body.lr.ph ], [ %add, %for.body ]
%arrayidx = getelementptr inbounds [1000 x i16], [1000 x i16]* @a, i64 0, i64 %indvars.iv
%tmp1 = load i16, i16* %arrayidx, align 2
%conv = sext i16 %tmp1 to i32
%add = add nsw i32 %conv, %total.011
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
%cmp1 = icmp slt i64 %indvars.iv.next, %tmp
br i1 %cmp1, label %for.body, label %for.end.loopexit

for.end.loopexit: ; preds = %for.body
%add.lcssa = phi i32 [ %add, %for.body ]
br label %for.end

for.end: ; preds = %for.end.loopexit, %entry
%total.0.lcssa = phi i32 [ 0, %entry ], [ %add.lcssa, %for.end.loopexit ]
ret i32 %total.0.lcssa
}
1 change: 0 additions & 1 deletion llvm/test/CodeGen/Thumb2/2009-12-01-LoopIVUsers.ll
Expand Up @@ -8,7 +8,6 @@ entry:
; -- The loop following the load should only use a single add-literation
; instruction.
; CHECK: vldr
; CHECK: adds r{{[0-9]+.*}}#1
; CHECK-NOT: adds
; CHECK: subsections_via_symbols

Expand Down
1 change: 0 additions & 1 deletion llvm/test/Transforms/IRCE/decrementing-loop.ll
Expand Up @@ -28,7 +28,6 @@ define void @decrementing_loop(i32 *%arr, i32 *%a_len_ptr, i32 %n) {
ret void

; CHECK: loop.preheader:
; CHECK: [[indvar_start:[^ ]+]] = add i32 %n, -1
; CHECK: [[not_len:[^ ]+]] = sub i32 -1, %len
; CHECK: [[not_n:[^ ]+]] = sub i32 -1, %n
; CHECK: [[not_len_hiclamp_cmp:[^ ]+]] = icmp sgt i32 [[not_len]], [[not_n]]
Expand Down
Expand Up @@ -11,7 +11,7 @@ entry:
br i1 %cmp1, label %for.body, label %for.end

; Make sure the added GEP has the right index type
; CHECK: %lftr.limit = getelementptr i8, i8 addrspace(2)* %base, i8 %0
; CHECK: %lftr.limit = getelementptr i8, i8 addrspace(2)* %base, i8 %idx.trunc

; CHECK: for.body:
; CHECK: phi i8 addrspace(2)*
Expand Down Expand Up @@ -43,7 +43,7 @@ entry:
br i1 %cmp1, label %for.body, label %for.end

; Make sure the added GEP has the right index type
; CHECK: %lftr.limit = getelementptr i8, i8 addrspace(3)* %base, i16 %0
; CHECK: %lftr.limit = getelementptr i8, i8 addrspace(3)* %base, i16 %idx.trunc

; CHECK: for.body:
; CHECK: phi i8 addrspace(3)*
Expand Down
5 changes: 1 addition & 4 deletions llvm/test/Transforms/IndVarSimplify/pr24783.ll
Expand Up @@ -6,9 +6,6 @@ target triple = "powerpc64-unknown-linux-gnu"
define void @f(i32* %end.s, i8** %loc, i32 %p) {
; CHECK-LABEL: @f(
entry:
; CHECK: [[P_SEXT:%[0-9a-z]+]] = sext i32 %p to i64
; CHECK: [[END:%[0-9a-z]+]] = getelementptr i32, i32* %end.s, i64 [[P_SEXT]]

%end = getelementptr inbounds i32, i32* %end.s, i32 %p
%init = bitcast i32* %end.s to i8*
br label %while.body.i
Expand All @@ -22,7 +19,7 @@ while.body.i:

loop.exit:
; CHECK: loop.exit:
; CHECK: [[END_BCASTED:%[a-z0-9]+]] = bitcast i32* %scevgep to i8*
; CHECK: [[END_BCASTED:%[a-z0-9]+]] = bitcast i32* %end to i8*
; CHECK: store i8* [[END_BCASTED]], i8** %loc
%ptr.inc.lcssa = phi i8* [ %ptr.inc, %while.body.i ]
store i8* %ptr.inc.lcssa, i8** %loc
Expand Down

0 comments on commit ed13397

Please sign in to comment.