src - FreeBSD source tree

diff options


context:
space:
mode:

author	Dimitry Andric <dim@FreeBSD.org>	2020-02-27 19:04:39 +0000
committer	Dimitry Andric <dim@FreeBSD.org>	2020-02-27 19:04:39 +0000
commit	473957941922d17be72089e385e2e2a995fd0e1c (patch)
tree	7cd9f69252de735b0fa011d5e83e02e619b03819 /contrib/llvm-project/llvm/lib/Transforms
parent	21054a9b078ffbeb221934db2b545397cdd42d7d (diff)
parent	92d00d6a94bb341a1ed677031280e14863d4bb28 (diff)

Notes

Diffstat (limited to 'contrib/llvm-project/llvm/lib/Transforms')

-rw-r--r--

contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

-rw-r--r--

contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineShifts.cpp

-rw-r--r--

contrib/llvm-project/llvm/lib/Transforms/Scalar/LICM.cpp

-rw-r--r--

contrib/llvm-project/llvm/lib/Transforms/Scalar/LoopRotation.cpp

-rw-r--r--

contrib/llvm-project/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp

-rw-r--r--

contrib/llvm-project/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp

6 files changed, 56 insertions, 61 deletions

diff --git a/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp b/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp
index f38dc436722d..e49e6cec65c0 100644
--- a/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp
+++ b/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

@@ -3494,7 +3494,8 @@ foldShiftIntoShiftInAnotherHandOfAndInICmp(ICmpInst &I, const SimplifyQuery SQ,

Instruction *NarrowestShift = XShift;

Type *WidestTy = WidestShift->getType();

- assert(NarrowestShift->getType() == I.getOperand(0)->getType() &&

+ Type *NarrowestTy = NarrowestShift->getType();

+ assert(NarrowestTy == I.getOperand(0)->getType() &&

"We did not look past any shifts while matching XShift though.");

bool HadTrunc = WidestTy != I.getOperand(0)->getType();

@@ -3533,6 +3534,23 @@ foldShiftIntoShiftInAnotherHandOfAndInICmp(ICmpInst &I, const SimplifyQuery SQ,

if (XShAmt->getType() != YShAmt->getType())

return nullptr;

+ // As input, we have the following pattern:

+ // icmp eq/ne (and ((x shift Q), (y oppositeshift K))), 0

+ // We want to rewrite that as:

+ // icmp eq/ne (and (x shift (Q+K)), y), 0 iff (Q+K) u< bitwidth(x)

+ // While we know that originally (Q+K) would not overflow

+ // (because 2 * (N-1) u<= iN -1), we have looked past extensions of

+ // shift amounts, so it may now overflow in smaller bitwidth.

+ // To ensure that does not happen, we need to ensure that the total maximal

+ // shift amount is still representable in that smaller bit width.

+ unsigned MaximalPossibleTotalShiftAmount =

+ (WidestTy->getScalarSizeInBits() - 1) +

+ (NarrowestTy->getScalarSizeInBits() - 1);

+ APInt MaximalRepresentableShiftAmount =

+ APInt::getAllOnesValue(XShAmt->getType()->getScalarSizeInBits());

+ if (MaximalRepresentableShiftAmount.ult(MaximalPossibleTotalShiftAmount))

+ return nullptr;

// Can we fold (XShAmt+YShAmt) ?

auto *NewShAmt = dyn_cast_or_null<Constant>(

SimplifyAddInst(XShAmt, YShAmt, /*isNSW=*/false,

diff --git a/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineShifts.cpp b/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineShifts.cpp
index fbff5dd4a8cd..739579e2d38e 100644
--- a/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineShifts.cpp
+++ b/contrib/llvm-project/llvm/lib/Transforms/InstCombine/InstCombineShifts.cpp

@@ -23,8 +23,11 @@ using namespace PatternMatch;

// Given pattern:

// (x shiftopcode Q) shiftopcode K

// we should rewrite it as

-// x shiftopcode (Q+K) iff (Q+K) u< bitwidth(x)

-// This is valid for any shift, but they must be identical.

+// x shiftopcode (Q+K) iff (Q+K) u< bitwidth(x) and

+//

+// This is valid for any shift, but they must be identical, and we must be

+// careful in case we have (zext(Q)+zext(K)) and look past extensions,

+// (Q+K) must not overflow or else (Q+K) u< bitwidth(x) is bogus.

// AnalyzeForSignBitExtraction indicates that we will only analyze whether this

// pattern has any 2 right-shifts that sum to 1 less than original bit width.

@@ -58,6 +61,23 @@ Value *InstCombiner::reassociateShiftAmtsOfTwoSameDirectionShifts(

if (ShAmt0->getType() != ShAmt1->getType())

return nullptr;

+ // As input, we have the following pattern:

+ // Sh0 (Sh1 X, Q), K

+ // We want to rewrite that as:

+ // Sh x, (Q+K) iff (Q+K) u< bitwidth(x)

+ // While we know that originally (Q+K) would not overflow

+ // (because 2 * (N-1) u<= iN -1), we have looked past extensions of

+ // shift amounts, so it may now overflow in smaller bitwidth.

+ // To ensure that does not happen, we need to ensure that the total maximal

+ // shift amount is still representable in that smaller bit width.

+ unsigned MaximalPossibleTotalShiftAmount =

+ (Sh0->getType()->getScalarSizeInBits() - 1) +

+ (Sh1->getType()->getScalarSizeInBits() - 1);

+ APInt MaximalRepresentableShiftAmount =

+ APInt::getAllOnesValue(ShAmt0->getType()->getScalarSizeInBits());

+ if (MaximalRepresentableShiftAmount.ult(MaximalPossibleTotalShiftAmount))

+ return nullptr;

// We are only looking for signbit extraction if we have two right shifts.

bool HadTwoRightShifts = match(Sh0, m_Shr(m_Value(), m_Value())) &&

match(Sh1, m_Shr(m_Value(), m_Value()));

diff --git a/contrib/llvm-project/llvm/lib/Transforms/Scalar/LICM.cpp b/contrib/llvm-project/llvm/lib/Transforms/Scalar/LICM.cpp
index 8c33045c2380..a1c012fddde3 100644
--- a/contrib/llvm-project/llvm/lib/Transforms/Scalar/LICM.cpp
+++ b/contrib/llvm-project/llvm/lib/Transforms/Scalar/LICM.cpp

@@ -790,41 +790,6 @@ public:

};

} // namespace

-/// Return true if we know how to rewrite all uses of the given alloca after

-/// hoisting it out of the loop. The main concerns are a) potential captures

-/// and b) invariant.start markers which don't capture, but are no longer

-/// valid w/o a corresponding invariant.end.

-static bool canRewriteUsesOfAlloca(AllocaInst &AI) {

- // TODO: This looks a lot like capture tracking, but we need to remove any

- // invariant starts if we extend the lifetime of the alloca by hoisting it.

- // We should probably refactor capture tracking into a form which allows us

- // to reuse the relevant bits and remove the duplicated logic here.

- SmallVector<Use *, 16> Worklist;

- for (Use &U : AI.uses())

- Worklist.push_back(&U);

- unsigned NumUsesExplored = 0;

- while (!Worklist.empty()) {

- Use *U = Worklist.pop_back_val();

- Instruction *I = cast<Instruction>(U->getUser());

- NumUsesExplored++;

- if (NumUsesExplored > DefaultMaxUsesToExplore)

- return false;

- // Non capturing, terminating uses

- if (isa<LoadInst>(I) ||

- (isa<StoreInst>(I) && U->getOperandNo() == 1))

- continue;

- // Non capturing, non-terminating

- if (!isa<BitCastInst>(I) && !isa<GetElementPtrInst>(I))

- return false;

- for (Use &U : I->uses())

- Worklist.push_back(&U);

- }

- return true;

/// Walk the specified region of the CFG (defined by all blocks dominated by

/// the specified block, and that are in the current loop) in depth first

/// order w.r.t the DominatorTree. This allows us to visit definitions before

@@ -945,16 +910,6 @@ bool llvm::hoistRegion(DomTreeNode *N, AliasAnalysis *AA, LoopInfo *LI,

continue;

}

- if (isa<AllocaInst>(&I) &&

- SafetyInfo->isGuaranteedToExecute(I, DT, CurLoop) &&

- canRewriteUsesOfAlloca(cast<AllocaInst>(I))) {

- hoist(I, DT, CurLoop, CFH.getOrCreateHoistedBlock(BB), SafetyInfo,

- MSSAU, SE, ORE);

- HoistedInstructions.push_back(&I);

- Changed = true;

- continue;

- }

if (PHINode *PN = dyn_cast<PHINode>(&I)) {

if (CFH.canHoistPHI(PN)) {

// Redirect incoming blocks first to ensure that we create hoisted

@@ -1537,7 +1492,8 @@ static bool canSplitPredecessors(PHINode *PN, LoopSafetyInfo *SafetyInfo) {

return false;

for (pred_iterator PI = pred_begin(BB), E = pred_end(BB); PI != E; ++PI) {

BasicBlock *BBPred = *PI;

- if (isa<IndirectBrInst>(BBPred->getTerminator()))

+ if (isa<IndirectBrInst>(BBPred->getTerminator()) ||

+ isa<CallBrInst>(BBPred->getTerminator()))

return false;

}

return true;

diff --git a/contrib/llvm-project/llvm/lib/Transforms/Scalar/LoopRotation.cpp b/contrib/llvm-project/llvm/lib/Transforms/Scalar/LoopRotation.cpp
index 0868e742f4ee..67c20b2edae8 100644
--- a/contrib/llvm-project/llvm/lib/Transforms/Scalar/LoopRotation.cpp
+++ b/contrib/llvm-project/llvm/lib/Transforms/Scalar/LoopRotation.cpp

@@ -81,10 +81,8 @@ public:

void getAnalysisUsage(AnalysisUsage &AU) const override {

AU.addRequired<AssumptionCacheTracker>();

AU.addRequired<TargetTransformInfoWrapperPass>();

- if (EnableMSSALoopDependency) {

- AU.addRequired<MemorySSAWrapperPass>();

+ if (EnableMSSALoopDependency)

AU.addPreserved<MemorySSAWrapperPass>();

- }

getLoopAnalysisUsage(AU);

}

@@ -101,8 +99,11 @@ public:

const SimplifyQuery SQ = getBestSimplifyQuery(*this, F);

Optional<MemorySSAUpdater> MSSAU;

if (EnableMSSALoopDependency) {

- MemorySSA *MSSA = &getAnalysis<MemorySSAWrapperPass>().getMSSA();

- MSSAU = MemorySSAUpdater(MSSA);

+ // Not requiring MemorySSA and getting it only if available will split

+ // the loop pass pipeline when LoopRotate is being run first.

+ auto *MSSAA = getAnalysisIfAvailable<MemorySSAWrapperPass>();

+ if (MSSAA)

+ MSSAU = MemorySSAUpdater(&MSSAA->getMSSA());

}

return LoopRotation(L, LI, TTI, AC, &DT, &SE,

MSSAU.hasValue() ? MSSAU.getPointer() : nullptr, SQ,

diff --git a/contrib/llvm-project/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp b/contrib/llvm-project/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp
index c9eb4abfa21a..9a7379e27ed6 100644
--- a/contrib/llvm-project/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp
+++ b/contrib/llvm-project/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp

@@ -505,7 +505,8 @@ llvm::SplitAllCriticalEdges(Function &F,

unsigned NumBroken = 0;

for (BasicBlock &BB : F) {

Instruction *TI = BB.getTerminator();

- if (TI->getNumSuccessors() > 1 && !isa<IndirectBrInst>(TI))

+ if (TI->getNumSuccessors() > 1 && !isa<IndirectBrInst>(TI) &&

+ !isa<CallBrInst>(TI))

for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i)

if (SplitCriticalEdge(TI, i, Options))

++NumBroken;

diff --git a/contrib/llvm-project/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/contrib/llvm-project/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
index 479bca83b51e..26cae4134ebc 100644
--- a/contrib/llvm-project/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
+++ b/contrib/llvm-project/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp

@@ -832,13 +832,12 @@ public:

// Extracts from consecutive indexes of the same vector better score as

// the extracts could be optimized away.

- auto *Ex1 = dyn_cast<ExtractElementInst>(V1);

- auto *Ex2 = dyn_cast<ExtractElementInst>(V2);

- if (Ex1 && Ex2 && Ex1->getVectorOperand() == Ex2->getVectorOperand() &&

- cast<ConstantInt>(Ex1->getIndexOperand())->getZExtValue() + 1 ==

- cast<ConstantInt>(Ex2->getIndexOperand())->getZExtValue()) {

+ Value *EV;

+ ConstantInt *Ex1Idx, *Ex2Idx;

+ if (match(V1, m_ExtractElement(m_Value(EV), m_ConstantInt(Ex1Idx))) &&

+ match(V2, m_ExtractElement(m_Deferred(EV), m_ConstantInt(Ex2Idx))) &&

+ Ex1Idx->getZExtValue() + 1 == Ex2Idx->getZExtValue())

return VLOperands::ScoreConsecutiveExtracts;

- }

auto *I1 = dyn_cast<Instruction>(V1);

auto *I2 = dyn_cast<Instruction>(V2);