src - FreeBSD source tree

diff options


context:
space:
mode:

author	Dimitry Andric <dim@FreeBSD.org>	2022-07-14 18:50:02 +0000
committer	Dimitry Andric <dim@FreeBSD.org>	2022-07-14 18:50:02 +0000
commit	1f917f69ff07f09b6dbb670971f57f8efe718b84 (patch)
tree	99293cbc1411737cd995dac10a99b2c40ef0944c /llvm/lib/Transforms/Utils
parent	145449b1e420787bb99721a429341fa6be3adfb6 (diff)

vendor/llvm-project/llvmorg-15-init-16436-g18a6ab5b8d1f

Diffstat (limited to 'llvm/lib/Transforms/Utils')

-rw-r--r--

llvm/lib/Transforms/Utils/BasicBlockUtils.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/BreakCriticalEdges.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/CodeExtractor.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/Debugify.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/LoopUnrollRuntime.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/LoopUtils.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/LowerAtomic.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/MisExpect.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/ModuleUtils.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/PromoteMemoryToRegister.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/SCCPSolver.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/ScalarEvolutionExpander.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/SimplifyCFG.cpp

205

-rw-r--r--

llvm/lib/Transforms/Utils/SimplifyIndVar.cpp

-rw-r--r--

llvm/lib/Transforms/Utils/SimplifyLibCalls.cpp

189

15 files changed, 393 insertions, 301 deletions

diff --git a/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp b/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp
index e9983ff82176..079b2fc973b9 100644
--- a/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp
+++ b/llvm/lib/Transforms/Utils/BasicBlockUtils.cpp

@@ -769,8 +769,7 @@ llvm::SplitAllCriticalEdges(Function &F,

unsigned NumBroken = 0;

for (BasicBlock &BB : F) {

Instruction *TI = BB.getTerminator();

- if (TI->getNumSuccessors() > 1 && !isa<IndirectBrInst>(TI) &&

- !isa<CallBrInst>(TI))

+ if (TI->getNumSuccessors() > 1 && !isa<IndirectBrInst>(TI))

for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i)

if (SplitCriticalEdge(TI, i, Options))

++NumBroken;

@@ -1132,9 +1131,7 @@ SplitBlockPredecessorsImpl(BasicBlock *BB, ArrayRef<BasicBlock *> Preds,

// all BlockAddress uses would need to be updated.

assert(!isa<IndirectBrInst>(Preds[i]->getTerminator()) &&

"Cannot split an edge from an IndirectBrInst");

- assert(!isa<CallBrInst>(Preds[i]->getTerminator()) &&

- "Cannot split an edge from a CallBrInst");

- Preds[i]->getTerminator()->replaceUsesOfWith(BB, NewBB);

+ Preds[i]->getTerminator()->replaceSuccessorWith(BB, NewBB);

}

// Insert a new PHI node into NewBB for every PHI node in BB and that new PHI

diff --git a/llvm/lib/Transforms/Utils/BreakCriticalEdges.cpp b/llvm/lib/Transforms/Utils/BreakCriticalEdges.cpp
index 0b36e8708a03..9c595401ce29 100644
--- a/llvm/lib/Transforms/Utils/BreakCriticalEdges.cpp
+++ b/llvm/lib/Transforms/Utils/BreakCriticalEdges.cpp

@@ -129,8 +129,7 @@ llvm::SplitKnownCriticalEdge(Instruction *TI, unsigned SuccNum,

SmallVector<BasicBlock *, 4> LoopPreds;

// Check if extra modifications will be required to preserve loop-simplify

// form after splitting. If it would require splitting blocks with IndirectBr

- // or CallBr terminators, bail out if preserving loop-simplify form is

- // requested.

+ // terminators, bail out if preserving loop-simplify form is requested.

if (LI) {

if (Loop *TIL = LI->getLoopFor(TIBB)) {

@@ -156,10 +155,7 @@ llvm::SplitKnownCriticalEdge(Instruction *TI, unsigned SuccNum,

// Loop-simplify form can be preserved, if we can split all in-loop

// predecessors.

if (any_of(LoopPreds, [](BasicBlock *Pred) {

- const Instruction *T = Pred->getTerminator();

- if (const auto *CBR = dyn_cast<CallBrInst>(T))

- return CBR->getDefaultDest() != Pred;

- return isa<IndirectBrInst>(T);

+ return isa<IndirectBrInst>(Pred->getTerminator());

})) {

if (Options.PreserveLoopSimplify)

return nullptr;

diff --git a/llvm/lib/Transforms/Utils/CodeExtractor.cpp b/llvm/lib/Transforms/Utils/CodeExtractor.cpp
index f94d854f7ee8..421f1f329f07 100644
--- a/llvm/lib/Transforms/Utils/CodeExtractor.cpp
+++ b/llvm/lib/Transforms/Utils/CodeExtractor.cpp

@@ -927,6 +927,7 @@ Function *CodeExtractor::constructFunction(const ValueSet &inputs,

case Attribute::AlwaysInline:

case Attribute::Cold:

case Attribute::DisableSanitizerInstrumentation:

+ case Attribute::FnRetThunkExtern:

case Attribute::Hot:

case Attribute::NoRecurse:

case Attribute::InlineHint:

@@ -1777,7 +1778,7 @@ CodeExtractor::extractCodeRegion(const CodeExtractorAnalysisCache &CEAC,

auto Count = BFI->getProfileCountFromFreq(EntryFreq.getFrequency());

if (Count)

newFunction->setEntryCount(

- ProfileCount(Count.getValue(), Function::PCT_Real)); // FIXME

+ ProfileCount(Count.value(), Function::PCT_Real)); // FIXME

BFI->setBlockFreq(codeReplacer, EntryFreq.getFrequency());

}

diff --git a/llvm/lib/Transforms/Utils/Debugify.cpp b/llvm/lib/Transforms/Utils/Debugify.cpp
index 205f7a7d9ed2..24126b5ab67b 100644
--- a/llvm/lib/Transforms/Utils/Debugify.cpp
+++ b/llvm/lib/Transforms/Utils/Debugify.cpp

@@ -961,8 +961,13 @@ createDebugifyFunctionPass(enum DebugifyMode Mode,

}

PreservedAnalyses NewPMDebugifyPass::run(Module &M, ModuleAnalysisManager &) {

- applyDebugifyMetadata(M, M.functions(),

- "ModuleDebugify: ", /*ApplyToMF*/ nullptr);

+ if (Mode == DebugifyMode::SyntheticDebugInfo)

+ applyDebugifyMetadata(M, M.functions(),

+ "ModuleDebugify: ", /*ApplyToMF*/ nullptr);

+ else

+ collectDebugInfoMetadata(M, M.functions(), *DebugInfoBeforePass,

+ "ModuleDebugify (original debuginfo)",

+ NameOfWrappedPass);

return PreservedAnalyses::all();

}

@@ -992,8 +997,14 @@ FunctionPass *createCheckDebugifyFunctionPass(

PreservedAnalyses NewPMCheckDebugifyPass::run(Module &M,

ModuleAnalysisManager &) {

- checkDebugifyMetadata(M, M.functions(), "", "CheckModuleDebugify", false,

- nullptr);

+ if (Mode == DebugifyMode::SyntheticDebugInfo)

+ checkDebugifyMetadata(M, M.functions(), NameOfWrappedPass,

+ "CheckModuleDebugify", Strip, StatsMap);

+ else

+ checkDebugInfoMetadata(

+ M, M.functions(), *DebugInfoBeforePass,

+ "CheckModuleDebugify (original debuginfo)", NameOfWrappedPass,

+ OrigDIVerifyBugsReportFilePath);

return PreservedAnalyses::all();

}

@@ -1006,13 +1017,15 @@ static bool isIgnoredPass(StringRef PassID) {

void DebugifyEachInstrumentation::registerCallbacks(

PassInstrumentationCallbacks &PIC) {

- PIC.registerBeforeNonSkippedPassCallback([](StringRef P, Any IR) {

+ PIC.registerBeforeNonSkippedPassCallback([this](StringRef P, Any IR) {

if (isIgnoredPass(P))

return;

if (any_isa<const Function *>(IR))

- applyDebugify(*const_cast<Function *>(any_cast<const Function *>(IR)));

+ applyDebugify(*const_cast<Function *>(any_cast<const Function *>(IR)),

+ Mode, DebugInfoBeforePass, P);

else if (any_isa<const Module *>(IR))

- applyDebugify(*const_cast<Module *>(any_cast<const Module *>(IR)));

+ applyDebugify(*const_cast<Module *>(any_cast<const Module *>(IR)),

+ Mode, DebugInfoBeforePass, P);

});

PIC.registerAfterPassCallback([this](StringRef P, Any IR,

const PreservedAnalyses &PassPA) {

@@ -1022,12 +1035,24 @@ void DebugifyEachInstrumentation::registerCallbacks(

auto &F = *const_cast<Function *>(any_cast<const Function *>(IR));

Module &M = *F.getParent();

auto It = F.getIterator();

- checkDebugifyMetadata(M, make_range(It, std::next(It)), P,

- "CheckFunctionDebugify", /*Strip=*/true, &StatsMap);

+ if (Mode == DebugifyMode::SyntheticDebugInfo)

+ checkDebugifyMetadata(M, make_range(It, std::next(It)), P,

+ "CheckFunctionDebugify", /*Strip=*/true, DIStatsMap);

+ else

+ checkDebugInfoMetadata(

+ M, make_range(It, std::next(It)), *DebugInfoBeforePass,

+ "CheckModuleDebugify (original debuginfo)",

+ P, OrigDIVerifyBugsReportFilePath);

} else if (any_isa<const Module *>(IR)) {

auto &M = *const_cast<Module *>(any_cast<const Module *>(IR));

- checkDebugifyMetadata(M, M.functions(), P, "CheckModuleDebugify",

- /*Strip=*/true, &StatsMap);

+ if (Mode == DebugifyMode::SyntheticDebugInfo)

+ checkDebugifyMetadata(M, M.functions(), P, "CheckModuleDebugify",

+ /*Strip=*/true, DIStatsMap);

+ else

+ checkDebugInfoMetadata(

+ M, M.functions(), *DebugInfoBeforePass,

+ "CheckModuleDebugify (original debuginfo)",

+ P, OrigDIVerifyBugsReportFilePath);

}

});

}

diff --git a/llvm/lib/Transforms/Utils/LoopUnrollRuntime.cpp b/llvm/lib/Transforms/Utils/LoopUnrollRuntime.cpp
index cd3b6c1a095a..023a0afd329b 100644
--- a/llvm/lib/Transforms/Utils/LoopUnrollRuntime.cpp
+++ b/llvm/lib/Transforms/Utils/LoopUnrollRuntime.cpp

@@ -402,7 +402,7 @@ CloneLoopBlocks(Loop *L, Value *NewIter, const bool UseEpilogRemainder,

Optional<MDNode *> NewLoopID = makeFollowupLoopID(

LoopID, {LLVMLoopUnrollFollowupAll, LLVMLoopUnrollFollowupRemainder});

if (NewLoopID) {

- NewLoop->setLoopID(NewLoopID.getValue());

+ NewLoop->setLoopID(NewLoopID.value());

// Do not setLoopAlreadyUnrolled if loop attributes have been defined

// explicitly.

diff --git a/llvm/lib/Transforms/Utils/LoopUtils.cpp b/llvm/lib/Transforms/Utils/LoopUtils.cpp
index ec898c463574..82f993b4ceab 100644
--- a/llvm/lib/Transforms/Utils/LoopUtils.cpp
+++ b/llvm/lib/Transforms/Utils/LoopUtils.cpp

@@ -75,9 +75,6 @@ bool llvm::formDedicatedExitBlocks(Loop *L, DominatorTree *DT, LoopInfo *LI,

if (isa<IndirectBrInst>(PredBB->getTerminator()))

// We cannot rewrite exiting edges from an indirectbr.

return false;

- if (isa<CallBrInst>(PredBB->getTerminator()))

- // We cannot rewrite exiting edges from a callbr.

- return false;

InLoopPredecessors.push_back(PredBB);

} else {

@@ -359,7 +356,7 @@ TransformationMode llvm::hasUnrollTransformation(const Loop *L) {

Optional<int> Count =

getOptionalIntLoopAttribute(L, "llvm.loop.unroll.count");

if (Count)

- return Count.getValue() == 1 ? TM_SuppressedByUser : TM_ForcedByUser;

+ return Count.value() == 1 ? TM_SuppressedByUser : TM_ForcedByUser;

if (getBooleanLoopAttribute(L, "llvm.loop.unroll.enable"))

return TM_ForcedByUser;

@@ -380,7 +377,7 @@ TransformationMode llvm::hasUnrollAndJamTransformation(const Loop *L) {

Optional<int> Count =

getOptionalIntLoopAttribute(L, "llvm.loop.unroll_and_jam.count");

if (Count)

- return Count.getValue() == 1 ? TM_SuppressedByUser : TM_ForcedByUser;

+ return Count.value() == 1 ? TM_SuppressedByUser : TM_ForcedByUser;

if (getBooleanLoopAttribute(L, "llvm.loop.unroll_and_jam.enable"))

return TM_ForcedByUser;

@@ -1246,6 +1243,20 @@ static bool canLoopBeDeleted(Loop *L, SmallVector<RewritePhi, 8> &RewritePhiSet)

return true;

}

+/// Checks if it is safe to call InductionDescriptor::isInductionPHI for \p Phi,

+/// and returns true if this Phi is an induction phi in the loop. When

+/// isInductionPHI returns true, \p ID will be also be set by isInductionPHI.

+static bool checkIsIndPhi(PHINode *Phi, Loop *L, ScalarEvolution *SE,

+ InductionDescriptor &ID) {

+ if (!Phi)

+ return false;

+ if (!L->getLoopPreheader())

+ return false;

+ if (Phi->getParent() != L->getHeader())

+ return false;

+ return InductionDescriptor::isInductionPHI(Phi, L, SE, ID);

int llvm::rewriteLoopExitValues(Loop *L, LoopInfo *LI, TargetLibraryInfo *TLI,

ScalarEvolution *SE,

const TargetTransformInfo *TTI,

@@ -1297,6 +1308,46 @@ int llvm::rewriteLoopExitValues(Loop *L, LoopInfo *LI, TargetLibraryInfo *TLI,

if (!L->contains(Inst))

continue;

+ // Find exit values which are induction variables in the loop, and are

+ // unused in the loop, with the only use being the exit block PhiNode,

+ // and the induction variable update binary operator.

+ // The exit value can be replaced with the final value when it is cheap

+ // to do so.

+ if (ReplaceExitValue == UnusedIndVarInLoop) {

+ InductionDescriptor ID;

+ PHINode *IndPhi = dyn_cast<PHINode>(Inst);

+ if (IndPhi) {

+ if (!checkIsIndPhi(IndPhi, L, SE, ID))

+ continue;

+ // This is an induction PHI. Check that the only users are PHI

+ // nodes, and induction variable update binary operators.

+ if (llvm::any_of(Inst->users(), [&](User *U) {

+ if (!isa<PHINode>(U) && !isa<BinaryOperator>(U))

+ return true;

+ BinaryOperator *B = dyn_cast<BinaryOperator>(U);

+ if (B && B != ID.getInductionBinOp())

+ return true;

+ return false;

+ }))

+ continue;

+ } else {

+ // If it is not an induction phi, it must be an induction update

+ // binary operator with an induction phi user.

+ BinaryOperator *B = dyn_cast<BinaryOperator>(Inst);

+ if (!B)

+ continue;

+ if (llvm::any_of(Inst->users(), [&](User *U) {

+ PHINode *Phi = dyn_cast<PHINode>(U);

+ if (Phi != PN && !checkIsIndPhi(Phi, L, SE, ID))

+ return true;

+ return false;

+ }))

+ continue;

+ if (B != ID.getInductionBinOp())

+ continue;

+ }

// Okay, this instruction has a user outside of the current loop

// and varies predictably *inside* the loop. Evaluate the value it

// contains when the loop exits, if possible. We prefer to start with

@@ -1362,7 +1413,9 @@ int llvm::rewriteLoopExitValues(Loop *L, LoopInfo *LI, TargetLibraryInfo *TLI,

// Only do the rewrite when the ExitValue can be expanded cheaply.

// If LoopCanBeDel is true, rewrite exit value aggressively.

- if (ReplaceExitValue == OnlyCheapRepl && !LoopCanBeDel && Phi.HighCost)

+ if ((ReplaceExitValue == OnlyCheapRepl ||

+ ReplaceExitValue == UnusedIndVarInLoop) &&

+ !LoopCanBeDel && Phi.HighCost)

continue;

Value *ExitVal = Rewriter.expandCodeFor(

diff --git a/llvm/lib/Transforms/Utils/LowerAtomic.cpp b/llvm/lib/Transforms/Utils/LowerAtomic.cpp
index 8641581c8039..9914a5ca6c5e 100644
--- a/llvm/lib/Transforms/Utils/LowerAtomic.cpp
+++ b/llvm/lib/Transforms/Utils/LowerAtomic.cpp

@@ -74,6 +74,10 @@ Value *llvm::buildAtomicRMWValue(AtomicRMWInst::BinOp Op,

return Builder.CreateFAdd(Loaded, Inc, "new");

case AtomicRMWInst::FSub:

return Builder.CreateFSub(Loaded, Inc, "new");

+ case AtomicRMWInst::FMax:

+ return Builder.CreateMaxNum(Loaded, Inc);

+ case AtomicRMWInst::FMin:

+ return Builder.CreateMinNum(Loaded, Inc);

default:

llvm_unreachable("Unknown atomic op");

}

diff --git a/llvm/lib/Transforms/Utils/MisExpect.cpp b/llvm/lib/Transforms/Utils/MisExpect.cpp
index b73d68ebec7c..4414b04c7264 100644
--- a/llvm/lib/Transforms/Utils/MisExpect.cpp
+++ b/llvm/lib/Transforms/Utils/MisExpect.cpp

@@ -221,7 +221,7 @@ void checkBackendInstrumentation(Instruction &I,

auto ExpectedWeightsOpt = extractWeights(&I, I.getContext());

if (!ExpectedWeightsOpt)

return;

- auto ExpectedWeights = ExpectedWeightsOpt.getValue();

+ auto ExpectedWeights = ExpectedWeightsOpt.value();

verifyMisExpect(I, RealWeights, ExpectedWeights);

}

@@ -230,7 +230,7 @@ void checkFrontendInstrumentation(Instruction &I,

auto RealWeightsOpt = extractWeights(&I, I.getContext());

if (!RealWeightsOpt)

return;

- auto RealWeights = RealWeightsOpt.getValue();

+ auto RealWeights = RealWeightsOpt.value();

verifyMisExpect(I, RealWeights, ExpectedWeights);

}

diff --git a/llvm/lib/Transforms/Utils/ModuleUtils.cpp b/llvm/lib/Transforms/Utils/ModuleUtils.cpp
index 5120ade70e16..9e1492b97a86 100644
--- a/llvm/lib/Transforms/Utils/ModuleUtils.cpp
+++ b/llvm/lib/Transforms/Utils/ModuleUtils.cpp

@@ -255,7 +255,7 @@ void VFABI::setVectorVariantNames(CallInst *CI,

LLVM_DEBUG(dbgs() << "VFABI: adding mapping '" << VariantMapping << "'\n");

Optional<VFInfo> VI = VFABI::tryDemangleForVFABI(VariantMapping, *M);

assert(VI && "Cannot add an invalid VFABI name.");

- assert(M->getNamedValue(VI.getValue().VectorName) &&

+ assert(M->getNamedValue(VI.value().VectorName) &&

"Cannot add variant to attribute: "

"vector function declaration is missing.");

}

@@ -275,5 +275,13 @@ void llvm::embedBufferInModule(Module &M, MemoryBufferRef Buf,

GV->setSection(SectionName);

GV->setAlignment(Alignment);

+ LLVMContext &Ctx = M.getContext();

+ NamedMDNode *MD = M.getOrInsertNamedMetadata("llvm.embedded.objects");

+ Metadata *MDVals[] = {ConstantAsMetadata::get(GV),

+ MDString::get(Ctx, SectionName)};

+ MD->addOperand(llvm::MDNode::get(Ctx, MDVals));

+ GV->setMetadata(LLVMContext::MD_exclude, llvm::MDNode::get(Ctx, {}));

appendToCompilerUsed(M, GV);

}

diff --git a/llvm/lib/Transforms/Utils/PromoteMemoryToRegister.cpp b/llvm/lib/Transforms/Utils/PromoteMemoryToRegister.cpp
index aff692b36288..bec1db896efb 100644
--- a/llvm/lib/Transforms/Utils/PromoteMemoryToRegister.cpp
+++ b/llvm/lib/Transforms/Utils/PromoteMemoryToRegister.cpp

@@ -488,31 +488,33 @@ static bool promoteSingleBlockAlloca(AllocaInst *AI, const AllocaInfo &Info,

StoresByIndex,

std::make_pair(LoadIdx, static_cast<StoreInst *>(nullptr)),

less_first());

+ Value *ReplVal;

if (I == StoresByIndex.begin()) {

if (StoresByIndex.empty())

// If there are no stores, the load takes the undef value.

- LI->replaceAllUsesWith(UndefValue::get(LI->getType()));

+ ReplVal = UndefValue::get(LI->getType());

else

// There is no store before this load, bail out (load may be affected

// by the following stores - see main comment).

return false;

} else {

- // Otherwise, there was a store before this load, the load takes its value.

- // Note, if the load was marked as nonnull we don't want to lose that

- // information when we erase it. So we preserve it with an assume.

- Value *ReplVal = std::prev(I)->second->getOperand(0);

- if (AC && LI->getMetadata(LLVMContext::MD_nonnull) &&

- !isKnownNonZero(ReplVal, DL, 0, AC, LI, &DT))

- addAssumeNonNull(AC, LI);

+ // Otherwise, there was a store before this load, the load takes its

+ // value.

+ ReplVal = std::prev(I)->second->getOperand(0);

+ }

- // If the replacement value is the load, this must occur in unreachable

- // code.

- if (ReplVal == LI)

- ReplVal = PoisonValue::get(LI->getType());

+ // Note, if the load was marked as nonnull we don't want to lose that

+ // information when we erase it. So we preserve it with an assume.

+ if (AC && LI->getMetadata(LLVMContext::MD_nonnull) &&

+ !isKnownNonZero(ReplVal, DL, 0, AC, LI, &DT))

+ addAssumeNonNull(AC, LI);

- LI->replaceAllUsesWith(ReplVal);

- }

+ // If the replacement value is the load, this must occur in unreachable

+ // code.

+ if (ReplVal == LI)

+ ReplVal = PoisonValue::get(LI->getType());

+ LI->replaceAllUsesWith(ReplVal);

LI->eraseFromParent();

LBI.deleteValue(LI);

}

diff --git a/llvm/lib/Transforms/Utils/SCCPSolver.cpp b/llvm/lib/Transforms/Utils/SCCPSolver.cpp
index eee91e70292e..09a83f1ea094 100644
--- a/llvm/lib/Transforms/Utils/SCCPSolver.cpp
+++ b/llvm/lib/Transforms/Utils/SCCPSolver.cpp

@@ -208,8 +208,6 @@ private:

if (!Elt)

LV.markOverdefined(); // Unknown sort of constant.

- else if (isa<UndefValue>(Elt))

- ; // Undef values remain unknown.

else

LV.markConstant(Elt); // Constants are constant.

}

@@ -356,8 +354,7 @@ public:

// We only track the contents of scalar globals.

if (GV->getValueType()->isSingleValueType()) {

ValueLatticeElement &IV = TrackedGlobals[GV];

- if (!isa<UndefValue>(GV->getInitializer()))

- IV.markConstant(GV->getInitializer());

+ IV.markConstant(GV->getInitializer());

}

@@ -822,9 +819,6 @@ void SCCPInstVisitor::visitCastInst(CastInst &I) {

if (Constant *OpC = getConstant(OpSt)) {

// Fold the constant as we build.

Constant *C = ConstantFoldCastOperand(I.getOpcode(), OpC, I.getType(), DL);

- if (isa<UndefValue>(C))

- return;

- // Propagate constant value

markConstant(&I, C);

} else if (I.getDestTy()->isIntegerTy()) {

auto &LV = getValueState(&I);

@@ -959,19 +953,15 @@ void SCCPInstVisitor::visitUnaryOperator(Instruction &I) {

if (isOverdefined(IV))

return (void)markOverdefined(&I);

- if (isConstant(V0State)) {

- Constant *C = ConstantExpr::get(I.getOpcode(), getConstant(V0State));

- // op Y -> undef.

- if (isa<UndefValue>(C))

- return;

- return (void)markConstant(IV, &I, C);

- }

- // If something is undef, wait for it to resolve.

- if (!isOverdefined(V0State))

+ // If something is unknown/undef, wait for it to resolve.

+ if (V0State.isUnknownOrUndef())

return;

+ if (isConstant(V0State))

+ if (Constant *C = ConstantFoldUnaryOpOperand(I.getOpcode(),

+ getConstant(V0State), DL))

+ return (void)markConstant(IV, &I, C);

markOverdefined(&I);

}

@@ -999,9 +989,6 @@ void SCCPInstVisitor::visitBinaryOperator(Instruction &I) {

Value *R = simplifyBinOp(I.getOpcode(), V1, V2, SimplifyQuery(DL));

auto *C = dyn_cast_or_null<Constant>(R);

if (C) {

- // X op Y -> undef.

- if (isa<UndefValue>(C))

- return;

// Conservatively assume that the result may be based on operands that may

// be undef. Note that we use mergeInValue to combine the constant with

// the existing lattice value for I, as different constants might be found

@@ -1050,6 +1037,7 @@ void SCCPInstVisitor::visitCmpInst(CmpInst &I) {

Constant *C = V1State.getCompare(I.getPredicate(), I.getType(), V2State);

if (C) {

+ // TODO: getCompare() currently has incorrect handling for unknown/undef.

if (isa<UndefValue>(C))

return;

ValueLatticeElement CV;

@@ -1095,8 +1083,6 @@ void SCCPInstVisitor::visitGetElementPtrInst(GetElementPtrInst &I) {

auto Indices = makeArrayRef(Operands.begin() + 1, Operands.end());

Constant *C =

ConstantExpr::getGetElementPtr(I.getSourceElementType(), Ptr, Indices);

- if (isa<UndefValue>(C))

- return;

markConstant(&I, C);

}

@@ -1174,11 +1160,8 @@ void SCCPInstVisitor::visitLoadInst(LoadInst &I) {

}

// Transform load from a constant into a constant if possible.

- if (Constant *C = ConstantFoldLoadFromConstPtr(Ptr, I.getType(), DL)) {

- if (isa<UndefValue>(C))

- return;

+ if (Constant *C = ConstantFoldLoadFromConstPtr(Ptr, I.getType(), DL))

return (void)markConstant(IV, &I, C);

- }

}

// Fall back to metadata.

@@ -1223,12 +1206,8 @@ void SCCPInstVisitor::handleCallOverdefined(CallBase &CB) {

// If we can constant fold this, mark the result of the call as a

// constant.

- if (Constant *C = ConstantFoldCall(&CB, F, Operands, &GetTLI(*F))) {

- // call -> undef.

- if (isa<UndefValue>(C))

- return;

+ if (Constant *C = ConstantFoldCall(&CB, F, Operands, &GetTLI(*F)))

return (void)markConstant(&CB, C);

- }

}

// Fall back to metadata.

diff --git a/llvm/lib/Transforms/Utils/ScalarEvolutionExpander.cpp b/llvm/lib/Transforms/Utils/ScalarEvolutionExpander.cpp
index 401f1ee5a55d..0c8bf3827256 100644
--- a/llvm/lib/Transforms/Utils/ScalarEvolutionExpander.cpp
+++ b/llvm/lib/Transforms/Utils/ScalarEvolutionExpander.cpp

@@ -220,7 +220,8 @@ Value *SCEVExpander::InsertBinop(Instruction::BinaryOps Opcode,

// Fold a binop with constant operands.

if (Constant *CLHS = dyn_cast<Constant>(LHS))

if (Constant *CRHS = dyn_cast<Constant>(RHS))

- return ConstantExpr::get(Opcode, CLHS, CRHS);

+ if (Constant *Res = ConstantFoldBinaryOpOperands(Opcode, CLHS, CRHS, DL))

+ return Res;

// Do a quick scan to see if we have this binop nearby. If so, reuse it.

unsigned ScanLimit = 6;

diff --git a/llvm/lib/Transforms/Utils/SimplifyCFG.cpp b/llvm/lib/Transforms/Utils/SimplifyCFG.cpp
index 567b866f7777..4b5ade99767b 100644
--- a/llvm/lib/Transforms/Utils/SimplifyCFG.cpp
+++ b/llvm/lib/Transforms/Utils/SimplifyCFG.cpp

@@ -377,18 +377,12 @@ static void AddPredecessorToBlock(BasicBlock *Succ, BasicBlock *NewPred,

/// expensive.

static InstructionCost computeSpeculationCost(const User *I,

const TargetTransformInfo &TTI) {

- assert(isSafeToSpeculativelyExecute(I) &&

+ assert((!isa<Instruction>(I) ||

+ isSafeToSpeculativelyExecute(cast<Instruction>(I))) &&

"Instruction is not safe to speculatively execute!");

return TTI.getUserCost(I, TargetTransformInfo::TCK_SizeAndLatency);

}

-/// Check whether this is a potentially trapping constant.

-static bool canTrap(const Value *V) {

- if (auto *C = dyn_cast<Constant>(V))

- return C->canTrap();

- return false;

/// If we have a merge point of an "if condition" as accepted above,

/// return true if the specified value dominates the block. We

/// don't handle the true generality of domination here, just a special case

@@ -421,9 +415,9 @@ static bool dominatesMergePoint(Value *V, BasicBlock *BB,

Instruction *I = dyn_cast<Instruction>(V);

if (!I) {

- // Non-instructions all dominate instructions, but not all constantexprs

- // can be executed unconditionally.

- return !canTrap(V);

+ // Non-instructions dominate all instructions and can be executed

+ // unconditionally.

+ return true;

}

BasicBlock *PBB = I->getParent();

@@ -1473,10 +1467,7 @@ bool SimplifyCFGOpt::HoistThenElseCodeToIf(BranchInst *BI,

while (isa<DbgInfoIntrinsic>(I2))

I2 = &*BB2_Itr++;

}

- // FIXME: Can we define a safety predicate for CallBr?

- if (isa<PHINode>(I1) || !I1->isIdenticalToWhenDefined(I2) ||

- (isa<InvokeInst>(I1) && !isSafeToHoistInvoke(BB1, BB2, I1, I2)) ||

- isa<CallBrInst>(I1))

+ if (isa<PHINode>(I1) || !I1->isIdenticalToWhenDefined(I2))

return false;

BasicBlock *BIParent = BI->getParent();

@@ -1609,11 +1600,6 @@ HoistTerminator:

if (passingValueIsAlwaysUndefined(BB1V, &PN) ||

passingValueIsAlwaysUndefined(BB2V, &PN))

return Changed;

- if (isa<ConstantExpr>(BB1V) && !isSafeToSpeculativelyExecute(BB1V))

- return Changed;

- if (isa<ConstantExpr>(BB2V) && !isSafeToSpeculativelyExecute(BB2V))

- return Changed;

}

@@ -2679,9 +2665,6 @@ static bool validateAndCostRequiredSelects(BasicBlock *BB, BasicBlock *ThenBB,

passingValueIsAlwaysUndefined(ThenV, &PN))

return false;

- if (canTrap(OrigV) || canTrap(ThenV))

- return false;

HaveRewritablePHIs = true;

ConstantExpr *OrigCE = dyn_cast<ConstantExpr>(OrigV);

ConstantExpr *ThenCE = dyn_cast<ConstantExpr>(ThenV);

@@ -2979,10 +2962,8 @@ static bool BlockIsSimpleEnoughToThreadThrough(BasicBlock *BB) {

return true;

}

-static ConstantInt *

-getKnownValueOnEdge(Value *V, BasicBlock *From, BasicBlock *To,

- SmallDenseMap<std::pair<BasicBlock *, BasicBlock *>,

- ConstantInt *> &Visited) {

+static ConstantInt *getKnownValueOnEdge(Value *V, BasicBlock *From,

+ BasicBlock *To) {

// Don't look past the block defining the value, we might get the value from

// a previous loop iteration.

auto *I = dyn_cast<Instruction>(V);

@@ -2996,23 +2977,7 @@ getKnownValueOnEdge(Value *V, BasicBlock *From, BasicBlock *To,

return BI->getSuccessor(0) == To ? ConstantInt::getTrue(BI->getContext())

: ConstantInt::getFalse(BI->getContext());

- // Limit the amount of blocks we inspect.

- if (Visited.size() >= 8)

- return nullptr;

- auto Pair = Visited.try_emplace({From, To}, nullptr);

- if (!Pair.second)

- return Pair.first->second;

- // Check whether the known value is the same for all predecessors.

- ConstantInt *Common = nullptr;

- for (BasicBlock *Pred : predecessors(From)) {

- ConstantInt *C = getKnownValueOnEdge(V, Pred, From, Visited);

- if (!C || (Common && Common != C))

- return nullptr;

- Common = C;

- }

- return Visited[{From, To}] = Common;

+ return nullptr;

}

/// If we have a conditional branch on something for which we know the constant

@@ -3022,7 +2987,7 @@ static Optional<bool>

FoldCondBranchOnValueKnownInPredecessorImpl(BranchInst *BI, DomTreeUpdater *DTU,

const DataLayout &DL,

AssumptionCache *AC) {

- SmallMapVector<BasicBlock *, ConstantInt *, 8> KnownValues;

+ SmallMapVector<ConstantInt *, SmallSetVector<BasicBlock *, 2>, 2> KnownValues;

BasicBlock *BB = BI->getParent();

Value *Cond = BI->getCondition();

PHINode *PN = dyn_cast<PHINode>(Cond);

@@ -3035,12 +3000,11 @@ FoldCondBranchOnValueKnownInPredecessorImpl(BranchInst *BI, DomTreeUpdater *DTU,

for (Use &U : PN->incoming_values())

if (auto *CB = dyn_cast<ConstantInt>(U))

- KnownValues.insert({PN->getIncomingBlock(U), CB});

+ KnownValues[CB].insert(PN->getIncomingBlock(U));

} else {

- SmallDenseMap<std::pair<BasicBlock *, BasicBlock *>, ConstantInt *> Visited;

for (BasicBlock *Pred : predecessors(BB)) {

- if (ConstantInt *CB = getKnownValueOnEdge(Cond, Pred, BB, Visited))

- KnownValues.insert({Pred, CB});

+ if (ConstantInt *CB = getKnownValueOnEdge(Cond, Pred, BB))

+ KnownValues[CB].insert(Pred);

}

@@ -3056,29 +3020,34 @@ FoldCondBranchOnValueKnownInPredecessorImpl(BranchInst *BI, DomTreeUpdater *DTU,

for (const auto &Pair : KnownValues) {

// Okay, we now know that all edges from PredBB should be revectored to

// branch to RealDest.

- ConstantInt *CB = Pair.second;

- BasicBlock *PredBB = Pair.first;

+ ConstantInt *CB = Pair.first;

+ ArrayRef<BasicBlock *> PredBBs = Pair.second.getArrayRef();

BasicBlock *RealDest = BI->getSuccessor(!CB->getZExtValue());

if (RealDest == BB)

continue; // Skip self loops.

// Skip if the predecessor's terminator is an indirect branch.

- if (isa<IndirectBrInst>(PredBB->getTerminator()))

+ if (any_of(PredBBs, [](BasicBlock *PredBB) {

+ return isa<IndirectBrInst>(PredBB->getTerminator());

+ }))

continue;

- SmallVector<DominatorTree::UpdateType, 3> Updates;

+ LLVM_DEBUG({

+ dbgs() << "Condition " << *Cond << " in " << BB->getName()

+ << " has value " << *Pair.first << " in predecessors:\n";

+ for (const BasicBlock *PredBB : Pair.second)

+ dbgs() << " " << PredBB->getName() << "\n";

+ dbgs() << "Threading to destination " << RealDest->getName() << ".\n";

+ });

+ // Split the predecessors we are threading into a new edge block. We'll

+ // clone the instructions into this block, and then redirect it to RealDest.

+ BasicBlock *EdgeBB = SplitBlockPredecessors(BB, PredBBs, ".critedge", DTU);

- // The dest block might have PHI nodes, other predecessors and other

- // difficult cases. Instead of being smart about this, just insert a new

- // block that jumps to the destination block, effectively splitting

- // the edge we are about to create.

- BasicBlock *EdgeBB =

- BasicBlock::Create(BB->getContext(), RealDest->getName() + ".critedge",

- RealDest->getParent(), RealDest);

- BranchInst *CritEdgeBranch = BranchInst::Create(RealDest, EdgeBB);

- if (DTU)

- Updates.push_back({DominatorTree::Insert, EdgeBB, RealDest});

- CritEdgeBranch->setDebugLoc(BI->getDebugLoc());

+ // TODO: These just exist to reduce test diff, we can drop them if we like.

+ EdgeBB->setName(RealDest->getName() + ".critedge");

+ EdgeBB->moveBefore(RealDest);

// Update PHI nodes.

AddPredecessorToBlock(RealDest, EdgeBB, BB);

@@ -3086,12 +3055,12 @@ FoldCondBranchOnValueKnownInPredecessorImpl(BranchInst *BI, DomTreeUpdater *DTU,

// BB may have instructions that are being threaded over. Clone these

// instructions into EdgeBB. We know that there will be no uses of the

// cloned instructions outside of EdgeBB.

- BasicBlock::iterator InsertPt = EdgeBB->begin();

+ BasicBlock::iterator InsertPt = EdgeBB->getFirstInsertionPt();

DenseMap<Value *, Value *> TranslateMap; // Track translated values.

- TranslateMap[Cond] = Pair.second;

+ TranslateMap[Cond] = CB;

for (BasicBlock::iterator BBI = BB->begin(); &*BBI != BI; ++BBI) {

if (PHINode *PN = dyn_cast<PHINode>(BBI)) {

- TranslateMap[PN] = PN->getIncomingValueForBlock(PredBB);

+ TranslateMap[PN] = PN->getIncomingValueForBlock(EdgeBB);

continue;

}

// Clone the instruction.

@@ -3129,19 +3098,15 @@ FoldCondBranchOnValueKnownInPredecessorImpl(BranchInst *BI, DomTreeUpdater *DTU,

}

- // Loop over all of the edges from PredBB to BB, changing them to branch

- // to EdgeBB instead.

- Instruction *PredBBTI = PredBB->getTerminator();

- for (unsigned i = 0, e = PredBBTI->getNumSuccessors(); i != e; ++i)

- if (PredBBTI->getSuccessor(i) == BB) {

- BB->removePredecessor(PredBB);

- PredBBTI->setSuccessor(i, EdgeBB);

- }

+ BB->removePredecessor(EdgeBB);

+ BranchInst *EdgeBI = cast<BranchInst>(EdgeBB->getTerminator());

+ EdgeBI->setSuccessor(0, RealDest);

+ EdgeBI->setDebugLoc(BI->getDebugLoc());

if (DTU) {

- Updates.push_back({DominatorTree::Insert, PredBB, EdgeBB});

- Updates.push_back({DominatorTree::Delete, PredBB, BB});

+ SmallVector<DominatorTree::UpdateType, 2> Updates;

+ Updates.push_back({DominatorTree::Delete, EdgeBB, BB});

+ Updates.push_back({DominatorTree::Insert, EdgeBB, RealDest});

DTU->applyUpdates(Updates);

}

@@ -3599,13 +3564,6 @@ bool llvm::FoldBranchToCommonDest(BranchInst *BI, DomTreeUpdater *DTU,

Cond->getParent() != BB || !Cond->hasOneUse())

return false;

- // Cond is known to be a compare or binary operator. Check to make sure that

- // neither operand is a potentially-trapping constant expression.

- if (canTrap(Cond->getOperand(0)))

- return false;

- if (canTrap(Cond->getOperand(1)))

- return false;

// Finally, don't infinitely unroll conditional loops.

if (is_contained(successors(BB), BB))

return false;

@@ -4113,9 +4071,6 @@ static bool SimplifyCondBranchToCondBranch(BranchInst *PBI, BranchInst *BI,

if (tryWidenCondBranchToCondBranch(PBI, BI, DTU))

return true;

- if (canTrap(BI->getCondition()))

- return false;

// If both branches are conditional and both contain stores to the same

// address, remove the stores from the conditionals and create a conditional

// merged store at the end.

@@ -4157,10 +4112,6 @@ static bool SimplifyCondBranchToCondBranch(BranchInst *PBI, BranchInst *BI,

// insertion of a large number of select instructions. For targets

// without predication/cmovs, this is a big pessimization.

- // Also do not perform this transformation if any phi node in the common

- // destination block can trap when reached by BB or PBB (PR17073). In that

- // case, it would be unsafe to hoist the operation into a select instruction.

BasicBlock *CommonDest = PBI->getSuccessor(PBIOp);

BasicBlock *RemovedDest = PBI->getSuccessor(PBIOp ^ 1);

unsigned NumPhis = 0;

@@ -4168,16 +4119,6 @@ static bool SimplifyCondBranchToCondBranch(BranchInst *PBI, BranchInst *BI,

++II, ++NumPhis) {

if (NumPhis > 2) // Disable this xform.

return false;

- PHINode *PN = cast<PHINode>(II);

- Value *BIV = PN->getIncomingValueForBlock(BB);

- if (canTrap(BIV))

- return false;

- unsigned PBBIdx = PN->getBasicBlockIndex(PBI->getParent());

- Value *PBIV = PN->getIncomingValue(PBBIdx);

- if (canTrap(PBIV))

- return false;

}

// Finally, if everything is ok, fold the branches to logical ops.

@@ -6174,6 +6115,23 @@ ShouldBuildLookupTable(SwitchInst *SI, uint64_t TableSize,

return isSwitchDense(SI->getNumCases(), TableSize);

}

+static bool ShouldUseSwitchConditionAsTableIndex(

+ ConstantInt &MinCaseVal, const ConstantInt &MaxCaseVal,

+ bool HasDefaultResults, const SmallDenseMap<PHINode *, Type *> &ResultTypes,

+ const DataLayout &DL, const TargetTransformInfo &TTI) {

+ if (MinCaseVal.isNullValue())

+ return true;

+ if (MinCaseVal.isNegative() ||

+ MaxCaseVal.getLimitedValue() == std::numeric_limits<uint64_t>::max() ||

+ !HasDefaultResults)

+ return false;

+ return all_of(ResultTypes, [&](const auto &KV) {

+ return SwitchLookupTable::WouldFitInRegister(

+ DL, MaxCaseVal.getLimitedValue() + 1 /* TableSize */,

+ KV.second /* ResultType */);

+ });

/// Try to reuse the switch table index compare. Following pattern:

/// \code

/// if (idx < tablesize)

@@ -6329,9 +6287,6 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder,

}

uint64_t NumResults = ResultLists[PHIs[0]].size();

- APInt RangeSpread = MaxCaseVal->getValue() - MinCaseVal->getValue();

- uint64_t TableSize = RangeSpread.getLimitedValue() + 1;

- bool TableHasHoles = (NumResults < TableSize);

// If the table has holes, we need a constant result for the default case

// or a bitmask that fits in a register.

@@ -6340,6 +6295,22 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder,

getCaseResults(SI, nullptr, SI->getDefaultDest(), &CommonDest,

DefaultResultsList, DL, TTI);

+ for (const auto &I : DefaultResultsList) {

+ PHINode *PHI = I.first;

+ Constant *Result = I.second;

+ DefaultResults[PHI] = Result;

+ }

+ bool UseSwitchConditionAsTableIndex = ShouldUseSwitchConditionAsTableIndex(

+ *MinCaseVal, *MaxCaseVal, HasDefaultResults, ResultTypes, DL, TTI);

+ uint64_t TableSize;

+ if (UseSwitchConditionAsTableIndex)

+ TableSize = MaxCaseVal->getLimitedValue() + 1;

+ else

+ TableSize =

+ (MaxCaseVal->getValue() - MinCaseVal->getValue()).getLimitedValue() + 1;

+ bool TableHasHoles = (NumResults < TableSize);

bool NeedMask = (TableHasHoles && !HasDefaultResults);

if (NeedMask) {

// As an extra penalty for the validity test we require more cases.

@@ -6349,12 +6320,6 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder,

return false;

}

- for (const auto &I : DefaultResultsList) {

- PHINode *PHI = I.first;

- Constant *Result = I.second;

- DefaultResults[PHI] = Result;

- }

if (!ShouldBuildLookupTable(SI, TableSize, TTI, DL, ResultTypes))

return false;

@@ -6368,11 +6333,15 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder,

// Compute the table index value.

Builder.SetInsertPoint(SI);

Value *TableIndex;

- if (MinCaseVal->isNullValue())

+ ConstantInt *TableIndexOffset;

+ if (UseSwitchConditionAsTableIndex) {

+ TableIndexOffset = ConstantInt::get(MaxCaseVal->getType(), 0);

TableIndex = SI->getCondition();

- else

- TableIndex = Builder.CreateSub(SI->getCondition(), MinCaseVal,

- "switch.tableidx");

+ } else {

+ TableIndexOffset = MinCaseVal;

+ TableIndex =

+ Builder.CreateSub(SI->getCondition(), TableIndexOffset, "switch.tableidx");

+ }

// Compute the maximum table size representable by the integer type we are

// switching upon.

@@ -6424,7 +6393,7 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder,

// Build bitmask; fill in a 1 bit for every case.

const ResultListTy &ResultList = ResultLists[PHIs[0]];

for (size_t I = 0, E = ResultList.size(); I != E; ++I) {

- uint64_t Idx = (ResultList[I].first->getValue() - MinCaseVal->getValue())

+ uint64_t Idx = (ResultList[I].first->getValue() - TableIndexOffset->getValue())

.getLimitedValue();

MaskInt |= One << Idx;

}

@@ -6463,8 +6432,8 @@ static bool SwitchToLookupTable(SwitchInst *SI, IRBuilder<> &Builder,

// If using a bitmask, use any value to fill the lookup table holes.

Constant *DV = NeedMask ? ResultLists[PHI][0].second : DefaultResults[PHI];

StringRef FuncName = Fn->getName();

- SwitchLookupTable Table(Mod, TableSize, MinCaseVal, ResultList, DV, DL,

- FuncName);

+ SwitchLookupTable Table(Mod, TableSize, TableIndexOffset, ResultList, DV,

+ DL, FuncName);

Value *Result = Table.BuildLookup(TableIndex, Builder);

diff --git a/llvm/lib/Transforms/Utils/SimplifyIndVar.cpp b/llvm/lib/Transforms/Utils/SimplifyIndVar.cpp
index dbef1ff2e739..af15e0c31b75 100644
--- a/llvm/lib/Transforms/Utils/SimplifyIndVar.cpp
+++ b/llvm/lib/Transforms/Utils/SimplifyIndVar.cpp

@@ -79,21 +79,23 @@ namespace {

bool eliminateIdentitySCEV(Instruction *UseInst, Instruction *IVOperand);

bool replaceIVUserWithLoopInvariant(Instruction *UseInst);

+ bool replaceFloatIVWithIntegerIV(Instruction *UseInst);

bool eliminateOverflowIntrinsic(WithOverflowInst *WO);

bool eliminateSaturatingIntrinsic(SaturatingInst *SI);

bool eliminateTrunc(TruncInst *TI);

bool eliminateIVUser(Instruction *UseInst, Instruction *IVOperand);

- bool makeIVComparisonInvariant(ICmpInst *ICmp, Value *IVOperand);

- void eliminateIVComparison(ICmpInst *ICmp, Value *IVOperand);

- void simplifyIVRemainder(BinaryOperator *Rem, Value *IVOperand,

+ bool makeIVComparisonInvariant(ICmpInst *ICmp, Instruction *IVOperand);

+ void eliminateIVComparison(ICmpInst *ICmp, Instruction *IVOperand);

+ void simplifyIVRemainder(BinaryOperator *Rem, Instruction *IVOperand,

bool IsSigned);

void replaceRemWithNumerator(BinaryOperator *Rem);

void replaceRemWithNumeratorOrZero(BinaryOperator *Rem);

void replaceSRemWithURem(BinaryOperator *Rem);

bool eliminateSDiv(BinaryOperator *SDiv);

- bool strengthenOverflowingOperation(BinaryOperator *OBO, Value *IVOperand);

- bool strengthenRightShift(BinaryOperator *BO, Value *IVOperand);

+ bool strengthenOverflowingOperation(BinaryOperator *OBO,

+ Instruction *IVOperand);

+ bool strengthenRightShift(BinaryOperator *BO, Instruction *IVOperand);

};

}

@@ -192,7 +194,7 @@ Value *SimplifyIndvar::foldIVUser(Instruction *UseInst, Instruction *IVOperand)

}

bool SimplifyIndvar::makeIVComparisonInvariant(ICmpInst *ICmp,

- Value *IVOperand) {

+ Instruction *IVOperand) {

unsigned IVOperIdx = 0;

ICmpInst::Predicate Pred = ICmp->getPredicate();

if (IVOperand != ICmp->getOperand(0)) {

@@ -261,7 +263,8 @@ bool SimplifyIndvar::makeIVComparisonInvariant(ICmpInst *ICmp,

/// SimplifyIVUsers helper for eliminating useless

/// comparisons against an induction variable.

-void SimplifyIndvar::eliminateIVComparison(ICmpInst *ICmp, Value *IVOperand) {

+void SimplifyIndvar::eliminateIVComparison(ICmpInst *ICmp,

+ Instruction *IVOperand) {

unsigned IVOperIdx = 0;

ICmpInst::Predicate Pred = ICmp->getPredicate();

ICmpInst::Predicate OriginalPred = Pred;

@@ -372,7 +375,8 @@ void SimplifyIndvar::replaceRemWithNumeratorOrZero(BinaryOperator *Rem) {

/// SimplifyIVUsers helper for eliminating useless remainder operations

/// operating on an induction variable or replacing srem by urem.

-void SimplifyIndvar::simplifyIVRemainder(BinaryOperator *Rem, Value *IVOperand,

+void SimplifyIndvar::simplifyIVRemainder(BinaryOperator *Rem,

+ Instruction *IVOperand,

bool IsSigned) {

auto *NValue = Rem->getOperand(0);

auto *DValue = Rem->getOperand(1);

@@ -673,6 +677,35 @@ bool SimplifyIndvar::replaceIVUserWithLoopInvariant(Instruction *I) {

return true;

}

+/// Eliminate redundant type cast between integer and float.

+bool SimplifyIndvar::replaceFloatIVWithIntegerIV(Instruction *UseInst) {

+ if (UseInst->getOpcode() != CastInst::SIToFP)

+ return false;

+ Value *IVOperand = UseInst->getOperand(0);

+ // Get the symbolic expression for this instruction.

+ ConstantRange IVRange = SE->getSignedRange(SE->getSCEV(IVOperand));

+ unsigned DestNumSigBits = UseInst->getType()->getFPMantissaWidth();

+ if (IVRange.getActiveBits() <= DestNumSigBits) {

+ for (User *U : UseInst->users()) {

+ // Match for fptosi of sitofp and with same type.

+ auto *CI = dyn_cast<FPToSIInst>(U);

+ if (!CI || IVOperand->getType() != CI->getType())

+ continue;

+ CI->replaceAllUsesWith(IVOperand);

+ DeadInsts.push_back(CI);

+ LLVM_DEBUG(dbgs() << "INDVARS: Replace IV user: " << *CI

+ << " with: " << *IVOperand << '\n');

+ ++NumFoldedUser;

+ Changed = true;

+ }

+ return Changed;

/// Eliminate any operation that SCEV can prove is an identity function.

bool SimplifyIndvar::eliminateIdentitySCEV(Instruction *UseInst,

Instruction *IVOperand) {

@@ -718,18 +751,16 @@ bool SimplifyIndvar::eliminateIdentitySCEV(Instruction *UseInst,

/// Annotate BO with nsw / nuw if it provably does not signed-overflow /

/// unsigned-overflow. Returns true if anything changed, false otherwise.

bool SimplifyIndvar::strengthenOverflowingOperation(BinaryOperator *BO,

- Value *IVOperand) {

- SCEV::NoWrapFlags Flags;

- bool Deduced;

- std::tie(Flags, Deduced) = SE->getStrengthenedNoWrapFlagsFromBinOp(

+ Instruction *IVOperand) {

+ auto Flags = SE->getStrengthenedNoWrapFlagsFromBinOp(

cast<OverflowingBinaryOperator>(BO));

- if (!Deduced)

- return Deduced;

+ if (!Flags)

+ return false;

- BO->setHasNoUnsignedWrap(ScalarEvolution::maskFlags(Flags, SCEV::FlagNUW) ==

+ BO->setHasNoUnsignedWrap(ScalarEvolution::maskFlags(*Flags, SCEV::FlagNUW) ==

SCEV::FlagNUW);

- BO->setHasNoSignedWrap(ScalarEvolution::maskFlags(Flags, SCEV::FlagNSW) ==

+ BO->setHasNoSignedWrap(ScalarEvolution::maskFlags(*Flags, SCEV::FlagNSW) ==

SCEV::FlagNSW);

// The getStrengthenedNoWrapFlagsFromBinOp() check inferred additional nowrap

@@ -737,14 +768,14 @@ bool SimplifyIndvar::strengthenOverflowingOperation(BinaryOperator *BO,

// forgetValue() here to make sure those flags also propagate to any other

// SCEV expressions based on the addrec. However, this can have pathological

// compile-time impact, see https://bugs.llvm.org/show_bug.cgi?id=50384.

- return Deduced;

+ return true;

}

/// Annotate the Shr in (X << IVOperand) >> C as exact using the

/// information from the IV's range. Returns true if anything changed, false

/// otherwise.

bool SimplifyIndvar::strengthenRightShift(BinaryOperator *BO,

- Value *IVOperand) {

+ Instruction *IVOperand) {

using namespace llvm::PatternMatch;

if (BO->getOpcode() == Instruction::Shl) {

@@ -896,6 +927,13 @@ void SimplifyIndvar::simplifyUsers(PHINode *CurrIV, IVVisitor *V) {

}

+ // Try to use integer induction for FPToSI of float induction directly.

+ if (replaceFloatIVWithIntegerIV(UseInst)) {

+ // Re-queue the potentially new direct uses of IVOperand.

+ pushIVUsers(IVOperand, L, Simplified, SimpleIVUsers);

+ continue;

+ }

CastInst *Cast = dyn_cast<CastInst>(UseInst);

if (V && Cast) {

V->visitCast(Cast);

diff --git a/llvm/lib/Transforms/Utils/SimplifyLibCalls.cpp b/llvm/lib/Transforms/Utils/SimplifyLibCalls.cpp
index f4306bb43dfd..b359717424a6 100644
--- a/llvm/lib/Transforms/Utils/SimplifyLibCalls.cpp
+++ b/llvm/lib/Transforms/Utils/SimplifyLibCalls.cpp

@@ -75,7 +75,8 @@ static bool callHasFP128Argument(const CallInst *CI) {

});

}

-static Value *convertStrToNumber(CallInst *CI, StringRef &Str, int64_t Base) {

+static Value *convertStrToNumber(CallInst *CI, StringRef &Str, Value *EndPtr,

+ int64_t Base, IRBuilderBase &B) {

if (Base < 2 || Base > 36)

// handle special zero base

if (Base != 0)

@@ -97,6 +98,15 @@ static Value *convertStrToNumber(CallInst *CI, StringRef &Str, int64_t Base) {

if (!isIntN(CI->getType()->getPrimitiveSizeInBits(), Result))

return nullptr;

+ if (EndPtr) {

+ // Store the pointer to the end.

+ uint64_t ILen = End - nptr.c_str();

+ Value *Off = B.getInt64(ILen);

+ Value *StrBeg = CI->getArgOperand(0);

+ Value *StrEnd = B.CreateInBoundsGEP(B.getInt8Ty(), StrBeg, Off, "endptr");

+ B.CreateStore(StrEnd, EndPtr);

+ }

return ConstantInt::get(CI->getType(), Result);

}

@@ -295,31 +305,69 @@ Value *LibCallSimplifier::optimizeStrNCat(CallInst *CI, IRBuilderBase &B) {

return copyFlags(*CI, emitStrLenMemCpy(Src, Dst, SrcLen, B));

}

+// Helper to transform memchr(S, C, N) == S to N && *S == C and, when

+// NBytes is null, strchr(S, C) to *S == C. A precondition of the function

+// is that either S is dereferenceable or the value of N is nonzero.

+static Value* memChrToCharCompare(CallInst *CI, Value *NBytes,

+ IRBuilderBase &B, const DataLayout &DL)

+ Value *Src = CI->getArgOperand(0);

+ Value *CharVal = CI->getArgOperand(1);

+ // Fold memchr(A, C, N) == A to N && *A == C.

+ Type *CharTy = B.getInt8Ty();

+ Value *Char0 = B.CreateLoad(CharTy, Src);

+ CharVal = B.CreateTrunc(CharVal, CharTy);

+ Value *Cmp = B.CreateICmpEQ(Char0, CharVal, "char0cmp");

+ if (NBytes) {

+ Value *Zero = ConstantInt::get(NBytes->getType(), 0);

+ Value *And = B.CreateICmpNE(NBytes, Zero);

+ Cmp = B.CreateLogicalAnd(And, Cmp);

+ }

+ Value *NullPtr = Constant::getNullValue(CI->getType());

+ return B.CreateSelect(Cmp, Src, NullPtr);

Value *LibCallSimplifier::optimizeStrChr(CallInst *CI, IRBuilderBase &B) {

- Function *Callee = CI->getCalledFunction();

- FunctionType *FT = Callee->getFunctionType();

Value *SrcStr = CI->getArgOperand(0);

+ Value *CharVal = CI->getArgOperand(1);

annotateNonNullNoUndefBasedOnAccess(CI, 0);

+ if (isOnlyUsedInEqualityComparison(CI, SrcStr))

+ return memChrToCharCompare(CI, nullptr, B, DL);

// If the second operand is non-constant, see if we can compute the length

// of the input string and turn this into memchr.

- ConstantInt *CharC = dyn_cast<ConstantInt>(CI->getArgOperand(1));

+ ConstantInt *CharC = dyn_cast<ConstantInt>(CharVal);

if (!CharC) {

uint64_t Len = GetStringLength(SrcStr);

if (Len)

annotateDereferenceableBytes(CI, 0, Len);

else

return nullptr;

+ Function *Callee = CI->getCalledFunction();

+ FunctionType *FT = Callee->getFunctionType();

if (!FT->getParamType(1)->isIntegerTy(32)) // memchr needs i32.

return nullptr;

return copyFlags(

*CI,

- emitMemChr(SrcStr, CI->getArgOperand(1), // include nul.

+ emitMemChr(SrcStr, CharVal, // include nul.

ConstantInt::get(DL.getIntPtrType(CI->getContext()), Len), B,

DL, TLI));

}

+ if (CharC->isZero()) {

+ Value *NullPtr = Constant::getNullValue(CI->getType());

+ if (isOnlyUsedInEqualityComparison(CI, NullPtr))

+ // Pre-empt the transformation to strlen below and fold

+ // strchr(A, '\0') == null to false.

+ return B.CreateIntToPtr(B.getTrue(), CI->getType());

+ }

// Otherwise, the character is a constant, see if the first argument is

// a string literal. If so, we can constant fold.

StringRef Str;

@@ -1008,8 +1056,12 @@ Value *LibCallSimplifier::optimizeMemRChr(CallInst *CI, IRBuilderBase &B) {

Value *LibCallSimplifier::optimizeMemChr(CallInst *CI, IRBuilderBase &B) {

Value *SrcStr = CI->getArgOperand(0);

Value *Size = CI->getArgOperand(2);

- if (isKnownNonZero(Size, DL))

+ if (isKnownNonZero(Size, DL)) {

annotateNonNullNoUndefBasedOnAccess(CI, 0);

+ if (isOnlyUsedInEqualityComparison(CI, SrcStr))

+ return memChrToCharCompare(CI, Size, B, DL);

+ }

Value *CharVal = CI->getArgOperand(1);

ConstantInt *CharC = dyn_cast<ConstantInt>(CharVal);

@@ -1099,9 +1151,16 @@ Value *LibCallSimplifier::optimizeMemChr(CallInst *CI, IRBuilderBase &B) {

return B.CreateSelect(And, SrcStr, Sel1, "memchr.sel2");

}

- if (!LenC)

+ if (!LenC) {

+ if (isOnlyUsedInEqualityComparison(CI, SrcStr))

+ // S is dereferenceable so it's safe to load from it and fold

+ // memchr(S, C, N) == S to N && *S == C for any C and N.

+ // TODO: This is safe even even for nonconstant S.

+ return memChrToCharCompare(CI, Size, B, DL);

// From now on we need a constant length and constant array.

return nullptr;

+ }

// If the char is variable but the input str and length are not we can turn

// this memchr call into a simple bit field test. Of course this only works

@@ -1589,31 +1648,6 @@ static Value *optimizeTrigReflections(CallInst *Call, LibFunc Func,

return nullptr;

}

-static Value *getPow(Value *InnerChain[33], unsigned Exp, IRBuilderBase &B) {

- // Multiplications calculated using Addition Chains.

- // Refer: http://wwwhomes.uni-bielefeld.de/achim/addition_chain.html

- assert(Exp != 0 && "Incorrect exponent 0 not handled");

- if (InnerChain[Exp])

- return InnerChain[Exp];

- static const unsigned AddChain[33][2] = {

- {0, 0}, // Unused.

- {0, 0}, // Unused (base case = pow1).

- {1, 1}, // Unused (pre-computed).

- {1, 2}, {2, 2}, {2, 3}, {3, 3}, {2, 5}, {4, 4},

- {1, 8}, {5, 5}, {1, 10}, {6, 6}, {4, 9}, {7, 7},

- {3, 12}, {8, 8}, {8, 9}, {2, 16}, {1, 18}, {10, 10},

- {6, 15}, {11, 11}, {3, 20}, {12, 12}, {8, 17}, {13, 13},

- {3, 24}, {14, 14}, {4, 25}, {15, 15}, {3, 28}, {16, 16},

- };

- InnerChain[Exp] = B.CreateFMul(getPow(InnerChain, AddChain[Exp][0], B),

- getPow(InnerChain, AddChain[Exp][1], B));

- return InnerChain[Exp];

// Return a properly extended integer (DstWidth bits wide) if the operation is

// an itofp.

static Value *getIntToFPVal(Value *I2F, IRBuilderBase &B, unsigned DstWidth) {

@@ -1914,70 +1948,52 @@ Value *LibCallSimplifier::optimizePow(CallInst *Pow, IRBuilderBase &B) {

if (Value *Sqrt = replacePowWithSqrt(Pow, B))

return Sqrt;

- // pow(x, n) -> x * x * x * ...

+ // pow(x, n) -> powi(x, n) * sqrt(x) if n has exactly a 0.5 fraction

const APFloat *ExpoF;

- if (AllowApprox && match(Expo, m_APFloat(ExpoF)) &&

- !ExpoF->isExactlyValue(0.5) && !ExpoF->isExactlyValue(-0.5)) {

- // We limit to a max of 7 multiplications, thus the maximum exponent is 32.

- // If the exponent is an integer+0.5 we generate a call to sqrt and an

- // additional fmul.

- // TODO: This whole transformation should be backend specific (e.g. some

- // backends might prefer libcalls or the limit for the exponent might

- // be different) and it should also consider optimizing for size.

- APFloat LimF(ExpoF->getSemantics(), 33),

- ExpoA(abs(*ExpoF));

- if (ExpoA < LimF) {

- // This transformation applies to integer or integer+0.5 exponents only.

- // For integer+0.5, we create a sqrt(Base) call.

- Value *Sqrt = nullptr;

- if (!ExpoA.isInteger()) {

- APFloat Expo2 = ExpoA;

- // To check if ExpoA is an integer + 0.5, we add it to itself. If there

- // is no floating point exception and the result is an integer, then

- // ExpoA == integer + 0.5

- if (Expo2.add(ExpoA, APFloat::rmNearestTiesToEven) != APFloat::opOK)

- return nullptr;

- if (!Expo2.isInteger())

- return nullptr;

- Sqrt = getSqrtCall(Base, Pow->getCalledFunction()->getAttributes(),

- Pow->doesNotAccessMemory(), M, B, TLI);

- if (!Sqrt)

- return nullptr;

- }

- // We will memoize intermediate products of the Addition Chain.

- Value *InnerChain[33] = {nullptr};

- InnerChain[1] = Base;

- InnerChain[2] = B.CreateFMul(Base, Base, "square");

- // We cannot readily convert a non-double type (like float) to a double.

- // So we first convert it to something which could be converted to double.

- ExpoA.convert(APFloat::IEEEdouble(), APFloat::rmTowardZero, &Ignored);

- Value *FMul = getPow(InnerChain, ExpoA.convertToDouble(), B);

+ if (match(Expo, m_APFloat(ExpoF)) && !ExpoF->isExactlyValue(0.5) &&

+ !ExpoF->isExactlyValue(-0.5)) {

+ APFloat ExpoA(abs(*ExpoF));

+ APFloat ExpoI(*ExpoF);

+ Value *Sqrt = nullptr;

+ if (AllowApprox && !ExpoA.isInteger()) {

+ APFloat Expo2 = ExpoA;

+ // To check if ExpoA is an integer + 0.5, we add it to itself. If there

+ // is no floating point exception and the result is an integer, then

+ // ExpoA == integer + 0.5

+ if (Expo2.add(ExpoA, APFloat::rmNearestTiesToEven) != APFloat::opOK)

+ return nullptr;

- // Expand pow(x, y+0.5) to pow(x, y) * sqrt(x).

- if (Sqrt)

- FMul = B.CreateFMul(FMul, Sqrt);

+ if (!Expo2.isInteger())

+ return nullptr;

- // If the exponent is negative, then get the reciprocal.

- if (ExpoF->isNegative())

- FMul = B.CreateFDiv(ConstantFP::get(Ty, 1.0), FMul, "reciprocal");

+ if (ExpoI.roundToIntegral(APFloat::rmTowardNegative) !=

+ APFloat::opInexact)

+ return nullptr;

+ if (!ExpoI.isInteger())

+ return nullptr;

+ ExpoF = &ExpoI;

- return FMul;

+ Sqrt = getSqrtCall(Base, Pow->getCalledFunction()->getAttributes(),

+ Pow->doesNotAccessMemory(), M, B, TLI);

+ if (!Sqrt)

+ return nullptr;

}

+ // pow(x, n) -> powi(x, n) if n is a constant signed integer value

APSInt IntExpo(TLI->getIntSize(), /*isUnsigned=*/false);

- // powf(x, n) -> powi(x, n) if n is a constant signed integer value

if (ExpoF->isInteger() &&

ExpoF->convertToInteger(IntExpo, APFloat::rmTowardZero, &Ignored) ==

APFloat::opOK) {

- return copyFlags(

+ Value *PowI = copyFlags(

*Pow,

createPowWithIntegerExponent(

Base, ConstantInt::get(B.getIntNTy(TLI->getIntSize()), IntExpo),

M, B));

+ if (PowI && Sqrt)

+ return B.CreateFMul(PowI, Sqrt);

+ return PowI;

}

@@ -2517,7 +2533,7 @@ Value *LibCallSimplifier::optimizeAtoi(CallInst *CI, IRBuilderBase &B) {

if (!getConstantStringInfo(CI->getArgOperand(0), Str))

return nullptr;

- return convertStrToNumber(CI, Str, 10);

+ return convertStrToNumber(CI, Str, nullptr, 10, B);

}

Value *LibCallSimplifier::optimizeStrtol(CallInst *CI, IRBuilderBase &B) {

@@ -2525,11 +2541,14 @@ Value *LibCallSimplifier::optimizeStrtol(CallInst *CI, IRBuilderBase &B) {

if (!getConstantStringInfo(CI->getArgOperand(0), Str))

return nullptr;

- if (!isa<ConstantPointerNull>(CI->getArgOperand(1)))

+ Value *EndPtr = CI->getArgOperand(1);

+ if (isa<ConstantPointerNull>(EndPtr))

+ EndPtr = nullptr;

+ else if (!isKnownNonZero(EndPtr, DL))

return nullptr;

if (ConstantInt *CInt = dyn_cast<ConstantInt>(CI->getArgOperand(2))) {

- return convertStrToNumber(CI, Str, CInt->getSExtValue());

+ return convertStrToNumber(CI, Str, EndPtr, CInt->getSExtValue(), B);

}

return nullptr;