about summary refs log tree commit diff
path: root/lib/Transforms/InstCombine/InstCombineCasts.cpp
diff options
context:
space:
mode:
author    Dimitry Andric <dim@FreeBSD.org>  2017-04-16 16:01:22 +0000
committer Dimitry Andric <dim@FreeBSD.org>  2017-04-16 16:01:22 +0000
commit    71d5a2540a98c81f5bcaeb48805e0e2881f530ef (patch)
tree      5343938942df402b49ec7300a1c25a2d4ccd5821 /lib/Transforms/InstCombine/InstCombineCasts.cpp
parent    31bbf64f3a4974a2d6c8b3b27ad2f519caf74057 (diff)
Diffstat (limited to 'lib/Transforms/InstCombine/InstCombineCasts.cpp')
-rw-r--r--  lib/Transforms/InstCombine/InstCombineCasts.cpp  169
1 file changed, 118 insertions, 51 deletions
diff --git a/lib/Transforms/InstCombine/InstCombineCasts.cpp b/lib/Transforms/InstCombine/InstCombineCasts.cpp
index e74b590e2b7c..25683132c786 100644
--- a/lib/Transforms/InstCombine/InstCombineCasts.cpp
+++ b/lib/Transforms/InstCombine/InstCombineCasts.cpp
@@ -274,12 +274,12 @@ Instruction *InstCombiner::commonCastTransforms(CastInst &CI) {
return NV;
// If we are casting a PHI, then fold the cast into the PHI.
- if (isa<PHINode>(Src)) {
+ if (auto *PN = dyn_cast<PHINode>(Src)) {
// Don't do this if it would create a PHI node with an illegal type from a
// legal type.
if (!Src->getType()->isIntegerTy() || !CI.getType()->isIntegerTy() ||
- ShouldChangeType(CI.getType(), Src->getType()))
- if (Instruction *NV = FoldOpIntoPhi(CI))
+ shouldChangeType(CI.getType(), Src->getType()))
+ if (Instruction *NV = foldOpIntoPhi(CI, PN))
return NV;
}
@@ -447,7 +447,7 @@ static Instruction *foldVecTruncToExtElt(TruncInst &Trunc, InstCombiner &IC,
Instruction *InstCombiner::shrinkBitwiseLogic(TruncInst &Trunc) {
Type *SrcTy = Trunc.getSrcTy();
Type *DestTy = Trunc.getType();
- if (isa<IntegerType>(SrcTy) && !ShouldChangeType(SrcTy, DestTy))
+ if (isa<IntegerType>(SrcTy) && !shouldChangeType(SrcTy, DestTy))
return nullptr;
BinaryOperator *LogicOp;
@@ -463,6 +463,56 @@ Instruction *InstCombiner::shrinkBitwiseLogic(TruncInst &Trunc) {
return BinaryOperator::Create(LogicOp->getOpcode(), NarrowOp0, NarrowC);
}
+/// Try to narrow the width of a splat shuffle. This could be generalized to any
+/// shuffle with a constant operand, but we limit the transform to avoid
+/// creating a shuffle type that targets may not be able to lower effectively.
+static Instruction *shrinkSplatShuffle(TruncInst &Trunc,
+ InstCombiner::BuilderTy &Builder) {
+ auto *Shuf = dyn_cast<ShuffleVectorInst>(Trunc.getOperand(0));
+ if (Shuf && Shuf->hasOneUse() && isa<UndefValue>(Shuf->getOperand(1)) &&
+ Shuf->getMask()->getSplatValue() &&
+ Shuf->getType() == Shuf->getOperand(0)->getType()) {
+ // trunc (shuf X, Undef, SplatMask) --> shuf (trunc X), Undef, SplatMask
+ Constant *NarrowUndef = UndefValue::get(Trunc.getType());
+ Value *NarrowOp = Builder.CreateTrunc(Shuf->getOperand(0), Trunc.getType());
+ return new ShuffleVectorInst(NarrowOp, NarrowUndef, Shuf->getMask());
+ }
+
+ return nullptr;
+}
+
+/// Try to narrow the width of an insert element. This could be generalized for
+/// any vector constant, but we limit the transform to insertion into undef to
+/// avoid potential backend problems from unsupported insertion widths. This
+/// could also be extended to handle the case of inserting a scalar constant
+/// into a vector variable.
+static Instruction *shrinkInsertElt(CastInst &Trunc,
+ InstCombiner::BuilderTy &Builder) {
+ Instruction::CastOps Opcode = Trunc.getOpcode();
+ assert((Opcode == Instruction::Trunc || Opcode == Instruction::FPTrunc) &&
+ "Unexpected instruction for shrinking");
+
+ auto *InsElt = dyn_cast<InsertElementInst>(Trunc.getOperand(0));
+ if (!InsElt || !InsElt->hasOneUse())
+ return nullptr;
+
+ Type *DestTy = Trunc.getType();
+ Type *DestScalarTy = DestTy->getScalarType();
+ Value *VecOp = InsElt->getOperand(0);
+ Value *ScalarOp = InsElt->getOperand(1);
+ Value *Index = InsElt->getOperand(2);
+
+ if (isa<UndefValue>(VecOp)) {
+ // trunc (inselt undef, X, Index) --> inselt undef, (trunc X), Index
+ // fptrunc (inselt undef, X, Index) --> inselt undef, (fptrunc X), Index
+ UndefValue *NarrowUndef = UndefValue::get(DestTy);
+ Value *NarrowOp = Builder.CreateCast(Opcode, ScalarOp, DestScalarTy);
+ return InsertElementInst::Create(NarrowUndef, NarrowOp, Index);
+ }
+
+ return nullptr;
+}
+
Instruction *InstCombiner::visitTrunc(TruncInst &CI) {
if (Instruction *Result = commonCastTransforms(CI))
return Result;
@@ -488,7 +538,7 @@ Instruction *InstCombiner::visitTrunc(TruncInst &CI) {
// type. Only do this if the dest type is a simple type, don't convert the
// expression tree to something weird like i93 unless the source is also
// strange.
- if ((DestTy->isVectorTy() || ShouldChangeType(SrcTy, DestTy)) &&
+ if ((DestTy->isVectorTy() || shouldChangeType(SrcTy, DestTy)) &&
canEvaluateTruncated(Src, DestTy, *this, &CI)) {
// If this cast is a truncate, evaluting in a different type always
@@ -554,8 +604,14 @@ Instruction *InstCombiner::visitTrunc(TruncInst &CI) {
if (Instruction *I = shrinkBitwiseLogic(CI))
return I;
+ if (Instruction *I = shrinkSplatShuffle(CI, *Builder))
+ return I;
+
+ if (Instruction *I = shrinkInsertElt(CI, *Builder))
+ return I;
+
if (Src->hasOneUse() && isa<IntegerType>(SrcTy) &&
- ShouldChangeType(SrcTy, DestTy)) {
+ shouldChangeType(SrcTy, DestTy)) {
// Transform "trunc (shl X, cst)" -> "shl (trunc X), cst" so long as the
// dest type is native and cst < dest size.
if (match(Src, m_Shl(m_Value(A), m_ConstantInt(Cst))) &&
@@ -838,11 +894,6 @@ Instruction *InstCombiner::visitZExt(ZExtInst &CI) {
if (Instruction *Result = commonCastTransforms(CI))
return Result;
- // See if we can simplify any instructions used by the input whose sole
- // purpose is to compute bits we don't care about.
- if (SimplifyDemandedInstructionBits(CI))
- return &CI;
-
Value *Src = CI.getOperand(0);
Type *SrcTy = Src->getType(), *DestTy = CI.getType();
@@ -851,10 +902,10 @@ Instruction *InstCombiner::visitZExt(ZExtInst &CI) {
// expression tree to something weird like i93 unless the source is also
// strange.
unsigned BitsToClear;
- if ((DestTy->isVectorTy() || ShouldChangeType(SrcTy, DestTy)) &&
+ if ((DestTy->isVectorTy() || shouldChangeType(SrcTy, DestTy)) &&
canEvaluateZExtd(Src, DestTy, BitsToClear, *this, &CI)) {
- assert(BitsToClear < SrcTy->getScalarSizeInBits() &&
- "Unreasonable BitsToClear");
+ assert(BitsToClear <= SrcTy->getScalarSizeInBits() &&
+ "Can't clear more bits than in SrcTy");
// Okay, we can transform this! Insert the new expression now.
DEBUG(dbgs() << "ICE: EvaluateInDifferentType converting expression type"
@@ -1124,11 +1175,6 @@ Instruction *InstCombiner::visitSExt(SExtInst &CI) {
if (Instruction *I = commonCastTransforms(CI))
return I;
- // See if we can simplify any instructions used by the input whose sole
- // purpose is to compute bits we don't care about.
- if (SimplifyDemandedInstructionBits(CI))
- return &CI;
-
Value *Src = CI.getOperand(0);
Type *SrcTy = Src->getType(), *DestTy = CI.getType();
@@ -1145,7 +1191,7 @@ Instruction *InstCombiner::visitSExt(SExtInst &CI) {
// type. Only do this if the dest type is a simple type, don't convert the
// expression tree to something weird like i93 unless the source is also
// strange.
- if ((DestTy->isVectorTy() || ShouldChangeType(SrcTy, DestTy)) &&
+ if ((DestTy->isVectorTy() || shouldChangeType(SrcTy, DestTy)) &&
canEvaluateSExtd(Src, DestTy)) {
// Okay, we can transform this! Insert the new expression now.
DEBUG(dbgs() << "ICE: EvaluateInDifferentType converting expression type"
@@ -1167,18 +1213,16 @@ Instruction *InstCombiner::visitSExt(SExtInst &CI) {
ShAmt);
}
- // If this input is a trunc from our destination, then turn sext(trunc(x))
+ // If the input is a trunc from the destination type, then turn sext(trunc(x))
// into shifts.
- if (TruncInst *TI = dyn_cast<TruncInst>(Src))
- if (TI->hasOneUse() && TI->getOperand(0)->getType() == DestTy) {
- uint32_t SrcBitSize = SrcTy->getScalarSizeInBits();
- uint32_t DestBitSize = DestTy->getScalarSizeInBits();
-
- // We need to emit a shl + ashr to do the sign extend.
- Value *ShAmt = ConstantInt::get(DestTy, DestBitSize-SrcBitSize);
- Value *Res = Builder->CreateShl(TI->getOperand(0), ShAmt, "sext");
- return BinaryOperator::CreateAShr(Res, ShAmt);
- }
+ Value *X;
+ if (match(Src, m_OneUse(m_Trunc(m_Value(X)))) && X->getType() == DestTy) {
+ // sext(trunc(X)) --> ashr(shl(X, C), C)
+ unsigned SrcBitSize = SrcTy->getScalarSizeInBits();
+ unsigned DestBitSize = DestTy->getScalarSizeInBits();
+ Constant *ShAmt = ConstantInt::get(DestTy, DestBitSize - SrcBitSize);
+ return BinaryOperator::CreateAShr(Builder->CreateShl(X, ShAmt), ShAmt);
+ }
if (ICmpInst *ICI = dyn_cast<ICmpInst>(Src))
return transformSExtICmp(ICI, CI);
@@ -1225,17 +1269,15 @@ static Constant *fitsInFPType(ConstantFP *CFP, const fltSemantics &Sem) {
return nullptr;
}
-/// If this is a floating-point extension instruction, look
-/// through it until we get the source value.
+/// Look through floating-point extensions until we get the source value.
static Value *lookThroughFPExtensions(Value *V) {
- if (Instruction *I = dyn_cast<Instruction>(V))
- if (I->getOpcode() == Instruction::FPExt)
- return lookThroughFPExtensions(I->getOperand(0));
+ while (auto *FPExt = dyn_cast<FPExtInst>(V))
+ V = FPExt->getOperand(0);
// If this value is a constant, return the constant in the smallest FP type
// that can accurately represent it. This allows us to turn
// (float)((double)X+2.0) into x+2.0f.
- if (ConstantFP *CFP = dyn_cast<ConstantFP>(V)) {
+ if (auto *CFP = dyn_cast<ConstantFP>(V)) {
if (CFP->getType() == Type::getPPC_FP128Ty(V->getContext()))
return V; // No constant folding of this.
// See if the value can be truncated to half and then reextended.
@@ -1392,24 +1434,49 @@ Instruction *InstCombiner::visitFPTrunc(FPTruncInst &CI) {
IntrinsicInst *II = dyn_cast<IntrinsicInst>(CI.getOperand(0));
if (II) {
switch (II->getIntrinsicID()) {
- default: break;
- case Intrinsic::fabs: {
- // (fptrunc (fabs x)) -> (fabs (fptrunc x))
- Value *InnerTrunc = Builder->CreateFPTrunc(II->getArgOperand(0),
- CI.getType());
- Type *IntrinsicType[] = { CI.getType() };
- Function *Overload = Intrinsic::getDeclaration(
- CI.getModule(), II->getIntrinsicID(), IntrinsicType);
-
- SmallVector<OperandBundleDef, 1> OpBundles;
- II->getOperandBundlesAsDefs(OpBundles);
-
- Value *Args[] = { InnerTrunc };
- return CallInst::Create(Overload, Args, OpBundles, II->getName());
+ default: break;
+ case Intrinsic::fabs:
+ case Intrinsic::ceil:
+ case Intrinsic::floor:
+ case Intrinsic::rint:
+ case Intrinsic::round:
+ case Intrinsic::nearbyint:
+ case Intrinsic::trunc: {
+ Value *Src = II->getArgOperand(0);
+ if (!Src->hasOneUse())
+ break;
+
+ // Except for fabs, this transformation requires the input of the unary FP
+ // operation to be itself an fpext from the type to which we're
+ // truncating.
+ if (II->getIntrinsicID() != Intrinsic::fabs) {
+ FPExtInst *FPExtSrc = dyn_cast<FPExtInst>(Src);
+ if (!FPExtSrc || FPExtSrc->getOperand(0)->getType() != CI.getType())
+ break;
}
+
+ // Do unary FP operation on smaller type.
+ // (fptrunc (fabs x)) -> (fabs (fptrunc x))
+ Value *InnerTrunc = Builder->CreateFPTrunc(Src, CI.getType());
+ Type *IntrinsicType[] = { CI.getType() };
+ Function *Overload = Intrinsic::getDeclaration(
+ CI.getModule(), II->getIntrinsicID(), IntrinsicType);
+
+ SmallVector<OperandBundleDef, 1> OpBundles;
+ II->getOperandBundlesAsDefs(OpBundles);
+
+ Value *Args[] = { InnerTrunc };
+ CallInst *NewCI = CallInst::Create(Overload, Args,
+ OpBundles, II->getName());
+ NewCI->copyFastMathFlags(II);
+ return NewCI;
+ }
}
}
+ if (Instruction *I = shrinkInsertElt(CI, *Builder))
+ return I;
+
return nullptr;
}