author:    Dimitry Andric <dim@FreeBSD.org>    2022-03-20 11:40:34 +0000
committer: Dimitry Andric <dim@FreeBSD.org>    2022-05-14 11:43:05 +0000
commit:    349cc55c9796c4596a5b9904cd3281af295f878f (patch)
tree:      410c5a785075730a35f1272ca6a7adf72222ad03 /contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
parent:    cb2ae6163174b90e999326ecec3699ee093a5d43 (diff)
parent:    c0981da47d5696fe36474fcf86b4ce03ae3ff818 (diff)

Diffstat (limited to 'contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp')

 contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp (-rw-r--r--) | 924
 1 file changed, 690 insertions(+), 234 deletions(-)
diff --git a/contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
index 2a98464425c4..008665d50233 100644
--- a/contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/contrib/llvm-project/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -28,6 +28,7 @@
 #include "llvm/Analysis/MemoryLocation.h"
 #include "llvm/Analysis/ProfileSummaryInfo.h"
 #include "llvm/Analysis/ValueTracking.h"
+#include "llvm/CodeGen/Analysis.h"
 #include "llvm/CodeGen/FunctionLoweringInfo.h"
 #include "llvm/CodeGen/ISDOpcodes.h"
 #include "llvm/CodeGen/MachineBasicBlock.h"
@@ -175,7 +176,7 @@ bool ISD::isConstantSplatVectorAllOnes(const SDNode *N, bool BuildVectorOnly) {
 
   if (!BuildVectorOnly && N->getOpcode() == ISD::SPLAT_VECTOR) {
     APInt SplatVal;
-    return isConstantSplatVector(N, SplatVal) && SplatVal.isAllOnesValue();
+    return isConstantSplatVector(N, SplatVal) && SplatVal.isAllOnes();
   }
 
   if (N->getOpcode() != ISD::BUILD_VECTOR) return false;
@@ -224,7 +225,7 @@ bool ISD::isConstantSplatVectorAllZeros(const SDNode *N, bool BuildVectorOnly) {
 
   if (!BuildVectorOnly && N->getOpcode() == ISD::SPLAT_VECTOR) {
     APInt SplatVal;
-    return isConstantSplatVector(N, SplatVal) && SplatVal.isNullValue();
+    return isConstantSplatVector(N, SplatVal) && SplatVal.isZero();
  }
 
   if (N->getOpcode() != ISD::BUILD_VECTOR) return false;
@@ -412,6 +413,28 @@ bool ISD::isVPOpcode(unsigned Opcode) {
   }
 }
 
+bool ISD::isVPBinaryOp(unsigned Opcode) {
+  switch (Opcode) {
+  default:
+    return false;
+#define PROPERTY_VP_BINARYOP_SDNODE(SDOPC)                                     \
+  case ISD::SDOPC:                                                             \
+    return true;
+#include "llvm/IR/VPIntrinsics.def"
+  }
+}
+
+bool ISD::isVPReduction(unsigned Opcode) {
+  switch (Opcode) {
+  default:
+    return false;
+#define PROPERTY_VP_REDUCTION_SDNODE(SDOPC)                                    \
+  case ISD::SDOPC:                                                             \
+    return true;
+#include "llvm/IR/VPIntrinsics.def"
+  }
+}
+
 /// The operand position of the vector mask.
 Optional<unsigned> ISD::getVPMaskIdx(unsigned Opcode) {
   switch (Opcode) {
@@ -683,6 +706,34 @@ static void AddNodeIDCustom(FoldingSetNodeID &ID, const SDNode *N) {
     ID.AddInteger(ST->getPointerInfo().getAddrSpace());
     break;
   }
+  case ISD::VP_LOAD: {
+    const VPLoadSDNode *ELD = cast<VPLoadSDNode>(N);
+    ID.AddInteger(ELD->getMemoryVT().getRawBits());
+    ID.AddInteger(ELD->getRawSubclassData());
+    ID.AddInteger(ELD->getPointerInfo().getAddrSpace());
+    break;
+  }
+  case ISD::VP_STORE: {
+    const VPStoreSDNode *EST = cast<VPStoreSDNode>(N);
+    ID.AddInteger(EST->getMemoryVT().getRawBits());
+    ID.AddInteger(EST->getRawSubclassData());
+    ID.AddInteger(EST->getPointerInfo().getAddrSpace());
+    break;
+  }
+  case ISD::VP_GATHER: {
+    const VPGatherSDNode *EG = cast<VPGatherSDNode>(N);
+    ID.AddInteger(EG->getMemoryVT().getRawBits());
+    ID.AddInteger(EG->getRawSubclassData());
+    ID.AddInteger(EG->getPointerInfo().getAddrSpace());
+    break;
+  }
+  case ISD::VP_SCATTER: {
+    const VPScatterSDNode *ES = cast<VPScatterSDNode>(N);
+    ID.AddInteger(ES->getMemoryVT().getRawBits());
+    ID.AddInteger(ES->getRawSubclassData());
+    ID.AddInteger(ES->getPointerInfo().getAddrSpace());
+    break;
+  }
   case ISD::MLOAD: {
     const MaskedLoadSDNode *MLD = cast<MaskedLoadSDNode>(N);
     ID.AddInteger(MLD->getMemoryVT().getRawBits());
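The new ISD::isVPBinaryOp and ISD::isVPReduction predicates above are generated by re-including llvm/IR/VPIntrinsics.def with a property macro defined, so the switch picks up one case per VP opcode listed in the .def file. A minimal self-contained sketch of that X-macro technique (the opcode names and MY_VP_BINARY_OPS list here are made up for illustration, not the real VP opcode set):

#include <cstdio>

// Stand-in for a .def file: one X(...) entry per opcode (hypothetical names).
#define MY_VP_BINARY_OPS(X) X(VP_ADD) X(VP_SUB) X(VP_MUL)

enum Opcode : unsigned {
#define ENUM_ENTRY(OPC) OPC,
  MY_VP_BINARY_OPS(ENUM_ENTRY)
#undef ENUM_ENTRY
  NOT_A_VP_BINARY_OP
};

// Same shape as ISD::isVPBinaryOp: the macro expands to one `case` per entry,
// so adding an opcode to the list updates every such predicate automatically.
static bool isVPBinaryOp(unsigned Opc) {
  switch (Opc) {
  default:
    return false;
#define CASE_ENTRY(OPC)                                                        \
  case OPC:                                                                    \
    return true;
  MY_VP_BINARY_OPS(CASE_ENTRY)
#undef CASE_ENTRY
  }
}

int main() {
  std::printf("%d %d\n", isVPBinaryOp(VP_MUL), isVPBinaryOp(NOT_A_VP_BINARY_OP));
  return 0; // prints "1 0"
}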
@@ -1319,10 +1370,7 @@ SDValue SelectionDAG::getPtrExtendInReg(SDValue Op, const SDLoc &DL, EVT VT) {
 
 /// getNOT - Create a bitwise NOT operation as (XOR Val, -1).
 SDValue SelectionDAG::getNOT(const SDLoc &DL, SDValue Val, EVT VT) {
-  EVT EltVT = VT.getScalarType();
-  SDValue NegOne =
-      getConstant(APInt::getAllOnesValue(EltVT.getSizeInBits()), DL, VT);
-  return getNode(ISD::XOR, DL, VT, Val, NegOne);
+  return getNode(ISD::XOR, DL, VT, Val, getAllOnesConstant(DL, VT));
 }
 
 SDValue SelectionDAG::getLogicalNOT(const SDLoc &DL, SDValue Val, EVT VT) {
@@ -1901,7 +1949,7 @@ SDValue SelectionDAG::getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1,
       if (SameNumElts)
         return N1;
       if (auto *C = dyn_cast<ConstantSDNode>(Splat))
-        if (C->isNullValue())
+        if (C->isZero())
           return N1;
     }
 
@@ -2265,19 +2313,8 @@ SDValue SelectionDAG::FoldSetCC(EVT VT, SDValue N1, SDValue N2,
     if (ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1)) {
       const APInt &C1 = N1C->getAPIntValue();
 
-      switch (Cond) {
-      default: llvm_unreachable("Unknown integer setcc!");
-      case ISD::SETEQ:  return getBoolConstant(C1 == C2, dl, VT, OpVT);
-      case ISD::SETNE:  return getBoolConstant(C1 != C2, dl, VT, OpVT);
-      case ISD::SETULT: return getBoolConstant(C1.ult(C2), dl, VT, OpVT);
-      case ISD::SETUGT: return getBoolConstant(C1.ugt(C2), dl, VT, OpVT);
-      case ISD::SETULE: return getBoolConstant(C1.ule(C2), dl, VT, OpVT);
-      case ISD::SETUGE: return getBoolConstant(C1.uge(C2), dl, VT, OpVT);
-      case ISD::SETLT:  return getBoolConstant(C1.slt(C2), dl, VT, OpVT);
-      case ISD::SETGT:  return getBoolConstant(C1.sgt(C2), dl, VT, OpVT);
-      case ISD::SETLE:  return getBoolConstant(C1.sle(C2), dl, VT, OpVT);
-      case ISD::SETGE:  return getBoolConstant(C1.sge(C2), dl, VT, OpVT);
-      }
+      return getBoolConstant(ICmpInst::compare(C1, C2, getICmpCondCode(Cond)),
+                             dl, VT, OpVT);
     }
   }
@@ -2380,7 +2417,7 @@ SDValue SelectionDAG::GetDemandedBits(SDValue V, const APInt &DemandedBits) {
     return SDValue();
 
   APInt DemandedElts = VT.isVector()
-                           ? APInt::getAllOnesValue(VT.getVectorNumElements())
+                           ? APInt::getAllOnes(VT.getVectorNumElements())
                            : APInt(1, 1);
   return GetDemandedBits(V, DemandedBits, DemandedElts);
 }
@@ -2475,7 +2512,7 @@ bool SelectionDAG::isSplatValue(SDValue V, const APInt &DemandedElts,
   switch (V.getOpcode()) {
   case ISD::SPLAT_VECTOR:
     UndefElts = V.getOperand(0).isUndef()
-                    ? APInt::getAllOnesValue(DemandedElts.getBitWidth())
+                    ? APInt::getAllOnes(DemandedElts.getBitWidth())
                     : APInt(DemandedElts.getBitWidth(), 0);
     return true;
   case ISD::ADD:
@@ -2507,7 +2544,7 @@ bool SelectionDAG::isSplatValue(SDValue V, const APInt &DemandedElts,
   unsigned NumElts = VT.getVectorNumElements();
   assert(NumElts == DemandedElts.getBitWidth() && "Vector size mismatch");
-  UndefElts = APInt::getNullValue(NumElts);
+  UndefElts = APInt::getZero(NumElts);
 
   switch (V.getOpcode()) {
   case ISD::BUILD_VECTOR: {
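FoldSetCC above collapses a ten-case switch into a single call to ICmpInst::compare plus getICmpCondCode, which maps the ISD condition code onto an IR predicate. A rough standalone illustration of why one generic comparator can absorb the whole switch (plain 64-bit integers instead of APInt, and a hypothetical Pred enum, not the LLVM API):

#include <cassert>
#include <cstdint>

enum class Pred { EQ, NE, ULT, UGT, ULE, UGE, SLT, SGT, SLE, SGE };

// One predicate-driven comparator replaces a per-predicate switch at
// every call site that needs constant-fold a comparison.
static bool compare(uint64_t A, uint64_t B, Pred P) {
  auto SA = static_cast<int64_t>(A), SB = static_cast<int64_t>(B);
  switch (P) {
  case Pred::EQ:  return A == B;
  case Pred::NE:  return A != B;
  case Pred::ULT: return A < B;
  case Pred::UGT: return A > B;
  case Pred::ULE: return A <= B;
  case Pred::UGE: return A >= B;
  case Pred::SLT: return SA < SB;
  case Pred::SGT: return SA > SB;
  case Pred::SLE: return SA <= SB;
  case Pred::SGE: return SA >= SB;
  }
  return false;
}

int main() {
  // ~0 is huge unsigned but -1 signed: ULT and SLT disagree, as expected.
  assert(!compare(~0ull, 1, Pred::ULT));
  assert(compare(~0ull, 1, Pred::SLT));
  return 0;
}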
@@ -2576,7 +2613,7 @@ bool SelectionDAG::isSplatValue(SDValue V, bool AllowUndefs) {
 
   // For now we don't support this with scalable vectors.
   if (!VT.isScalableVector())
-    DemandedElts = APInt::getAllOnesValue(VT.getVectorNumElements());
+    DemandedElts = APInt::getAllOnes(VT.getVectorNumElements());
   return isSplatValue(V, DemandedElts, UndefElts) &&
          (AllowUndefs || !UndefElts);
 }
@@ -2592,7 +2629,7 @@ SDValue SelectionDAG::getSplatSourceVector(SDValue V, int &SplatIdx) {
 
   APInt DemandedElts;
 
   if (!VT.isScalableVector())
-    DemandedElts = APInt::getAllOnesValue(VT.getVectorNumElements());
+    DemandedElts = APInt::getAllOnes(VT.getVectorNumElements());
 
   if (isSplatValue(V, DemandedElts, UndefElts)) {
     if (VT.isScalableVector()) {
@@ -2740,7 +2777,7 @@ KnownBits SelectionDAG::computeKnownBits(SDValue Op, unsigned Depth) const {
   }
 
   APInt DemandedElts = VT.isVector()
-                           ? APInt::getAllOnesValue(VT.getVectorNumElements())
+                           ? APInt::getAllOnes(VT.getVectorNumElements())
                            : APInt(1, 1);
   return computeKnownBits(Op, DemandedElts, Depth);
 }
@@ -2878,7 +2915,7 @@ KnownBits SelectionDAG::computeKnownBits(SDValue Op, const APInt &DemandedElts,
     unsigned NumSubElts = Sub.getValueType().getVectorNumElements();
     APInt DemandedSubElts = DemandedElts.extractBits(NumSubElts, Idx);
     APInt DemandedSrcElts = DemandedElts;
-    DemandedSrcElts.insertBits(APInt::getNullValue(NumSubElts), Idx);
+    DemandedSrcElts.insertBits(APInt::getZero(NumSubElts), Idx);
 
     Known.One.setAllBits();
     Known.Zero.setAllBits();
@@ -2965,11 +3002,8 @@ KnownBits SelectionDAG::computeKnownBits(SDValue Op, const APInt &DemandedElts,
       // bits from the overlapping larger input elements and extracting the
       // sub sections we actually care about.
       unsigned SubScale = SubBitWidth / BitWidth;
-      APInt SubDemandedElts(NumElts / SubScale, 0);
-      for (unsigned i = 0; i != NumElts; ++i)
-        if (DemandedElts[i])
-          SubDemandedElts.setBit(i / SubScale);
-
+      APInt SubDemandedElts =
+          APIntOps::ScaleBitMask(DemandedElts, NumElts / SubScale);
       Known2 = computeKnownBits(N0, SubDemandedElts, Depth + 1);
 
       Known.Zero.setAllBits();
       Known.One.setAllBits();
@@ -3415,7 +3449,7 @@ KnownBits SelectionDAG::computeKnownBits(SDValue Op, const APInt &DemandedElts,
 
     // If we know the element index, just demand that vector element, else for
     // an unknown element index, ignore DemandedElts and demand them all.
-    APInt DemandedSrcElts = APInt::getAllOnesValue(NumSrcElts);
+    APInt DemandedSrcElts = APInt::getAllOnes(NumSrcElts);
     auto *ConstEltNo = dyn_cast<ConstantSDNode>(EltNo);
     if (ConstEltNo && ConstEltNo->getAPIntValue().ult(NumSrcElts))
       DemandedSrcElts =
@@ -3647,6 +3681,12 @@ bool SelectionDAG::isKnownToBeAPowerOfTwo(SDValue Val) const {
       }))
     return true;
 
+  // Is the operand of a splat vector a constant power of two?
+  if (Val.getOpcode() == ISD::SPLAT_VECTOR)
+    if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val->getOperand(0)))
+      if (C->getAPIntValue().zextOrTrunc(BitWidth).isPowerOf2())
+        return true;
+
   // More could be done here, though the above checks are enough
   // to handle some common cases.
 
@@ -3663,7 +3703,7 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const {
     return 1;
 
   APInt DemandedElts = VT.isVector()
-                           ? APInt::getAllOnesValue(VT.getVectorNumElements())
+                           ? APInt::getAllOnes(VT.getVectorNumElements())
                            : APInt(1, 1);
   return ComputeNumSignBits(Op, DemandedElts, Depth);
 }
@@ -3771,10 +3811,8 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
     assert(VT.isVector() && "Expected bitcast to vector");
 
     unsigned Scale = SrcBits / VTBits;
-    APInt SrcDemandedElts(NumElts / Scale, 0);
-    for (unsigned i = 0; i != NumElts; ++i)
-      if (DemandedElts[i])
-        SrcDemandedElts.setBit(i / Scale);
+    APInt SrcDemandedElts =
+        APIntOps::ScaleBitMask(DemandedElts, NumElts / Scale);
 
     // Fast case - sign splat can be simply split across the small elements.
     Tmp = ComputeNumSignBits(N0, SrcDemandedElts, Depth + 1);
@@ -3946,13 +3984,13 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
     // Special case decrementing a value (ADD X, -1):
     if (ConstantSDNode *CRHS =
             isConstOrConstSplat(Op.getOperand(1), DemandedElts))
-      if (CRHS->isAllOnesValue()) {
+      if (CRHS->isAllOnes()) {
        KnownBits Known =
            computeKnownBits(Op.getOperand(0), DemandedElts, Depth + 1);
 
        // If the input is known to be 0 or 1, the output is 0/-1, which is all
        // sign bits set.
-       if ((Known.Zero | 1).isAllOnesValue())
+       if ((Known.Zero | 1).isAllOnes())
          return VTBits;
 
        // If we are subtracting one from a positive number, there is no carry
@@ -3971,12 +4009,12 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
     // Handle NEG.
     if (ConstantSDNode *CLHS =
             isConstOrConstSplat(Op.getOperand(0), DemandedElts))
-      if (CLHS->isNullValue()) {
+      if (CLHS->isZero()) {
        KnownBits Known =
            computeKnownBits(Op.getOperand(1), DemandedElts, Depth + 1);
 
        // If the input is known to be 0 or 1, the output is 0/-1, which is all
        // sign bits set.
-       if ((Known.Zero | 1).isAllOnesValue())
+       if ((Known.Zero | 1).isAllOnes())
          return VTBits;
 
        // If the input is known to be positive (the sign bit is known clear),
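Both computeKnownBits and ComputeNumSignBits above swap a hand-rolled loop for APIntOps::ScaleBitMask, which rescales a demanded-elements mask when a bitcast changes the element count; the replaced loop visible in the hunks maps source bit i onto result bit i/Scale. A small sketch of that collapsing direction over plain 64-bit masks:

#include <cassert>
#include <cstdint>

// Collapse a NumElts-bit demanded mask to NumElts/Scale bits: a wide element
// is demanded iff any of the narrow elements it covers is demanded.
static uint64_t scaleBitMaskDown(uint64_t Demanded, unsigned NumElts,
                                 unsigned Scale) {
  uint64_t Out = 0;
  for (unsigned i = 0; i != NumElts; ++i)
    if (Demanded & (1ull << i))
      Out |= 1ull << (i / Scale);
  return Out;
}

int main() {
  // 8 x i16 viewed as 4 x i32: demanding i16 lanes {1, 6} demands i32
  // lanes {0, 3}.
  assert(scaleBitMaskDown(0b01000010, 8, 2) == 0b1001);
  return 0;
}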
@@ -4080,7 +4118,7 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
 
     // If we know the element index, just demand that vector element, else for
     // an unknown element index, ignore DemandedElts and demand them all.
-    APInt DemandedSrcElts = APInt::getAllOnesValue(NumSrcElts);
+    APInt DemandedSrcElts = APInt::getAllOnes(NumSrcElts);
     auto *ConstEltNo = dyn_cast<ConstantSDNode>(EltNo);
     if (ConstEltNo && ConstEltNo->getAPIntValue().ult(NumSrcElts))
       DemandedSrcElts =
@@ -4126,7 +4164,7 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
     unsigned NumSubElts = Sub.getValueType().getVectorNumElements();
     APInt DemandedSubElts = DemandedElts.extractBits(NumSubElts, Idx);
     APInt DemandedSrcElts = DemandedElts;
-    DemandedSrcElts.insertBits(APInt::getNullValue(NumSubElts), Idx);
+    DemandedSrcElts.insertBits(APInt::getZero(NumSubElts), Idx);
 
     Tmp = std::numeric_limits<unsigned>::max();
     if (!!DemandedSubElts) {
@@ -4248,6 +4286,18 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, const APInt &DemandedElts,
   return std::max(FirstAnswer, Mask.countLeadingOnes());
 }
 
+unsigned SelectionDAG::ComputeMinSignedBits(SDValue Op, unsigned Depth) const {
+  unsigned SignBits = ComputeNumSignBits(Op, Depth);
+  return Op.getScalarValueSizeInBits() - SignBits + 1;
+}
+
+unsigned SelectionDAG::ComputeMinSignedBits(SDValue Op,
+                                            const APInt &DemandedElts,
+                                            unsigned Depth) const {
+  unsigned SignBits = ComputeNumSignBits(Op, DemandedElts, Depth);
+  return Op.getScalarValueSizeInBits() - SignBits + 1;
+}
+
 bool SelectionDAG::isGuaranteedNotToBeUndefOrPoison(SDValue Op, bool PoisonOnly,
                                                     unsigned Depth) const {
   // Early out for FREEZE.
@@ -4260,7 +4310,7 @@ bool SelectionDAG::isGuaranteedNotToBeUndefOrPoison(SDValue Op, bool PoisonOnly,
     return false;
 
   APInt DemandedElts = VT.isVector()
-                           ? APInt::getAllOnesValue(VT.getVectorNumElements())
+                           ? APInt::getAllOnes(VT.getVectorNumElements())
                            : APInt(1, 1);
   return isGuaranteedNotToBeUndefOrPoison(Op, DemandedElts, PoisonOnly, Depth);
 }
@@ -4285,7 +4335,17 @@ bool SelectionDAG::isGuaranteedNotToBeUndefOrPoison(SDValue Op,
   case ISD::UNDEF:
     return PoisonOnly;
 
-    // TODO: ISD::BUILD_VECTOR handling
+  case ISD::BUILD_VECTOR:
+    // NOTE: BUILD_VECTOR has implicit truncation of wider scalar elements -
+    // this shouldn't affect the result.
+    for (unsigned i = 0, e = Op.getNumOperands(); i < e; ++i) {
+      if (!DemandedElts[i])
+        continue;
+      if (!isGuaranteedNotToBeUndefOrPoison(Op.getOperand(i), PoisonOnly,
+                                            Depth + 1))
+        return false;
+    }
+    return true;
 
     // TODO: Search for noundef attributes from library functions.
 
@@ -4449,8 +4509,8 @@ bool SelectionDAG::isKnownNeverZero(SDValue Op) const {
          "Floating point types unsupported - use isKnownNeverZeroFloat");
 
   // If the value is a constant, we can obviously see if it is a zero or not.
-  if (ISD::matchUnaryPredicate(
-          Op, [](ConstantSDNode *C) { return !C->isNullValue(); }))
+  if (ISD::matchUnaryPredicate(Op,
+                               [](ConstantSDNode *C) { return !C->isZero(); }))
     return true;
 
   // TODO: Recognize more cases here.
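The new ComputeMinSignedBits helpers above are just the identity MinSignedBits = BitWidth - NumSignBits + 1: if the top NumSignBits bits are all copies of the sign bit, the value is representable in that many signed bits. A standalone check of the identity on int64_t (not the SelectionDAG code, which works on SDValues and APInts):

#include <cassert>
#include <cstdint>

// Count how many high bits are copies of the sign bit (including it).
static unsigned numSignBits(int64_t V) {
  bool Sign = V < 0;
  unsigned N = 0;
  for (int Bit = 63;
       Bit >= 0 && (((static_cast<uint64_t>(V) >> Bit) & 1) != 0) == Sign;
       --Bit)
    ++N;
  return N;
}

int main() {
  assert(64 - numSignBits(127) + 1 == 8);  // 127 fits in int8_t
  assert(64 - numSignBits(-128) + 1 == 8); // -128 fits in int8_t
  assert(64 - numSignBits(128) + 1 == 9);  // 128 needs 9 signed bits
  return 0;
}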
@@ -4490,7 +4550,7 @@ bool SelectionDAG::haveNoCommonBitsSet(SDValue A, SDValue B) const {
 
 static SDValue FoldSTEP_VECTOR(const SDLoc &DL, EVT VT, SDValue Step,
                                SelectionDAG &DAG) {
-  if (cast<ConstantSDNode>(Step)->isNullValue())
+  if (cast<ConstantSDNode>(Step)->isZero())
     return DAG.getConstant(0, DL, VT);
 
   return SDValue();
@@ -4676,7 +4736,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
     case ISD::UINT_TO_FP:
     case ISD::SINT_TO_FP: {
       APFloat apf(EVTToAPFloatSemantics(VT),
-                  APInt::getNullValue(VT.getSizeInBits()));
+                  APInt::getZero(VT.getSizeInBits()));
       (void)apf.convertFromAPInt(Val,
                                  Opcode==ISD::SINT_TO_FP,
                                  APFloat::rmNearestTiesToEven);
@@ -4828,7 +4888,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
     case ISD::CTTZ_ZERO_UNDEF:
     case ISD::CTPOP: {
       SDValue Ops = {Operand};
-      if (SDValue Fold = FoldConstantVectorArithmetic(Opcode, DL, VT, Ops))
+      if (SDValue Fold = FoldConstantArithmetic(Opcode, DL, VT, Ops))
        return Fold;
     }
   }
@@ -4976,6 +5036,8 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
     }
     if (OpOpcode == ISD::UNDEF)
       return getUNDEF(VT);
+    if (OpOpcode == ISD::VSCALE && !NewNodesMustHaveLegalTypes)
+      return getVScale(DL, VT, Operand.getConstantOperandAPInt(0));
     break;
   case ISD::ANY_EXTEND_VECTOR_INREG:
   case ISD::ZERO_EXTEND_VECTOR_INREG:
@@ -5206,173 +5268,111 @@ SDValue SelectionDAG::FoldConstantArithmetic(unsigned Opcode, const SDLoc &DL,
   if (Opcode >= ISD::BUILTIN_OP_END || Opcode == ISD::CONCAT_VECTORS)
     return SDValue();
 
-  // For now, the array Ops should only contain two values.
-  // This enforcement will be removed once this function is merged with
-  // FoldConstantVectorArithmetic
-  if (Ops.size() != 2)
+  unsigned NumOps = Ops.size();
+  if (NumOps == 0)
     return SDValue();
 
   if (isUndef(Opcode, Ops))
     return getUNDEF(VT);
 
-  SDNode *N1 = Ops[0].getNode();
-  SDNode *N2 = Ops[1].getNode();
-
   // Handle the case of two scalars.
-  if (auto *C1 = dyn_cast<ConstantSDNode>(N1)) {
-    if (auto *C2 = dyn_cast<ConstantSDNode>(N2)) {
-      if (C1->isOpaque() || C2->isOpaque())
-        return SDValue();
-
-      Optional<APInt> FoldAttempt =
-          FoldValue(Opcode, C1->getAPIntValue(), C2->getAPIntValue());
-      if (!FoldAttempt)
-        return SDValue();
-
-      SDValue Folded = getConstant(FoldAttempt.getValue(), DL, VT);
-      assert((!Folded || !VT.isVector()) &&
-             "Can't fold vectors ops with scalar operands");
-      return Folded;
-    }
-  }
-
-  // fold (add Sym, c) -> Sym+c
-  if (GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(N1))
-    return FoldSymbolOffset(Opcode, VT, GA, N2);
-  if (TLI->isCommutativeBinOp(Opcode))
-    if (GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(N2))
-      return FoldSymbolOffset(Opcode, VT, GA, N1);
-
-  // For fixed width vectors, extract each constant element and fold them
-  // individually. Either input may be an undef value.
-  bool IsBVOrSV1 = N1->getOpcode() == ISD::BUILD_VECTOR ||
-                   N1->getOpcode() == ISD::SPLAT_VECTOR;
-  if (!IsBVOrSV1 && !N1->isUndef())
-    return SDValue();
-  bool IsBVOrSV2 = N2->getOpcode() == ISD::BUILD_VECTOR ||
-                   N2->getOpcode() == ISD::SPLAT_VECTOR;
-  if (!IsBVOrSV2 && !N2->isUndef())
-    return SDValue();
-  // If both operands are undef, that's handled the same way as scalars.
-  if (!IsBVOrSV1 && !IsBVOrSV2)
-    return SDValue();
-
-  EVT SVT = VT.getScalarType();
-  EVT LegalSVT = SVT;
-  if (NewNodesMustHaveLegalTypes && LegalSVT.isInteger()) {
-    LegalSVT = TLI->getTypeToTransformTo(*getContext(), LegalSVT);
-    if (LegalSVT.bitsLT(SVT))
-      return SDValue();
-  }
-
-  SmallVector<SDValue, 4> Outputs;
-  unsigned NumOps = 0;
-  if (IsBVOrSV1)
-    NumOps = std::max(NumOps, N1->getNumOperands());
-  if (IsBVOrSV2)
-    NumOps = std::max(NumOps, N2->getNumOperands());
-  assert(NumOps != 0 && "Expected non-zero operands");
-  // Scalable vectors should only be SPLAT_VECTOR or UNDEF here. We only need
-  // one iteration for that.
-  assert((!VT.isScalableVector() || NumOps == 1) &&
-         "Scalable vector should only have one scalar");
-
-  for (unsigned I = 0; I != NumOps; ++I) {
-    // We can have a fixed length SPLAT_VECTOR and a BUILD_VECTOR so we need
-    // to use operand 0 of the SPLAT_VECTOR for each fixed element.
-    SDValue V1;
-    if (N1->getOpcode() == ISD::BUILD_VECTOR)
-      V1 = N1->getOperand(I);
-    else if (N1->getOpcode() == ISD::SPLAT_VECTOR)
-      V1 = N1->getOperand(0);
-    else
-      V1 = getUNDEF(SVT);
-
-    SDValue V2;
-    if (N2->getOpcode() == ISD::BUILD_VECTOR)
-      V2 = N2->getOperand(I);
-    else if (N2->getOpcode() == ISD::SPLAT_VECTOR)
-      V2 = N2->getOperand(0);
-    else
-      V2 = getUNDEF(SVT);
-
-    if (SVT.isInteger()) {
-      if (V1.getValueType().bitsGT(SVT))
-        V1 = getNode(ISD::TRUNCATE, DL, SVT, V1);
-      if (V2.getValueType().bitsGT(SVT))
-        V2 = getNode(ISD::TRUNCATE, DL, SVT, V2);
+  if (NumOps == 2) {
+    // TODO: Move foldConstantFPMath here?
+
+    if (auto *C1 = dyn_cast<ConstantSDNode>(Ops[0])) {
+      if (auto *C2 = dyn_cast<ConstantSDNode>(Ops[1])) {
+        if (C1->isOpaque() || C2->isOpaque())
+          return SDValue();
+
+        Optional<APInt> FoldAttempt =
+            FoldValue(Opcode, C1->getAPIntValue(), C2->getAPIntValue());
+        if (!FoldAttempt)
+          return SDValue();
+
+        SDValue Folded = getConstant(FoldAttempt.getValue(), DL, VT);
+        assert((!Folded || !VT.isVector()) &&
+               "Can't fold vectors ops with scalar operands");
+        return Folded;
+      }
     }
 
-    if (V1.getValueType() != SVT || V2.getValueType() != SVT)
-      return SDValue();
-
-    // Fold one vector element.
-    SDValue ScalarResult = getNode(Opcode, DL, SVT, V1, V2);
-    if (LegalSVT != SVT)
-      ScalarResult = getNode(ISD::SIGN_EXTEND, DL, LegalSVT, ScalarResult);
-
-    // Scalar folding only succeeded if the result is a constant or UNDEF.
-    if (!ScalarResult.isUndef() && ScalarResult.getOpcode() != ISD::Constant &&
-        ScalarResult.getOpcode() != ISD::ConstantFP)
-      return SDValue();
-    Outputs.push_back(ScalarResult);
-  }
-
-  if (N1->getOpcode() == ISD::BUILD_VECTOR ||
-      N2->getOpcode() == ISD::BUILD_VECTOR) {
-    assert(VT.getVectorNumElements() == Outputs.size() &&
-           "Vector size mismatch!");
-
-    // Build a big vector out of the scalar elements we generated.
-    return getBuildVector(VT, SDLoc(), Outputs);
+    // fold (add Sym, c) -> Sym+c
+    if (GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(Ops[0]))
+      return FoldSymbolOffset(Opcode, VT, GA, Ops[1].getNode());
+    if (TLI->isCommutativeBinOp(Opcode))
+      if (GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(Ops[1]))
+        return FoldSymbolOffset(Opcode, VT, GA, Ops[0].getNode());
   }
 
-  assert((N1->getOpcode() == ISD::SPLAT_VECTOR ||
-          N2->getOpcode() == ISD::SPLAT_VECTOR) &&
-         "One operand should be a splat vector");
-
-  assert(Outputs.size() == 1 && "Vector size mismatch!");
-  return getSplatVector(VT, SDLoc(), Outputs[0]);
-}
-
-// TODO: Merge with FoldConstantArithmetic
-SDValue SelectionDAG::FoldConstantVectorArithmetic(unsigned Opcode,
-                                                   const SDLoc &DL, EVT VT,
-                                                   ArrayRef<SDValue> Ops,
-                                                   const SDNodeFlags Flags) {
-  // If the opcode is a target-specific ISD node, there's nothing we can
-  // do here and the operand rules may not line up with the below, so
-  // bail early.
-  if (Opcode >= ISD::BUILTIN_OP_END)
-    return SDValue();
-
-  if (isUndef(Opcode, Ops))
-    return getUNDEF(VT);
-
-  // We can only fold vectors - maybe merge with FoldConstantArithmetic someday?
+  // This is for vector folding only from here on.
   if (!VT.isVector())
     return SDValue();
 
   ElementCount NumElts = VT.getVectorElementCount();
 
+  // See if we can fold through bitcasted integer ops.
+  // TODO: Can we handle undef elements?
+  if (NumOps == 2 && VT.isFixedLengthVector() && VT.isInteger() &&
+      Ops[0].getValueType() == VT && Ops[1].getValueType() == VT &&
+      Ops[0].getOpcode() == ISD::BITCAST &&
+      Ops[1].getOpcode() == ISD::BITCAST) {
+    SDValue N1 = peekThroughBitcasts(Ops[0]);
+    SDValue N2 = peekThroughBitcasts(Ops[1]);
+    auto *BV1 = dyn_cast<BuildVectorSDNode>(N1);
+    auto *BV2 = dyn_cast<BuildVectorSDNode>(N2);
+    EVT BVVT = N1.getValueType();
+    if (BV1 && BV2 && BVVT.isInteger() && BVVT == N2.getValueType()) {
+      bool IsLE = getDataLayout().isLittleEndian();
+      unsigned EltBits = VT.getScalarSizeInBits();
+      SmallVector<APInt> RawBits1, RawBits2;
+      BitVector UndefElts1, UndefElts2;
+      if (BV1->getConstantRawBits(IsLE, EltBits, RawBits1, UndefElts1) &&
+          BV2->getConstantRawBits(IsLE, EltBits, RawBits2, UndefElts2) &&
+          UndefElts1.none() && UndefElts2.none()) {
+        SmallVector<APInt> RawBits;
+        for (unsigned I = 0, E = NumElts.getFixedValue(); I != E; ++I) {
+          Optional<APInt> Fold = FoldValue(Opcode, RawBits1[I], RawBits2[I]);
+          if (!Fold)
+            break;
+          RawBits.push_back(Fold.getValue());
+        }
+        if (RawBits.size() == NumElts.getFixedValue()) {
+          // We have constant folded, but we need to cast this again back to
+          // the original (possibly legalized) type.
+          SmallVector<APInt> DstBits;
+          BitVector DstUndefs;
+          BuildVectorSDNode::recastRawBits(IsLE, BVVT.getScalarSizeInBits(),
+                                           DstBits, RawBits, DstUndefs,
+                                           BitVector(RawBits.size(), false));
+          EVT BVEltVT = BV1->getOperand(0).getValueType();
+          unsigned BVEltBits = BVEltVT.getSizeInBits();
+          SmallVector<SDValue> Ops(DstBits.size(), getUNDEF(BVEltVT));
+          for (unsigned I = 0, E = DstBits.size(); I != E; ++I) {
+            if (DstUndefs[I])
+              continue;
+            Ops[I] = getConstant(DstBits[I].sextOrSelf(BVEltBits), DL, BVEltVT);
+          }
+          return getBitcast(VT, getBuildVector(BVVT, DL, Ops));
+        }
+      }
+    }
+  }
+
   auto IsScalarOrSameVectorSize = [NumElts](const SDValue &Op) {
     return !Op.getValueType().isVector() ||
            Op.getValueType().getVectorElementCount() == NumElts;
   };
 
-  auto IsConstantBuildVectorSplatVectorOrUndef = [](const SDValue &Op) {
-    APInt SplatVal;
-    BuildVectorSDNode *BV = dyn_cast<BuildVectorSDNode>(Op);
+  auto IsBuildVectorSplatVectorOrUndef = [](const SDValue &Op) {
     return Op.isUndef() || Op.getOpcode() == ISD::CONDCODE ||
-           (BV && BV->isConstant()) ||
-           (Op.getOpcode() == ISD::SPLAT_VECTOR &&
-            ISD::isConstantSplatVector(Op.getNode(), SplatVal));
+           Op.getOpcode() == ISD::BUILD_VECTOR ||
+           Op.getOpcode() == ISD::SPLAT_VECTOR;
   };
 
   // All operands must be vector types with the same number of elements as
-  // the result type and must be either UNDEF or a build vector of constant
+  // the result type and must be either UNDEF or a build/splat vector
   // or UNDEF scalars.
-  if (!llvm::all_of(Ops, IsConstantBuildVectorSplatVectorOrUndef) ||
+  if (!llvm::all_of(Ops, IsBuildVectorSplatVectorOrUndef) ||
      !llvm::all_of(Ops, IsScalarOrSameVectorSize))
    return SDValue();
@@ -5392,17 +5392,16 @@ SDValue SelectionDAG::FoldConstantVectorArithmetic(unsigned Opcode,
   // For scalable vector types we know we're dealing with SPLAT_VECTORs. We
   // only have one operand to check. For fixed-length vector types we may have
   // a combination of BUILD_VECTOR and SPLAT_VECTOR.
-  unsigned NumOperands = NumElts.isScalable() ? 1 : NumElts.getFixedValue();
+  unsigned NumVectorElts = NumElts.isScalable() ? 1 : NumElts.getFixedValue();
 
   // Constant fold each scalar lane separately.
   SmallVector<SDValue, 4> ScalarResults;
-  for (unsigned I = 0; I != NumOperands; I++) {
+  for (unsigned I = 0; I != NumVectorElts; I++) {
     SmallVector<SDValue, 4> ScalarOps;
     for (SDValue Op : Ops) {
       EVT InSVT = Op.getValueType().getScalarType();
       if (Op.getOpcode() != ISD::BUILD_VECTOR &&
           Op.getOpcode() != ISD::SPLAT_VECTOR) {
-        // We've checked that this is UNDEF or a constant of some kind.
         if (Op.isUndef())
           ScalarOps.push_back(getUNDEF(InSVT));
         else
@@ -5423,7 +5422,7 @@ SDValue SelectionDAG::FoldConstantVectorArithmetic(unsigned Opcode,
     }
 
     // Constant fold the scalar operands.
-    SDValue ScalarResult = getNode(Opcode, DL, SVT, ScalarOps, Flags);
+    SDValue ScalarResult = getNode(Opcode, DL, SVT, ScalarOps);
 
     // Legalize the (integer) scalar constant if necessary.
     if (LegalSVT != SVT)
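The vector path that follows the new bitcast fold scalarizes each lane (operand I of a BUILD_VECTOR, operand 0 of a SPLAT_VECTOR), folds the scalars, and rebuilds the vector, giving up entirely if any lane does not fold to a constant. A toy version of that per-lane folding over plain arrays (std::optional stands in for the Optional<APInt> returned by FoldValue; not the DAG code itself):

#include <cassert>
#include <cstdint>
#include <optional>
#include <vector>

// Per-lane constant folding: fold lane-wise, and abandon the whole fold if
// any single lane fails (mirroring how the DAG fold returns SDValue()).
template <typename Fn>
static std::optional<std::vector<uint64_t>>
foldPerLane(const std::vector<uint64_t> &A, const std::vector<uint64_t> &B,
            Fn FoldValue) {
  std::vector<uint64_t> Out;
  for (size_t I = 0; I != A.size(); ++I) {
    std::optional<uint64_t> R = FoldValue(A[I], B[I]);
    if (!R)
      return std::nullopt; // one unfoldable lane poisons the whole fold
    Out.push_back(*R);
  }
  return Out;
}

int main() {
  auto UDiv = [](uint64_t X, uint64_t Y) -> std::optional<uint64_t> {
    if (Y == 0)
      return std::nullopt; // division by zero is not foldable
    return X / Y;
  };
  auto OK = foldPerLane({8, 9}, {2, 3}, UDiv);
  assert(OK && (*OK)[0] == 4 && (*OK)[1] == 3);
  assert(!foldPerLane({8, 9}, {2, 0}, UDiv)); // lane 1 divides by zero
  return 0;
}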
@@ -5591,9 +5590,9 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
            N1.getValueType() == VT && "Binary operator types must match!");
     // (X & 0) -> 0.  This commonly occurs when legalizing i64 values, so it's
     // worth handling here.
-    if (N2C && N2C->isNullValue())
+    if (N2C && N2C->isZero())
       return N2;
-    if (N2C && N2C->isAllOnesValue()) // X & -1 -> X
+    if (N2C && N2C->isAllOnes()) // X & -1 -> X
       return N1;
     break;
   case ISD::OR:
@@ -5605,7 +5604,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
            N1.getValueType() == VT && "Binary operator types must match!");
     // (X ^|+- 0) -> X.  This commonly occurs when legalizing i64 values, so
     // it's worth handling here.
-    if (N2C && N2C->isNullValue())
+    if (N2C && N2C->isZero())
       return N1;
     if ((Opcode == ISD::ADD || Opcode == ISD::SUB) && VT.isVector() &&
         VT.getVectorElementType() == MVT::i1)
@@ -5711,7 +5710,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
     // size of the value, the shift/rotate count is guaranteed to be zero.
     if (VT == MVT::i1)
       return N1;
-    if (N2C && N2C->isNullValue())
+    if (N2C && N2C->isZero())
       return N1;
     break;
   case ISD::FP_ROUND:
@@ -6086,7 +6085,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
       return V;
     // Vector constant folding.
     SDValue Ops[] = {N1, N2, N3};
-    if (SDValue V = FoldConstantVectorArithmetic(Opcode, DL, VT, Ops)) {
+    if (SDValue V = FoldConstantArithmetic(Opcode, DL, VT, Ops)) {
       NewSDValueDbgMsg(V, "New node vector constant folding: ", this);
       return V;
     }
@@ -6099,6 +6098,11 @@ SDValue SelectionDAG::getNode(unsigned Opcode, const SDLoc &DL, EVT VT,
     break;
   case ISD::VECTOR_SHUFFLE:
     llvm_unreachable("should use getVectorShuffle constructor!");
+  case ISD::VECTOR_SPLICE: {
+    if (cast<ConstantSDNode>(N3)->isNullValue())
+      return N1;
+    break;
+  }
   case ISD::INSERT_VECTOR_ELT: {
     ConstantSDNode *N3C = dyn_cast<ConstantSDNode>(N3);
     // INSERT_VECTOR_ELT into out-of-bounds element is an UNDEF, except
@@ -6214,9 +6218,8 @@ SDValue SelectionDAG::getStackArgumentTokenFactor(SDValue Chain) {
   ArgChains.push_back(Chain);
 
   // Add a chain value for each stack argument.
-  for (SDNode::use_iterator U = getEntryNode().getNode()->use_begin(),
-                            UE = getEntryNode().getNode()->use_end();
-       U != UE; ++U)
-    if (LoadSDNode *L = dyn_cast<LoadSDNode>(*U))
+  for (SDNode *U : getEntryNode().getNode()->uses())
+    if (LoadSDNode *L = dyn_cast<LoadSDNode>(U))
      if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(L->getBasePtr()))
        if (FI->getIndex() < 0)
          ArgChains.push_back(SDValue(L, 1));
@@ -6720,7 +6723,7 @@ static SDValue getMemsetStores(SelectionDAG &DAG, const SDLoc &dl,
   if (FI && !MFI.isFixedObjectIndex(FI->getIndex()))
     DstAlignCanChange = true;
   bool IsZeroVal =
-      isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isNullValue();
+      isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isZero();
   if (!TLI.findOptimalMemOpLowering(
           MemOps, TLI.getMaxStoresPerMemset(OptSize),
           MemOp::Set(Size, DstAlignCanChange, Alignment, IsZeroVal, isVol),
@@ -6809,7 +6812,7 @@ SDValue SelectionDAG::getMemcpy(SDValue Chain, const SDLoc &dl, SDValue Dst,
   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
   if (ConstantSize) {
     // Memcpy with size zero? Just return the original chain.
-    if (ConstantSize->isNullValue())
+    if (ConstantSize->isZero())
       return Chain;
 
     SDValue Result = getMemcpyLoadsAndStores(
@@ -6924,7 +6927,7 @@ SDValue SelectionDAG::getMemmove(SDValue Chain, const SDLoc &dl, SDValue Dst,
   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
   if (ConstantSize) {
     // Memmove with size zero? Just return the original chain.
-    if (ConstantSize->isNullValue())
+    if (ConstantSize->isZero())
       return Chain;
 
     SDValue Result = getMemmoveLoadsAndStores(
@@ -7026,7 +7029,7 @@ SDValue SelectionDAG::getMemset(SDValue Chain, const SDLoc &dl, SDValue Dst,
   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
   if (ConstantSize) {
     // Memset with size zero? Just return the original chain.
-    if (ConstantSize->isNullValue())
+    if (ConstantSize->isZero())
       return Chain;
 
     SDValue Result = getMemsetStores(*this, dl, Chain, Dst, Src,
@@ -7618,6 +7621,374 @@ SDValue SelectionDAG::getIndexedStore(SDValue OrigStore, const SDLoc &dl,
   return V;
 }
 
+SDValue SelectionDAG::getLoadVP(
+    ISD::MemIndexedMode AM, ISD::LoadExtType ExtType, EVT VT, const SDLoc &dl,
+    SDValue Chain, SDValue Ptr, SDValue Offset, SDValue Mask, SDValue EVL,
+    MachinePointerInfo PtrInfo, EVT MemVT, Align Alignment,
+    MachineMemOperand::Flags MMOFlags, const AAMDNodes &AAInfo,
+    const MDNode *Ranges, bool IsExpanding) {
+  assert(Chain.getValueType() == MVT::Other && "Invalid chain type");
+
+  MMOFlags |= MachineMemOperand::MOLoad;
+  assert((MMOFlags & MachineMemOperand::MOStore) == 0);
+  // If we don't have a PtrInfo, infer the trivial frame index case to simplify
+  // clients.
+  if (PtrInfo.V.isNull())
+    PtrInfo = InferPointerInfo(PtrInfo, *this, Ptr, Offset);
+
+  uint64_t Size = MemoryLocation::getSizeOrUnknown(MemVT.getStoreSize());
+  MachineFunction &MF = getMachineFunction();
+  MachineMemOperand *MMO = MF.getMachineMemOperand(PtrInfo, MMOFlags, Size,
+                                                   Alignment, AAInfo, Ranges);
+  return getLoadVP(AM, ExtType, VT, dl, Chain, Ptr, Offset, Mask, EVL, MemVT,
+                   MMO, IsExpanding);
+}
+
+SDValue SelectionDAG::getLoadVP(ISD::MemIndexedMode AM,
+                                ISD::LoadExtType ExtType, EVT VT,
+                                const SDLoc &dl, SDValue Chain, SDValue Ptr,
+                                SDValue Offset, SDValue Mask, SDValue EVL,
+                                EVT MemVT, MachineMemOperand *MMO,
+                                bool IsExpanding) {
+  if (VT == MemVT) {
+    ExtType = ISD::NON_EXTLOAD;
+  } else if (ExtType == ISD::NON_EXTLOAD) {
+    assert(VT == MemVT && "Non-extending load from different memory type!");
+  } else {
+    // Extending load.
+    assert(MemVT.getScalarType().bitsLT(VT.getScalarType()) &&
+           "Should only be an extending load, not truncating!");
+    assert(VT.isInteger() == MemVT.isInteger() &&
+           "Cannot convert from FP to Int or Int -> FP!");
+    assert(VT.isVector() == MemVT.isVector() &&
+           "Cannot use an ext load to convert to or from a vector!");
+    assert((!VT.isVector() ||
+            VT.getVectorElementCount() == MemVT.getVectorElementCount()) &&
+           "Cannot use an ext load to change the number of vector elements!");
+  }
+
+  bool Indexed = AM != ISD::UNINDEXED;
+  assert((Indexed || Offset.isUndef()) && "Unindexed load with an offset!");
+
+  SDVTList VTs = Indexed ? getVTList(VT, Ptr.getValueType(), MVT::Other)
+                         : getVTList(VT, MVT::Other);
+  SDValue Ops[] = {Chain, Ptr, Offset, Mask, EVL};
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::VP_LOAD, VTs, Ops);
+  ID.AddInteger(VT.getRawBits());
+  ID.AddInteger(getSyntheticNodeSubclassData<VPLoadSDNode>(
+      dl.getIROrder(), VTs, AM, ExtType, IsExpanding, MemVT, MMO));
+  ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
+  void *IP = nullptr;
+  if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
+    cast<VPLoadSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+  auto *N = newSDNode<VPLoadSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs, AM,
+                                    ExtType, IsExpanding, MemVT, MMO);
+  createOperands(N, Ops);
+
+  CSEMap.InsertNode(N, IP);
+  InsertNode(N);
+  SDValue V(N, 0);
+  NewSDValueDbgMsg(V, "Creating new node: ", this);
+  return V;
+}
+
+SDValue SelectionDAG::getLoadVP(EVT VT, const SDLoc &dl, SDValue Chain,
+                                SDValue Ptr, SDValue Mask, SDValue EVL,
+                                MachinePointerInfo PtrInfo,
+                                MaybeAlign Alignment,
+                                MachineMemOperand::Flags MMOFlags,
+                                const AAMDNodes &AAInfo, const MDNode *Ranges,
+                                bool IsExpanding) {
+  SDValue Undef = getUNDEF(Ptr.getValueType());
+  return getLoadVP(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
+                   Mask, EVL, PtrInfo, VT, Alignment, MMOFlags, AAInfo, Ranges,
+                   IsExpanding);
+}
+
+SDValue SelectionDAG::getLoadVP(EVT VT, const SDLoc &dl, SDValue Chain,
+                                SDValue Ptr, SDValue Mask, SDValue EVL,
+                                MachineMemOperand *MMO, bool IsExpanding) {
+  SDValue Undef = getUNDEF(Ptr.getValueType());
+  return getLoadVP(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
+                   Mask, EVL, VT, MMO, IsExpanding);
+}
+
+SDValue SelectionDAG::getExtLoadVP(ISD::LoadExtType ExtType, const SDLoc &dl,
+                                   EVT VT, SDValue Chain, SDValue Ptr,
+                                   SDValue Mask, SDValue EVL,
+                                   MachinePointerInfo PtrInfo, EVT MemVT,
+                                   MaybeAlign Alignment,
+                                   MachineMemOperand::Flags MMOFlags,
+                                   const AAMDNodes &AAInfo, bool IsExpanding) {
+  SDValue Undef = getUNDEF(Ptr.getValueType());
+  return getLoadVP(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef, Mask,
+                   EVL, PtrInfo, MemVT, Alignment, MMOFlags, AAInfo, nullptr,
+                   IsExpanding);
+}
+
+SDValue SelectionDAG::getExtLoadVP(ISD::LoadExtType ExtType, const SDLoc &dl,
+                                   EVT VT, SDValue Chain, SDValue Ptr,
+                                   SDValue Mask, SDValue EVL, EVT MemVT,
+                                   MachineMemOperand *MMO, bool IsExpanding) {
+  SDValue Undef = getUNDEF(Ptr.getValueType());
+  return getLoadVP(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef, Mask,
+                   EVL, MemVT, MMO, IsExpanding);
+}
+
+SDValue SelectionDAG::getIndexedLoadVP(SDValue OrigLoad, const SDLoc &dl,
+                                       SDValue Base, SDValue Offset,
+                                       ISD::MemIndexedMode AM) {
+  auto *LD = cast<VPLoadSDNode>(OrigLoad);
+  assert(LD->getOffset().isUndef() && "Load is already a indexed load!");
+  // Don't propagate the invariant or dereferenceable flags.
+  auto MMOFlags =
+      LD->getMemOperand()->getFlags() &
+      ~(MachineMemOperand::MOInvariant | MachineMemOperand::MODereferenceable);
+  return getLoadVP(AM, LD->getExtensionType(), OrigLoad.getValueType(), dl,
+                   LD->getChain(), Base, Offset, LD->getMask(),
+                   LD->getVectorLength(), LD->getPointerInfo(),
+                   LD->getMemoryVT(), LD->getAlign(), MMOFlags, LD->getAAInfo(),
+                   nullptr, LD->isExpandingLoad());
+}
+
+SDValue SelectionDAG::getStoreVP(SDValue Chain, const SDLoc &dl, SDValue Val,
+                                 SDValue Ptr, SDValue Mask, SDValue EVL,
+                                 MachinePointerInfo PtrInfo, Align Alignment,
+                                 MachineMemOperand::Flags MMOFlags,
+                                 const AAMDNodes &AAInfo, bool IsCompressing) {
+  assert(Chain.getValueType() == MVT::Other && "Invalid chain type");
+
+  MMOFlags |= MachineMemOperand::MOStore;
+  assert((MMOFlags & MachineMemOperand::MOLoad) == 0);
+
+  if (PtrInfo.V.isNull())
+    PtrInfo = InferPointerInfo(PtrInfo, *this, Ptr);
+
+  MachineFunction &MF = getMachineFunction();
+  uint64_t Size =
+      MemoryLocation::getSizeOrUnknown(Val.getValueType().getStoreSize());
+  MachineMemOperand *MMO =
+      MF.getMachineMemOperand(PtrInfo, MMOFlags, Size, Alignment, AAInfo);
+  return getStoreVP(Chain, dl, Val, Ptr, Mask, EVL, MMO, IsCompressing);
+}
+
+SDValue SelectionDAG::getStoreVP(SDValue Chain, const SDLoc &dl, SDValue Val,
+                                 SDValue Ptr, SDValue Mask, SDValue EVL,
+                                 MachineMemOperand *MMO, bool IsCompressing) {
+  assert(Chain.getValueType() == MVT::Other && "Invalid chain type");
+  EVT VT = Val.getValueType();
+  SDVTList VTs = getVTList(MVT::Other);
+  SDValue Undef = getUNDEF(Ptr.getValueType());
+  SDValue Ops[] = {Chain, Val, Ptr, Undef, Mask, EVL};
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::VP_STORE, VTs, Ops);
+  ID.AddInteger(VT.getRawBits());
+  ID.AddInteger(getSyntheticNodeSubclassData<VPStoreSDNode>(
+      dl.getIROrder(), VTs, ISD::UNINDEXED, false, IsCompressing, VT, MMO));
+  ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
+  void *IP = nullptr;
+  if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
+    cast<VPStoreSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+  auto *N =
+      newSDNode<VPStoreSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs,
+                               ISD::UNINDEXED, false, IsCompressing, VT, MMO);
+  createOperands(N, Ops);
+
+  CSEMap.InsertNode(N, IP);
+  InsertNode(N);
+  SDValue V(N, 0);
+  NewSDValueDbgMsg(V, "Creating new node: ", this);
+  return V;
+}
+
+SDValue SelectionDAG::getTruncStoreVP(SDValue Chain, const SDLoc &dl,
+                                      SDValue Val, SDValue Ptr, SDValue Mask,
+                                      SDValue EVL, MachinePointerInfo PtrInfo,
+                                      EVT SVT, Align Alignment,
+                                      MachineMemOperand::Flags MMOFlags,
+                                      const AAMDNodes &AAInfo,
+                                      bool IsCompressing) {
+  assert(Chain.getValueType() == MVT::Other && "Invalid chain type");
+
+  MMOFlags |= MachineMemOperand::MOStore;
+  assert((MMOFlags & MachineMemOperand::MOLoad) == 0);
+
+  if (PtrInfo.V.isNull())
+    PtrInfo = InferPointerInfo(PtrInfo, *this, Ptr);
+
+  MachineFunction &MF = getMachineFunction();
+  MachineMemOperand *MMO = MF.getMachineMemOperand(
+      PtrInfo, MMOFlags, MemoryLocation::getSizeOrUnknown(SVT.getStoreSize()),
+      Alignment, AAInfo);
+  return getTruncStoreVP(Chain, dl, Val, Ptr, Mask, EVL, SVT, MMO,
+                         IsCompressing);
+}
+
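The getLoadVP/getStoreVP builders above create vector-predicated memory nodes that carry two extra operands, a lane mask and an explicit vector length (EVL): a lane participates only if its mask bit is set and its index is below EVL. A scalar emulation of that contract as I read the VP semantics (illustrative C++, not LLVM code; the real node yields undef rather than 0 in disabled lanes):

#include <cassert>
#include <cstddef>
#include <vector>

// Emulate a vp.load: lanes with Mask[i] set and i < EVL read memory; all
// other lanes must not touch memory and produce a pass-through value.
static std::vector<int> vpLoad(const int *Mem, const std::vector<bool> &Mask,
                               size_t EVL) {
  std::vector<int> Res(Mask.size(), 0);
  for (size_t I = 0; I != Mask.size(); ++I)
    if (Mask[I] && I < EVL)
      Res[I] = Mem[I]; // only enabled lanes may access memory
  return Res;
}

int main() {
  int Mem[4] = {10, 20, 30, 40};
  std::vector<int> V = vpLoad(Mem, {true, false, true, true}, /*EVL=*/3);
  assert(V[0] == 10 && V[1] == 0 && V[2] == 30 && V[3] == 0); // lane 3 >= EVL
  return 0;
}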
+SDValue SelectionDAG::getTruncStoreVP(SDValue Chain, const SDLoc &dl,
+                                      SDValue Val, SDValue Ptr, SDValue Mask,
+                                      SDValue EVL, EVT SVT,
+                                      MachineMemOperand *MMO,
+                                      bool IsCompressing) {
+  EVT VT = Val.getValueType();
+
+  assert(Chain.getValueType() == MVT::Other && "Invalid chain type");
+  if (VT == SVT)
+    return getStoreVP(Chain, dl, Val, Ptr, Mask, EVL, MMO, IsCompressing);
+
+  assert(SVT.getScalarType().bitsLT(VT.getScalarType()) &&
+         "Should only be a truncating store, not extending!");
+  assert(VT.isInteger() == SVT.isInteger() && "Can't do FP-INT conversion!");
+  assert(VT.isVector() == SVT.isVector() &&
+         "Cannot use trunc store to convert to or from a vector!");
+  assert((!VT.isVector() ||
+          VT.getVectorElementCount() == SVT.getVectorElementCount()) &&
+         "Cannot use trunc store to change the number of vector elements!");
+
+  SDVTList VTs = getVTList(MVT::Other);
+  SDValue Undef = getUNDEF(Ptr.getValueType());
+  SDValue Ops[] = {Chain, Val, Ptr, Undef, Mask, EVL};
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::VP_STORE, VTs, Ops);
+  ID.AddInteger(SVT.getRawBits());
+  ID.AddInteger(getSyntheticNodeSubclassData<VPStoreSDNode>(
+      dl.getIROrder(), VTs, ISD::UNINDEXED, true, IsCompressing, SVT, MMO));
+  ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
+  void *IP = nullptr;
+  if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
+    cast<VPStoreSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+  auto *N =
+      newSDNode<VPStoreSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs,
+                               ISD::UNINDEXED, true, IsCompressing, SVT, MMO);
+  createOperands(N, Ops);
+
+  CSEMap.InsertNode(N, IP);
+  InsertNode(N);
+  SDValue V(N, 0);
+  NewSDValueDbgMsg(V, "Creating new node: ", this);
+  return V;
+}
+
+SDValue SelectionDAG::getIndexedStoreVP(SDValue OrigStore, const SDLoc &dl,
+                                        SDValue Base, SDValue Offset,
+                                        ISD::MemIndexedMode AM) {
+  auto *ST = cast<VPStoreSDNode>(OrigStore);
+  assert(ST->getOffset().isUndef() && "Store is already an indexed store!");
+  SDVTList VTs = getVTList(Base.getValueType(), MVT::Other);
+  SDValue Ops[] = {ST->getChain(), ST->getValue(), Base,
+                   Offset,         ST->getMask(),  ST->getVectorLength()};
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::VP_STORE, VTs, Ops);
+  ID.AddInteger(ST->getMemoryVT().getRawBits());
+  ID.AddInteger(ST->getRawSubclassData());
+  ID.AddInteger(ST->getPointerInfo().getAddrSpace());
+  void *IP = nullptr;
+  if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP))
+    return SDValue(E, 0);
+
+  auto *N = newSDNode<VPStoreSDNode>(
+      dl.getIROrder(), dl.getDebugLoc(), VTs, AM, ST->isTruncatingStore(),
+      ST->isCompressingStore(), ST->getMemoryVT(), ST->getMemOperand());
+  createOperands(N, Ops);
+
+  CSEMap.InsertNode(N, IP);
+  InsertNode(N);
+  SDValue V(N, 0);
+  NewSDValueDbgMsg(V, "Creating new node: ", this);
+  return V;
+}
+
+SDValue SelectionDAG::getGatherVP(SDVTList VTs, EVT VT, const SDLoc &dl,
+                                  ArrayRef<SDValue> Ops, MachineMemOperand *MMO,
+                                  ISD::MemIndexType IndexType) {
+  assert(Ops.size() == 6 && "Incompatible number of operands");
+
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::VP_GATHER, VTs, Ops);
+  ID.AddInteger(VT.getRawBits());
+  ID.AddInteger(getSyntheticNodeSubclassData<VPGatherSDNode>(
+      dl.getIROrder(), VTs, VT, MMO, IndexType));
+  ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
+  void *IP = nullptr;
+  if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
+    cast<VPGatherSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+
+  auto *N = newSDNode<VPGatherSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs,
+                                      VT, MMO, IndexType);
+  createOperands(N, Ops);
+
+  assert(N->getMask().getValueType().getVectorElementCount() ==
+             N->getValueType(0).getVectorElementCount() &&
+         "Vector width mismatch between mask and data");
+  assert(N->getIndex().getValueType().getVectorElementCount().isScalable() ==
+             N->getValueType(0).getVectorElementCount().isScalable() &&
+         "Scalable flags of index and data do not match");
+  assert(ElementCount::isKnownGE(
+             N->getIndex().getValueType().getVectorElementCount(),
+             N->getValueType(0).getVectorElementCount()) &&
+         "Vector width mismatch between index and data");
+  assert(isa<ConstantSDNode>(N->getScale()) &&
+         cast<ConstantSDNode>(N->getScale())->getAPIntValue().isPowerOf2() &&
+         "Scale should be a constant power of 2");
+
+  CSEMap.InsertNode(N, IP);
+  InsertNode(N);
+  SDValue V(N, 0);
+  NewSDValueDbgMsg(V, "Creating new node: ", this);
+  return V;
+}
+
+SDValue SelectionDAG::getScatterVP(SDVTList VTs, EVT VT, const SDLoc &dl,
+                                   ArrayRef<SDValue> Ops,
+                                   MachineMemOperand *MMO,
+                                   ISD::MemIndexType IndexType) {
+  assert(Ops.size() == 7 && "Incompatible number of operands");
+
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::VP_SCATTER, VTs, Ops);
+  ID.AddInteger(VT.getRawBits());
+  ID.AddInteger(getSyntheticNodeSubclassData<VPScatterSDNode>(
+      dl.getIROrder(), VTs, VT, MMO, IndexType));
+  ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
+  void *IP = nullptr;
+  if (SDNode *E = FindNodeOrInsertPos(ID, dl, IP)) {
+    cast<VPScatterSDNode>(E)->refineAlignment(MMO);
+    return SDValue(E, 0);
+  }
+  auto *N = newSDNode<VPScatterSDNode>(dl.getIROrder(), dl.getDebugLoc(), VTs,
+                                       VT, MMO, IndexType);
+  createOperands(N, Ops);
+
+  assert(N->getMask().getValueType().getVectorElementCount() ==
+             N->getValue().getValueType().getVectorElementCount() &&
+         "Vector width mismatch between mask and data");
+  assert(
+      N->getIndex().getValueType().getVectorElementCount().isScalable() ==
+          N->getValue().getValueType().getVectorElementCount().isScalable() &&
+      "Scalable flags of index and data do not match");
+  assert(ElementCount::isKnownGE(
+             N->getIndex().getValueType().getVectorElementCount(),
+             N->getValue().getValueType().getVectorElementCount()) &&
+         "Vector width mismatch between index and data");
+  assert(isa<ConstantSDNode>(N->getScale()) &&
+         cast<ConstantSDNode>(N->getScale())->getAPIntValue().isPowerOf2() &&
+         "Scale should be a constant power of 2");
+
+  CSEMap.InsertNode(N, IP);
+  InsertNode(N);
+  SDValue V(N, 0);
+  NewSDValueDbgMsg(V, "Creating new node: ", this);
+  return V;
+}
+
 SDValue SelectionDAG::getMaskedLoad(EVT VT, const SDLoc &dl, SDValue Chain,
                                     SDValue Base, SDValue Offset, SDValue Mask,
                                     SDValue PassThru, EVT MemVT,
@@ -7818,7 +8189,7 @@ SDValue SelectionDAG::simplifySelect(SDValue Cond, SDValue T, SDValue F) {
   // select true, T, F --> T
   // select false, T, F --> F
   if (auto *CondC = dyn_cast<ConstantSDNode>(Cond))
-    return CondC->isNullValue() ? F : T;
+    return CondC->isZero() ? F : T;
 
   // TODO: This should simplify VSELECT with constant condition using something
   // like this (but check boolean contents to be complete?):
@@ -9296,7 +9667,7 @@ void SelectionDAG::CreateTopologicalOrder(std::vector<SDNode *> &Order) {
 }
 
 #ifndef NDEBUG
-void SelectionDAG::VerifyDAGDiverence() {
+void SelectionDAG::VerifyDAGDivergence() {
   std::vector<SDNode *> TopoOrder;
   CreateTopologicalOrder(TopoOrder);
   for (auto *N : TopoOrder) {
@@ -9384,21 +9755,20 @@ unsigned SelectionDAG::AssignTopologicalOrder() {
   // before SortedPos will contain the topological sort index, and the
   // Node Id fields for nodes At SortedPos and after will contain the
   // count of outstanding operands.
-  for (allnodes_iterator I = allnodes_begin(),E = allnodes_end(); I != E; ) {
-    SDNode *N = &*I++;
-    checkForCycles(N, this);
-    unsigned Degree = N->getNumOperands();
+  for (SDNode &N : llvm::make_early_inc_range(allnodes())) {
+    checkForCycles(&N, this);
+    unsigned Degree = N.getNumOperands();
     if (Degree == 0) {
       // A node with no uses, add it to the result array immediately.
-      N->setNodeId(DAGSize++);
-      allnodes_iterator Q(N);
+      N.setNodeId(DAGSize++);
+      allnodes_iterator Q(&N);
       if (Q != SortedPos)
         SortedPos = AllNodes.insert(SortedPos, AllNodes.remove(Q));
       assert(SortedPos != AllNodes.end() && "Overran node list");
       ++SortedPos;
     } else {
       // Temporarily use the Node Id as scratch space for the degree count.
-      N->setNodeId(Degree);
+      N.setNodeId(Degree);
     }
   }
 
@@ -9512,12 +9882,9 @@ SDValue SelectionDAG::getSymbolFunctionGlobalAddress(SDValue Op,
     std::string ErrorStr;
     raw_string_ostream ErrorFormatter(ErrorStr);
-
     ErrorFormatter << "Undefined external symbol ";
     ErrorFormatter << '"' << Symbol << '"';
-    ErrorFormatter.flush();
-
-    report_fatal_error(ErrorStr);
+    report_fatal_error(Twine(ErrorFormatter.str()));
   }
 
 //===----------------------------------------------------------------------===//
@@ -9526,7 +9893,7 @@ SDValue SelectionDAG::getSymbolFunctionGlobalAddress(SDValue Op,
 
 bool llvm::isNullConstant(SDValue V) {
   ConstantSDNode *Const = dyn_cast<ConstantSDNode>(V);
-  return Const != nullptr && Const->isNullValue();
+  return Const != nullptr && Const->isZero();
 }
 
 bool llvm::isNullFPConstant(SDValue V) {
@@ -9536,7 +9903,7 @@ bool llvm::isNullFPConstant(SDValue V) {
 
 bool llvm::isAllOnesConstant(SDValue V) {
   ConstantSDNode *Const = dyn_cast<ConstantSDNode>(V);
-  return Const != nullptr && Const->isAllOnesValue();
+  return Const != nullptr && Const->isAllOnes();
 }
 
 bool llvm::isOneConstant(SDValue V) {
@@ -9670,7 +10037,7 @@ bool llvm::isNullOrNullSplat(SDValue N, bool AllowUndefs) {
   // TODO: may want to use peekThroughBitcast() here.
   ConstantSDNode *C =
       isConstOrConstSplat(N, AllowUndefs, /*AllowTruncation=*/true);
-  return C && C->isNullValue();
+  return C && C->isZero();
 }
 
 bool llvm::isOneOrOneSplat(SDValue N, bool AllowUndefs) {
@@ -9684,7 +10051,7 @@ bool llvm::isAllOnesOrAllOnesSplat(SDValue N, bool AllowUndefs) {
   N = peekThroughBitcasts(N);
   unsigned BitWidth = N.getScalarValueSizeInBits();
   ConstantSDNode *C = isConstOrConstSplat(N, AllowUndefs);
-  return C && C->isAllOnesValue() && C->getValueSizeInBits(0) == BitWidth;
+  return C && C->isAllOnes() && C->getValueSizeInBits(0) == BitWidth;
 }
 
 HandleSDNode::~HandleSDNode() {
@@ -9790,8 +10157,7 @@ bool SDNode::hasAnyUseOfValue(unsigned Value) const {
 
 /// isOnlyUserOf - Return true if this node is the only use of N.
 bool SDNode::isOnlyUserOf(const SDNode *N) const {
   bool Seen = false;
-  for (SDNode::use_iterator I = N->use_begin(), E = N->use_end(); I != E; ++I) {
-    SDNode *User = *I;
+  for (const SDNode *User : N->uses()) {
     if (User == this)
       Seen = true;
     else
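AssignTopologicalOrder above now iterates with llvm::make_early_inc_range, which advances the iterator before yielding the element, so the loop body may unlink or move the current node (here via AllNodes.remove/insert) without invalidating the traversal. A minimal sketch of the same idea over std::list, using a hand-rolled advance-early loop rather than the LLVM helper:

#include <cassert>
#include <list>

int main() {
  std::list<int> L = {1, 2, 3, 4};
  for (auto It = L.begin(); It != L.end();) {
    auto Cur = It++;    // advance first, like make_early_inc_range
    if (*Cur % 2 == 0)
      L.erase(Cur);     // erasing Cur leaves It valid
  }
  assert(L == std::list<int>({1, 3}));
  return 0;
}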
@@ -9804,8 +10170,7 @@ bool SDNode::isOnlyUserOf(const SDNode *N) const {
 
 /// Return true if the only users of N are contained in Nodes.
 bool SDNode::areOnlyUsersOf(ArrayRef<const SDNode *> Nodes, const SDNode *N) {
   bool Seen = false;
-  for (SDNode::use_iterator I = N->use_begin(), E = N->use_end(); I != E; ++I) {
-    SDNode *User = *I;
+  for (const SDNode *User : N->uses()) {
     if (llvm::is_contained(Nodes, User))
       Seen = true;
     else
@@ -10212,14 +10577,14 @@ SelectionDAG::GetDependentSplitDestVTs(const EVT &VT, const EVT &EnvVT,
          "Mixing fixed width and scalable vectors when enveloping a type");
   EVT LoVT, HiVT;
   if (VTNumElts.getKnownMinValue() > EnvNumElts.getKnownMinValue()) {
-    LoVT = EnvVT;
+    LoVT = EVT::getVectorVT(*getContext(), EltTp, EnvNumElts);
     HiVT = EVT::getVectorVT(*getContext(), EltTp, VTNumElts - EnvNumElts);
     *HiIsEmpty = false;
   } else {
     // Flag that hi type has zero storage size, but return split envelop type
     // (this would be easier if vector types with zero elements were allowed).
     LoVT = EVT::getVectorVT(*getContext(), EltTp, VTNumElts);
-    HiVT = EnvVT;
+    HiVT = EVT::getVectorVT(*getContext(), EltTp, EnvNumElts);
     *HiIsEmpty = true;
   }
   return std::make_pair(LoVT, HiVT);
@@ -10387,7 +10752,7 @@ SDValue BuildVectorSDNode::getSplatValue(const APInt &DemandedElts,
 }
 
 SDValue BuildVectorSDNode::getSplatValue(BitVector *UndefElements) const {
-  APInt DemandedElts = APInt::getAllOnesValue(getNumOperands());
+  APInt DemandedElts = APInt::getAllOnes(getNumOperands());
   return getSplatValue(DemandedElts, UndefElements);
 }
 
@@ -10439,7 +10804,7 @@ bool BuildVectorSDNode::getRepeatedSequence(const APInt &DemandedElts,
 
 bool BuildVectorSDNode::getRepeatedSequence(SmallVectorImpl<SDValue> &Sequence,
                                             BitVector *UndefElements) const {
-  APInt DemandedElts = APInt::getAllOnesValue(getNumOperands());
+  APInt DemandedElts = APInt::getAllOnes(getNumOperands());
   return getRepeatedSequence(DemandedElts, Sequence, UndefElements);
 }
 
@@ -10485,6 +10850,97 @@ BuildVectorSDNode::getConstantFPSplatPow2ToLog2Int(BitVector *UndefElements,
   return -1;
 }
 
+bool BuildVectorSDNode::getConstantRawBits(
+    bool IsLittleEndian, unsigned DstEltSizeInBits,
+    SmallVectorImpl<APInt> &RawBitElements, BitVector &UndefElements) const {
+  // Early-out if this contains anything but Undef/Constant/ConstantFP.
+  if (!isConstant())
+    return false;
+
+  unsigned NumSrcOps = getNumOperands();
+  unsigned SrcEltSizeInBits = getValueType(0).getScalarSizeInBits();
+  assert(((NumSrcOps * SrcEltSizeInBits) % DstEltSizeInBits) == 0 &&
+         "Invalid bitcast scale");
+
+  // Extract raw src bits.
+  SmallVector<APInt> SrcBitElements(NumSrcOps,
+                                    APInt::getNullValue(SrcEltSizeInBits));
+  BitVector SrcUndeElements(NumSrcOps, false);
+
+  for (unsigned I = 0; I != NumSrcOps; ++I) {
+    SDValue Op = getOperand(I);
+    if (Op.isUndef()) {
+      SrcUndeElements.set(I);
+      continue;
+    }
+    auto *CInt = dyn_cast<ConstantSDNode>(Op);
+    auto *CFP = dyn_cast<ConstantFPSDNode>(Op);
+    assert((CInt || CFP) && "Unknown constant");
+    SrcBitElements[I] =
+        CInt ? CInt->getAPIntValue().truncOrSelf(SrcEltSizeInBits)
             : CFP->getValueAPF().bitcastToAPInt();
+  }
+
+  // Recast to dst width.
+  recastRawBits(IsLittleEndian, DstEltSizeInBits, RawBitElements,
+                SrcBitElements, UndefElements, SrcUndeElements);
+  return true;
+}
+
+void BuildVectorSDNode::recastRawBits(bool IsLittleEndian,
+                                      unsigned DstEltSizeInBits,
+                                      SmallVectorImpl<APInt> &DstBitElements,
+                                      ArrayRef<APInt> SrcBitElements,
+                                      BitVector &DstUndefElements,
+                                      const BitVector &SrcUndefElements) {
+  unsigned NumSrcOps = SrcBitElements.size();
+  unsigned SrcEltSizeInBits = SrcBitElements[0].getBitWidth();
+  assert(((NumSrcOps * SrcEltSizeInBits) % DstEltSizeInBits) == 0 &&
+         "Invalid bitcast scale");
+  assert(NumSrcOps == SrcUndefElements.size() &&
+         "Vector size mismatch");
+
+  unsigned NumDstOps = (NumSrcOps * SrcEltSizeInBits) / DstEltSizeInBits;
+  DstUndefElements.clear();
+  DstUndefElements.resize(NumDstOps, false);
+  DstBitElements.assign(NumDstOps, APInt::getNullValue(DstEltSizeInBits));
+
+  // Concatenate src elements constant bits together into dst element.
+  if (SrcEltSizeInBits <= DstEltSizeInBits) {
+    unsigned Scale = DstEltSizeInBits / SrcEltSizeInBits;
+    for (unsigned I = 0; I != NumDstOps; ++I) {
+      DstUndefElements.set(I);
+      APInt &DstBits = DstBitElements[I];
+      for (unsigned J = 0; J != Scale; ++J) {
+        unsigned Idx = (I * Scale) + (IsLittleEndian ? J : (Scale - J - 1));
+        if (SrcUndefElements[Idx])
+          continue;
+        DstUndefElements.reset(I);
+        const APInt &SrcBits = SrcBitElements[Idx];
+        assert(SrcBits.getBitWidth() == SrcEltSizeInBits &&
+               "Illegal constant bitwidths");
+        DstBits.insertBits(SrcBits, J * SrcEltSizeInBits);
+      }
+    }
+    return;
+  }
+
+  // Split src element constant bits into dst elements.
+  unsigned Scale = SrcEltSizeInBits / DstEltSizeInBits;
+  for (unsigned I = 0; I != NumSrcOps; ++I) {
+    if (SrcUndefElements[I]) {
+      DstUndefElements.set(I * Scale, (I + 1) * Scale);
+      continue;
+    }
+    const APInt &SrcBits = SrcBitElements[I];
+    for (unsigned J = 0; J != Scale; ++J) {
+      unsigned Idx = (I * Scale) + (IsLittleEndian ? J : (Scale - J - 1));
+      APInt &DstBits = DstBitElements[Idx];
+      DstBits = SrcBits.extractBits(DstEltSizeInBits, J * DstEltSizeInBits);
+    }
+  }
+}
+
 bool BuildVectorSDNode::isConstant() const {
   for (const SDValue &Op : op_values()) {
     unsigned Opc = Op.getOpcode();