author     Dimitry Andric <dim@FreeBSD.org>    2023-10-21 13:31:11 +0000
committer  Dimitry Andric <dim@FreeBSD.org>    2023-12-08 17:35:41 +0000
commit     bdb86d1a853a919764f65fdedcea76d76e4d619b (patch)
tree       9192288f53762443b0d7453fd2d49bbbe0e344eb /contrib/llvm-project/llvm/lib/Target
parent     3bd749dbd90cc3b95719b65393df5ca8a0fe919d (diff)
parent     cd255c5cf2441442b46200d298c0cbccf83caba5 (diff)
Diffstat (limited to 'contrib/llvm-project/llvm/lib/Target')
3 files changed, 25 insertions, 5 deletions
diff --git a/contrib/llvm-project/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp b/contrib/llvm-project/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
index a1753a40a117..6e721b937846 100644
--- a/contrib/llvm-project/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
+++ b/contrib/llvm-project/llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
@@ -1033,7 +1033,12 @@ AArch64TargetLowering::AArch64TargetLowering(const TargetMachine &TM,
   // Set required alignment.
   setMinFunctionAlignment(Align(4));
   // Set preferred alignments.
-  setPrefLoopAlignment(STI.getPrefLoopAlignment());
+
+  // Don't align loops on Windows. The SEH unwind info generation needs to
+  // know the exact length of functions before the alignments have been
+  // expanded.
+  if (!Subtarget->isTargetWindows())
+    setPrefLoopAlignment(STI.getPrefLoopAlignment());
   setMaxBytesForAlignment(STI.getMaxBytesForLoopAlignment());
   setPrefFunctionAlignment(STI.getPrefFunctionAlignment());

diff --git a/contrib/llvm-project/llvm/lib/Target/PowerPC/PPCISelLowering.cpp b/contrib/llvm-project/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
index 3ed0a261eb76..d4d2da55160e 100644
--- a/contrib/llvm-project/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
+++ b/contrib/llvm-project/llvm/lib/Target/PowerPC/PPCISelLowering.cpp
@@ -15527,7 +15527,7 @@ SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
       break;
     SDValue ConstOp = DAG.getConstant(Imm, dl, MVT::i32);
     SDValue NarrowAnd = DAG.getNode(ISD::AND, dl, MVT::i32, NarrowOp, ConstOp);
-    return DAG.getAnyExtOrTrunc(NarrowAnd, dl, N->getValueType(0));
+    return DAG.getZExtOrTrunc(NarrowAnd, dl, N->getValueType(0));
   }
   case ISD::SHL:
     return combineSHL(N, DCI);
diff --git a/contrib/llvm-project/llvm/lib/Target/X86/X86ISelLowering.cpp b/contrib/llvm-project/llvm/lib/Target/X86/X86ISelLowering.cpp
index d9750ea22e2b..0f1cb5f1e236 100644
--- a/contrib/llvm-project/llvm/lib/Target/X86/X86ISelLowering.cpp
+++ b/contrib/llvm-project/llvm/lib/Target/X86/X86ISelLowering.cpp
@@ -48539,13 +48539,28 @@ static SDValue combineSetCCMOVMSK(SDValue EFLAGS, X86::CondCode &CC,
   }

   // MOVMSK(SHUFFLE(X,u)) -> MOVMSK(X) iff every element is referenced.
-  SmallVector<int, 32> ShuffleMask;
+  // Since we peek through a bitcast, we need to be careful if the base vector
+  // type has smaller elements than the MOVMSK type. In that case, even if
+  // all the elements are demanded by the shuffle mask, only the "high"
+  // elements which have highbits that align with highbits in the MOVMSK vec
+  // elements are actually demanded. A simplification of spurious operations
+  // on the "low" elements take place during other simplifications.
+  //
+  // For example:
+  // MOVMSK64(BITCAST(SHUF32 X, (1,0,3,2))) even though all the elements are
+  // demanded, because we are swapping around the result can change.
+  //
+  // To address this, we check that we can scale the shuffle mask to MOVMSK
+  // element width (this will ensure "high" elements match). Its slightly overly
+  // conservative, but fine for an edge case fold.
+  SmallVector<int, 32> ShuffleMask, ScaledMaskUnused;
   SmallVector<SDValue, 2> ShuffleInputs;
   if (NumElts <= CmpBits &&
       getTargetShuffleInputs(peekThroughBitcasts(Vec), ShuffleInputs,
                              ShuffleMask, DAG) &&
       ShuffleInputs.size() == 1 && !isAnyZeroOrUndef(ShuffleMask) &&
-      ShuffleInputs[0].getValueSizeInBits() == VecVT.getSizeInBits()) {
+      ShuffleInputs[0].getValueSizeInBits() == VecVT.getSizeInBits() &&
+      scaleShuffleElements(ShuffleMask, NumElts, ScaledMaskUnused)) {
     unsigned NumShuffleElts = ShuffleMask.size();
     APInt DemandedElts = APInt::getZero(NumShuffleElts);
     for (int M : ShuffleMask) {
@@ -57239,7 +57254,7 @@ static SDValue combineConcatVectorOps(const SDLoc &DL, MVT VT,
   // TODO - combineX86ShufflesRecursively should handle shuffle concatenation
   // but it currently struggles with different vector widths.
   if (llvm::all_of(Ops, [Op0](SDValue Op) {
-        return Op.getOpcode() == Op0.getOpcode();
+        return Op.getOpcode() == Op0.getOpcode() && Op.hasOneUse();
       })) {
     auto ConcatSubOperand = [&](EVT VT, ArrayRef<SDValue> SubOps, unsigned I) {
       SmallVector<SDValue> Subs;
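
Editorial note on the MOVMSK hunk above: the in-code comment's MOVMSK64(BITCAST(SHUF32 X, (1,0,3,2))) example can be reproduced with plain scalar code. The following is a minimal standalone C++ sketch, not LLVM code and not part of the commit; the names V4i32, movmsk64 and shuf_1032 are made up for illustration. It models a 128-bit vector as four 32-bit lanes: the (1,0,3,2) shuffle references every element, yet it moves a different bit into the sign-bit position that a 64-bit MOVMSK reads, so folding MOVMSK(SHUFFLE(X)) to MOVMSK(X) would change the result.

// Standalone sketch only: scalar model of MOVMSK64(BITCAST(SHUF32 X, (1,0,3,2))).
#include <array>
#include <cstdint>
#include <cstdio>

// A 128-bit vector as four 32-bit lanes; v[0] is the lowest lane.
using V4i32 = std::array<uint32_t, 4>;

// MOVMSK over the same bytes viewed as two 64-bit lanes (little endian):
// gather the sign bit (bit 63) of each 64-bit element.
static unsigned movmsk64(const V4i32 &v) {
  unsigned mask = 0;
  for (int i = 0; i < 2; ++i) {
    uint64_t elt = (static_cast<uint64_t>(v[2 * i + 1]) << 32) | v[2 * i];
    mask |= static_cast<unsigned>(elt >> 63) << i;
  }
  return mask;
}

// 32-bit shuffle with mask (1,0,3,2): swaps the halves of each 64-bit lane,
// so every input element is still referenced.
static V4i32 shuf_1032(const V4i32 &v) { return {v[1], v[0], v[3], v[2]}; }

int main() {
  // Lane 1 has its top bit set; after the swap that bit no longer sits in a
  // position MOVMSK64 samples, so the two masks differ (prints 1 and 0).
  V4i32 x = {0x00000000u, 0x80000000u, 0x00000000u, 0x00000000u};
  std::printf("movmsk64(x) = %u, movmsk64(shuf(x)) = %u\n",
              movmsk64(x), movmsk64(shuf_1032(x)));
  return 0;
}

Requiring scaleShuffleElements to succeed at the MOVMSK element width, as the hunk does, rejects exactly this kind of sub-element swap while still allowing masks that move whole 64-bit elements.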