diff options
Diffstat (limited to 'lib/CodeGen/SelectionDAG/DAGCombiner.cpp')
| -rw-r--r-- | lib/CodeGen/SelectionDAG/DAGCombiner.cpp | 161 | 
1 files changed, 111 insertions, 50 deletions
| diff --git a/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/lib/CodeGen/SelectionDAG/DAGCombiner.cpp index 71382c18fdf9d..d5d3f7a61a9f9 100644 --- a/lib/CodeGen/SelectionDAG/DAGCombiner.cpp +++ b/lib/CodeGen/SelectionDAG/DAGCombiner.cpp @@ -3889,9 +3889,8 @@ SDValue DAGCombiner::visitAND(SDNode *N) {    // Note: the SimplifyDemandedBits fold below can make an information-losing    // transform, and then we have no way to find this better fold.    if (N1C && N1C->isOne() && N0.getOpcode() == ISD::SUB) { -    ConstantSDNode *SubLHS = isConstOrConstSplat(N0.getOperand(0)); -    SDValue SubRHS = N0.getOperand(1); -    if (SubLHS && SubLHS->isNullValue()) { +    if (isNullConstantOrNullSplatConstant(N0.getOperand(0))) { +      SDValue SubRHS = N0.getOperand(1);        if (SubRHS.getOpcode() == ISD::ZERO_EXTEND &&            SubRHS.getOperand(0).getScalarValueSizeInBits() == 1)          return SubRHS; @@ -4586,6 +4585,20 @@ SDNode *DAGCombiner::MatchRotatePosNeg(SDValue Shifted, SDValue Pos,    return nullptr;  } +// if Left + Right == Sum (constant or constant splat vector) +static bool sumMatchConstant(SDValue Left, SDValue Right, unsigned Sum, +                             SelectionDAG &DAG, const SDLoc &DL) { +  EVT ShiftVT = Left.getValueType(); +  if (ShiftVT != Right.getValueType()) return false; + +  SDValue ShiftSum = DAG.FoldConstantArithmetic(ISD::ADD, DL, ShiftVT, +                         Left.getNode(), Right.getNode()); +  if (!ShiftSum) return false; + +  ConstantSDNode *CSum = isConstOrConstSplat(ShiftSum); +  return CSum && CSum->getZExtValue() == Sum; +} +  // MatchRotate - Handle an 'or' of two operands.  If this is one of the many  // idioms for rotate, and if the target supports rotation instructions, generate  // a rot[lr]. @@ -4631,30 +4644,24 @@ SDNode *DAGCombiner::MatchRotate(SDValue LHS, SDValue RHS, const SDLoc &DL) {    // fold (or (shl x, C1), (srl x, C2)) -> (rotl x, C1)    // fold (or (shl x, C1), (srl x, C2)) -> (rotr x, C2) -  if (isConstOrConstSplat(LHSShiftAmt) && isConstOrConstSplat(RHSShiftAmt)) { -    uint64_t LShVal = isConstOrConstSplat(LHSShiftAmt)->getZExtValue(); -    uint64_t RShVal = isConstOrConstSplat(RHSShiftAmt)->getZExtValue(); -    if ((LShVal + RShVal) != EltSizeInBits) -      return nullptr; - +  if (sumMatchConstant(LHSShiftAmt, RHSShiftAmt, EltSizeInBits, DAG, DL)) {      SDValue Rot = DAG.getNode(HasROTL ? ISD::ROTL : ISD::ROTR, DL, VT,                                LHSShiftArg, HasROTL ? LHSShiftAmt : RHSShiftAmt);      // If there is an AND of either shifted operand, apply it to the result.      if (LHSMask.getNode() || RHSMask.getNode()) { -      SDValue Mask = DAG.getAllOnesConstant(DL, VT); +      SDValue AllOnes = DAG.getAllOnesConstant(DL, VT); +      SDValue Mask = AllOnes;        if (LHSMask.getNode()) { -        APInt RHSBits = APInt::getLowBitsSet(EltSizeInBits, LShVal); +        SDValue RHSBits = DAG.getNode(ISD::SRL, DL, VT, AllOnes, RHSShiftAmt);          Mask = DAG.getNode(ISD::AND, DL, VT, Mask, -                           DAG.getNode(ISD::OR, DL, VT, LHSMask, -                                       DAG.getConstant(RHSBits, DL, VT))); +                           DAG.getNode(ISD::OR, DL, VT, LHSMask, RHSBits));        }        if (RHSMask.getNode()) { -        APInt LHSBits = APInt::getHighBitsSet(EltSizeInBits, RShVal); +        SDValue LHSBits = DAG.getNode(ISD::SHL, DL, VT, AllOnes, LHSShiftAmt);          Mask = DAG.getNode(ISD::AND, DL, VT, Mask, -                           DAG.getNode(ISD::OR, DL, VT, RHSMask, -                                       DAG.getConstant(LHSBits, DL, VT))); +                           DAG.getNode(ISD::OR, DL, VT, RHSMask, LHSBits));        }        Rot = DAG.getNode(ISD::AND, DL, VT, Rot, Mask); @@ -5272,11 +5279,21 @@ SDValue DAGCombiner::visitRotate(SDNode *N) {    SDValue N0 = N->getOperand(0);    SDValue N1 = N->getOperand(1);    EVT VT = N->getValueType(0); +  unsigned Bitsize = VT.getScalarSizeInBits();    // fold (rot x, 0) -> x    if (isNullConstantOrNullSplatConstant(N1))      return N0; +  // fold (rot x, c) -> (rot x, c % BitSize) +  if (ConstantSDNode *Cst = isConstOrConstSplat(N1)) { +    if (Cst->getAPIntValue().uge(Bitsize)) { +      uint64_t RotAmt = Cst->getAPIntValue().urem(Bitsize); +      return DAG.getNode(N->getOpcode(), dl, VT, N0, +                         DAG.getConstant(RotAmt, dl, N1.getValueType())); +    } +  } +    // fold (rot* x, (trunc (and y, c))) -> (rot* x, (and (trunc y), (trunc c))).    if (N1.getOpcode() == ISD::TRUNCATE &&        N1.getOperand(0).getOpcode() == ISD::AND) { @@ -5286,22 +5303,24 @@ SDValue DAGCombiner::visitRotate(SDNode *N) {    unsigned NextOp = N0.getOpcode();    // fold (rot* (rot* x, c2), c1) -> (rot* x, c1 +- c2 % bitsize) -  if (NextOp == ISD::ROTL || NextOp == ISD::ROTR) -    if (SDNode *C1 = DAG.isConstantIntBuildVectorOrConstantInt(N1)) -      if (SDNode *C2 = -          DAG.isConstantIntBuildVectorOrConstantInt(N0.getOperand(1))) { -        bool SameSide = (N->getOpcode() == NextOp); -        unsigned CombineOp = SameSide ? ISD::ADD : ISD::SUB; -        if (SDValue CombinedShift = -            DAG.FoldConstantArithmetic(CombineOp, dl, VT, C1, C2)) { -          unsigned Bitsize = VT.getScalarSizeInBits(); -          SDValue BitsizeC = DAG.getConstant(Bitsize, dl, VT); -          SDValue CombinedShiftNorm = DAG.FoldConstantArithmetic( -            ISD::SREM, dl, VT, CombinedShift.getNode(), BitsizeC.getNode()); -          return DAG.getNode( -            N->getOpcode(), dl, VT, N0->getOperand(0), CombinedShiftNorm); -        } +  if (NextOp == ISD::ROTL || NextOp == ISD::ROTR) { +    SDNode *C1 = DAG.isConstantIntBuildVectorOrConstantInt(N1); +    SDNode *C2 = DAG.isConstantIntBuildVectorOrConstantInt(N0.getOperand(1)); +    if (C1 && C2 && C1->getValueType(0) == C2->getValueType(0)) { +      EVT ShiftVT = C1->getValueType(0); +      bool SameSide = (N->getOpcode() == NextOp); +      unsigned CombineOp = SameSide ? ISD::ADD : ISD::SUB; +      if (SDValue CombinedShift = +              DAG.FoldConstantArithmetic(CombineOp, dl, ShiftVT, C1, C2)) { +        SDValue BitsizeC = DAG.getConstant(Bitsize, dl, ShiftVT); +        SDValue CombinedShiftNorm = DAG.FoldConstantArithmetic( +            ISD::SREM, dl, ShiftVT, CombinedShift.getNode(), +            BitsizeC.getNode()); +        return DAG.getNode(N->getOpcode(), dl, VT, N0->getOperand(0), +                           CombinedShiftNorm);        } +    } +  }    return SDValue();  } @@ -7152,8 +7171,14 @@ SDValue DAGCombiner::visitSIGN_EXTEND(SDNode *N) {        SDValue Trunc = DAG.getNode(ISD::TRUNCATE, SDLoc(N0),                                    N0.getValueType(), ExtLoad);        ExtendSetCCUses(SetCCs, Trunc, ExtLoad, DL, ISD::SIGN_EXTEND); -      CombineTo(N0.getNode(), Trunc, ExtLoad.getValue(1)); -      return CombineTo(N, ExtLoad); // Return N so it doesn't get rechecked! +      // If the load value is used only by N, replace it via CombineTo N. +      bool NoReplaceTrunc = SDValue(LN0, 0).hasOneUse(); +      CombineTo(N, ExtLoad); +      if (NoReplaceTrunc) +        DAG.ReplaceAllUsesOfValueWith(SDValue(LN0, 1), ExtLoad.getValue(1)); +      else +        CombineTo(LN0, Trunc, ExtLoad.getValue(1)); +      return SDValue(N, 0);      }    } @@ -7210,8 +7235,13 @@ SDValue DAGCombiner::visitSIGN_EXTEND(SDNode *N) {                                      SDLoc(N0.getOperand(0)),                                      N0.getOperand(0).getValueType(), ExtLoad);          ExtendSetCCUses(SetCCs, Trunc, ExtLoad, DL, ISD::SIGN_EXTEND); -        CombineTo(N0.getOperand(0).getNode(), Trunc, ExtLoad.getValue(1)); -        return CombineTo(N, And); // Return N so it doesn't get rechecked! +        bool NoReplaceTrunc = SDValue(LN0, 0).hasOneUse(); +        CombineTo(N, And); +        if (NoReplaceTrunc) +          DAG.ReplaceAllUsesOfValueWith(SDValue(LN0, 1), ExtLoad.getValue(1)); +        else +          CombineTo(LN0, Trunc, ExtLoad.getValue(1)); +        return SDValue(N,0); // Return N so it doesn't get rechecked!        }      }    } @@ -7451,8 +7481,14 @@ SDValue DAGCombiner::visitZERO_EXTEND(SDNode *N) {        SDValue Trunc = DAG.getNode(ISD::TRUNCATE, SDLoc(N0),                                    N0.getValueType(), ExtLoad);        ExtendSetCCUses(SetCCs, Trunc, ExtLoad, SDLoc(N), ISD::ZERO_EXTEND); -      CombineTo(N0.getNode(), Trunc, ExtLoad.getValue(1)); -      return CombineTo(N, ExtLoad); // Return N so it doesn't get rechecked! +      // If the load value is used only by N, replace it via CombineTo N. +      bool NoReplaceTrunc = SDValue(LN0, 0).hasOneUse(); +      CombineTo(N, ExtLoad); +      if (NoReplaceTrunc) +        DAG.ReplaceAllUsesOfValueWith(SDValue(LN0, 1), ExtLoad.getValue(1)); +      else +        CombineTo(LN0, Trunc, ExtLoad.getValue(1)); +      return SDValue(N, 0); // Return N so it doesn't get rechecked!      }    } @@ -7503,8 +7539,13 @@ SDValue DAGCombiner::visitZERO_EXTEND(SDNode *N) {                                      SDLoc(N0.getOperand(0)),                                      N0.getOperand(0).getValueType(), ExtLoad);          ExtendSetCCUses(SetCCs, Trunc, ExtLoad, DL, ISD::ZERO_EXTEND); -        CombineTo(N0.getOperand(0).getNode(), Trunc, ExtLoad.getValue(1)); -        return CombineTo(N, And); // Return N so it doesn't get rechecked! +        bool NoReplaceTrunc = SDValue(LN0, 0).hasOneUse(); +        CombineTo(N, And); +        if (NoReplaceTrunc) +          DAG.ReplaceAllUsesOfValueWith(SDValue(LN0, 1), ExtLoad.getValue(1)); +        else +          CombineTo(LN0, Trunc, ExtLoad.getValue(1)); +        return SDValue(N,0); // Return N so it doesn't get rechecked!        }      }    } @@ -7676,13 +7717,18 @@ SDValue DAGCombiner::visitANY_EXTEND(SDNode *N) {                                         LN0->getChain(),                                         LN0->getBasePtr(), N0.getValueType(),                                         LN0->getMemOperand()); -      CombineTo(N, ExtLoad);        SDValue Trunc = DAG.getNode(ISD::TRUNCATE, SDLoc(N0),                                    N0.getValueType(), ExtLoad); -      CombineTo(N0.getNode(), Trunc, ExtLoad.getValue(1));        ExtendSetCCUses(SetCCs, Trunc, ExtLoad, SDLoc(N),                        ISD::ANY_EXTEND); -      return SDValue(N, 0);   // Return N so it doesn't get rechecked! +      // If the load value is used only by N, replace it via CombineTo N. +      bool NoReplaceTrunc = N0.hasOneUse(); +      CombineTo(N, ExtLoad);  +      if (NoReplaceTrunc) +        DAG.ReplaceAllUsesOfValueWith(SDValue(LN0, 1), ExtLoad.getValue(1)); +      else +        CombineTo(LN0, Trunc, ExtLoad.getValue(1)); +      return SDValue(N, 0); // Return N so it doesn't get rechecked!      }    } @@ -11373,12 +11419,8 @@ SDValue DAGCombiner::visitLOAD(SDNode *N) {        SDValue Token = DAG.getNode(ISD::TokenFactor, SDLoc(N),                                    MVT::Other, Chain, ReplLoad.getValue(1)); -      // Make sure the new and old chains are cleaned up. -      AddToWorklist(Token.getNode()); - -      // Replace uses with load result and token factor. Don't add users -      // to work list. -      return CombineTo(N, ReplLoad.getValue(0), Token, false); +      // Replace uses with load result and token factor +      return CombineTo(N, ReplLoad.getValue(0), Token);      }    } @@ -12744,7 +12786,12 @@ bool DAGCombiner::MergeConsecutiveStores(StoreSDNode *St) {               TLI.storeOfVectorConstantIsCheap(MemVT, i + 1, FirstStoreAS)) &&              !NoVectors) {            // Find a legal type for the vector store. -          EVT Ty = EVT::getVectorVT(Context, MemVT, i + 1); +          unsigned Elts = i + 1; +          if (MemVT.isVector()) { +            // When merging vector stores, get the total number of elements. +            Elts *= MemVT.getVectorNumElements(); +          } +          EVT Ty = EVT::getVectorVT(Context, MemVT.getScalarType(), Elts);            if (TLI.isTypeLegal(Ty) &&                TLI.canMergeStoresTo(FirstStoreAS, Ty, DAG) &&                TLI.allowsMemoryAccess(Context, DL, Ty, FirstStoreAS, @@ -13003,7 +13050,7 @@ bool DAGCombiner::MergeConsecutiveStores(StoreSDNode *St) {      SDValue NewStoreChain = getMergeStoreChains(StoreNodes, NumElem);      AddToWorklist(NewStoreChain.getNode()); -    MachineMemOperand::Flags MMOFlags = isDereferenceable ?  +    MachineMemOperand::Flags MMOFlags = isDereferenceable ?                                            MachineMemOperand::MODereferenceable:                                            MachineMemOperand::MONone; @@ -16703,6 +16750,20 @@ bool DAGCombiner::isAlias(LSBaseSDNode *Op0, LSBaseSDNode *Op1) const {    if (BasePtr0.equalBaseIndex(BasePtr1, DAG, PtrDiff))      return !((NumBytes0 <= PtrDiff) || (PtrDiff + NumBytes1 <= 0)); +  // If both BasePtr0 and BasePtr1 are FrameIndexes, we will not be +  // able to calculate their relative offset if at least one arises +  // from an alloca. However, these allocas cannot overlap and we +  // can infer there is no alias. +  if (auto *A = dyn_cast<FrameIndexSDNode>(BasePtr0.getBase())) +    if (auto *B = dyn_cast<FrameIndexSDNode>(BasePtr1.getBase())) { +      MachineFrameInfo &MFI = DAG.getMachineFunction().getFrameInfo(); +      // If the base are the same frame index but the we couldn't find a +      // constant offset, (indices are different) be conservative. +      if (A != B && (!MFI.isFixedObjectIndex(A->getIndex()) || +                     !MFI.isFixedObjectIndex(B->getIndex()))) +        return false; +    } +    // FIXME: findBaseOffset and ConstantValue/GlobalValue/FrameIndex analysis    // modified to use BaseIndexOffset. | 
