vendor/llvm/llvm-trunk-r291274

author: Dimitry Andric <dim@FreeBSD.org> 2017-01-06 20:13:21 +0000
committer: Dimitry Andric <dim@FreeBSD.org> 2017-01-06 20:13:21 +0000
commit: 7e7b6700743285c0af506ac6299ddf82ebd434b9 (patch)
tree: 578d2ea1868b77f3dff145df7f8f3fe73272c09e /lib/Target/ARM/ARMTargetTransformInfo.cpp
parent: 4b570baa7e867c652fa7d690585098278082fae9 (diff)
1 files changed, 5 insertions, 2 deletions
diff --git a/lib/Target/ARM/ARMTargetTransformInfo.cpp b/lib/Target/ARM/ARMTargetTransformInfo.cpp
index 10e6297ef1ed6..cc001b596785e 100644
--- a/lib/Target/ARM/ARMTargetTransformInfo.cpp
+++ b/lib/Target/ARM/ARMTargetTransformInfo.cpp
@@ -338,14 +338,17 @@ int ARMTTIImpl::getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy) {
   return BaseT::getCmpSelInstrCost(Opcode, ValTy, CondTy);
 }
 
-int ARMTTIImpl::getAddressComputationCost(Type *Ty, bool IsComplex) {
+int ARMTTIImpl::getAddressComputationCost(Type *Ty, ScalarEvolution *SE,
+                                          const SCEV *Ptr) {
   // Address computations in vectorized code with non-consecutive addresses will
   // likely result in more instructions compared to scalar code where the
   // computation can more often be merged into the index mode. The resulting
   // extra micro-ops can significantly decrease throughput.
   unsigned NumVectorInstToHideOverhead = 10;
+  int MaxMergeDistance = 64;
 
-  if (Ty->isVectorTy() && IsComplex)
+  if (Ty->isVectorTy() && SE && 
+      !BaseT::isConstantStridedAccessLessThan(SE, Ptr, MaxMergeDistance + 1))
     return NumVectorInstToHideOverhead;
 
   // In many cases the address computation is not merged into the instruction
author	Dimitry Andric <dim@FreeBSD.org>	2017-01-06 20:13:21 +0000
committer	Dimitry Andric <dim@FreeBSD.org>	2017-01-06 20:13:21 +0000
commit	7e7b6700743285c0af506ac6299ddf82ebd434b9 (patch)
tree	578d2ea1868b77f3dff145df7f8f3fe73272c09e /lib/Target/ARM/ARMTargetTransformInfo.cpp
parent	4b570baa7e867c652fa7d690585098278082fae9 (diff)