Vendor import of llvm trunk r242221: - src

diff options


context:
space:
mode:

author	Dimitry Andric <dim@FreeBSD.org>	2015-08-07 23:01:33 +0000
committer	Dimitry Andric <dim@FreeBSD.org>	2015-08-07 23:01:33 +0000
commit	ee8648bdac07986a0f1ec897b02ec82a2f144d46 (patch)
tree	52d1861acda1205241ee35a94aa63129c604d469 /test/CodeGen/PowerPC
parent	1a82d4c088707c791c792f6822f611b47a12bdfe (diff)

vendor/llvm/llvm-trunk-r242221

Notes

Diffstat (limited to 'test/CodeGen/PowerPC')

-rw-r--r--

test/CodeGen/PowerPC/builtins-ppc-elf2-abi.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc-crbits-onoff.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc32-nest.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc64-anyregcc.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc64-fastcc-fast-isel.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc64-fastcc.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc64-nest.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc64-patchpoint.ll

-rw-r--r--

test/CodeGen/PowerPC/ppc64-stackmap.ll

-rw-r--r--

test/CodeGen/PowerPC/recipest.ll

-rw-r--r--

test/CodeGen/PowerPC/sjlj.ll

-rw-r--r--

test/CodeGen/PowerPC/swaps-le-3.ll

-rw-r--r--

test/CodeGen/PowerPC/swaps-le-5.ll

-rw-r--r--

test/CodeGen/PowerPC/tls-store2.ll

-rw-r--r--

test/CodeGen/PowerPC/vsx-elementary-arith.ll

-rw-r--r--

test/CodeGen/PowerPC/vsx-fma-m.ll

-rw-r--r--

test/CodeGen/PowerPC/vsx-fma-sp.ll

17 files changed, 288 insertions, 55 deletions

diff --git a/test/CodeGen/PowerPC/builtins-ppc-elf2-abi.ll b/test/CodeGen/PowerPC/builtins-ppc-elf2-abi.ll
index 16dc2ccb111d..6013a412924f 100644
--- a/test/CodeGen/PowerPC/builtins-ppc-elf2-abi.ll
+++ b/test/CodeGen/PowerPC/builtins-ppc-elf2-abi.ll

@@ -134,6 +134,36 @@ entry:

; CHECK: xvcmpgtsp {{[0-9]+}}, {{[0-9]+}}, {{[0-9]+}}

}

+; Function Attrs: nounwind

+define <4 x float> @emit_xvresp(<4 x float> %a) {

+entry:

+ %a.addr = alloca <4 x float>, align 16

+ store <4 x float> %a, <4 x float>* %a.addr, align 16

+ %0 = load <4 x float>, <4 x float>* %a.addr, align 16

+ %1 = call <4 x float> @llvm.ppc.vsx.xvresp(<4 x float> %0)

+ ret <4 x float> %1

+; CHECK-LABEL: @emit_xvresp

+; CHECK: xvresp {{[0-9]+}}, {{[0-9]+}}

+; Function Attrs: nounwind

+define <2 x double> @emit_xvredp(<2 x double> %a) {

+entry:

+ %a.addr = alloca <2 x double>, align 16

+ store <2 x double> %a, <2 x double>* %a.addr, align 16

+ %0 = load <2 x double>, <2 x double>* %a.addr, align 16

+ %1 = call <2 x double> @llvm.ppc.vsx.xvredp(<2 x double> %0)

+ ret <2 x double> %1

+; CHECK-LABEL: @emit_xvredp

+; CHECK: xvredp {{[0-9]+}}, {{[0-9]+}}

+; Function Attrs: nounwind readnone

+declare <4 x float> @llvm.ppc.vsx.xvresp(<4 x float>)

+; Function Attrs: nounwind readnone

+declare <2 x double> @llvm.ppc.vsx.xvredp(<2 x double>)

; Function Attrs: nounwind readnone

declare <2 x double> @llvm.ceil.v2f64(<2 x double>)

diff --git a/test/CodeGen/PowerPC/ppc-crbits-onoff.ll b/test/CodeGen/PowerPC/ppc-crbits-onoff.ll
index 88648df5fa36..c69f30017d88 100644
--- a/test/CodeGen/PowerPC/ppc-crbits-onoff.ll
+++ b/test/CodeGen/PowerPC/ppc-crbits-onoff.ll

@@ -15,8 +15,8 @@ entry:

; CHECK-DAG: cmplwi {{[0-9]+}}, 3, 0

; CHECK-DAG: li [[REG2:[0-9]+]], 1

; CHECK-DAG: cntlzw [[REG3:[0-9]+]],

-; CHECK: isel 3, 0, [[REG2]]

-; CHECK: and 3, 3, [[REG3]]

+; CHECK: isel [[REG4:[0-9]+]], 0, [[REG2]]

+; CHECK: and 3, [[REG4]], [[REG3]]

; CHECK: blr

}

diff --git a/test/CodeGen/PowerPC/ppc32-nest.ll b/test/CodeGen/PowerPC/ppc32-nest.ll
new file mode 100644
index 000000000000..ed7bbe2b8f37
--- /dev/null
+++ b/test/CodeGen/PowerPC/ppc32-nest.ll

@@ -0,0 +1,26 @@

+; RUN: llc < %s | FileCheck %s

+target datalayout = "E-m:e-p:32:32-i64:64-n32"

+target triple = "powerpc-unknown-linux-gnu"

+; Tests that the 'nest' parameter attribute causes the relevant parameter to be

+; passed in the right register (r11 for PPC).

+define i8* @nest_receiver(i8* nest %arg) nounwind {

+; CHECK-LABEL: nest_receiver:

+; CHECK: # BB#0:

+; CHECK-NEXT: mr 3, 11

+; CHECK-NEXT: blr

+ ret i8* %arg

+define i8* @nest_caller(i8* %arg) nounwind {

+; CHECK-LABEL: nest_caller:

+; CHECK: mr 11, 3

+; CHECK-NEXT: bl nest_receiver

+; CHECK: blr

+ %result = call i8* @nest_receiver(i8* nest %arg)

+ ret i8* %result

diff --git a/test/CodeGen/PowerPC/ppc64-anyregcc.ll b/test/CodeGen/PowerPC/ppc64-anyregcc.ll
index 66f6a2c790c6..ff0768ff47ed 100644
--- a/test/CodeGen/PowerPC/ppc64-anyregcc.ll
+++ b/test/CodeGen/PowerPC/ppc64-anyregcc.ll

@@ -82,7 +82,7 @@ target triple = "powerpc64-unknown-linux-gnu"

; CHECK-NEXT: .long 3

define i64 @test() nounwind ssp uwtable {

entry:

- call anyregcc void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 0, i32 24, i8* null, i32 2, i32 1, i32 2, i64 3)

+ call anyregcc void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 0, i32 40, i8* null, i32 2, i32 1, i32 2, i64 3)

ret i64 0

}

@@ -104,7 +104,7 @@ entry:

define i64 @property_access1(i8* %obj) nounwind ssp uwtable {

entry:

%f = inttoptr i64 281474417671919 to i8*

- %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 1, i32 24, i8* %f, i32 1, i8* %obj)

+ %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 1, i32 40, i8* %f, i32 1, i8* %obj)

ret i64 %ret

}

@@ -127,7 +127,7 @@ define i64 @property_access2() nounwind ssp uwtable {

entry:

%obj = alloca i64, align 8

%f = inttoptr i64 281474417671919 to i8*

- %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 2, i32 24, i8* %f, i32 1, i64* %obj)

+ %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 2, i32 40, i8* %f, i32 1, i64* %obj)

ret i64 %ret

}

@@ -150,7 +150,7 @@ define i64 @property_access3() nounwind ssp uwtable {

entry:

%obj = alloca i64, align 8

%f = inttoptr i64 281474417671919 to i8*

- %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 3, i32 24, i8* %f, i32 0, i64* %obj)

+ %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 3, i32 40, i8* %f, i32 0, i64* %obj)

ret i64 %ret

}

@@ -232,7 +232,7 @@ entry:

define i64 @anyreg_test1(i8* %a1, i8* %a2, i8* %a3, i8* %a4, i8* %a5, i8* %a6, i8* %a7, i8* %a8, i8* %a9, i8* %a10, i8* %a11, i8* %a12, i8* %a13) nounwind ssp uwtable {

entry:

%f = inttoptr i64 281474417671919 to i8*

- %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 4, i32 24, i8* %f, i32 13, i8* %a1, i8* %a2, i8* %a3, i8* %a4, i8* %a5, i8* %a6, i8* %a7, i8* %a8, i8* %a9, i8* %a10, i8* %a11, i8* %a12, i8* %a13)

+ %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 4, i32 40, i8* %f, i32 13, i8* %a1, i8* %a2, i8* %a3, i8* %a4, i8* %a5, i8* %a6, i8* %a7, i8* %a8, i8* %a9, i8* %a10, i8* %a11, i8* %a12, i8* %a13)

ret i64 %ret

}

@@ -314,7 +314,7 @@ entry:

define i64 @anyreg_test2(i8* %a1, i8* %a2, i8* %a3, i8* %a4, i8* %a5, i8* %a6, i8* %a7, i8* %a8, i8* %a9, i8* %a10, i8* %a11, i8* %a12, i8* %a13) nounwind ssp uwtable {

entry:

%f = inttoptr i64 281474417671919 to i8*

- %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 5, i32 24, i8* %f, i32 8, i8* %a1, i8* %a2, i8* %a3, i8* %a4, i8* %a5, i8* %a6, i8* %a7, i8* %a8, i8* %a9, i8* %a10, i8* %a11, i8* %a12, i8* %a13)

+ %ret = call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 5, i32 40, i8* %f, i32 8, i8* %a1, i8* %a2, i8* %a3, i8* %a4, i8* %a5, i8* %a6, i8* %a7, i8* %a8, i8* %a9, i8* %a10, i8* %a11, i8* %a12, i8* %a13)

ret i64 %ret

}

@@ -342,7 +342,7 @@ entry:

; CHECK-NEXT: .long 0

define i64 @patchpoint_spilldef(i64 %p1, i64 %p2, i64 %p3, i64 %p4) {

entry:

- %result = tail call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 12, i32 24, i8* inttoptr (i64 0 to i8*), i32 2, i64 %p1, i64 %p2)

+ %result = tail call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 12, i32 40, i8* inttoptr (i64 0 to i8*), i32 2, i64 %p1, i64 %p2)

tail call void asm sideeffect "nop", "~{r0},~{r3},~{r4},~{r5},~{r6},~{r7},~{r8},~{r9},~{r10},~{r11},~{r12},~{r14},~{r15},~{r16},~{r17

},~{r18},~{r19},~{r20},~{r21},~{r22},~{r23},~{r24},~{r25},~{r26},~{r27},~{r28},~{r29},~{r30},~{r31}"() nounwind

ret i64 %result

@@ -384,7 +384,7 @@ define i64 @patchpoint_spillargs(i64 %p1, i64 %p2, i64 %p3, i64 %p4) {

entry:

tail call void asm sideeffect "nop", "~{r0},~{r3},~{r4},~{r5},~{r6},~{r7},~{r8},~{r9},~{r10},~{r11},~{r12},~{r14},~{r15},~{r16},~{r17

},~{r18},~{r19},~{r20},~{r21},~{r22},~{r23},~{r24},~{r25},~{r26},~{r27},~{r28},~{r29},~{r30},~{r31}"() nounwind

- %result = tail call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 13, i32 24, i8* inttoptr (i64 0 to i8*), i32 2, i64 %p1, i64 %p2, i64 %p3, i64 %p4)

+ %result = tail call anyregcc i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 13, i32 40, i8* inttoptr (i64 0 to i8*), i32 2, i64 %p1, i64 %p2, i64 %p3, i64 %p4)

ret i64 %result

}

diff --git a/test/CodeGen/PowerPC/ppc64-fastcc-fast-isel.ll b/test/CodeGen/PowerPC/ppc64-fastcc-fast-isel.ll
index f90519836c25..92d6d556738c 100644
--- a/test/CodeGen/PowerPC/ppc64-fastcc-fast-isel.ll
+++ b/test/CodeGen/PowerPC/ppc64-fastcc-fast-isel.ll

@@ -35,7 +35,7 @@ define fastcc double @f2(i64 %g1, double %f1, i64 %g2, double %f2, i64 %g3, doub

}

define void @cg2(i64 %v) #0 {

- tail call fastcc i64 @g1(i64 0, double 0.0, i64 %v, double 0.0, i64 0, double 0.0, i64 0, double 0.0)

+ call fastcc i64 @g1(i64 0, double 0.0, i64 %v, double 0.0, i64 0, double 0.0, i64 0, double 0.0)

ret void

; CHECK-LABEL: @cg2

@@ -44,11 +44,11 @@ define void @cg2(i64 %v) #0 {

}

define void @cf2(double %v) #0 {

- tail call fastcc i64 @g1(i64 0, double 0.0, i64 0, double %v, i64 0, double 0.0, i64 0, double 0.0)

+ call fastcc i64 @g1(i64 0, double 0.0, i64 0, double %v, i64 0, double 0.0, i64 0, double 0.0)

ret void

; CHECK-LABEL: @cf2

-; CHECK: mr 2, 1

+; CHECK: fmr 2, 1

; CHECK: blr

}

diff --git a/test/CodeGen/PowerPC/ppc64-fastcc.ll b/test/CodeGen/PowerPC/ppc64-fastcc.ll
index bb1365a3b675..69e15d104da8 100644
--- a/test/CodeGen/PowerPC/ppc64-fastcc.ll
+++ b/test/CodeGen/PowerPC/ppc64-fastcc.ll

@@ -521,8 +521,9 @@ define void @cv13(<4 x i32> %v) #0 {

ret void

; CHECK-LABEL: @cv13

-; CHECK: li [[REG1:[0-9]+]], 96

-; CHECK: stvx 2, 1, [[REG1]]

+; CHECK-DAG: li [[REG1:[0-9]+]], 96

+; CHECK-DAG: vor [[REG2:[0-9]+]], 2, 2

+; CHECK: stvx [[REG2]], 1, [[REG1]]

; CHECK: blr

}

@@ -531,8 +532,9 @@ define void @cv14(<4 x i32> %v) #0 {

ret void

; CHECK-LABEL: @cv14

-; CHECK: li [[REG1:[0-9]+]], 128

-; CHECK: stvx 2, 1, [[REG1]]

+; CHECK-DAG: li [[REG1:[0-9]+]], 128

+; CHECK-DAG: vor [[REG2:[0-9]+]], 2, 2

+; CHECK: stvx [[REG2]], 1, [[REG1]]

; CHECK: blr

}

diff --git a/test/CodeGen/PowerPC/ppc64-nest.ll b/test/CodeGen/PowerPC/ppc64-nest.ll
new file mode 100644
index 000000000000..9dd88db2fb5d
--- /dev/null
+++ b/test/CodeGen/PowerPC/ppc64-nest.ll

@@ -0,0 +1,42 @@

+; RUN: llc < %s | FileCheck %s

+target datalayout = "E-m:e-i64:64-n32:64"

+target triple = "powerpc64-unknown-linux-gnu"

+; Tests that the 'nest' parameter attribute causes the relevant parameter to be

+; passed in the right register (r11 for PPC).

+define i8* @nest_receiver(i8* nest %arg) nounwind {

+; CHECK-LABEL: nest_receiver:

+; CHECK: # BB#0:

+; CHECK-NEXT: mr 3, 11

+; CHECK-NEXT: blr

+ ret i8* %arg

+define i8* @nest_caller(i8* %arg) nounwind {

+; CHECK-LABEL: nest_caller:

+; CHECK: mr 11, 3

+; CHECK-NEXT: bl nest_receiver

+; CHECK: blr

+ %result = call i8* @nest_receiver(i8* nest %arg)

+ ret i8* %result

+define void @test_indirect(i32 ()* nocapture %f, i8* %p) {

+entry:

+; CHECK-LABEL: test_indirect

+; CHECK-DAG: ld [[DEST:[0-9]+]], 0(3)

+; CHECK-DAG: ld 2, 8(3)

+; CHECK-DAG: mr 11, 4

+; CHECK: mtctr [[DEST]]

+; CHECK: bctrl

+; CHECK: blr

+ %callee.knr.cast = bitcast i32 ()* %f to i32 (i8*)*

+ %call = tail call signext i32 %callee.knr.cast(i8* nest %p)

+ ret void

diff --git a/test/CodeGen/PowerPC/ppc64-patchpoint.ll b/test/CodeGen/PowerPC/ppc64-patchpoint.ll
index 67b26268a3a3..53b737ae9a0b 100644
--- a/test/CodeGen/PowerPC/ppc64-patchpoint.ll
+++ b/test/CodeGen/PowerPC/ppc64-patchpoint.ll

@@ -15,22 +15,34 @@ entry:

; CHECK-NEXT: rldic 12, 12, 32, 16

; CHECK-NEXT: oris 12, 12, 48879

; CHECK-NEXT: ori 12, 12, 51966

+; CHECK-LE-NEXT: std 2, 24(1)

+; CHECK-BE-NEXT: std 2, 40(1)

+; CHECK-BE-NEXT: ld 2, 8(12)

+; CHECK-BE-NEXT: ld 12, 0(12)

; CHECK-NEXT: mtctr 12

; CHECK-NEXT: bctrl

+; CHECK-LE-NEXT: ld 2, 24(1)

+; CHECK-BE-NEXT: ld 2, 40(1)

; CHECK: li 12, -8531

; CHECK-NEXT: rldic 12, 12, 32, 16

; CHECK-NEXT: oris 12, 12, 48879

; CHECK-NEXT: ori 12, 12, 51967

+; CHECK-LE-NEXT: std 2, 24(1)

+; CHECK-BE-NEXT: std 2, 40(1)

+; CHECK-BE-NEXT: ld 2, 8(12)

+; CHECK-BE-NEXT: ld 12, 0(12)

; CHECK-NEXT: mtctr 12

; CHECK-NEXT: bctrl

+; CHECK-LE-NEXT: ld 2, 24(1)

+; CHECK-BE-NEXT: ld 2, 40(1)

; CHECK: blr

%resolveCall2 = inttoptr i64 244837814094590 to i8*

- %result = tail call i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 2, i32 24, i8* %resolveCall2, i32 4, i64 %p1, i64 %p2, i64 %p3, i64 %p4)

+ %result = tail call i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 2, i32 40, i8* %resolveCall2, i32 4, i64 %p1, i64 %p2, i64 %p3, i64 %p4)

%resolveCall3 = inttoptr i64 244837814094591 to i8*

- tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 3, i32 24, i8* %resolveCall3, i32 2, i64 %p1, i64 %result)

+ tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 3, i32 40, i8* %resolveCall3, i32 2, i64 %p1, i64 %result)

ret i64 %result

}

@@ -65,13 +77,13 @@ entry:

%tmp81 = inttoptr i64 %tmp80 to i64*

%tmp82 = load i64, i64* %tmp81, align 8

tail call void (i64, i32, ...) @llvm.experimental.stackmap(i64 14, i32 8, i64 %arg, i64 %tmp2, i64 %tmp10, i64 %tmp82)

- tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 15, i32 32, i8* null, i32 3, i64 %arg, i64 %tmp10, i64 %tmp82)

+ tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 15, i32 48, i8* null, i32 3, i64 %arg, i64 %tmp10, i64 %tmp82)

%tmp83 = load i64, i64* %tmp33, align 8

%tmp84 = add i64 %tmp83, -24

%tmp85 = inttoptr i64 %tmp84 to i64*

%tmp86 = load i64, i64* %tmp85, align 8

tail call void (i64, i32, ...) @llvm.experimental.stackmap(i64 17, i32 8, i64 %arg, i64 %tmp10, i64 %tmp86)

- tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 18, i32 32, i8* null, i32 3, i64 %arg, i64 %tmp10, i64 %tmp86)

+ tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 18, i32 48, i8* null, i32 3, i64 %arg, i64 %tmp10, i64 %tmp86)

ret i64 10

}

diff --git a/test/CodeGen/PowerPC/ppc64-stackmap.ll b/test/CodeGen/PowerPC/ppc64-stackmap.ll
index 917fa7422512..a77339f8e475 100644
--- a/test/CodeGen/PowerPC/ppc64-stackmap.ll
+++ b/test/CodeGen/PowerPC/ppc64-stackmap.ll

@@ -112,7 +112,7 @@ target triple = "powerpc64-unknown-linux-gnu"

define void @constantargs() {

entry:

%0 = inttoptr i64 244837814094590 to i8*

- tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 1, i32 24, i8* %0, i32 0, i64 65535, i64 65536, i64 4294967295, i64 4294967296)

+ tail call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 1, i32 40, i8* %0, i32 0, i64 65535, i64 65536, i64 4294967295, i64 4294967296)

ret void

}

@@ -160,7 +160,7 @@ entry:

cold:

; OSR patchpoint with 12-byte nop-slide and 2 live vars.

%thunk = inttoptr i64 244837814094590 to i8*

- call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 4, i32 24, i8* %thunk, i32 0, i64 %a, i64 %b)

+ call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 4, i32 40, i8* %thunk, i32 0, i64 %a, i64 %b)

unreachable

ret:

ret void

@@ -176,7 +176,7 @@ ret:

define i64 @propertyRead(i64* %obj) {

entry:

%resolveRead = inttoptr i64 244837814094590 to i8*

- %result = call i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 5, i32 24, i8* %resolveRead, i32 1, i64* %obj)

+ %result = call i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 5, i32 40, i8* %resolveRead, i32 1, i64* %obj)

%add = add i64 %result, 3

ret i64 %add

}

@@ -196,7 +196,7 @@ entry:

define void @propertyWrite(i64 %dummy1, i64* %obj, i64 %dummy2, i64 %a) {

entry:

%resolveWrite = inttoptr i64 244837814094590 to i8*

- call anyregcc void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 6, i32 24, i8* %resolveWrite, i32 2, i64* %obj, i64 %a)

+ call anyregcc void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 6, i32 40, i8* %resolveWrite, i32 2, i64* %obj, i64 %a)

ret void

}

@@ -218,7 +218,7 @@ entry:

define void @jsVoidCall(i64 %dummy1, i64* %obj, i64 %arg, i64 %l1, i64 %l2) {

entry:

%resolveCall = inttoptr i64 244837814094590 to i8*

- call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 7, i32 24, i8* %resolveCall, i32 2, i64* %obj, i64 %arg, i64 %l1, i64 %l2)

+ call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 7, i32 40, i8* %resolveCall, i32 2, i64* %obj, i64 %arg, i64 %l1, i64 %l2)

ret void

}

@@ -240,7 +240,7 @@ entry:

define i64 @jsIntCall(i64 %dummy1, i64* %obj, i64 %arg, i64 %l1, i64 %l2) {

entry:

%resolveCall = inttoptr i64 244837814094590 to i8*

- %result = call i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 8, i32 24, i8* %resolveCall, i32 2, i64* %obj, i64 %arg, i64 %l1, i64 %l2)

+ %result = call i64 (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.i64(i64 8, i32 40, i8* %resolveCall, i32 2, i64* %obj, i64 %arg, i64 %l1, i64 %l2)

%add = add i64 %result, 3

ret i64 %add

}

@@ -260,7 +260,7 @@ entry:

; CHECK-NEXT: .short 31

define void @spilledValue(i64 %arg0, i64 %arg1, i64 %arg2, i64 %arg3, i64 %arg4, i64 %l0, i64 %l1, i64 %l2, i64 %l3, i64 %l4, i64 %l5, i64 %l6, i64 %l7, i64 %l8, i64 %l9, i64 %l10, i64 %l11, i64 %l12, i64 %l13, i64 %l14, i64 %l15, i64 %l16, i64 %l17, i64 %l18, i64 %l19, i64 %l20, i64 %l21, i64 %l22, i64 %l23, i64 %l24, i64 %l25, i64 %l26, i64 %l27) {

entry:

- call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 11, i32 24, i8* null, i32 5, i64 %arg0, i64 %arg1, i64 %arg2, i64 %arg3, i64 %arg4, i64 %l0, i64 %l1, i64 %l2, i64 %l3, i64 %l4, i64 %l5, i64 %l6, i64 %l7, i64 %l8, i64 %l9, i64 %l10, i64 %l11, i64 %l12, i64 %l13, i64 %l14, i64 %l15, i64 %l16, i64 %l17, i64 %l18, i64 %l19, i64 %l20, i64 %l21, i64 %l22, i64 %l23, i64 %l24, i64 %l25, i64 %l26, i64 %l27)

+ call void (i64, i32, i8*, i32, ...) @llvm.experimental.patchpoint.void(i64 11, i32 40, i8* null, i32 5, i64 %arg0, i64 %arg1, i64 %arg2, i64 %arg3, i64 %arg4, i64 %l0, i64 %l1, i64 %l2, i64 %l3, i64 %l4, i64 %l5, i64 %l6, i64 %l7, i64 %l8, i64 %l9, i64 %l10, i64 %l11, i64 %l12, i64 %l13, i64 %l14, i64 %l15, i64 %l16, i64 %l17, i64 %l18, i64 %l19, i64 %l20, i64 %l21, i64 %l22, i64 %l23, i64 %l24, i64 %l25, i64 %l26, i64 %l27)

ret void

}

diff --git a/test/CodeGen/PowerPC/recipest.ll b/test/CodeGen/PowerPC/recipest.ll
index cd77548b281b..41dcb0f5b3fc 100644
--- a/test/CodeGen/PowerPC/recipest.ll
+++ b/test/CodeGen/PowerPC/recipest.ll

@@ -1,4 +1,5 @@

; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -enable-unsafe-fp-math -mattr=-vsx | FileCheck %s

+; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -enable-unsafe-fp-math -mattr=-vsx -recip=sqrtf:0,sqrtd:0 | FileCheck %s -check-prefix=CHECK-NONR

; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -mattr=-vsx | FileCheck -check-prefix=CHECK-SAFE %s

target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"

target triple = "powerpc64-unknown-linux-gnu"

@@ -24,6 +25,13 @@ define double @foo(double %a, double %b) nounwind {

; CHECK-NEXT: fmul

; CHECK: blr

+; CHECK-NONR: @foo

+; CHECK-NONR: frsqrte

+; CHECK-NONR-NOT: fmadd

+; CHECK-NONR: fmul

+; CHECK-NONR-NOT: fmadd

+; CHECK-NONR: blr

; CHECK-SAFE: @foo

; CHECK-SAFE: fsqrt

; CHECK-SAFE: fdiv

@@ -90,6 +98,13 @@ define float @goo(float %a, float %b) nounwind {

; CHECK-NEXT: fmuls

; CHECK-NEXT: blr

+; CHECK-NONR: @goo

+; CHECK-NONR: frsqrtes

+; CHECK-NONR-NOT: fmadds

+; CHECK-NONR: fmuls

+; CHECK-NONR-NOT: fmadds

+; CHECK-NONR: blr

; CHECK-SAFE: @goo

; CHECK-SAFE: fsqrts

; CHECK-SAFE: fdivs

diff --git a/test/CodeGen/PowerPC/sjlj.ll b/test/CodeGen/PowerPC/sjlj.ll
index 62403e711968..dcbdd69d5d50 100644
--- a/test/CodeGen/PowerPC/sjlj.ll
+++ b/test/CodeGen/PowerPC/sjlj.ll

@@ -18,10 +18,10 @@ entry:

; CHECK: addi [[REG]], [[REG]], env_sigill@toc@l

; CHECK: ld 31, 0([[REG]])

; CHECK: ld [[REG2:[0-9]+]], 8([[REG]])

-; CHECK: ld 1, 16([[REG]])

-; CHECK: mtctr [[REG2]]

-; CHECK: ld 30, 32([[REG]])

-; CHECK: ld 2, 24([[REG]])

+; CHECK-DAG: ld 1, 16([[REG]])

+; CHECK-DAG: mtctr [[REG2]]

+; CHECK-DAG: ld 30, 32([[REG]])

+; CHECK-DAG: ld 2, 24([[REG]])

; CHECK: bctr

return: ; No predecessors!

diff --git a/test/CodeGen/PowerPC/swaps-le-3.ll b/test/CodeGen/PowerPC/swaps-le-3.ll
index 0c1748df9fcd..49b93976d310 100644
--- a/test/CodeGen/PowerPC/swaps-le-3.ll
+++ b/test/CodeGen/PowerPC/swaps-le-3.ll

@@ -17,8 +17,8 @@ entry:

}

; CHECK-LABEL: @test

-; CHECK: xxspltd

-; CHECK: lxvd2x

+; CHECK-DAG: xxspltd

+; CHECK-DAG: lxvd2x

; CHECK: xvadddp

; CHECK: stxvd2x

; CHECK-NOT: xxswapd

diff --git a/test/CodeGen/PowerPC/swaps-le-5.ll b/test/CodeGen/PowerPC/swaps-le-5.ll
new file mode 100644
index 000000000000..5cd739a0efa9
--- /dev/null
+++ b/test/CodeGen/PowerPC/swaps-le-5.ll

@@ -0,0 +1,70 @@

+; RUN: llc -mcpu=pwr8 -mtriple=powerpc64le-unknown-linux-gnu -O3 < %s | FileCheck %s

+; These tests verify that VSX swap optimization works for various

+; manipulations of <2 x double> vectors.

+@x = global <2 x double> <double 9.970000e+01, double -1.032220e+02>, align 16

+@z = global <2 x double> <double 2.332000e+01, double 3.111111e+01>, align 16

+define void @bar0(double %y) {

+entry:

+ %0 = load <2 x double>, <2 x double>* @x, align 16

+ %vecins = insertelement <2 x double> %0, double %y, i32 0

+ store <2 x double> %vecins, <2 x double>* @z, align 16

+ ret void

+; CHECK-LABEL: @bar0

+; CHECK-DAG: xxswapd {{[0-9]+}}, 1

+; CHECK-DAG: lxvd2x [[REG1:[0-9]+]]

+; CHECK-DAG: xxspltd [[REG2:[0-9]+]]

+; CHECK: xxpermdi [[REG3:[0-9]+]], [[REG2]], [[REG1]], 1

+; CHECK: stxvd2x [[REG3]]

+define void @bar1(double %y) {

+entry:

+ %0 = load <2 x double>, <2 x double>* @x, align 16

+ %vecins = insertelement <2 x double> %0, double %y, i32 1

+ store <2 x double> %vecins, <2 x double>* @z, align 16

+ ret void

+; CHECK-LABEL: @bar1

+; CHECK-DAG: xxswapd {{[0-9]+}}, 1

+; CHECK-DAG: lxvd2x [[REG1:[0-9]+]]

+; CHECK-DAG: xxspltd [[REG2:[0-9]+]]

+; CHECK: xxmrghd [[REG3:[0-9]+]], [[REG1]], [[REG2]]

+; CHECK: stxvd2x [[REG3]]

+define void @baz0() {

+entry:

+ %0 = load <2 x double>, <2 x double>* @z, align 16

+ %1 = load <2 x double>, <2 x double>* @x, align 16

+ %vecins = shufflevector <2 x double> %0, <2 x double> %1, <2 x i32> <i32 0, i32 2>

+ store <2 x double> %vecins, <2 x double>* @z, align 16

+ ret void

+; CHECK-LABEL: @baz0

+; CHECK: lxvd2x

+; CHECK: xxmrghd

+; CHECK: stxvd2x

+; CHECK-NOT: xxswapd

+define void @baz1() {

+entry:

+ %0 = load <2 x double>, <2 x double>* @z, align 16

+ %1 = load <2 x double>, <2 x double>* @x, align 16

+ %vecins = shufflevector <2 x double> %0, <2 x double> %1, <2 x i32> <i32 3, i32 1>

+ store <2 x double> %vecins, <2 x double>* @z, align 16

+ ret void

+; CHECK-LABEL: @baz1

+; CHECK: lxvd2x

+; CHECK: xxmrgld

+; CHECK: stxvd2x

+; CHECK-NOT: xxswapd

diff --git a/test/CodeGen/PowerPC/tls-store2.ll b/test/CodeGen/PowerPC/tls-store2.ll
index e9aa17e8c0ff..649508637f4e 100644
--- a/test/CodeGen/PowerPC/tls-store2.ll
+++ b/test/CodeGen/PowerPC/tls-store2.ll

@@ -29,6 +29,8 @@ entry:

; CHECK: addi 3, {{[0-9]+}}, __once_call@got@tlsgd@l

; CHECK: bl __tls_get_addr(__once_call@tlsgd)

; CHECK-NEXT: nop

-; CHECK: std {{[0-9]+}}, 0(3)

+; FIXME: We don't really need the copy here either, we could move the store up.

+; CHECK: mr [[REG1:[0-9]+]], 3

+; CHECK: std {{[0-9]+}}, 0([[REG1]])

declare void @__once_call_impl()

diff --git a/test/CodeGen/PowerPC/vsx-elementary-arith.ll b/test/CodeGen/PowerPC/vsx-elementary-arith.ll
index d8f76bb989e7..5416f667aef1 100644
--- a/test/CodeGen/PowerPC/vsx-elementary-arith.ll
+++ b/test/CodeGen/PowerPC/vsx-elementary-arith.ll

@@ -116,5 +116,36 @@ entry:

; CHECK: xssqrtdp {{[0-9]+}}

}

+; Vector forms

+; Function Attrs: nounwind

+define <4 x float> @emit_xvrsqrtesp() {

+entry:

+; CHECK-LABEL: @emit_xvrsqrtesp

+ %vf = alloca <4 x float>, align 16

+ %vfr = alloca <4 x float>, align 16

+ %0 = load <4 x float>, <4 x float>* %vf, align 16

+ %call = call <4 x float> @llvm.ppc.vsx.xvrsqrtesp(<4 x float> %0)

+; CHECK: xvrsqrtesp {{[0-9]+}}, {{[0-9]+}}

+ ret <4 x float> %call

+; Function Attrs: nounwind

+define <2 x double> @emit_xvrsqrtedp() {

+entry:

+; CHECK-LABEL: @emit_xvrsqrtedp

+ %vd = alloca <2 x double>, align 16

+ %vdr = alloca <2 x double>, align 16

+ %0 = load <2 x double>, <2 x double>* %vd, align 16

+ %call = call <2 x double> @llvm.ppc.vsx.xvrsqrtedp(<2 x double> %0)

+ ret <2 x double> %call

+; CHECK: xvrsqrtedp {{[0-9]+}}, {{[0-9]+}}

; Function Attrs: nounwind

declare double @sqrt(double)

+; Function Attrs: nounwind readnone

+declare <4 x float> @llvm.ppc.vsx.xvrsqrtesp(<4 x float>)

+; Function Attrs: nounwind readnone

+declare <2 x double> @llvm.ppc.vsx.xvrsqrtedp(<2 x double>)

diff --git a/test/CodeGen/PowerPC/vsx-fma-m.ll b/test/CodeGen/PowerPC/vsx-fma-m.ll
index d85927396e3e..4f556b6b79c2 100644
--- a/test/CodeGen/PowerPC/vsx-fma-m.ll
+++ b/test/CodeGen/PowerPC/vsx-fma-m.ll

@@ -49,12 +49,13 @@ entry:

; CHECK-LABEL: @test2

; CHECK-DAG: li [[C1:[0-9]+]], 8

; CHECK-DAG: li [[C2:[0-9]+]], 16

-; CHECK-DAG: xsmaddmdp 3, 2, 1

-; CHECK-DAG: xsmaddmdp 4, 2, 1

-; CHECK-DAG: xsmaddadp 1, 2, 5

-; CHECK-DAG: stxsdx 3, 0, 8

-; CHECK-DAG: stxsdx 4, 8, [[C1]]

-; CHECK-DAG: stxsdx 1, 8, [[C2]]

+; FIXME: We no longer get this because of copy ordering at the MI level.

+; CHECX-DAG: xsmaddmdp 3, 2, 1

+; CHECX-DAG: xsmaddmdp 4, 2, 1

+; CHECX-DAG: xsmaddadp 1, 2, 5

+; CHECX-DAG: stxsdx 3, 0, 8

+; CHECX-DAG: stxsdx 4, 8, [[C1]]

+; CHECX-DAG: stxsdx 1, 8, [[C2]]

; CHECK: blr

; CHECK-FISL-LABEL: @test2

@@ -213,14 +214,15 @@ entry:

ret void

; CHECK-LABEL: @testv2

-; CHECK-DAG: xvmaddmdp 36, 35, 34

-; CHECK-DAG: xvmaddmdp 37, 35, 34

-; CHECK-DAG: li [[C1:[0-9]+]], 16

-; CHECK-DAG: li [[C2:[0-9]+]], 32

-; CHECK-DAG: xvmaddadp 34, 35, 38

-; CHECK-DAG: stxvd2x 36, 0, 3

-; CHECK-DAG: stxvd2x 37, 3, [[C1:[0-9]+]]

-; CHECK-DAG: stxvd2x 34, 3, [[C2:[0-9]+]]

+; FIXME: We currently don't get this because of copy ordering on the MI level.

+; CHECX-DAG: xvmaddmdp 36, 35, 34

+; CHECX-DAG: xvmaddmdp 37, 35, 34

+; CHECX-DAG: li [[C1:[0-9]+]], 16

+; CHECX-DAG: li [[C2:[0-9]+]], 32

+; CHECX-DAG: xvmaddadp 34, 35, 38

+; CHECX-DAG: stxvd2x 36, 0, 3

+; CHECX-DAG: stxvd2x 37, 3, [[C1:[0-9]+]]

+; CHECX-DAG: stxvd2x 34, 3, [[C2:[0-9]+]]

; CHECK: blr

; CHECK-FISL-LABEL: @testv2

diff --git a/test/CodeGen/PowerPC/vsx-fma-sp.ll b/test/CodeGen/PowerPC/vsx-fma-sp.ll
index 1c3e457f92cb..b4dd2e1627c4 100644
--- a/test/CodeGen/PowerPC/vsx-fma-sp.ll
+++ b/test/CodeGen/PowerPC/vsx-fma-sp.ll

@@ -42,12 +42,13 @@ entry:

; CHECK-LABEL: @test2sp

; CHECK-DAG: li [[C1:[0-9]+]], 4

; CHECK-DAG: li [[C2:[0-9]+]], 8

-; CHECK-DAG: xsmaddmsp 3, 2, 1

-; CHECK-DAG: xsmaddmsp 4, 2, 1

-; CHECK-DAG: xsmaddasp 1, 2, 5

-; CHECK-DAG: stxsspx 3, 0, 8

-; CHECK-DAG: stxsspx 4, 8, [[C1]]

-; CHECK-DAG: stxsspx 1, 8, [[C2]]

+; FIXME: We now miss this because of copy ordering at the MI level.

+; CHECX-DAG: xsmaddmsp 3, 2, 1

+; CHECX-DAG: xsmaddmsp 4, 2, 1

+; CHECX-DAG: xsmaddasp 1, 2, 5

+; CHECX-DAG: stxsspx 3, 0, 8

+; CHECX-DAG: stxsspx 4, 8, [[C1]]

+; CHECX-DAG: stxsspx 1, 8, [[C2]]

; CHECK: blr

; CHECK-FISL-LABEL: @test2sp