summaryrefslogtreecommitdiff
path: root/test/CodeGen/AMDGPU/convergent-inlineasm.ll
diff options
context:
space:
mode:
Diffstat (limited to 'test/CodeGen/AMDGPU/convergent-inlineasm.ll')
-rw-r--r--test/CodeGen/AMDGPU/convergent-inlineasm.ll45
1 files changed, 45 insertions, 0 deletions
diff --git a/test/CodeGen/AMDGPU/convergent-inlineasm.ll b/test/CodeGen/AMDGPU/convergent-inlineasm.ll
new file mode 100644
index 0000000000000..55a38e576ad10
--- /dev/null
+++ b/test/CodeGen/AMDGPU/convergent-inlineasm.ll
@@ -0,0 +1,45 @@
+; RUN: llc -mtriple=amdgcn--amdhsa -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
+
+declare i32 @llvm.amdgcn.workitem.id.x() #0
+; GCN-LABEL: {{^}}convergent_inlineasm:
+; GCN: BB#0:
+; GCN: v_cmp_ne_i32_e64
+; GCN: BB#1:
+define void @convergent_inlineasm(i64 addrspace(1)* nocapture %arg) {
+bb:
+ %tmp = call i32 @llvm.amdgcn.workitem.id.x()
+ %tmp1 = tail call i64 asm "v_cmp_ne_i32_e64 $0, 0, $1", "=s,v"(i32 1) #1
+ %tmp2 = icmp eq i32 %tmp, 8
+ br i1 %tmp2, label %bb3, label %bb5
+
+bb3: ; preds = %bb
+ %tmp4 = getelementptr i64, i64 addrspace(1)* %arg, i32 %tmp
+ store i64 %tmp1, i64 addrspace(1)* %arg, align 8
+ br label %bb5
+
+bb5: ; preds = %bb3, %bb
+ ret void
+}
+
+; GCN-LABEL: {{^}}nonconvergent_inlineasm:
+; GCN: BB#1:
+; GCN: v_cmp_ne_i32_e64
+; GCN: BB1_2:
+define void @nonconvergent_inlineasm(i64 addrspace(1)* nocapture %arg) {
+bb:
+ %tmp = call i32 @llvm.amdgcn.workitem.id.x()
+ %tmp1 = tail call i64 asm "v_cmp_ne_i32_e64 $0, 0, $1", "=s,v"(i32 1)
+ %tmp2 = icmp eq i32 %tmp, 8
+ br i1 %tmp2, label %bb3, label %bb5
+
+bb3: ; preds = %bb
+ %tmp4 = getelementptr i64, i64 addrspace(1)* %arg, i32 %tmp
+ store i64 %tmp1, i64 addrspace(1)* %arg, align 8
+ br label %bb5
+
+bb5: ; preds = %bb3, %bb
+ ret void
+}
+
+attributes #0 = { nounwind readnone }
+attributes #1 = { convergent nounwind readnone }