; llvm-project/llvm/test/CodeGen/AMDGPU/convergent-inlineasm.ll

; Test driver line: compiles this file with llc for the amdgcn--amdhsa triple
; (machine verifier enabled) and pipes the output to FileCheck, which matches
; it against the directives placed above each function.
; RUN: llc -mtriple=amdgcn--amdhsa -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s

; Intrinsic called at the top of both test functions; its result is compared
; against 8 to form the branch condition.
declare i32 @llvm.amdgcn.workitem.id.x() #0
; Convergent case: the inline asm call site carries attribute group #1, which
; includes `convergent`. The directives below expect the v_cmp to be printed
; after the BB#0 marker and before the BB#1 marker, i.e. it is not moved into
; the conditionally executed block even though its only user (the store) is
; located there.
; GCN-LABEL: {{^}}convergent_inlineasm:
; GCN: BB#0:
; GCN: v_cmp_ne_i32_e64
; GCN: BB#1:
define void @convergent_inlineasm(i64 addrspace(1)* nocapture %arg) {
entry:
  %tid = call i32 @llvm.amdgcn.workitem.id.x()
  %asm.result = tail call i64 asm "v_cmp_ne_i32_e64 $0, 0, $1", "=s,v"(i32 1) #1
  %is.tid8 = icmp eq i32 %tid, 8
  br i1 %is.tid8, label %do.store, label %done

do.store:                                         ; preds = %entry
  ; NOTE(review): %slot is computed but never used; the store below writes
  ; through %arg directly. Kept as-is so the test input is unchanged.
  %slot = getelementptr i64, i64 addrspace(1)* %arg, i32 %tid
  store i64 %asm.result, i64 addrspace(1)* %arg, align 8
  br label %done

done:                                             ; preds = %do.store, %entry
  ret void
}

; Non-convergent case: same IR shape as the convergent function, but the
; inline asm call site has no attribute group attached. The directives below
; expect the v_cmp to be printed after the BB#1 marker and before the BB1_2
; label -- presumably because it has been sunk next to its only user, the
; store in the conditionally executed block.
; GCN-LABEL: {{^}}nonconvergent_inlineasm:
; GCN: BB#1:
; GCN: v_cmp_ne_i32_e64
; GCN: BB1_2:
define void @nonconvergent_inlineasm(i64 addrspace(1)* nocapture %arg) {
entry:
  %tid = call i32 @llvm.amdgcn.workitem.id.x()
  %asm.result = tail call i64 asm "v_cmp_ne_i32_e64 $0, 0, $1", "=s,v"(i32 1)
  %is.tid8 = icmp eq i32 %tid, 8
  br i1 %is.tid8, label %do.store, label %done

do.store:                                         ; preds = %entry
  ; NOTE(review): %slot is computed but never used; the store below writes
  ; through %arg directly. Kept as-is so the test input is unchanged.
  %slot = getelementptr i64, i64 addrspace(1)* %arg, i32 %tid
  store i64 %asm.result, i64 addrspace(1)* %arg, align 8
  br label %done

done:                                             ; preds = %do.store, %entry
  ret void
}

; #0 is attached to the declaration of the workitem-id intrinsic.
attributes #0 = { nounwind readnone }
; #1 is attached only to the inline asm call site in @convergent_inlineasm;
; the other function's asm call has no attribute group, so the `convergent`
; entry here is what distinguishes the two test cases.
attributes #1 = { convergent nounwind readnone }
AMDGPU: Add convergent flag to INLINEASM instruction. Differential Revision: http://reviews.llvm.org/D21214 (llvm-svn: 273455, 2016-06-23 02:51:08 +08:00)
			`; RUN: llc -mtriple=amdgcn--amdhsa -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s`

			`declare i32 @llvm.amdgcn.workitem.id.x() #0`
			`; GCN-LABEL: {{^}}convergent_inlineasm:`
			`; GCN: BB#0:`
			`; GCN: v_cmp_ne_i32_e64`
			`; GCN: BB#1:`
			`define void @convergent_inlineasm(i64 addrspace(1)* nocapture %arg) {`
			`bb:`
			`%tmp = call i32 @llvm.amdgcn.workitem.id.x()`
			`%tmp1 = tail call i64 asm "v_cmp_ne_i32_e64 $0, 0, $1", "=s,v"(i32 1) #1`
			`%tmp2 = icmp eq i32 %tmp, 8`
			`br i1 %tmp2, label %bb3, label %bb5`

			`bb3: ; preds = %bb`
			`%tmp4 = getelementptr i64, i64 addrspace(1)* %arg, i32 %tmp`
			`store i64 %tmp1, i64 addrspace(1)* %arg, align 8`
			`br label %bb5`

			`bb5: ; preds = %bb3, %bb`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}nonconvergent_inlineasm:`
			`; GCN: BB#1:`
			`; GCN: v_cmp_ne_i32_e64`
			`; GCN: BB1_2:`
			`define void @nonconvergent_inlineasm(i64 addrspace(1)* nocapture %arg) {`
			`bb:`
			`%tmp = call i32 @llvm.amdgcn.workitem.id.x()`
			`%tmp1 = tail call i64 asm "v_cmp_ne_i32_e64 $0, 0, $1", "=s,v"(i32 1)`
			`%tmp2 = icmp eq i32 %tmp, 8`
			`br i1 %tmp2, label %bb3, label %bb5`

			`bb3: ; preds = %bb`
			`%tmp4 = getelementptr i64, i64 addrspace(1)* %arg, i32 %tmp`
			`store i64 %tmp1, i64 addrspace(1)* %arg, align 8`
			`br label %bb5`

			`bb5: ; preds = %bb3, %bb`
			`ret void`
			`}`

			`attributes #0 = { nounwind readnone }`
			`attributes #1 = { convergent nounwind readnone }`