forked from OSchip/llvm-project
47 lines
1.7 KiB
LLVM
47 lines
1.7 KiB
LLVM
; RUN: opt -mtriple amdgcn-unknown-amdhsa -enable-new-pm=0 -analyze -divergence -use-gpu-divergence-analysis %s | FileCheck %s
|
|
; RUN: opt -mtriple amdgcn-unknown-amdhsa -passes='print<divergence>' -disable-output %s 2>&1 | FileCheck %s
|
|
|
|
declare i32 @llvm.amdgcn.workitem.id.x() #0
|
|
declare i32 @llvm.amdgcn.workitem.id.y() #0
|
|
declare i32 @llvm.amdgcn.workitem.id.z() #0
|
|
declare i32 @llvm.amdgcn.mbcnt.lo(i32, i32) #0
|
|
declare i32 @llvm.amdgcn.mbcnt.hi(i32, i32) #0
|
|
|
|
; CHECK: DIVERGENT: %id.x = call i32 @llvm.amdgcn.workitem.id.x()
|
|
define amdgpu_kernel void @workitem_id_x() #1 {
|
|
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
|
|
store volatile i32 %id.x, i32 addrspace(1)* undef
|
|
ret void
|
|
}
|
|
|
|
; CHECK: DIVERGENT: %id.y = call i32 @llvm.amdgcn.workitem.id.y()
|
|
define amdgpu_kernel void @workitem_id_y() #1 {
|
|
%id.y = call i32 @llvm.amdgcn.workitem.id.y()
|
|
store volatile i32 %id.y, i32 addrspace(1)* undef
|
|
ret void
|
|
}
|
|
|
|
; CHECK: DIVERGENT: %id.z = call i32 @llvm.amdgcn.workitem.id.z()
|
|
define amdgpu_kernel void @workitem_id_z() #1 {
|
|
%id.z = call i32 @llvm.amdgcn.workitem.id.z()
|
|
store volatile i32 %id.z, i32 addrspace(1)* undef
|
|
ret void
|
|
}
|
|
|
|
; CHECK: DIVERGENT: %mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 0, i32 0)
|
|
define amdgpu_kernel void @mbcnt_lo() #1 {
|
|
%mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 0, i32 0)
|
|
store volatile i32 %mbcnt.lo, i32 addrspace(1)* undef
|
|
ret void
|
|
}
|
|
|
|
; CHECK: DIVERGENT: %mbcnt.hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 0, i32 0)
|
|
define amdgpu_kernel void @mbcnt_hi() #1 {
|
|
%mbcnt.hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 0, i32 0)
|
|
store volatile i32 %mbcnt.hi, i32 addrspace(1)* undef
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { nounwind readnone }
|
|
attributes #1 = { nounwind }
|