; 2016-05-12 09:58:58 +08:00
; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -amdgpu-promote-alloca < %s | FileCheck %s
; CHECK-LABEL: @lds_promoted_alloca_select_invalid_pointer_operand(
; CHECK: %alloca = alloca i32
; CHECK: select i1 undef, i32* undef, i32* %alloca
; One select operand is an undef pointer rather than something derived from
; the alloca. The expectations above require the alloca and the select to be
; left in their original, unpromoted form.
define void @lds_promoted_alloca_select_invalid_pointer_operand() #0 {
  %alloca = alloca i32, align 4
  %select = select i1 undef, i32* undef, i32* %alloca
  store i32 0, i32* %select, align 4
  ret void
}
; CHECK-LABEL: @lds_promote_alloca_select_two_derived_pointers(
; CHECK: [[ARRAYGEP:%[0-9]+]] = getelementptr inbounds [256 x [16 x i32]], [256 x [16 x i32]] addrspace(3)* @lds_promote_alloca_select_two_derived_pointers.alloca, i32 0, i32 %{{[0-9]+}}
; CHECK: %ptr0 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* [[ARRAYGEP]], i32 0, i32 %a
; CHECK: %ptr1 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* [[ARRAYGEP]], i32 0, i32 %b
; CHECK: %select = select i1 undef, i32 addrspace(3)* %ptr0, i32 addrspace(3)* %ptr1
; CHECK: store i32 0, i32 addrspace(3)* %select, align 4
; Both select operands are GEPs into the same alloca, indexed by the function
; arguments. The expectations above require the GEPs, the select and the store
; to be rewritten to addrspace(3) pointers into a per-function LDS array.
define void @lds_promote_alloca_select_two_derived_pointers(i32 %a, i32 %b) #0 {
  %alloca = alloca [16 x i32], align 4
  %ptr0 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %a
  %ptr1 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %b
  %select = select i1 undef, i32* %ptr0, i32* %ptr1
  store i32 0, i32* %select, align 4
  ret void
}
; FIXME: This should be promotable but requires knowing that both will be promoted first.
; CHECK-LABEL: @lds_promote_alloca_select_two_allocas(
; CHECK: %alloca0 = alloca i32, i32 16, align 4
; CHECK: %alloca1 = alloca i32, i32 16, align 4
; CHECK: %ptr0 = getelementptr inbounds i32, i32* %alloca0, i32 %a
; CHECK: %ptr1 = getelementptr inbounds i32, i32* %alloca1, i32 %b
; CHECK: %select = select i1 undef, i32* %ptr0, i32* %ptr1
; The select operands are derived from two different allocas. As the FIXME
; above records, this is not promoted yet; the expectations require both
; allocas, both GEPs and the select to stay unchanged.
define void @lds_promote_alloca_select_two_allocas(i32 %a, i32 %b) #0 {
  %alloca0 = alloca i32, i32 16, align 4
  %alloca1 = alloca i32, i32 16, align 4
  %ptr0 = getelementptr inbounds i32, i32* %alloca0, i32 %a
  %ptr1 = getelementptr inbounds i32, i32* %alloca1, i32 %b
  %select = select i1 undef, i32* %ptr0, i32* %ptr1
  store i32 0, i32* %select, align 4
  ret void
}
; TODO: Maybe this should be canonicalized to select on the constant and GEP after.
; CHECK-LABEL: @lds_promote_alloca_select_two_derived_constant_pointers(
; CHECK: [[ARRAYGEP:%[0-9]+]] = getelementptr inbounds [256 x [16 x i32]], [256 x [16 x i32]] addrspace(3)* @lds_promote_alloca_select_two_derived_constant_pointers.alloca, i32 0, i32 %{{[0-9]+}}
; CHECK: %ptr0 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* [[ARRAYGEP]], i32 0, i32 1
; CHECK: %ptr1 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* [[ARRAYGEP]], i32 0, i32 3
; CHECK: %select = select i1 undef, i32 addrspace(3)* %ptr0, i32 addrspace(3)* %ptr1
; CHECK: store i32 0, i32 addrspace(3)* %select, align 4
; Same shape as the two-derived-pointers case, but the GEP indices are the
; constants 1 and 3 instead of function arguments. The expectations above
; require the GEPs, select and store to be rewritten to addrspace(3).
define void @lds_promote_alloca_select_two_derived_constant_pointers() #0 {
  %alloca = alloca [16 x i32], align 4
  %ptr0 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 1
  %ptr1 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 3
  %select = select i1 undef, i32* %ptr0, i32* %ptr1
  store i32 0, i32* %select, align 4
  ret void
}
; CHECK-LABEL: @lds_promoted_alloca_select_input_select(
; CHECK: getelementptr inbounds [256 x [16 x i32]], [256 x [16 x i32]] addrspace(3)* @lds_promoted_alloca_select_input_select.alloca, i32 0, i32 %{{[0-9]+}}
; CHECK: %ptr0 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* %{{[0-9]+}}, i32 0, i32 %a
; CHECK: %ptr1 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* %{{[0-9]+}}, i32 0, i32 %b
; CHECK: %ptr2 = getelementptr inbounds [16 x i32], [16 x i32] addrspace(3)* %{{[0-9]+}}, i32 0, i32 %c
; CHECK: %select0 = select i1 undef, i32 addrspace(3)* %ptr0, i32 addrspace(3)* %ptr1
; CHECK: %select1 = select i1 undef, i32 addrspace(3)* %select0, i32 addrspace(3)* %ptr2
; CHECK: store i32 0, i32 addrspace(3)* %select1, align 4
; A select whose first operand is itself a select: %select0 chooses between
; two GEPs of the alloca, and %select1 chooses between %select0 and a third
; GEP. The expectations above require the whole chain to become addrspace(3).
define void @lds_promoted_alloca_select_input_select(i32 %a, i32 %b, i32 %c) #0 {
  %alloca = alloca [16 x i32], align 4
  %ptr0 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %a
  %ptr1 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %b
  %ptr2 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %c
  %select0 = select i1 undef, i32* %ptr0, i32* %ptr1
  %select1 = select i1 undef, i32* %select0, i32* %ptr2
  store i32 0, i32* %select1, align 4
  ret void
}
; A pointer phi merges a GEP of the alloca (from %entry) with a select that
; has an undef operand (from %bb1); the phi result then feeds a second select.
; No expectations on the function body are attached, so this case appears to
; serve only as a does-not-crash test for the pass.
; The label below starts a new FileCheck region, so the pattern lines of the
; preceding function cannot match inside this function's output.
; CHECK-LABEL: @lds_promoted_alloca_select_input_phi(
define void @lds_promoted_alloca_select_input_phi(i32 %a, i32 %b, i32 %c) #0 {
entry:
  %alloca = alloca [16 x i32], align 4
  %ptr0 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %a
  %ptr1 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %b
  store i32 0, i32* %ptr0
  br i1 undef, label %bb1, label %bb2

bb1:
  %ptr2 = getelementptr inbounds [16 x i32], [16 x i32]* %alloca, i32 0, i32 %c
  %select0 = select i1 undef, i32* undef, i32* %ptr2
  store i32 0, i32* %ptr1
  br label %bb2

bb2:
  %phi.ptr = phi i32* [ %ptr0, %entry ], [ %select0, %bb1 ]
  %select1 = select i1 undef, i32* %phi.ptr, i32* %ptr1
  store i32 0, i32* %select1, align 4
  ret void
}
; 2016-05-18 23:57:21 +08:00
; CHECK-LABEL: @select_null_rhs(
; CHECK-NOT: alloca
; CHECK: select i1 %tmp2, double addrspace(3)* %{{[0-9]+}}, double addrspace(3)* null
; The select chooses between the alloca (true side) and a null pointer
; (false side). The expectations above require the alloca to disappear and
; the select to operate on addrspace(3) pointers, with null kept on the
; right-hand side.
define void @select_null_rhs(double addrspace(1)* nocapture %arg, i32 %arg1) #1 {
bb:
  %tmp = alloca double, align 8
  store double 0.000000e+00, double* %tmp, align 8
  %tmp2 = icmp eq i32 %arg1, 0
  %tmp3 = select i1 %tmp2, double* %tmp, double* null
  store double 1.000000e+00, double* %tmp3, align 8
  %tmp4 = load double, double* %tmp, align 8
  store double %tmp4, double addrspace(1)* %arg
  ret void
}
; CHECK-LABEL: @select_null_lhs(
; CHECK-NOT: alloca
; CHECK: select i1 %tmp2, double addrspace(3)* null, double addrspace(3)* %{{[0-9]+}}
; Mirror image of the null-on-the-right case: the null pointer is the true
; operand of the select and the alloca is the false operand. The expectations
; above require the alloca to disappear and the select to use addrspace(3)
; pointers, with null kept on the left-hand side.
define void @select_null_lhs(double addrspace(1)* nocapture %arg, i32 %arg1) #1 {
bb:
  %tmp = alloca double, align 8
  store double 0.000000e+00, double* %tmp, align 8
  %tmp2 = icmp eq i32 %arg1, 0
  %tmp3 = select i1 %tmp2, double* null, double* %tmp
  store double 1.000000e+00, double* %tmp3, align 8
  %tmp4 = load double, double* %tmp, align 8
  store double %tmp4, double addrspace(1)* %arg
  ret void
}
; 2016-05-17 05:19:59 +08:00
; Attribute group used by the lds_promote* functions in this file.
; NOTE(review): the one-wave-per-EU limit presumably enlarges the LDS budget
; available for promotion - confirm against the pass.
attributes #0 = { norecurse nounwind "amdgpu-max-waves-per-eu"="1" }
; 2016-05-18 23:57:21 +08:00
; Attribute group used by the select_null_* functions; unlike #0 it sets no
; waves-per-EU limit.
attributes #1 = { norecurse nounwind }