2011-01-10 10:53:54 +08:00
; RUN: opt < %s -instcombine -S | FileCheck %s
2014-04-24 08:58:18 +08:00
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
2006-10-05 14:51:54 +08:00
2007-04-15 06:27:33 +08:00
define i16 @test1 ( float %f ) {
2006-10-05 14:51:54 +08:00
entry:
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @test1(
2011-01-10 10:53:54 +08:00
; CHECK: fmul float
; CHECK-NOT: insertelement {{.*}} 0.00
; CHECK-NOT: call {{.*}} @llvm.x86.sse.mul
; CHECK-NOT: call {{.*}} @llvm.x86.sse.sub
; CHECK: ret
2007-04-15 06:27:33 +08:00
%tmp = insertelement < 4 x float > undef , float %f , i32 0 ; <<4 x float>> [#uses=1]
%tmp10 = insertelement < 4 x float > %tmp , float 0.000000e+00 , i32 1 ; <<4 x float>> [#uses=1]
%tmp11 = insertelement < 4 x float > %tmp10 , float 0.000000e+00 , i32 2 ; <<4 x float>> [#uses=1]
%tmp12 = insertelement < 4 x float > %tmp11 , float 0.000000e+00 , i32 3 ; <<4 x float>> [#uses=1]
%tmp28 = tail call < 4 x float > @llvm.x86.sse.sub.ss ( < 4 x float > %tmp12 , < 4 x float > < float 1.000000e+00 , float 0.000000e+00 , float 0.000000e+00 , float 0.000000e+00 > ) ; <<4 x float>> [#uses=1]
%tmp37 = tail call < 4 x float > @llvm.x86.sse.mul.ss ( < 4 x float > %tmp28 , < 4 x float > < float 5.000000e-01 , float 0.000000e+00 , float 0.000000e+00 , float 0.000000e+00 > ) ; <<4 x float>> [#uses=1]
%tmp48 = tail call < 4 x float > @llvm.x86.sse.min.ss ( < 4 x float > %tmp37 , < 4 x float > < float 6.553500e+04 , float 0.000000e+00 , float 0.000000e+00 , float 0.000000e+00 > ) ; <<4 x float>> [#uses=1]
%tmp59 = tail call < 4 x float > @llvm.x86.sse.max.ss ( < 4 x float > %tmp48 , < 4 x float > zeroinitializer ) ; <<4 x float>> [#uses=1]
%tmp.upgrd.1 = tail call i32 @llvm.x86.sse.cvttss2si ( < 4 x float > %tmp59 ) ; <i32> [#uses=1]
%tmp69 = trunc i32 %tmp.upgrd.1 to i16 ; <i16> [#uses=1]
ret i16 %tmp69
2006-10-05 14:51:54 +08:00
}
2007-04-15 06:27:33 +08:00
define i32 @test2 ( float %f ) {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @test2(
2011-01-10 10:53:54 +08:00
; CHECK-NOT: insertelement
; CHECK-NOT: extractelement
; CHECK: ret
%tmp5 = fmul float %f , %f
%tmp9 = insertelement < 4 x float > undef , float %tmp5 , i32 0
%tmp10 = insertelement < 4 x float > %tmp9 , float 0.000000e+00 , i32 1
%tmp11 = insertelement < 4 x float > %tmp10 , float 0.000000e+00 , i32 2
%tmp12 = insertelement < 4 x float > %tmp11 , float 0.000000e+00 , i32 3
%tmp19 = bitcast < 4 x float > %tmp12 to < 4 x i32 >
%tmp21 = extractelement < 4 x i32 > %tmp19 , i32 0
ret i32 %tmp21
2007-04-15 06:27:33 +08:00
}
2011-01-10 15:19:37 +08:00
define i64 @test3 ( float %f , double %d ) {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @test3(
2011-01-10 15:19:37 +08:00
; CHECK-NOT: insertelement {{.*}} 0.00
; CHECK: ret
entry:
%v00 = insertelement < 4 x float > undef , float %f , i32 0
%v01 = insertelement < 4 x float > %v00 , float 0.000000e+00 , i32 1
%v02 = insertelement < 4 x float > %v01 , float 0.000000e+00 , i32 2
%v03 = insertelement < 4 x float > %v02 , float 0.000000e+00 , i32 3
%tmp0 = tail call i32 @llvm.x86.sse.cvtss2si ( < 4 x float > %v03 )
%v10 = insertelement < 4 x float > undef , float %f , i32 0
%v11 = insertelement < 4 x float > %v10 , float 0.000000e+00 , i32 1
%v12 = insertelement < 4 x float > %v11 , float 0.000000e+00 , i32 2
%v13 = insertelement < 4 x float > %v12 , float 0.000000e+00 , i32 3
%tmp1 = tail call i64 @llvm.x86.sse.cvtss2si64 ( < 4 x float > %v13 )
%v20 = insertelement < 4 x float > undef , float %f , i32 0
%v21 = insertelement < 4 x float > %v20 , float 0.000000e+00 , i32 1
%v22 = insertelement < 4 x float > %v21 , float 0.000000e+00 , i32 2
%v23 = insertelement < 4 x float > %v22 , float 0.000000e+00 , i32 3
%tmp2 = tail call i32 @llvm.x86.sse.cvttss2si ( < 4 x float > %v23 )
%v30 = insertelement < 4 x float > undef , float %f , i32 0
%v31 = insertelement < 4 x float > %v30 , float 0.000000e+00 , i32 1
%v32 = insertelement < 4 x float > %v31 , float 0.000000e+00 , i32 2
%v33 = insertelement < 4 x float > %v32 , float 0.000000e+00 , i32 3
%tmp3 = tail call i64 @llvm.x86.sse.cvttss2si64 ( < 4 x float > %v33 )
%v40 = insertelement < 2 x double > undef , double %d , i32 0
%v41 = insertelement < 2 x double > %v40 , double 0.000000e+00 , i32 1
%tmp4 = tail call i32 @llvm.x86.sse2.cvtsd2si ( < 2 x double > %v41 )
%v50 = insertelement < 2 x double > undef , double %d , i32 0
%v51 = insertelement < 2 x double > %v50 , double 0.000000e+00 , i32 1
%tmp5 = tail call i64 @llvm.x86.sse2.cvtsd2si64 ( < 2 x double > %v51 )
%v60 = insertelement < 2 x double > undef , double %d , i32 0
%v61 = insertelement < 2 x double > %v60 , double 0.000000e+00 , i32 1
%tmp6 = tail call i32 @llvm.x86.sse2.cvttsd2si ( < 2 x double > %v61 )
%v70 = insertelement < 2 x double > undef , double %d , i32 0
%v71 = insertelement < 2 x double > %v70 , double 0.000000e+00 , i32 1
%tmp7 = tail call i64 @llvm.x86.sse2.cvttsd2si64 ( < 2 x double > %v71 )
%tmp8 = add i32 %tmp0 , %tmp2
%tmp9 = add i32 %tmp4 , %tmp6
%tmp10 = add i32 %tmp8 , %tmp9
%tmp11 = sext i32 %tmp10 to i64
%tmp12 = add i64 %tmp1 , %tmp3
%tmp13 = add i64 %tmp5 , %tmp7
%tmp14 = add i64 %tmp12 , %tmp13
%tmp15 = add i64 %tmp11 , %tmp14
ret i64 %tmp15
}
2011-01-10 10:53:58 +08:00
define void @get_image ( ) nounwind {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @get_image(
2011-01-10 10:53:58 +08:00
; CHECK-NOT: extractelement
; CHECK: unreachable
entry:
%0 = call i32 @fgetc ( i8 * null ) nounwind ; <i32> [#uses=1]
%1 = trunc i32 %0 to i8 ; <i8> [#uses=1]
%tmp2 = insertelement < 100 x i8 > zeroinitializer , i8 %1 , i32 1 ; <<100 x i8>> [#uses=1]
%tmp1 = extractelement < 100 x i8 > %tmp2 , i32 0 ; <i8> [#uses=1]
%2 = icmp eq i8 %tmp1 , 80 ; <i1> [#uses=1]
br i1 %2 , label %bb2 , label %bb3
bb2: ; preds = %entry
br label %bb3
bb3: ; preds = %bb2, %entry
unreachable
}
; PR4340
define void @vac ( < 4 x float > * nocapture %a ) nounwind {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @vac(
2011-01-10 10:53:58 +08:00
; CHECK-NOT: load
; CHECK: ret
entry:
2015-02-28 05:17:42 +08:00
%tmp1 = load < 4 x float > , < 4 x float > * %a ; <<4 x float>> [#uses=1]
2011-01-10 10:53:58 +08:00
%vecins = insertelement < 4 x float > %tmp1 , float 0.000000e+00 , i32 0 ; <<4 x float>> [#uses=1]
%vecins4 = insertelement < 4 x float > %vecins , float 0.000000e+00 , i32 1 ; <<4 x float>> [#uses=1]
%vecins6 = insertelement < 4 x float > %vecins4 , float 0.000000e+00 , i32 2 ; <<4 x float>> [#uses=1]
%vecins8 = insertelement < 4 x float > %vecins6 , float 0.000000e+00 , i32 3 ; <<4 x float>> [#uses=1]
store < 4 x float > %vecins8 , < 4 x float > * %a
ret void
}
declare i32 @fgetc ( i8 * )
2007-04-15 06:27:33 +08:00
declare < 4 x float > @llvm.x86.sse.sub.ss ( < 4 x float > , < 4 x float > )
2006-10-05 14:51:54 +08:00
2007-04-15 06:27:33 +08:00
declare < 4 x float > @llvm.x86.sse.mul.ss ( < 4 x float > , < 4 x float > )
2006-10-05 14:51:54 +08:00
2007-04-15 06:27:33 +08:00
declare < 4 x float > @llvm.x86.sse.min.ss ( < 4 x float > , < 4 x float > )
2006-10-05 14:51:54 +08:00
2007-04-15 06:27:33 +08:00
declare < 4 x float > @llvm.x86.sse.max.ss ( < 4 x float > , < 4 x float > )
2006-10-05 14:51:54 +08:00
2011-01-10 15:19:37 +08:00
declare i32 @llvm.x86.sse.cvtss2si ( < 4 x float > )
declare i64 @llvm.x86.sse.cvtss2si64 ( < 4 x float > )
2007-04-15 06:27:33 +08:00
declare i32 @llvm.x86.sse.cvttss2si ( < 4 x float > )
2011-01-10 15:19:37 +08:00
declare i64 @llvm.x86.sse.cvttss2si64 ( < 4 x float > )
declare i32 @llvm.x86.sse2.cvtsd2si ( < 2 x double > )
declare i64 @llvm.x86.sse2.cvtsd2si64 ( < 2 x double > )
declare i32 @llvm.x86.sse2.cvttsd2si ( < 2 x double > )
declare i64 @llvm.x86.sse2.cvttsd2si64 ( < 2 x double > )
2011-05-19 13:53:22 +08:00
2011-09-15 09:14:29 +08:00
define < 4 x float > @dead_shuffle_elt ( < 4 x float > %x , < 2 x float > %y ) nounwind {
entry:
2013-07-14 09:50:49 +08:00
; CHECK-LABEL: define <4 x float> @dead_shuffle_elt(
2011-09-15 09:14:29 +08:00
; CHECK: shufflevector <2 x float> %y, <2 x float> undef, <4 x i32> <i32 0, i32 1, i32 undef, i32 undef>
%shuffle.i = shufflevector < 2 x float > %y , < 2 x float > %y , < 4 x i32 > < i32 0 , i32 1 , i32 0 , i32 1 >
%shuffle9.i = shufflevector < 4 x float > %x , < 4 x float > %shuffle.i , < 4 x i32 > < i32 4 , i32 5 , i32 2 , i32 3 >
ret < 4 x float > %shuffle9.i
}
2012-07-27 06:37:04 +08:00
define < 2 x float > @test_fptrunc ( double %f ) {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @test_fptrunc(
2012-07-27 06:37:04 +08:00
; CHECK: insertelement
; CHECK: insertelement
; CHECK-NOT: insertelement
%tmp9 = insertelement < 4 x double > undef , double %f , i32 0
%tmp10 = insertelement < 4 x double > %tmp9 , double 0.000000e+00 , i32 1
%tmp11 = insertelement < 4 x double > %tmp10 , double 0.000000e+00 , i32 2
%tmp12 = insertelement < 4 x double > %tmp11 , double 0.000000e+00 , i32 3
%tmp5 = fptrunc < 4 x double > %tmp12 to < 4 x float >
%ret = shufflevector < 4 x float > %tmp5 , < 4 x float > undef , < 2 x i32 > < i32 0 , i32 1 >
ret < 2 x float > %ret
}
define < 2 x double > @test_fpext ( float %f ) {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @test_fpext(
2012-07-27 06:37:04 +08:00
; CHECK: insertelement
; CHECK: insertelement
; CHECK-NOT: insertelement
%tmp9 = insertelement < 4 x float > undef , float %f , i32 0
%tmp10 = insertelement < 4 x float > %tmp9 , float 0.000000e+00 , i32 1
%tmp11 = insertelement < 4 x float > %tmp10 , float 0.000000e+00 , i32 2
%tmp12 = insertelement < 4 x float > %tmp11 , float 0.000000e+00 , i32 3
%tmp5 = fpext < 4 x float > %tmp12 to < 4 x double >
%ret = shufflevector < 4 x double > %tmp5 , < 4 x double > undef , < 2 x i32 > < i32 0 , i32 1 >
ret < 2 x double > %ret
}
2012-07-27 07:10:24 +08:00
define < 4 x float > @test_select ( float %f , float %g ) {
2013-07-14 09:42:54 +08:00
; CHECK-LABEL: @test_select(
2012-07-27 07:10:24 +08:00
; CHECK: %a0 = insertelement <4 x float> undef, float %f, i32 0
; CHECK-NOT: insertelement
; CHECK: %a3 = insertelement <4 x float> %a0, float 3.000000e+00, i32 3
; CHECK-NOT: insertelement
2013-05-06 10:39:09 +08:00
; CHECK: %ret = select <4 x i1> <i1 true, i1 false, i1 false, i1 true>, <4 x float> %a3, <4 x float> <float undef, float 4.000000e+00, float 5.000000e+00, float undef>
2012-07-27 07:10:24 +08:00
%a0 = insertelement < 4 x float > undef , float %f , i32 0
%a1 = insertelement < 4 x float > %a0 , float 1.000000e+00 , i32 1
%a2 = insertelement < 4 x float > %a1 , float 2.000000e+00 , i32 2
%a3 = insertelement < 4 x float > %a2 , float 3.000000e+00 , i32 3
%b0 = insertelement < 4 x float > undef , float %g , i32 0
%b1 = insertelement < 4 x float > %b0 , float 4.000000e+00 , i32 1
%b2 = insertelement < 4 x float > %b1 , float 5.000000e+00 , i32 2
%b3 = insertelement < 4 x float > %b2 , float 6.000000e+00 , i32 3
%ret = select < 4 x i1 > < i1 true , i1 false , i1 false , i1 true > , < 4 x float > %a3 , < 4 x float > %b3
ret < 4 x float > %ret
}
2014-04-22 06:06:04 +08:00
declare < 4 x float > @llvm.x86.avx.vpermilvar.ps ( < 4 x float > , < 4 x i32 > )
define < 4 x float > @test_vpermilvar_ps ( < 4 x float > %v ) {
; CHECK-LABEL: @test_vpermilvar_ps(
; CHECK: shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
%a = tail call < 4 x float > @llvm.x86.avx.vpermilvar.ps ( < 4 x float > %v , < 4 x i32 > < i32 3 , i32 2 , i32 1 , i32 0 > )
ret < 4 x float > %a
}
declare < 8 x float > @llvm.x86.avx.vpermilvar.ps.256 ( < 8 x float > , < 8 x i32 > )
define < 8 x float > @test_vpermilvar_ps_256 ( < 8 x float > %v ) {
; CHECK-LABEL: @test_vpermilvar_ps_256(
2014-04-30 04:41:54 +08:00
; CHECK: shufflevector <8 x float> %v, <8 x float> undef, <8 x i32> <i32 3, i32 2, i32 1, i32 0, i32 7, i32 6, i32 5, i32 4>
2014-04-22 06:06:04 +08:00
%a = tail call < 8 x float > @llvm.x86.avx.vpermilvar.ps.256 ( < 8 x float > %v , < 8 x i32 > < i32 7 , i32 6 , i32 5 , i32 4 , i32 3 , i32 2 , i32 1 , i32 0 > )
ret < 8 x float > %a
}
2011-09-15 09:14:29 +08:00
2015-03-28 06:04:28 +08:00
declare < 2 x double > @llvm.x86.avx.vpermilvar.pd ( < 2 x double > , < 2 x i64 > )
2014-04-22 06:06:04 +08:00
define < 2 x double > @test_vpermilvar_pd ( < 2 x double > %v ) {
; CHECK-LABEL: @test_vpermilvar_pd(
; CHECK: shufflevector <2 x double> %v, <2 x double> undef, <2 x i32> <i32 1, i32 0>
2015-03-28 06:04:28 +08:00
%a = tail call < 2 x double > @llvm.x86.avx.vpermilvar.pd ( < 2 x double > %v , < 2 x i64 > < i64 2 , i64 0 > )
2014-04-22 06:06:04 +08:00
ret < 2 x double > %a
}
2015-03-28 06:04:28 +08:00
declare < 4 x double > @llvm.x86.avx.vpermilvar.pd.256 ( < 4 x double > , < 4 x i64 > )
2014-04-22 06:06:04 +08:00
define < 4 x double > @test_vpermilvar_pd_256 ( < 4 x double > %v ) {
; CHECK-LABEL: @test_vpermilvar_pd_256(
2014-04-30 04:41:54 +08:00
; CHECK: shufflevector <4 x double> %v, <4 x double> undef, <4 x i32> <i32 1, i32 0, i32 3, i32 2>
2015-03-28 06:04:28 +08:00
%a = tail call < 4 x double > @llvm.x86.avx.vpermilvar.pd.256 ( < 4 x double > %v , < 4 x i64 > < i64 3 , i64 1 , i64 2 , i64 0 > )
2014-04-22 06:06:04 +08:00
ret < 4 x double > %a
}
2014-04-24 08:58:18 +08:00
2014-04-30 06:20:40 +08:00
define < 4 x float > @test_vpermilvar_ps_zero ( < 4 x float > %v ) {
; CHECK-LABEL: @test_vpermilvar_ps_zero(
; CHECK: shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> zeroinitializer
%a = tail call < 4 x float > @llvm.x86.avx.vpermilvar.ps ( < 4 x float > %v , < 4 x i32 > zeroinitializer )
ret < 4 x float > %a
}
define < 8 x float > @test_vpermilvar_ps_256_zero ( < 8 x float > %v ) {
; CHECK-LABEL: @test_vpermilvar_ps_256_zero(
; CHECK: shufflevector <8 x float> %v, <8 x float> undef, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 4, i32 4, i32 4, i32 4>
%a = tail call < 8 x float > @llvm.x86.avx.vpermilvar.ps.256 ( < 8 x float > %v , < 8 x i32 > zeroinitializer )
ret < 8 x float > %a
}
define < 2 x double > @test_vpermilvar_pd_zero ( < 2 x double > %v ) {
; CHECK-LABEL: @test_vpermilvar_pd_zero(
; CHECK: shufflevector <2 x double> %v, <2 x double> undef, <2 x i32> zeroinitializer
2015-03-28 06:04:28 +08:00
%a = tail call < 2 x double > @llvm.x86.avx.vpermilvar.pd ( < 2 x double > %v , < 2 x i64 > zeroinitializer )
2014-04-30 06:20:40 +08:00
ret < 2 x double > %a
}
define < 4 x double > @test_vpermilvar_pd_256_zero ( < 4 x double > %v ) {
; CHECK-LABEL: @test_vpermilvar_pd_256_zero(
; CHECK: shufflevector <4 x double> %v, <4 x double> undef, <4 x i32> <i32 0, i32 0, i32 2, i32 2>
2015-03-28 06:04:28 +08:00
%a = tail call < 4 x double > @llvm.x86.avx.vpermilvar.pd.256 ( < 4 x double > %v , < 4 x i64 > zeroinitializer )
2014-04-30 06:20:40 +08:00
ret < 4 x double > %a
}
2015-10-06 18:34:53 +08:00
define < 2 x i64 > @PR24922 ( < 2 x i64 > %v ) {
; CHECK-LABEL: @PR24922
; CHECK: select <2 x i1>
;
; Check that instcombine doesn't wrongly fold the select statement into a
; ret <2 x i64> %v
;
; FIXME: We should be able to simplify the ConstantExpr in the select mask.
entry:
%result = select < 2 x i1 > < i1 icmp eq ( i64 extractelement ( < 2 x i64 > bitcast ( < 4 x i32 > < i32 15 , i32 15 , i32 15 , i32 15 > to < 2 x i64 > ) , i64 0 ) , i64 0 ) , i1 true > , < 2 x i64 > %v , < 2 x i64 > zeroinitializer
ret < 2 x i64 > %result
}