llvm-project/llvm/test/Transforms/SLPVectorizer/X86/PR34635.ll

99 lines
5.8 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -mtriple=x86_64-unknown-linux -slp-vectorizer -S -mcpu=corei7 | FileCheck %s
define i32 @main() {
; CHECK-LABEL: @main(
; CHECK-NEXT: bb:
; CHECK-NEXT: [[TMP:%.*]] = alloca <8 x i32>, align 32
; CHECK-NEXT: [[TMP1:%.*]] = bitcast <8 x i32>* [[TMP]] to [8 x i32]*
; CHECK-NEXT: [[TMP2:%.*]] = alloca i32, align 4
; CHECK-NEXT: [[TMP3:%.*]] = bitcast <8 x i32>* [[TMP]] to i8*
; CHECK-NEXT: [[TMP4:%.*]] = getelementptr inbounds <8 x i32>, <8 x i32>* [[TMP]], i64 0, i64 0
; CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 1
; CHECK-NEXT: [[TMP6:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 2
; CHECK-NEXT: [[TMP7:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 3
; CHECK-NEXT: [[TMP8:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 4
; CHECK-NEXT: [[TMP9:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 6
; CHECK-NEXT: [[TMP10:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 5
; CHECK-NEXT: [[TMP11:%.*]] = getelementptr inbounds [8 x i32], [8 x i32]* [[TMP1]], i64 0, i64 7
; CHECK-NEXT: store <8 x i32> <i32 -221320154, i32 -756426931, i32 563883532, i32 382683935, i32 144890241, i32 -1052877364, i32 -1052877364, i32 -1016007675>, <8 x i32>* [[TMP]], align 32
; CHECK-NEXT: [[TMP12:%.*]] = bitcast i32* [[TMP2]] to i8*
; CHECK-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP4]], align 32
; CHECK-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP5]], align 4
; CHECK-NEXT: [[TMP15:%.*]] = icmp slt i32 [[TMP14]], [[TMP13]]
; CHECK-NEXT: [[TMP16:%.*]] = select i1 [[TMP15]], i32 [[TMP14]], i32 [[TMP13]]
; CHECK-NEXT: [[TMP17:%.*]] = zext i1 [[TMP15]] to i32
; CHECK-NEXT: [[TMP18:%.*]] = load i32, i32* [[TMP6]], align 8
; CHECK-NEXT: [[TMP19:%.*]] = icmp slt i32 [[TMP18]], [[TMP16]]
; CHECK-NEXT: [[TMP20:%.*]] = select i1 [[TMP19]], i32 [[TMP18]], i32 [[TMP16]]
; CHECK-NEXT: [[TMP21:%.*]] = select i1 [[TMP19]], i32 2, i32 [[TMP16]]
; CHECK-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP7]], align 4
; CHECK-NEXT: [[TMP23:%.*]] = icmp slt i32 [[TMP22]], [[TMP20]]
; CHECK-NEXT: [[TMP24:%.*]] = select i1 [[TMP23]], i32 [[TMP22]], i32 [[TMP20]]
; CHECK-NEXT: [[TMP25:%.*]] = select i1 [[TMP23]], i32 3, i32 [[TMP21]]
; CHECK-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP8]], align 16
; CHECK-NEXT: [[TMP27:%.*]] = icmp slt i32 [[TMP26]], [[TMP24]]
; CHECK-NEXT: [[TMP28:%.*]] = select i1 [[TMP27]], i32 [[TMP26]], i32 [[TMP24]]
; CHECK-NEXT: [[TMP29:%.*]] = select i1 [[TMP27]], i32 4, i32 [[TMP25]]
; CHECK-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP10]], align 4
; CHECK-NEXT: [[TMP31:%.*]] = icmp slt i32 [[TMP30]], [[TMP28]]
; CHECK-NEXT: [[TMP32:%.*]] = select i1 [[TMP31]], i32 [[TMP30]], i32 [[TMP28]]
; CHECK-NEXT: [[TMP33:%.*]] = select i1 [[TMP31]], i32 5, i32 [[TMP29]]
; CHECK-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP9]], align 8
; CHECK-NEXT: [[TMP35:%.*]] = icmp slt i32 [[TMP34]], [[TMP32]]
; CHECK-NEXT: [[TMP36:%.*]] = select i1 [[TMP35]], i32 [[TMP34]], i32 [[TMP32]]
; CHECK-NEXT: [[TMP37:%.*]] = select i1 [[TMP35]], i32 6, i32 [[TMP33]]
; CHECK-NEXT: [[TMP38:%.*]] = load i32, i32* [[TMP11]], align 4
; CHECK-NEXT: [[TMP39:%.*]] = icmp slt i32 [[TMP38]], [[TMP36]]
; CHECK-NEXT: [[TMP40:%.*]] = select i1 [[TMP39]], i32 7, i32 [[TMP37]]
; CHECK-NEXT: store i32 [[TMP40]], i32* [[TMP2]], align 4
; CHECK-NEXT: ret i32 0
;
bb:
%tmp = alloca <8 x i32>, align 32
%tmp1 = bitcast <8 x i32>* %tmp to [8 x i32]*
%tmp2 = alloca i32, align 4
%tmp3 = bitcast <8 x i32>* %tmp to i8*
%tmp4 = getelementptr inbounds <8 x i32>, <8 x i32>* %tmp, i64 0, i64 0
%tmp5 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 1
%tmp6 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 2
%tmp7 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 3
%tmp8 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 4
%tmp9 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 6
%tmp10 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 5
%tmp11 = getelementptr inbounds [8 x i32], [8 x i32]* %tmp1, i64 0, i64 7
store <8 x i32> <i32 -221320154, i32 -756426931, i32 563883532, i32 382683935, i32 144890241, i32 -1052877364, i32 -1052877364, i32 -1016007675>, <8 x i32>* %tmp, align 32
%tmp12 = bitcast i32* %tmp2 to i8*
%tmp13 = load i32, i32* %tmp4, align 32
%tmp14 = load i32, i32* %tmp5, align 4
%tmp15 = icmp slt i32 %tmp14, %tmp13
%tmp16 = select i1 %tmp15, i32 %tmp14, i32 %tmp13
%tmp17 = zext i1 %tmp15 to i32
%tmp18 = load i32, i32* %tmp6, align 8
%tmp19 = icmp slt i32 %tmp18, %tmp16
%tmp20 = select i1 %tmp19, i32 %tmp18, i32 %tmp16
%tmp21 = select i1 %tmp19, i32 2, i32 %tmp16
%tmp22 = load i32, i32* %tmp7, align 4
%tmp23 = icmp slt i32 %tmp22, %tmp20
%tmp24 = select i1 %tmp23, i32 %tmp22, i32 %tmp20
%tmp25 = select i1 %tmp23, i32 3, i32 %tmp21
%tmp26 = load i32, i32* %tmp8, align 16
%tmp27 = icmp slt i32 %tmp26, %tmp24
%tmp28 = select i1 %tmp27, i32 %tmp26, i32 %tmp24
%tmp29 = select i1 %tmp27, i32 4, i32 %tmp25
%tmp30 = load i32, i32* %tmp10, align 4
%tmp31 = icmp slt i32 %tmp30, %tmp28
%tmp32 = select i1 %tmp31, i32 %tmp30, i32 %tmp28
%tmp33 = select i1 %tmp31, i32 5, i32 %tmp29
%tmp34 = load i32, i32* %tmp9, align 8
%tmp35 = icmp slt i32 %tmp34, %tmp32
%tmp36 = select i1 %tmp35, i32 %tmp34, i32 %tmp32
%tmp37 = select i1 %tmp35, i32 6, i32 %tmp33
%tmp38 = load i32, i32* %tmp11, align 4
%tmp39 = icmp slt i32 %tmp38, %tmp36
%tmp40 = select i1 %tmp39, i32 7, i32 %tmp37
store i32 %tmp40, i32* %tmp2, align 4
ret i32 0
}