forked from OSchip/llvm-project
87 lines
3.5 KiB
LLVM
87 lines
3.5 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
|
; RUN: opt -instcombine -S < %s | FileCheck %s
|
|
|
|
define void @scalarize_phi(i32 * %n, float * %inout) {
|
|
; CHECK-LABEL: @scalarize_phi(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: [[T0:%.*]] = load volatile float, float* [[INOUT:%.*]], align 4
|
|
; CHECK-NEXT: br label [[FOR_COND:%.*]]
|
|
; CHECK: for.cond:
|
|
; CHECK-NEXT: [[TMP0:%.*]] = phi float [ [[T0]], [[ENTRY:%.*]] ], [ [[TMP1:%.*]], [[FOR_BODY:%.*]] ]
|
|
; CHECK-NEXT: [[I_0:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[INC:%.*]], [[FOR_BODY]] ]
|
|
; CHECK-NEXT: [[T1:%.*]] = load i32, i32* [[N:%.*]], align 4
|
|
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[I_0]], [[T1]]
|
|
; CHECK-NEXT: br i1 [[CMP]], label [[FOR_END:%.*]], label [[FOR_BODY]]
|
|
; CHECK: for.body:
|
|
; CHECK-NEXT: store volatile float [[TMP0]], float* [[INOUT]], align 4
|
|
; CHECK-NEXT: [[TMP1]] = fmul float [[TMP0]], 0x4002A3D700000000
|
|
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[I_0]], 1
|
|
; CHECK-NEXT: br label [[FOR_COND]]
|
|
; CHECK: for.end:
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
%t0 = load volatile float, float * %inout, align 4
|
|
%insert = insertelement <4 x float> undef, float %t0, i32 0
|
|
%splat = shufflevector <4 x float> %insert, <4 x float> undef, <4 x i32> zeroinitializer
|
|
%insert1 = insertelement <4 x float> undef, float 3.0, i32 0
|
|
br label %for.cond
|
|
|
|
for.cond:
|
|
%x.0 = phi <4 x float> [ %splat, %entry ], [ %mul, %for.body ]
|
|
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%t1 = load i32, i32 * %n, align 4
|
|
%cmp = icmp ne i32 %i.0, %t1
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%t2 = extractelement <4 x float> %x.0, i32 1
|
|
store volatile float %t2, float * %inout, align 4
|
|
%mul = fmul <4 x float> %x.0, <float 0x4002A3D700000000, float 0x4002A3D700000000, float 0x4002A3D700000000, float 0x4002A3D700000000>
|
|
%inc = add nsw i32 %i.0, 1
|
|
br label %for.cond
|
|
|
|
for.end:
|
|
ret void
|
|
}
|
|
|
|
define float @extract_element_constant_index(<4 x float> %x) {
|
|
; CHECK-LABEL: @extract_element_constant_index(
|
|
; CHECK-NEXT: [[R_LHS:%.*]] = extractelement <4 x float> [[X:%.*]], i32 2
|
|
; CHECK-NEXT: [[R:%.*]] = fadd float [[R_LHS]], 0x4002A3D700000000
|
|
; CHECK-NEXT: ret float [[R]]
|
|
;
|
|
%add = fadd <4 x float> %x, <float 0x4002A3D700000000, float 0x4002A3D700000000, float 0x4002A3D700000000, float 0x4002A3D700000000>
|
|
%r = extractelement <4 x float> %add, i32 2
|
|
ret float %r
|
|
}
|
|
|
|
define float @extract_element_variable_index(<4 x float> %x, i32 %y) {
|
|
; CHECK-LABEL: @extract_element_variable_index(
|
|
; CHECK-NEXT: [[R_LHS:%.*]] = extractelement <4 x float> [[X:%.*]], i32 [[Y:%.*]]
|
|
; CHECK-NEXT: [[R:%.*]] = fadd float [[R_LHS]], 1.000000e+00
|
|
; CHECK-NEXT: ret float [[R]]
|
|
;
|
|
%add = fadd <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0>
|
|
%r = extractelement <4 x float> %add, i32 %y
|
|
ret float %r
|
|
}
|
|
|
|
define float @extract_element_splat_constant_vector_variable_index(i32 %y) {
|
|
; CHECK-LABEL: @extract_element_splat_constant_vector_variable_index(
|
|
; CHECK-NEXT: ret float 2.000000e+00
|
|
;
|
|
%r = extractelement <4 x float> <float 2.0, float 2.0, float 2.0, float 2.0>, i32 %y
|
|
ret float %r
|
|
}
|
|
|
|
define float @extract_element_constant_vector_variable_index(i32 %y) {
|
|
; CHECK-LABEL: @extract_element_constant_vector_variable_index(
|
|
; CHECK-NEXT: [[R:%.*]] = extractelement <4 x float> <float 1.000000e+00, float 2.000000e+00, float 3.000000e+00, float 4.000000e+00>, i32 [[Y:%.*]]
|
|
; CHECK-NEXT: ret float [[R]]
|
|
;
|
|
%r = extractelement <4 x float> <float 1.0, float 2.0, float 3.0, float 4.0>, i32 %y
|
|
ret float %r
|
|
}
|
|
|