llvm-project/llvm/test/CodeGen/X86/widen_arith-6.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown-unknown -mattr=+sse4.2 | FileCheck %s

; Widen a v3f32 to v4f32 to do a vector multiply and an add.

; @update(dst, src, n): signed-counted loop that, for each i in [0, n), computes
;   dst[i] = src[i] * <1.0, 2.0, 3.0> + <K, K, K>
; on <3 x float> elements, where K is the float constant 0x409EE02900000000
; (shown as 1.97604004E+3 in the expected assembly below).
;
; Every local, including the loop counter %i and the multiplier vector %v, is
; kept in an alloca and reloaded with an explicit load at each use.
;
; What the expected assembly below pins down:
;   - the multiply and add are performed with full-width mulps/addps;
;   - the index is scaled by 16 bytes (shll $4) for both src and dst;
;   - the result is written back as three scalar stores (two extractps plus
;     one movss) rather than a single 16-byte store.
define void @update(<3 x float>* %dst, <3 x float>* %src, i32 %n) nounwind {
; CHECK-LABEL: update:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    pushl %ebp
; CHECK-NEXT:    movl %esp, %ebp
; CHECK-NEXT:    andl $-16, %esp
; CHECK-NEXT:    subl $48, %esp
; CHECK-NEXT:    movl $1077936128, {{[0-9]+}}(%esp) # imm = 0x40400000
; CHECK-NEXT:    movl $1073741824, {{[0-9]+}}(%esp) # imm = 0x40000000
; CHECK-NEXT:    movl $1065353216, {{[0-9]+}}(%esp) # imm = 0x3F800000
; CHECK-NEXT:    movl $0, {{[0-9]+}}(%esp)
; CHECK-NEXT:    movaps {{.*#+}} xmm0 = <1.97604004E+3,1.97604004E+3,1.97604004E+3,u>
; CHECK-NEXT:    jmp .LBB0_1
; CHECK-NEXT:    .p2align 4, 0x90
; CHECK-NEXT:  .LBB0_2: # %forbody
; CHECK-NEXT:    # in Loop: Header=BB0_1 Depth=1
; CHECK-NEXT:    movl {{[0-9]+}}(%esp), %eax
; CHECK-NEXT:    movl 8(%ebp), %ecx
; CHECK-NEXT:    shll $4, %eax
; CHECK-NEXT:    movl 12(%ebp), %edx
; CHECK-NEXT:    movaps (%edx,%eax), %xmm1
; CHECK-NEXT:    mulps {{[0-9]+}}(%esp), %xmm1
; CHECK-NEXT:    addps %xmm0, %xmm1
; CHECK-NEXT:    extractps $2, %xmm1, 8(%ecx,%eax)
; CHECK-NEXT:    extractps $1, %xmm1, 4(%ecx,%eax)
; CHECK-NEXT:    movss %xmm1, (%ecx,%eax)
; CHECK-NEXT:    incl {{[0-9]+}}(%esp)
; CHECK-NEXT:  .LBB0_1: # %forcond
; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:    movl {{[0-9]+}}(%esp), %eax
; CHECK-NEXT:    cmpl 16(%ebp), %eax
; CHECK-NEXT:    jl .LBB0_2
; CHECK-NEXT:  # %bb.3: # %afterfor
; CHECK-NEXT:    movl %ebp, %esp
; CHECK-NEXT:    popl %ebp
; CHECK-NEXT:    retl
entry:
	; Stack slots for the three arguments, the multiplier vector %v
	; (explicitly 16-byte aligned), and the loop counter %i.
	%dst.addr = alloca <3 x float>*
	%src.addr = alloca <3 x float>*
	%n.addr = alloca i32
	%v = alloca <3 x float>, align 16
	%i = alloca i32, align 4
	; Copy the incoming arguments into their slots.
	store <3 x float>* %dst, <3 x float>** %dst.addr
	store <3 x float>* %src, <3 x float>** %src.addr
	store i32 %n, i32* %n.addr
	; %v = <1.0, 2.0, 3.0>: the per-lane multiplier read back in the loop body.
	store <3 x float> < float 1.000000e+00, float 2.000000e+00, float 3.000000e+00 >, <3 x float>* %v
	; i = 0
	store i32 0, i32* %i
	br label %forcond

forcond:
	; Loop test: continue while i < n (signed comparison).
	%tmp = load i32, i32* %i
	%tmp1 = load i32, i32* %n.addr
	%cmp = icmp slt i32 %tmp, %tmp1
	br i1 %cmp, label %forbody, label %afterfor

forbody:
	; %arrayidx = &dst[i]
	%tmp2 = load i32, i32* %i
	%tmp3 = load <3 x float>*, <3 x float>** %dst.addr
	%arrayidx = getelementptr <3 x float>, <3 x float>* %tmp3, i32 %tmp2
	; %arrayidx6 = &src[i]
	%tmp4 = load i32, i32* %i
	%tmp5 = load <3 x float>*, <3 x float>** %src.addr
	%arrayidx6 = getelementptr <3 x float>, <3 x float>* %tmp5, i32 %tmp4
	; %add = src[i] * %v + <K, K, K>; these are the two <3 x float> arithmetic
	; operations whose lowering this test exercises.
	%tmp7 = load <3 x float>, <3 x float>* %arrayidx6
	%tmp8 = load <3 x float>, <3 x float>* %v
	%mul = fmul <3 x float> %tmp7, %tmp8
	%add = fadd <3 x float> %mul, < float 0x409EE02900000000, float 0x409EE02900000000, float 0x409EE02900000000 >
	; dst[i] = %add
	store <3 x float> %add, <3 x float>* %arrayidx
	br label %forinc

forinc:
	; i = i + 1, then go back to the loop test.
	%tmp9 = load i32, i32* %i
	%inc = add i32 %tmp9, 1
	store i32 %inc, i32* %i
	br label %forcond

afterfor:
	ret void
}
[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py`
			`; RUN: llc < %s -mtriple=i686-unknown-unknown -mattr=+sse4.2 \| FileCheck %s`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00
			`; widen a v3f32 to vfi32 to do a vector multiple and an add`

			`define void @update(<3 x float>* %dst, <3 x float>* %src, i32 %n) nounwind {`
[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`; CHECK-LABEL: update:`
[CodeGen] Unify MBB reference format in both MIR and debug output As part of the unification of the debug format and the MIR format, print MBB references as '%bb.5'. The MIR printer prints the IR name of a MBB only for block definitions. * find . \( -name ".mir" -o -name ".cpp" -o -name ".h" -o -name ".ll" \) -type f -print0 \| xargs -0 sed -i '' -E 's/BB#" << ([a-zA-Z0-9_]+)->getNumber\(\)/" << printMBBReference(\1)/g' find . \( -name ".mir" -o -name ".cpp" -o -name ".h" -o -name ".ll" \) -type f -print0 \| xargs -0 sed -i '' -E 's/BB#" << ([a-zA-Z0-9_]+)\.getNumber\(\)/" << printMBBReference(\1)/g' * find . \( -name ".txt" -o -name ".s" -o -name ".mir" -o -name ".cpp" -o -name ".h" -o -name ".ll" \) -type f -print0 \| xargs -0 sed -i '' -E 's/BB#([0-9]+)/%bb.\1/g' * grep -nr 'BB#' and fix Differential Revision: https://reviews.llvm.org/D40422 llvm-svn: 319665 2017-12-05 01:18:51 +08:00			`; CHECK: # %bb.0: # %entry`
[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`; CHECK-NEXT: pushl %ebp`
			`; CHECK-NEXT: movl %esp, %ebp`
			`; CHECK-NEXT: andl $-16, %esp`
			`; CHECK-NEXT: subl $48, %esp`
			`; CHECK-NEXT: movl $1077936128, {{[0-9]+}}(%esp) # imm = 0x40400000`
			`; CHECK-NEXT: movl $1073741824, {{[0-9]+}}(%esp) # imm = 0x40000000`
			`; CHECK-NEXT: movl $1065353216, {{[0-9]+}}(%esp) # imm = 0x3F800000`
			`; CHECK-NEXT: movl $0, {{[0-9]+}}(%esp)`
[X86] Force floating point values in constant pool decoding to print in scientific notation so they can't be confused with integers. When the floating point constants are whole numbers they have no decimal point so look like integers, but mean something very different in something like an 'and' instruction. Ideally we would just print a decimal point and a 0, but I couldn't see how to make APFloat::toString do that. llvm-svn: 345488 2018-10-29 12:52:04 +08:00			`; CHECK-NEXT: movaps {{.*#+}} xmm0 = <1.97604004E+3,1.97604004E+3,1.97604004E+3,u>`
[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`; CHECK-NEXT: jmp .LBB0_1`
			`; CHECK-NEXT: .p2align 4, 0x90`
			`; CHECK-NEXT: .LBB0_2: # %forbody`
			`; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1`
			`; CHECK-NEXT: movl {{[0-9]+}}(%esp), %eax`
			`; CHECK-NEXT: movl 8(%ebp), %ecx`
			`; CHECK-NEXT: shll $4, %eax`
			`; CHECK-NEXT: movl 12(%ebp), %edx`
			`; CHECK-NEXT: movaps (%edx,%eax), %xmm1`
			`; CHECK-NEXT: mulps {{[0-9]+}}(%esp), %xmm1`
			`; CHECK-NEXT: addps %xmm0, %xmm1`
			`; CHECK-NEXT: extractps $2, %xmm1, 8(%ecx,%eax)`
			`; CHECK-NEXT: extractps $1, %xmm1, 4(%ecx,%eax)`
			`; CHECK-NEXT: movss %xmm1, (%ecx,%eax)`
			`; CHECK-NEXT: incl {{[0-9]+}}(%esp)`
			`; CHECK-NEXT: .LBB0_1: # %forcond`
			`; CHECK-NEXT: # =>This Inner Loop Header: Depth=1`
			`; CHECK-NEXT: movl {{[0-9]+}}(%esp), %eax`
			`; CHECK-NEXT: cmpl 16(%ebp), %eax`
			`; CHECK-NEXT: jl .LBB0_2`
[CodeGen] Unify MBB reference format in both MIR and debug output As part of the unification of the debug format and the MIR format, print MBB references as '%bb.5'. The MIR printer prints the IR name of a MBB only for block definitions. * find . \( -name ".mir" -o -name ".cpp" -o -name ".h" -o -name ".ll" \) -type f -print0 \| xargs -0 sed -i '' -E 's/BB#" << ([a-zA-Z0-9_]+)->getNumber\(\)/" << printMBBReference(\1)/g' find . \( -name ".mir" -o -name ".cpp" -o -name ".h" -o -name ".ll" \) -type f -print0 \| xargs -0 sed -i '' -E 's/BB#" << ([a-zA-Z0-9_]+)\.getNumber\(\)/" << printMBBReference(\1)/g' * find . \( -name ".txt" -o -name ".s" -o -name ".mir" -o -name ".cpp" -o -name ".h" -o -name ".ll" \) -type f -print0 \| xargs -0 sed -i '' -E 's/BB#([0-9]+)/%bb.\1/g' * grep -nr 'BB#' and fix Differential Revision: https://reviews.llvm.org/D40422 llvm-svn: 319665 2017-12-05 01:18:51 +08:00			`; CHECK-NEXT: # %bb.3: # %afterfor`
[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`; CHECK-NEXT: movl %ebp, %esp`
			`; CHECK-NEXT: popl %ebp`
			`; CHECK-NEXT: retl`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00			`entry:`
[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`%dst.addr = alloca <3 x float>*`
			`%src.addr = alloca <3 x float>*`
			`%n.addr = alloca i32`
			`%v = alloca <3 x float>, align 16`
			`%i = alloca i32, align 4`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00			`store <3 x float>* %dst, <3 x float>** %dst.addr`
			`store <3 x float>* %src, <3 x float>** %src.addr`
			`store i32 %n, i32* %n.addr`
			`store <3 x float> < float 1.000000e+00, float 2.000000e+00, float 3.000000e+00 >, <3 x float>* %v`
			`store i32 0, i32* %i`
			`br label %forcond`

[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`forcond:`
			`%tmp = load i32, i32* %i`
			`%tmp1 = load i32, i32* %n.addr`
			`%cmp = icmp slt i32 %tmp, %tmp1`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00			`br i1 %cmp, label %forbody, label %afterfor`

[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`forbody:`
			`%tmp2 = load i32, i32* %i`
			`%tmp3 = load <3 x float>, <3 x float>* %dst.addr`
			`%arrayidx = getelementptr <3 x float>, <3 x float>* %tmp3, i32 %tmp2`
			`%tmp4 = load i32, i32* %i`
			`%tmp5 = load <3 x float>, <3 x float>* %src.addr`
			`%arrayidx6 = getelementptr <3 x float>, <3 x float>* %tmp5, i32 %tmp4`
			`%tmp7 = load <3 x float>, <3 x float>* %arrayidx6`
			`%tmp8 = load <3 x float>, <3 x float>* %v`
			`%mul = fmul <3 x float> %tmp7, %tmp8`
			`%add = fadd <3 x float> %mul, < float 0x409EE02900000000, float 0x409EE02900000000, float 0x409EE02900000000 >`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00			`store <3 x float> %add, <3 x float>* %arrayidx`
			`br label %forinc`

[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`forinc:`
			`%tmp9 = load i32, i32* %i`
			`%inc = add i32 %tmp9, 1`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00			`store i32 %inc, i32* %i`
			`br label %forcond`

[x86] specify triples and auto-generate complete checks; NFC llvm-svn: 305656 2017-06-19 05:48:44 +08:00			`afterfor:`
Added some basic test cases for r61209 llvm-svn: 61210 2008-12-19 04:05:58 +08:00			`ret void`
			`}`