; llvm-project/llvm/test/CodeGen/X86/umul-with-overflow.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown-linux-gnu | FileCheck %s --check-prefix=X86
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu | FileCheck %s --check-prefix=X64

; Unsigned 32-bit multiply-with-overflow intrinsic called by every function in
; this test. It returns a struct whose field 0 is the i32 product and whose
; field 1 is the i1 overflow flag (see the LLVM Language Reference).
declare {i32, i1} @llvm.umul.with.overflow.i32(i32 %a, i32 %b)

; Overflow-flag test: multiplies %x by the constant 3 through
; llvm.umul.with.overflow.i32 and returns only field 1 of the result (the i1
; overflow flag); the i32 product is never read.
; The autogenerated assertions below expect, for both triples, the constant 3
; loaded into %ecx, a one-operand `mull %ecx`, and `seto %al` producing the
; returned value.
define zeroext i1 @a(i32 %x)  nounwind {
; X86-LABEL: a:
; X86:       # BB#0:
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl $3, %ecx
; X86-NEXT:    mull %ecx
; X86-NEXT:    seto %al
; X86-NEXT:    retl
;
; X64-LABEL: a:
; X64:       # BB#0:
; X64-NEXT:    movl $3, %ecx
; X64-NEXT:    movl %edi, %eax
; X64-NEXT:    mull %ecx
; X64-NEXT:    seto %al
; X64-NEXT:    retq
  %res = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %x, i32 3)
  %obil = extractvalue {i32, i1} %res, 1
  ret i1 %obil
}

; Product-only test with a multiplier of 2: computes (%b + %a) * 2 through
; llvm.umul.with.overflow.i32 and returns field 0 of the result (the i32
; product); the overflow flag is never read.
; The autogenerated assertions below contain no multiply instruction: the i686
; output doubles the sum with `addl %eax, %eax`, and the x86_64 output uses
; `leal (%rdi,%rdi), %eax`.
define i32 @test2(i32 %a, i32 %b) nounwind readnone {
; X86-LABEL: test2:
; X86:       # BB#0: # %entry
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    addl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    addl %eax, %eax
; X86-NEXT:    retl
;
; X64-LABEL: test2:
; X64:       # BB#0: # %entry
; X64-NEXT:    # kill: %EDI<def> %EDI<kill> %RDI<def>
; X64-NEXT:    addl %esi, %edi
; X64-NEXT:    leal (%rdi,%rdi), %eax
; X64-NEXT:    retq
entry:
	%tmp0 = add i32 %b, %a
	%tmp1 = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %tmp0, i32 2)
	%tmp2 = extractvalue { i32, i1 } %tmp1, 0
	ret i32 %tmp2
}

; Product-only test with a multiplier of 4: computes (%b + %a) * 4 through
; llvm.umul.with.overflow.i32 and returns field 0 of the result (the i32
; product); the overflow flag is never read.
; Unlike the multiply-by-2 case in @test2, the autogenerated assertions below
; still expect a real multiply for both triples: `movl $4, %ecx` followed by
; `mull %ecx`.
define i32 @test3(i32 %a, i32 %b) nounwind readnone {
; X86-LABEL: test3:
; X86:       # BB#0: # %entry
; X86-NEXT:    movl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    addl {{[0-9]+}}(%esp), %eax
; X86-NEXT:    movl $4, %ecx
; X86-NEXT:    mull %ecx
; X86-NEXT:    retl
;
; X64-LABEL: test3:
; X64:       # BB#0: # %entry
; X64-NEXT:    # kill: %ESI<def> %ESI<kill> %RSI<def>
; X64-NEXT:    # kill: %EDI<def> %EDI<kill> %RDI<def>
; X64-NEXT:    leal (%rdi,%rsi), %eax
; X64-NEXT:    movl $4, %ecx
; X64-NEXT:    mull %ecx
; X64-NEXT:    retq
entry:
	%tmp0 = add i32 %b, %a
	%tmp1 = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %tmp0, i32 4)
	%tmp2 = extractvalue { i32, i1 } %tmp1, 0
	ret i32 %tmp2
}
[X86] Regenerated umul overflow tests on 32/64 bit targets llvm-svn: 309102 2017-07-26 19:04:18 +08:00			`; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py`
			`; RUN: llc < %s -mtriple=i686-unknown-linux-gnu \| FileCheck %s --check-prefix=X86`
			`; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu \| FileCheck %s --check-prefix=X64`
Add some generic expansion logic for SMULO and UMULO. Fixes UMULO support for x86, and UMULO/SMULO for many architectures, including PPC (PR4201), ARM, and Cell. The resulting expansion isn't perfect, but it's not bad. llvm-svn: 73477 2009-06-16 14:58:29 +08:00
			`declare {i32, i1} @llvm.umul.with.overflow.i32(i32 %a, i32 %b)`
[X86] Regenerated umul overflow tests on 32/64 bit targets llvm-svn: 309102 2017-07-26 19:04:18 +08:00
manually upgrade a bunch of tests to modern syntax, and remove some that are either unreduced or only test old syntax. llvm-svn: 133228 2011-06-17 11:14:27 +08:00			`define zeroext i1 @a(i32 %x) nounwind {`
[X86] Regenerated umul overflow tests on 32/64 bit targets llvm-svn: 309102 2017-07-26 19:04:18 +08:00			`; X86-LABEL: a:`
			`; X86: # BB#0:`
			`; X86-NEXT: movl {{[0-9]+}}(%esp), %eax`
			`; X86-NEXT: movl $3, %ecx`
			`; X86-NEXT: mull %ecx`
			`; X86-NEXT: seto %al`
			`; X86-NEXT: retl`
			`;`
			`; X64-LABEL: a:`
			`; X64: # BB#0:`
			`; X64-NEXT: movl $3, %ecx`
			`; X64-NEXT: movl %edi, %eax`
			`; X64-NEXT: mull %ecx`
			`; X64-NEXT: seto %al`
			`; X64-NEXT: retq`
Add some generic expansion logic for SMULO and UMULO. Fixes UMULO support for x86, and UMULO/SMULO for many architectures, including PPC (PR4201), ARM, and Cell. The resulting expansion isn't perfect, but it's not bad. llvm-svn: 73477 2009-06-16 14:58:29 +08:00			`%res = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %x, i32 3)`
			`%obil = extractvalue {i32, i1} %res, 1`
			`ret i1 %obil`
			`}`
Implement mulo x, 2 -> addo x, x in DAGCombiner. llvm-svn: 131800 2011-05-22 02:31:55 +08:00
			`define i32 @test2(i32 %a, i32 %b) nounwind readnone {`
[X86] Regenerated umul overflow tests on 32/64 bit targets llvm-svn: 309102 2017-07-26 19:04:18 +08:00			`; X86-LABEL: test2:`
			`; X86: # BB#0: # %entry`
			`; X86-NEXT: movl {{[0-9]+}}(%esp), %eax`
			`; X86-NEXT: addl {{[0-9]+}}(%esp), %eax`
			`; X86-NEXT: addl %eax, %eax`
			`; X86-NEXT: retl`
			`;`
			`; X64-LABEL: test2:`
			`; X64: # BB#0: # %entry`
			`; X64-NEXT: # kill: %EDI<def> %EDI<kill> %RDI<def>`
			`; X64-NEXT: addl %esi, %edi`
			`; X64-NEXT: leal (%rdi,%rdi), %eax`
			`; X64-NEXT: retq`
Implement mulo x, 2 -> addo x, x in DAGCombiner. llvm-svn: 131800 2011-05-22 02:31:55 +08:00			`entry:`
Revert r314886 "[X86] Improvement in CodeGen instruction selection for LEAs (re-applying post required revision changes.)" It broke the Chromium / SQLite build; see PR34830. > Summary: > 1/ Operand folding during complex pattern matching for LEAs has been > extended, such that it promotes Scale to accommodate similar operand > appearing in the DAG. > e.g. > T1 = A + B > T2 = T1 + 10 > T3 = T2 + A > For above DAG rooted at T3, X86AddressMode will no look like > Base = B , Index = A , Scale = 2 , Disp = 10 > > 2/ During OptimizeLEAPass down the pipeline factorization is now performed over LEAs > so that if there is an opportunity then complex LEAs (having 3 operands) > could be factored out. > e.g. > leal 1(%rax,%rcx,1), %rdx > leal 1(%rax,%rcx,2), %rcx > will be factored as following > leal 1(%rax,%rcx,1), %rdx > leal (%rdx,%rcx) , %edx > > 3/ Aggressive operand folding for AM based selection for LEAs is sensitive to loops, > thus avoiding creation of any complex LEAs within a loop. > > Reviewers: lsaba, RKSimon, craig.topper, qcolombet, jmolloy > > Reviewed By: lsaba > > Subscribers: jmolloy, spatel, igorb, llvm-commits > > Differential Revision: https://reviews.llvm.org/D35014 llvm-svn: 314919 2017-10-05 01:54:06 +08:00			`%tmp0 = add i32 %b, %a`
			`%tmp1 = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %tmp0, i32 2)`
			`%tmp2 = extractvalue { i32, i1 } %tmp1, 0`
			`ret i32 %tmp2`
Implement mulo x, 2 -> addo x, x in DAGCombiner. llvm-svn: 131800 2011-05-22 02:31:55 +08:00			`}`

			`define i32 @test3(i32 %a, i32 %b) nounwind readnone {`
[X86] Regenerated umul overflow tests on 32/64 bit targets llvm-svn: 309102 2017-07-26 19:04:18 +08:00			`; X86-LABEL: test3:`
			`; X86: # BB#0: # %entry`
			`; X86-NEXT: movl {{[0-9]+}}(%esp), %eax`
			`; X86-NEXT: addl {{[0-9]+}}(%esp), %eax`
			`; X86-NEXT: movl $4, %ecx`
			`; X86-NEXT: mull %ecx`
			`; X86-NEXT: retl`
			`;`
			`; X64-LABEL: test3:`
			`; X64: # BB#0: # %entry`
			`; X64-NEXT: # kill: %ESI<def> %ESI<kill> %RSI<def>`
			`; X64-NEXT: # kill: %EDI<def> %EDI<kill> %RDI<def>`
			`; X64-NEXT: leal (%rdi,%rsi), %eax`
			`; X64-NEXT: movl $4, %ecx`
			`; X64-NEXT: mull %ecx`
			`; X64-NEXT: retq`
Implement mulo x, 2 -> addo x, x in DAGCombiner. llvm-svn: 131800 2011-05-22 02:31:55 +08:00			`entry:`
Revert r314886 "[X86] Improvement in CodeGen instruction selection for LEAs (re-applying post required revision changes.)" It broke the Chromium / SQLite build; see PR34830. > Summary: > 1/ Operand folding during complex pattern matching for LEAs has been > extended, such that it promotes Scale to accommodate similar operand > appearing in the DAG. > e.g. > T1 = A + B > T2 = T1 + 10 > T3 = T2 + A > For above DAG rooted at T3, X86AddressMode will no look like > Base = B , Index = A , Scale = 2 , Disp = 10 > > 2/ During OptimizeLEAPass down the pipeline factorization is now performed over LEAs > so that if there is an opportunity then complex LEAs (having 3 operands) > could be factored out. > e.g. > leal 1(%rax,%rcx,1), %rdx > leal 1(%rax,%rcx,2), %rcx > will be factored as following > leal 1(%rax,%rcx,1), %rdx > leal (%rdx,%rcx) , %edx > > 3/ Aggressive operand folding for AM based selection for LEAs is sensitive to loops, > thus avoiding creation of any complex LEAs within a loop. > > Reviewers: lsaba, RKSimon, craig.topper, qcolombet, jmolloy > > Reviewed By: lsaba > > Subscribers: jmolloy, spatel, igorb, llvm-commits > > Differential Revision: https://reviews.llvm.org/D35014 llvm-svn: 314919 2017-10-05 01:54:06 +08:00			`%tmp0 = add i32 %b, %a`
			`%tmp1 = call { i32, i1 } @llvm.umul.with.overflow.i32(i32 %tmp0, i32 4)`
			`%tmp2 = extractvalue { i32, i1 } %tmp1, 0`
			`ret i32 %tmp2`
Implement mulo x, 2 -> addo x, x in DAGCombiner. llvm-svn: 131800 2011-05-22 02:31:55 +08:00			`}`