2015-01-28 22:08:22 +08:00
|
|
|
; RUN: llc < %s -mtriple=x86_64-pc-linux-gnu | FileCheck %s --check-prefix=X64
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-pc-linux-gnux32 | FileCheck %s --check-prefix=X64
|
|
|
|
; RUN: llc < %s -mtriple=i686-pc-linux | FileCheck %s --check-prefix=X86
|
|
|
|
|
|
|
|
; i32 multiply by 4 (a power of two).
; Checked lowering: x86-64 uses an leal, i686 uses a left shift (shll).
define i32 @mul4_32(i32 %A) {
; X64-LABEL: mul4_32:
; X64: leal
; X86-LABEL: mul4_32:
; X86: shll
  %mul = mul i32 %A, 4
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i64 multiply by 4 (a power of two).
; Checked lowering: x86-64 uses an leaq; i686 must contain a shldl followed
; (not necessarily immediately) by a shll.
define i64 @mul4_64(i64 %A) {
; X64-LABEL: mul4_64:
; X64: leaq
; X86-LABEL: mul4_64:
; X86: shldl
; X86: shll
  %mul = mul i64 %A, 4
  ret i64 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 4096 (2^12).
; Checked lowering: both targets use a left shift (shll).
define i32 @mul4096_32(i32 %A) {
; X64-LABEL: mul4096_32:
; X64: shll
; X86-LABEL: mul4096_32:
; X86: shll
  %mul = mul i32 %A, 4096
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i64 multiply by 4096 (2^12).
; Checked lowering: x86-64 uses a single shlq; i686 must contain a shldl
; followed (not necessarily immediately) by a shll.
define i64 @mul4096_64(i64 %A) {
; X64-LABEL: mul4096_64:
; X64: shlq
; X86-LABEL: mul4096_64:
; X86: shldl
; X86: shll
  %mul = mul i64 %A, 4096
  ret i64 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by -4096 (negated power of two).
; Checked lowering: on both targets a shll immediately followed by a negl.
define i32 @mulmin4096_32(i32 %A) {
; X64-LABEL: mulmin4096_32:
; X64: shll
; X64-NEXT: negl
; X86-LABEL: mulmin4096_32:
; X86: shll
; X86-NEXT: negl
  %mul = mul i32 %A, -4096
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i64 multiply by -4096 (negated power of two).
; Checked lowering: x86-64 uses shlq immediately followed by negq; i686 uses
; the consecutive sequence shldl, shll, xorl, negl, sbbl.
define i64 @mulmin4096_64(i64 %A) {
; X64-LABEL: mulmin4096_64:
; X64: shlq
; X64-NEXT: negq
; X86-LABEL: mulmin4096_64:
; X86: shldl
; X86-NEXT: shll
; X86-NEXT: xorl
; X86-NEXT: negl
; X86-NEXT: sbbl
  %mul = mul i64 %A, -4096
  ret i64 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 3.
; Checked lowering: x86-64 uses an leal, while i686 keeps a real multiply
; (imull).
define i32 @mul3_32(i32 %A) {
; X64-LABEL: mul3_32:
; X64: leal
; X86-LABEL: mul3_32:
; NOTE(review): it is not obvious why i686 does not also use an LEA here;
; presumably imull can take the stack argument directly as a memory
; operand -- confirm before relying on this.
; X86: imull
  %mul = mul i32 %A, 3
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i64 multiply by 3.
; Checked lowering: x86-64 uses an leaq; i686 uses a mull immediately followed
; by an imull.
define i64 @mul3_64(i64 %A) {
; X64-LABEL: mul3_64:
; X64: leaq
; X86-LABEL: mul3_64:
; X86: mull
; X86-NEXT: imull
  %mul = mul i64 %A, 3
  ret i64 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 40 (8 * 5).
; Checked lowering: on both targets a shll immediately followed by an leal.
define i32 @mul40_32(i32 %A) {
; X64-LABEL: mul40_32:
; X64: shll
; X64-NEXT: leal
; X86-LABEL: mul40_32:
; X86: shll
; X86-NEXT: leal
  %mul = mul i32 %A, 40
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i64 multiply by 40 (8 * 5).
; Checked lowering: x86-64 uses shlq immediately followed by leaq; i686 uses
; the consecutive sequence leal, movl, mull, leal.
define i64 @mul40_64(i64 %A) {
; X64-LABEL: mul40_64:
; X64: shlq
; X64-NEXT: leaq
; X86-LABEL: mul40_64:
; X86: leal
; X86-NEXT: movl
; X86-NEXT: mull
; X86-NEXT: leal
  %mul = mul i64 %A, 40
  ret i64 %mul
}
|
2015-08-12 19:27:26 +08:00
|
|
|
|
|
|
|
; i32 multiply by 4 in a function carrying the minsize attribute.
; Checked lowering matches the non-minsize mul4_32 case: leal on x86-64,
; shll on i686.
define i32 @mul4_32_minsize(i32 %A) minsize {
; X64-LABEL: mul4_32_minsize:
; X64: leal
; X86-LABEL: mul4_32_minsize:
; X86: shll
  %mul = mul i32 %A, 4
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 40 in a function carrying the minsize attribute.
; Checked lowering: both targets keep a single imull, in contrast to the
; shll + leal pair checked for mul40_32 without minsize.
define i32 @mul40_32_minsize(i32 %A) minsize {
; X64-LABEL: mul40_32_minsize:
; X64: imull
; X86-LABEL: mul40_32_minsize:
; X86: imull
  %mul = mul i32 %A, 40
  ret i32 %mul
}
|
[X86ISelLowering] Add additional support for multiplication-to-shift conversion.
Summary: This patch adds support for the conversions (mul x, 2^N + 1) => (add (shl x, N), x) and (mul x, 2^N - 1) => (sub (shl x, N), x) when the multiplication cannot be converted to LEA + SHL or LEA + LEA. LLVM already supports this on ARM, and it should also be useful on X86. Note that the patch currently applies only to cases where the constant operand is positive; I am planning to add another patch to support negative cases after this.
Reviewers: craig.topper, RKSimon
Subscribers: aemerson, llvm-commits
Differential Revision: http://reviews.llvm.org/D14603
llvm-svn: 255415
2015-12-12 09:04:15 +08:00
|
|
|
|
|
|
|
; i32 multiply by 33 (2^5 + 1).
; Checked lowering: a shll immediately followed by leal on x86-64 and by addl
; on i686.
define i32 @mul33_32(i32 %A) {
; X64-LABEL: mul33_32:
; X64: shll
; X64-NEXT: leal
; X86-LABEL: mul33_32:
; X86: shll
; X86-NEXT: addl
  %mul = mul i32 %A, 33
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 31 (2^5 - 1).
; Checked lowering: on both targets a shll immediately followed by a subl.
define i32 @mul31_32(i32 %A) {
; X64-LABEL: mul31_32:
; X64: shll
; X64-NEXT: subl
; X86-LABEL: mul31_32:
; X86: shll
; X86-NEXT: subl
  %mul = mul i32 %A, 31
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 0: the result is the constant zero, so no multiply or shift
; is expected; the return register is simply cleared with xorl.
; The i686 run returns i32 values in %eax as well, so the same zeroing idiom
; is checked there too.
define i32 @mul0_32(i32 %A) {
; X64-LABEL: mul0_32:
; X64: xorl %eax, %eax
; X86-LABEL: mul0_32:
; X86: xorl %eax, %eax
  %mul = mul i32 %A, 0
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i32 multiply by 4294967295, which is the all-ones 32-bit pattern (i.e. -1).
; Checked lowering on x86-64: negate the argument register, then copy it to
; the return register. The i686 output is not checked by this function.
define i32 @mul4294967295_32(i32 %A) {
; X64-LABEL: mul4294967295_32:
; X64: negl %edi
; X64-NEXT: movl %edi, %eax
  %mul = mul i32 %A, 4294967295
  ret i32 %mul
}
|
|
|
|
|
|
|
|
; i64 multiply by 18446744073709551615, which is the all-ones 64-bit pattern
; (i.e. -1).
; Checked lowering on x86-64: negate the argument register, then copy it to
; the return register. The i686 output is not checked by this function.
define i64 @mul18446744073709551615_64(i64 %A) {
; X64-LABEL: mul18446744073709551615_64:
; X64: negq %rdi
; X64-NEXT: movq %rdi, %rax
  %mul = mul i64 %A, 18446744073709551615
  ret i64 %mul
}
|
2017-01-18 17:31:13 +08:00
|
|
|
|
|
|
|
; i32 multiply by 31 (2^5 - 1) with the full instruction sequence checked.
; Both targets copy the argument, shift the copy left by 5 and subtract the
; original value; i686 first loads the argument from the stack.
define i32 @test(i32 %a) {
; X64-LABEL: test:
; X64: # BB#0: # %entry
; X64-NEXT: movl %edi, %eax
; X64-NEXT: shll $5, %eax
; X64-NEXT: subl %edi, %eax
; X64-NEXT: retq
;
; X86-LABEL: test:
; X86: # BB#0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: shll $5, %eax
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: retl
entry:
  %tmp3 = mul i32 %a, 31
  ret i32 %tmp3
}
|
|
|
|
|
|
|
|
; i32 multiply by -31, i.e. -(2^5 - 1), with the full sequence checked.
; Both targets use the same shift-by-5 and subtract as the +31 case and then
; negate the result.
define i32 @test1(i32 %a) {
; X64-LABEL: test1:
; X64: # BB#0: # %entry
; X64-NEXT: movl %edi, %eax
; X64-NEXT: shll $5, %eax
; X64-NEXT: subl %edi, %eax
; X64-NEXT: negl %eax
; X64-NEXT: retq
;
; X86-LABEL: test1:
; X86: # BB#0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: shll $5, %eax
; X86-NEXT: subl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: retl
entry:
  %tmp3 = mul i32 %a, -31
  ret i32 %tmp3
}
|
|
|
|
|
|
|
|
|
|
|
|
; i32 multiply by 33 (2^5 + 1) with the full sequence checked.
; Both targets shift a copy of the argument left by 5 and add the original
; value back; x86-64 performs the add with an leal, i686 with an addl.
define i32 @test2(i32 %a) {
; X64-LABEL: test2:
; X64: # BB#0: # %entry
; X64-NEXT: # kill: %EDI<def> %EDI<kill> %RDI<def>
; X64-NEXT: movl %edi, %eax
; X64-NEXT: shll $5, %eax
; X64-NEXT: leal (%rax,%rdi), %eax
; X64-NEXT: retq
;
; X86-LABEL: test2:
; X86: # BB#0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: shll $5, %eax
; X86-NEXT: addl %ecx, %eax
; X86-NEXT: retl
entry:
  %tmp3 = mul i32 %a, 33
  ret i32 %tmp3
}
|
|
|
|
|
|
|
|
; i32 multiply by -33, i.e. -(2^5 + 1), with the full sequence checked.
; Both targets use the same shift-by-5 and add as the +33 case (leal on
; x86-64, addl on i686) and then negate the result.
define i32 @test3(i32 %a) {
; X64-LABEL: test3:
; X64: # BB#0: # %entry
; X64-NEXT: # kill: %EDI<def> %EDI<kill> %RDI<def>
; X64-NEXT: movl %edi, %eax
; X64-NEXT: shll $5, %eax
; X64-NEXT: leal (%rax,%rdi), %eax
; X64-NEXT: negl %eax
; X64-NEXT: retq
;
; X86-LABEL: test3:
; X86: # BB#0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: shll $5, %eax
; X86-NEXT: addl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: retl
entry:
  %tmp3 = mul i32 %a, -33
  ret i32 %tmp3
}
|
|
|
|
|
|
|
|
; i64 multiply by 31 (2^5 - 1) with the full sequence checked.
; x86-64 shifts a copy left by 5 and subtracts the original value.
; i686 applies the shift-by-5 and subtract to one 32-bit word loaded from the
; stack, performs a widening mull by 31 on another stack word, and adds the
; shift/subtract result into %edx.
define i64 @test4(i64 %a) {
; X64-LABEL: test4:
; X64: # BB#0: # %entry
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: shlq $5, %rax
; X64-NEXT: subq %rdi, %rax
; X64-NEXT: retq
;
; X86-LABEL: test4:
; X86: # BB#0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: shll $5, %ecx
; X86-NEXT: subl %eax, %ecx
; X86-NEXT: movl $31, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: addl %ecx, %edx
; X86-NEXT: retl
entry:
  %tmp3 = mul i64 %a, 31
  ret i64 %tmp3
}
|
|
|
|
|
|
|
|
; i64 multiply by -31, i.e. -(2^5 - 1), with the full sequence checked.
; x86-64 shifts a copy left by 5, subtracts the original value and negates.
; i686 saves %esi, computes a shift-by-5 and subtract on one 32-bit word,
; does a widening mull by -31 on the other word, and subtracts both the
; multiplied word and the shift/subtract result from %edx.
;
; The .Lcfi label numbers are matched with a regex rather than spelled out:
; the literal numbers depend on how many such labels earlier functions in
; this file produce, so hard-coding them makes the test order-sensitive.
define i64 @test5(i64 %a) {
; X64-LABEL: test5:
; X64: # BB#0: # %entry
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: shlq $5, %rax
; X64-NEXT: subq %rdi, %rax
; X64-NEXT: negq %rax
; X64-NEXT: retq
;
; X86-LABEL: test5:
; X86: # BB#0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: .Lcfi{{[0-9]+}}:
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: .Lcfi{{[0-9]+}}:
; X86-NEXT: .cfi_offset %esi, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl %eax, %esi
; X86-NEXT: shll $5, %esi
; X86-NEXT: subl %eax, %esi
; X86-NEXT: movl $-31, %edx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull %edx
; X86-NEXT: subl %ecx, %edx
; X86-NEXT: subl %esi, %edx
; X86-NEXT: popl %esi
; X86-NEXT: retl
entry:
  %tmp3 = mul i64 %a, -31
  ret i64 %tmp3
}
|
|
|
|
|
|
|
|
|
|
|
|
; i64 multiply by 33 (2^5 + 1) with the full sequence checked.
; x86-64 shifts a copy left by 5 and adds the original value with an leaq.
; i686 applies the shift-by-5 and add to one 32-bit word loaded from the
; stack, performs a widening mull by 33 on another stack word, and adds the
; shift/add result into %edx.
define i64 @test6(i64 %a) {
; X64-LABEL: test6:
; X64: # BB#0: # %entry
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: shlq $5, %rax
; X64-NEXT: leaq (%rax,%rdi), %rax
; X64-NEXT: retq
;
; X86-LABEL: test6:
; X86: # BB#0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: shll $5, %ecx
; X86-NEXT: addl %eax, %ecx
; X86-NEXT: movl $33, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: addl %ecx, %edx
; X86-NEXT: retl
entry:
  %tmp3 = mul i64 %a, 33
  ret i64 %tmp3
}
|
|
|
|
|
|
|
|
; i64 multiply by -33, i.e. -(2^5 + 1), with the full sequence checked.
; x86-64 shifts a copy left by 5, adds the original value with an leaq and
; negates. i686 saves %esi, computes a shift-by-5 and add on one 32-bit word,
; does a widening mull by -33 on the other word, and subtracts both the
; multiplied word and the shift/add result from %edx.
;
; The .Lcfi label numbers are matched with a regex rather than spelled out:
; the literal numbers depend on how many such labels earlier functions in
; this file produce, so hard-coding them makes the test order-sensitive.
define i64 @test7(i64 %a) {
; X64-LABEL: test7:
; X64: # BB#0: # %entry
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: shlq $5, %rax
; X64-NEXT: leaq (%rax,%rdi), %rax
; X64-NEXT: negq %rax
; X64-NEXT: retq
;
; X86-LABEL: test7:
; X86: # BB#0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: .Lcfi{{[0-9]+}}:
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: .Lcfi{{[0-9]+}}:
; X86-NEXT: .cfi_offset %esi, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl %eax, %esi
; X86-NEXT: shll $5, %esi
; X86-NEXT: addl %eax, %esi
; X86-NEXT: movl $-33, %edx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull %edx
; X86-NEXT: subl %ecx, %edx
; X86-NEXT: subl %esi, %edx
; X86-NEXT: popl %esi
; X86-NEXT: retl
entry:
  %tmp3 = mul i64 %a, -33
  ret i64 %tmp3
}
|
|
|
|
|
|
|
|
; i64 multiply by 9223372036854775807 (2^63 - 1, the largest positive i64).
; x86-64 is checked to materialize the constant with movabsq and use a real
; imulq rather than a shift/subtract pair.
; NOTE(review): judging by the name, this presumably guards the
; multiply-to-shift conversion against overflow when it forms constant + 1
; for this value -- confirm against the lowering code.
; i686 is checked for a widening mull by -1 plus a shift-by-31 and subtract on
; a copy of the loaded word, combined into %edx.
;
; The .Lcfi label numbers are matched with a regex rather than spelled out:
; the literal numbers depend on how many such labels earlier functions in
; this file produce, so hard-coding them makes the test order-sensitive.
define i64 @testOverflow(i64 %a) {
; X64-LABEL: testOverflow:
; X64: # BB#0: # %entry
; X64-NEXT: movabsq $9223372036854775807, %rax # imm = 0x7FFFFFFFFFFFFFFF
; X64-NEXT: imulq %rdi, %rax
; X64-NEXT: retq
;
; X86-LABEL: testOverflow:
; X86: # BB#0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: .Lcfi{{[0-9]+}}:
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: .Lcfi{{[0-9]+}}:
; X86-NEXT: .cfi_offset %esi, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl $-1, %edx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull %edx
; X86-NEXT: movl %ecx, %esi
; X86-NEXT: shll $31, %esi
; X86-NEXT: subl %ecx, %esi
; X86-NEXT: addl %esi, %edx
; X86-NEXT: subl {{[0-9]+}}(%esp), %edx
; X86-NEXT: popl %esi
; X86-NEXT: retl
entry:
  %tmp3 = mul i64 %a, 9223372036854775807
  ret i64 %tmp3
}
|