; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-linux | FileCheck %s --check-prefix=X64
; RUN: llc < %s -mtriple=i686 -mattr=cmov | FileCheck %s --check-prefix=X86

; Codegen test for the llvm.smul.fix.* intrinsics on x86-64 and i686.
; Each function below calls one overload with a constant scale (the third
; operand) and the expected assembly for both RUN lines is pinned by the
; autogenerated check lines.

; Overloads exercised by this file: a non-power-of-two-byte scalar (i4),
; native scalars (i32, i64) and a 4 x i32 vector.
declare i4 @llvm.smul.fix.i4 (i4, i4, i32)
declare i32 @llvm.smul.fix.i32 (i32, i32, i32)
declare i64 @llvm.smul.fix.i64 (i64, i64, i32)
declare <4 x i32> @llvm.smul.fix.v4i32(<4 x i32>, <4 x i32>, i32)

; i32 smul.fix with scale 2.
; Expected x86-64 code sign-extends both operands to 64 bits, multiplies,
; then assembles the result from the product shifted right by 2 (shrq/shldl).
; Expected i686 code uses the widening one-operand imull and a single
; shrdl $2 across edx:eax.
define i32 @func(i32 %x, i32 %y) nounwind {
; X64-LABEL: func:
; X64: # %bb.0:
; X64-NEXT: movslq %esi, %rax
; X64-NEXT: movslq %edi, %rcx
; X64-NEXT: imulq %rax, %rcx
; X64-NEXT: movq %rcx, %rax
; X64-NEXT: shrq $32, %rax
; X64-NEXT: shldl $30, %ecx, %eax
; X64-NEXT: # kill: def $eax killed $eax killed $rax
; X64-NEXT: retq
;
; X86-LABEL: func:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: imull {{[0-9]+}}(%esp)
; X86-NEXT: shrdl $2, %edx, %eax
; X86-NEXT: retl
  %tmp = call i32 @llvm.smul.fix.i32(i32 %x, i32 %y, i32 2)
  ret i32 %tmp
}

; i64 smul.fix with scale 2.
; Expected x86-64 code is a widening imulq followed by shrdq $2 across
; rdx:rax. On i686 the 64-bit multiply is expanded into 32-bit mull/imull
; pieces with cmov-based sign corrections, then shifted with two shldl $30.
; NOTE: unlike most functions in this file this one carries no nounwind
; attribute, consistent with the .cfi_* directives in the i686 check lines.
; Adding the attribute would require regenerating the assertions.
define i64 @func2(i64 %x, i64 %y) {
; X64-LABEL: func2:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: imulq %rsi
; X64-NEXT: shrdq $2, %rdx, %rax
; X64-NEXT: retq
;
; X86-LABEL: func2:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: pushl %ebx
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: pushl %edi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: pushl %esi
; X86-NEXT: .cfi_def_cfa_offset 20
; X86-NEXT: .cfi_offset %esi, -20
; X86-NEXT: .cfi_offset %edi, -16
; X86-NEXT: .cfi_offset %ebx, -12
; X86-NEXT: .cfi_offset %ebp, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ebx, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %esi
; X86-NEXT: movl %eax, %edi
; X86-NEXT: movl %ebx, %eax
; X86-NEXT: mull %ecx
; X86-NEXT: movl %eax, %ebx
; X86-NEXT: movl %edx, %ebp
; X86-NEXT: addl %edi, %ebp
; X86-NEXT: movl {{[0-9]+}}(%esp), %edi
; X86-NEXT: adcl $0, %esi
; X86-NEXT: movl %edi, %eax
; X86-NEXT: mull %ecx
; X86-NEXT: addl %ebp, %eax
; X86-NEXT: adcl %esi, %edx
; X86-NEXT: movl %edi, %esi
; X86-NEXT: imull {{[0-9]+}}(%esp), %esi
; X86-NEXT: addl %edx, %esi
; X86-NEXT: movl %esi, %ebp
; X86-NEXT: subl %ecx, %ebp
; X86-NEXT: testl %edi, %edi
; X86-NEXT: cmovnsl %esi, %ebp
; X86-NEXT: movl %ebp, %edx
; X86-NEXT: subl {{[0-9]+}}(%esp), %edx
; X86-NEXT: cmpl $0, {{[0-9]+}}(%esp)
; X86-NEXT: cmovnsl %ebp, %edx
; X86-NEXT: shldl $30, %eax, %edx
; X86-NEXT: shldl $30, %ebx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: popl %edi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: popl %ebx
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: popl %ebp
; X86-NEXT: .cfi_def_cfa_offset 4
; X86-NEXT: retl
  %tmp = call i64 @llvm.smul.fix.i64(i64 %x, i64 %y, i32 2)
  ret i64 %tmp
}

; i4 smul.fix with scale 2 (a type narrower than any x86 register).
; Both targets first sign-extend each operand from 4 bits with a
; shlb $4 / sarb $4 pair, multiply in 32 bits, and then combine the low
; byte shifted right by 2 with the next byte shifted left by 6.
define i4 @func3(i4 %x, i4 %y) nounwind {
; X64-LABEL: func3:
; X64: # %bb.0:
; X64-NEXT: shlb $4, %dil
; X64-NEXT: sarb $4, %dil
; X64-NEXT: shlb $4, %sil
; X64-NEXT: sarb $4, %sil
; X64-NEXT: movsbl %sil, %ecx
; X64-NEXT: movsbl %dil, %eax
; X64-NEXT: imull %ecx, %eax
; X64-NEXT: movl %eax, %ecx
; X64-NEXT: shrb $2, %cl
; X64-NEXT: shrl $8, %eax
; X64-NEXT: shlb $6, %al
; X64-NEXT: orb %cl, %al
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: retq
;
; X86-LABEL: func3:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %al
; X86-NEXT: shlb $4, %al
; X86-NEXT: sarb $4, %al
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: shlb $4, %cl
; X86-NEXT: sarb $4, %cl
; X86-NEXT: movsbl %cl, %ecx
; X86-NEXT: movsbl %al, %eax
; X86-NEXT: imull %ecx, %eax
; X86-NEXT: shlb $6, %ah
; X86-NEXT: shrb $2, %al
; X86-NEXT: orb %ah, %al
; X86-NEXT: # kill: def $al killed $al killed $eax
; X86-NEXT: retl
  %tmp = call i4 @llvm.smul.fix.i4(i4 %x, i4 %y, i32 2)
  ret i4 %tmp
}

; <4 x i32> smul.fix with scale 2.
; Expected x86-64 code stays in SSE registers: unsigned pmuludq products
; plus a pcmpgtd/pand/paddd/psubd sign correction of the high halves, then
; pslld $30 / psrld $2 / por to merge high and low parts.
; Expected i686 code is scalar: four widening imull + shldl $30 sequences,
; with the result stored through the pointer held in ecx (note retl $4).
define <4 x i32> @vec(<4 x i32> %x, <4 x i32> %y) nounwind {
; X64-LABEL: vec:
; X64: # %bb.0:
; X64-NEXT: pxor %xmm2, %xmm2
; X64-NEXT: pxor %xmm3, %xmm3
; X64-NEXT: pcmpgtd %xmm1, %xmm3
; X64-NEXT: pand %xmm0, %xmm3
; X64-NEXT: pcmpgtd %xmm0, %xmm2
; X64-NEXT: pand %xmm1, %xmm2
; X64-NEXT: paddd %xmm3, %xmm2
; X64-NEXT: pshufd {{.*#+}} xmm3 = xmm0[1,1,3,3]
; X64-NEXT: pmuludq %xmm1, %xmm0
; X64-NEXT: pshufd {{.*#+}} xmm4 = xmm0[1,3,2,3]
; X64-NEXT: pshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
; X64-NEXT: pmuludq %xmm3, %xmm1
; X64-NEXT: pshufd {{.*#+}} xmm3 = xmm1[1,3,2,3]
; X64-NEXT: punpckldq {{.*#+}} xmm4 = xmm4[0],xmm3[0],xmm4[1],xmm3[1]
; X64-NEXT: psubd %xmm2, %xmm4
; X64-NEXT: pslld $30, %xmm4
; X64-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
; X64-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,2,2,3]
; X64-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; X64-NEXT: psrld $2, %xmm0
; X64-NEXT: por %xmm4, %xmm0
; X64-NEXT: retq
;
; X86-LABEL: vec:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %edi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: imull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %ebp
; X86-NEXT: shldl $30, %eax, %ebp
; X86-NEXT: movl %ebx, %eax
; X86-NEXT: imull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %ebx
; X86-NEXT: shldl $30, %eax, %ebx
; X86-NEXT: movl %edi, %eax
; X86-NEXT: imull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %edi
; X86-NEXT: shldl $30, %eax, %edi
; X86-NEXT: movl %esi, %eax
; X86-NEXT: imull {{[0-9]+}}(%esp)
; X86-NEXT: shldl $30, %eax, %edx
; X86-NEXT: movl %edx, 12(%ecx)
; X86-NEXT: movl %edi, 8(%ecx)
; X86-NEXT: movl %ebx, 4(%ecx)
; X86-NEXT: movl %ebp, (%ecx)
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl $4
  %tmp = call <4 x i32> @llvm.smul.fix.v4i32(<4 x i32> %x, <4 x i32> %y, i32 2)
  ret <4 x i32> %tmp
}

; These result in regular integer multiplication

; i32 smul.fix with scale 0: no shift is needed, so both targets are
; expected to emit a single two-operand imull.
define i32 @func4(i32 %x, i32 %y) nounwind {
; X64-LABEL: func4:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: imull %esi, %eax
; X64-NEXT: retq
;
; X86-LABEL: func4:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: imull {{[0-9]+}}(%esp), %eax
; X86-NEXT: retl
  %tmp = call i32 @llvm.smul.fix.i32(i32 %x, i32 %y, i32 0)
  ret i32 %tmp
}

; i64 smul.fix with scale 0: a plain 64-bit multiply.
; Expected x86-64 code is one imulq; i686 builds the low 64 bits of the
; product from one mull and two imull cross terms.
; NOTE: no nounwind attribute here, consistent with the .cfi_* directives
; in the i686 check lines. Adding it would require regenerating the
; assertions.
define i64 @func5(i64 %x, i64 %y) {
; X64-LABEL: func5:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: imulq %rsi, %rax
; X64-NEXT: retq
;
; X86-LABEL: func5:
; X86: # %bb.0:
; X86-NEXT: pushl %esi
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: .cfi_offset %esi, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull %esi
; X86-NEXT: imull {{[0-9]+}}(%esp), %ecx
; X86-NEXT: addl %ecx, %edx
; X86-NEXT: imull {{[0-9]+}}(%esp), %esi
; X86-NEXT: addl %esi, %edx
; X86-NEXT: popl %esi
; X86-NEXT: .cfi_def_cfa_offset 4
; X86-NEXT: retl
  %tmp = call i64 @llvm.smul.fix.i64(i64 %x, i64 %y, i32 0)
  ret i64 %tmp
}

; i4 smul.fix with scale 0.
; The operands are still sign-extended from 4 bits (shlb $4 / sarb $4),
; but the multiply itself is a single 8-bit mulb with no trailing shift.
define i4 @func6(i4 %x, i4 %y) nounwind {
; X64-LABEL: func6:
; X64: # %bb.0:
; X64-NEXT: movl %edi, %eax
; X64-NEXT: shlb $4, %al
; X64-NEXT: sarb $4, %al
; X64-NEXT: shlb $4, %sil
; X64-NEXT: sarb $4, %sil
; X64-NEXT: # kill: def $al killed $al killed $eax
; X64-NEXT: mulb %sil
; X64-NEXT: retq
;
; X86-LABEL: func6:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %al
; X86-NEXT: shlb $4, %al
; X86-NEXT: sarb $4, %al
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: shlb $4, %cl
; X86-NEXT: sarb $4, %cl
; X86-NEXT: mulb %cl
; X86-NEXT: retl
  %tmp = call i4 @llvm.smul.fix.i4(i4 %x, i4 %y, i32 0)
  ret i4 %tmp
}

; <4 x i32> smul.fix with scale 0: an element-wise 32-bit multiply.
; Expected x86-64 code uses the pmuludq/pshufd/punpckldq sequence and
; keeps only the low halves; i686 uses four scalar imull instructions and
; stores the lanes through the pointer held in eax (note retl $4).
define <4 x i32> @vec2(<4 x i32> %x, <4 x i32> %y) nounwind {
; X64-LABEL: vec2:
; X64: # %bb.0:
; X64-NEXT: pshufd {{.*#+}} xmm2 = xmm0[1,1,3,3]
; X64-NEXT: pmuludq %xmm1, %xmm0
; X64-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
; X64-NEXT: pshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
; X64-NEXT: pmuludq %xmm2, %xmm1
; X64-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,2,2,3]
; X64-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; X64-NEXT: retq
;
; X86-LABEL: vec2:
; X86: # %bb.0:
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %edx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %edi
; X86-NEXT: imull {{[0-9]+}}(%esp), %edi
; X86-NEXT: imull {{[0-9]+}}(%esp), %esi
; X86-NEXT: imull {{[0-9]+}}(%esp), %edx
; X86-NEXT: imull {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, 12(%eax)
; X86-NEXT: movl %edx, 8(%eax)
; X86-NEXT: movl %esi, 4(%eax)
; X86-NEXT: movl %edi, (%eax)
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: retl $4
  %tmp = call <4 x i32> @llvm.smul.fix.v4i32(<4 x i32> %x, <4 x i32> %y, i32 0)
  ret <4 x i32> %tmp
}

; i64 smul.fix with scale 32 (exactly half the operand width).
; Expected x86-64 code is a widening imulq plus shrdq $32. On i686 the
; shift is a whole 32-bit word, so the expected output contains no
; shld/shrd at all: the expanded multiply leaves the result words directly
; in eax and edx after the cmov-based sign corrections.
define i64 @func7(i64 %x, i64 %y) nounwind {
; X64-LABEL: func7:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: imulq %rsi
; X64-NEXT: shrdq $32, %rdx, %rax
; X64-NEXT: retq
;
; X86-LABEL: func7:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ebp
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %edi
; X86-NEXT: movl %eax, %ebx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull %ebp
; X86-NEXT: addl %edx, %ebx
; X86-NEXT: adcl $0, %edi
; X86-NEXT: movl %esi, %eax
; X86-NEXT: mull %ebp
; X86-NEXT: addl %ebx, %eax
; X86-NEXT: adcl %edi, %edx
; X86-NEXT: movl %esi, %edi
; X86-NEXT: imull {{[0-9]+}}(%esp), %edi
; X86-NEXT: addl %edx, %edi
; X86-NEXT: movl %edi, %ebx
; X86-NEXT: subl %ebp, %ebx
; X86-NEXT: testl %esi, %esi
; X86-NEXT: cmovnsl %edi, %ebx
; X86-NEXT: movl %ebx, %edx
; X86-NEXT: subl %ecx, %edx
; X86-NEXT: cmpl $0, {{[0-9]+}}(%esp)
; X86-NEXT: cmovnsl %ebx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl
  %tmp = call i64 @llvm.smul.fix.i64(i64 %x, i64 %y, i32 32)
  ret i64 %tmp
}

; i64 smul.fix with scale 63 (one less than the operand width).
; Expected x86-64 code is a widening imulq plus shrdq $63. On i686 the
; multiply is expanded into 32-bit pieces with sbbl/cmov sign corrections
; on the upper words, and the final result is formed with shldl $1 and
; shrdl $31.
define i64 @func8(i64 %x, i64 %y) nounwind {
; X64-LABEL: func8:
; X64: # %bb.0:
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: imulq %rsi
; X64-NEXT: shrdq $63, %rdx, %rax
; X64-NEXT: retq
;
; X86-LABEL: func8:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %edi
; X86-NEXT: movl %eax, %ebx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: addl %edx, %ebx
; X86-NEXT: adcl $0, %edi
; X86-NEXT: movl %esi, %eax
; X86-NEXT: imull {{[0-9]+}}(%esp)
; X86-NEXT: movl %edx, %ebp
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: movl %esi, %eax
; X86-NEXT: mull {{[0-9]+}}(%esp)
; X86-NEXT: addl %ebx, %eax
; X86-NEXT: adcl %edi, %edx
; X86-NEXT: adcl $0, %ebp
; X86-NEXT: addl %ecx, %edx
; X86-NEXT: adcl $0, %ebp
; X86-NEXT: movl %edx, %ecx
; X86-NEXT: subl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ebp, %esi
; X86-NEXT: sbbl $0, %esi
; X86-NEXT: cmpl $0, {{[0-9]+}}(%esp)
; X86-NEXT: cmovnsl %ebp, %esi
; X86-NEXT: cmovnsl %edx, %ecx
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: subl {{[0-9]+}}(%esp), %edi
; X86-NEXT: movl %esi, %edx
; X86-NEXT: sbbl $0, %edx
; X86-NEXT: cmpl $0, {{[0-9]+}}(%esp)
; X86-NEXT: cmovnsl %esi, %edx
; X86-NEXT: cmovnsl %ecx, %edi
; X86-NEXT: shldl $1, %edi, %edx
; X86-NEXT: shrdl $31, %edi, %eax
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl
  %tmp = call i64 @llvm.smul.fix.i64(i64 %x, i64 %y, i32 63)
  ret i64 %tmp
}