; llvm-project/llvm/test/CodeGen/X86/rotate4.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown-unknown | FileCheck %s --check-prefixes=X86
; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s --check-prefixes=X64

; Check that we recognize this idiom for rotation too:
; a << (b & (OpSize-1)) | a >> ((0 - b) & (OpSize-1))
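; For reference, a rough C-level sketch of where the left-rotate form of this
; idiom typically comes from (illustrative only; the function name and the
; fixed 32-bit width are assumptions, and this snippet is not part of the
; generated checks):
;
;   #include <stdint.h>
;   uint32_t rotl32(uint32_t a, uint32_t b) {
;     return (a << (b & 31)) | (a >> ((0u - b) & 31));
;   }
;
; The right-rotate tests below use the same pattern with the shift directions
; swapped.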
define i32 @rotate_left_32(i32 %a, i32 %b) {
; X86-LABEL: rotate_left_32:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: roll %cl, %eax
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_32:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: roll %cl, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%and = and i32 %b, 31
%shl = shl i32 %a, %and
%t0 = sub i32 0, %b
%and3 = and i32 %t0, 31
%shr = lshr i32 %a, %and3
%or = or i32 %shl, %shr
ret i32 %or
}

define i32 @rotate_right_32(i32 %a, i32 %b) {
; X86-LABEL: rotate_right_32:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rorl %cl, %eax
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_32:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorl %cl, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%and = and i32 %b, 31
%shl = lshr i32 %a, %and
%t0 = sub i32 0, %b
%and3 = and i32 %t0, 31
%shr = shl i32 %a, %and3
%or = or i32 %shl, %shr
ret i32 %or
}

define i64 @rotate_left_64(i64 %a, i64 %b) {
; X86-LABEL: rotate_left_64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: pushl %edi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: pushl %esi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: .cfi_offset %esi, -16
; X86-NEXT: .cfi_offset %edi, -12
; X86-NEXT: .cfi_offset %ebx, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %edi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %esi, %eax
; X86-NEXT: shll %cl, %eax
; X86-NEXT: movl %edi, %edx
; X86-NEXT: shldl %cl, %esi, %edx
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB2_2
; X86-NEXT: # %bb.1:
; X86-NEXT: movl %eax, %edx
; X86-NEXT: xorl %eax, %eax
; X86-NEXT: .LBB2_2:
; X86-NEXT: negl %ecx
; X86-NEXT: movl %edi, %ebx
; X86-NEXT: shrl %cl, %ebx
; X86-NEXT: shrdl %cl, %edi, %esi
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB2_4
; X86-NEXT: # %bb.3:
; X86-NEXT: movl %ebx, %esi
; X86-NEXT: xorl %ebx, %ebx
; X86-NEXT: .LBB2_4:
; X86-NEXT: orl %ebx, %edx
; X86-NEXT: orl %esi, %eax
; X86-NEXT: popl %esi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: popl %edi
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: popl %ebx
; X86-NEXT: .cfi_def_cfa_offset 4
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_64:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rolq %cl, %rdi
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: retq
%and = and i64 %b, 63
%shl = shl i64 %a, %and
%t0 = sub i64 0, %b
%and3 = and i64 %t0, 63
%shr = lshr i64 %a, %and3
%or = or i64 %shl, %shr
ret i64 %or
}

define i64 @rotate_right_64(i64 %a, i64 %b) {
; X86-LABEL: rotate_right_64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebx
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: pushl %edi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: pushl %esi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: .cfi_offset %esi, -16
; X86-NEXT: .cfi_offset %edi, -12
; X86-NEXT: .cfi_offset %ebx, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %edi
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %esi, %edx
; X86-NEXT: shrl %cl, %edx
; X86-NEXT: movl %edi, %eax
; X86-NEXT: shrdl %cl, %esi, %eax
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB3_2
; X86-NEXT: # %bb.1:
; X86-NEXT: movl %edx, %eax
; X86-NEXT: xorl %edx, %edx
; X86-NEXT: .LBB3_2:
; X86-NEXT: negl %ecx
; X86-NEXT: movl %edi, %ebx
; X86-NEXT: shll %cl, %ebx
; X86-NEXT: shldl %cl, %edi, %esi
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB3_4
; X86-NEXT: # %bb.3:
; X86-NEXT: movl %ebx, %esi
; X86-NEXT: xorl %ebx, %ebx
; X86-NEXT: .LBB3_4:
; X86-NEXT: orl %esi, %edx
; X86-NEXT: orl %ebx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: popl %edi
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: popl %ebx
; X86-NEXT: .cfi_def_cfa_offset 4
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_64:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorq %cl, %rdi
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: retq
%and = and i64 %b, 63
%shl = lshr i64 %a, %and
%t0 = sub i64 0, %b
%and3 = and i64 %t0, 63
%shr = shl i64 %a, %and3
%or = or i64 %shl, %shr
ret i64 %or
}

; Also check the memory operand forms.
define void @rotate_left_m32(i32 *%pa, i32 %b) {
; X86-LABEL: rotate_left_m32:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: roll %cl, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_m32:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: roll %cl, (%rdi)
; X64-NEXT: retq
%a = load i32, i32* %pa, align 16
%and = and i32 %b, 31
%shl = shl i32 %a, %and
%t0 = sub i32 0, %b
%and3 = and i32 %t0, 31
%shr = lshr i32 %a, %and3
%or = or i32 %shl, %shr
store i32 %or, i32* %pa, align 32
ret void
}

define void @rotate_right_m32(i32 *%pa, i32 %b) {
; X86-LABEL: rotate_right_m32:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rorl %cl, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_m32:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorl %cl, (%rdi)
; X64-NEXT: retq
%a = load i32, i32* %pa, align 16
%and = and i32 %b, 31
%shl = lshr i32 %a, %and
%t0 = sub i32 0, %b
%and3 = and i32 %t0, 31
%shr = shl i32 %a, %and3
%or = or i32 %shl, %shr
store i32 %or, i32* %pa, align 32
ret void
}

define void @rotate_left_m64(i64 *%pa, i64 %b) {
; X86-LABEL: rotate_left_m64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: pushl %ebx
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: pushl %edi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: pushl %esi
; X86-NEXT: .cfi_def_cfa_offset 20
; X86-NEXT: .cfi_offset %esi, -20
; X86-NEXT: .cfi_offset %edi, -16
; X86-NEXT: .cfi_offset %ebx, -12
; X86-NEXT: .cfi_offset %ebp, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl (%eax), %edx
; X86-NEXT: movl 4(%eax), %ebx
; X86-NEXT: movl %edx, %esi
; X86-NEXT: shll %cl, %esi
; X86-NEXT: movl %ebx, %edi
; X86-NEXT: shldl %cl, %edx, %edi
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB6_2
; X86-NEXT: # %bb.1:
; X86-NEXT: movl %esi, %edi
; X86-NEXT: xorl %esi, %esi
; X86-NEXT: .LBB6_2:
; X86-NEXT: negl %ecx
; X86-NEXT: movl %ebx, %ebp
; X86-NEXT: shrl %cl, %ebp
; X86-NEXT: shrdl %cl, %ebx, %edx
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB6_4
; X86-NEXT: # %bb.3:
; X86-NEXT: movl %ebp, %edx
; X86-NEXT: xorl %ebp, %ebp
; X86-NEXT: .LBB6_4:
; X86-NEXT: orl %ebp, %edi
; X86-NEXT: orl %edx, %esi
; X86-NEXT: movl %edi, 4(%eax)
; X86-NEXT: movl %esi, (%eax)
; X86-NEXT: popl %esi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: popl %edi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: popl %ebx
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: popl %ebp
; X86-NEXT: .cfi_def_cfa_offset 4
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_m64:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rolq %cl, (%rdi)
; X64-NEXT: retq
%a = load i64, i64* %pa, align 16
%and = and i64 %b, 63
%shl = shl i64 %a, %and
%t0 = sub i64 0, %b
%and3 = and i64 %t0, 63
%shr = lshr i64 %a, %and3
%or = or i64 %shl, %shr
store i64 %or, i64* %pa, align 64
ret void
}

define void @rotate_right_m64(i64 *%pa, i64 %b) {
; X86-LABEL: rotate_right_m64:
; X86: # %bb.0:
; X86-NEXT: pushl %ebp
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: pushl %ebx
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: pushl %edi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: pushl %esi
; X86-NEXT: .cfi_def_cfa_offset 20
; X86-NEXT: .cfi_offset %esi, -20
; X86-NEXT: .cfi_offset %edi, -16
; X86-NEXT: .cfi_offset %ebx, -12
; X86-NEXT: .cfi_offset %ebp, -8
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl (%eax), %ebx
; X86-NEXT: movl 4(%eax), %edx
; X86-NEXT: movl %edx, %esi
; X86-NEXT: shrl %cl, %esi
; X86-NEXT: movl %ebx, %edi
; X86-NEXT: shrdl %cl, %edx, %edi
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB7_2
; X86-NEXT: # %bb.1:
; X86-NEXT: movl %esi, %edi
; X86-NEXT: xorl %esi, %esi
; X86-NEXT: .LBB7_2:
; X86-NEXT: negl %ecx
; X86-NEXT: movl %ebx, %ebp
; X86-NEXT: shll %cl, %ebp
; X86-NEXT: shldl %cl, %ebx, %edx
; X86-NEXT: testb $32, %cl
; X86-NEXT: je .LBB7_4
; X86-NEXT: # %bb.3:
; X86-NEXT: movl %ebp, %edx
; X86-NEXT: xorl %ebp, %ebp
; X86-NEXT: .LBB7_4:
; X86-NEXT: orl %edx, %esi
; X86-NEXT: orl %ebp, %edi
; X86-NEXT: movl %esi, 4(%eax)
; X86-NEXT: movl %edi, (%eax)
; X86-NEXT: popl %esi
; X86-NEXT: .cfi_def_cfa_offset 16
; X86-NEXT: popl %edi
; X86-NEXT: .cfi_def_cfa_offset 12
; X86-NEXT: popl %ebx
; X86-NEXT: .cfi_def_cfa_offset 8
; X86-NEXT: popl %ebp
; X86-NEXT: .cfi_def_cfa_offset 4
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_m64:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorq %cl, (%rdi)
; X64-NEXT: retq
%a = load i64, i64* %pa, align 16
%and = and i64 %b, 63
%shl = lshr i64 %a, %and
%t0 = sub i64 0, %b
%and3 = and i64 %t0, 63
%shr = shl i64 %a, %and3
%or = or i64 %shl, %shr
store i64 %or, i64* %pa, align 64
ret void
}

; The next 8 tests include masks of the narrow-width shift amounts; those masks should be eliminated.
; These patterns are produced by instcombine after r310509.
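; For reference, a rough C-level sketch of the masked narrow-width form
; (illustrative only; the function name, the 8-bit width, and the unsigned
; types are assumptions, and this snippet is not part of the generated checks):
;
;   #include <stdint.h>
;   uint8_t rotl8(uint8_t x, unsigned amount) {
;     uint8_t amt = (uint8_t)amount;     /* trunc i32 %amount to i8 */
;     uint8_t neg = (uint8_t)(0 - amt);  /* sub i8 0, %amt */
;     return (uint8_t)((x << (amt & 7)) | (x >> (neg & 7)));
;   }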
define i8 @rotate_left_8(i8 %x, i32 %amount) {
; X86-LABEL: rotate_left_8:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movb {{[0-9]+}}(%esp), %al
; X86-NEXT: rolb %cl, %al
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_8:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rolb %cl, %dil
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%amt = trunc i32 %amount to i8
%sub = sub i8 0, %amt
%maskamt = and i8 %amt, 7
%masksub = and i8 %sub, 7
%shl = shl i8 %x, %maskamt
%shr = lshr i8 %x, %masksub
%or = or i8 %shl, %shr
ret i8 %or
}

define i8 @rotate_right_8(i8 %x, i32 %amount) {
; X86-LABEL: rotate_right_8:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movb {{[0-9]+}}(%esp), %al
; X86-NEXT: rorb %cl, %al
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_8:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorb %cl, %dil
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%amt = trunc i32 %amount to i8
%sub = sub i8 0, %amt
%maskamt = and i8 %amt, 7
%masksub = and i8 %sub, 7
%shr = lshr i8 %x, %maskamt
%shl = shl i8 %x, %masksub
%or = or i8 %shr, %shl
ret i8 %or
}

define i16 @rotate_left_16(i16 %x, i32 %amount) {
; X86-LABEL: rotate_left_16:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rolw %cl, %ax
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_16:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rolw %cl, %di
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%amt = trunc i32 %amount to i16
%sub = sub i16 0, %amt
%maskamt = and i16 %amt, 15
%masksub = and i16 %sub, 15
%shl = shl i16 %x, %maskamt
%shr = lshr i16 %x, %masksub
%or = or i16 %shl, %shr
ret i16 %or
}

define i16 @rotate_right_16(i16 %x, i32 %amount) {
; X86-LABEL: rotate_right_16:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rorw %cl, %ax
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_16:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorw %cl, %di
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%amt = trunc i32 %amount to i16
%sub = sub i16 0, %amt
%maskamt = and i16 %amt, 15
%masksub = and i16 %sub, 15
%shr = lshr i16 %x, %maskamt
%shl = shl i16 %x, %masksub
%or = or i16 %shr, %shl
ret i16 %or
}

define void @rotate_left_m8(i8* %p, i32 %amount) {
; X86-LABEL: rotate_left_m8:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rolb %cl, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_m8:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rolb %cl, (%rdi)
; X64-NEXT: retq
%x = load i8, i8* %p, align 1
%amt = trunc i32 %amount to i8
%sub = sub i8 0, %amt
%maskamt = and i8 %amt, 7
%masksub = and i8 %sub, 7
%shl = shl i8 %x, %maskamt
%shr = lshr i8 %x, %masksub
%or = or i8 %shl, %shr
store i8 %or, i8* %p, align 1
ret void
}

define void @rotate_right_m8(i8* %p, i32 %amount) {
; X86-LABEL: rotate_right_m8:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rorb %cl, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_m8:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorb %cl, (%rdi)
; X64-NEXT: retq
%x = load i8, i8* %p, align 1
%amt = trunc i32 %amount to i8
%sub = sub i8 0, %amt
%maskamt = and i8 %amt, 7
%masksub = and i8 %sub, 7
%shl = shl i8 %x, %masksub
%shr = lshr i8 %x, %maskamt
%or = or i8 %shl, %shr
store i8 %or, i8* %p, align 1
ret void
}

define void @rotate_left_m16(i16* %p, i32 %amount) {
; X86-LABEL: rotate_left_m16:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rolw %cl, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: rotate_left_m16:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rolw %cl, (%rdi)
; X64-NEXT: retq
%x = load i16, i16* %p, align 1
%amt = trunc i32 %amount to i16
%sub = sub i16 0, %amt
%maskamt = and i16 %amt, 15
%masksub = and i16 %sub, 15
%shl = shl i16 %x, %maskamt
%shr = lshr i16 %x, %masksub
%or = or i16 %shl, %shr
store i16 %or, i16* %p, align 1
ret void
}

define void @rotate_right_m16(i16* %p, i32 %amount) {
; X86-LABEL: rotate_right_m16:
; X86: # %bb.0:
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: rorw %cl, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: rotate_right_m16:
; X64: # %bb.0:
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: rorw %cl, (%rdi)
; X64-NEXT: retq
%x = load i16, i16* %p, align 1
%amt = trunc i32 %amount to i16
%sub = sub i16 0, %amt
%maskamt = and i16 %amt, 15
%masksub = and i16 %sub, 15
%shl = shl i16 %x, %masksub
%shr = lshr i16 %x, %maskamt
%or = or i16 %shl, %shr
store i16 %or, i16* %p, align 1
ret void
}

define i32 @rotate_demanded_bits(i32, i32) {
; X86-LABEL: rotate_demanded_bits:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: andb $30, %cl
; X86-NEXT: roll %cl, %eax
; X86-NEXT: retl
;
; X64-LABEL: rotate_demanded_bits:
; X64: # %bb.0:
; X64-NEXT: andb $30, %sil
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: roll %cl, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%3 = and i32 %1, 30
%4 = shl i32 %0, %3
%5 = sub nsw i32 0, %3
%6 = and i32 %5, 30
%7 = lshr i32 %0, %6
%8 = or i32 %7, %4
ret i32 %8
}

define i32 @rotate_demanded_bits_2(i32, i32) {
; X86-LABEL: rotate_demanded_bits_2:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: andb $23, %cl
; X86-NEXT: roll %cl, %eax
; X86-NEXT: retl
;
; X64-LABEL: rotate_demanded_bits_2:
; X64: # %bb.0:
; X64-NEXT: andb $23, %sil
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: roll %cl, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%3 = and i32 %1, 23
%4 = shl i32 %0, %3
%5 = sub nsw i32 0, %3
%6 = and i32 %5, 31
%7 = lshr i32 %0, %6
%8 = or i32 %7, %4
ret i32 %8
}

define i32 @rotate_demanded_bits_3(i32, i32) {
; X86-LABEL: rotate_demanded_bits_3:
; X86: # %bb.0:
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movb {{[0-9]+}}(%esp), %cl
; X86-NEXT: addb %cl, %cl
; X86-NEXT: andb $30, %cl
; X86-NEXT: roll %cl, %eax
; X86-NEXT: retl
;
; X64-LABEL: rotate_demanded_bits_3:
; X64: # %bb.0:
; X64-NEXT: addb %sil, %sil
; X64-NEXT: andb $30, %sil
; X64-NEXT: movl %esi, %ecx
; X64-NEXT: roll %cl, %edi
; X64-NEXT: movl %edi, %eax
; X64-NEXT: retq
%3 = shl i32 %1, 1
%4 = and i32 %3, 30
%5 = shl i32 %0, %4
%6 = sub i32 0, %3
%7 = and i32 %6, 30
%8 = lshr i32 %0, %7
%9 = or i32 %5, %8
ret i32 %9
}