llvm-project/llvm/test/CodeGen/SystemZ/shift-04.ll

317 lines
7.8 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; Test 32-bit rotates left.
;
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
; Check the low end of the RLL range.
define i32 @f1(i32 %a) {
; CHECK-LABEL: f1:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 1
; CHECK-NEXT: br %r14
%parta = shl i32 %a, 1
%partb = lshr i32 %a, 31
%or = or i32 %parta, %partb
ret i32 %or
}
; Check the high end of the defined RLL range.
define i32 @f2(i32 %a) {
; CHECK-LABEL: f2:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 31
; CHECK-NEXT: br %r14
%parta = shl i32 %a, 31
%partb = lshr i32 %a, 1
%or = or i32 %parta, %partb
ret i32 %or
}
; We don't generate shifts by out-of-range values.
define i32 @f3(i32 %a) {
; CHECK-LABEL: f3:
; CHECK: # %bb.0:
; CHECK-NEXT: lhi %r2, -1
; CHECK-NEXT: br %r14
%parta = shl i32 %a, 32
%partb = lshr i32 %a, 0
%or = or i32 %parta, %partb
ret i32 %or
}
; Check variable shifts.
define i32 @f4(i32 %a, i32 %amt) {
; CHECK-LABEL: f4:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 0(%r3)
; CHECK-NEXT: br %r14
%amtb = sub i32 32, %amt
%parta = shl i32 %a, %amt
%partb = lshr i32 %a, %amtb
%or = or i32 %parta, %partb
ret i32 %or
}
; Check shift amounts that have a constant term.
define i32 @f5(i32 %a, i32 %amt) {
; CHECK-LABEL: f5:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 10(%r3)
; CHECK-NEXT: br %r14
%add = add i32 %amt, 10
%sub = sub i32 32, %add
%parta = shl i32 %a, %add
%partb = lshr i32 %a, %sub
%or = or i32 %parta, %partb
ret i32 %or
}
; ...and again with a truncated 64-bit shift amount.
define i32 @f6(i32 %a, i64 %amt) {
; CHECK-LABEL: f6:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 10(%r3)
; CHECK-NEXT: br %r14
%add = add i64 %amt, 10
%addtrunc = trunc i64 %add to i32
%sub = sub i32 32, %addtrunc
%parta = shl i32 %a, %addtrunc
%partb = lshr i32 %a, %sub
%or = or i32 %parta, %partb
ret i32 %or
}
; ...and again with a different truncation representation.
define i32 @f7(i32 %a, i64 %amt) {
; CHECK-LABEL: f7:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 10(%r3)
; CHECK-NEXT: br %r14
%add = add i64 %amt, 10
%sub = sub i64 32, %add
%addtrunc = trunc i64 %add to i32
%subtrunc = trunc i64 %sub to i32
%parta = shl i32 %a, %addtrunc
%partb = lshr i32 %a, %subtrunc
%or = or i32 %parta, %partb
ret i32 %or
}
; Check shift amounts that have the largest in-range constant term, and then
; mask the amount.
define i32 @f8(i32 %a, i32 %amt) {
; CHECK-LABEL: f8:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, -1(%r3)
; CHECK-NEXT: br %r14
%add = add i32 %amt, 524287
%sub = sub i32 32, %add
%parta = shl i32 %a, %add
%partb = lshr i32 %a, %sub
%or = or i32 %parta, %partb
ret i32 %or
}
; Check the next value up, which without masking must use a separate
; addition.
define i32 @f9(i32 %a, i32 %amt) {
; CHECK-LABEL: f9:
; CHECK: # %bb.0:
; CHECK-NEXT: afi %r3, 524288
; CHECK-NEXT: rll %r2, %r2, 0(%r3)
; CHECK-NEXT: br %r14
%add = add i32 %amt, 524288
%sub = sub i32 32, %add
%parta = shl i32 %a, %add
%partb = lshr i32 %a, %sub
%or = or i32 %parta, %partb
ret i32 %or
}
; Check cases where 1 is subtracted from the shift amount.
define i32 @f10(i32 %a, i32 %amt) {
; CHECK-LABEL: f10:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, -1(%r3)
; CHECK-NEXT: br %r14
%suba = sub i32 %amt, 1
%subb = sub i32 32, %suba
%parta = shl i32 %a, %suba
%partb = lshr i32 %a, %subb
%or = or i32 %parta, %partb
ret i32 %or
}
; Check the lowest value that can be subtracted from the shift amount.
; Again, we could mask the shift amount instead.
define i32 @f11(i32 %a, i32 %amt) {
; CHECK-LABEL: f11:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, -524288(%r3)
; CHECK-NEXT: br %r14
%suba = sub i32 %amt, 524288
%subb = sub i32 32, %suba
%parta = shl i32 %a, %suba
%partb = lshr i32 %a, %subb
%or = or i32 %parta, %partb
ret i32 %or
}
; Check the next value down, masking the amount removes the addition.
define i32 @f12(i32 %a, i32 %amt) {
; CHECK-LABEL: f12:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, -1(%r3)
; CHECK-NEXT: br %r14
%suba = sub i32 %amt, 524289
%subb = sub i32 32, %suba
%parta = shl i32 %a, %suba
%partb = lshr i32 %a, %subb
%or = or i32 %parta, %partb
ret i32 %or
}
; Check that we don't try to generate "indexed" shifts.
define i32 @f13(i32 %a, i32 %b, i32 %c) {
; CHECK-LABEL: f13:
; CHECK: # %bb.0:
; CHECK-NEXT: ar %r3, %r4
; CHECK-NEXT: rll %r2, %r2, 0(%r3)
; CHECK-NEXT: br %r14
%add = add i32 %b, %c
%sub = sub i32 32, %add
%parta = shl i32 %a, %add
%partb = lshr i32 %a, %sub
%or = or i32 %parta, %partb
ret i32 %or
}
; Check that the shift amount uses an address register. It cannot be in %r0.
define i32 @f14(i32 %a, i32 *%ptr) {
; CHECK-LABEL: f14:
; CHECK: # %bb.0:
; CHECK-NEXT: l %r1, 0(%r3)
; CHECK-NEXT: rll %r2, %r2, 0(%r1)
; CHECK-NEXT: br %r14
%amt = load i32, i32 *%ptr
%amtb = sub i32 32, %amt
%parta = shl i32 %a, %amt
%partb = lshr i32 %a, %amtb
%or = or i32 %parta, %partb
ret i32 %or
}
; Check another form of f5, which is the one produced by running f5 through
; instcombine.
define i32 @f15(i32 %a, i32 %amt) {
; CHECK-LABEL: f15:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 10(%r3)
; CHECK-NEXT: br %r14
%add = add i32 %amt, 10
%sub = sub i32 22, %amt
%parta = shl i32 %a, %add
%partb = lshr i32 %a, %sub
%or = or i32 %parta, %partb
ret i32 %or
}
; Likewise for f7.
define i32 @f16(i32 %a, i64 %amt) {
; CHECK-LABEL: f16:
; CHECK: # %bb.0:
; CHECK-NEXT: rll %r2, %r2, 10(%r3)
; CHECK-NEXT: br %r14
%add = add i64 %amt, 10
%sub = sub i64 22, %amt
%addtrunc = trunc i64 %add to i32
%subtrunc = trunc i64 %sub to i32
%parta = shl i32 %a, %addtrunc
%partb = lshr i32 %a, %subtrunc
%or = or i32 %parta, %partb
ret i32 %or
}
; Check cases where (-x & 31) is used instead of 32 - x.
define i32 @f17(i32 %x, i32 %y) {
; CHECK-LABEL: f17:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: rll %r2, %r2, 0(%r3)
; CHECK-NEXT: br %r14
entry:
%shl = shl i32 %x, %y
%sub = sub i32 0, %y
%and = and i32 %sub, 31
%shr = lshr i32 %x, %and
%or = or i32 %shr, %shl
ret i32 %or
}
; ...and again with ((32 - x) & 31).
define i32 @f18(i32 %x, i32 %y) {
; CHECK-LABEL: f18:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: rll %r2, %r2, 0(%r3)
; CHECK-NEXT: br %r14
entry:
%shl = shl i32 %x, %y
%sub = sub i32 32, %y
%and = and i32 %sub, 31
%shr = lshr i32 %x, %and
%or = or i32 %shr, %shl
ret i32 %or
}
; This is not a rotation.
define i32 @f19(i32 %x, i32 %y) {
; CHECK-LABEL: f19:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: lr %r0, %r2
; CHECK-NEXT: sll %r0, 0(%r3)
; CHECK-NEXT: lhi %r1, 16
; CHECK-NEXT: sr %r1, %r3
; CHECK-NEXT: nill %r1, 31
; CHECK-NEXT: srl %r2, 0(%r1)
; CHECK-NEXT: or %r2, %r0
; CHECK-NEXT: br %r14
entry:
%shl = shl i32 %x, %y
%sub = sub i32 16, %y
%and = and i32 %sub, 31
%shr = lshr i32 %x, %and
%or = or i32 %shr, %shl
ret i32 %or
}
; Repeat f17 with an addition on the shift count.
define i32 @f20(i32 %x, i32 %y) {
; CHECK-LABEL: f20:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: rll %r2, %r2, 199(%r3)
; CHECK-NEXT: br %r14
entry:
%add = add i32 %y, 199
%shl = shl i32 %x, %add
%sub = sub i32 0, %add
%and = and i32 %sub, 31
%shr = lshr i32 %x, %and
%or = or i32 %shr, %shl
ret i32 %or
}
; ...and again with the InstCombine version.
define i32 @f21(i32 %x, i32 %y) {
; CHECK-LABEL: f21:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: rll %r2, %r2, 199(%r3)
; CHECK-NEXT: br %r14
entry:
%add = add i32 %y, 199
%shl = shl i32 %x, %add
%sub = sub i32 -199, %y
%and = and i32 %sub, 31
%shr = lshr i32 %x, %and
%or = or i32 %shr, %shl
ret i32 %or
}