2013-07-18 18:40:35 +08:00
|
|
|
; Test sequences that can use RNSBG.
|
|
|
|
;
|
|
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
|
|
|
|
|
|
|
|
; Test a simple mask, which is a wrap-around case.
|
|
|
|
define i32 @f1(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f1:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 59, 56, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%orb = or i32 %b, 96
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f2(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f2:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 59, 56, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%orb = or i64 %b, 96
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case where no wraparound is needed.
|
|
|
|
define i32 @f3(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f3:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 58, 61, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%orb = or i32 %b, -61
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f4(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f4:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 58, 61, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%orb = or i64 %b, -61
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with just a left shift. This can't use RNSBG.
|
|
|
|
define i32 @f6(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f6:
|
|
|
|
; CHECK: sll {{%r[0-5]}}
|
|
|
|
; CHECK: nr {{%r[0-5]}}
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shrb = shl i32 %b, 20
|
|
|
|
%and = and i32 %a, %shrb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f7(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f7:
|
|
|
|
; CHECK: sllg {{%r[0-5]}}
|
|
|
|
; CHECK: ngr {{%r[0-5]}}
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shrb = shl i64 %b, 20
|
|
|
|
%and = and i64 %a, %shrb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with just a rotate. This can't use RNSBG.
|
|
|
|
define i32 @f8(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f8:
|
|
|
|
; CHECK: rll {{%r[0-5]}}
|
|
|
|
; CHECK: nr {{%r[0-5]}}
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i32 %b, 22
|
|
|
|
%shrb = lshr i32 %b, 10
|
|
|
|
%rotlb = or i32 %shlb, %shrb
|
|
|
|
%and = and i32 %a, %rotlb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64, which can.
|
|
|
|
define i64 @f9(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f9:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 0, 63, 44
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i64 %b, 44
|
|
|
|
%shrb = lshr i64 %b, 20
|
|
|
|
%rotlb = or i64 %shlb, %shrb
|
|
|
|
%and = and i64 %a, %rotlb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with a left shift and OR, where the OR covers all shifted bits.
|
|
|
|
; We can do the whole thing using RNSBG.
|
|
|
|
define i32 @f10(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f10:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 32, 56, 7
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i32 %b, 7
|
|
|
|
%orb = or i32 %shlb, 127
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f11(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f11:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 0, 56, 7
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i64 %b, 7
|
|
|
|
%orb = or i64 %shlb, 127
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with a left shift and OR, where the OR doesn't cover all
|
|
|
|
; shifted bits. We can't use RNSBG for the shift, but we can for the OR
|
|
|
|
; and AND.
|
|
|
|
define i32 @f12(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f12:
|
|
|
|
; CHECK: sll %r3, 7
|
|
|
|
; CHECK: rnsbg %r2, %r3, 32, 57, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i32 %b, 7
|
|
|
|
%orb = or i32 %shlb, 63
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f13(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f13:
|
|
|
|
; CHECK: sllg [[REG:%r[01345]]], %r3, 7
|
|
|
|
; CHECK: rnsbg %r2, [[REG]], 0, 57, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i64 %b, 7
|
|
|
|
%orb = or i64 %shlb, 63
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with a right shift and OR, where the OR covers all the shifted
|
|
|
|
; bits. The whole thing can be done using RNSBG.
|
|
|
|
define i32 @f14(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f14:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 60, 63, 37
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shrb = lshr i32 %b, 27
|
|
|
|
%orb = or i32 %shrb, -16
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f15(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f15:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 60, 63, 5
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shrb = lshr i64 %b, 59
|
|
|
|
%orb = or i64 %shrb, -16
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with a right shift and OR, where the OR doesn't cover all the
|
|
|
|
; shifted bits. The shift needs to be done separately, but the OR and AND
|
|
|
|
; can use RNSBG.
|
|
|
|
define i32 @f16(i32 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f16:
|
|
|
|
; CHECK: srl %r3, 29
|
|
|
|
; CHECK: rnsbg %r2, %r3, 60, 63, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shrb = lshr i32 %b, 29
|
|
|
|
%orb = or i32 %shrb, -16
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f17(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f17:
|
|
|
|
; CHECK: srlg [[REG:%r[01345]]], %r3, 61
|
|
|
|
; CHECK: rnsbg %r2, [[REG]], 60, 63, 0
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shrb = lshr i64 %b, 61
|
|
|
|
%orb = or i64 %shrb, -16
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a combination involving an ASHR in which the sign bits matter.
|
|
|
|
; We can't use RNSBG for the ASHR in that case, but we can for the rest.
|
|
|
|
define i32 @f18(i32 %a, i32 %b, i32 *%dest) {
|
|
|
|
; CHECK-LABEL: f18:
|
|
|
|
; CHECK: sra %r3, 4
|
|
|
|
; CHECK: rnsbg %r2, %r3, 32, 62, 1
|
|
|
|
; CHECK: br %r14
|
|
|
|
%ashrb = ashr i32 %b, 4
|
|
|
|
store i32 %ashrb, i32 *%dest
|
|
|
|
%shlb = shl i32 %ashrb, 1
|
|
|
|
%orb = or i32 %shlb, 1
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f19(i64 %a, i64 %b, i64 *%dest) {
|
|
|
|
; CHECK-LABEL: f19:
|
|
|
|
; CHECK: srag [[REG:%r[0145]]], %r3, 34
|
|
|
|
; CHECK: rnsbg %r2, [[REG]], 0, 62, 1
|
|
|
|
; CHECK: br %r14
|
|
|
|
%ashrb = ashr i64 %b, 34
|
|
|
|
store i64 %ashrb, i64 *%dest
|
|
|
|
%shlb = shl i64 %ashrb, 1
|
|
|
|
%orb = or i64 %shlb, 1
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a combination involving an ASHR in which the sign bits don't matter.
|
|
|
|
define i32 @f20(i32 %a, i32 %b, i32 *%dest) {
|
|
|
|
; CHECK-LABEL: f20:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 48, 62, 48
|
|
|
|
; CHECK: br %r14
|
|
|
|
%ashrb = ashr i32 %b, 17
|
|
|
|
store i32 %ashrb, i32 *%dest
|
|
|
|
%shlb = shl i32 %ashrb, 1
|
|
|
|
%orb = or i32 %shlb, -65535
|
|
|
|
%and = and i32 %a, %orb
|
|
|
|
ret i32 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; ...and again with i64.
|
|
|
|
define i64 @f21(i64 %a, i64 %b, i64 *%dest) {
|
|
|
|
; CHECK-LABEL: f21:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 48, 62, 16
|
|
|
|
; CHECK: br %r14
|
|
|
|
%ashrb = ashr i64 %b, 49
|
|
|
|
store i64 %ashrb, i64 *%dest
|
|
|
|
%shlb = shl i64 %ashrb, 1
|
|
|
|
%orb = or i64 %shlb, -65535
|
|
|
|
%and = and i64 %a, %orb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test a case with a shift, OR, and rotate where the OR covers all shifted bits.
|
|
|
|
define i64 @f22(i64 %a, i64 %b) {
|
|
|
|
; CHECK-LABEL: f22:
|
|
|
|
; CHECK: rnsbg %r2, %r3, 60, 54, 9
|
|
|
|
; CHECK: br %r14
|
|
|
|
%shlb = shl i64 %b, 5
|
|
|
|
%orb = or i64 %shlb, 31
|
|
|
|
%shlorb = shl i64 %orb, 4
|
|
|
|
%shrorb = lshr i64 %orb, 60
|
|
|
|
%rotlorb = or i64 %shlorb, %shrorb
|
|
|
|
%and = and i64 %a, %rotlorb
|
|
|
|
ret i64 %and
|
|
|
|
}
|
2014-01-09 19:28:53 +08:00
|
|
|
|
|
|
|
; Check the handling of zext and AND, which isn't suitable for RNSBG.
|
|
|
|
define i64 @f23(i64 %a, i32 %b) {
|
|
|
|
; CHECK-LABEL: f23:
|
|
|
|
; CHECK-NOT: rnsbg
|
|
|
|
; CHECK: br %r14
|
|
|
|
%add = add i32 %b, 1
|
|
|
|
%ext = zext i32 %add to i64
|
|
|
|
%and = and i64 %a, %ext
|
|
|
|
ret i64 %and
|
|
|
|
}
|