[RISCV] Add test cases that show that we're too aggressive about using greviw/gorciw. NFC

We currently type legalize to the W form, but type legalization
doesn't place any requirements on the extended bits. So we are ok
to use GREVI/GORCI for type legalization as long as the control
doesn't cross any bits from the extended bits into the lower bits.

This can allow us to recognize cases where the extended bits end
up being all zeros and we can propagate that information through.

My plan is to move greviw/gorciw formation to isel patterns similar
to slliw.
This commit is contained in:
Craig Topper 2022-03-11 15:29:26 -08:00
parent a7b1dccf7a
commit fa62c5326a
3 changed files with 189 additions and 90 deletions

View File

@ -1,6 +1,8 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=riscv64 -mattr=+zbb -verify-machineinstrs < %s \
; RUN: | FileCheck %s -check-prefix=RV64ZBB
; RUN: llc -mtriple=riscv64 -mattr=+zbb,+experimental-zbp -verify-machineinstrs < %s \
; RUN: | FileCheck %s -check-prefix=RV64ZBP
declare i32 @llvm.riscv.orc.b.i32(i32)
@ -10,6 +12,29 @@ define signext i32 @orcb32(i32 signext %a) nounwind {
; RV64ZBB-NEXT: orc.b a0, a0
; RV64ZBB-NEXT: sext.w a0, a0
; RV64ZBB-NEXT: ret
;
; RV64ZBP-LABEL: orcb32:
; RV64ZBP: # %bb.0:
; RV64ZBP-NEXT: gorciw a0, a0, 7
; RV64ZBP-NEXT: ret
%tmp = call i32 @llvm.riscv.orc.b.i32(i32 %a)
ret i32 %tmp
}
define zeroext i32 @orcb32_zext(i32 zeroext %a) nounwind {
; RV64ZBB-LABEL: orcb32_zext:
; RV64ZBB: # %bb.0:
; RV64ZBB-NEXT: orc.b a0, a0
; RV64ZBB-NEXT: slli a0, a0, 32
; RV64ZBB-NEXT: srli a0, a0, 32
; RV64ZBB-NEXT: ret
;
; RV64ZBP-LABEL: orcb32_zext:
; RV64ZBP: # %bb.0:
; RV64ZBP-NEXT: gorciw a0, a0, 7
; RV64ZBP-NEXT: slli a0, a0, 32
; RV64ZBP-NEXT: srli a0, a0, 32
; RV64ZBP-NEXT: ret
%tmp = call i32 @llvm.riscv.orc.b.i32(i32 %a)
ret i32 %tmp
}
@ -21,6 +46,11 @@ define i64 @orcb64(i64 %a) nounwind {
; RV64ZBB: # %bb.0:
; RV64ZBB-NEXT: orc.b a0, a0
; RV64ZBB-NEXT: ret
;
; RV64ZBP-LABEL: orcb64:
; RV64ZBP: # %bb.0:
; RV64ZBP-NEXT: orc.b a0, a0
; RV64ZBP-NEXT: ret
%tmp = call i64 @llvm.riscv.orc.b.i64(i64 %a)
ret i64 %tmp
}

View File

@ -34,6 +34,17 @@ define signext i32 @grevi32(i32 signext %a) nounwind {
ret i32 %tmp
}
define zeroext i32 @grevi32_zext(i32 zeroext %a) nounwind {
; RV64ZBP-LABEL: grevi32_zext:
; RV64ZBP: # %bb.0:
; RV64ZBP-NEXT: greviw a0, a0, 13
; RV64ZBP-NEXT: slli a0, a0, 32
; RV64ZBP-NEXT: srli a0, a0, 32
; RV64ZBP-NEXT: ret
%tmp = call i32 @llvm.riscv.grev.i32(i32 %a, i32 13)
ret i32 %tmp
}
declare i32 @llvm.riscv.gorc.i32(i32 %a, i32 %b)
define signext i32 @gorc32(i32 signext %a, i32 signext %b) nounwind {

View File

@ -1613,31 +1613,89 @@ define signext i32 @grev7_i32(i32 signext %a) nounwind {
ret i32 %or3
}
define zeroext i32 @grev7_i32_zext(i32 zeroext %a) nounwind {
; RV64I-LABEL: grev7_i32_zext:
; RV64I: # %bb.0:
; RV64I-NEXT: slliw a1, a0, 1
; RV64I-NEXT: lui a2, 699051
; RV64I-NEXT: addiw a2, a2, -1366
; RV64I-NEXT: and a1, a1, a2
; RV64I-NEXT: srli a0, a0, 1
; RV64I-NEXT: lui a2, 349525
; RV64I-NEXT: addiw a2, a2, 1365
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: slliw a1, a0, 2
; RV64I-NEXT: lui a2, 838861
; RV64I-NEXT: addiw a2, a2, -820
; RV64I-NEXT: and a1, a1, a2
; RV64I-NEXT: srli a0, a0, 2
; RV64I-NEXT: lui a2, 209715
; RV64I-NEXT: addiw a2, a2, 819
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: slli a1, a0, 4
; RV64I-NEXT: lui a2, 241
; RV64I-NEXT: addiw a2, a2, -241
; RV64I-NEXT: slli a2, a2, 12
; RV64I-NEXT: addi a2, a2, 240
; RV64I-NEXT: and a1, a1, a2
; RV64I-NEXT: srli a0, a0, 4
; RV64I-NEXT: lui a2, 61681
; RV64I-NEXT: addiw a2, a2, -241
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: ret
;
; RV64ZBP-LABEL: grev7_i32_zext:
; RV64ZBP: # %bb.0:
; RV64ZBP-NEXT: greviw a0, a0, 7
; RV64ZBP-NEXT: slli a0, a0, 32
; RV64ZBP-NEXT: srli a0, a0, 32
; RV64ZBP-NEXT: ret
%and1 = shl i32 %a, 1
%shl1 = and i32 %and1, -1431655766
%and1b = lshr i32 %a, 1
%shr1 = and i32 %and1b, 1431655765
%or1 = or i32 %shl1, %shr1
%and2 = shl i32 %or1, 2
%shl2 = and i32 %and2, -858993460
%and2b = lshr i32 %or1, 2
%shr2 = and i32 %and2b, 858993459
%or2 = or i32 %shl2, %shr2
%and3 = shl i32 %or2, 4
%shl3 = and i32 %and3, -252645136
%and3b = lshr i32 %or2, 4
%shr3 = and i32 %and3b, 252645135
%or3 = or i32 %shl3, %shr3
ret i32 %or3
}
define i64 @grev7_i64(i64 %a) nounwind {
; RV64I-LABEL: grev7_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI44_0)
; RV64I-NEXT: ld a1, %lo(.LCPI44_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI44_1)
; RV64I-NEXT: ld a2, %lo(.LCPI44_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI45_0)
; RV64I-NEXT: ld a1, %lo(.LCPI45_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI45_1)
; RV64I-NEXT: ld a2, %lo(.LCPI45_1)(a2)
; RV64I-NEXT: slli a3, a0, 1
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 1
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: lui a1, %hi(.LCPI44_2)
; RV64I-NEXT: ld a1, %lo(.LCPI44_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI44_3)
; RV64I-NEXT: ld a2, %lo(.LCPI44_3)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI45_2)
; RV64I-NEXT: ld a1, %lo(.LCPI45_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI45_3)
; RV64I-NEXT: ld a2, %lo(.LCPI45_3)(a2)
; RV64I-NEXT: slli a3, a0, 2
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 2
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: lui a1, %hi(.LCPI44_4)
; RV64I-NEXT: ld a1, %lo(.LCPI44_4)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI44_5)
; RV64I-NEXT: ld a2, %lo(.LCPI44_5)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI45_4)
; RV64I-NEXT: ld a1, %lo(.LCPI45_4)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI45_5)
; RV64I-NEXT: ld a2, %lo(.LCPI45_5)(a2)
; RV64I-NEXT: slli a3, a0, 4
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 4
@ -1696,10 +1754,10 @@ define signext i32 @grev8_i32(i32 signext %a) nounwind {
define i64 @grev8_i64(i64 %a) nounwind {
; RV64I-LABEL: grev8_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI46_0)
; RV64I-NEXT: ld a1, %lo(.LCPI46_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI46_1)
; RV64I-NEXT: ld a2, %lo(.LCPI46_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI47_0)
; RV64I-NEXT: ld a1, %lo(.LCPI47_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI47_1)
; RV64I-NEXT: ld a2, %lo(.LCPI47_1)(a2)
; RV64I-NEXT: slli a3, a0, 8
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 8
@ -1762,19 +1820,19 @@ define signext i32 @grev12_i32(i32 signext %a) nounwind {
define i64 @grev12_i64(i64 %a) nounwind {
; RV64I-LABEL: grev12_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI48_0)
; RV64I-NEXT: ld a1, %lo(.LCPI48_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI48_1)
; RV64I-NEXT: ld a2, %lo(.LCPI48_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI49_0)
; RV64I-NEXT: ld a1, %lo(.LCPI49_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI49_1)
; RV64I-NEXT: ld a2, %lo(.LCPI49_1)(a2)
; RV64I-NEXT: slli a3, a0, 4
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 4
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: lui a1, %hi(.LCPI48_2)
; RV64I-NEXT: ld a1, %lo(.LCPI48_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI48_3)
; RV64I-NEXT: ld a2, %lo(.LCPI48_3)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI49_2)
; RV64I-NEXT: ld a1, %lo(.LCPI49_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI49_3)
; RV64I-NEXT: ld a2, %lo(.LCPI49_3)(a2)
; RV64I-NEXT: slli a3, a0, 8
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 8
@ -1856,28 +1914,28 @@ define signext i32 @grev14_i32(i32 signext %a) nounwind {
define i64 @grev14_i64(i64 %a) nounwind {
; RV64I-LABEL: grev14_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI50_0)
; RV64I-NEXT: ld a1, %lo(.LCPI50_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI50_1)
; RV64I-NEXT: ld a2, %lo(.LCPI50_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI51_0)
; RV64I-NEXT: ld a1, %lo(.LCPI51_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI51_1)
; RV64I-NEXT: ld a2, %lo(.LCPI51_1)(a2)
; RV64I-NEXT: slli a3, a0, 2
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 2
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: lui a1, %hi(.LCPI50_2)
; RV64I-NEXT: ld a1, %lo(.LCPI50_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI50_3)
; RV64I-NEXT: ld a2, %lo(.LCPI50_3)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI51_2)
; RV64I-NEXT: ld a1, %lo(.LCPI51_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI51_3)
; RV64I-NEXT: ld a2, %lo(.LCPI51_3)(a2)
; RV64I-NEXT: slli a3, a0, 4
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 4
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: lui a1, %hi(.LCPI50_4)
; RV64I-NEXT: ld a1, %lo(.LCPI50_4)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI50_5)
; RV64I-NEXT: ld a2, %lo(.LCPI50_5)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI51_4)
; RV64I-NEXT: ld a1, %lo(.LCPI51_4)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI51_5)
; RV64I-NEXT: ld a2, %lo(.LCPI51_5)(a2)
; RV64I-NEXT: slli a3, a0, 8
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 8
@ -2050,19 +2108,19 @@ define signext i32 @grev3b_i32(i32 signext %a) nounwind {
define i64 @grev3b_i64(i64 %a) nounwind {
; RV64I-LABEL: grev3b_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI57_0)
; RV64I-NEXT: ld a1, %lo(.LCPI57_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI57_1)
; RV64I-NEXT: ld a2, %lo(.LCPI57_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI58_0)
; RV64I-NEXT: ld a1, %lo(.LCPI58_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI58_1)
; RV64I-NEXT: ld a2, %lo(.LCPI58_1)(a2)
; RV64I-NEXT: slli a3, a0, 2
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 2
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: lui a1, %hi(.LCPI57_2)
; RV64I-NEXT: ld a1, %lo(.LCPI57_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI57_3)
; RV64I-NEXT: ld a2, %lo(.LCPI57_3)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI58_2)
; RV64I-NEXT: ld a1, %lo(.LCPI58_2)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI58_3)
; RV64I-NEXT: ld a2, %lo(.LCPI58_3)(a2)
; RV64I-NEXT: slli a3, a0, 1
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: srli a0, a0, 1
@ -2142,19 +2200,19 @@ define signext i32 @grev2b_i32(i32 signext %a) nounwind {
define i64 @grev2b_i64(i64 %a) nounwind {
; RV64I-LABEL: grev2b_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI59_0)
; RV64I-NEXT: ld a1, %lo(.LCPI59_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI59_1)
; RV64I-NEXT: ld a2, %lo(.LCPI59_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI60_0)
; RV64I-NEXT: ld a1, %lo(.LCPI60_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI60_1)
; RV64I-NEXT: ld a2, %lo(.LCPI60_1)(a2)
; RV64I-NEXT: slli a3, a0, 1
; RV64I-NEXT: and a3, a3, a1
; RV64I-NEXT: srli a0, a0, 1
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a3, a0
; RV64I-NEXT: lui a3, %hi(.LCPI59_2)
; RV64I-NEXT: ld a3, %lo(.LCPI59_2)(a3)
; RV64I-NEXT: lui a4, %hi(.LCPI59_3)
; RV64I-NEXT: ld a4, %lo(.LCPI59_3)(a4)
; RV64I-NEXT: lui a3, %hi(.LCPI60_2)
; RV64I-NEXT: ld a3, %lo(.LCPI60_2)(a3)
; RV64I-NEXT: lui a4, %hi(.LCPI60_3)
; RV64I-NEXT: ld a4, %lo(.LCPI60_3)(a4)
; RV64I-NEXT: slli a5, a0, 2
; RV64I-NEXT: and a3, a5, a3
; RV64I-NEXT: srli a0, a0, 2
@ -2253,19 +2311,19 @@ define signext i32 @grev0_i32(i32 signext %a) nounwind {
define i64 @grev0_i64(i64 %a) nounwind {
; RV64I-LABEL: grev0_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI61_0)
; RV64I-NEXT: ld a1, %lo(.LCPI61_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI61_1)
; RV64I-NEXT: ld a2, %lo(.LCPI61_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI62_0)
; RV64I-NEXT: ld a1, %lo(.LCPI62_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI62_1)
; RV64I-NEXT: ld a2, %lo(.LCPI62_1)(a2)
; RV64I-NEXT: slli a3, a0, 1
; RV64I-NEXT: and a3, a3, a1
; RV64I-NEXT: srli a0, a0, 1
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: or a0, a3, a0
; RV64I-NEXT: lui a3, %hi(.LCPI61_2)
; RV64I-NEXT: ld a3, %lo(.LCPI61_2)(a3)
; RV64I-NEXT: lui a4, %hi(.LCPI61_3)
; RV64I-NEXT: ld a4, %lo(.LCPI61_3)(a4)
; RV64I-NEXT: lui a3, %hi(.LCPI62_2)
; RV64I-NEXT: ld a3, %lo(.LCPI62_2)(a3)
; RV64I-NEXT: lui a4, %hi(.LCPI62_3)
; RV64I-NEXT: ld a4, %lo(.LCPI62_3)(a4)
; RV64I-NEXT: slli a5, a0, 2
; RV64I-NEXT: and a5, a5, a3
; RV64I-NEXT: srli a0, a0, 2
@ -2660,22 +2718,22 @@ define i64 @bitreverse_i64(i64 %a) nounwind {
; RV64I-NEXT: and a3, a4, a3
; RV64I-NEXT: slli a0, a0, 56
; RV64I-NEXT: or a0, a0, a3
; RV64I-NEXT: lui a3, %hi(.LCPI72_0)
; RV64I-NEXT: ld a3, %lo(.LCPI72_0)(a3)
; RV64I-NEXT: lui a3, %hi(.LCPI73_0)
; RV64I-NEXT: ld a3, %lo(.LCPI73_0)(a3)
; RV64I-NEXT: or a0, a0, a2
; RV64I-NEXT: or a0, a0, a1
; RV64I-NEXT: srli a1, a0, 4
; RV64I-NEXT: and a1, a1, a3
; RV64I-NEXT: and a0, a0, a3
; RV64I-NEXT: lui a2, %hi(.LCPI72_1)
; RV64I-NEXT: ld a2, %lo(.LCPI72_1)(a2)
; RV64I-NEXT: lui a2, %hi(.LCPI73_1)
; RV64I-NEXT: ld a2, %lo(.LCPI73_1)(a2)
; RV64I-NEXT: slli a0, a0, 4
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: srli a1, a0, 2
; RV64I-NEXT: and a1, a1, a2
; RV64I-NEXT: and a0, a0, a2
; RV64I-NEXT: lui a2, %hi(.LCPI72_2)
; RV64I-NEXT: ld a2, %lo(.LCPI72_2)(a2)
; RV64I-NEXT: lui a2, %hi(.LCPI73_2)
; RV64I-NEXT: ld a2, %lo(.LCPI73_2)(a2)
; RV64I-NEXT: slli a0, a0, 2
; RV64I-NEXT: or a0, a1, a0
; RV64I-NEXT: srli a1, a0, 1
@ -2873,20 +2931,20 @@ define i32 @bitreverse_bswap_i32(i32 %a) {
define i64 @bitreverse_bswap_i64(i64 %a) {
; RV64I-LABEL: bitreverse_bswap_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI78_0)
; RV64I-NEXT: ld a1, %lo(.LCPI78_0)(a1)
; RV64I-NEXT: lui a1, %hi(.LCPI79_0)
; RV64I-NEXT: ld a1, %lo(.LCPI79_0)(a1)
; RV64I-NEXT: srli a2, a0, 4
; RV64I-NEXT: and a2, a2, a1
; RV64I-NEXT: and a0, a0, a1
; RV64I-NEXT: lui a1, %hi(.LCPI78_1)
; RV64I-NEXT: ld a1, %lo(.LCPI78_1)(a1)
; RV64I-NEXT: lui a1, %hi(.LCPI79_1)
; RV64I-NEXT: ld a1, %lo(.LCPI79_1)(a1)
; RV64I-NEXT: slli a0, a0, 4
; RV64I-NEXT: or a0, a2, a0
; RV64I-NEXT: srli a2, a0, 2
; RV64I-NEXT: and a2, a2, a1
; RV64I-NEXT: and a0, a0, a1
; RV64I-NEXT: lui a1, %hi(.LCPI78_2)
; RV64I-NEXT: ld a1, %lo(.LCPI78_2)(a1)
; RV64I-NEXT: lui a1, %hi(.LCPI79_2)
; RV64I-NEXT: ld a1, %lo(.LCPI79_2)(a1)
; RV64I-NEXT: slli a0, a0, 2
; RV64I-NEXT: or a0, a2, a0
; RV64I-NEXT: srli a2, a0, 1
@ -2940,14 +2998,14 @@ define signext i32 @shfl1_i32(i32 signext %a, i32 signext %b) nounwind {
define i64 @shfl1_i64(i64 %a, i64 %b) nounwind {
; RV64I-LABEL: shfl1_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI80_1)
; RV64I-NEXT: ld a1, %lo(.LCPI80_1)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI80_0)
; RV64I-NEXT: ld a2, %lo(.LCPI80_0)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI81_1)
; RV64I-NEXT: ld a1, %lo(.LCPI81_1)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI81_0)
; RV64I-NEXT: ld a2, %lo(.LCPI81_0)(a2)
; RV64I-NEXT: slli a3, a0, 1
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: lui a3, %hi(.LCPI80_2)
; RV64I-NEXT: ld a3, %lo(.LCPI80_2)(a3)
; RV64I-NEXT: lui a3, %hi(.LCPI81_2)
; RV64I-NEXT: ld a3, %lo(.LCPI81_2)(a3)
; RV64I-NEXT: and a2, a0, a2
; RV64I-NEXT: or a1, a2, a1
; RV64I-NEXT: srli a0, a0, 1
@ -3004,14 +3062,14 @@ define signext i32 @shfl2_i32(i32 signext %a, i32 signext %b) nounwind {
define i64 @shfl2_i64(i64 %a, i64 %b) nounwind {
; RV64I-LABEL: shfl2_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI82_1)
; RV64I-NEXT: ld a1, %lo(.LCPI82_1)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI82_0)
; RV64I-NEXT: ld a2, %lo(.LCPI82_0)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI83_1)
; RV64I-NEXT: ld a1, %lo(.LCPI83_1)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI83_0)
; RV64I-NEXT: ld a2, %lo(.LCPI83_0)(a2)
; RV64I-NEXT: slli a3, a0, 2
; RV64I-NEXT: and a1, a3, a1
; RV64I-NEXT: lui a3, %hi(.LCPI82_2)
; RV64I-NEXT: ld a3, %lo(.LCPI82_2)(a3)
; RV64I-NEXT: lui a3, %hi(.LCPI83_2)
; RV64I-NEXT: ld a3, %lo(.LCPI83_2)(a3)
; RV64I-NEXT: and a2, a0, a2
; RV64I-NEXT: or a1, a2, a1
; RV64I-NEXT: srli a0, a0, 2
@ -3068,13 +3126,13 @@ define signext i32 @shfl4_i32(i32 signext %a, i32 signext %b) nounwind {
define i64 @shfl4_i64(i64 %a, i64 %b) nounwind {
; RV64I-LABEL: shfl4_i64:
; RV64I: # %bb.0:
; RV64I-NEXT: lui a1, %hi(.LCPI84_0)
; RV64I-NEXT: ld a1, %lo(.LCPI84_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI84_1)
; RV64I-NEXT: ld a2, %lo(.LCPI84_1)(a2)
; RV64I-NEXT: lui a1, %hi(.LCPI85_0)
; RV64I-NEXT: ld a1, %lo(.LCPI85_0)(a1)
; RV64I-NEXT: lui a2, %hi(.LCPI85_1)
; RV64I-NEXT: ld a2, %lo(.LCPI85_1)(a2)
; RV64I-NEXT: slli a3, a0, 4
; RV64I-NEXT: lui a4, %hi(.LCPI84_2)
; RV64I-NEXT: ld a4, %lo(.LCPI84_2)(a4)
; RV64I-NEXT: lui a4, %hi(.LCPI85_2)
; RV64I-NEXT: ld a4, %lo(.LCPI85_2)(a4)
; RV64I-NEXT: and a2, a3, a2
; RV64I-NEXT: and a1, a0, a1
; RV64I-NEXT: srli a0, a0, 4