[AArch64][SVEIntrinsicOpts] Convect cntb/h/w/d to vscale intrinsic or constant.

As is mentioned above

Differential Revision: https://reviews.llvm.org/D104852
This commit is contained in:
Jun Ma 2021-06-18 11:55:01 +08:00
parent c0a6318d96
commit ae5433945f
6 changed files with 342 additions and 62 deletions

View File

@ -7,8 +7,9 @@
uint64_t test_svcntb() uint64_t test_svcntb()
{ {
// CHECK-LABEL: test_svcntb // CHECK-LABEL: test_svcntb
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 4
// CHECK: ret i64 %[[RET]]
return svcntb(); return svcntb();
} }
@ -23,72 +24,63 @@ uint64_t test_svcntb_pat()
uint64_t test_svcntb_pat_1() uint64_t test_svcntb_pat_1()
{ {
// CHECK-LABEL: test_svcntb_pat_1 // CHECK-LABEL: test_svcntb_pat_1
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 1) // CHECK: ret i64 1
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL1); return svcntb_pat(SV_VL1);
} }
uint64_t test_svcntb_pat_2() uint64_t test_svcntb_pat_2()
{ {
// CHECK-LABEL: test_svcntb_pat_2 // CHECK-LABEL: test_svcntb_pat_2
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 2) // CHECK: ret i64 2
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL2); return svcntb_pat(SV_VL2);
} }
uint64_t test_svcntb_pat_3() uint64_t test_svcntb_pat_3()
{ {
// CHECK-LABEL: test_svcntb_pat_3 // CHECK-LABEL: test_svcntb_pat_3
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 3) // CHECK: ret i64 3
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL3); return svcntb_pat(SV_VL3);
} }
uint64_t test_svcntb_pat_4() uint64_t test_svcntb_pat_4()
{ {
// CHECK-LABEL: test_svcntb_pat_4 // CHECK-LABEL: test_svcntb_pat_4
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 4) // CHECK: ret i64 4
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL4); return svcntb_pat(SV_VL4);
} }
uint64_t test_svcntb_pat_5() uint64_t test_svcntb_pat_5()
{ {
// CHECK-LABEL: test_svcntb_pat_5 // CHECK-LABEL: test_svcntb_pat_5
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 5) // CHECK: ret i64 5
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL5); return svcntb_pat(SV_VL5);
} }
uint64_t test_svcntb_pat_6() uint64_t test_svcntb_pat_6()
{ {
// CHECK-LABEL: test_svcntb_pat_6 // CHECK-LABEL: test_svcntb_pat_6
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 6) // CHECK: ret i64 6
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL6); return svcntb_pat(SV_VL6);
} }
uint64_t test_svcntb_pat_7() uint64_t test_svcntb_pat_7()
{ {
// CHECK-LABEL: test_svcntb_pat_7 // CHECK-LABEL: test_svcntb_pat_7
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 7) // CHECK: ret i64 7
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL7); return svcntb_pat(SV_VL7);
} }
uint64_t test_svcntb_pat_8() uint64_t test_svcntb_pat_8()
{ {
// CHECK-LABEL: test_svcntb_pat_8 // CHECK-LABEL: test_svcntb_pat_8
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 8) // CHECK: ret i64 8
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL8); return svcntb_pat(SV_VL8);
} }
uint64_t test_svcntb_pat_9() uint64_t test_svcntb_pat_9()
{ {
// CHECK-LABEL: test_svcntb_pat_9 // CHECK-LABEL: test_svcntb_pat_9
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 9) // CHECK: ret i64 16
// CHECK: ret i64 %[[INTRINSIC]]
return svcntb_pat(SV_VL16); return svcntb_pat(SV_VL16);
} }
@ -143,7 +135,8 @@ uint64_t test_svcntb_pat_15()
uint64_t test_svcntb_pat_16() uint64_t test_svcntb_pat_16()
{ {
// CHECK-LABEL: test_svcntb_pat_16 // CHECK-LABEL: test_svcntb_pat_16
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntb(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 4
// CHECK: ret i64 %[[RET]]
return svcntb_pat(SV_ALL); return svcntb_pat(SV_ALL);
} }

View File

@ -7,8 +7,9 @@
uint64_t test_svcntd() uint64_t test_svcntd()
{ {
// CHECK-LABEL: test_svcntd // CHECK-LABEL: test_svcntd
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntd(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 1
// CHECK: ret i64 %[[RET]]
return svcntd(); return svcntd();
} }
@ -23,16 +24,14 @@ uint64_t test_svcntd_pat()
uint64_t test_svcntd_pat_1() uint64_t test_svcntd_pat_1()
{ {
// CHECK-LABEL: test_svcntd_pat_1 // CHECK-LABEL: test_svcntd_pat_1
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntd(i32 1) // CHECK: ret i64 1
// CHECK: ret i64 %[[INTRINSIC]]
return svcntd_pat(SV_VL1); return svcntd_pat(SV_VL1);
} }
uint64_t test_svcntd_pat_2() uint64_t test_svcntd_pat_2()
{ {
// CHECK-LABEL: test_svcntd_pat_2 // CHECK-LABEL: test_svcntd_pat_2
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntd(i32 2) // CHECK: ret i64 2
// CHECK: ret i64 %[[INTRINSIC]]
return svcntd_pat(SV_VL2); return svcntd_pat(SV_VL2);
} }
@ -143,7 +142,8 @@ uint64_t test_svcntd_pat_15()
uint64_t test_svcntd_pat_16() uint64_t test_svcntd_pat_16()
{ {
// CHECK-LABEL: test_svcntd_pat_16 // CHECK-LABEL: test_svcntd_pat_16
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntd(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 1
// CHECK: ret i64 %[[RET]]
return svcntd_pat(SV_ALL); return svcntd_pat(SV_ALL);
} }

View File

@ -7,8 +7,9 @@
uint64_t test_svcnth() uint64_t test_svcnth()
{ {
// CHECK-LABEL: test_svcnth // CHECK-LABEL: test_svcnth
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 3
// CHECK: ret i64 %[[RET]]
return svcnth(); return svcnth();
} }
@ -23,64 +24,56 @@ uint64_t test_svcnth_pat()
uint64_t test_svcnth_pat_1() uint64_t test_svcnth_pat_1()
{ {
// CHECK-LABEL: test_svcnth_pat_1 // CHECK-LABEL: test_svcnth_pat_1
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 1) // CHECK: ret i64 1
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL1); return svcnth_pat(SV_VL1);
} }
uint64_t test_svcnth_pat_2() uint64_t test_svcnth_pat_2()
{ {
// CHECK-LABEL: test_svcnth_pat_2 // CHECK-LABEL: test_svcnth_pat_2
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 2) // CHECK: ret i64 2
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL2); return svcnth_pat(SV_VL2);
} }
uint64_t test_svcnth_pat_3() uint64_t test_svcnth_pat_3()
{ {
// CHECK-LABEL: test_svcnth_pat_3 // CHECK-LABEL: test_svcnth_pat_3
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 3) // CHECK: ret i64 3
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL3); return svcnth_pat(SV_VL3);
} }
uint64_t test_svcnth_pat_4() uint64_t test_svcnth_pat_4()
{ {
// CHECK-LABEL: test_svcnth_pat_4 // CHECK-LABEL: test_svcnth_pat_4
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 4) // CHECK: ret i64 4
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL4); return svcnth_pat(SV_VL4);
} }
uint64_t test_svcnth_pat_5() uint64_t test_svcnth_pat_5()
{ {
// CHECK-LABEL: test_svcnth_pat_5 // CHECK-LABEL: test_svcnth_pat_5
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 5) // CHECK: ret i64 5
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL5); return svcnth_pat(SV_VL5);
} }
uint64_t test_svcnth_pat_6() uint64_t test_svcnth_pat_6()
{ {
// CHECK-LABEL: test_svcnth_pat_6 // CHECK-LABEL: test_svcnth_pat_6
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 6) // CHECK: ret i64 6
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL6); return svcnth_pat(SV_VL6);
} }
uint64_t test_svcnth_pat_7() uint64_t test_svcnth_pat_7()
{ {
// CHECK-LABEL: test_svcnth_pat_7 // CHECK-LABEL: test_svcnth_pat_7
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 7) // CHECK: ret i64 7
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL7); return svcnth_pat(SV_VL7);
} }
uint64_t test_svcnth_pat_8() uint64_t test_svcnth_pat_8()
{ {
// CHECK-LABEL: test_svcnth_pat_8 // CHECK-LABEL: test_svcnth_pat_8
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 8) // CHECK: ret i64 8
// CHECK: ret i64 %[[INTRINSIC]]
return svcnth_pat(SV_VL8); return svcnth_pat(SV_VL8);
} }
@ -143,7 +136,8 @@ uint64_t test_svcnth_pat_15()
uint64_t test_svcnth_pat_16() uint64_t test_svcnth_pat_16()
{ {
// CHECK-LABEL: test_svcnth_pat_16 // CHECK-LABEL: test_svcnth_pat_16
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cnth(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 3
// CHECK: ret i64 %[[RET]]
return svcnth_pat(SV_ALL); return svcnth_pat(SV_ALL);
} }

View File

@ -7,8 +7,9 @@
uint64_t test_svcntw() uint64_t test_svcntw()
{ {
// CHECK-LABEL: test_svcntw // CHECK-LABEL: test_svcntw
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntw(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 2
// CHECK: ret i64 %[[RET]]
return svcntw(); return svcntw();
} }
@ -23,32 +24,28 @@ uint64_t test_svcntw_pat()
uint64_t test_svcntw_pat_1() uint64_t test_svcntw_pat_1()
{ {
// CHECK-LABEL: test_svcntw_pat_1 // CHECK-LABEL: test_svcntw_pat_1
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntw(i32 1) // CHECK: ret i64 1
// CHECK: ret i64 %[[INTRINSIC]]
return svcntw_pat(SV_VL1); return svcntw_pat(SV_VL1);
} }
uint64_t test_svcntw_pat_2() uint64_t test_svcntw_pat_2()
{ {
// CHECK-LABEL: test_svcntw_pat_2 // CHECK-LABEL: test_svcntw_pat_2
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntw(i32 2) // CHECK: ret i64 2
// CHECK: ret i64 %[[INTRINSIC]]
return svcntw_pat(SV_VL2); return svcntw_pat(SV_VL2);
} }
uint64_t test_svcntw_pat_3() uint64_t test_svcntw_pat_3()
{ {
// CHECK-LABEL: test_svcntw_pat_3 // CHECK-LABEL: test_svcntw_pat_3
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntw(i32 3) // CHECK: ret i64 3
// CHECK: ret i64 %[[INTRINSIC]]
return svcntw_pat(SV_VL3); return svcntw_pat(SV_VL3);
} }
uint64_t test_svcntw_pat_4() uint64_t test_svcntw_pat_4()
{ {
// CHECK-LABEL: test_svcntw_pat_4 // CHECK-LABEL: test_svcntw_pat_4
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntw(i32 4) // CHECK: ret i64 4
// CHECK: ret i64 %[[INTRINSIC]]
return svcntw_pat(SV_VL4); return svcntw_pat(SV_VL4);
} }
@ -143,7 +140,8 @@ uint64_t test_svcntw_pat_15()
uint64_t test_svcntw_pat_16() uint64_t test_svcntw_pat_16()
{ {
// CHECK-LABEL: test_svcntw_pat_16 // CHECK-LABEL: test_svcntw_pat_16
// CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.aarch64.sve.cntw(i32 31) // CHECK: %[[INTRINSIC:.*]] = call i64 @llvm.vscale.i64()
// CHECK: ret i64 %[[INTRINSIC]] // CHECK-NEXT: %[[RET:.*]] = shl i64 %[[INTRINSIC]], 2
// CHECK: ret i64 %[[RET]]
return svcntw_pat(SV_ALL); return svcntw_pat(SV_ALL);
} }

View File

@ -642,6 +642,46 @@ static Optional<Instruction *> instCombineRDFFR(InstCombiner &IC,
return IC.replaceInstUsesWith(II, RDFFR); return IC.replaceInstUsesWith(II, RDFFR);
} }
static Optional<Instruction *>
instCombineSVECntElts(InstCombiner &IC, IntrinsicInst &II, unsigned NumElts) {
const auto Pattern = cast<ConstantInt>(II.getArgOperand(0))->getZExtValue();
if (Pattern == AArch64SVEPredPattern::all) {
LLVMContext &Ctx = II.getContext();
IRBuilder<> Builder(Ctx);
Builder.SetInsertPoint(&II);
Constant *StepVal = ConstantInt::get(II.getType(), NumElts);
auto *VScale = Builder.CreateVScale(StepVal);
VScale->takeName(&II);
return IC.replaceInstUsesWith(II, VScale);
}
unsigned MinNumElts = 0;
switch (Pattern) {
default:
return None;
case AArch64SVEPredPattern::vl1:
case AArch64SVEPredPattern::vl2:
case AArch64SVEPredPattern::vl3:
case AArch64SVEPredPattern::vl4:
case AArch64SVEPredPattern::vl5:
case AArch64SVEPredPattern::vl6:
case AArch64SVEPredPattern::vl7:
case AArch64SVEPredPattern::vl8:
MinNumElts = Pattern;
break;
case AArch64SVEPredPattern::vl16:
MinNumElts = 16;
break;
}
return NumElts >= MinNumElts
? Optional<Instruction *>(IC.replaceInstUsesWith(
II, ConstantInt::get(II.getType(), MinNumElts)))
: None;
}
Optional<Instruction *> Optional<Instruction *>
AArch64TTIImpl::instCombineIntrinsic(InstCombiner &IC, AArch64TTIImpl::instCombineIntrinsic(InstCombiner &IC,
IntrinsicInst &II) const { IntrinsicInst &II) const {
@ -661,6 +701,14 @@ AArch64TTIImpl::instCombineIntrinsic(InstCombiner &IC,
case Intrinsic::aarch64_sve_lasta: case Intrinsic::aarch64_sve_lasta:
case Intrinsic::aarch64_sve_lastb: case Intrinsic::aarch64_sve_lastb:
return instCombineSVELast(IC, II); return instCombineSVELast(IC, II);
case Intrinsic::aarch64_sve_cntd:
return instCombineSVECntElts(IC, II, 2);
case Intrinsic::aarch64_sve_cntw:
return instCombineSVECntElts(IC, II, 4);
case Intrinsic::aarch64_sve_cnth:
return instCombineSVECntElts(IC, II, 8);
case Intrinsic::aarch64_sve_cntb:
return instCombineSVECntElts(IC, II, 16);
} }
return None; return None;

View File

@ -0,0 +1,247 @@
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -S -instcombine < %s | FileCheck %s
target triple = "aarch64-unknown-linux-gnu"
;
; CNTB
;
define i64 @cntb_vl1() {
; CHECK-LABEL: @cntb_vl1(
; CHECK-NEXT: ret i64 1
;
%out = call i64 @llvm.aarch64.sve.cntb(i32 1)
ret i64 %out
}
define i64 @cntb_vl2() {
; CHECK-LABEL: @cntb_vl2(
; CHECK-NEXT: ret i64 2
;
%out = call i64 @llvm.aarch64.sve.cntb(i32 2)
ret i64 %out
}
define i64 @cntb_vl4() {
; CHECK-LABEL: @cntb_vl4(
; CHECK-NEXT: ret i64 4
;
%out = call i64 @llvm.aarch64.sve.cntb(i32 4)
ret i64 %out
}
define i64 @cntb_mul3() {
; CHECK-LABEL: @cntb_mul3(
; CHECK-NEXT: ret i64 24
;
%cnt = call i64 @llvm.aarch64.sve.cntb(i32 8)
%out = mul i64 %cnt, 3
ret i64 %out
}
define i64 @cntb_mul4() {
; CHECK-LABEL: @cntb_mul4(
; CHECK-NEXT: ret i64 64
;
%cnt = call i64 @llvm.aarch64.sve.cntb(i32 9)
%out = mul i64 %cnt, 4
ret i64 %out
}
define i64 @cntb_all() {
; CHECK-LABEL: @cntb_all(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.vscale.i64()
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[TMP1]], 4
; CHECK-NEXT: ret i64 [[OUT]]
;
%out = call i64 @llvm.aarch64.sve.cntb(i32 31)
ret i64 %out
}
;
; CNTH
;
define i64 @cnth_vl1() {
; CHECK-LABEL: @cnth_vl1(
; CHECK-NEXT: ret i64 1
;
%out = call i64 @llvm.aarch64.sve.cnth(i32 1)
ret i64 %out
}
define i64 @cnth_vl2() {
; CHECK-LABEL: @cnth_vl2(
; CHECK-NEXT: ret i64 2
;
%out = call i64 @llvm.aarch64.sve.cnth(i32 2)
ret i64 %out
}
define i64 @cnth_vl4() {
; CHECK-LABEL: @cnth_vl4(
; CHECK-NEXT: ret i64 4
;
%out = call i64 @llvm.aarch64.sve.cnth(i32 4)
ret i64 %out
}
define i64 @cnth_mul3() {
; CHECK-LABEL: @cnth_mul3(
; CHECK-NEXT: ret i64 24
;
%cnt = call i64 @llvm.aarch64.sve.cnth(i32 8)
%out = mul i64 %cnt, 3
ret i64 %out
}
define i64 @cnth_mul4() {
; CHECK-LABEL: @cnth_mul4(
; CHECK-NEXT: [[CNT:%.*]] = call i64 @llvm.aarch64.sve.cnth(i32 9)
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[CNT]], 2
; CHECK-NEXT: ret i64 [[OUT]]
;
%cnt = call i64 @llvm.aarch64.sve.cnth(i32 9)
%out = mul i64 %cnt, 4
ret i64 %out
}
define i64 @cnth_all() {
; CHECK-LABEL: @cnth_all(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.vscale.i64()
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[TMP1]], 3
; CHECK-NEXT: ret i64 [[OUT]]
;
%out = call i64 @llvm.aarch64.sve.cnth(i32 31)
ret i64 %out
}
;
; CNTW
;
define i64 @cntw_vl1() {
; CHECK-LABEL: @cntw_vl1(
; CHECK-NEXT: ret i64 1
;
%out = call i64 @llvm.aarch64.sve.cntw(i32 1)
ret i64 %out
}
define i64 @cntw_vl2() {
; CHECK-LABEL: @cntw_vl2(
; CHECK-NEXT: ret i64 2
;
%out = call i64 @llvm.aarch64.sve.cntw(i32 2)
ret i64 %out
}
define i64 @cntw_vl4() {
; CHECK-LABEL: @cntw_vl4(
; CHECK-NEXT: ret i64 4
;
%out = call i64 @llvm.aarch64.sve.cntw(i32 4)
ret i64 %out
}
define i64 @cntw_mul3() {
; CHECK-LABEL: @cntw_mul3(
; CHECK-NEXT: [[CNT:%.*]] = call i64 @llvm.aarch64.sve.cntw(i32 8)
; CHECK-NEXT: [[OUT:%.*]] = mul i64 [[CNT]], 3
; CHECK-NEXT: ret i64 [[OUT]]
;
%cnt = call i64 @llvm.aarch64.sve.cntw(i32 8)
%out = mul i64 %cnt, 3
ret i64 %out
}
define i64 @cntw_mul4() {
; CHECK-LABEL: @cntw_mul4(
; CHECK-NEXT: [[CNT:%.*]] = call i64 @llvm.aarch64.sve.cntw(i32 9)
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[CNT]], 2
; CHECK-NEXT: ret i64 [[OUT]]
;
%cnt = call i64 @llvm.aarch64.sve.cntw(i32 9)
%out = mul i64 %cnt, 4
ret i64 %out
}
define i64 @cntw_all() {
; CHECK-LABEL: @cntw_all(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.vscale.i64()
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[TMP1]], 2
; CHECK-NEXT: ret i64 [[OUT]]
;
%out = call i64 @llvm.aarch64.sve.cntw(i32 31)
ret i64 %out
}
;
; CNTD
;
define i64 @cntd_vl1() {
; CHECK-LABEL: @cntd_vl1(
; CHECK-NEXT: ret i64 1
;
%out = call i64 @llvm.aarch64.sve.cntd(i32 1)
ret i64 %out
}
define i64 @cntd_vl2() {
; CHECK-LABEL: @cntd_vl2(
; CHECK-NEXT: ret i64 2
;
%out = call i64 @llvm.aarch64.sve.cntd(i32 2)
ret i64 %out
}
define i64 @cntd_vl4() {
; CHECK-LABEL: @cntd_vl4(
; CHECK-NEXT: [[OUT:%.*]] = call i64 @llvm.aarch64.sve.cntd(i32 4)
; CHECK-NEXT: ret i64 [[OUT]]
;
%out = call i64 @llvm.aarch64.sve.cntd(i32 4)
ret i64 %out
}
define i64 @cntd_mul3() {
; CHECK-LABEL: @cntd_mul3(
; CHECK-NEXT: [[CNT:%.*]] = call i64 @llvm.aarch64.sve.cntd(i32 8)
; CHECK-NEXT: [[OUT:%.*]] = mul i64 [[CNT]], 3
; CHECK-NEXT: ret i64 [[OUT]]
;
%cnt = call i64 @llvm.aarch64.sve.cntd(i32 8)
%out = mul i64 %cnt, 3
ret i64 %out
}
define i64 @cntd_mul4() {
; CHECK-LABEL: @cntd_mul4(
; CHECK-NEXT: [[CNT:%.*]] = call i64 @llvm.aarch64.sve.cntd(i32 9)
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[CNT]], 2
; CHECK-NEXT: ret i64 [[OUT]]
;
%cnt = call i64 @llvm.aarch64.sve.cntd(i32 9)
%out = mul i64 %cnt, 4
ret i64 %out
}
define i64 @cntd_all() {
; CHECK-LABEL: @cntd_all(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.vscale.i64()
; CHECK-NEXT: [[OUT:%.*]] = shl i64 [[TMP1]], 1
; CHECK-NEXT: ret i64 [[OUT]]
;
%out = call i64 @llvm.aarch64.sve.cntd(i32 31)
ret i64 %out
}
declare i64 @llvm.aarch64.sve.cntb(i32 %pattern)
declare i64 @llvm.aarch64.sve.cnth(i32 %pattern)
declare i64 @llvm.aarch64.sve.cntw(i32 %pattern)
declare i64 @llvm.aarch64.sve.cntd(i32 %pattern)