forked from OSchip/llvm-project
[PowerPC] Enable default support of quad precision operations
Summary: Remove option guarding support of quad precision operations. Reviewers: nemanjai, #powerpc, steven.zhang Reviewed By: nemanjai, #powerpc, steven.zhang Subscribers: qiucf, wuzish, nemanjai, hiraditya, kbarton, shchenz, llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D83437
This commit is contained in:
parent
fdb7856d54
commit
90b1a710ae
|
@ -117,9 +117,6 @@ cl::desc("disable sibling call optimization on ppc"), cl::Hidden);
|
|||
static cl::opt<bool> DisableInnermostLoopAlign32("disable-ppc-innermost-loop-align32",
|
||||
cl::desc("don't always align innermost loop to 32 bytes on ppc"), cl::Hidden);
|
||||
|
||||
static cl::opt<bool> EnableQuadPrecision("enable-ppc-quad-precision",
|
||||
cl::desc("enable quad precision float support on ppc"), cl::Hidden);
|
||||
|
||||
static cl::opt<bool> UseAbsoluteJumpTables("ppc-use-absolute-jumptables",
|
||||
cl::desc("use absolute jump tables on ppc"), cl::Hidden);
|
||||
|
||||
|
@ -1004,7 +1001,6 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
|
|||
setOperationAction(ISD::SRL, MVT::v1i128, Legal);
|
||||
setOperationAction(ISD::SRA, MVT::v1i128, Expand);
|
||||
|
||||
if (EnableQuadPrecision) {
|
||||
addRegisterClass(MVT::f128, &PPC::VRRCRegClass);
|
||||
setOperationAction(ISD::FADD, MVT::f128, Legal);
|
||||
setOperationAction(ISD::FSUB, MVT::f128, Legal);
|
||||
|
@ -1058,7 +1054,6 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
|
|||
setOperationAction(ISD::STRICT_FCEIL, MVT::f128, Legal);
|
||||
setOperationAction(ISD::STRICT_FTRUNC, MVT::f128, Legal);
|
||||
setOperationAction(ISD::STRICT_FROUND, MVT::f128, Legal);
|
||||
}
|
||||
setOperationAction(ISD::FP_EXTEND, MVT::v2f32, Custom);
|
||||
setOperationAction(ISD::BSWAP, MVT::v8i16, Legal);
|
||||
setOperationAction(ISD::BSWAP, MVT::v4i32, Legal);
|
||||
|
@ -1307,7 +1302,6 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
|
|||
setTargetDAGCombine(ISD::VSELECT);
|
||||
}
|
||||
|
||||
if (EnableQuadPrecision) {
|
||||
setLibcallName(RTLIB::LOG_F128, "logf128");
|
||||
setLibcallName(RTLIB::LOG2_F128, "log2f128");
|
||||
setLibcallName(RTLIB::LOG10_F128, "log10f128");
|
||||
|
@ -1320,7 +1314,6 @@ PPCTargetLowering::PPCTargetLowering(const PPCTargetMachine &TM,
|
|||
setLibcallName(RTLIB::FMAX_F128, "fmaxf128");
|
||||
setLibcallName(RTLIB::POWI_F128, "__powikf2");
|
||||
setLibcallName(RTLIB::REM_F128, "fmodf128");
|
||||
}
|
||||
|
||||
// With 32 condition bits, we don't need to sink (and duplicate) compares
|
||||
// aggressively in CodeGenPrep.
|
||||
|
@ -8308,7 +8301,7 @@ SDValue PPCTargetLowering::LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
|
|||
const SDLoc &dl) const {
|
||||
|
||||
// FP to INT conversions are legal for f128.
|
||||
if (EnableQuadPrecision && (Op->getOperand(0).getValueType() == MVT::f128))
|
||||
if (Op->getOperand(0).getValueType() == MVT::f128)
|
||||
return Op;
|
||||
|
||||
// Expand ppcf128 to i32 by hand for the benefit of llvm-gcc bootstrap on
|
||||
|
@ -8576,7 +8569,7 @@ SDValue PPCTargetLowering::LowerINT_TO_FP(SDValue Op,
|
|||
return LowerINT_TO_FPVector(Op, DAG, dl);
|
||||
|
||||
// Conversions to f128 are legal.
|
||||
if (EnableQuadPrecision && (Op.getValueType() == MVT::f128))
|
||||
if (Op.getValueType() == MVT::f128)
|
||||
return Op;
|
||||
|
||||
if (Subtarget.hasQPX() && Op.getOperand(0).getValueType() == MVT::v4i1) {
|
||||
|
@ -9104,8 +9097,7 @@ SDValue PPCTargetLowering::LowerBITCAST(SDValue Op, SelectionDAG &DAG) const {
|
|||
SDLoc dl(Op);
|
||||
SDValue Op0 = Op->getOperand(0);
|
||||
|
||||
if (!EnableQuadPrecision ||
|
||||
(Op.getValueType() != MVT::f128 ) ||
|
||||
if ((Op.getValueType() != MVT::f128) ||
|
||||
(Op0.getOpcode() != ISD::BUILD_PAIR) ||
|
||||
(Op0.getOperand(0).getValueType() != MVT::i64) ||
|
||||
(Op0.getOperand(1).getValueType() != MVT::i64))
|
||||
|
@ -16373,7 +16365,7 @@ bool PPCTargetLowering::isFMAFasterThanFMulAndFAdd(const Function &F,
|
|||
case Type::DoubleTyID:
|
||||
return true;
|
||||
case Type::FP128TyID:
|
||||
return EnableQuadPrecision && Subtarget.hasP9Vector();
|
||||
return Subtarget.hasP9Vector();
|
||||
default:
|
||||
return false;
|
||||
}
|
||||
|
|
|
@ -1,6 +1,5 @@
|
|||
; RUN: llc -verify-machineinstrs -mcpu=pwr9 -enable-ppc-quad-precision \
|
||||
; RUN: -mtriple=powerpc64le-unknown-unknown -ppc-vsr-nums-as-vr \
|
||||
; RUN: -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: llc -verify-machineinstrs -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
|
||||
@A = common global fp128 0xL00000000000000000000000000000000, align 16
|
||||
@B = common global fp128 0xL00000000000000000000000000000000, align 16
|
||||
|
|
|
@ -1,6 +1,5 @@
|
|||
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
|
||||
; RUN: -mcpu=future -enable-ppc-quad-precision -ppc-asm-full-reg-names \
|
||||
; RUN: < %s | FileCheck %s
|
||||
; RUN: -mcpu=future -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
|
||||
define float @FloatConstantPool() {
|
||||
; CHECK-LABEL: FloatConstantPool:
|
||||
|
|
|
@ -1,9 +1,8 @@
|
|||
; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: -verify-machineinstrs -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
|
||||
; RUN: | FileCheck %s
|
||||
; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
|
||||
; RUN: -verify-machineinstrs -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
|
||||
; RUN: | FileCheck -check-prefix=CHECK-BE %s
|
||||
|
||||
; Testing homogeneous aggregates.
|
||||
|
|
|
@ -1,5 +1,4 @@
|
|||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown -verify-machineinstrs \
|
||||
; RUN: -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | FileCheck %s
|
||||
|
||||
; Function Attrs: norecurse nounwind
|
||||
|
|
|
@ -1,10 +1,8 @@
|
|||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown -verify-machineinstrs \
|
||||
; RUN: -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | FileCheck %s
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: -ppc-asm-full-reg-names \
|
||||
; RUN: -ppc-vsr-nums-as-vr < %s | FileCheck %s --check-prefix=CHECK-BE
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown -verify-machineinstrs \
|
||||
; RUN: -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
|
||||
; RUN: FileCheck %s --check-prefix=CHECK-BE
|
||||
|
||||
; Function Attrs: norecurse nounwind readnone
|
||||
define i64 @getPart1(fp128 %in) local_unnamed_addr {
|
||||
|
|
|
@ -1,5 +1,4 @@
|
|||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown -verify-machineinstrs \
|
||||
; RUN: -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | FileCheck %s
|
||||
|
||||
@a_qp = common global fp128 0xL00000000000000000000000000000000, align 16
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -ppc-vsr-nums-as-vr \
|
||||
; RUN: -verify-machineinstrs -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: -ppc-vsr-nums-as-vr -verify-machineinstrs -ppc-asm-full-reg-names < %s \
|
||||
; RUN: | FileCheck %s
|
||||
|
||||
@mem = global [5 x i64] [i64 56, i64 63, i64 3, i64 5, i64 6], align 8
|
||||
@umem = global [5 x i64] [i64 560, i64 100, i64 34, i64 2, i64 5], align 8
|
||||
|
|
|
@ -1,6 +1,5 @@
|
|||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -ppc-vsr-nums-as-vr \
|
||||
; RUN: -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
|
||||
define void @qpFmadd(fp128* nocapture readonly %a, fp128* nocapture %b,
|
||||
fp128* nocapture readonly %c, fp128* nocapture %res) {
|
||||
|
|
|
@ -1,5 +1,4 @@
|
|||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -ppc-vsr-nums-as-vr \
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown -ppc-vsr-nums-as-vr \
|
||||
; RUN: -verify-machineinstrs -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
|
||||
; Function Attrs: norecurse nounwind readnone
|
||||
|
|
|
@ -1,5 +1,4 @@
|
|||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown -verify-machineinstrs \
|
||||
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
|
||||
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -verify-machineinstrs -enable-ppc-quad-precision \
|
||||
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: -verify-machineinstrs -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
|
||||
; RUN: | FileCheck %s
|
||||
|
||||
@f128Array = global [4 x fp128] [fp128 0xL00000000000000004004C00000000000,
|
||||
fp128 0xLF000000000000000400808AB851EB851,
|
||||
|
|
|
@ -1,10 +1,10 @@
|
|||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown -ppc-vsr-nums-as-vr \
|
||||
; RUN: -relocation-model=pic -ppc-asm-full-reg-names -verify-machineinstrs \
|
||||
; RUN: -enable-ppc-quad-precision < %s | FileCheck %s
|
||||
; RUN: < %s | FileCheck %s
|
||||
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown -ppc-vsr-nums-as-vr \
|
||||
; RUN: -ppc-asm-full-reg-names -verify-machineinstrs \
|
||||
; RUN: -enable-ppc-quad-precision < %s | FileCheck %s -check-prefix=CHECK-BE
|
||||
; RUN: < %s | FileCheck %s -check-prefix=CHECK-BE
|
||||
|
||||
; Vector extract DWord and convert to quad precision.
|
||||
|
||||
|
|
|
@ -52,24 +52,22 @@ define signext i32 @test() nounwind {
|
|||
; CHECK-NEXT: addis 3, 2, a10@toc@ha
|
||||
; CHECK-NEXT: lfd 10, a10@toc@l(3)
|
||||
; CHECK-NEXT: addis 3, 2, a11@toc@ha
|
||||
; CHECK-NEXT: addis 6, 2, a17@toc@ha
|
||||
; CHECK-NEXT: lfd 11, a11@toc@l(3)
|
||||
; CHECK-NEXT: addis 3, 2, a12@toc@ha
|
||||
; CHECK-NEXT: addis 5, 2, a16@toc@ha
|
||||
; CHECK-NEXT: addis 6, 2, a17@toc@ha
|
||||
; CHECK-NEXT: addi 6, 6, a17@toc@l
|
||||
; CHECK-NEXT: addi 5, 5, a16@toc@l
|
||||
; CHECK-NEXT: lxvx 34, 0, 6
|
||||
; CHECK-NEXT: lfd 12, a12@toc@l(3)
|
||||
; CHECK-NEXT: addis 3, 2, a13@toc@ha
|
||||
; CHECK-NEXT: addi 5, 5, a16@toc@l
|
||||
; CHECK-NEXT: addis 4, 2, a15@toc@ha
|
||||
; CHECK-NEXT: lxvx 0, 0, 5
|
||||
; CHECK-NEXT: ld 4, a15@toc@l(4)
|
||||
; CHECK-NEXT: li 5, 168
|
||||
; CHECK-NEXT: lfd 11, a11@toc@l(3)
|
||||
; CHECK-NEXT: addis 3, 2, a12@toc@ha
|
||||
; CHECK-NEXT: lfd 12, a12@toc@l(3)
|
||||
; CHECK-NEXT: addis 3, 2, a13@toc@ha
|
||||
; CHECK-NEXT: li 5, 152
|
||||
; CHECK-NEXT: lfd 13, a13@toc@l(3)
|
||||
; CHECK-NEXT: addis 3, 2, a14@toc@ha
|
||||
; CHECK-NEXT: ld 3, a14@toc@l(3)
|
||||
; CHECK-NEXT: stxvx 34, 1, 5
|
||||
; CHECK-NEXT: li 5, 152
|
||||
; CHECK-NEXT: stxvx 0, 1, 5
|
||||
; CHECK-NEXT: std 4, 144(1)
|
||||
; CHECK-NEXT: std 3, 136(1)
|
||||
|
|
|
@ -1,5 +1,6 @@
|
|||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
||||
; RUN: llc -verify-machineinstrs -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s -mtriple=powerpc64le-unknown-linux -mcpu=pwr9 -enable-ppc-quad-precision=true | FileCheck %s
|
||||
; RUN: llc -verify-machineinstrs -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \
|
||||
; RUN: < %s -mtriple=powerpc64le-unknown-linux -mcpu=pwr9 | FileCheck %s
|
||||
|
||||
declare fp128 @llvm.experimental.constrained.fadd.f128(fp128, fp128, metadata, metadata)
|
||||
declare fp128 @llvm.experimental.constrained.fsub.f128(fp128, fp128, metadata, metadata)
|
||||
|
|
|
@ -1,7 +1,7 @@
|
|||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
||||
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
|
||||
; RUN: -mcpu=future -enable-ppc-quad-precision -ppc-asm-full-reg-names \
|
||||
; RUN: -ppc-vsr-nums-as-vr < %s | FileCheck %s
|
||||
; RUN: -mcpu=future -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s \
|
||||
; RUN: | FileCheck %s
|
||||
|
||||
@_ZL13StaticBoolVar = internal unnamed_addr global i8 0, align 1
|
||||
@_ZL19StaticSignedCharVar = internal unnamed_addr global i8 0, align 1
|
||||
|
|
|
@ -1,7 +1,7 @@
|
|||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
||||
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
|
||||
; RUN: -mcpu=future -enable-ppc-quad-precision -ppc-asm-full-reg-names \
|
||||
; RUN: -ppc-vsr-nums-as-vr < %s | FileCheck %s
|
||||
; RUN: -mcpu=future -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s \
|
||||
; RUN: | FileCheck %s
|
||||
|
||||
%struct.Struct = type { i8, i16, i32 }
|
||||
|
||||
|
|
|
@ -1,5 +1,5 @@
|
|||
; RUN: llc -verify-machineinstrs -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -enable-ppc-quad-precision -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: -ppc-asm-full-reg-names < %s | FileCheck %s
|
||||
; RUN: llc -verify-machineinstrs -mcpu=pwr8 -mtriple=powerpc64le-unknown-unknown \
|
||||
; RUN: -ppc-asm-full-reg-names < %s | FileCheck %s -check-prefix=CHECK-PWR8 \
|
||||
; RUN: -implicit-check-not "\<setb\>"
|
||||
|
|
|
@ -1176,14 +1176,7 @@ define fp128 @hoo5_fmf(fp128 %a) #1 {
|
|||
;
|
||||
; CHECK-P9-LABEL: hoo5_fmf:
|
||||
; CHECK-P9: # %bb.0:
|
||||
; CHECK-P9-NEXT: mflr 0
|
||||
; CHECK-P9-NEXT: std 0, 16(1)
|
||||
; CHECK-P9-NEXT: stdu 1, -32(1)
|
||||
; CHECK-P9-NEXT: bl sqrtl
|
||||
; CHECK-P9-NEXT: nop
|
||||
; CHECK-P9-NEXT: addi 1, 1, 32
|
||||
; CHECK-P9-NEXT: ld 0, 16(1)
|
||||
; CHECK-P9-NEXT: mtlr 0
|
||||
; CHECK-P9-NEXT: xssqrtqp 2, 2
|
||||
; CHECK-P9-NEXT: blr
|
||||
%r = call reassoc ninf afn fp128 @llvm.sqrt.f128(fp128 %a)
|
||||
ret fp128 %r
|
||||
|
@ -1216,14 +1209,7 @@ define fp128 @hoo5_safe(fp128 %a) #1 {
|
|||
;
|
||||
; CHECK-P9-LABEL: hoo5_safe:
|
||||
; CHECK-P9: # %bb.0:
|
||||
; CHECK-P9-NEXT: mflr 0
|
||||
; CHECK-P9-NEXT: std 0, 16(1)
|
||||
; CHECK-P9-NEXT: stdu 1, -32(1)
|
||||
; CHECK-P9-NEXT: bl sqrtl
|
||||
; CHECK-P9-NEXT: nop
|
||||
; CHECK-P9-NEXT: addi 1, 1, 32
|
||||
; CHECK-P9-NEXT: ld 0, 16(1)
|
||||
; CHECK-P9-NEXT: mtlr 0
|
||||
; CHECK-P9-NEXT: xssqrtqp 2, 2
|
||||
; CHECK-P9-NEXT: blr
|
||||
%r = call fp128 @llvm.sqrt.f128(fp128 %a)
|
||||
ret fp128 %r
|
||||
|
|
Loading…
Reference in New Issue