forked from OSchip/llvm-project
[ARM] Use correct half-precision functions in EABI mode
The ARM RTABI defines the conversion functions between half- and single-precision floats with an __aeabi prefix (__aeabi_h2f, __aeabi_f2h), but libgcc only provides them with a __gnu prefix (__gnu_h2f_ieee, __gnu_f2h_ieee). Therefore we need to emit the __aeabi versions when compiling with an eabi or eabihf triple, and the __gnu versions when compiling with a gnueabi or gnueabihf triple. llvm-svn: 249565
This commit is contained in:
parent
13d21e9ae1
commit
d3d114ba54
|
@ -396,6 +396,14 @@ ARMTargetLowering::ARMTargetLowering(const TargetMachine &TM,
|
||||||
setLibcallCallingConv(RTLIB::FPEXT_F16_F32, CallingConv::ARM_APCS);
|
setLibcallCallingConv(RTLIB::FPEXT_F16_F32, CallingConv::ARM_APCS);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// In EABI, these functions have an __aeabi_ prefix, but in GNUEABI they have
|
||||||
|
// a __gnu_ prefix (which is the default).
|
||||||
|
if (Subtarget->isTargetAEABI()) {
|
||||||
|
setLibcallName(RTLIB::FPROUND_F32_F16, "__aeabi_f2h");
|
||||||
|
setLibcallName(RTLIB::FPROUND_F64_F16, "__aeabi_d2h");
|
||||||
|
setLibcallName(RTLIB::FPEXT_F16_F32, "__aeabi_h2f");
|
||||||
|
}
|
||||||
|
|
||||||
if (Subtarget->isThumb1Only())
|
if (Subtarget->isThumb1Only())
|
||||||
addRegisterClass(MVT::i32, &ARM::tGPRRegClass);
|
addRegisterClass(MVT::i32, &ARM::tGPRRegClass);
|
||||||
else
|
else
|
||||||
|
|
|
@ -1,7 +1,9 @@
|
||||||
; RUN: llc < %s | FileCheck %s
|
; RUN: llc -mtriple=armv7a--none-eabi < %s | FileCheck --check-prefix=CHECK --check-prefix=CHECK-HARDFLOAT-EABI %s
|
||||||
; RUN: llc -mattr=+vfp3,+fp16 < %s | FileCheck --check-prefix=CHECK-FP16 %s
|
; RUN: llc -mtriple=armv7a--none-gnueabi < %s | FileCheck --check-prefix=CHECK --check-prefix=CHECK-HARDFLOAT-GNU %s
|
||||||
; RUN: llc -mtriple=armv8-eabihf < %s | FileCheck --check-prefix=CHECK-ARMV8 %s
|
; RUN: llc -mattr=+vfp3,+fp16 < %s | FileCheck --check-prefix=CHECK --check-prefix=CHECK-FP16 %s
|
||||||
; RUN: llc -mtriple=thumbv7m-eabi < %s | FileCheck --check-prefix=CHECK-SOFTFLOAT %s
|
; RUN: llc -mtriple=armv8-eabihf < %s | FileCheck --check-prefix=CHECK --check-prefix=CHECK-ARMV8 %s
|
||||||
|
; RUN: llc -mtriple=thumbv7m-eabi < %s | FileCheck --check-prefix=CHECK --check-prefix=CHECK-SOFTFLOAT-EABI %s
|
||||||
|
; RUN: llc -mtriple=thumbv7m-gnueabi < %s | FileCheck --check-prefix=CHECK --check-prefix=CHECK-SOFTFLOAT-GNU %s
|
||||||
|
|
||||||
target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-n32"
|
target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-n32"
|
||||||
target triple = "armv7---eabihf"
|
target triple = "armv7---eabihf"
|
||||||
|
@ -12,41 +14,45 @@ target triple = "armv7---eabihf"
|
||||||
|
|
||||||
define void @foo() nounwind {
|
define void @foo() nounwind {
|
||||||
; CHECK-LABEL: foo:
|
; CHECK-LABEL: foo:
|
||||||
; CHECK-FP16-LABEL: foo:
|
|
||||||
; CHECK-ARMV8-LABEL: foo:
|
|
||||||
; CHECK-SOFTFLOAT-LABEL: foo:
|
|
||||||
entry:
|
entry:
|
||||||
%0 = load i16, i16* @x, align 2
|
%0 = load i16, i16* @x, align 2
|
||||||
%1 = load i16, i16* @y, align 2
|
%1 = load i16, i16* @y, align 2
|
||||||
%2 = tail call float @llvm.convert.from.fp16.f32(i16 %0)
|
%2 = tail call float @llvm.convert.from.fp16.f32(i16 %0)
|
||||||
; CHECK: __gnu_h2f_ieee
|
; CHECK-HARDFLOAT-EABI: __aeabi_h2f
|
||||||
|
; CHECK-HARDFLOAT-GNU: __gnu_h2f_ieee
|
||||||
; CHECK-FP16: vcvtb.f32.f16
|
; CHECK-FP16: vcvtb.f32.f16
|
||||||
; CHECK-ARMv8: vcvtb.f32.f16
|
; CHECK-ARMv8: vcvtb.f32.f16
|
||||||
; CHECK-SOFTFLOAT: __gnu_h2f_ieee
|
; CHECK-SOFTFLOAT-EABI: __aeabi_h2f
|
||||||
|
; CHECK-SOFTFLOAT-GNU: __gnu_h2f_ieee
|
||||||
%3 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
|
%3 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
|
||||||
; CHECK: __gnu_h2f_ieee
|
; CHECK-HARDFLOAT-EABI: __aeabi_h2f
|
||||||
|
; CHECK-HARDFLOAT-GNU: __gnu_h2f_ieee
|
||||||
; CHECK-FP16: vcvtb.f32.f16
|
; CHECK-FP16: vcvtb.f32.f16
|
||||||
; CHECK-ARMV8: vcvtb.f32.f16
|
; CHECK-ARMV8: vcvtb.f32.f16
|
||||||
; CHECK-SOFTFLOAT: __gnu_h2f_ieee
|
; CHECK-SOFTFLOAT-EABI: __aeabi_h2f
|
||||||
|
; CHECK-SOFTFLOAT-GNU: __gnu_h2f_ieee
|
||||||
%4 = fadd float %2, %3
|
%4 = fadd float %2, %3
|
||||||
%5 = tail call i16 @llvm.convert.to.fp16.f32(float %4)
|
%5 = tail call i16 @llvm.convert.to.fp16.f32(float %4)
|
||||||
; CHECK: __gnu_f2h_ieee
|
; CHECK-HARDFLOAT-EABI: __aeabi_f2h
|
||||||
|
; CHECK-HARDFLOAT-GNU: __gnu_f2h_ieee
|
||||||
; CHECK-FP16: vcvtb.f16.f32
|
; CHECK-FP16: vcvtb.f16.f32
|
||||||
; CHECK-ARMV8: vcvtb.f16.f32
|
; CHECK-ARMV8: vcvtb.f16.f32
|
||||||
; CHECK-SOFTFLOAT: __gnu_f2h_ieee
|
; CHECK-SOFTFLOAT-EABI: __aeabi_f2h
|
||||||
|
; CHECK-SOFTFLOAT-GNU: __gnu_f2h_ieee
|
||||||
store i16 %5, i16* @x, align 2
|
store i16 %5, i16* @x, align 2
|
||||||
ret void
|
ret void
|
||||||
}
|
}
|
||||||
|
|
||||||
define double @test_from_fp16(i16 %in) {
|
define double @test_from_fp16(i16 %in) {
|
||||||
; CHECK-LABEL: test_from_fp16:
|
; CHECK-LABEL: test_from_fp16:
|
||||||
; CHECK-FP16-LABEL: test_from_fp16:
|
|
||||||
; CHECK-ARMV8-LABEL: test_from_fp16:
|
|
||||||
; CHECK-SOFTFLOAT-LABEL: test_from_fp16:
|
|
||||||
%val = call double @llvm.convert.from.fp16.f64(i16 %in)
|
%val = call double @llvm.convert.from.fp16.f64(i16 %in)
|
||||||
; CHECK: bl __gnu_h2f_ieee
|
; CHECK-HARDFLOAT-EABI: bl __aeabi_h2f
|
||||||
; CHECK: vmov [[TMP:s[0-9]+]], r0
|
; CHECK-HARDFLOAT-EABI: vmov [[TMP:s[0-9]+]], r0
|
||||||
; CHECK: vcvt.f64.f32 d0, [[TMP]]
|
; CHECK-HARDFLOAT-EABI: vcvt.f64.f32 {{d[0-9]+}}, [[TMP]]
|
||||||
|
|
||||||
|
; CHECK-HARDFLOAT-GNU: bl __gnu_h2f_ieee
|
||||||
|
; CHECK-HARDFLOAT-GNU: vmov [[TMP:s[0-9]+]], r0
|
||||||
|
; CHECK-HARDFLOAT-GNU: vcvt.f64.f32 {{d[0-9]+}}, [[TMP]]
|
||||||
|
|
||||||
; CHECK-FP16: vmov [[TMP16:s[0-9]+]], r0
|
; CHECK-FP16: vmov [[TMP16:s[0-9]+]], r0
|
||||||
; CHECK-FP16: vcvtb.f32.f16 [[TMP32:s[0-9]+]], [[TMP16]]
|
; CHECK-FP16: vcvtb.f32.f16 [[TMP32:s[0-9]+]], [[TMP16]]
|
||||||
|
@ -55,25 +61,29 @@ define double @test_from_fp16(i16 %in) {
|
||||||
; CHECK-ARMV8: vmov [[TMP:s[0-9]+]], r0
|
; CHECK-ARMV8: vmov [[TMP:s[0-9]+]], r0
|
||||||
; CHECK-ARMV8: vcvtb.f64.f16 d0, [[TMP]]
|
; CHECK-ARMV8: vcvtb.f64.f16 d0, [[TMP]]
|
||||||
|
|
||||||
; CHECK-SOFTFLOAT: bl __gnu_h2f_ieee
|
; CHECK-SOFTFLOAT-EABI: bl __aeabi_h2f
|
||||||
; CHECK-SOFTFLOAT: bl __aeabi_f2d
|
; CHECK-SOFTFLOAT-EABI: bl __aeabi_f2d
|
||||||
|
|
||||||
|
; CHECK-SOFTFLOAT-GNU: bl __gnu_h2f_ieee
|
||||||
|
; CHECK-SOFTFLOAT-GNU: bl __aeabi_f2d
|
||||||
ret double %val
|
ret double %val
|
||||||
}
|
}
|
||||||
|
|
||||||
define i16 @test_to_fp16(double %in) {
|
define i16 @test_to_fp16(double %in) {
|
||||||
; CHECK-LABEL: test_to_fp16:
|
; CHECK-LABEL: test_to_fp16:
|
||||||
; CHECK-FP16-LABEL: test_to_fp16:
|
|
||||||
; CHECK-ARMV8-LABEL: test_to_fp16:
|
|
||||||
; CHECK-SOFTFLOAT-LABEL: test_to_fp16:
|
|
||||||
%val = call i16 @llvm.convert.to.fp16.f64(double %in)
|
%val = call i16 @llvm.convert.to.fp16.f64(double %in)
|
||||||
; CHECK: bl __aeabi_d2h
|
; CHECK-HARDFLOAT-EABI: bl __aeabi_d2h
|
||||||
|
|
||||||
|
; CHECK-HARDFLOAT-GNU: bl __aeabi_d2h
|
||||||
|
|
||||||
; CHECK-FP16: bl __aeabi_d2h
|
; CHECK-FP16: bl __aeabi_d2h
|
||||||
|
|
||||||
; CHECK-ARMV8: vcvtb.f16.f64 [[TMP:s[0-9]+]], d0
|
; CHECK-ARMV8: vcvtb.f16.f64 [[TMP:s[0-9]+]], d0
|
||||||
; CHECK-ARMV8: vmov r0, [[TMP]]
|
; CHECK-ARMV8: vmov r0, [[TMP]]
|
||||||
|
|
||||||
; CHECK-SOFTFLOAT: bl __aeabi_d2h
|
; CHECK-SOFTFLOAT-EABI: bl __aeabi_d2h
|
||||||
|
|
||||||
|
; CHECK-SOFTFLOAT-GNU: bl __aeabi_d2h
|
||||||
ret i16 %val
|
ret i16 %val
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -215,7 +215,7 @@ define i16 @d_to_h(double %a) {
|
||||||
declare double @llvm.convert.from.fp16.f64(i16 %a)
|
declare double @llvm.convert.from.fp16.f64(i16 %a)
|
||||||
define double @h_to_d(i16 %a) {
|
define double @h_to_d(i16 %a) {
|
||||||
; CHECK-LABEL: h_to_d:
|
; CHECK-LABEL: h_to_d:
|
||||||
; NONE: bl __gnu_h2f_ieee
|
; NONE: bl __aeabi_h2f
|
||||||
; NONE: bl __aeabi_f2d
|
; NONE: bl __aeabi_f2d
|
||||||
; SP: vcvt{{[bt]}}.f32.f16
|
; SP: vcvt{{[bt]}}.f32.f16
|
||||||
; SP: bl __aeabi_f2d
|
; SP: bl __aeabi_f2d
|
||||||
|
|
|
@ -205,7 +205,7 @@ define float @fmuladd_f(float %a, float %b, float %c) {
|
||||||
declare i16 @llvm.convert.to.fp16.f32(float %a)
|
declare i16 @llvm.convert.to.fp16.f32(float %a)
|
||||||
define i16 @f_to_h(float %a) {
|
define i16 @f_to_h(float %a) {
|
||||||
; CHECK-LABEL: f_to_h:
|
; CHECK-LABEL: f_to_h:
|
||||||
; SOFT: bl __gnu_f2h_ieee
|
; SOFT: bl __aeabi_f2h
|
||||||
; HARD: vcvt{{[bt]}}.f16.f32
|
; HARD: vcvt{{[bt]}}.f16.f32
|
||||||
%1 = call i16 @llvm.convert.to.fp16.f32(float %a)
|
%1 = call i16 @llvm.convert.to.fp16.f32(float %a)
|
||||||
ret i16 %1
|
ret i16 %1
|
||||||
|
@ -214,7 +214,7 @@ define i16 @f_to_h(float %a) {
|
||||||
declare float @llvm.convert.from.fp16.f32(i16 %a)
|
declare float @llvm.convert.from.fp16.f32(i16 %a)
|
||||||
define float @h_to_f(i16 %a) {
|
define float @h_to_f(i16 %a) {
|
||||||
; CHECK-LABEL: h_to_f:
|
; CHECK-LABEL: h_to_f:
|
||||||
; SOFT: bl __gnu_h2f_ieee
|
; SOFT: bl __aeabi_h2f
|
||||||
; HARD: vcvt{{[bt]}}.f32.f16
|
; HARD: vcvt{{[bt]}}.f32.f16
|
||||||
%1 = call float @llvm.convert.from.fp16.f32(i16 %a)
|
%1 = call float @llvm.convert.from.fp16.f32(i16 %a)
|
||||||
ret float %1
|
ret float %1
|
||||||
|
|
Loading…
Reference in New Issue