forked from OSchip/llvm-project
65 lines
1.4 KiB
ArmAsm
65 lines
1.4 KiB
ArmAsm
// This file is dual licensed under the MIT and the University of Illinois Open
|
|
// Source Licenses. See LICENSE.TXT for details.
|
|
|
|
#include "../assembly.h"
|
|
|
|
// long double __floatundixf(du_int a);
|
|
|
|
#ifdef __x86_64__
|
|
|
|
#ifndef __ELF__
|
|
.const
|
|
#endif
|
|
.align 4
|
|
twop64: .quad 0x43f0000000000000
|
|
|
|
#define REL_ADDR(_a) (_a)(%rip)
|
|
|
|
.text
|
|
.align 4
|
|
DEFINE_COMPILERRT_FUNCTION(__floatundixf)
|
|
movq %rdi, -8(%rsp)
|
|
fildq -8(%rsp)
|
|
test %rdi, %rdi
|
|
js 1f
|
|
ret
|
|
1: faddl REL_ADDR(twop64)
|
|
ret
|
|
END_COMPILERRT_FUNCTION(__floatundixf)
|
|
|
|
#endif // __x86_64__
|
|
|
|
|
|
/* Branch-free implementation is ever so slightly slower, but more beautiful.
|
|
It is likely superior for inlining, so I kept it around for future reference.
|
|
|
|
#ifdef __x86_64__
|
|
|
|
.const
|
|
.align 4
|
|
twop52: .quad 0x4330000000000000
|
|
twop84_plus_twop52_neg:
|
|
.quad 0xc530000000100000
|
|
twop84: .quad 0x4530000000000000
|
|
|
|
#define REL_ADDR(_a) (_a)(%rip)
|
|
|
|
.text
|
|
.align 4
|
|
DEFINE_COMPILERRT_FUNCTION(__floatundixf)
|
|
movl %edi, %esi // low 32 bits of input
|
|
shrq $32, %rdi // hi 32 bits of input
|
|
orq REL_ADDR(twop84), %rdi // 2^84 + hi (as a double)
|
|
orq REL_ADDR(twop52), %rsi // 2^52 + lo (as a double)
|
|
movq %rdi, -8(%rsp)
|
|
movq %rsi, -16(%rsp)
|
|
fldl REL_ADDR(twop84_plus_twop52_neg)
|
|
faddl -8(%rsp) // hi - 2^52 (as double extended, no rounding occurs)
|
|
faddl -16(%rsp) // hi + lo (as double extended)
|
|
ret
|
|
END_COMPILERRT_FUNCTION(__floatundixf)
|
|
|
|
#endif // __x86_64__
|
|
|
|
*/
|