]> git.proxmox.com Git - rustc.git/blame - src/compiler-rt/lib/builtins/x86_64/floatundixf.S
New upstream version 1.19.0+dfsg3
[rustc.git] / src / compiler-rt / lib / builtins / x86_64 / floatundixf.S
CommitLineData
1a4d82fc
JJ
1// This file is dual licensed under the MIT and the University of Illinois Open
2// Source Licenses. See LICENSE.TXT for details.
3
4#include "../assembly.h"
5
6// long double __floatundixf(du_int a);
7
8#ifdef __x86_64__
9
10CONST_SECTION
92a42be0
SL
11
12 .balign 16
13twop64:
14 .quad 0x43f0000000000000
1a4d82fc
JJ
15
16#define REL_ADDR(_a) (_a)(%rip)
17
92a42be0
SL
18 .text
19
20 .balign 4
1a4d82fc
JJ
21DEFINE_COMPILERRT_FUNCTION(__floatundixf)
22 movq %rdi, -8(%rsp)
23 fildq -8(%rsp)
24 test %rdi, %rdi
25 js 1f
26 ret
271: faddl REL_ADDR(twop64)
28 ret
29END_COMPILERRT_FUNCTION(__floatundixf)
30
31#endif // __x86_64__
32
33
34/* Branch-free implementation is ever so slightly slower, but more beautiful.
35 It is likely superior for inlining, so I kept it around for future reference.
36
37#ifdef __x86_64__
38
39CONST_SECTION
92a42be0
SL
40
41 .balign 4
42twop52:
43 .quad 0x4330000000000000
1a4d82fc 44twop84_plus_twop52_neg:
92a42be0
SL
45 .quad 0xc530000000100000
46twop84:
47 .quad 0x4530000000000000
1a4d82fc
JJ
48
49#define REL_ADDR(_a) (_a)(%rip)
50
51.text
92a42be0 52.balign 4
1a4d82fc
JJ
53DEFINE_COMPILERRT_FUNCTION(__floatundixf)
54 movl %edi, %esi // low 32 bits of input
55 shrq $32, %rdi // hi 32 bits of input
56 orq REL_ADDR(twop84), %rdi // 2^84 + hi (as a double)
57 orq REL_ADDR(twop52), %rsi // 2^52 + lo (as a double)
58 movq %rdi, -8(%rsp)
59 movq %rsi, -16(%rsp)
60 fldl REL_ADDR(twop84_plus_twop52_neg)
61 faddl -8(%rsp) // hi - 2^52 (as double extended, no rounding occurs)
62 faddl -16(%rsp) // hi + lo (as double extended)
63 ret
64END_COMPILERRT_FUNCTION(__floatundixf)
65
66#endif // __x86_64__
67
68*/
3157f602
XL
69
70NO_EXEC_STACK_DIRECTIVE
71