aboutsummaryrefslogtreecommitdiff
path: root/lib/x86_64/floatundixf.S
diff options
context:
space:
mode:
authorEd Schouten <ed@FreeBSD.org>2010-10-21 19:02:02 +0000
committerEd Schouten <ed@FreeBSD.org>2010-10-21 19:02:02 +0000
commit217b614317dad692116a3a06fe94ea8f61a59edb (patch)
tree4cfe2eee875a959effca0881df14c079103447fa /lib/x86_64/floatundixf.S
downloadsrc-217b614317dad692116a3a06fe94ea8f61a59edb.tar.gz
src-217b614317dad692116a3a06fe94ea8f61a59edb.zip
Import compiler-rt r117047.vendor/compiler-rt/compiler-rt-r117047
Notes
Notes: svn path=/vendor/compiler-rt/dist/; revision=214152 svn path=/vendor/compiler-rt/compiler-rt-r117047/; revision=214153; tag=vendor/compiler-rt/compiler-rt-r117047
Diffstat (limited to 'lib/x86_64/floatundixf.S')
-rw-r--r--lib/x86_64/floatundixf.S62
1 files changed, 62 insertions, 0 deletions
diff --git a/lib/x86_64/floatundixf.S b/lib/x86_64/floatundixf.S
new file mode 100644
index 000000000000..246f0266c8a1
--- /dev/null
+++ b/lib/x86_64/floatundixf.S
@@ -0,0 +1,62 @@
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
+
+#include "../assembly.h"
+
+// long double __floatundixf(du_int a);
+
+#ifdef __x86_64__
+
+#ifndef __ELF__
+.const
+#endif
+.align 4
+twop64: .quad 0x43f0000000000000
+
+#define REL_ADDR(_a) (_a)(%rip)
+
+.text
+.align 4
+DEFINE_COMPILERRT_FUNCTION(__floatundixf)
+ movq %rdi, -8(%rsp)
+ fildq -8(%rsp)
+ test %rdi, %rdi
+ js 1f
+ ret
+1: faddl REL_ADDR(twop64)
+ ret
+
+#endif // __x86_64__
+
+
+/* Branch-free implementation is ever so slightly slower, but more beautiful.
+ It is likely superior for inlining, so I kept it around for future reference.
+
+#ifdef __x86_64__
+
+.const
+.align 4
+twop52: .quad 0x4330000000000000
+twop84_plus_twop52_neg:
+ .quad 0xc530000000100000
+twop84: .quad 0x4530000000000000
+
+#define REL_ADDR(_a) (_a)(%rip)
+
+.text
+.align 4
+DEFINE_COMPILERRT_FUNCTION(__floatundixf)
+ movl %edi, %esi // low 32 bits of input
+ shrq $32, %rdi // hi 32 bits of input
+ orq REL_ADDR(twop84), %rdi // 2^84 + hi (as a double)
+ orq REL_ADDR(twop52), %rsi // 2^52 + lo (as a double)
+ movq %rdi, -8(%rsp)
+ movq %rsi, -16(%rsp)
+ fldl REL_ADDR(twop84_plus_twop52_neg)
+ faddl -8(%rsp) // hi - 2^52 (as double extended, no rounding occurs)
+ faddl -16(%rsp) // hi + lo (as double extended)
+ ret
+
+#endif // __x86_64__
+
+*/