// This file is dual licensed under the MIT and the University of Illinois Open
// Source Licenses. See LICENSE.TXT for details.

#include "../assembly.h"

// long double __floatundixf(du_int a);
//
// Converts the unsigned 64-bit integer a to an x87 extended-precision value.
//
// Syntax:   AT&T operand order; the file is run through the C preprocessor.
// In:       %rdi   = a
// Out:      st(0)  = (long double)a
// Clobbers: EFLAGS and the 8 bytes at -8(%rsp). No general-purpose register
//           is modified and %rsp is not adjusted.
//
// The routine stores below %rsp without reserving stack space, so it relies
// on that area being safe for a leaf function (the System V AMD64 red zone).
// NOTE(review): the only guard here is __x86_64__; confirm this file is never
// built for an x86-64 target that lacks a red zone or passes a elsewhere.
//
// Method: fildq can only load *signed* integers. When the top bit of a is
// clear the signed and unsigned readings agree and the load alone is the
// answer. When it is set, the load produces a - 2^64, so 2^64 is added back.
// Both a - 2^64 and a fit in a 64-bit significand, so no rounding takes place
// (assuming the x87 precision-control field is at its extended setting).
//
// CONST_SECTION, DEFINE_COMPILERRT_FUNCTION, END_COMPILERRT_FUNCTION and
// NO_EXEC_STACK_DIRECTIVE are not defined in this file; they are expected to
// come from ../assembly.h.

#ifdef __x86_64__

CONST_SECTION

	.balign 16
twop64:
	.quad 0x43f0000000000000		// 2^64 encoded as an IEEE-754 double

// Wraps a symbol in a %rip-relative memory operand.
#define REL_ADDR(_a)	(_a)(%rip)

	.text

	.balign 4
DEFINE_COMPILERRT_FUNCTION(__floatundixf)
	movq	%rdi, -8(%rsp)		// spill a: fild only accepts a memory operand
	fildq	-8(%rsp)		// st(0) = a read as a signed 64-bit integer
	testq	%rdi, %rdi		// SF = top bit of a
	js	1f			// top bit set: st(0) holds a - 2^64, go fix it
	ret				// common case: st(0) is already the result
1:	faddl	REL_ADDR(twop64)	// st(0) += 2^64, undoing the signed reading
	ret
END_COMPILERRT_FUNCTION(__floatundixf)

#endif // __x86_64__


/* Branch-free implementation is ever so slightly slower, but more beautiful.
   It is likely superior for inlining, so I kept it around for future reference.

   It splits the input into 32-bit halves, plants each half in the low
   mantissa bits of a double whose exponent gives those bits the right weight,
   and then cancels the two exponent biases with a single negative constant.

#ifdef __x86_64__

CONST_SECTION

	.balign 4
twop52:
	.quad 0x4330000000000000		// 2^52
twop84_plus_twop52_neg:
	.quad 0xc530000000100000		// -(2^84 + 2^52)
twop84:
	.quad 0x4530000000000000		// 2^84

#define REL_ADDR(_a)	(_a)(%rip)

.text
.balign 4
DEFINE_COMPILERRT_FUNCTION(__floatundixf)
	movl	%edi,				%esi			// low 32 bits of input (upper half of %rsi zeroed)
	shrq	$32,				%rdi			// hi 32 bits of input
	orq		REL_ADDR(twop84),	%rdi			// 2^84 + hi * 2^32 (as a double)
	orq		REL_ADDR(twop52),	%rsi			// 2^52 + lo (as a double)
	movq	%rdi,			 -8(%rsp)
	movq	%rsi,			-16(%rsp)
	fldl	REL_ADDR(twop84_plus_twop52_neg)		// -(2^84 + 2^52)
	faddl	-8(%rsp)	// hi * 2^32 - 2^52 (as double extended, no rounding occurs)
	faddl	-16(%rsp)	// hi * 2^32 + lo (as double extended)
	ret
END_COMPILERRT_FUNCTION(__floatundixf)

#endif // __x86_64__

*/

NO_EXEC_STACK_DIRECTIVE
     72