contrib/compiler-rt/lib/builtins/x86_64/floatundixf.S

   1 // This file is dual licensed under the MIT and the University of Illinois Open
   2 // Source Licenses. See LICENSE.TXT for details.
   3
   4 #include "../assembly.h"
   5
   6 // long double __floatundixf(du_int a);
   7
   8 #ifdef __x86_64__
   9
  10 CONST_SECTION                   // not defined in this file; NOTE(review): presumably selects a read-only data section (../assembly.h) - confirm
  11
  12         .balign 16
  13 twop64:
  14         .quad 0x43f0000000000000        // bit pattern of the IEEE-754 double 2^64 (exponent 0x43f = 1023 + 64, zero mantissa)
  15 // REL_ADDR(sym) expands to sym(%rip), i.e. a RIP-relative memory operand for sym.
  16 #define REL_ADDR(_a)    (_a)(%rip)
  17
  18         .text
  19 // __floatundixf: convert the unsigned 64-bit integer a in %rdi (SysV AMD64 assumed) to long double, left in st(0).
  20         .balign 4
  21 DEFINE_COMPILERRT_FUNCTION(__floatundixf)
  22         movq    %rdi,    -8(%rsp)       // store a just below %rsp (leaf function, %rsp not adjusted) so the x87 unit can load it from memory
  23         fildq   -8(%rsp)                // st(0) = a interpreted as a *signed* 64-bit integer
  24         test    %rdi,           %rdi    // set SF from bit 63 of a
  25         js              1f              // bit 63 set: the signed load produced a - 2^64, go correct it
  26         ret                             // bit 63 clear: st(0) already equals a
  27 1:      faddl   REL_ADDR(twop64)        // st(0) += 2^64, recovering the unsigned value of a
  28         ret
  29 END_COMPILERRT_FUNCTION(__floatundixf)
  30
  31 #endif // __x86_64__
  32
  33
  34 /* Branch-free implementation is ever so slightly slower, but more beautiful.
  35    It is likely superior for inlining, so I kept it around for future reference.
  36
  37 #ifdef __x86_64__
  38
  39 CONST_SECTION
  40
  41         .balign 4
  42 twop52:
  43         .quad 0x4330000000000000
  44 twop84_plus_twop52_neg:
  45         .quad 0xc530000000100000
  46 twop84:
  47         .quad 0x4530000000000000
  48
  49 #define REL_ADDR(_a)    (_a)(%rip)
  50
  51 .text
  52 .balign 4
  53 DEFINE_COMPILERRT_FUNCTION(__floatundixf)
  54         movl    %edi,                           %esi                    // low 32 bits of input
  55         shrq    $32,                            %rdi                    // hi 32 bits of input
  56         orq             REL_ADDR(twop84),       %rdi                    // 2^84 + hi (as a double)
  57         orq             REL_ADDR(twop52),       %rsi                    // 2^52 + lo (as a double)
  58         movq    %rdi,                    -8(%rsp)
  59         movq    %rsi,                   -16(%rsp)
  60         fldl    REL_ADDR(twop84_plus_twop52_neg)
  61         faddl   -8(%rsp)        // hi - 2^52 (as double extended, no rounding occurs)
  62         faddl   -16(%rsp)       // hi + lo (as double extended)
  63         ret
  64 END_COMPILERRT_FUNCTION(__floatundixf)
  65
  66 #endif // __x86_64__
  67
  68 */
  69
  70 NO_EXEC_STACK_DIRECTIVE         // not defined in this file; NOTE(review): presumably marks the object as not needing an executable stack (../assembly.h) - confirm
  71