[CRT]

implement floor and floorf for amd64 with sse2 instructions svn path=/trunk/; revision=53887
2025-06-10 20:34:59 +00:00 · 2011-09-28 21:32:37 +00:00 · 2011-09-28 21:32:37 +00:00 · 2779f4ccdd
commit 2779f4ccdd
parent 6d1eecf3d9
3 changed files with 36 additions and 21 deletions
--- a/reactos/lib/sdk/crt/libcntpr.cmake
+++ b/reactos/lib/sdk/crt/libcntpr.cmake
@ -111,6 +111,7 @@ elseif(ARCH MATCHES amd64)
        math/amd64/exp.S
        math/amd64/fabs.S
        math/amd64/floor.S
        math/amd64/floorf.S
        math/amd64/fmod.S
        math/amd64/ldexp.S
        math/amd64/log.S
--- a/reactos/lib/sdk/crt/math/amd64/floor.S
+++ b/reactos/lib/sdk/crt/math/amd64/floor.S
@ -9,14 +9,33 @@
 /* INCLUDES ******************************************************************/
 #include <asm.inc>
 #include <ksamd64.inc>
 /* CODE **********************************************************************/
 .code64
 PUBLIC floor
-floor:
+FUNC floor
-    UNIMPLEMENTED floor
+    sub rsp, 16
    .ENDPROLOG

    /*
     * double floor(double x)
     * In:    xmm0 = x
     * Out:   xmm0 = largest integral value that is not greater than x
     * Clobb: rax, rcx, rdx, xmm1, flags
     *
     * No stack locals are used; the 16 byte adjustment of rsp is kept
     * unchanged from the previous version of this function.
     */

    /* Copy the raw bits of x into rax and clear the sign bit,
       so that rax holds the bit pattern of |x| */
    movd rax, xmm0
    btr rax, 63

    /* Bit patterns of non-negative doubles are ordered like unsigned
       integers. Everything at or above the pattern of 2^52 is either
       already integral, an infinity or a NaN. Return those unchanged,
       they might not even fit into a 64 bit integer. */
    mov rdx, HEX(4330000000000000)
    cmp rax, rdx
    jae floor_done

    /* Truncate x towards zero (always fits, since |x| < 2^52) and
       convert the truncated value back to double precision */
    cvttsd2si rcx, xmm0
    cvtsi2sd xmm1, rcx

    /* Compare trunc(x) with x */
    ucomisd xmm1, xmm0

    /* trunc(x) == x: x is integral, return it as it is. This also keeps
       the sign of -0.0 and avoids turning e.g. -2.0 into -3.0 */
    je floor_done

    /* trunc(x) < x: x is a positive fraction, trunc(x) is the result */
    jb floor_convert

    /* trunc(x) > x: x is a negative fraction and truncation rounded up,
       so the result is one below the truncated value */
    sub rcx, 1

floor_convert:
    /* Convert the result back to xmm0 (double precision) */
    cvtsi2sd xmm0, rcx

floor_done:
    add rsp, 16
    ret
 ENDFUNC floor
 END
--- a/reactos/lib/sdk/crt/math/amd64/floorf.S
+++ b/reactos/lib/sdk/crt/math/amd64/floorf.S
@ -1,7 +1,7 @@
 /*
 * COPYRIGHT:         See COPYING in the top level directory
 * PROJECT:           ReactOS system libraries
- * PURPOSE:           Implementation of tan
+ * PURPOSE:           Implementation of floorf
 * FILE:              lib/sdk/crt/math/amd64/floorf.S
 * PROGRAMMER:        Timo Kreuzer (timo.kreuzer@reactos.org)
 */
@ -9,7 +9,6 @@
 /* INCLUDES ******************************************************************/
 #include <asm.inc>
 #include <ksamd64.inc>
 /* CODE **********************************************************************/
 .code64
@ -19,26 +18,22 @@ FUNC floorf
    sub rsp, 16
    .ENDPROLOG
    /* NOTE(review): this is a diff hunk. Lines starting with '-' are removed,
       lines starting with '+' are added. The x87 lines without a marker
       (fld, mov/or/and on eax, fldcw, fstp, movss) look like parts of the
       removed implementation whose marker got lost -- confirm against the
       committed file before relying on them. */
-    /* Put parameter on the stack */
+    /* Truncate the single precision value in xmm0 towards zero into rcx */
-    movss dword ptr [rsp], xmm0
+    cvttss2si rcx, xmm0
    fld   dword ptr [rsp]
-    /* Change fpu control word to round down */
+    /* Copy the raw 32 bit pattern of xmm0 into eax */
-    fstcw [rsp]
+    movd eax, xmm0
    mov   eax, [rsp]
    or    eax, HEX(000400)
    and   eax, HEX(00f7ff)
    mov   [rsp + 8], eax
    fldcw [rsp + 8]
-    /* Round to integer */
+    /* Logical shift right by 31, moving the float's sign bit into bit 0 */
-    frndint
+    shr rax, 31
-    /* Restore fpu control word */
+    /* Subtract the sign bit from the truncated value, so that
-    fldcw [rsp]
+       we get the correct result for negative values. */
    /* NOTE(review): the sign bit is subtracted for every negative input. When
       the input is already a negative whole number (e.g. -2.0f) the truncated
       value is exact, so this yields one less than the input -- confirm
       whether that is intended. */
    sub rcx, rax
    /* Convert the 64 bit integer in rcx back to single precision in xmm0 */
    cvtsi2ss xmm0, rcx
    fstp  dword ptr [rsp]
    movss xmm0, dword ptr [rsp]
    add rsp, 16
    ret
 ENDFUNC floorf