windows-nt/Source/XPSP1/NT/base/wow64/mscpu/fraglib/axp64/fphelp.s

//
// Copyright (c) 1996-1998  Microsoft Corporation
//
// Module Name:
//
//     fphelp.s
// 
// Abstract:
//
//
//     This module contains assembly code helpers for floating-point
//     emulation.
// 
// Author:
//
//     Barry Bond (barrybo) creation-date 26-Aug-1996
// 
// Notes:
// 
// Revision History:

#include "kxalpha.h"
#include "soalpha.h"
#include "ksalpha.h"

.rdata

//
// RoundingTable
//
//     Four longword entries, indexed by the 2-bit x86 rounding mode that is
//     passed to SetNativeRoundingMode.  Each entry is the value that routine
//     ORs into the (3 << 26) field of the high dword of the fpcr after
//     clearing that field.
//
//     NOTE(review): the index/value pairing below presumably follows the x86
//     control-word RC encoding and the Alpha FPCR dynamic-rounding encoding;
//     confirm against the architecture manuals before changing any entry.
//
RoundingTable:
    .long   (2 << 26)               // x86 rounding mode 0
    .long   (1 << 26)               // x86 rounding mode 1
    .long   (3 << 26)               // x86 rounding mode 2
    .long   0                       // x86 rounding mode 3

.text

//
// Define call frame used to exchange a floating point and integer register.
//
// There is no direct move between the floating-point and integer register
// files in this code: every routine below stores one register file's value
// into the FpCr slot and reloads it into the other.  The slot holds the fpcr
// image in SetNativeRoundingMode and GetNativeFPStatus, and the converted
// int64 result in CastDoubleToInt64.
//

        .struct 0
FpCr:   .space  8                       // fpcr value (8-byte exchange slot at offset 0)
        .space  8                       // ensure 16-byte stack alignment
FpFrameLength:                          // length of stack frame (16 bytes)


    NESTED_ENTRY(SetNativeRoundingMode, FpFrameLength, ra)
// 
// Routine Description:
//
//     Sets the native FPU to the specified x86 rounding mode.
//
//     The x86 mode is translated through RoundingTable and the result
//     replaces the two-bit field at (3 << 26) in the high dword of the
//     fpcr.  Every other fpcr bit is written back exactly as it was read.
// 
// Arguments:
//
//     a0 -- the x86 rounding mode (already guaranteed to be just 2 bits)
//
// Return Value:
// 
//     None
//
// Registers modified:
//
//     a0, t0, t1, f0
//

    lda     sp, -FpFrameLength(sp)      // allocate stack frame

    PROLOGUE_END

    // map x86 rounding mode to Alpha rounding mode in a0
    //
    // The table address is a full 64-bit pointer in this (axp64) build, so
    // the scaled add must be the quadword form: s4addl would truncate the
    // sum to 32 bits and sign-extend it.  The index is masked first so the
    // 64-bit arithmetic cannot be disturbed by the upper bits of a0 and can
    // never reach past the four table entries.
    and     a0, 3, a0       // a0 = table index (0..3)
    lda     t0, RoundingTable
    s4addq  a0, t0, a0      // a0 = &RoundingTable[a0]
    ldl     a0, 0(a0)       // a0 = new rounding field for the fpcr high dword

    excb                    // wait for all pending traps
    mf_fpcr f0, f0, f0      // get current fpcr
    excb                    // block against new traps
    stt     f0, FpCr(sp)    // store fpcr to stack
    ldl     t0, FpCr+4(sp)  // load the high dword of fpcr into integer register

    ldiq    t1, (3 << 26)   // mask of the rounding field in the high dword
    bic     t0, t1, t0      // t0 = t0 & ~(3 << 26)
    or      t0, a0, t0      // t0 |= a0

    // Only the high dword is rewritten; the low dword stored by the stt
    // above is still in the slot and is reloaded unchanged.
    stl     t0, FpCr+4(sp)  // store new high dword of fpcr to stack
    ldt     f0, FpCr(sp)    // load into fp register
    mt_fpcr f0, f0, f0      // set new fpcr
    excb                    // block against new traps

    lda     sp, FpFrameLength(sp)       // release stack frame
    ret     zero, (ra)
    .end SetNativeRoundingMode


    NESTED_ENTRY(GetNativeFPStatus, FpFrameLength, ra)
//
// Routine Description:
//
//     Alpha-specific version of _statusfp()/_clearfp().
//
//     Reads the software fpcr kept in the thread environment block, writes
//     it back with the SW_FPCR_STATUS_MASK bits cleared, and then rewrites
//     the hardware fpcr keeping only the rounding-mode, underflow-to-zero
//     and denormal-operands-to-zero bits.
//
// Arguments:
//
//     None.
//
// Return Value:
//
//     v0 -- the software fpcr as it was before its status bits were cleared
//           (the Alpha-specific equivalent of _statusfp()).
//
// Registers modified:
//
//     v0, t4, t5, t6, t7, f0
//

    lda     sp, -FpFrameLength(sp)      // reserve the fp<->int exchange slot
    PROLOGUE_END

    // Inline _get_softfpcr: fetch the value straight into the return register.
    GET_THREAD_ENVIRONMENT_BLOCK
    bis     v0, zero, t4        // t4 = TEB pointer; frees v0 for the result
    ldl     v0, TeSoftFpcr(t4)  // v0 = software fpcr on entry (return value)

    // Inline _set_softfpcr: same value with the status bits removed.
    ldiq    t5, 0x3e0000        // SW_FPCR_STATUS_MASK
    bic     v0, t5, t5          // t5 = v0 & ~SW_FPCR_STATUS_MASK
    stl     t5, TeSoftFpcr(t4)  // write cleared value back to the TEB

    // Bits of the hardware fpcr that survive the clear:
    // (FPCR_ROUND_MASK|FPCR_UNDERFLOW_TO_ZERO_ENABLE|FPCR_DENORMAL_OPERANDS_TO_ZERO_ENABLE)
    ldiq    t6, 0x1c01000000000000

    excb                        // drain traps that are still pending
    mf_fpcr f0, f0, f0          // f0 = hardware fpcr
    excb                        // hold off any new traps

    stt     f0, FpCr(sp)        // bounce fpcr through the stack ...
    ldq     t7, FpCr(sp)        // ... into an integer register
    and     t7, t6, t7          // drop everything outside the keep-mask

    stq     t7, FpCr(sp)        // bounce the masked value back ...
    ldt     f0, FpCr(sp)        // ... into a floating-point register
    mt_fpcr f0, f0, f0          // install the cleaned fpcr
    excb                        // hold off any new traps

    lda     sp, FpFrameLength(sp)       // release the exchange slot
    ret     zero, (ra)
    .end    GetNativeFPStatus


    NESTED_ENTRY(CastDoubleToInt64, FpFrameLength, ra)
//
// Routine Description:
//
//     Converts a double to an __int64 using the rounding mode currently
//     selected in the FP control register (dynamic rounding).
//
// Arguments:
//
//      f16 = double value to be cast
//
// Return Value:
//
//      v0 = the double cast to an __int64 value using Dynamic rounding.
//      NOTE: The Alpha C compiler generates chopped rounding always,
//            so "i64 = (double)-1.2" will give a different answer than
//               "i64 = CastDoubleToInt64(-1.2)" if the FP control word
//            is set to round towards -infinity.
//
// Registers modified:
//
//      v0, f0
//

    lda     sp, -FpFrameLength(sp)      // reserve the fp<->int exchange slot
    PROLOGUE_END

    // IEEE T-floating -> quadword integer conversion.  Qualifiers in the
    // mnemonic suffix:
    //      s - software completion (trapping)
    //      v - integer overflow trap enabled
    //      i - inexact trap enabled
    //      d - dynamic rounding (mode is taken from the fpcr)
    cvttqsvid  f16, f0

    // The integer result sits in a floating-point register; pass it through
    // the stack slot to land it in the integer return register.
    stt     f0, FpCr(sp)                // spill the 64-bit result
    ldq     v0, FpCr(sp)                // v0 = result

    lda     sp, FpFrameLength(sp)       // release the exchange slot
    ret     zero, (ra)
    .end CastDoubleToInt64
Add source files 2020-09-26 03:20:57 -05:00			`//`
			`// Copyright (c) 1996-1998 Microsoft Corporation`
			`//`
			`// Module Name:`
			`//`
			`// fphelp.s`
			`//`
			`// Abstract:`
			`//`
			`//`
			`// This module contains assembly code helpers for floating-point`
			`// emulation.`
			`//`
			`// Author:`
			`//`
			`// Barry Bond (barrybo) creation-date 26-Aug-1996`
			`//`
			`// Notes:`
			`//`
			`// Revision History:`

			`#include "kxalpha.h"`
			`#include "soalpha.h"`
			`#include "ksalpha.h"`

			`.rdata`

			`RoundingTable:`
			`.long (2 << 26), (1 << 26), (3 << 26), 0`

			`.text`

			`//`
			`// Define call frame used to exchange a floating point and integer register.`
			`//`

			`.struct 0`
			`FpCr: .space 8 // fpcr value`
			`.space 8 // ensure 16-byte stack alignment`
			`FpFrameLength: // length of stack frame`



			`NESTED_ENTRY(SetNativeRoundingMode, FpFrameLength, ra)`
			`//`
			`// Routine Description:`
			`//`
			`// Sets the native FPU to the specified x86 rounding mode.`
			`//`
			`// Arguments:`
			`//`
			`// a0 -- the x86 rounding mode (already guaranteed to be just 2 bits)`
			`//`
			`// Return Value:`
			`//`
			`// None`
			`//`

			`lda sp, -FpFrameLength(sp) // allocate stack frame`

			`PROLOGUE_END`

			`// map x86 rounding mode to Alpha rounding mode in a0`
			`lda t0, RoundingTable`
			`s4addl a0, t0, a0`
			`ldl a0, 0(a0)`

			`excb // wait for all pending traps`
			`mf_fpcr f0, f0, f0 // get current fpcr`
			`excb // block against new traps`
			`stt f0, FpCr(sp) // store fpcr to stack`
			`ldl t0, FpCr+4(sp) // load the high dword of fpcr into integer register`

			`ldiq t1, (3 << 26) // load immediate value`
			`bic t0, t1, t0 // t0 = t0 & ~(3 << 26)`
			`or t0, a0, t0 // t0 \|= a0`

			`stl t0, FpCr+4(sp) // store new high dword of fpcr to stack`
			`ldt f0, FpCr(sp) // load into fp register`
			`mt_fpcr f0, f0, f0 // set new fpcr`
			`excb // block against new traps`

			`lda sp, FpFrameLength(sp)`
			`ret zero, (ra)`
			`.end SetNativeRoundingMode`




			`NESTED_ENTRY(GetNativeFPStatus, FpFrameLength, ra)`
			`//`
			`// Routine Description:`
			`//`
			`// Alpha-specific version of _statusfp()/_clearfp().`
			`//`
			`// Arguments:`
			`//`
			`// None.`
			`//`
			`// Return Value:`
			`//`
			`// Alpha-specific equivalent of _statusfp().`
			`//`

			`lda sp, -FpFrameLength(sp) // allocate stack frame`
			`PROLOGUE_END`

			`// this is _get_softfpcr, except the result ends up in t0`
			`GET_THREAD_ENVIRONMENT_BLOCK`
			`ldl t0, TeSoftFpcr(v0) // get current software fpcr value`

			`ldiq t3, 0x3e0000 // t3 = SW_FPCR_STATUS_MASK`
			`bic t0, t3, t1 // t1 = soft_fpcr & (~SW_FPCR_STATUS_MASK)`

			`// this is _set_softfpcr, except arg is in t1`
			`stl t1, TeSoftFpcr(v0) // store new software fpcr value`

			`excb // wait for all pending traps`
			`mf_fpcr f0, f0, f0 // get current fpcr`
			`excb // block against new traps`

			`stt f0, FpCr(sp) // store fpcr to stack`
			`ldq t3, FpCr(sp) // load fpcr into integer register`

			`ldiq t1, 0x1c01000000000000 // (FPCR_ROUND_MASK\|FPCR_UNDERFLOW_TO_ZERO_ENABLE\|FPCR_DENORMAL_OPERANDS_TO_ZERO_ENABLE)`
			`and t3, t1, t3 // t3 &= t1`

			`stq t3, FpCr(sp) // save integer version to stack`
			`ldt f0, FpCr(sp) // load it into floating-point reg`
			`mt_fpcr f0, f0, f0 // set new fpcr`
			`excb // block against new traps`

			`bis t0, zero, v0 // move original software fpcr into v0 for ret`

			`lda sp, FpFrameLength(sp)`
			`ret zero, (ra)`
			`.end GetNativeFPStatus`


			`NESTED_ENTRY(CastDoubleToInt64, FpFrameLength, ra)`
			`//`
			`// Arguments:`
			`//`
			`// f16 = double value to be cast`
			`//`
			`// Return Value:`
			`//`
			`// The double is cast to an __int64 value using Dynamic rounding.`
			`// NOTE: The Alpha C compiler generates chopped rounding always,`
			`// so "i64 = (double)-1.2" will give a different answer than`
			`// "i64 = CastDoubleToInt64(-1.2)" if the FP control word`
			`// is set to round towards -infinity.`
			`//`

			`lda sp, -FpFrameLength(sp) // allocate stack frame`
			`PROLOGUE_END`

			`// Convert IEEE floating to Integer.`
			`// Trapping: S - software`
			`// V - integer overflow enable`
			`// I - inexact enable`
			`// Rounding: D - dynamic`
			`cvttqsvid f16, f1`

			`// Store the int64 value onto the stack`
			`stt f1, FpCr(sp)`

			`// Load the int64 value into an integer register`
			`ldq v0, FpCr(sp)`

			`// Clean up the stack frame`
			`lda sp, FpFrameLength(sp)`
			`ret zero, (ra)`
			`.end CastDoubleToInt64`