474 lines
15 KiB
NASM
474 lines
15 KiB
NASM
|
subttl emfdiv.asm - Division
|
||
|
page
|
||
|
;*******************************************************************************
|
||
|
; Copyright (c) Microsoft Corporation 1991
|
||
|
; All Rights Reserved
|
||
|
;
|
||
|
;emfdiv.asm - long double divide
|
||
|
; by Tim Paterson
|
||
|
;
|
||
|
;Purpose:
|
||
|
; Long double division.
|
||
|
;Inputs:
|
||
|
; ebx:esi = op1 mantissa
|
||
|
; ecx = op1 sign in bit 15, exponent in high half
|
||
|
; edi = pointer to op2 and result location
|
||
|
; [Result] = edi
|
||
|
;
|
||
|
; Exponents are unbiased. Denormals have been normalized using
|
||
|
; this expanded exponent range. Neither operand is allowed to be zero.
|
||
|
;Outputs:
|
||
|
; Jumps to [RoundMode] to round and store result.
|
||
|
;
|
||
|
;Revision History:
|
||
|
;
|
||
|
; [] 09/05/91 TP Initial 32-bit version.
|
||
|
;
|
||
|
;*******************************************************************************
|
||
|
|
||
|
|
||
|
;Dispatch tables for division
|
||
|
;
|
||
|
;One operand has been loaded into ecx:ebx:esi ("source"), the other is
|
||
|
;pointed to by edi ("dest"). edi points to dividend for fdiv,
|
||
|
;to divisor for fdivr.
|
||
|
;
|
||
|
;Tag of source is shifted. Tag values are as follows:
|
||
|
;
|
||
|
.erre TAG_SNGL eq 0 ;SINGLE: low 32 bits are zero
|
||
|
.erre TAG_VALID eq 1
|
||
|
.erre TAG_ZERO eq 2
|
||
|
.erre TAG_SPCL eq 3 ;NAN, Infinity, Denormal, Empty
|
||
|
|
||
|
;dest = dest / source
|
||
|
tFdivDisp label dword ;Source (reg) Dest (*[di])
|
||
|
dd DivSingle ;single single
|
||
|
dd DivSingle ;single double
|
||
|
dd XorDestSign ;single zero
|
||
|
dd DivSpclDest ;single special
|
||
|
dd DivDouble ;double single
|
||
|
dd DivDouble ;double double
|
||
|
dd XorDestSign ;double zero
|
||
|
dd DivSpclDest ;double special
|
||
|
dd DivideByZero ;zero single
|
||
|
dd DivideByZero ;zero double
|
||
|
dd ReturnIndefinite ;zero zero
|
||
|
dd DivSpclDest ;zero special
|
||
|
dd DivSpclSource ;special single
|
||
|
dd DivSpclSource ;special double
|
||
|
dd DivSpclSource ;special zero
|
||
|
dd TwoOpBothSpcl ;special special
|
||
|
dd ReturnIndefinite ;Two infinities
|
||
|
|
||
|
;dest = source / dest
|
||
|
tFdivrDisp label dword ;Source (reg) Dest (*[di])
|
||
|
dd DivrSingle ;single single
|
||
|
dd DivrDouble ;single double
|
||
|
dd DivideByZero ;single zero
|
||
|
dd DivrSpclDest ;single special
|
||
|
dd DivrSingle ;double single
|
||
|
dd DivrDouble ;double double
|
||
|
dd DivideByZero ;double zero
|
||
|
dd DivrSpclDest ;double special
|
||
|
dd XorSourceSign ;zero single
|
||
|
dd XorSourceSign ;zero double
|
||
|
dd ReturnIndefinite ;zero zero
|
||
|
dd DivrSpclDest ;zero special
|
||
|
dd DivrSpclSource ;special single
|
||
|
dd DivrSpclSource ;special double
|
||
|
dd DivrSpclSource ;special zero
|
||
|
dd TwoOpBothSpcl ;special special
|
||
|
dd ReturnIndefinite ;Two infinities
|
||
|
|
||
|
|
||
|
EM_ENTRY eFIDIV16
|
||
|
eFIDIV16:
|
||
|
push offset DivSetResult
|
||
|
jmp Load16Int ;Returns to DivSetResult
|
||
|
|
||
|
EM_ENTRY eFIDIVR16
|
||
|
eFIDIVR16:
|
||
|
push offset DivrSetResult
|
||
|
jmp Load16Int
|
||
|
|
||
|
EM_ENTRY eFIDIV32
|
||
|
eFIDIV32:
|
||
|
push offset DivSetResult
|
||
|
jmp Load32Int
|
||
|
|
||
|
EM_ENTRY eFIDIVR32
|
||
|
eFIDIVR32:
|
||
|
push offset DivrSetResult
|
||
|
jmp Load32Int
|
||
|
|
||
|
EM_ENTRY eFDIV32
|
||
|
eFDIV32:
|
||
|
push offset DivSetResult
|
||
|
jmp Load32Real ;Returns to DivSetResult
|
||
|
|
||
|
EM_ENTRY eFDIVR32
|
||
|
eFDIVR32:
|
||
|
push offset DivrSetResult ;Returns to DivrSetResult
|
||
|
jmp Load32Real
|
||
|
|
||
|
EM_ENTRY eFDIV64
|
||
|
eFDIV64:
|
||
|
push offset DivSetResult
|
||
|
jmp Load64Real ;Returns to DivSetResult
|
||
|
|
||
|
EM_ENTRY eFDIVR64
|
||
|
eFDIVR64:
|
||
|
push offset DivrSetResult
|
||
|
jmp Load64Real ;Returns to DivrSetResult
|
||
|
|
||
|
|
||
|
EM_ENTRY eFDIVRPreg
|
||
|
eFDIVRPreg:
|
||
|
push offset PopWhenDone
|
||
|
|
||
|
EM_ENTRY eFDIVRreg
|
||
|
eFDIVRreg:
|
||
|
xchg esi,edi
|
||
|
|
||
|
EM_ENTRY eFDIVRtop
|
||
|
eFDIVRtop:
|
||
|
mov ecx,EMSEG:[esi].ExpSgn
|
||
|
mov ebx,EMSEG:[esi].lManHi
|
||
|
mov esi,EMSEG:[esi].lManLo
|
||
|
DivrSetResult:
|
||
|
;cl has tag of dividend
|
||
|
mov ebp,offset tFdivrDisp
|
||
|
mov EMSEG:[Result],edi ;Save result pointer
|
||
|
mov ah,cl
|
||
|
mov al,EMSEG:[edi].bTag
|
||
|
and ah,not 1 ;Ignore single vs. double on dividend
|
||
|
cmp ax,1
|
||
|
.erre bTAG_VALID eq 1
|
||
|
.erre bTAG_SNGL eq 0
|
||
|
jz DivrDouble ;Divisor was double
|
||
|
ja TwoOpResultSet
|
||
|
;.erre DivrSingle eq $ ;Fall into DivrSingle
|
||
|
|
||
|
;*********
|
||
|
DivrSingle:
|
||
|
;*********
|
||
|
;Computes op1/op2
|
||
|
;Op1 is double, op2 is single (low 32 bits are zero)
|
||
|
mov edx,ebx
|
||
|
mov eax,esi ;Mantissa in edx:eax
|
||
|
mov ebx,EMSEG:[edi].ExpSgn
|
||
|
mov edi,EMSEG:[edi].lManHi
|
||
|
jmp DivSingleReg
|
||
|
|
||
|
|
||
|
SDivBigUnderflow:
|
||
|
;Overflow flag set could only occur with denormals (true exp < -32768)
|
||
|
or EMSEG:[CURerr],Underflow
|
||
|
test EMSEG:[CWmask],Underflow ;Is exception masked?
|
||
|
jnz UnderflowZero ;Yes, return zero (in emfmul.asm)
|
||
|
add ecx,Underbias shl 16 ;Fix up exponent
|
||
|
jmp ContSdiv ;Continue with multiply
|
||
|
|
||
|
|
||
|
EM_ENTRY eFDIVPreg
|
||
|
eFDIVPreg:
|
||
|
push offset PopWhenDone
|
||
|
|
||
|
EM_ENTRY eFDIVreg
|
||
|
eFDIVreg:
|
||
|
xchg esi,edi
|
||
|
|
||
|
EM_ENTRY eFDIVtop
|
||
|
eFDIVtop:
|
||
|
mov ecx,EMSEG:[esi].ExpSgn
|
||
|
mov ebx,EMSEG:[esi].lManHi
|
||
|
mov esi,EMSEG:[esi].lManLo
|
||
|
DivSetResult:
|
||
|
;cl has tag of divisor
|
||
|
mov ebp,offset tFdivDisp
|
||
|
mov EMSEG:[Result],edi ;Save result pointer
|
||
|
mov al,cl
|
||
|
mov ah,EMSEG:[edi].bTag
|
||
|
and ah,not 1 ;Ignore single vs. double on dividend
|
||
|
cmp ax,1
|
||
|
.erre bTAG_VALID eq 1
|
||
|
.erre bTAG_SNGL eq 0
|
||
|
jz DivDouble ;Divisor was double
|
||
|
ja TwoOpResultSet
|
||
|
;.erre DivSingle eq $ ;Fall into DivSingle
|
||
|
|
||
|
;*********
|
||
|
DivSingle:
|
||
|
;*********
|
||
|
;Computes op2/op1
|
||
|
;Op2 is double, op1 is single (low 32 bits are zero)
|
||
|
xchg edi,ebx ;Mantissa in edi, op2 ptr to ebx
|
||
|
xchg ebx,ecx ;ExpSgn to ebx, op2 ptr to ecx
|
||
|
mov edx,EMSEG:[ecx].lManHi
|
||
|
mov eax,EMSEG:[ecx].lManLo
|
||
|
mov ecx,EMSEG:[ecx].ExpSgn ;Op2 loaded
|
||
|
|
||
|
DivSingleReg:
|
||
|
;dividend mantissa in edx:eax, exponent in high ecx, sign in ch bit 7
|
||
|
;divisor mantissa in edi, exponent in high ebx, sign in bh bit 7
|
||
|
|
||
|
xor ch,bh ;Compute result sign
|
||
|
xor bx,bx ;Clear out sign and tag
|
||
|
sub ecx,1 shl 16 ;Exponent adjustment needed
|
||
|
sub ecx,ebx ;Compute result exponent
|
||
|
.erre TexpBias eq 0 ;Exponents not biased
|
||
|
jo SDivBigUnderflow ;Dividing denormal by large number
|
||
|
ContSdiv:
|
||
|
|
||
|
;If dividend >= divisor, the DIV instruction will overflow. Check for
|
||
|
;this condition and shift the dividend right one bit if necessary.
|
||
|
;
|
||
|
;In previous versions of this algorithm for 24-bit and 53-bit mantissas,
|
||
|
;this shift was always performed without a test. This meant that a 1-bit
|
||
|
;normalization might be required at the end. This worked fine because
|
||
|
;32 or 64 bits were calculated, so extra precision was available for
|
||
|
;normalization. However, this version needs all 64 bits that are calculated,
|
||
|
;so we can't afford a normalization shift at the end. This test tells us
|
||
|
;up front how to align so we'll be normalized.
|
||
|
xor ebx,ebx ;Extend dividend
|
||
|
cmp edi,edx ;Will DIV overflow?
|
||
|
ja DoSdiv ;No, we're safe
|
||
|
shrd ebx,eax,1
|
||
|
shrd eax,edx,1
|
||
|
shr edx,1
|
||
|
add ecx,1 shl 16 ;Bump exponent to account for shift
|
||
|
DoSdiv:
|
||
|
div edi
|
||
|
xchg ebx,eax ;Save quotient in ebx, extend remainder
|
||
|
div edi
|
||
|
mov esi,eax
|
||
|
;We have a 64-bit quotient in ebx:esi. Now compare remainder*2 with divisor
|
||
|
;to compute round and sticky bits.
|
||
|
mov eax,-1 ;Set round and sticky bits
|
||
|
shl edx,1 ;Double remainder
|
||
|
jc RoundJmp ;If too big, round & sticky set
|
||
|
cmp edx,edi ;Is remainder*2 > divisor?
|
||
|
ja RoundJmp
|
||
|
|
||
|
;Observe, oh wondering one, how you can assume the result of this last
|
||
|
;compare is not equality. Use the following notation: n=numerator,
|
||
|
;d=denominator,q=quotient,r=remainder,b=base(2^64 here). If
|
||
|
;initially we had n < d then there was no shift and we will find q and r
|
||
|
;so that q*d+r=n*b, if initially we had n >= d then there was a shift and
|
||
|
;we will find q and r so that q*d+r=n*b/2. If we have equality here
|
||
|
;then r=d/2 ==> n={possibly 2*}(2*q+1)*d/(2*b), since this can only
|
||
|
;be integral if d is a multiple of b, but by definition b/2 <= d < b, we
|
||
|
;have a contradiction. Equality is thus impossible at this point.
|
||
|
|
||
|
cmp edx,1 ;Check for zero remainder
|
||
|
sbb eax,-2 ;eax==0 if CY, ==1 if NC (was -1)
|
||
|
RoundJmp:
|
||
|
jmp EMSEG:[RoundMode]
|
||
|
|
||
|
;*******************************************************************************
|
||
|
|
||
|
DDivBigUnderflow:
|
||
|
;Overflow flag set could only occur with denormals (true exp < -32768)
|
||
|
or EMSEG:[CURerr],Underflow
|
||
|
test EMSEG:[CWmask],Underflow ;Is exception masked?
|
||
|
jnz UnderflowZero ;Yes, return zero (in emfmul.asm)
|
||
|
add ecx,Underbias shl 16 ;Fix up exponent
|
||
|
jmp ContDdiv ;Continue with multiply
|
||
|
|
||
|
DivrDoubleSetFlag:
|
||
|
;Special entry point used by FPATAN to set bit 6 of flag dword pushed
|
||
|
;on stack before call.
|
||
|
or byte ptr [esp+4],40H
|
||
|
;*********
|
||
|
DivrDouble:
|
||
|
;*********
|
||
|
;Computes op1/op2
|
||
|
mov edx,ebx
|
||
|
mov eax,esi ;Mantissa in edx:eax
|
||
|
mov ebx,EMSEG:[edi].ExpSgn
|
||
|
mov esi,EMSEG:[edi].lManHi
|
||
|
mov edi,EMSEG:[edi].lManLo
|
||
|
jmp short DivDoubleReg
|
||
|
|
||
|
HighHalfEqual:
|
||
|
;edx:eax:ebp = dividend
|
||
|
;esi:edi = divisor
|
||
|
;ecx = exponent and sign of result
|
||
|
;
|
||
|
;High half of dividend is equal to high half of divisor. This will cause
|
||
|
;the DIV instruction to overflow. If whole dividend >= whole divisor, then
|
||
|
;we just shift the dividend right 1 bit.
|
||
|
cmp eax,edi ;Is dividend >= divisor?
|
||
|
jae ShiftDividend ;Yes, divide it by two
|
||
|
;DIV instruction would overflow, so skip it and calculate the effective
|
||
|
;result. Assume a quotient of 2^32-1 and calculate the remainder. See
|
||
|
;detailed comments under MaxQuo below--this is a copy of that code.
|
||
|
push ecx ;Save exp. and sign
|
||
|
mov ebx,-1 ;Max quotient digit
|
||
|
sub eax,edi ;Calculate correct remainder
|
||
|
;Currently edx == esi, but the next instruction ensures that is no longer
|
||
|
;true, since eax != 0. This will allow us to skip the MaxQuo check at
|
||
|
;DivFirstDigit.
|
||
|
add edx,eax ;Should set CY if quotient fit
|
||
|
mov eax,edi ;ecx:eax has new remainder
|
||
|
jc ComputeSecond ;Remainder was positive
|
||
|
;Quotient doesn't fit. Note that we can no longer ensure that edx != esi
|
||
|
;after making a correction.
|
||
|
mov ecx,edx ;Need remainder in ecx:eax
|
||
|
jmp DivCorrect1
|
||
|
|
||
|
;*********
|
||
|
DivDouble:
|
||
|
;*********
|
||
|
;Computes op2/op1
|
||
|
mov eax,edi ;Move op2 pointer
|
||
|
mov edi,esi
|
||
|
mov esi,ebx ;Mantissa in esi:edi
|
||
|
mov ebx,ecx ;ExpSgn to ebx
|
||
|
mov ecx,EMSEG:[eax].ExpSgn ;Op2 loaded
|
||
|
mov edx,EMSEG:[eax].lManHi
|
||
|
mov eax,EMSEG:[eax].lManLo
|
||
|
|
||
|
DivDoubleReg:
|
||
|
;dividend mantissa in edx:eax, exponent in high ecx, sign in ch bit 7
|
||
|
;divisor mantissa in esi:edi, exponent in high ebx, sign in bh bit 7
|
||
|
|
||
|
xor ch,bh ;Compute result sign
|
||
|
xor bx,bx ;Clear out sign and tag
|
||
|
sub ecx,1 shl 16 ;Exponent adjustment needed
|
||
|
sub ecx,ebx ;Compute result exponent
|
||
|
.erre TexpBias eq 0 ;Exponents not biased
|
||
|
jo DDivBigUnderflow ;Dividing denormal by large number
|
||
|
ContDdiv:
|
||
|
|
||
|
;If dividend >= divisor, we must shift the dividend right one bit.
|
||
|
;This will ensure the result is normalized.
|
||
|
;
|
||
|
;In previous versions of this algorithm for 24-bit and 53-bit mantissas,
|
||
|
;this shift was always performed without a test. This meant that a 1-bit
|
||
|
;normalization might be required at the end. This worked fine because
|
||
|
;32 or 64 bits were calculated, so extra precision was available for
|
||
|
;normalization. However, this version needs all 64 bits that are calculated,
|
||
|
;so we can't afford a normalization shift at the end. This test tells us
|
||
|
;up front how to align so we'll be normalized.
|
||
|
xor ebp,ebp ;Extend dividend
|
||
|
cmp esi,edx ;Dividend > divisor
|
||
|
ja DoDdiv
|
||
|
jz HighHalfEqual ;Go compare low halves
|
||
|
ShiftDividend:
|
||
|
shrd ebp,eax,1
|
||
|
shrd eax,edx,1
|
||
|
shr edx,1
|
||
|
add ecx,1 shl 16 ;Bump exponent to account for shift
|
||
|
DoDdiv:
|
||
|
push ecx ;Save exp. and sign
|
||
|
|
||
|
;edx:eax:ebp = dividend
|
||
|
;esi:edi = divisor
|
||
|
;
|
||
|
;Division algorithm from Knuth vol. 2, p. 237, using 32-bit "digits":
|
||
|
;Guess a quotient digit by dividing two MSDs of dividend by the MSD of
|
||
|
;divisor. If divisor is >= 1/2 the radix (radix = 2^32 in this case), then
|
||
|
;this guess will be no more than 2 larger than the correct value of that
|
||
|
;quotient digit (and never smaller). Divisor meets magnitude condition
|
||
|
;because it's normalized.
|
||
|
|
||
|
div esi ;Guess first quotient "digit"
|
||
|
|
||
|
;Check out our guess.
|
||
|
;Currently, remainder in edx = dividend - (quotient * high half divisor).
|
||
|
;The definition of remainder is dividend - (quotient * all divisor). So
|
||
|
;if we subtract (quotient * low half divisor) from edx, we'll get
|
||
|
;the true remainder. If it's negative, our guess was too big.
|
||
|
|
||
|
mov ebx,eax ;Save quotient
|
||
|
mov ecx,edx ;Save remainder
|
||
|
mul edi ;Quotient * low half divisor
|
||
|
sub ebp,eax ;Subtract from dividend extension
|
||
|
sbb ecx,edx ;Subtract from remainder
|
||
|
mov eax,ebp ;Low remainder to eax
|
||
|
jnc DivFirstDigit ;Was quotient OK?
|
||
|
DivCorrect1:
|
||
|
dec ebx ;Quotient was too big
|
||
|
add eax,edi ;Add divisor back into remainder
|
||
|
adc ecx,esi
|
||
|
jnc DivCorrect1 ;Repeat if quotient is still too big
|
||
|
DivFirstDigit:
|
||
|
cmp ecx,esi ;Would DIV instruction overflow?
|
||
|
jae short MaxQuo ;Yes, figure alternate quotient
|
||
|
mov edx,ecx ;Remainder back to edx:eax
|
||
|
|
||
|
;Compute 2nd quotient "digit"
|
||
|
|
||
|
ComputeSecond:
|
||
|
div esi ;Guess 2nd quotient "digit"
|
||
|
mov ebp,eax ;Save quotient
|
||
|
mov ecx,edx ;Save remainder
|
||
|
mul edi ;Quotient * low half divisor
|
||
|
neg eax ;Subtract from dividend extended with 0
|
||
|
sbb ecx,edx ;Subtract from remainder
|
||
|
jnc DivSecondDigit ;Was quotient OK?
|
||
|
DivCorrect2:
|
||
|
dec ebp ;Quotient was too big
|
||
|
add eax,edi ;Add divisor back into remainder
|
||
|
adc ecx,esi
|
||
|
jnc DivCorrect2 ;Repeat if quotient is still too big
|
||
|
DivSecondDigit:
|
||
|
;ebx:ebp = quotient
|
||
|
;ecx:eax = remainder
|
||
|
;esi:edi = divisor
|
||
|
;Now compare remainder*2 with divisor to compute round and sticky bits.
|
||
|
mov edx,-1 ;Set round and sticky bits
|
||
|
shld ecx,eax,1 ;Double remainder
|
||
|
jc DDivEnd ;If too big, round & sticky set
|
||
|
shl eax,1
|
||
|
sub edi,eax
|
||
|
sbb esi,ecx ;Subtract remainder*2 from divisor
|
||
|
jb DDivEnd ;If <0, use round & sticky bits set
|
||
|
|
||
|
;Observe, oh wondering one, how you can assume the result of this last
|
||
|
;compare is not equality. Use the following notation: n=numerator,
|
||
|
;d=denominator,q=quotient,r=remainder,b=base(2^64 here). If
|
||
|
;initially we had n < d then there was no shift and we will find q and r
|
||
|
;so that q*d+r=n*b, if initially we had n >= d then there was a shift and
|
||
|
;we will find q and r so that q*d+r=n*b/2. If we have equality here
|
||
|
;then r=d/2 ==> n={possibly 2*}(2*q+1)*d/(2*b), since this can only
|
||
|
;be integral if d is a multiple of b, but by definition b/2 <= d < b, we
|
||
|
;have a contradiction. Equality is thus impossible at this point.
|
||
|
|
||
|
;No round bit, but set sticky bit if remainder != 0.
|
||
|
or eax,ecx ;Is remainder zero?
|
||
|
add eax,-1 ;Set CY if non-zero
|
||
|
adc edx,1 ;edx==0 if NC, ==1 if CY (was -1)
|
||
|
DDivEnd:
|
||
|
mov esi,ebp ;Result in ebx:esi
|
||
|
mov eax,edx ;Round/sticky bits to eax
|
||
|
pop ecx ;Recover sign/exponent
|
||
|
jmp EMSEG:[RoundMode]
|
||
|
|
||
|
|
||
|
MaxQuo:
|
||
|
;ebx = first quotient "digit"
|
||
|
;ecx:eax = remainder
|
||
|
;esi:edi = divisor
|
||
|
;On exit, ebp = second quotient "digit"
|
||
|
;
|
||
|
;Come here if divide instruction would overflow. This must mean that ecx == esi,
|
||
|
;i.e., the high halves of the dividend and divisor are equal. Assume a result
|
||
|
;of 2^32-1, thus remainder = dividend - ( divisor * (2^32-1) )
|
||
|
; = dividend - divisor * 2^32 + divisor. Since the high halves of the dividend
|
||
|
;and divisor are equal, dividend - divisor * 2^32 can be computed by
|
||
|
;subtracting only the low halves. When adding divisor (in esi) to this, note
|
||
|
;that ecx == esi, and we want the result in ecx anyway.
|
||
|
;
|
||
|
;Note also that since the dividend is a previous remainder, the
|
||
|
;dividend - divisor * 2^32 calculation must always be negative. Thus the
|
||
|
;addition of divisor back to it should generate a carry if it goes positive.
|
||
|
|
||
|
mov ebp,-1 ;Max quotient digit
|
||
|
sub eax,edi ;Calculate correct remainder
|
||
|
add ecx,eax ;Should set CY if quotient fit
|
||
|
mov eax,edi ;ecx:eax has new remainder
|
||
|
jc DivSecondDigit ;Remainder was positive
|
||
|
jmp DivCorrect2
|