windows-nt/Source/XPSP1/NT/multimedia/media/mplayer2/math.asm

917 lines
24 KiB
NASM
Raw Normal View History

2020-09-26 03:20:57 -05:00
page ,132
;---------------------------Module-Header-------------------------------;
; Module Name: MATH.ASM
;
; Contains FIXED point math routines.
;
; Created: Sun 30-Aug-1987 19:28:30
; Author: Charles Whitmer [chuckwh]
;
; Copyright (c) 1987 Microsoft Corporation
;-----------------------------------------------------------------------;
?WIN = 0
?PLM = 1
?NODATA = 0
PMODE = 1
.xlist
include cmacros.inc
include windows.inc
.list
externA __WinFlags
UQUAD struc
uq0 dw ?
uq1 dw ?
uq2 dw ?
uq3 dw ?
UQUAD ends
; The following two equates are just used as shorthand
; for the "word ptr" and "byte ptr" overrides.
wptr equ word ptr
bptr equ byte ptr
; The following structure should be used to access high and low
; words of a DWORD. This means that "word ptr foo[2]" -> "foo.hi".
LONG struc
lo dw ?
hi dw ?
LONG ends
EAXtoDXAX macro
shld edx,eax,16 ; move HIWORD(eax) to dx
endm
DXAXtoEAX macro
ror eax,16 ; xchg HIWORD(eax) and LOWORD(eax)
shrd eax,edx,16 ; move LOWORD(edx) to HIWORD(eax)
endm
neg32 macro hi, lo
neg lo
adc hi,0 ; carry set unless lo zero
neg hi
endm
ifndef SEGNAME
SEGNAME equ <_TEXT>
endif
createSeg %SEGNAME, CodeSeg, word, public, CODE
sBegin CodeSeg
assumes cs,CodeSeg
assumes ds,nothing
assumes es,nothing
;---------------------------Public-Routine------------------------------;
; long muldiv32(long, long, long)
;
; multiples two 32 bit values and then divides the result by a third
; 32 bit value with full 64 bit presision
;
; lResult = (lNumber * lNumerator) / lDenominator with correct rounding
;
; Entry:
; lNumber = number to multiply by nNumerator
; lNumerator = number to multiply by nNumber
; lDenominator = number to divide the multiplication result by.
;
; Returns:
; DX:AX = result of multiplication and division.
;
; Error Returns:
; none
; Registers Preserved:
; DS,ES,SI,DI
; History:
; Fri 05-Oct-1990 -by- Rob Williams [Robwi]
; Behavior consistent with MulDiv16 routine (signed, no int 0 on overflow)
; Stole muldiv16 psuedocode
;
; Wed 14-June-1990 -by- Todd Laney [ToddLa]
; converted it to 386/286 code. (by checking __WinFlags)
;
; Tue 08-May-1990 -by- Rob Williams [Robwi]
; Wrote it.
;
;----------------------------Pseudo-Code--------------------------------;
; long FAR PASCAL muldiv32(long, long, long)
; long l;
; long Numer;
; long Denom;
; {
;
; Sign = sign of Denom; // Sign will keep track of final sign //
;
;
; if (Denom < 0)
; {
; negate Denom; // make sure Denom is positive //
; }
;
; if (l < 0)
; {
; negate l; // make sure l is positive //
; }
;
; make Sign reflect any sign change;
;
;
; if (Numer < 0)
; {
; negate Numer; // make sure Numer is positive //
; }
;
; make Sign reflect any sign change;
;
; Numer *= l;
; Numer += (Denom/2); // adjust for rounding //
;
; if (overflow) // check for overflow, and handle divide by zero //
; {
; jump to md5;
; }
;
; result = Numer/Denom;
;
; if (overflow) // check again to see if overflow occured //
; {
; jump to md5;
; }
;
; if (Sign is negative) // put sign on the result //
; {
; negate result;
; }
;
;md6:
; return(result);
;
;md5:
; DX = 7FFF; // indicate overflow by //
; AX = 0xFFFF // return largest integer //
; if (Sign is negative)
; {
; DX = 0x8000; // with correct sign //
; AX = 0x0000;
; }
;
; jump to md6;
; }
;-----------------------------------------------------------------------;
assumes ds,nothing
assumes es,nothing
cProc muldiv32,<PUBLIC,FAR,NODATA,NONWIN>,<>
; ParmD lNumber
; ParmD lNumerator
; ParmD lDenominator
cBegin <nogen>
mov ax,__WinFlags
test ax,WF_CPU286+WF_CPU086+WF_CPU186
jz md32_1
jmp NEAR PTR muldiv32_286
md32_1:
errn$ muldiv32_386
cEnd <nogen>
cProc muldiv32_386,<PUBLIC,FAR,NODATA,NONWIN>,<>
ParmD lNumber
ParmD lNumerator
ParmD lDenominator
cBegin
.386
mov ebx,lDenominator ; get the demoninator
mov ecx,ebx ; ECX holds the final sign in hiword
or ebx,ebx ; ensure the denominator is positive
jns md386_1
neg ebx
md386_1:
mov eax,lNumber ; get the long we are multiplying
xor ecx,eax ; make ECX reflect any sign change
or eax,eax ; ensure the long is positive
jns md386_2
neg eax
md386_2:
mov edx,lNumerator ; get the numerator
xor ecx,edx ; make ECX reflect any sign change
or edx,edx ; ensure the numerator is positive
jns md386_3
neg edx
md386_3:
mul edx ; multiply
mov cx,bx ; get half of the demoninator to adjust for rounding
sar ebx,1
add eax,ebx ; adjust for possible rounding error
adc edx,0 ; this is really a long addition
sal ebx,1 ; restore the demoninator
or bx,cx ; fix bottom bit
cmp edx,ebx ; check for overflow
jae md386_5 ; (ae handles /0 case)
div ebx ; divide
or eax,eax ; If sign is set, then overflow occured
js md386_5 ; Overflow.
or ecx,ecx ; put the sign on the result
jns md386_6
neg eax
md386_6:
EAXtoDXAX ; convert eax to dx:ax for 16 bit programs
.286
cEnd
.386
md386_5:
mov eax,7FFFFFFFh ; return the largest integer
or ecx,ecx ; with the correct sign
jns md386_6
not eax
jmp md386_6
.286
cProc muldiv32_286,<PUBLIC,FAR,NODATA,NONWIN>,<di,si>
ParmD lNumber
ParmD lNumerator
ParmD lDenominator
LocalW wSign
cBegin
mov dx,lDenominator.hi ; get the demoninator
mov si,dx ; SI holds the final sign
or dx,dx ; ensure the denominator is positive
jns md286_1
neg32 dx, lDenominator.lo
mov lDenominator.hi, dx
md286_1:
mov ax,lNumber.lo ; get the long we are multiplying
mov dx,lNumber.hi
xor si,dx ; make ECX reflect any sign change
or dx,dx ; ensure the long is positive
jns md286_2
neg32 dx, ax
md286_2:
mov bx,lNumerator.lo ; get the numerator
mov cx,lNumerator.hi ; get the numerator
xor si,cx ; make ECX reflect any sign change
or cx,cx ; ensure the numerator is positive
jns md286_3
neg32 cx, bx
md286_3:
mov wSign, si ; save sign
call dmul ; multiply (result in dx:cx:bx:ax)
mov si, lDenominator.hi
mov di, lDenominator.lo
sar si, 1 ; get half of the demoninator
rcr di, 1 ; to adjust for rounding
add ax, di ; adjust for possible rounding error
adc bx, si
adc cx, 0
adc dx, 0 ; this is really a long addition
sal di, 1 ; restore the demoninator
rcl si, 1
or di, lDenominator.lo ; fix bottom bit
cmp dx, si ; begin overflow check (unsigned for div 0 check)
ja md286_5 ; overflow
jb md286_7 ; no overflow
cmp cx, di
jae md286_5 ; overflow
md286_7:
call qdiv ; DX:AX is quotient
or dx,dx ; If sign is set, then overflow occured
js md286_5 ; Overflow.
mov cx, wSign
or cx,cx ; put the sign on the result
jns md286_6
neg32 dx,ax
md286_6:
cEnd
md286_5:
mov cx, wSign
mov ax, 0FFFFh ; return the largest integer
mov dx, 7FFFh
or cx, cx ; with the correct sign
jns md286_6
not dx
not ax
jmp md286_6
;---------------------------Public-Routine------------------------------;
; idmul
;
; This is an extended precision multiply routine, intended to emulate
; 80386 imul instruction.
;
; Entry:
; DX:AX = LONG
; CX:BX = LONG
; Returns:
; DX:CX:BX:AX = QUAD product
; Registers Destroyed:
; none
; History:
; Tue 26-Jan-1988 23:47:02 -by- Charles Whitmer [chuckwh]
; Wrote it.
;-----------------------------------------------------------------------;
assumes ds,nothing
assumes es,nothing
cProc idmul,<PUBLIC,NEAR>,<si,di>
localQ qTemp
cBegin
; put one argument in safe registers
mov si,dx
mov di,ax
; do the low order unsigned product
mul bx
mov qTemp.uq0,ax
mov qTemp.uq1,dx
; do the high order signed product
mov ax,si
imul cx
mov qTemp.uq2,ax
mov qTemp.uq3,dx
; do a mixed product
mov ax,si
cwd
and dx,bx
sub qTemp.uq2,dx ; adjust for sign bit
sbb qTemp.uq3,0
mul bx
add qTemp.uq1,ax
adc qTemp.uq2,dx
adc qTemp.uq3,0
; do the other mixed product
mov ax,cx
cwd
and dx,di
sub qTemp.uq2,dx
sbb qTemp.uq3,0
mul di
; pick up the answer
mov bx,ax
mov cx,dx
xor dx,dx
mov ax,qTemp.uq0
add bx,qTemp.uq1
adc cx,qTemp.uq2
adc dx,qTemp.uq3
cEnd
;---------------------------Public-Routine------------------------------;
; dmul
;
; This is an extended precision multiply routine, intended to emulate
; 80386 mul instruction.
;
; Entry:
; DX:AX = LONG
; CX:BX = LONG
; Returns:
; DX:CX:BX:AX = QUAD product
; Registers Destroyed:
; none
; History:
; Tue 02-Feb-1988 10:50:44 -by- Charles Whitmer [chuckwh]
; Copied from idmul and modified.
;-----------------------------------------------------------------------;
assumes ds,nothing
assumes es,nothing
cProc dmul,<PUBLIC,NEAR>,<si,di>
localQ qTemp
cBegin
; put one argument in safe registers
mov si,dx
mov di,ax
; do the low order product
mul bx
mov qTemp.uq0,ax
mov qTemp.uq1,dx
; do the high order product
mov ax,si
mul cx
mov qTemp.uq2,ax
mov qTemp.uq3,dx
; do a mixed product
mov ax,si
mul bx
add qTemp.uq1,ax
adc qTemp.uq2,dx
adc qTemp.uq3,0
; do the other mixed product
mov ax,cx
mul di
; pick up the answer
mov bx,ax
mov cx,dx
xor dx,dx
mov ax,qTemp.uq0
add bx,qTemp.uq1
adc cx,qTemp.uq2
adc dx,qTemp.uq3
cEnd
;---------------------------Public-Routine------------------------------;
; iqdiv
;
; This is an extended precision divide routine which is intended to
; emulate the 80386 64 bit/32 bit IDIV instruction. We don't have the
; 32 bit registers to work with, but we pack the arguments and results
; into what registers we do have. We will divide two signed numbers
; and return the quotient and remainder. We will do INT 0 for overflow,
; just like the 80386 microcode. This should ease conversion later.
;
; This routine just keeps track of the signs and calls qdiv to do the
; real work.
;
; Entry:
; DX:CX:BX:AX = QUAD Numerator
; SI:DI = LONG Denominator
; Returns:
; DX:AX = quotient
; CX:BX = remainder
; Registers Destroyed:
; DI,SI
; History:
; Tue 26-Jan-1988 02:49:19 -by- Charles Whitmer [chuckwh]
; Wrote it.
;-----------------------------------------------------------------------;
WIMP equ 1
IQDIV_RESULT_SIGN equ 1
IQDIV_REM_SIGN equ 2
assumes ds,nothing
assumes es,nothing
cProc iqdiv,<PUBLIC,NEAR>
localB flags
cBegin
mov flags,0
; take the absolute value of the denominator
or si,si
jns denominator_is_cool
xor flags,IQDIV_RESULT_SIGN
neg di
adc si,0
neg si
denominator_is_cool:
; take the absolute value of the denominator
or dx,dx
jns numerator_is_cool
xor flags,IQDIV_RESULT_SIGN + IQDIV_REM_SIGN
not ax
not bx
not cx
not dx
add ax,1
adc bx,0
adc cx,0
adc dx,0
numerator_is_cool:
; do the unsigned division
call qdiv
ifdef WIMP
jo iqdiv_exit
endif
; check for overflow
or dx,dx
jns have_a_bit_to_spare
ifdef WIMP
mov ax,8000h
dec ah
jmp short iqdiv_exit
else
int 0 ; You're toast, Jack!
endif
have_a_bit_to_spare:
; negate the result, if required
test flags,IQDIV_RESULT_SIGN
jz result_is_done
neg ax
adc dx,0
neg dx
result_is_done:
; negate the remainder, if required
test flags,IQDIV_REM_SIGN
jz remainder_is_done
neg bx
adc cx,0
neg cx
remainder_is_done:
iqdiv_exit:
cEnd
;---------------------------Public-Routine------------------------------;
; qdiv
;
; This is an extended precision divide routine which is intended to
; emulate the 80386 64 bit/32 bit DIV instruction. We don't have the
; 32 bit registers to work with, but we pack the arguments and results
; into what registers we do have. We will divide two unsigned numbers
; and return the quotient and remainder. We will do INT 0 for overflow,
; just like the 80386 microcode. This should ease conversion later.
;
; Entry:
; DX:CX:BX:AX = UQUAD Numerator
; SI:DI = ULONG Denominator
; Returns:
; DX:AX = quotient
; CX:BX = remainder
; Registers Destroyed:
; none
; History:
; Tue 26-Jan-1988 00:02:09 -by- Charles Whitmer [chuckwh]
; Wrote it.
;-----------------------------------------------------------------------;
assumes ds,nothing
assumes es,nothing
cProc qdiv,<PUBLIC,NEAR>,<si,di>
localQ uqNumerator
localD ulDenominator
localD ulQuotient
localW cShift
cBegin
; stuff the quad word into local memory
mov uqNumerator.uq0,ax
mov uqNumerator.uq1,bx
mov uqNumerator.uq2,cx
mov uqNumerator.uq3,dx
; check for overflow
qdiv_restart:
cmp si,dx
ja qdiv_no_overflow
jb qdiv_overflow
cmp di,cx
ja qdiv_no_overflow
qdiv_overflow:
ifdef WIMP
mov ax,8000h
dec ah
jmp qdiv_exit
else
int 0 ; You're toast, Jack!
jmp qdiv_restart
endif
qdiv_no_overflow:
; check for a zero Numerator
or ax,bx
or ax,cx
or ax,dx
jz qdiv_exit_relay ; quotient = remainder = 0
; handle the special case when the denominator lives in the low word
or si,si
jnz not_that_special
; calculate (DX=0):CX:BX:uqNumerator.uq0 / (SI=0):DI
cmp di,1 ; separate out the trivial case
jz div_by_one
xchg dx,cx ; CX = remainder.hi = 0
mov ax,bx
div di
mov bx,ax ; BX = quotient.hi
mov ax,uqNumerator.uq0
div di ; AX = quotient.lo
xchg bx,dx ; DX = quotient.hi, BX = remainder.lo
ifdef WIMP
or ax,ax ; clear OF
endif
qdiv_exit_relay:
jmp qdiv_exit
; calculate (DX=0):(CX=0):BX:uqNumerator.uq0 / (SI=0):(DI=1)
div_by_one:
xchg dx,bx ; DX = quotient.hi, BX = remainder.lo = 0
mov ax,uqNumerator.uq0 ; AX = quotient.lo
jmp qdiv_exit
not_that_special:
; handle the special case when the denominator lives in the high word
or di,di
jnz not_this_special_either
; calculate DX:CX:BX:uqNumerator.uq0 / SI:(DI=0)
cmp si,1 ; separate out the trivial case
jz div_by_10000h
mov ax,cx
div si
mov cx,ax ; CX = quotient.hi
mov ax,bx
div si ; AX = quotient.lo
xchg cx,dx ; DX = quotient.hi, CX = remainder.hi
mov bx,uqNumerator.uq0 ; BX = remainder.lo
ifdef WIMP
or ax,ax ; clear OF
endif
jmp qdiv_exit
; calculate (DX=0):CX:BX:uqNumerator.uq0 / (SI=1):(DI=0)
div_by_10000h:
xchg cx,dx ; DX = quotient.hi, CX = remainder.hi = 0
mov ax,bx ; AX = quotient.lo
mov bx,uqNumerator.uq0 ; BX = remainder.lo
jmp qdiv_exit
not_this_special_either:
; normalize the denominator
mov dx,si
mov ax,di
call ulNormalize ; DX:AX = normalized denominator
mov cShift,cx ; CX < 16
mov ulDenominator.lo,ax
mov ulDenominator.hi,dx
; shift the Numerator by the same amount
jcxz numerator_is_shifted
mov si,-1
shl si,cl
not si ; SI = mask
mov bx,uqNumerator.uq3
shl bx,cl
mov ax,uqNumerator.uq2
rol ax,cl
mov di,si
and di,ax
or bx,di
mov uqNumerator.uq3,bx
xor ax,di
mov bx,uqNumerator.uq1
rol bx,cl
mov di,si
and di,bx
or ax,di
mov uqNumerator.uq2,ax
xor bx,di
mov ax,uqNumerator.uq0
rol ax,cl
mov di,si
and di,ax
or bx,di
mov uqNumerator.uq1,bx
xor ax,di
mov uqNumerator.uq0,ax
numerator_is_shifted:
; set up registers for division
mov dx,uqNumerator.uq3
mov ax,uqNumerator.uq2
mov di,uqNumerator.uq1
mov cx,ulDenominator.hi
mov bx,ulDenominator.lo
; check for case when Denominator has only 16 bits
or bx,bx
jnz must_do_long_division
div cx
mov si,ax
mov ax,uqNumerator.uq1
div cx
xchg si,dx ; DX:AX = quotient
mov di,uqNumerator.uq0 ; SI:DI = remainder (shifted)
jmp short unshift_remainder
must_do_long_division:
; do the long division, part IZ@NL@%
cmp dx,cx ; we only know that DX:AX < CX:BX!
jb first_division_is_safe
mov ulQuotient.hi,0 ; i.e. 10000h, our guess is too big
mov si,ax
sub si,bx ; ... remainder is negative
jmp short first_adjuster
first_division_is_safe:
div cx
mov ulQuotient.hi,ax
mov si,dx
mul bx ; fix remainder for low order term
sub di,ax
sbb si,dx
jnc first_adjuster_done ; The remainder is UNSIGNED! We have
first_adjuster: ; to use the carry flag to keep track
dec ulQuotient.hi ; of the sign. The adjuster loop
add di,bx ; watches for a change to the carry
adc si,cx ; flag which would indicate a sign
jnc first_adjuster ; change IF we had more bits to keep
first_adjuster_done: ; a sign in.
; do the long division, part II
mov dx,si
mov ax,di
mov di,uqNumerator.uq0
cmp dx,cx ; we only know that DX:AX < CX:BX!
jb second_division_is_safe
mov ulQuotient.lo,0 ; i.e. 10000h, our guess is too big
mov si,ax
sub si,bx ; ... remainder is negative
jmp short second_adjuster
second_division_is_safe:
div cx
mov ulQuotient.lo,ax
mov si,dx
mul bx ; fix remainder for low order term
sub di,ax
sbb si,dx
jnc second_adjuster_done
second_adjuster:
dec ulQuotient.lo
add di,bx
adc si,cx
jnc second_adjuster
second_adjuster_done:
mov ax,ulQuotient.lo
mov dx,ulQuotient.hi
; unshift the remainder in SI:DI
unshift_remainder:
mov cx,cShift
jcxz remainder_unshifted
mov bx,-1
shr bx,cl
not bx
shr di,cl
ror si,cl
and bx,si
or di,bx
xor si,bx
remainder_unshifted:
mov cx,si
mov bx,di
ifdef WIMP
or ax,ax ; clear OF
endif
qdiv_exit:
cEnd
;---------------------------Public-Routine------------------------------;
; ulNormalize
;
; Normalizes a ULONG so that the highest order bit is 1. Returns the
; number of shifts done. Also returns ZF=1 if the ULONG was zero.
;
; Entry:
; DX:AX = ULONG
; Returns:
; DX:AX = normalized ULONG
; CX = shift count
; ZF = 1 if the ULONG is zero, 0 otherwise
; Registers Destroyed:
; none
; History:
; Mon 25-Jan-1988 22:07:03 -by- Charles Whitmer [chuckwh]
; Wrote it.
;-----------------------------------------------------------------------;
assumes ds,nothing
assumes es,nothing
cProc ulNormalize,<PUBLIC,NEAR>
cBegin
; shift by words
xor cx,cx
or dx,dx
js ulNormalize_exit
jnz top_word_ok
xchg ax,dx
or dx,dx
jz ulNormalize_exit ; the zero exit
mov cl,16
js ulNormalize_exit
top_word_ok:
; shift by bytes
or dh,dh
jnz top_byte_ok
xchg dh,dl
xchg dl,ah
xchg ah,al
add cl,8
or dh,dh
js ulNormalize_exit
top_byte_ok:
; do the rest by bits
inc cx
add ax,ax
adc dx,dx
js ulNormalize_exit
inc cx
add ax,ax
adc dx,dx
js ulNormalize_exit
inc cx
add ax,ax
adc dx,dx
js ulNormalize_exit
inc cx
add ax,ax
adc dx,dx
js ulNormalize_exit
inc cx
add ax,ax
adc dx,dx
js ulNormalize_exit
inc cx
add ax,ax
adc dx,dx
js ulNormalize_exit
inc cx
add ax,ax
adc dx,dx
ulNormalize_exit:
cEnd
sEnd CodeSeg
end