coherent/b/lib/libc/crt/i386/ddiv.s - annotate

Return to ddiv.s CVS log
Up to [MW Coherent from dump] / coherent / b / lib / libc / crt / i386
Annotation of coherent/b/lib/libc/crt/i386/ddiv.s, revision 1.1

1.1     ! root        1: //////////
        !             2: / libc/crt/i386/ddiv.s
        !             3: / i386 C runtime library.
        !             4: / IEEE software floating point support.
        !             5: //////////
        !             6: 
        !             7: //////////
        !             8: / double _ddiv(double d)
        !             9: / Return d / %edx:%eax in %edx:%eax.
        !            10: /
        !            11: / double _drdiv(double d)
        !            12: / Return %edx:%eax / d in %edx:%eax.
        !            13: /
        !            14: / The hard part of floating point division is computing the result mantissa,
        !            15: / i.e. the quotient of the numerator mantissa by the denominator mantissa;
        !            16: / all are 53-bit quantities.
        !            17: / We shift the denominator mantissa to make it as large as possible,
        !            18: / then use i386 "divl" (64-bit by 32-bit unsigned integer divide)
        !            19: / twice to find the two quotient dwords efficiently.
        !            20: /
        !            21: / This does not handle denormals, though it could without much trouble.
        !            22: //////////
        !            23: 
        !            24: d      .equ    8                       / EBP offset of stack arg d: lo dword at d, hi dword at d+4
        !            25: BIAS   .equ    1023                    / exponent bias of an IEEE double
        !            26: EXPMASK        .equ    0x7FF00000      / exponent field within the hi dword
        !            27: MANMASK        .equ    0x000FFFFF      / mantissa bits held in the hi dword
        !            28: SGNMASK        .equ    0x80000000      / sign bit within the hi dword
        !            29: HIDDEN .equ    0x00100000              / implicit leading mantissa bit, just above MANMASK
        !            30: 
        !            31:        .globl  _ddiv                   / both entry points are made global
        !            32:        .globl  _drdiv
        !            33: 
        !            34: _ddiv:
        !            35:        xchgl   %edx, 8(%esp)           / swap hi dwords: register operand <-> stack arg d
        !            36:        xchgl   %eax, 4(%esp)           / swap lo dwords: EDX:EAX now holds d, the stack holds the old EDX:EAX
        !            37: /      jmp     _drdiv                  / and fall through to divide
        !            38: 
        !            39: / Numerator is in EDX:EAX, call it A = hiA:loA.
        !            40: / Denominator is on stack, call it B = hiB:loB.
        !            41: / Compute the quotient A/B, call it Q = hiQ:loQ; it is returned in EDX:EAX.
        !            42: _drdiv:
        !            43:        push    %ebp
        !            44:        movl    %ebp, %esp              / EBP = ESP: operands are written destination first
        !            45:        push    %esi
        !            46:        push    %edi
        !            47:        push    %ebx
        !            48:        push    %ecx                    / EBP, ESI, EDI, EBX, ECX are all restored at ?done
        !            49: 
        !            50:        movl    %esi, d+4(%ebp)         / hiB
        !            51:        movl    %edi, d(%ebp)           / B to ESI:EDI
        !            52:                                        / now done with EBP as index register; it is reused as scratch below
        !            53: 
        !            54:        / Compute result sign.
        !            55:        movl    %ebx, %edx              / hiA
        !            56:        xorl    %ebx, %esi              / hiA ^ hiB
        !            57:        andl    %ebx, $SGNMASK          / sign bit is set iff the operand signs differ
        !            58:        push    %ebx                    / save result sign bit; popped by ?pack, ?zero, ?inf or ?NaN
        !            59: 
        !            60:        / Check for special cases +-0.0, +-infinity, NaN on each side.
        !            61:        movl    %ecx, %esi
        !            62:        andl    %ecx, $EXPMASK          / ECX = B exponent field, still in bits 20-30
        !            63:        movl    %ebx, %edx
        !            64:        andl    %ebx, $EXPMASK          / EBX = A exponent field; its ZF is tested next
        !            65:        jz      ?lhszero                / A is 0.0; ignore denormal
        !            66:        cmpl    %ebx, $EXPMASK
        !            67:        jz      ?lhsmax                 / A is +-infinity or NaN
        !            68:        orl     %ecx, %ecx              / test B exponent field for zero
        !            69:        jz      ?inf                    / normal/0.0, return +-infinity; ignore denormal
        !            70:        cmpl    %ecx, $EXPMASK
        !            71:        jz      ?rhsmax                 / normal/+-infinity or normal/NaN
        !            72: 
        !            73:        / Compute probable result exponent in EBX.
        !            74:        / It might get incremented below (so 0 might become 1).
        !            75:        shrl    %ebx, $20               / A biased exp in EBX
        !            76:        shrl    %ecx, $20               / B biased exp in ECX
        !            77:        subl    %ecx, $BIAS-1           / unbiased, fudged: the extra 1 is added back by ?rshift when needed
        !            78:        subl    %ebx, %ecx              / form biased result exponent: expA - expB + BIAS - 1
        !            79:        jl      ?zero                   / underflow, return 0.0
        !            80:        cmpl    %ebx, $EXPMASK>>20
        !            81:        jge     ?inf                    / overflow, return +-infinity
        !            82: 
        !            83:        / Extract the mantissas.
        !            84:        / Shift the denominator mantissa to range 2^63 <= B < 2^64.
        !            85:        andl    %edx, $MANMASK
        !            86:        orl     %edx, $HIDDEN           / extract A mantissa, restore hidden bit
        !            87:        andl    %esi, $MANMASK
        !            88:        orl     %esi, $HIDDEN           / extract B mantissa, restore hidden bit
        !            89:        shld    %esi, %edi, $11         / hiB <<= 11, filled from the top bits of loB
        !            90:        shll    %edi, $11               / shift left, hiB bit 31 (B bit 63) is now 1
        !            91:        jnz     ?hard                   / loB is nonzero (ZF from the shll above)
        !            92: 
        !            93:        / Division is easy when the lo divisor dword is zero:
        !            94:        / perform a 96-bit by 32-bit divide of hiA:loA:0 by hiB to get
        !            95:        / a 64-bit quotient and a 32-bit remainder,
        !            96:        / then zero-extend the remainder to 64 bits.
        !            97:        / hiQ = q1 = A/hiB and r1 = A%hiB, then loQ = q2 = r1:0/hiB.
        !            98:        / This is a special case for efficiency; division by any double with
        !            99:        / up to 32 mantissa bits, notably any int or unsigned, is quite fast.
        !           100:        divl    %esi                    / q1 = A/hiB to EAX, r1 = A%hiB to EDX; cannot overflow since hiA < hiB
        !           101:        movl    %ebp, %eax              / save q1
        !           102:        subl    %eax, %eax              / r1:0 in EDX:EAX
        !           103:        divl    %esi                    / q2 = r1:0/hiB to EAX, r to EDX
        !           104:        xchgl   %ebp, %edx              / result quotient in EDX:EAX
        !           105:        subl    %ecx, %ecx              / r:0 in EBP:ECX
        !           106: 
        !           107:        / The quotient is in EDX:EAX, the remainder is in EBP:ECX.
        !           108:        / Round up the quotient when remainder >= B / 2, i.e. 2*r >= B.
        !           109: ?remtest:
        !           110:        shld    %ebp, %ecx, $1          / 2*hiR, pulling in the top bit of loR; CF = bit shifted out
        !           111:        jc      ?roundup                / too big: 2*r no longer fits in 64 bits, so 2*r > B
        !           112:        cmpl    %ebp, %esi
        !           113:        jb      ?position               / 2*r < B
        !           114:        ja      ?roundup                / 2*r > B, round up
        !           115:        shll    %ecx, $1                / 2*loR (the shld above left ECX unchanged)
        !           116:        cmpl    %ecx, %edi              / hi(2*R) == hiB, compare lo dword
        !           117:        jb      ?position               / 2*r < B
        !           118: 
        !           119:        / Round up the quotient in EDX:EAX.
        !           120: ?roundup:
        !           121:        addl    %eax, $1
        !           122:        adcl    %edx, $0                / propagate the carry into hiQ
        !           123: 
        !           124:        / The quotient in EDX:EAX might be correctly positioned as it stands,
        !           125:        / or it might require a 1-bit right shift.
        !           126: ?position:
        !           127:        testl   %edx, $HIDDEN<<1        / check if shift required
        !           128:        jz      ?pack                   / no shift required
        !           129: ?rshift:
        !           130:        incl    %ebx                    / bump exponent
        !           131:        shrd    %eax, %edx, $1
        !           132:        pushfl                          / save CF for rounding
        !           133:        shrl    %edx, $1                / shift EDX:EAX right by 1 bit
        !           134:        popfl                           / restore CF
        !           135:        adcl    %eax, $0
        !           136:        adcl    %edx, $0                / round if appropriate
        !           137:        testl   %edx, $HIDDEN<<1        / watch out for carry past hidden bit
        !           138:        jnz     ?rshift                 / rounding carried into bit 21: shift once more
        !           139: 
        !           140:        / Pack result mantissa in EDX:EAX with exponent from EBX and sign from stack.
        !           141: ?pack:
        !           142:        orl     %ebx, %ebx              / set flags from the result exponent
        !           143:        jle     ?zero                   / exponent underflow, return 0.0
        !           144:        cmp     %ebx, $EXPMASK>>20      / NOTE(review): spelled "cmp" here but "cmpl" everywhere else - confirm intended
        !           145:        jge     ?inf                    / exponent overflow, return infinity
        !           146:        shll    %ebx, $20               / position exponent
        !           147:        andl    %edx, $MANMASK          / mask off hidden bit
        !           148:        orl     %edx, %ebx              / pack mantissa and exponent
        !           149:        pop     %ecx                    / result sign bit saved at entry
        !           150:        orl     %edx, %ecx              / pack with sign
        !           151: 
        !           152: ?done:
        !           153:        pop     %ecx                    / restore saved registers in reverse push order
        !           154:        pop     %ebx
        !           155:        pop     %edi
        !           156:        pop     %esi
        !           157:        pop     %ebp
        !           158:        ret                             / result is in EDX:EAX
        !           159: 
        !           160: / Numerator is 0.0 (or denormal, ignored here).
        !           161: ?lhszero:
        !           162:        jecxz   ?NaN                    / 0/0, return NaN; ignore denormal
        !           163:        cmpl    %ecx, $EXPMASK          / ECX = B exponent field: is B +-infinity or NaN?
        !           164:        jnz     ?zero                   / 0/normal, return 0.0
        !           165: ?rhsmax:
        !           166:        / Numerator is normal or 0, denominator is +-infinity or NaN.
        !           167:        andl    %esi, $MANMASK          / any mantissa bit set in hiB?
        !           168:        jnz     ?NaN                    / A/NaN, return NaN
        !           169:        orl     %edi, %edi              / any mantissa bit set in loB?
        !           170:        jnz     ?NaN                    / A/NaN, return NaN
        !           171: /      jmp     ?zero                   / 0/+-infinity or normal/+-infinity, return 0.0 
        !           172:                                        / fall through...
        !           173: / Return +0.0; the computed result sign is discarded.
        !           174: ?zero:
        !           175:        pop     %edx                    / pop sign bit and ignore
        !           176:        subl    %edx, %edx              / return 0.0
        !           177: ?zeroeax:
        !           178:        subl    %eax, %eax              / lo dword is zero for 0.0, infinity and NaN alike
        !           179:        jmp     ?done                   / restore registers and return
        !           180: 
        !           181: / Numerator is +-infinity or NaN.
        !           182: ?lhsmax:
        !           183:        andl    %edx, $MANMASK          / any mantissa bit set in hiA?
        !           184:        jnz     ?NaN                    / NaN/B, return NaN
        !           185:        orl     %eax, %eax              / any mantissa bit set in loA?
        !           186:        jnz     ?NaN                    / NaN/B, return NaN
        !           187:        cmpl    %ecx, $EXPMASK          / A is +-infinity; is B +-infinity or NaN?
        !           188:        jz      ?NaN                    / +-infinity/NaN or +-infinity/+-infinity
        !           189: /      jmp     ?inf                    / +-infinity/normal or +-infinity/0, return infinity
        !           190:                                        / fall through...
        !           191:                
        !           192: / Return +-infinity, signed by the result sign bit saved on the stack.
        !           193: ?inf:
        !           194:        pop     %edx                    / pop result sign bit
        !           195:        orl     %edx, $EXPMASK          / max exp, zero mantissa for infinity
        !           196:        jmp     ?zeroeax                / zero the lo dword, then return
        !           197: 
        !           198: / Return NaN; the computed result sign is discarded.
        !           199: ?NaN:
        !           200:        pop     %edx                    / pop sign bit and ignore
        !           201:        movl    %edx, $EXPMASK|MANMASK  / max exp, nonzero mantissa for NaN (hi dword 0x7FFFFFFF)
        !           202:        jmp     ?zeroeax                / zero the lo dword, then return
        !           203: 
        !           204: / The hard case performs a 128-bit by 64-bit division of hiA:loA:0:0
        !           205: / by hiB:loB to get a 64-bit quotient hiQ:loQ and a 64-bit remainder hiR:loR.
        !           206: / Execute the following code twice to compute the two quotient dwords,
        !           207: / saving hiQ in EBP and using it as a termination flag.
        !           208: / Each iteration does a 96-bit by 64-bit divide to get a 32-bit quotient
        !           209: / and a 64-bit remainder.
        !           210: / Use q = A / hiB as a guess at the quotient,
        !           211: / then decrement the remainder r = A % hiB by loB*q.
        !           212: / We may need to decrement q once or twice to get the right quotient.
        !           213: / On entry: A mantissa in EDX:EAX, B mantissa in ESI:EDI, exponent in EBX, sign on the stack.
        !           214: ?hard:
        !           215:        push    %ebx                    / save result exponent
        !           216:        subl    %ebp, %ebp              / clear flag for first pass
        !           217: ?divide:
        !           218:        divl    %esi                    / q = A/hiB to EAX, r = A%hiB to EDX
        !           219:        movl    %ecx, %eax              / save q in ECX
        !           220:        movl    %ebx, %edx              / and save r in EBX
        !           221:        mull    %edi                    / loB*q to EDX:EAX
        !           222:        xchgl   %edx, %ebx              / r to EDX, hi(loB*q) to EBX
        !           223:        negl    %eax                    / 0-lo(loB*q) to EAX; CF is set iff lo(loB*q) is nonzero
        !           224:        sbbl    %edx, %ebx              / EDX:EAX gets r-loB*q
        !           225:        jnc     ?gotcha                 / q is the right quotient (no borrow, remainder is not negative)
        !           226: 
        !           227:        / q is too big a guess, adjust to q' = q-1 and adjust the remainder.
        !           228:        / This gets executed at most twice (because the high bit of B is 1).
        !           229: ?adjust:
        !           230:        decl    %ecx                    / decrement the quotient
        !           231:        addl    %eax, %edi
        !           232:        adcl    %edx, %esi              / add B back to remainder
        !           233:        jnc     ?adjust                 / repeat if still negative (a carry out means it wrapped back to >= 0)
        !           234: 
        !           235:        / The correct dword q is in ECX, the remainder r is in EDX:EAX.
        !           236: ?gotcha:
        !           237:        orl     %ebp, %ebp              / EBP is zero only on the first pass
        !           238:        jz      ?loQ                    / repeat to find loQ
        !           239:        xchgl   %ebp, %edx              / hiQ to EDX, hiR to EBP
        !           240:        xchgl   %ecx, %eax              / q to EDX:EAX, r to EBP:ECX
        !           241:        pop     %ebx                    / restore result exponent
        !           242:        jmp     ?remtest                / round and pack; the sign is on top of the stack again
        !           243: 
        !           244:        / Compute the lo dword of the quotient.
        !           245:        / r is in EDX:EAX, hiQ is in ECX.
        !           246: ?loQ:
        !           247:        movl    %ebp, %ecx              / save hiQ (nonzero) in EBP
        !           248:        cmpl    %edx, %esi              / be wary of overflow on divide
        !           249:        jb      ?divide                 / no overflow, proceed as above
        !           250: 
        !           251:        / Since r is the remainder of the first division by B,
        !           252:        / it must be strictly less than B.  But it is possible that hiR = hiB,
        !           253:        / in which case the divide using "divl" would overflow.
        !           254:        / For this case, use q2 = 0xFFFFFFFF = 2^32 - 1 as the quotient guess.
        !           255:        / Compute the adjusted remainder r2 = r - q2*B as r - 2^32 * B + B.
        !           256:        movl    %ecx, $0xFFFFFFFF       / q2
        !           257:        subl    %eax, %edi              / loR - loB, must be negative
        !           258: /      sbbl    %edx, %esi              / hiR = hiB, so hi dword EDX becomes 0
        !           259:        movl    %edx, %eax              / EDX:EAX *= 2^32; EDX is now negative
        !           260:        movl    %eax, %edi              / 0 + loB
        !           261:        addl    %edx, %esi              / add back B to EDX:EAX
        !           262:        jc      ?gotcha                 / remainder became positive, q2 is ok
        !           263:        jmp     ?adjust                 / remainder stayed negative, adjust q2
        !           264: 
        !           265: / end of libc/crt/i386/ddiv.s
unix.superglobalmegacorp.com
This archive runs on limited infrastructure. Preserving old code on modern bandwidth. Automated agents are requested to crawl responsibly.