Annotation of 41BSD/libc/gen/atof.s, revision 1.1

1.1     ! root        1: #
        !             2: #      atof: convert ascii to floating
        !             3: #
        !             4: #      C usage:
        !             5: #
        !             6: #              double atof (s)
        !             7: #              char *s;
        !             8: #
        !             9: #      Register usage:
        !            10: #
        !            11: #              r0-1:   value being developed
        !            12: #              r2:     first section: pointer to the next character
        !            13: #                      second section: binary exponent
        !            14: #              r3:     flags
        !            15: #              r4:     first section: the current character
        !            16: #                      second section: scratch
        !            17: #              r5:     the decimal exponent
        !            18: #              r6-7:   scratch
        !            19: #
        !            20: #      Flag definitions
        !            21: #
        !            22:        .set    msign,0         # mantissa has negative sign
        !            23:        .set    esign,1         # exponent has negative sign
        !            24:        .set    decpt,2         # decimal point encountered
        !            25: 
        !            26:        .align  2
        !            27: two31: .word   0x5000          # 2 ** 31
        !            28:        .word   0               # (=2147483648)
        !            29:        .word   0               # in floating-point
        !            30:        .word   0               # (so atof doesn't have to convert it)
        !            31: #
        !            32: #      Entry point
        !            33: #
        !            34:        .text
        !            35:        .align 2
        !            36:        .globl  _atof
        !            37: _atof: .word   0x00c0          # Save r7, r6 (we use r0-r7)
        !            38: #
        !            39: #      Initialization
        !            40: #
        !            41:        clrl    r3              # All flags start out false
        !            42:        movl    4(ap),r2        # Address the first character
        !            43:        clrl    r5              # Clear starting exponent
        !            44: #
        !            45: #      Skip leading white space
        !            46: #
        !            47: sk0:   movzbl  (r2)+,r4        # Fetch the next (first) character
        !            48:        cmpb    $' ,r4          # Is it blank?
        !            49:        jeql    sk0             #   ...yes
        !            50:        cmpb    r4,$8           # 8 is lowest of white-space group
        !            51:        jlss    sk1             # Jump if char too low to be white space
        !            52:        cmpb    r4,$13          # 13 is highest of white-space group
        !            53:        jleq    sk0             # Jump if character is white space
        !            54: sk1:
        !            55: #
        !            56: #      Check for a sign
        !            57: #
        !            58:        cmpb    $'+,r4          # Positive sign?
        !            59:        jeql    cs1             #   ... yes
        !            60:        cmpb    $'-,r4          # Negative sign?
        !            61:        jneq    cs2             #   ... no
        !            62:        bisb2   $1<msign,r3     # Indicate a negative mantissa
        !            63: cs1:   movzbl  (r2)+,r4        # Skip the character
        !            64: cs2:
        !            65: #
        !            66: #      Accumulate digits, keeping track of the exponent
        !            67: #
        !            68:        clrq    r0              # Clear the accumulator
        !            69: ad0:   cmpb    r4,$'0          # Do we have a digit?
        !            70:        jlss    ad4             #   ... no, too small
        !            71:        cmpb    r4,$'9
        !            72:        jgtr    ad4             #   ... no, too large
        !            73: #
        !            74: #      We got a digit.  Accumulate it
        !            75: #
        !            76:        cmpl    r1,$214748364   # Would this digit cause overflow?
        !            77:        jgeq    ad1             #   ... yes
        !            78: #
        !            79: #      Multiply (r0,r1) by 10.  This is done by developing
        !            80: #      (r0,r1)*2 in (r6,r7), shifting (r0,r1) left three bits,
        !            81: #      and adding the two quadwords.
        !            82: #
        !            83:        ashq    $1,r0,r6        # (r6,r7)=(r0,r1)*2
        !            84:        ashq    $3,r0,r0        # (r0,r1)=(r0,r1)*8
        !            85:        addl2   r6,r0           # Add low halves
        !            86:        adwc    r7,r1           # Add high halves
        !            87: #
        !            88: #      Add in the digit
        !            89: #
        !            90:        subl2   $'0,r4          # Get the digit value
        !            91:        addl2   r4,r0           # Add it into the accumulator
        !            92:        adwc    $0,r1           # Possible carry into high half
        !            93:        jbr     ad2             # Join common code
        !            94: #
        !            95: #      Here when the digit won't fit in the accumulator
        !            96: #
        !            97: ad1:   incl    r5              # Ignore the digit, bump exponent
        !            98: #
        !            99: #      If we have seen a decimal point, decrease the exponent by 1
        !           100: #
        !           101: ad2:   jbc     $decpt,r3,ad3   # Jump if decimal point not seen
        !           102:        decl    r5              # Decrease exponent
        !           103: ad3:
        !           104: #
        !           105: #      Fetch the next character, back for more
        !           106: #
        !           107:        movzbl  (r2)+,r4        # Fetch
        !           108:        jbr     ad0             # Try again
        !           109: #
        !           110: #      Not a digit.  Could it be a decimal point?
        !           111: #
        !           112: ad4:   cmpb    r4,$'.          # If it's not a decimal point, either it's
        !           113:        jneq    ad5             #   the end of the number or the start of
        !           114:                                #   the exponent.
        !           115:        jbcs    $decpt,r3,ad3   # If it IS a decimal point, we record that
        !           116:                                #   we've seen one, and keep collecting
        !           117:                                #   digits if it is the first one.
        !           118: #
        !           119: #      Check for an exponent
        !           120: #
        !           121: ad5:   clrl    r6              # Initialize the exponent accumulator
        !           122: 
        !           123:        cmpb    r4,$'e          # We allow both lower case e
        !           124:        jeql    ex1             #   ... and ...
        !           125:        cmpb    r4,$'E          #   upper-case E
        !           126:        jneq    ex7
        !           127: #
        !           128: #      Does the exponent have a sign?
        !           129: #
        !           130: ex1:   movzbl  (r2)+,r4        # Get next character
        !           131:        cmpb    r4,$'+          # Positive sign?
        !           132:        jeql    ex2             #   ... yes ...
        !           133:        cmpb    r4,$'-          # Negative sign?
        !           134:        jneq    ex3             #   ... no ...
        !           135:        bisb2   $1<esign,r3     # Indicate exponent is negative
        !           136: ex2:   movzbl  (r2)+,r4        # Grab the next character
        !           137: #
        !           138: #      Accumulate exponent digits in r6
        !           139: #
        !           140: ex3:   cmpb    r4,$'0          # A digit is within the range
        !           141:        jlss    ex4             # '0' through
        !           142:        cmpb    r4,$'9          # '9',
        !           143:        jgtr    ex4             # inclusive.
        !           144:        cmpl    r6,$214748364   # Exponent outrageously large already?
        !           145:        jgeq    ex2             #   ... yes
        !           146:        moval   (r6)[r6],r6     # r6 *= 5
        !           147:        movaw   -'0(r4)[r6],r6  # r6 = r6 * 2 + r4 - '0'
        !           148:        jbr     ex2             # Go 'round again
        !           149: ex4:
        !           150: #
        !           151: #      Now get the final exponent and force it within a reasonable
        !           152: #      range so our scaling loops don't take forever for values
        !           153: #      that will ultimately cause overflow or underflow anyway.
        !           154: #      A tight check on over/underflow will be done by ldexp.
        !           155: #
        !           156:        jbc     $esign,r3,ex5   # Jump if exponent not negative
        !           157:        mnegl   r6,r6           # If sign, negate exponent
        !           158: ex5:   addl2   r6,r5           # Add given exponent to calculated exponent
        !           159:        cmpl    r5,$-100        # Absurdly small?
        !           160:        jgtr    ex6             #   ... no
        !           161:        movl    $-100,r5        #   ... yes, force within limit
        !           162: ex6:   cmpl    r5,$100         # Absurdly large?
        !           163:        jlss    ex7             #   ... no
        !           164:        movl    $100,r5         #   ... yes, force within bounds
        !           165: ex7:
        !           166: #
        !           167: #      Our number has now been reduced to a mantissa and an exponent.
        !           168: #      The mantissa is a 63-bit positive binary integer in r0,r1,
        !           169: #      and the exponent is a signed power of 10 in r5.  The msign
        !           170: #      bit in r3 will be on if the mantissa should ultimately be
        !           171: #      considered negative.
        !           172: #
        !           173: #      We now have to convert it to a standard format floating point
        !           174: #      number.  This will be done by accumulating a binary exponent
        !           175: #      in r2, as we progressively get r5 closer to zero.
        !           176: #
        !           177: #      Don't bother scaling if the mantissa is zero
        !           178: #
        !           179:        movq    r0,r0           # Mantissa zero?
        !           180:        jeql    exit            #   ... yes
        !           181: 
        !           182:        clrl    r2              # Initialize binary exponent
        !           183:        tstl    r5              # Which way to scale?
        !           184:        jleq    sd0             # Scale down if decimal exponent <= 0
        !           185: #
        !           186: #      Scale up by "multiplying" r0,r1 by 10 as many times as necessary,
        !           187: #      as follows:
        !           188: #
        !           189: #      Step 1: Shift r0,r1 right as necessary to ensure that no
        !           190: #      overflow can occur when multiplying.
        !           191: #
        !           192: su0:   cmpl    r1,$429496729   # Compare high word to (2**31)/5
        !           193:        jlss    su1             # Jump out if guaranteed safe
        !           194:        ashq    $-1,r0,r0       # Else shift right one bit
        !           195:        incl    r2              #    bump exponent to compensate
        !           196:        jbr     su0             #    and go back to test again.
        !           197: #
        !           198: #      Step 2: Multiply r0,r1 by 5, by appropriate shifting and
        !           199: #      double-precision addition
        !           200: #
        !           201: su1:   ashq    $2,r0,r6        # (r6,r7) := (r0,r1) * 4
        !           202:        addl2   r6,r0           # Add low-order halves
        !           203:        adwc    r7,r1           #   and high-order halves
        !           204: #
        !           205: #      Step 3: Increment the binary exponent to take care of the final
        !           206: #      factor of 2, and go back if we still need to scale more.
        !           207: #
        !           208:        incl    r2              # Increment the exponent
        !           209:        sobgtr  r5,su0          #    and back for more (maybe)
        !           210: 
        !           211:        jbr     cm0             # Merge to build final value
        !           212: 
        !           213: #
        !           214: #      Scale down.  We must "divide" r0,r1 by 10 as many times
        !           215: #      as needed, as follows:
        !           216: #
        !           217: #      Step 0: Right now, the condition codes reflect the state
        !           218: #      of r5.  If it's zero, we are done.
        !           219: #
        !           220: sd0:   jeql    cm0             # If finished, build final number
        !           221: #
        !           222: #      Step 1: Shift r0,r1 left until the high-order bit (not counting
        !           223: #      the sign bit) is nonzero, so that the division will preserve
        !           224: #      as much precision as possible.
        !           225: #
        !           226:        tstl    r1              # Is the entire high-order half zero?
        !           227:        jneq    sd2             #   ...no, go shift one bit at a time
        !           228:        ashq    $30,r0,r0       #   ...yes, shift left 30,
        !           229:        subl2   $30,r2          #   decrement the exponent to compensate,
        !           230:                                #   and now it's known to be safe to shift
        !           231:                                #   at least once more.
        !           232: sd1:   ashq    $1,r0,r0        # Shift (r0,r1) left one, and
        !           233:        decl    r2              #   decrement the exponent to compensate
        !           234: sd2:   jbc     $30,r1,sd1      # If the high-order bit is off, go shift
        !           235: #
        !           236: #      Step 2: Divide the high-order part of (r0,r1) by 5,
        !           237: #      giving a quotient in r1 and a remainder in r7.
        !           238: #
        !           239: sd3:   movl    r1,r6           # Copy the high-order part
        !           240:        clrl    r7              # Zero-extend to 64 bits
        !           241:        ediv    $5,r6,r1,r7     # Divide (cannot overflow)
        !           242: #
        !           243: #      Step 3: Divide the low-order part of (r0,r1) by 5,
        !           244: #      using the remainder from step 2 for rounding.
        !           245: #      Note that the result of this computation is unsigned,
        !           246: #      so we have to allow for the fact that an ordinary division
        !           247: #      by 5 could overflow.  We make allowance by dividing by 10,
        !           248: #      multiplying the quotient by 2, and using the remainder
        !           249: #      to adjust the modified quotient.
        !           250: #
        !           251:        addl3   $2,r0,r6        # Dividend is low part of (r0,r1) plus
        !           252:        adwc    $0,r7           #  2 for rounding plus
        !           253:                                #  (2**32) * previous remainder
        !           254:        ediv    $10,r6,r0,r6    # r0 := quotient, r6 := remainder.
        !           255:        addl2   r0,r0           # Make r0 result of dividing by 5
        !           256:        cmpl    r6,$5           # If remainder is 5 or greater,
        !           257:        jlss    sd4             #   increment the adjustted quotient.
        !           258:        incl    r0
        !           259: #
        !           260: #      Step 4: Increment the decimal exponent, decrement the binary
        !           261: #      exponent (to make the division by 5 into a division by 10),
        !           262: #      and back for another iteration.
        !           263: #
        !           264: sd4:   decl    r2              # Binary exponent
        !           265:        aoblss  $0,r5,sd2
        !           266: #
        !           267: #      We now have the following:
        !           268: #
        !           269: #      r0:     low-order half of a 64-bit integer
        !           270: #      r1:     high-order half of the same 64-bit integer
        !           271: #      r2:     a binary exponent
        !           272: #
        !           273: #      Our final result is the integer represented by (r0,r1)
        !           274: #      multiplied by 2 to the power contained in r2.
        !           275: #      We will transform (r0,r1) into a floating-point value,
        !           276: #      set the sign appropriately, and let ldexp do the
        !           277: #      rest of the work.
        !           278: #
        !           279: #      Step 1: if the high-order bit (excluding the sign) of
        !           280: #      the high-order half (r1) is 1, then we have 63 bits of
        !           281: #      fraction, too many to convert easily.  However, we also
        !           282: #      know we won't need them all, so we will just throw the
        !           283: #      low-order bit away (and adjust the exponent appropriately).
        !           284: #
        !           285: cm0:   jbc     $30,r1,cm1      # jump if no adjustment needed
        !           286:        ashq    $-1,r0,r0       # lose the low-order bit
        !           287:        incl    r2              # increase the exponent to compensate
        !           288: #
        !           289: #      Step 2: split the 62-bit number in (r0,r1) into two
        !           290: #      31-bit positive quantities
        !           291: #
        !           292: cm1:   ashq    $1,r0,r0        # put the high-order bits in r1
        !           293:                                #   and a 0 in the bottom of r0
        !           294:        rotl    $-1,r0,r0       # right-justify the bits in r0
        !           295:                                #   moving the 0 from the ashq
        !           296:                                #   into the sign bit.
        !           297: #
        !           298: #      Step 3: convert both halves to floating point
        !           299: #
        !           300:        cvtld   r0,r6           # low-order part in r6-r7
        !           301:        cvtld   r1,r0           # high-order part in r0-r1
        !           302: #
        !           303: #      Step 4: multiply the high order part by 2**31 and combine them
        !           304: #
        !           305:        muld2   two31,r0        # multiply
        !           306:        addd2   r6,r0           # combine
        !           307: #
        !           308: #      Step 5: if appropriate, negate the floating value
        !           309: #
        !           310:        jbc     $msign,r3,cm2   # Jump if mantissa not signed
        !           311:        mnegd   r0,r0           # If negative, make it so
        !           312: #
        !           313: #      Step 6: call ldexp to complete the job
        !           314: #
        !           315: cm2:   pushl   r2              # Put exponent in parameter list
        !           316:        movd    r0,-(sp)        #    and also mantissa
        !           317:        calls   $3,_ldexp       # go combine them
        !           318: 
        !           319: exit:  ret

unix.superglobalmegacorp.com

This archive runs on limited infrastructure. Preserving old code on modern bandwidth. Automated agents are requested to crawl responsibly.