|
|
1.1 root 1: /*
2: * Copyright (c) 1985 Regents of the University of California.
3: *
4: * Use and reproduction of this software are granted in accordance with
5: * the terms and conditions specified in the Berkeley Software License
6: * Agreement (in particular, this entails acknowledgement of the programs'
7: * source, and inclusion of this notice) with the additional understanding
8: * that all recipients should regard themselves as participants in an
9: * ongoing research project and hence should feel obligated to report
10: * their experiences (good or bad) with these elementary function codes,
11: * using "sendbug 4bsd-bugs@BERKELEY", to the authors.
12: *
13: *
14: * @(#)sqrt.s 1.1 (Berkeley) 8/21/85
15: *
16: * double sqrt(arg) revised August 15,1982
17: * double arg;
18: * if(arg<0.0) { _errno = EDOM; return(<a reserved operand>); }
19: * if arg is a reserved operand it is returned as it is
20: * W. Kahan's magic square root
21: * coded by Heidi Stettner and revised by Emile LeBlanc 8/18/82
22: *
23: * entry points:_d_sqrt address of double arg is on the stack
24: * _sqrt double arg is on the stack
25: */
26: .text
27: .align 1
28: .globl _sqrt
29: .globl _d_sqrt
30: .globl libm$dsqrt_r5
31: .set EDOM,33
32:
33: _d_sqrt:
34: .word 0x003c # save r5,r4,r3,r2
35: movq *4(ap),r0
36: jmp dsqrt2
37: _sqrt:
38: .word 0x003c # save r5,r4,r3,r2
39: movq 4(ap),r0
40: dsqrt2: bicw3 $0x807f,r0,r2 # check exponent of input
41: jeql noexp # biased exponent is zero -> 0.0 or reserved
42: bsbb libm$dsqrt_r5
43: noexp: ret
44:
45: /* **************************** internal procedure */
46:
47: libm$dsqrt_r5: # ENTRY POINT FOR cdabs and cdsqrt
48: # returns double square root scaled by
49: # 2^r6
50:
51: movd r0,r4
52: jleq nonpos # argument is not positive
53: movzwl r4,r2
54: ashl $-1,r2,r0
55: addw2 $0x203c,r0 # r0 has magic initial approximation
56: /*
57: * Do two steps of Heron's rule
58: * ((arg/guess) + guess) / 2 = better guess
59: */
60: divf3 r0,r4,r2
61: addf2 r2,r0
62: subw2 $0x80,r0 # divide by two
63:
64: divf3 r0,r4,r2
65: addf2 r2,r0
66: subw2 $0x80,r0 # divide by two
67:
68: /* Scale argument and approximation to prevent over/underflow */
69:
70: bicw3 $0x807f,r4,r1
71: subw2 $0x4080,r1 # r1 contains scaling factor
72: subw2 r1,r4
73: movl r0,r2
74: subw2 r1,r2
75:
76: /* Cubic step
77: *
78: * b = a + 2*a*(n-a*a)/(n+3*a*a) where b is better approximation,
79: * a is approximation, and n is the original argument.
80: * (let s be scale factor in the following comments)
81: */
82: clrl r1
83: clrl r3
84: muld2 r0,r2 # r2:r3 = a*a/s
85: subd2 r2,r4 # r4:r5 = n/s - a*a/s
86: addw2 $0x100,r2 # r2:r3 = 4*a*a/s
87: addd2 r4,r2 # r2:r3 = n/s + 3*a*a/s
88: muld2 r0,r4 # r4:r5 = a*n/s - a*a*a/s
89: divd2 r2,r4 # r4:r5 = a*(n-a*a)/(n+3*a*a)
90: addw2 $0x80,r4 # r4:r5 = 2*a*(n-a*a)/(n+3*a*a)
91: addd2 r4,r0 # r0:r1 = a + 2*a*(n-a*a)/(n+3*a*a)
92: rsb # DONE!
93: nonpos:
94: jneq negarg
95: ret # argument and root are zero
96: negarg:
97: pushl $EDOM
98: calls $1,_infnan # generate the reserved op fault
99: ret
This archive runs on limited infrastructure. Preserving old code on modern bandwidth. Automated agents are requested to crawl responsibly.