Home | History | Annotate | Line # | Download | only in fpsp
satan.sa revision 1.1
      1 *	MOTOROLA MICROPROCESSOR & MEMORY TECHNOLOGY GROUP
      2 *	M68000 Hi-Performance Microprocessor Division
      3 *	M68040 Software Package 
      4 *
      5 *	M68040 Software Package Copyright (c) 1993, 1994 Motorola Inc.
      6 *	All rights reserved.
      7 *
      8 *	THE SOFTWARE is provided on an "AS IS" basis and without warranty.
      9 *	To the maximum extent permitted by applicable law,
     10 *	MOTOROLA DISCLAIMS ALL WARRANTIES WHETHER EXPRESS OR IMPLIED,
     11 *	INCLUDING IMPLIED WARRANTIES OF MERCHANTABILITY OR FITNESS FOR A
     12 *	PARTICULAR PURPOSE and any warranty against infringement with
     13 *	regard to the SOFTWARE (INCLUDING ANY MODIFIED VERSIONS THEREOF)
     14 *	and any accompanying written materials. 
     15 *
     16 *	To the maximum extent permitted by applicable law,
     17 *	IN NO EVENT SHALL MOTOROLA BE LIABLE FOR ANY DAMAGES WHATSOEVER
     18 *	(INCLUDING WITHOUT LIMITATION, DAMAGES FOR LOSS OF BUSINESS
     19 *	PROFITS, BUSINESS INTERRUPTION, LOSS OF BUSINESS INFORMATION, OR
     20 *	OTHER PECUNIARY LOSS) ARISING OF THE USE OR INABILITY TO USE THE
     21 *	SOFTWARE.  Motorola assumes no responsibility for the maintenance
     22 *	and support of the SOFTWARE.  
     23 *
     24 *	You are hereby granted a copyright license to use, modify, and
     25 *	distribute the SOFTWARE so long as this entire notice is retained
     26 *	without alteration in any modified and/or redistributed versions,
     27 *	and that such modified versions are clearly identified as such.
     28 *	No licenses are granted by implication, estoppel or otherwise
     29 *	under any patents or trademarks of Motorola, Inc.
     30 
     31 *
     32 *	satan.sa 3.3 12/19/90
     33 *
     34 *	The entry point satan computes the arctagent of an
     35 *	input value. satand does the same except the input value is a
     36 *	denormalized number.
     37 *
     38 *	Input: Double-extended value in memory location pointed to by address
     39 *		register a0.
     40 *
     41 *	Output:	Arctan(X) returned in floating-point register Fp0.
     42 *
     43 *	Accuracy and Monotonicity: The returned result is within 2 ulps in
     44 *		64 significant bit, i.e. within 0.5001 ulp to 53 bits if the
     45 *		result is subsequently rounded to double precision. The
     46 *		result is provably monotonic in double precision.
     47 *
     48 *	Speed: The program satan takes approximately 160 cycles for input
     49 *		argument X such that 1/16 < |X| < 16. For the other arguments,
     50 *		the program will run no worse than 10% slower.
     51 *
     52 *	Algorithm:
     53 *	Step 1. If |X| >= 16 or |X| < 1/16, go to Step 5.
     54 *
     55 *	Step 2. Let X = sgn * 2**k * 1.xxxxxxxx...x. Note that k = -4, -3,..., or 3.
     56 *		Define F = sgn * 2**k * 1.xxxx1, i.e. the first 5 significant bits
     57 *		of X with a bit-1 attached at the 6-th bit position. Define u
     58 *		to be u = (X-F) / (1 + X*F).
     59 *
     60 *	Step 3. Approximate arctan(u) by a polynomial poly.
     61 *
     62 *	Step 4. Return arctan(F) + poly, arctan(F) is fetched from a table of values
     63 *		calculated beforehand. Exit.
     64 *
     65 *	Step 5. If |X| >= 16, go to Step 7.
     66 *
     67 *	Step 6. Approximate arctan(X) by an odd polynomial in X. Exit.
     68 *
     69 *	Step 7. Define X' = -1/X. Approximate arctan(X') by an odd polynomial in X'.
     70 *		Arctan(X) = sign(X)*Pi/2 + arctan(X'). Exit.
     71 *
     72 
     73 satan	IDNT	2,1 Motorola 040 Floating Point Software Package
     74 
     75 	section	8
     76 
     77 	include fpsp.h
     78 	
     79 BOUNDS1	DC.L $3FFB8000,$4002FFFF
     80 
     81 ONE	DC.L $3F800000
     82 
     83 	DC.L $00000000
     84 
     85 ATANA3	DC.L $BFF6687E,$314987D8
     86 ATANA2	DC.L $4002AC69,$34A26DB3
     87 
     88 ATANA1	DC.L $BFC2476F,$4E1DA28E
     89 ATANB6	DC.L $3FB34444,$7F876989
     90 
     91 ATANB5	DC.L $BFB744EE,$7FAF45DB
     92 ATANB4	DC.L $3FBC71C6,$46940220
     93 
     94 ATANB3	DC.L $BFC24924,$921872F9
     95 ATANB2	DC.L $3FC99999,$99998FA9
     96 
     97 ATANB1	DC.L $BFD55555,$55555555
     98 ATANC5	DC.L $BFB70BF3,$98539E6A
     99 
    100 ATANC4	DC.L $3FBC7187,$962D1D7D
    101 ATANC3	DC.L $BFC24924,$827107B8
    102 
    103 ATANC2	DC.L $3FC99999,$9996263E
    104 ATANC1	DC.L $BFD55555,$55555536
    105 
    106 PPIBY2	DC.L $3FFF0000,$C90FDAA2,$2168C235,$00000000
    107 NPIBY2	DC.L $BFFF0000,$C90FDAA2,$2168C235,$00000000
    108 PTINY	DC.L $00010000,$80000000,$00000000,$00000000
    109 NTINY	DC.L $80010000,$80000000,$00000000,$00000000
    110 
    111 ATANTBL:
    112 	DC.L	$3FFB0000,$83D152C5,$060B7A51,$00000000
    113 	DC.L	$3FFB0000,$8BC85445,$65498B8B,$00000000
    114 	DC.L	$3FFB0000,$93BE4060,$17626B0D,$00000000
    115 	DC.L	$3FFB0000,$9BB3078D,$35AEC202,$00000000
    116 	DC.L	$3FFB0000,$A3A69A52,$5DDCE7DE,$00000000
    117 	DC.L	$3FFB0000,$AB98E943,$62765619,$00000000
    118 	DC.L	$3FFB0000,$B389E502,$F9C59862,$00000000
    119 	DC.L	$3FFB0000,$BB797E43,$6B09E6FB,$00000000
    120 	DC.L	$3FFB0000,$C367A5C7,$39E5F446,$00000000
    121 	DC.L	$3FFB0000,$CB544C61,$CFF7D5C6,$00000000
    122 	DC.L	$3FFB0000,$D33F62F8,$2488533E,$00000000
    123 	DC.L	$3FFB0000,$DB28DA81,$62404C77,$00000000
    124 	DC.L	$3FFB0000,$E310A407,$8AD34F18,$00000000
    125 	DC.L	$3FFB0000,$EAF6B0A8,$188EE1EB,$00000000
    126 	DC.L	$3FFB0000,$F2DAF194,$9DBE79D5,$00000000
    127 	DC.L	$3FFB0000,$FABD5813,$61D47E3E,$00000000
    128 	DC.L	$3FFC0000,$8346AC21,$0959ECC4,$00000000
    129 	DC.L	$3FFC0000,$8B232A08,$304282D8,$00000000
    130 	DC.L	$3FFC0000,$92FB70B8,$D29AE2F9,$00000000
    131 	DC.L	$3FFC0000,$9ACF476F,$5CCD1CB4,$00000000
    132 	DC.L	$3FFC0000,$A29E7630,$4954F23F,$00000000
    133 	DC.L	$3FFC0000,$AA68C5D0,$8AB85230,$00000000
    134 	DC.L	$3FFC0000,$B22DFFFD,$9D539F83,$00000000
    135 	DC.L	$3FFC0000,$B9EDEF45,$3E900EA5,$00000000
    136 	DC.L	$3FFC0000,$C1A85F1C,$C75E3EA5,$00000000
    137 	DC.L	$3FFC0000,$C95D1BE8,$28138DE6,$00000000
    138 	DC.L	$3FFC0000,$D10BF300,$840D2DE4,$00000000
    139 	DC.L	$3FFC0000,$D8B4B2BA,$6BC05E7A,$00000000
    140 	DC.L	$3FFC0000,$E0572A6B,$B42335F6,$00000000
    141 	DC.L	$3FFC0000,$E7F32A70,$EA9CAA8F,$00000000
    142 	DC.L	$3FFC0000,$EF888432,$64ECEFAA,$00000000
    143 	DC.L	$3FFC0000,$F7170A28,$ECC06666,$00000000
    144 	DC.L	$3FFD0000,$812FD288,$332DAD32,$00000000
    145 	DC.L	$3FFD0000,$88A8D1B1,$218E4D64,$00000000
    146 	DC.L	$3FFD0000,$9012AB3F,$23E4AEE8,$00000000
    147 	DC.L	$3FFD0000,$976CC3D4,$11E7F1B9,$00000000
    148 	DC.L	$3FFD0000,$9EB68949,$3889A227,$00000000
    149 	DC.L	$3FFD0000,$A5EF72C3,$4487361B,$00000000
    150 	DC.L	$3FFD0000,$AD1700BA,$F07A7227,$00000000
    151 	DC.L	$3FFD0000,$B42CBCFA,$FD37EFB7,$00000000
    152 	DC.L	$3FFD0000,$BB303A94,$0BA80F89,$00000000
    153 	DC.L	$3FFD0000,$C22115C6,$FCAEBBAF,$00000000
    154 	DC.L	$3FFD0000,$C8FEF3E6,$86331221,$00000000
    155 	DC.L	$3FFD0000,$CFC98330,$B4000C70,$00000000
    156 	DC.L	$3FFD0000,$D6807AA1,$102C5BF9,$00000000
    157 	DC.L	$3FFD0000,$DD2399BC,$31252AA3,$00000000
    158 	DC.L	$3FFD0000,$E3B2A855,$6B8FC517,$00000000
    159 	DC.L	$3FFD0000,$EA2D764F,$64315989,$00000000
    160 	DC.L	$3FFD0000,$F3BF5BF8,$BAD1A21D,$00000000
    161 	DC.L	$3FFE0000,$801CE39E,$0D205C9A,$00000000
    162 	DC.L	$3FFE0000,$8630A2DA,$DA1ED066,$00000000
    163 	DC.L	$3FFE0000,$8C1AD445,$F3E09B8C,$00000000
    164 	DC.L	$3FFE0000,$91DB8F16,$64F350E2,$00000000
    165 	DC.L	$3FFE0000,$97731420,$365E538C,$00000000
    166 	DC.L	$3FFE0000,$9CE1C8E6,$A0B8CDBA,$00000000
    167 	DC.L	$3FFE0000,$A22832DB,$CADAAE09,$00000000
    168 	DC.L	$3FFE0000,$A746F2DD,$B7602294,$00000000
    169 	DC.L	$3FFE0000,$AC3EC0FB,$997DD6A2,$00000000
    170 	DC.L	$3FFE0000,$B110688A,$EBDC6F6A,$00000000
    171 	DC.L	$3FFE0000,$B5BCC490,$59ECC4B0,$00000000
    172 	DC.L	$3FFE0000,$BA44BC7D,$D470782F,$00000000
    173 	DC.L	$3FFE0000,$BEA94144,$FD049AAC,$00000000
    174 	DC.L	$3FFE0000,$C2EB4ABB,$661628B6,$00000000
    175 	DC.L	$3FFE0000,$C70BD54C,$E602EE14,$00000000
    176 	DC.L	$3FFE0000,$CD000549,$ADEC7159,$00000000
    177 	DC.L	$3FFE0000,$D48457D2,$D8EA4EA3,$00000000
    178 	DC.L	$3FFE0000,$DB948DA7,$12DECE3B,$00000000
    179 	DC.L	$3FFE0000,$E23855F9,$69E8096A,$00000000
    180 	DC.L	$3FFE0000,$E8771129,$C4353259,$00000000
    181 	DC.L	$3FFE0000,$EE57C16E,$0D379C0D,$00000000
    182 	DC.L	$3FFE0000,$F3E10211,$A87C3779,$00000000
    183 	DC.L	$3FFE0000,$F919039D,$758B8D41,$00000000
    184 	DC.L	$3FFE0000,$FE058B8F,$64935FB3,$00000000
    185 	DC.L	$3FFF0000,$8155FB49,$7B685D04,$00000000
    186 	DC.L	$3FFF0000,$83889E35,$49D108E1,$00000000
    187 	DC.L	$3FFF0000,$859CFA76,$511D724B,$00000000
    188 	DC.L	$3FFF0000,$87952ECF,$FF8131E7,$00000000
    189 	DC.L	$3FFF0000,$89732FD1,$9557641B,$00000000
    190 	DC.L	$3FFF0000,$8B38CAD1,$01932A35,$00000000
    191 	DC.L	$3FFF0000,$8CE7A8D8,$301EE6B5,$00000000
    192 	DC.L	$3FFF0000,$8F46A39E,$2EAE5281,$00000000
    193 	DC.L	$3FFF0000,$922DA7D7,$91888487,$00000000
    194 	DC.L	$3FFF0000,$94D19FCB,$DEDF5241,$00000000
    195 	DC.L	$3FFF0000,$973AB944,$19D2A08B,$00000000
    196 	DC.L	$3FFF0000,$996FF00E,$08E10B96,$00000000
    197 	DC.L	$3FFF0000,$9B773F95,$12321DA7,$00000000
    198 	DC.L	$3FFF0000,$9D55CC32,$0F935624,$00000000
    199 	DC.L	$3FFF0000,$9F100575,$006CC571,$00000000
    200 	DC.L	$3FFF0000,$A0A9C290,$D97CC06C,$00000000
    201 	DC.L	$3FFF0000,$A22659EB,$EBC0630A,$00000000
    202 	DC.L	$3FFF0000,$A388B4AF,$F6EF0EC9,$00000000
    203 	DC.L	$3FFF0000,$A4D35F10,$61D292C4,$00000000
    204 	DC.L	$3FFF0000,$A60895DC,$FBE3187E,$00000000
    205 	DC.L	$3FFF0000,$A72A51DC,$7367BEAC,$00000000
    206 	DC.L	$3FFF0000,$A83A5153,$0956168F,$00000000
    207 	DC.L	$3FFF0000,$A93A2007,$7539546E,$00000000
    208 	DC.L	$3FFF0000,$AA9E7245,$023B2605,$00000000
    209 	DC.L	$3FFF0000,$AC4C84BA,$6FE4D58F,$00000000
    210 	DC.L	$3FFF0000,$ADCE4A4A,$606B9712,$00000000
    211 	DC.L	$3FFF0000,$AF2A2DCD,$8D263C9C,$00000000
    212 	DC.L	$3FFF0000,$B0656F81,$F22265C7,$00000000
    213 	DC.L	$3FFF0000,$B1846515,$0F71496A,$00000000
    214 	DC.L	$3FFF0000,$B28AAA15,$6F9ADA35,$00000000
    215 	DC.L	$3FFF0000,$B37B44FF,$3766B895,$00000000
    216 	DC.L	$3FFF0000,$B458C3DC,$E9630433,$00000000
    217 	DC.L	$3FFF0000,$B525529D,$562246BD,$00000000
    218 	DC.L	$3FFF0000,$B5E2CCA9,$5F9D88CC,$00000000
    219 	DC.L	$3FFF0000,$B692CADA,$7ACA1ADA,$00000000
    220 	DC.L	$3FFF0000,$B736AEA7,$A6925838,$00000000
    221 	DC.L	$3FFF0000,$B7CFAB28,$7E9F7B36,$00000000
    222 	DC.L	$3FFF0000,$B85ECC66,$CB219835,$00000000
    223 	DC.L	$3FFF0000,$B8E4FD5A,$20A593DA,$00000000
    224 	DC.L	$3FFF0000,$B99F41F6,$4AFF9BB5,$00000000
    225 	DC.L	$3FFF0000,$BA7F1E17,$842BBE7B,$00000000
    226 	DC.L	$3FFF0000,$BB471285,$7637E17D,$00000000
    227 	DC.L	$3FFF0000,$BBFABE8A,$4788DF6F,$00000000
    228 	DC.L	$3FFF0000,$BC9D0FAD,$2B689D79,$00000000
    229 	DC.L	$3FFF0000,$BD306A39,$471ECD86,$00000000
    230 	DC.L	$3FFF0000,$BDB6C731,$856AF18A,$00000000
    231 	DC.L	$3FFF0000,$BE31CAC5,$02E80D70,$00000000
    232 	DC.L	$3FFF0000,$BEA2D55C,$E33194E2,$00000000
    233 	DC.L	$3FFF0000,$BF0B10B7,$C03128F0,$00000000
    234 	DC.L	$3FFF0000,$BF6B7A18,$DACB778D,$00000000
    235 	DC.L	$3FFF0000,$BFC4EA46,$63FA18F6,$00000000
    236 	DC.L	$3FFF0000,$C0181BDE,$8B89A454,$00000000
    237 	DC.L	$3FFF0000,$C065B066,$CFBF6439,$00000000
    238 	DC.L	$3FFF0000,$C0AE345F,$56340AE6,$00000000
    239 	DC.L	$3FFF0000,$C0F22291,$9CB9E6A7,$00000000
    240 
    241 X	equ	FP_SCR1
    242 XDCARE	equ	X+2
    243 XFRAC	equ	X+4
    244 XFRACLO	equ	X+8
    245 
    246 ATANF	equ	FP_SCR2
    247 ATANFHI	equ	ATANF+4
    248 ATANFLO	equ	ATANF+8
    249 
    250 
    251 	xref	t_frcinx
    252 	xref	t_extdnrm
    253 
    254 	xdef	satand
    255 satand:
    256 *--ENTRY POINT FOR ATAN(X) FOR DENORMALIZED ARGUMENT
    257 
    258 	bra		t_extdnrm
    259 
    260 	xdef	satan
    261 satan:
    262 *--ENTRY POINT FOR ATAN(X), HERE X IS FINITE, NON-ZERO, AND NOT NAN'S
    263 
    264 	FMOVE.X		(A0),FP0	...LOAD INPUT
    265 
    266 	MOVE.L		(A0),D0
    267 	MOVE.W		4(A0),D0
    268 	FMOVE.X		FP0,X(a6)
    269 	ANDI.L		#$7FFFFFFF,D0
    270 
    271 	CMPI.L		#$3FFB8000,D0		...|X| >= 1/16?
    272 	BGE.B		ATANOK1
    273 	BRA.W		ATANSM
    274 
    275 ATANOK1:
    276 	CMPI.L		#$4002FFFF,D0		...|X| < 16 ?
    277 	BLE.B		ATANMAIN
    278 	BRA.W		ATANBIG
    279 
    280 
    281 *--THE MOST LIKELY CASE, |X| IN [1/16, 16). WE USE TABLE TECHNIQUE
    282 *--THE IDEA IS ATAN(X) = ATAN(F) + ATAN( [X-F] / [1+XF] ).
    283 *--SO IF F IS CHOSEN TO BE CLOSE TO X AND ATAN(F) IS STORED IN
    284 *--A TABLE, ALL WE NEED IS TO APPROXIMATE ATAN(U) WHERE
    285 *--U = (X-F)/(1+XF) IS SMALL (REMEMBER F IS CLOSE TO X). IT IS
    286 *--TRUE THAT A DIVIDE IS NOW NEEDED, BUT THE APPROXIMATION FOR
    287 *--ATAN(U) IS A VERY SHORT POLYNOMIAL AND THE INDEXING TO
    288 *--FETCH F AND SAVING OF REGISTERS CAN BE ALL HIDED UNDER THE
    289 *--DIVIDE. IN THE END THIS METHOD IS MUCH FASTER THAN A TRADITIONAL
    290 *--ONE. NOTE ALSO THAT THE TRADITIONAL SCHEME THAT APPROXIMATE
    291 *--ATAN(X) DIRECTLY WILL NEED TO USE A RATIONAL APPROXIMATION
    292 *--(DIVISION NEEDED) ANYWAY BECAUSE A POLYNOMIAL APPROXIMATION
    293 *--WILL INVOLVE A VERY LONG POLYNOMIAL.
    294 
    295 *--NOW WE SEE X AS +-2^K * 1.BBBBBBB....B <- 1. + 63 BITS
    296 *--WE CHOSE F TO BE +-2^K * 1.BBBB1
    297 *--THAT IS IT MATCHES THE EXPONENT AND FIRST 5 BITS OF X, THE
    298 *--SIXTH BITS IS SET TO BE 1. SINCE K = -4, -3, ..., 3, THERE
    299 *--ARE ONLY 8 TIMES 16 = 2^7 = 128 |F|'S. SINCE ATAN(-|F|) IS
    300 *-- -ATAN(|F|), WE NEED TO STORE ONLY ATAN(|F|).
    301 
    302 ATANMAIN:
    303 
    304 	MOVE.W		#$0000,XDCARE(a6)	...CLEAN UP X JUST IN CASE
    305 	ANDI.L		#$F8000000,XFRAC(a6)	...FIRST 5 BITS
    306 	ORI.L		#$04000000,XFRAC(a6)	...SET 6-TH BIT TO 1
    307 	MOVE.L		#$00000000,XFRACLO(a6)	...LOCATION OF X IS NOW F
    308 
    309 	FMOVE.X		FP0,FP1			...FP1 IS X
    310 	FMUL.X		X(a6),FP1		...FP1 IS X*F, NOTE THAT X*F > 0
    311 	FSUB.X		X(a6),FP0		...FP0 IS X-F
    312 	FADD.S		#:3F800000,FP1		...FP1 IS 1 + X*F
    313 	FDIV.X		FP1,FP0			...FP0 IS U = (X-F)/(1+X*F)
    314 
    315 *--WHILE THE DIVISION IS TAKING ITS TIME, WE FETCH ATAN(|F|)
    316 *--CREATE ATAN(F) AND STORE IT IN ATANF, AND
    317 *--SAVE REGISTERS FP2.
    318 
    319 	MOVE.L		d2,-(a7)	...SAVE d2 TEMPORARILY
    320 	MOVE.L		d0,d2		...THE EXPO AND 16 BITS OF X
    321 	ANDI.L		#$00007800,d0	...4 VARYING BITS OF F'S FRACTION
    322 	ANDI.L		#$7FFF0000,d2	...EXPONENT OF F
    323 	SUBI.L		#$3FFB0000,d2	...K+4
    324 	ASR.L		#1,d2
    325 	ADD.L		d2,d0		...THE 7 BITS IDENTIFYING F
    326 	ASR.L		#7,d0		...INDEX INTO TBL OF ATAN(|F|)
    327 	LEA		ATANTBL,a1
    328 	ADDA.L		d0,a1		...ADDRESS OF ATAN(|F|)
    329 	MOVE.L		(a1)+,ATANF(a6)
    330 	MOVE.L		(a1)+,ATANFHI(a6)
    331 	MOVE.L		(a1)+,ATANFLO(a6)	...ATANF IS NOW ATAN(|F|)
    332 	MOVE.L		X(a6),d0		...LOAD SIGN AND EXPO. AGAIN
    333 	ANDI.L		#$80000000,d0	...SIGN(F)
    334 	OR.L		d0,ATANF(a6)	...ATANF IS NOW SIGN(F)*ATAN(|F|)
    335 	MOVE.L		(a7)+,d2	...RESTORE d2
    336 
    337 *--THAT'S ALL I HAVE TO DO FOR NOW,
    338 *--BUT ALAS, THE DIVIDE IS STILL CRANKING!
    339 
    340 *--U IN FP0, WE ARE NOW READY TO COMPUTE ATAN(U) AS
    341 *--U + A1*U*V*(A2 + V*(A3 + V)), V = U*U
    342 *--THE POLYNOMIAL MAY LOOK STRANGE, BUT IS NEVERTHELESS CORRECT.
    343 *--THE NATURAL FORM IS U + U*V*(A1 + V*(A2 + V*A3))
    344 *--WHAT WE HAVE HERE IS MERELY	A1 = A3, A2 = A1/A3, A3 = A2/A3.
    345 *--THE REASON FOR THIS REARRANGEMENT IS TO MAKE THE INDEPENDENT
    346 *--PARTS A1*U*V AND (A2 + ... STUFF) MORE LOAD-BALANCED
    347 
    348 	
    349 	FMOVE.X		FP0,FP1
    350 	FMUL.X		FP1,FP1
    351 	FMOVE.D		ATANA3,FP2
    352 	FADD.X		FP1,FP2		...A3+V
    353 	FMUL.X		FP1,FP2		...V*(A3+V)
    354 	FMUL.X		FP0,FP1		...U*V
    355 	FADD.D		ATANA2,FP2	...A2+V*(A3+V)
    356 	FMUL.D		ATANA1,FP1	...A1*U*V
    357 	FMUL.X		FP2,FP1		...A1*U*V*(A2+V*(A3+V))
    358 	
    359 	FADD.X		FP1,FP0		...ATAN(U), FP1 RELEASED
    360 	FMOVE.L		d1,FPCR		;restore users exceptions
    361 	FADD.X		ATANF(a6),FP0	...ATAN(X)
    362 	bra		t_frcinx
    363 
    364 ATANBORS:
    365 *--|X| IS IN d0 IN COMPACT FORM. FP1, d0 SAVED.
    366 *--FP0 IS X AND |X| <= 1/16 OR |X| >= 16.
    367 	CMPI.L		#$3FFF8000,d0
    368 	BGT.W		ATANBIG	...I.E. |X| >= 16
    369 
    370 ATANSM:
    371 *--|X| <= 1/16
    372 *--IF |X| < 2^(-40), RETURN X AS ANSWER. OTHERWISE, APPROXIMATE
    373 *--ATAN(X) BY X + X*Y*(B1+Y*(B2+Y*(B3+Y*(B4+Y*(B5+Y*B6)))))
    374 *--WHICH IS X + X*Y*( [B1+Z*(B3+Z*B5)] + [Y*(B2+Z*(B4+Z*B6)] )
    375 *--WHERE Y = X*X, AND Z = Y*Y.
    376 
    377 	CMPI.L		#$3FD78000,d0
    378 	BLT.W		ATANTINY
    379 *--COMPUTE POLYNOMIAL
    380 	FMUL.X		FP0,FP0	...FP0 IS Y = X*X
    381 
    382 	
    383 	MOVE.W		#$0000,XDCARE(a6)
    384 
    385 	FMOVE.X		FP0,FP1
    386 	FMUL.X		FP1,FP1		...FP1 IS Z = Y*Y
    387 
    388 	FMOVE.D		ATANB6,FP2
    389 	FMOVE.D		ATANB5,FP3
    390 
    391 	FMUL.X		FP1,FP2		...Z*B6
    392 	FMUL.X		FP1,FP3		...Z*B5
    393 
    394 	FADD.D		ATANB4,FP2	...B4+Z*B6
    395 	FADD.D		ATANB3,FP3	...B3+Z*B5
    396 
    397 	FMUL.X		FP1,FP2		...Z*(B4+Z*B6)
    398 	FMUL.X		FP3,FP1		...Z*(B3+Z*B5)
    399 
    400 	FADD.D		ATANB2,FP2	...B2+Z*(B4+Z*B6)
    401 	FADD.D		ATANB1,FP1	...B1+Z*(B3+Z*B5)
    402 
    403 	FMUL.X		FP0,FP2		...Y*(B2+Z*(B4+Z*B6))
    404 	FMUL.X		X(a6),FP0		...X*Y
    405 
    406 	FADD.X		FP2,FP1		...[B1+Z*(B3+Z*B5)]+[Y*(B2+Z*(B4+Z*B6))]
    407 	
    408 
    409 	FMUL.X		FP1,FP0	...X*Y*([B1+Z*(B3+Z*B5)]+[Y*(B2+Z*(B4+Z*B6))])
    410 
    411 	FMOVE.L		d1,FPCR		;restore users exceptions
    412 	FADD.X		X(a6),FP0
    413 
    414 	bra		t_frcinx
    415 
    416 ATANTINY:
    417 *--|X| < 2^(-40), ATAN(X) = X
    418 	MOVE.W		#$0000,XDCARE(a6)
    419 
    420 	FMOVE.L		d1,FPCR		;restore users exceptions
    421 	FMOVE.X		X(a6),FP0	;last inst - possible exception set
    422 
    423 	bra		t_frcinx
    424 
    425 ATANBIG:
    426 *--IF |X| > 2^(100), RETURN	SIGN(X)*(PI/2 - TINY). OTHERWISE,
    427 *--RETURN SIGN(X)*PI/2 + ATAN(-1/X).
    428 	CMPI.L		#$40638000,d0
    429 	BGT.W		ATANHUGE
    430 
    431 *--APPROXIMATE ATAN(-1/X) BY
    432 *--X'+X'*Y*(C1+Y*(C2+Y*(C3+Y*(C4+Y*C5)))), X' = -1/X, Y = X'*X'
    433 *--THIS CAN BE RE-WRITTEN AS
    434 *--X'+X'*Y*( [C1+Z*(C3+Z*C5)] + [Y*(C2+Z*C4)] ), Z = Y*Y.
    435 
    436 	FMOVE.S		#:BF800000,FP1	...LOAD -1
    437 	FDIV.X		FP0,FP1		...FP1 IS -1/X
    438 
    439 	
    440 *--DIVIDE IS STILL CRANKING
    441 
    442 	FMOVE.X		FP1,FP0		...FP0 IS X'
    443 	FMUL.X		FP0,FP0		...FP0 IS Y = X'*X'
    444 	FMOVE.X		FP1,X(a6)		...X IS REALLY X'
    445 
    446 	FMOVE.X		FP0,FP1
    447 	FMUL.X		FP1,FP1		...FP1 IS Z = Y*Y
    448 
    449 	FMOVE.D		ATANC5,FP3
    450 	FMOVE.D		ATANC4,FP2
    451 
    452 	FMUL.X		FP1,FP3		...Z*C5
    453 	FMUL.X		FP1,FP2		...Z*B4
    454 
    455 	FADD.D		ATANC3,FP3	...C3+Z*C5
    456 	FADD.D		ATANC2,FP2	...C2+Z*C4
    457 
    458 	FMUL.X		FP3,FP1		...Z*(C3+Z*C5), FP3 RELEASED
    459 	FMUL.X		FP0,FP2		...Y*(C2+Z*C4)
    460 
    461 	FADD.D		ATANC1,FP1	...C1+Z*(C3+Z*C5)
    462 	FMUL.X		X(a6),FP0		...X'*Y
    463 
    464 	FADD.X		FP2,FP1		...[Y*(C2+Z*C4)]+[C1+Z*(C3+Z*C5)]
    465 	
    466 
    467 	FMUL.X		FP1,FP0		...X'*Y*([B1+Z*(B3+Z*B5)]
    468 *					...	+[Y*(B2+Z*(B4+Z*B6))])
    469 	FADD.X		X(a6),FP0
    470 
    471 	FMOVE.L		d1,FPCR		;restore users exceptions
    472 	
    473 	btst.b		#7,(a0)
    474 	beq.b		pos_big
    475 
    476 neg_big:
    477 	FADD.X		NPIBY2,FP0
    478 	bra		t_frcinx
    479 
    480 pos_big:
    481 	FADD.X		PPIBY2,FP0
    482 	bra		t_frcinx
    483 
    484 ATANHUGE:
    485 *--RETURN SIGN(X)*(PIBY2 - TINY) = SIGN(X)*PIBY2 - SIGN(X)*TINY
    486 	btst.b		#7,(a0)
    487 	beq.b		pos_huge
    488 
    489 neg_huge:
    490 	FMOVE.X		NPIBY2,fp0
    491 	fmove.l		d1,fpcr
    492 	fsub.x		NTINY,fp0
    493 	bra		t_frcinx
    494 
    495 pos_huge:
    496 	FMOVE.X		PPIBY2,fp0
    497 	fmove.l		d1,fpcr
    498 	fsub.x		PTINY,fp0
    499 	bra		t_frcinx
    500 	
    501 	end
    502