arch/vax/n_atan2.S

1.6.22.1    matt /*	n_atan2.S,v 1.6 2003/08/07 16:44:44 agc Exp	*/
     1.1   ragge /*
     1.1   ragge  * Copyright (c) 1985, 1993
     1.1   ragge  *	The Regents of the University of California.  All rights reserved.
     1.1   ragge  *
     1.1   ragge  * Redistribution and use in source and binary forms, with or without
     1.1   ragge  * modification, are permitted provided that the following conditions
     1.1   ragge  * are met:
     1.1   ragge  * 1. Redistributions of source code must retain the above copyright
     1.1   ragge  *    notice, this list of conditions and the following disclaimer.
     1.1   ragge  * 2. Redistributions in binary form must reproduce the above copyright
     1.1   ragge  *    notice, this list of conditions and the following disclaimer in the
     1.1   ragge  *    documentation and/or other materials provided with the distribution.
     1.6     agc  * 3. Neither the name of the University nor the names of its contributors
     1.1   ragge  *    may be used to endorse or promote products derived from this software
     1.1   ragge  *    without specific prior written permission.
     1.1   ragge  *
     1.1   ragge  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     1.1   ragge  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     1.1   ragge  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     1.1   ragge  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     1.1   ragge  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     1.1   ragge  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     1.1   ragge  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     1.1   ragge  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     1.1   ragge  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     1.1   ragge  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     1.1   ragge  * SUCH DAMAGE.
     1.1   ragge  *
     1.1   ragge  *	@(#)atan2.s	8.1 (Berkeley) 6/4/93
     1.1   ragge  */
     1.1   ragge
     1.4    matt #include <machine/asm.h>
     1.4    matt
     1.1   ragge /*
     1.1   ragge  * ATAN2(Y,X)
     1.1   ragge  * RETURN ARG (X+iY)
     1.1   ragge  * VAX D FORMAT (56 BITS PRECISION)
     1.3  simonb  * CODED IN VAX ASSEMBLY LANGUAGE BY K.C. NG, 4/16/85;
     1.3  simonb  *
     1.1   ragge  *
     1.1   ragge  * Method :
     1.1   ragge  *	1. Reduce y to positive by atan2(y,x)=-atan2(-y,x).
     1.3  simonb  *	2. Reduce x to positive by (if x and y are unexceptional):
     1.1   ragge  *		ARG (x+iy) = arctan(y/x)   	   ... if x > 0,
     1.1   ragge  *		ARG (x+iy) = pi - arctan[y/(-x)]   ... if x < 0,
     1.3  simonb  *	3. According to the integer k = 4t+0.25 truncated, where t=y/x, the argument
     1.3  simonb  *	   is further reduced to one of the following intervals and the
     1.1   ragge  *	   arctangent of y/x is evaluated by the corresponding formula:
     1.1   ragge  *
     1.1   ragge  *          [0,7/16]	   atan(y/x) = t - t^3*(a1+t^2*(a2+...(a10+t^2*a11)...)
     1.1   ragge  *	   [7/16,11/16]    atan(y/x) = atan(1/2) + atan( (y-x/2)/(x+y/2) )
     1.1   ragge  *	   [11/16,19/16]   atan(y/x) = atan( 1 ) + atan( (y-x)/(x+y) )
     1.1   ragge  *	   [19/16,39/16]   atan(y/x) = atan(3/2) + atan( (y-1.5x)/(x+1.5y) )
     1.1   ragge  *	   [39/16,INF]     atan(y/x) = atan(INF) + atan( -x/y )
     1.1   ragge  *
     1.1   ragge  * Special cases:
     1.1   ragge  * Notations: atan2(y,x) == ARG (x+iy) == ARG(x,y).
     1.1   ragge  *
     1.1   ragge  *	ARG( NaN , (anything) ) is NaN;
     1.1   ragge  *	ARG( (anything), NaN ) is NaN;
     1.1   ragge  *	ARG(+(anything but NaN), +-0) is +-0  ;
     1.1   ragge  *	ARG(-(anything but NaN), +-0) is +-PI ;
     1.1   ragge  *	ARG( 0, +-(anything but 0 and NaN) ) is +-PI/2;
     1.1   ragge  *	ARG( +INF,+-(anything but INF and NaN) ) is +-0 ;
     1.1   ragge  *	ARG( -INF,+-(anything but INF and NaN) ) is +-PI;
     1.1   ragge  *	ARG( +INF,+-INF ) is +-PI/4 ;
     1.1   ragge  *	ARG( -INF,+-INF ) is +-3PI/4;
     1.1   ragge  *	ARG( (anything but 0, NaN, and INF),+-INF ) is +-PI/2;
     1.1   ragge  *
     1.1   ragge  * Accuracy:
     1.3  simonb  *	atan2(y,x) returns the exact ARG(x+iy) nearly rounded.
     1.1   ragge  */
     1.1   ragge
1.6.22.1    matt #ifdef WEAK_ALIAS
1.6.22.1    matt WEAK_ALIAS(atan2f, _atan2f)
1.6.22.1    matt #endif
1.6.22.1    matt
                 /*
                  * _atan2f(y, x): single-precision front end for _atan2.
                  *
                  * Arguments:	4(%ap) = y, 8(%ap) = x, each read as an F-float longword.
                  * Result:	%r0 (F-float), narrowed from the D-float that _atan2
                  *		leaves in %r0:%r1.
                  *
                  * Both arguments are widened with cvtfd and pushed so that the callee
                  * finds y at 4(%ap) and x at 12(%ap): x goes on the stack first, y
                  * last.  The calls count is 4 because two D-floats occupy four
                  * longwords.  (Pushing only y with a count of 2 would leave the
                  * callee reading x from beyond its argument list.)
                  */
1.6.22.1    matt ENTRY(_atan2f, 0)
                 	cvtfd	8(%ap),-(%sp)		# push (double)x: ends up at 12(%ap) in _atan2
1.6.22.1    matt 	cvtfd	4(%ap),-(%sp)		# push (double)y: ends up at 4(%ap) in _atan2
                 	calls	$4,_C_LABEL(_atan2)	# 4 longwords = two D-float arguments
1.6.22.1    matt 	cvtdf	%r0,%r0			# narrow the D-float result to F-float
1.6.22.1    matt 	ret
1.6.22.1    matt
1.6.22.1    matt #ifdef WEAK_ALIAS
1.6.22.1    matt WEAK_ALIAS(atan2, _atan2)
1.6.22.1    matt #endif
1.6.22.1    matt
                 /*
                  * _atan2(y, x): D-float ARG(x+iy).
                  *
                  * Arguments:	4(%ap)  = y (quadword D-float)
                  *		12(%ap) = x (quadword D-float)
                  * Result:	%r0:%r1 (D-float).  If either argument is the reserved
                  *		operand, the reserved operand pattern 0x8000 is returned.
                  * Entry mask:	0x0fc0 has bits 6-11 set; under the VAX entry-mask
                  *		convention that preserves %r6-%r11, which are used as
                  *		scratch below.
                  * Locals:	-4(%fp) = sign word of y, -8(%fp) = sign word of x
                  *		(8 bytes reserved with subl2 after the reserved-operand
                  *		checks).
                  *
                  * Register roles on the main path:
                  *	%r0:%r1		t = |y/x|, then the reduced argument z, then the result
                  *	%r2:%r3		y (sign stripped, rescaled)
                  *	%r4:%r5		x (sign stripped, rescaled)
                  *	%r6:%r7		Hi part of the interval constant
                  *	%r8:%r9		Lo part of the interval constant
                  *	%r10,%r11	exponent scratch, case index, saved copy of z
                  *
                  * Exponent arithmetic is done directly on the first word of the
                  * D-float: bit 15 is the sign, the exponent sits above the low 7
                  * fraction bits, so one power of two is 0x80 in that word.
                  */
1.6.22.1    matt ENTRY(_atan2, 0x0fc0)
     1.5    matt 	movq	4(%ap),%r2		# %r2:%r3 = y
     1.5    matt 	movq	12(%ap),%r4		# %r4:%r5 = x
     1.5    matt 	bicw3	$0x7f,%r2,%r0		# %r0 = sign and exponent bits of y
     1.5    matt 	bicw3	$0x7f,%r4,%r1		# %r1 = sign and exponent bits of x
     1.5    matt 	cmpw	%r0,$0x8000		# sign set with zero exponent: y is the reserved operand
     1.1   ragge 	jeql	resop
     1.5    matt 	cmpw	%r1,$0x8000		# x is the reserved operand
     1.1   ragge 	jeql	resop
     1.5    matt 	subl2	$8,%sp			# room for the two saved sign words
     1.5    matt 	bicw3	$0x7fff,%r2,-4(%fp)	# copy y sign bit to -4(%fp)
     1.5    matt 	bicw3	$0x7fff,%r4,-8(%fp)	# copy x sign bit to -8(%fp)
     1.5    matt 	cmpd	%r4,$0x4080		# x = 1.0 ?
     1.1   ragge 	bneq	xnot1
                 /* x == 1.0: t is simply |y|, no division or rescaling needed. */
     1.5    matt 	movq	%r2,%r0
     1.5    matt 	bicw2	$0x8000,%r0		# t = |y|
     1.5    matt 	movq	%r0,%r2			# y = |y|
     1.4    matt 	jbr	begin
     1.1   ragge xnot1:
                 /*
                  * General case.  The jeql after each bicw3 tests the exponent field
                  * just extracted: a zero exponent means the operand is zero.  y is
                  * tested before x, so y == 0 goes to yeq0 even when x is also zero.
                  */
     1.5    matt 	bicw3	$0x807f,%r2,%r11		# yexp
     1.1   ragge 	jeql	yeq0			# if y=0 goto yeq0
     1.5    matt 	bicw3	$0x807f,%r4,%r10		# xexp
     1.1   ragge 	jeql	pio2			# if x=0 goto pio2
     1.5    matt 	subw2	%r10,%r11			# k = yexp - xexp
     1.5    matt 	cmpw	%r11,$0x2000		# k >= 64 (exp) ?
     1.1   ragge 	jgeq	pio2			# atan2 = +-pi/2
     1.5    matt 	divd3	%r4,%r2,%r0		# t = y/x  never overflow
     1.5    matt 	bicw2	$0x8000,%r0		# t > 0
     1.5    matt 	bicw2	$0xff80,%r2		# clear the sign and exponent of y
     1.5    matt 	bicw2	$0xff80,%r4		# clear the sign and exponent of x
     1.5    matt 	bisw2	$0x4080,%r2		# normalize y to [1,2)
     1.5    matt 	bisw2	$0x4080,%r4		# normalize x to [1,2)
     1.5    matt 	subw2	%r11,%r4			# scale x so that yexp-xexp=k
     1.1   ragge begin:
                 /*
                  * Pick the reduction interval from t.  t >= 39/16 goes to L50.
                  * Otherwise the index is round(8t) shifted right by one:
                  *	0,1 -> L20   2 -> L30   3,4 -> L40
                  * Larger indices are not in the table; L10 follows the table
                  * directly and handles them (casel continues after the table when
                  * the selector exceeds the limit).
                  */
     1.5    matt 	cmpw	%r0,$0x411c		# t : 39/16
     1.1   ragge 	jgeq	L50
     1.5    matt 	addl3	$0x180,%r0,%r10		# 8*t (exponent field + 3), as an F-float
     1.5    matt 	cvtrfl	%r10,%r10			# [8*t] rounded to int
     1.5    matt 	ashl	$-1,%r10,%r10		# [8*t]/2
     1.5    matt 	casel	%r10,$0,$4
     1.3  simonb L1:
     1.1   ragge 	.word	L20-L1
     1.1   ragge 	.word	L20-L1
     1.1   ragge 	.word	L30-L1
     1.1   ragge 	.word	L40-L1
     1.1   ragge 	.word	L40-L1
     1.3  simonb L10:
                 /* Hi+Lo = atan(3/2); z = (2y-3x)/(2x+3y). */
     1.5    matt 	movq	$0xb4d9940f985e407b,%r6	# Hi=.98279372324732906796d0
     1.5    matt 	movq	$0x21b1879a3bc2a2fc,%r8	# Lo=-.17092002525602665777d-17
     1.5    matt 	subd3	%r4,%r2,%r0		# y-x
     1.5    matt 	addw2	$0x80,%r0		# 2(y-x)
     1.5    matt 	subd2	%r4,%r0			# 2(y-x)-x
     1.5    matt 	addw2	$0x80,%r4		# 2x
     1.5    matt 	movq	%r2,%r10
     1.5    matt 	addw2	$0x80,%r10		# 2y
     1.5    matt 	addd2	%r10,%r2			# 3y
     1.5    matt 	addd2	%r4,%r2			# 3y+2x
     1.5    matt 	divd2	%r2,%r0			# (2y-3x)/(2x+3y)
     1.4    matt 	jbr	L60
     1.3  simonb L20:
                 /* Small t: no offset constant; for t below 2**(-28) return t itself. */
     1.5    matt 	cmpw	%r0,$0x3280		# t : 2**(-28)
     1.1   ragge 	jlss	L80
     1.5    matt 	clrq	%r6			# Hi=%r6=0, Lo=%r8=0
     1.5    matt 	clrq	%r8
     1.4    matt 	jbr	L60
     1.3  simonb L30:
                 /* Hi+Lo = atan(1/2); z = (2y-x)/(2x+y). */
     1.5    matt 	movq	$0xda7b2b0d63383fed,%r6	# Hi=.46364760900080611433d0
     1.5    matt 	movq	$0xf0ea17b2bf912295,%r8	# Lo=.10147340032515978826d-17
     1.5    matt 	movq	%r2,%r0
     1.5    matt 	addw2	$0x80,%r0		# 2y
     1.5    matt 	subd2	%r4,%r0			# 2y-x
     1.5    matt 	addw2	$0x80,%r4		# 2x
     1.5    matt 	addd2	%r2,%r4			# 2x+y
     1.5    matt 	divd2	%r4,%r0 			# (2y-x)/(2x+y)
     1.4    matt 	jbr	L60
     1.3  simonb L50:
                 /*
                  * Hi+Lo = pi/2; z = -x/y.
                  * NOTE(review): under the same first-word encoding that makes
                  * 0x4080 equal 1.0 and 0x3280 equal 2**(-28), the threshold 0x5100
                  * decodes to 2**33, not the 2**57 named in the original comment.
                  * Confirm which value is intended.
                  */
     1.5    matt 	movq	$0x68c2a2210fda40c9,%r6	# Hi=1.5707963267948966135d0
     1.5    matt 	movq	$0x06e0145c26332326,%r8	# Lo=.22517417741562176079d-17
     1.5    matt 	cmpw	%r0,$0x5100		# t : large threshold (see note above)
     1.1   ragge 	bgeq	L90
     1.5    matt 	divd3	%r2,%r4,%r0		# x/y
     1.5    matt 	bisw2	$0x8000,%r0 		# -x/y
     1.4    matt 	jbr	L60
     1.3  simonb L40:
                 /* Hi+Lo = pi/4 = atan(1); z = (y-x)/(y+x). */
     1.5    matt 	movq	$0x68c2a2210fda4049,%r6	# Hi=.78539816339744830676d0
     1.5    matt 	movq	$0x06e0145c263322a6,%r8	# Lo=.11258708870781088040d-17
     1.5    matt 	subd3	%r4,%r2,%r0		# y-x
     1.5    matt 	addd2	%r4,%r2			# y+x
     1.5    matt 	divd2	%r2,%r0			# (y-x)/(y+x)
     1.3  simonb L60:
                 /*
                  * Common evaluation with z in %r0:%r1:
                  *	result = Hi + (z + (Lo - z*P(z*z)))
                  * where P is the degree-12 polynomial whose coefficients are in ptable.
                  */
     1.5    matt 	movq	%r0,%r10			# keep z in %r10:%r11
     1.5    matt 	muld2	%r0,%r0			# z*z
     1.5    matt 	polyd	%r0,$12,ptable		# P(z*z)
     1.5    matt 	muld2	%r10,%r0			# z*P(z*z)
     1.5    matt 	subd2	%r0,%r8			# Lo - z*P(z*z)
     1.5    matt 	addd3	%r8,%r10,%r0		# z + (Lo - z*P(z*z))
     1.5    matt 	addd2	%r6,%r0			# add Hi last
     1.3  simonb L80:
                 /* Quadrant fix-up: %r0:%r1 holds the first-quadrant angle. */
     1.5    matt 	movw	-8(%fp),%r2		# saved sign word of x
     1.1   ragge 	bneq	pim			# x negative: result is pi - angle
     1.5    matt 	bisw2	-4(%fp),%r0		# return sign(y)*%r0
     1.1   ragge 	ret
     1.3  simonb L90:					# t at or above the L50 threshold
     1.5    matt 	movq	%r6,%r0			# result is Hi (pi/2) alone
     1.4    matt 	jbr	L80
     1.1   ragge pim:
     1.5    matt 	subd3	%r0,$0x68c2a2210fda4149,%r0	# pi-t
     1.5    matt 	bisw2	-4(%fp),%r0		# apply sign(y)
     1.1   ragge 	ret
     1.1   ragge yeq0:
                 /* y == 0: return 0 when the x sign word is clear, otherwise pi. */
     1.5    matt 	movw	-8(%fp),%r2
     1.1   ragge 	beql	zero			# if sign(x)=1 return pi
     1.5    matt 	movq	$0x68c2a2210fda4149,%r0	# pi=3.1415926535897932270d0
     1.1   ragge 	ret
     1.1   ragge zero:
     1.5    matt 	clrq	%r0			# return 0
     1.1   ragge 	ret
     1.1   ragge pio2:
                 /* Reached when x == 0 (y nonzero) or when k >= 64. */
     1.5    matt 	movq	$0x68c2a2210fda40c9,%r0	# pi/2=1.5707963267948966135d0
     1.5    matt 	bisw2	-4(%fp),%r0		# return sign(y)*pi/2
     1.1   ragge 	ret
     1.1   ragge resop:
                 /* Reached before the sign words are stored; nothing to undo. */
     1.5    matt 	movq	$0x8000,%r0		# propagate the reserved operand
     1.1   ragge 	ret
     1.4    matt
     1.4    matt 	_ALIGN_TEXT
                 /*
                  * ptable: coefficient table for the `polyd %r0,$12,ptable' in _atan2.
                  *
                  * Thirteen D-float quadwords for a degree-12 polynomial P in z*z.
                  * polyd takes the highest-order coefficient first, so the final
                  * entry is the constant term, which is zero here.  Each .quad holds
                  * the first word of the D-float in its low 16 bits, as with the
                  * immediate constants in _atan2.
                  *
                  * Decoded with that layout, the two entries just before the zero
                  * are approximately -1/5 and +1/3, so z - z*P(z*z) begins
                  * z - z^3/3 + z^5/5.
                  */
     1.1   ragge ptable:
     1.1   ragge 	.quad	0xb50f5ce96e7abd60
     1.1   ragge 	.quad	0x51e44a42c1073e02
     1.1   ragge 	.quad	0x3487e3289643be35
     1.1   ragge 	.quad	0xdb62066dffba3e54
     1.1   ragge 	.quad	0xcf8e2d5199abbe70
     1.1   ragge 	.quad	0x26f39cb884883e88
     1.1   ragge 	.quad	0x135117d18998be9d
     1.1   ragge 	.quad	0x602ce9742e883eba
     1.1   ragge 	.quad	0xa35ad0be8e38bee3
     1.1   ragge 	.quad	0xffac922249243f12
     1.1   ragge 	.quad	0x7f14ccccccccbf4c
     1.1   ragge 	.quad	0xaa8faaaaaaaa3faa
     1.1   ragge 	.quad	0x0000000000000000