arch/vax/n_cabs.S

1.6  mhitch /*	$NetBSD: n_cabs.S,v 1.6 2008/03/20 16:41:26 mhitch Exp $	*/
1.1   ragge /*
1.1   ragge  * Copyright (c) 1985, 1993
1.1   ragge  *	The Regents of the University of California.  All rights reserved.
1.1   ragge  *
1.1   ragge  * Redistribution and use in source and binary forms, with or without
1.1   ragge  * modification, are permitted provided that the following conditions
1.1   ragge  * are met:
1.1   ragge  * 1. Redistributions of source code must retain the above copyright
1.1   ragge  *    notice, this list of conditions and the following disclaimer.
1.1   ragge  * 2. Redistributions in binary form must reproduce the above copyright
1.1   ragge  *    notice, this list of conditions and the following disclaimer in the
1.1   ragge  *    documentation and/or other materials provided with the distribution.
1.5     agc  * 3. Neither the name of the University nor the names of its contributors
1.1   ragge  *    may be used to endorse or promote products derived from this software
1.1   ragge  *    without specific prior written permission.
1.1   ragge  *
1.1   ragge  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
1.1   ragge  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1.1   ragge  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
1.1   ragge  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
1.1   ragge  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
1.1   ragge  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
1.1   ragge  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
1.1   ragge  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
1.1   ragge  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
1.1   ragge  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
1.1   ragge  * SUCH DAMAGE.
1.1   ragge  *
1.1   ragge  *	@(#)cabs.s	8.1 (Berkeley) 6/4/93
1.1   ragge  */
1.1   ragge
1.3    matt #include <machine/asm.h>
1.3    matt
1.3    matt 	.globl	_C_LABEL(__libm_dsqrt_r5)
1.1   ragge /*
1.1   ragge  * double precision complex absolute value
1.1   ragge  * CABS by W. Kahan, 9/7/80.
1.1   ragge  * Revised for reserved operands by E. LeBlanc, 8/18/82
1.4    matt  * argument for complex absolute value by reference, *4(%ap)
1.4    matt  * argument for cabs and hypot (C fcns) by value, 4(%ap)
1.4    matt  * output is in %r0:%r1 (error less than 0.86 ulps)
1.1   ragge  */
1.1   ragge
1.1   ragge /*	entry for c functions cabs and hypot */
1.6  mhitch #ifdef WEAK_ALIAS
1.6  mhitch WEAK_ALIAS(hypotf, _hypotf)
1.6  mhitch #endif
1.6  mhitch
            /*
             * Single precision wrapper around _hypot: hypotf(x, y).
             *
             * In:   4(%ap) = x, 8(%ap) = y, both F_floating (one longword each).
             * Out:  %r0 = result converted back to F_floating.
             *
             * _hypot reads its first double at 4(%ap) and its second at 12(%ap),
             * so y is widened and pushed first (it ends up at the higher address)
             * and x is pushed last.  Two D_floating values occupy four longwords,
             * hence the CALLS argument count of 4.  Passing only x with a count
             * of 2 would make _hypot fetch y from beyond the argument list.
             */
1.6  mhitch ENTRY(_hypotf, 0)
            	cvtfd	8(%ap),-(%sp)	# push (double)y
1.6  mhitch 	cvtfd	4(%ap),-(%sp)	# push (double)x
            	calls	$4,_C_LABEL(_hypot)	# %r0:1 = hypot(x, y)
1.6  mhitch 	cvtdf	%r0,%r0		# narrow %r0:1 to F_floating in %r0
1.6  mhitch 	ret
1.6  mhitch
1.6  mhitch #ifdef WEAK_ALIAS
1.6  mhitch WEAK_ALIAS(hypot, _hypot)
1.6  mhitch #endif
1.6  mhitch
            /*
             * C entry points: cabs is declared as an alternate entry directly in
             * front of _hypot.  Both double arguments are passed by value in the
             * argument list, x at 4(%ap) and y at 12(%ap).  They are loaded into
             * %r0:%r1 and %r2:%r3 and control then joins the shared code at cabs2.
             *
             * NOTE(review): 0x8040 sets entry-mask bit 6 (save %r6) and bit 15.
             * The VAX architecture defines bit 15 of an entry mask as the
             * decimal-overflow trap enable, so the "floating overflow" wording in
             * the comment below should be confirmed.
             */
1.3    matt ALTENTRY(cabs)
1.6  mhitch ENTRY(_hypot, 0x8040) 		# save %r6, enable floating overflow
1.4    matt 	movq	4(%ap),%r0	# %r0:1 = x
1.4    matt 	movq	12(%ap),%r2	# %r2:3 = y
1.3    matt 	jbr	cabs2
1.3    matt
1.1   ragge /*	entry for Fortran use, call by:   d = abs(z) */
            /*
             * z_abs receives the address of the (x, y) pair in 4(%ap); x and y are
             * fetched through that pointer and execution falls through into cabs2.
             *
             * cabs2 is shared with the C entry points and expects x in %r0:%r1 and
             * y in %r2:%r3:
             *   - if x is a reserved operand, x is returned unchanged;
             *   - otherwise, if y is a reserved operand, y is returned;
             *   - otherwise regs_set produces the scaled result in %r0:%r1 with
             *     the scale factor in %r6, and the factor is added back into the
             *     exponent field held in the low word of %r0.
             * When that word addition sets the overflow flag, the exponent is
             * first reduced by one (0x80) and the value is then doubled with
             * addd2, so that the floating add is the instruction that overflows.
             */
1.4    matt ENTRY(z_abs, 0x8040)		# save %r6, enable floating overflow
1.4    matt 	movl	4(%ap),%r2	# indirect addressing is necessary here
1.4    matt 	movq	(%r2)+,%r0	# %r0:1 = x
1.4    matt 	movq	(%r2),%r2		# %r2:3 = y
1.1   ragge
1.1   ragge cabs2:
1.4    matt 	bicw3	$0x7f,%r0,%r4	# %r4 has signed biased exp of x
1.4    matt 	cmpw	$0x8000,%r4	# sign bit set with a zero exponent?
1.1   ragge 	jeql	return		# x is a reserved operand, so return it
1.4    matt 	bicw3	$0x7f,%r2,%r5	# %r5 has signed biased exp of y
1.4    matt 	cmpw	$0x8000,%r5	# same reserved operand test for y
1.1   ragge 	jneq	cont		/* y isn't a reserved operand */
1.4    matt 	movq	%r2,%r0		/* return y if it's reserved */
1.1   ragge 	ret
1.1   ragge
1.1   ragge cont:
1.4    matt 	bsbb	regs_set	# %r0:1 = dsqrt(x^2+y^2)/2^%r6
1.4    matt 	addw2	%r6,%r0		# unscaled cdabs in %r0:1
1.1   ragge 	jvc	return		# unless it overflows
1.4    matt 	subw2	$0x80,%r0	# halve %r0 to get meaningful overflow
1.4    matt 	addd2	%r0,%r0		# overflow; %r0 is half of true abs value
1.1   ragge return:
1.1   ragge 	ret
1.1   ragge
1.3    matt ENTRY(__libm_cdabs_r6,0)	# ENTRY POINT for cdsqrt
1.4    matt 				# calculates a scaled (factor in %r6)
1.1   ragge 				# complex absolute value
            /*
             * In:   %r4 points at two consecutive doubles, x then y.
             * Out:  through regs_set, %r0:%r1 holds the scaled absolute value and
             *       %r6 the scale factor for the exponent field.
             * Uses: %r0-%r6 (the pointer in %r4 is consumed).
             *
             * If x or y is a reserved operand, both values are stored unchanged
             * through the pointer loaded with *4(%ap) and the routine leaves with
             * ret rather than going through regs_set.
             *
             * NOTE(review): the normal path ends in rsb (at retsb) or in the jump
             * to __libm_dsqrt_r5+2, so this routine is presumably entered with
             * jsb past the entry mask word -- confirm against the cdsqrt caller.
             */
1.1   ragge
1.4    matt 	movq	(%r4)+,%r0	# %r0:%r1 = x via indirect addressing
1.4    matt 	movq	(%r4),%r2		# %r2:%r3 = y via indirect addressing
1.1   ragge
1.4    matt 	bicw3	$0x7f,%r0,%r5	# %r5 has signed biased exp of x
1.4    matt 	cmpw	$0x8000,%r5	# sign bit set with a zero exponent?
1.1   ragge 	jeql	cdreserved	# x is a reserved operand
1.4    matt 	bicw3	$0x7f,%r2,%r5	# %r5 has signed biased exp of y
1.4    matt 	cmpw	$0x8000,%r5	# same reserved operand test for y
1.1   ragge 	jneq	regs_set	/* y isn't a reserved operand either? */
1.1   ragge
1.1   ragge cdreserved:
1.4    matt 	movl	*4(%ap),%r4	# %r4 -> (u,v), if x or y is reserved
1.4    matt 	movq	%r0,(%r4)+	# copy u and v as is and return
1.4    matt 	movq	%r2,(%r4)		# (again addressing is indirect)
1.1   ragge 	ret
1.1   ragge
1.1   ragge regs_set:
            /*
             * Shared core, entered with x in %r0:%r1 and y in %r2:%r3 after the
             * callers have filtered out reserved operands.  It is left either by
             * rsb at retsb or by the jump into __libm_dsqrt_r5.
             *
             *   1. Clear both sign bits, then swap the operands if needed so
             *      that the one with the larger leading word is in %r0:%r1.
             *   2. Return at once if that operand has a zero exponent field.
             *   3. %r6 = exponent field of x minus 0x4780; subtract %r6 from the
             *      exponent field of x so that 2^14 <= scaled x < 2^15.
             *   4. Return scaled |x| if y is zero, or if y scaled by the same
             *      factor falls below the 0x3780 threshold.
             *   5. Otherwise square both operands with emodd (integer part in
             *      %r4 / %r5, fraction left in the operand registers), add the
             *      pieces together and jump to __libm_dsqrt_r5+2.
             *
             * Uses %r0-%r6.  The caller adds %r6 back to the exponent field.
             * NOTE(review): the +2 presumably skips the entry mask word of
             * __libm_dsqrt_r5 -- confirm against its definition.
             */
1.4    matt 	bicw2	$0x8000,%r0	# %r0:%r1 = dabs(x)
1.4    matt 	bicw2	$0x8000,%r2	# %r2:%r3 = dabs(y)
1.4    matt 	cmpw	%r0,%r2		# compare leading words (exponent first)
1.1   ragge 	jgeq	ordered		# already ordered, no swap needed
1.4    matt 	movq	%r0,%r4
1.4    matt 	movq	%r2,%r0
1.4    matt 	movq	%r4,%r2		# force y's exp <= x's exp
1.1   ragge ordered:
1.4    matt 	bicw3	$0x7f,%r0,%r6	# %r6 = exponent(x) + bias(129)
1.1   ragge 	jeql	retsb		# if x = y = 0 then cdabs(x,y) = 0
1.4    matt 	subw2	$0x4780,%r6	# %r6 = exponent(x) - 14
1.4    matt 	subw2	%r6,%r0		# 2^14 <= scaled x < 2^15
1.4    matt 	bitw	$0xff80,%r2	# any sign or exponent bits set in y?
1.1   ragge 	jeql	retsb		# if y = 0 return dabs(x)
1.4    matt 	subw2	%r6,%r2		# scale y by the same factor as x
1.4    matt 	cmpw	$0x3780,%r2	# if scaled y < 2^-18
1.1   ragge 	jgtr	retsb		#   return dabs(x)
1.4    matt 	emodd	%r0,$0,%r0,%r4,%r0	# %r4 + %r0:1 = scaled x^2
1.4    matt 	emodd	%r2,$0,%r2,%r5,%r2	# %r5 + %r2:3 = scaled y^2
1.4    matt 	addd2	%r2,%r0		# sum of the two fraction parts
1.4    matt 	addl2	%r5,%r4		# sum of the two integer parts
1.4    matt 	cvtld	%r4,%r2		# integer sum as a double
1.4    matt 	addd2	%r2,%r0		# %r0:1 = scaled x^2 + y^2
1.3    matt 	jmp	_C_LABEL(__libm_dsqrt_r5)+2
1.4    matt 				# %r0:1 = dsqrt(x^2+y^2)/2^%r6
1.1   ragge retsb:
1.1   ragge 	rsb			# error < 0.86 ulp