config/xtensa/ieee754-sf.S

1.1  mrg /* IEEE-754 single-precision functions for Xtensa
1.1  mrg    Copyright (C) 2006-2013 Free Software Foundation, Inc.
1.1  mrg    Contributed by Bob Wilson (bwilson (at) tensilica.com) at Tensilica.
1.1  mrg
1.1  mrg    This file is part of GCC.
1.1  mrg
1.1  mrg    GCC is free software; you can redistribute it and/or modify it
1.1  mrg    under the terms of the GNU General Public License as published by
1.1  mrg    the Free Software Foundation; either version 3, or (at your option)
1.1  mrg    any later version.
1.1  mrg
1.1  mrg    GCC is distributed in the hope that it will be useful, but WITHOUT
1.1  mrg    ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
1.1  mrg    or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public
1.1  mrg    License for more details.
1.1  mrg
1.1  mrg    Under Section 7 of GPL version 3, you are granted additional
1.1  mrg    permissions described in the GCC Runtime Library Exception, version
1.1  mrg    3.1, as published by the Free Software Foundation.
1.1  mrg
1.1  mrg    You should have received a copy of the GNU General Public License and
1.1  mrg    a copy of the GCC Runtime Library Exception along with this program;
1.1  mrg    see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
1.1  mrg    <http://www.gnu.org/licenses/>.  */
1.1  mrg
1.1  mrg #ifdef __XTENSA_EB__	/* Endian-dependent names for the register pairs
1.1  mrg 			   a2/a3 (x) and a4/a5 (y): when __XTENSA_EB__ is
1.1  mrg 			   defined the "h" name is the lower-numbered
1.1  mrg 			   register of each pair, otherwise it is the
1.1  mrg 			   higher-numbered one.
1.1  mrg 			   NOTE(review): presumably the high/low words of
1.1  mrg 			   64-bit operands; none of these names is
1.1  mrg 			   referenced in the part of the file reviewed
1.1  mrg 			   here -- confirm before relying on or removing
1.1  mrg 			   them.  */
1.1  mrg #define xh a2
1.1  mrg #define xl a3
1.1  mrg #define yh a4
1.1  mrg #define yl a5
1.1  mrg #else
1.1  mrg #define xh a3
1.1  mrg #define xl a2
1.1  mrg #define yh a5
1.1  mrg #define yl a4
1.1  mrg #endif
1.1  mrg
1.1  mrg /*  Warning!  The branch displacements for some Xtensa branch instructions
1.1  mrg     are quite small, and this code has been carefully laid out to keep
1.1  mrg     branch targets in range.  If you change anything, be sure to check that
1.1  mrg     the assembler is not relaxing anything to branch over a jump.  */
1.1  mrg
1.1  mrg #ifdef L_negsf2
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__negsf2
1.1  mrg 	.type	__negsf2, @function
1.1  mrg 	/* __negsf2: negate the single-precision value whose raw bits are
1.1  mrg 	   in a2 and return the result in a2.  Only the sign bit (bit 31)
1.1  mrg 	   is changed, so zeros, subnormals, Infinities and NaNs are
1.1  mrg 	   handled by the same path.  a4 is used as scratch and holds the
1.1  mrg 	   sign-bit mask 0x80000000 on exit.  */
1.1  mrg __negsf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	/* Build the sign-bit mask by shifting a one into bit 31.  */
1.1  mrg 	movi	a4, 1
1.1  mrg 	slli	a4, a4, 31
1.1  mrg 	/* Toggle the sign bit of the argument.  */
1.1  mrg 	xor	a2, a2, a4
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_negsf2 */
1.1  mrg
1.1  mrg #ifdef L_addsubsf3
1.1  mrg
1.1  mrg 	/* Addition */
1.1  mrg __addsf3_aux:
1.1  mrg
1.1  mrg 	/* Handle NaNs and Infinities.  (This code is placed before the
1.1  mrg 	   start of the function just to keep it in range of the limited
1.1  mrg 	   branch displacements.)
1.1  mrg
1.1  mrg 	   Register state when these stubs are entered, as set up by the
1.1  mrg 	   code that branches here: a2 = x, a3 = y, and a6 = 0x7f800000
1.1  mrg 	   (the exponent-field mask).  The result is left in a2.  */
1.1  mrg
1.1  mrg .Ladd_xnan_or_inf:
1.1  mrg 	/* If y is neither Infinity nor NaN, return x.  */
1.1  mrg 	bnall	a3, a6, 1f
1.1  mrg 	/* If x is a NaN, return it.  Otherwise, return y.  */
1.1  mrg 	slli	a7, a2, 9	/* a7 = mantissa bits of x; zero means x is Infinity */
1.1  mrg 	beqz	a7, .Ladd_ynan_or_inf
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Ladd_ynan_or_inf:
1.1  mrg 	/* Return y.  */
1.1  mrg 	mov	a2, a3
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Ladd_opposite_signs:
1.1  mrg 	/* Operand signs differ.  Do a subtraction: flip the sign of y so
1.1  mrg 	   both operands have the same sign and compute x - (-y) with the
1.1  mrg 	   same-sign subtraction code.  */
1.1  mrg 	slli	a7, a6, 8	/* a7 = 0x7f800000 << 8 = 0x80000000 (sign bit) */
1.1  mrg 	xor	a3, a3, a7
1.1  mrg 	j	.Lsub_same_sign
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__addsf3
1.1  mrg 	.type	__addsf3, @function
1.1  mrg __addsf3:	/* Single-precision addition.
1.1  mrg 		   In:  a2 = x, a3 = y (raw IEEE-754 bit patterns).
1.1  mrg 		   Out: a2 = x + y, rounded to nearest with ties to even.
1.1  mrg 		   Scratch registers written below: a6 (exponent mask),
1.1  mrg 		   a7/a8 (sign+exponent fields of x/y), a9 (bits shifted
1.1  mrg 		   out of the smaller operand, kept for rounding), a10.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg
1.1  mrg 	/* Check if the two operands have the same sign.  */
1.1  mrg 	xor	a7, a2, a3
1.1  mrg 	bltz	a7, .Ladd_opposite_signs
1.1  mrg
1.1  mrg .Ladd_same_sign:
1.1  mrg 	/* Check if either exponent == 0x7f8 (i.e., NaN or Infinity).
1.1  mrg 	   (This label is also entered from .Lsub_opposite_signs after the
1.1  mrg 	   sign of y has been flipped.)  */
1.1  mrg 	ball	a2, a6, .Ladd_xnan_or_inf
1.1  mrg 	ball	a3, a6, .Ladd_ynan_or_inf
1.1  mrg
1.1  mrg 	/* Compare the exponents.  The smaller operand will be shifted
1.1  mrg 	   right by the exponent difference and added to the larger
1.1  mrg 	   one.  The 9-bit fields extracted here include the sign bit;
1.1  mrg 	   the signs are equal at this point, so comparing the fields
1.1  mrg 	   compares the exponents.  */
1.1  mrg 	extui	a7, a2, 23, 9
1.1  mrg 	extui	a8, a3, 23, 9
1.1  mrg 	bltu	a7, a8, .Ladd_shiftx
1.1  mrg
1.1  mrg .Ladd_shifty:
1.1  mrg 	/* Check if the smaller (or equal) exponent is zero.  */
1.1  mrg 	bnone	a3, a6, .Ladd_yexpzero
1.1  mrg
1.1  mrg 	/* Replace y sign/exponent with 0x008, i.e., clear the top eight
1.1  mrg 	   bits and leave bit 23 set as the explicit "1.0".  */
1.1  mrg 	or	a3, a3, a6
1.1  mrg 	slli	a3, a3, 8
1.1  mrg 	srli	a3, a3, 8
1.1  mrg
1.1  mrg .Ladd_yexpdiff:
1.1  mrg 	/* Compute the exponent difference.  */
1.1  mrg 	sub	a10, a7, a8
1.1  mrg
1.1  mrg 	/* Exponent difference >= 32 -- just return the bigger value
1.1  mrg 	   (x, which is still intact in a2).  */
1.1  mrg 	bgeui	a10, 32, 1f
1.1  mrg
1.1  mrg 	/* Shift y right by the exponent difference.  Any bits that are
1.1  mrg 	   shifted out of y are saved in a9 for rounding the result.  */
1.1  mrg 	ssr	a10
1.1  mrg 	movi	a9, 0
1.1  mrg 	src	a9, a3, a9
1.1  mrg 	srl	a3, a3
1.1  mrg
1.1  mrg 	/* Do the addition.  */
1.1  mrg 	add	a2, a2, a3
1.1  mrg
1.1  mrg 	/* Check if the add overflowed into the exponent.  */
1.1  mrg 	extui	a10, a2, 23, 9
1.1  mrg 	beq	a10, a7, .Ladd_round
1.1  mrg 	mov	a8, a7		/* .Ladd_carry expects the original exponent in a8 */
1.1  mrg 	j	.Ladd_carry
1.1  mrg
1.1  mrg .Ladd_yexpzero:
1.1  mrg 	/* y is a subnormal value.  Replace its sign/exponent with zero,
1.1  mrg 	   i.e., no implicit "1.0", and increment the apparent exponent
1.1  mrg 	   because subnormals behave as if they had the minimum (nonzero)
1.1  mrg 	   exponent.  Test for the case when both exponents are zero.  */
1.1  mrg 	slli	a3, a3, 9
1.1  mrg 	srli	a3, a3, 9
1.1  mrg 	bnone	a2, a6, .Ladd_bothexpzero
1.1  mrg 	addi	a8, a8, 1
1.1  mrg 	j	.Ladd_yexpdiff
1.1  mrg
1.1  mrg .Ladd_bothexpzero:
1.1  mrg 	/* Both exponents are zero.  Handle this as a special case.  There
1.1  mrg 	   is no need to shift or round, and the normal code for handling
1.1  mrg 	   a carry into the exponent field will not work because it
1.1  mrg 	   assumes there is an implicit "1.0" that needs to be added.  */
1.1  mrg 	add	a2, a2, a3
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Ladd_xexpzero:
1.1  mrg 	/* Same as "yexpzero" except skip handling the case when both
1.1  mrg 	   exponents are zero.  */
1.1  mrg 	slli	a2, a2, 9
1.1  mrg 	srli	a2, a2, 9
1.1  mrg 	addi	a7, a7, 1
1.1  mrg 	j	.Ladd_xexpdiff
1.1  mrg
1.1  mrg .Ladd_shiftx:
1.1  mrg 	/* Same thing as the "shifty" code, but with x and y swapped.  Also,
1.1  mrg 	   because the exponent difference is always nonzero in this version,
1.1  mrg 	   the shift sequence can use SLL and skip loading a constant zero.  */
1.1  mrg 	bnone	a2, a6, .Ladd_xexpzero
1.1  mrg
1.1  mrg 	or	a2, a2, a6
1.1  mrg 	slli	a2, a2, 8
1.1  mrg 	srli	a2, a2, 8
1.1  mrg
1.1  mrg .Ladd_xexpdiff:
1.1  mrg 	sub	a10, a8, a7
1.1  mrg 	bgeui	a10, 32, .Ladd_returny	/* difference >= 32: y dominates */
1.1  mrg
1.1  mrg 	ssr	a10
1.1  mrg 	sll	a9, a2		/* a9 = bits of x that the SRL below shifts out */
1.1  mrg 	srl	a2, a2
1.1  mrg
1.1  mrg 	add	a2, a2, a3
1.1  mrg
1.1  mrg 	/* Check if the add overflowed into the exponent.  */
1.1  mrg 	extui	a10, a2, 23, 9
1.1  mrg 	bne	a10, a8, .Ladd_carry
1.1  mrg
1.1  mrg .Ladd_round:
1.1  mrg 	/* Round up if the leftover fraction is >= 1/2.  (The msb of a9 is
1.1  mrg 	   the first bit that was shifted out.)  */
1.1  mrg 	bgez	a9, 1f
1.1  mrg 	addi	a2, a2, 1
1.1  mrg
1.1  mrg 	/* Check if the leftover fraction is exactly 1/2.  */
1.1  mrg 	slli	a9, a9, 1
1.1  mrg 	beqz	a9, .Ladd_exactlyhalf
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Ladd_returny:
1.1  mrg 	mov	a2, a3
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Ladd_carry:
1.1  mrg 	/* The addition has overflowed into the exponent field, so the
1.1  mrg 	   value needs to be renormalized.  The mantissa of the result
1.1  mrg 	   can be recovered by subtracting the original exponent and
1.1  mrg 	   adding 0x800000 (which is the explicit "1.0" for the
1.1  mrg 	   mantissa of the non-shifted operand -- the "1.0" for the
1.1  mrg 	   shifted operand was already added).  The mantissa can then
1.1  mrg 	   be shifted right by one bit.  The explicit "1.0" of the
1.1  mrg 	   shifted mantissa then needs to be replaced by the exponent,
1.1  mrg 	   incremented by one to account for the normalizing shift.
1.1  mrg 	   It is faster to combine these operations: do the shift first
1.1  mrg 	   and combine the additions and subtractions.  If x is the
1.1  mrg 	   original exponent, the result is:
1.1  mrg 	       shifted mantissa - (x << 22) + (1 << 22) + (x << 23)
1.1  mrg 	   or:
1.1  mrg 	       shifted mantissa + ((x + 1) << 22)
1.1  mrg 	   Note that the exponent is incremented here by leaving the
1.1  mrg 	   explicit "1.0" of the mantissa in the exponent field.  */
1.1  mrg
1.1  mrg 	/* Shift x right by one bit.  Save the lsb.  */
1.1  mrg 	mov	a10, a2
1.1  mrg 	srli	a2, a2, 1
1.1  mrg
1.1  mrg 	/* See explanation above.  The original exponent is in a8.  */
1.1  mrg 	addi	a8, a8, 1
1.1  mrg 	slli	a8, a8, 22
1.1  mrg 	add	a2, a2, a8
1.1  mrg
1.1  mrg 	/* Return an Infinity if the exponent overflowed.  */
1.1  mrg 	ball	a2, a6, .Ladd_infinity
1.1  mrg
1.1  mrg 	/* Same thing as the "round" code except the msb of the leftover
1.1  mrg 	   fraction is bit 0 of a10, with the rest of the fraction in a9.  */
1.1  mrg 	bbci.l	a10, 0, 1f
1.1  mrg 	addi	a2, a2, 1
1.1  mrg 	beqz	a9, .Ladd_exactlyhalf
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Ladd_infinity:
1.1  mrg 	/* Clear the mantissa.  */
1.1  mrg 	srli	a2, a2, 23
1.1  mrg 	slli	a2, a2, 23
1.1  mrg
1.1  mrg 	/* The sign bit may have been lost in a carry-out.  Put it back.
1.1  mrg 	   a8 still holds the 9-bit sign/exponent field plus one, shifted
1.1  mrg 	   left by 22, so the sign is in bit 30; one more left shift
1.1  mrg 	   moves it to bit 31.  */
1.1  mrg 	slli	a8, a8, 1
1.1  mrg 	or	a2, a2, a8
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Ladd_exactlyhalf:
1.1  mrg 	/* Round down to the nearest even value.  */
1.1  mrg 	srli	a2, a2, 1
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg
1.1  mrg 	/* Subtraction */
1.1  mrg __subsf3_aux:
1.1  mrg
1.1  mrg 	/* Handle NaNs and Infinities.  (This code is placed before the
1.1  mrg 	   start of the function just to keep it in range of the limited
1.1  mrg 	   branch displacements.)
1.1  mrg
1.1  mrg 	   Register state when these stubs are entered, as set up by the
1.1  mrg 	   code that branches here: a2 = x, a3 = y, and a6 = 0x7f800000
1.1  mrg 	   (the exponent-field mask).  The result is left in a2.  */
1.1  mrg
1.1  mrg .Lsub_xnan_or_inf:
1.1  mrg 	/* If y is neither Infinity nor NaN, return x.  */
1.1  mrg 	bnall	a3, a6, 1f
1.1  mrg 	/* Both x and y are either NaN or Inf, so the result is NaN.  */
1.1  mrg 	movi	a4, 0x400000	/* make it a quiet NaN */
1.1  mrg 	or	a2, a2, a4
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Lsub_ynan_or_inf:
1.1  mrg 	/* Negate y and return it.  */
1.1  mrg 	slli	a7, a6, 8	/* a7 = 0x7f800000 << 8 = 0x80000000 (sign bit) */
1.1  mrg 	xor	a2, a3, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lsub_opposite_signs:
1.1  mrg 	/* Operand signs differ.  Do an addition: flip the sign of y so
1.1  mrg 	   both operands have the same sign and compute x + (-y) with the
1.1  mrg 	   same-sign addition code.  */
1.1  mrg 	slli	a7, a6, 8	/* a7 = sign bit, as above */
1.1  mrg 	xor	a3, a3, a7
1.1  mrg 	j	.Ladd_same_sign
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__subsf3
1.1  mrg 	.type	__subsf3, @function
1.1  mrg __subsf3:	/* Single-precision subtraction.
1.1  mrg 		   In:  a2 = x, a3 = y (raw IEEE-754 bit patterns).
1.1  mrg 		   Out: a2 = x - y, rounded to nearest with ties to even.
1.1  mrg 		   Scratch registers written below: a6 (exponent mask,
1.1  mrg 		   later the normalizing shift count), a7/a8 (exponents
1.1  mrg 		   of x/y), a9 (guard bits for rounding), a10, a11.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg
1.1  mrg 	/* Check if the two operands have the same sign.  */
1.1  mrg 	xor	a7, a2, a3
1.1  mrg 	bltz	a7, .Lsub_opposite_signs
1.1  mrg
1.1  mrg .Lsub_same_sign:
1.1  mrg 	/* Check if either exponent == 0x7f8 (i.e., NaN or Infinity).
1.1  mrg 	   (This label is also entered from .Ladd_opposite_signs after the
1.1  mrg 	   sign of y has been flipped.)  */
1.1  mrg 	ball	a2, a6, .Lsub_xnan_or_inf
1.1  mrg 	ball	a3, a6, .Lsub_ynan_or_inf
1.1  mrg
1.1  mrg 	/* Compare the operands.  In contrast to addition, the entire
1.1  mrg 	   value matters here.  The signs are equal at this point, so the
1.1  mrg 	   unsigned comparison of the raw words orders the magnitudes.
1.1  mrg 	   a7/a8 receive the 8-bit exponents (without the sign).  */
1.1  mrg 	extui	a7, a2, 23, 8
1.1  mrg 	extui	a8, a3, 23, 8
1.1  mrg 	bltu	a2, a3, .Lsub_xsmaller
1.1  mrg
1.1  mrg .Lsub_ysmaller:
1.1  mrg 	/* Check if the smaller (or equal) exponent is zero.  */
1.1  mrg 	bnone	a3, a6, .Lsub_yexpzero
1.1  mrg
1.1  mrg 	/* Replace y sign/exponent with 0x008, i.e., clear the top eight
1.1  mrg 	   bits and leave bit 23 set as the explicit "1.0".  */
1.1  mrg 	or	a3, a3, a6
1.1  mrg 	slli	a3, a3, 8
1.1  mrg 	srli	a3, a3, 8
1.1  mrg
1.1  mrg .Lsub_yexpdiff:
1.1  mrg 	/* Compute the exponent difference.  */
1.1  mrg 	sub	a10, a7, a8
1.1  mrg
1.1  mrg 	/* Exponent difference >= 32 -- just return the bigger value
1.1  mrg 	   (x, which is still intact in a2).  */
1.1  mrg 	bgeui	a10, 32, 1f
1.1  mrg
1.1  mrg 	/* Shift y right by the exponent difference.  Any bits that are
1.1  mrg 	   shifted out of y are saved in a9 for rounding the result.  */
1.1  mrg 	ssr	a10
1.1  mrg 	movi	a9, 0
1.1  mrg 	src	a9, a3, a9
1.1  mrg 	srl	a3, a3
1.1  mrg
1.1  mrg 	sub	a2, a2, a3
1.1  mrg
1.1  mrg 	/* Subtract the leftover bits in a9 from zero and propagate any
1.1  mrg 	   borrow from a2.  */
1.1  mrg 	neg	a9, a9
1.1  mrg 	addi	a10, a2, -1
1.1  mrg 	movnez	a2, a10, a9	/* a2 = a2 - 1 only when the guard bits are nonzero */
1.1  mrg
1.1  mrg 	/* Check if the subtract underflowed into the exponent.  */
1.1  mrg 	extui	a10, a2, 23, 8
1.1  mrg 	beq	a10, a7, .Lsub_round
1.1  mrg 	j	.Lsub_borrow
1.1  mrg
1.1  mrg .Lsub_yexpzero:
1.1  mrg 	/* Return zero if the inputs are equal.  (For the non-subnormal
1.1  mrg 	   case, subtracting the "1.0" will cause a borrow from the exponent
1.1  mrg 	   and this case can be detected when handling the borrow.)  */
1.1  mrg 	beq	a2, a3, .Lsub_return_zero
1.1  mrg
1.1  mrg 	/* y is a subnormal value.  Replace its sign/exponent with zero,
1.1  mrg 	   i.e., no implicit "1.0".  Unless x is also a subnormal, increment
1.1  mrg 	   y's apparent exponent because subnormals behave as if they had
1.1  mrg 	   the minimum (nonzero) exponent.  */
1.1  mrg 	slli	a3, a3, 9
1.1  mrg 	srli	a3, a3, 9
1.1  mrg 	bnone	a2, a6, .Lsub_yexpdiff
1.1  mrg 	addi	a8, a8, 1
1.1  mrg 	j	.Lsub_yexpdiff
1.1  mrg
1.1  mrg .Lsub_returny:
1.1  mrg 	/* Negate and return y.  */
1.1  mrg 	slli	a7, a6, 8	/* a7 = 0x80000000 (sign bit) */
1.1  mrg 	xor	a2, a3, a7
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Lsub_xsmaller:
1.1  mrg 	/* Same thing as the "ysmaller" code, but with x and y swapped and
1.1  mrg 	   with y negated.  */
1.1  mrg 	bnone	a2, a6, .Lsub_xexpzero
1.1  mrg
1.1  mrg 	or	a2, a2, a6
1.1  mrg 	slli	a2, a2, 8
1.1  mrg 	srli	a2, a2, 8
1.1  mrg
1.1  mrg .Lsub_xexpdiff:
1.1  mrg 	sub	a10, a8, a7
1.1  mrg 	bgeui	a10, 32, .Lsub_returny	/* difference >= 32: result is -y */
1.1  mrg
1.1  mrg 	ssr	a10
1.1  mrg 	movi	a9, 0
1.1  mrg 	src	a9, a2, a9
1.1  mrg 	srl	a2, a2
1.1  mrg
1.1  mrg 	/* Negate y.  */
1.1  mrg 	slli	a11, a6, 8
1.1  mrg 	xor	a3, a3, a11
1.1  mrg
1.1  mrg 	sub	a2, a3, a2
1.1  mrg
1.1  mrg 	neg	a9, a9
1.1  mrg 	addi	a10, a2, -1
1.1  mrg 	movnez	a2, a10, a9	/* propagate the borrow from the guard bits */
1.1  mrg
1.1  mrg 	/* Check if the subtract underflowed into the exponent.  */
1.1  mrg 	extui	a10, a2, 23, 8
1.1  mrg 	bne	a10, a8, .Lsub_borrow
1.1  mrg
1.1  mrg .Lsub_round:
1.1  mrg 	/* Round up if the leftover fraction is >= 1/2.  (The msb of a9 is
1.1  mrg 	   the first guard bit.)  */
1.1  mrg 	bgez	a9, 1f
1.1  mrg 	addi	a2, a2, 1
1.1  mrg
1.1  mrg 	/* Check if the leftover fraction is exactly 1/2.  */
1.1  mrg 	slli	a9, a9, 1
1.1  mrg 	beqz	a9, .Lsub_exactlyhalf
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Lsub_xexpzero:
1.1  mrg 	/* Same as "yexpzero".  */
1.1  mrg 	beq	a2, a3, .Lsub_return_zero
1.1  mrg 	slli	a2, a2, 9
1.1  mrg 	srli	a2, a2, 9
1.1  mrg 	bnone	a3, a6, .Lsub_xexpdiff
1.1  mrg 	addi	a7, a7, 1
1.1  mrg 	j	.Lsub_xexpdiff
1.1  mrg
1.1  mrg .Lsub_return_zero:
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lsub_borrow:
1.1  mrg 	/* The subtraction has underflowed into the exponent field, so the
1.1  mrg 	   value needs to be renormalized.  Shift the mantissa left as
1.1  mrg 	   needed to remove any leading zeros and adjust the exponent
1.1  mrg 	   accordingly.  If the exponent is not large enough to remove
1.1  mrg 	   all the leading zeros, the result will be a subnormal value.
1.1  mrg 	   On entry a10 holds the exponent field of the difference in a2
1.1  mrg 	   and a9 holds the guard bits.
1.1  mrg 	   NOTE(review): do_nsau is defined outside this view; presumably
1.1  mrg 	   it sets a6 to the number of leading zero bits in a8, using a7
1.1  mrg 	   and a11 as temporaries -- confirm against its definition.  */
1.1  mrg
1.1  mrg 	slli	a8, a2, 9	/* a8 = mantissa bits of the difference, left-aligned */
1.1  mrg 	beqz	a8, .Lsub_xzero
1.1  mrg 	do_nsau	a6, a8, a7, a11
1.1  mrg 	srli	a8, a8, 9
1.1  mrg 	bge	a6, a10, .Lsub_subnormal
1.1  mrg 	addi	a6, a6, 1
1.1  mrg
1.1  mrg .Lsub_normalize_shift:
1.1  mrg 	/* Shift the mantissa (a8/a9) left by a6.  */
1.1  mrg 	ssl	a6
1.1  mrg 	src	a8, a8, a9
1.1  mrg 	sll	a9, a9
1.1  mrg
1.1  mrg 	/* Combine the shifted mantissa with the sign and exponent,
1.1  mrg 	   decrementing the exponent by a6.  (The exponent has already
1.1  mrg 	   been decremented by one due to the borrow from the subtraction,
1.1  mrg 	   but adding the mantissa will increment the exponent by one.)  */
1.1  mrg 	srli	a2, a2, 23
1.1  mrg 	sub	a2, a2, a6
1.1  mrg 	slli	a2, a2, 23
1.1  mrg 	add	a2, a2, a8
1.1  mrg 	j	.Lsub_round
1.1  mrg
1.1  mrg .Lsub_exactlyhalf:
1.1  mrg 	/* Round down to the nearest even value.  */
1.1  mrg 	srli	a2, a2, 1
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lsub_xzero:
1.1  mrg 	/* If there was a borrow from the exponent, and the mantissa and
1.1  mrg 	   guard digits are all zero, then the inputs were equal and the
1.1  mrg 	   result should be zero.  */
1.1  mrg 	beqz	a9, .Lsub_return_zero
1.1  mrg
1.1  mrg 	/* Only the guard digit is nonzero.  Shift by min(24, a10).  */
1.1  mrg 	addi	a11, a10, -24
1.1  mrg 	movi	a6, 24
1.1  mrg 	movltz	a6, a10, a11	/* a6 = a10 when a10 - 24 is negative */
1.1  mrg 	j	.Lsub_normalize_shift
1.1  mrg
1.1  mrg .Lsub_subnormal:
1.1  mrg 	/* The exponent is too small to shift away all the leading zeros.
1.1  mrg 	   Set a6 to the current exponent (which has already been
1.1  mrg 	   decremented by the borrow) so that the exponent of the result
1.1  mrg 	   will be zero.  Do not add 1 to a6 in this case, because: (1)
1.1  mrg 	   adding the mantissa will not increment the exponent, so there is
1.1  mrg 	   no need to subtract anything extra from the exponent to
1.1  mrg 	   compensate, and (2) the effective exponent of a subnormal is 1
1.1  mrg 	   not 0 so the shift amount must be 1 smaller than normal. */
1.1  mrg 	mov	a6, a10
1.1  mrg 	j	.Lsub_normalize_shift
1.1  mrg
1.1  mrg #endif /* L_addsubsf3 */
1.1  mrg
1.1  mrg #ifdef L_mulsf3
1.1  mrg
1.1  mrg 	/* Multiplication */
1.1  mrg #if !XCHAL_HAVE_MUL16 && !XCHAL_HAVE_MUL32 && !XCHAL_HAVE_MAC16
1.1  mrg #define XCHAL_NO_MUL 1
1.1  mrg #endif
1.1  mrg
1.1  mrg __mulsf3_aux:
1.1  mrg
1.1  mrg 	/* Handle unusual cases (zeros, subnormals, NaNs and Infinities).
1.1  mrg 	   (This code is placed before the start of the function just to
1.1  mrg 	   keep it in range of the limited branch displacements.)
1.1  mrg
1.1  mrg 	   Register state when these stubs are entered, as set up by
1.1  mrg 	   __mulsf3: a2 = x, a3 = y, a6 = 0x7f800000 (exponent mask),
1.1  mrg 	   a7 = x ^ y (bit 31 is the sign of the result), and a8/a9 = the
1.1  mrg 	   exponents of x/y once they have been extracted.  Stubs that
1.1  mrg 	   finish the operation jump to .Lmul_done instead of returning
1.1  mrg 	   directly, because that is where the registers saved by the
1.1  mrg 	   CALL0-ABI prologue are restored.  */
1.1  mrg
1.1  mrg .Lmul_xexpzero:
1.1  mrg 	/* Clear the sign bit of x.  */
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	srli	a2, a2, 1
1.1  mrg
1.1  mrg 	/* If x is zero, return zero.  */
1.1  mrg 	beqz	a2, .Lmul_return_zero
1.1  mrg
1.1  mrg 	/* Normalize x.  Adjust the exponent in a8.
1.1  mrg 	   NOTE(review): do_nsau is defined outside this view; presumably
1.1  mrg 	   it sets a10 to the number of leading zero bits in a2, using
1.1  mrg 	   a11 and a12 as temporaries -- confirm.  Subtracting 8 then
1.1  mrg 	   gives the left shift that moves the leading one to bit 23.  */
1.1  mrg 	do_nsau	a10, a2, a11, a12
1.1  mrg 	addi	a10, a10, -8
1.1  mrg 	ssl	a10
1.1  mrg 	sll	a2, a2
1.1  mrg 	movi	a8, 1
1.1  mrg 	sub	a8, a8, a10	/* a8 = 1 - shift count (may be zero or negative) */
1.1  mrg 	j	.Lmul_xnormalized
1.1  mrg
1.1  mrg .Lmul_yexpzero:
1.1  mrg 	/* Clear the sign bit of y.  */
1.1  mrg 	slli	a3, a3, 1
1.1  mrg 	srli	a3, a3, 1
1.1  mrg
1.1  mrg 	/* If y is zero, return zero.  */
1.1  mrg 	beqz	a3, .Lmul_return_zero
1.1  mrg
1.1  mrg 	/* Normalize y.  Adjust the exponent in a9.  (Same sequence as
1.1  mrg 	   for x above.)  */
1.1  mrg 	do_nsau	a10, a3, a11, a12
1.1  mrg 	addi	a10, a10, -8
1.1  mrg 	ssl	a10
1.1  mrg 	sll	a3, a3
1.1  mrg 	movi	a9, 1
1.1  mrg 	sub	a9, a9, a10	/* a9 = 1 - shift count */
1.1  mrg 	j	.Lmul_ynormalized
1.1  mrg
1.1  mrg .Lmul_return_zero:
1.1  mrg 	/* Return zero with the appropriate sign bit.  */
1.1  mrg 	srli	a2, a7, 31
1.1  mrg 	slli	a2, a2, 31
1.1  mrg 	j	.Lmul_done
1.1  mrg
1.1  mrg .Lmul_xnan_or_inf:
1.1  mrg 	/* If y is zero, return NaN.  */
1.1  mrg 	slli	a8, a3, 1	/* a8 = y without its sign bit */
1.1  mrg 	bnez	a8, 1f
1.1  mrg 	movi	a4, 0x400000	/* make it a quiet NaN */
1.1  mrg 	or	a2, a2, a4
1.1  mrg 	j	.Lmul_done
1.1  mrg 1:
1.1  mrg 	/* If y is NaN, return y.  */
1.1  mrg 	bnall	a3, a6, .Lmul_returnx
1.1  mrg 	slli	a8, a3, 9	/* a8 = mantissa bits of y; zero means Infinity */
1.1  mrg 	beqz	a8, .Lmul_returnx
1.1  mrg
1.1  mrg .Lmul_returny:
1.1  mrg 	mov	a2, a3
1.1  mrg
1.1  mrg .Lmul_returnx:
1.1  mrg 	/* Set the sign bit and return.  The old sign of a2 is shifted
1.1  mrg 	   out, then the funnel shift right by one brings the result sign
1.1  mrg 	   (bit 0 of a7) back in as bit 31.  */
1.1  mrg 	extui	a7, a7, 31, 1
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	ssai	1
1.1  mrg 	src	a2, a7, a2
1.1  mrg 	j	.Lmul_done
1.1  mrg
1.1  mrg .Lmul_ynan_or_inf:
1.1  mrg 	/* If x is zero, return NaN.  */
1.1  mrg 	slli	a8, a2, 1	/* a8 = x without its sign bit */
1.1  mrg 	bnez	a8, .Lmul_returny
1.1  mrg 	movi	a7, 0x400000	/* make it a quiet NaN */
1.1  mrg 	or	a2, a3, a7
1.1  mrg 	j	.Lmul_done
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__mulsf3
1.1  mrg 	.type	__mulsf3, @function
1.1  mrg __mulsf3:	/* Single-precision multiplication.
1.1  mrg 		   In:  a2 = x, a3 = y (raw IEEE-754 bit patterns).
1.1  mrg 		   Out: a2 = x * y, rounded to nearest with ties to even.
1.1  mrg 		   Register roles below: a6 = exponent mask, later the
1.1  mrg 		   low word of the product; a7 = x ^ y (result sign in
1.1  mrg 		   bit 31); a8/a9 = exponents, a8 later the exponent of
1.1  mrg 		   the result.  With the CALL0 ABI, a12-a15 are saved in
1.1  mrg 		   a 32-byte frame here and restored at .Lmul_done.  */
1.1  mrg #if __XTENSA_CALL0_ABI__
1.1  mrg 	leaf_entry sp, 32
1.1  mrg 	addi	sp, sp, -32
1.1  mrg 	s32i	a12, sp, 16
1.1  mrg 	s32i	a13, sp, 20
1.1  mrg 	s32i	a14, sp, 24
1.1  mrg 	s32i	a15, sp, 28
1.1  mrg #elif XCHAL_NO_MUL
1.1  mrg 	/* This is not really a leaf function; allocate enough stack space
1.1  mrg 	   to allow CALL12s to a helper function.  */
1.1  mrg 	leaf_entry sp, 64
1.1  mrg #else
1.1  mrg 	leaf_entry sp, 32
1.1  mrg #endif
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg
1.1  mrg 	/* Get the sign of the result.  */
1.1  mrg 	xor	a7, a2, a3
1.1  mrg
1.1  mrg 	/* Check for NaN and infinity.  */
1.1  mrg 	ball	a2, a6, .Lmul_xnan_or_inf
1.1  mrg 	ball	a3, a6, .Lmul_ynan_or_inf
1.1  mrg
1.1  mrg 	/* Extract the exponents.  */
1.1  mrg 	extui	a8, a2, 23, 8
1.1  mrg 	extui	a9, a3, 23, 8
1.1  mrg
1.1  mrg 	beqz	a8, .Lmul_xexpzero	/* x is zero or subnormal */
1.1  mrg .Lmul_xnormalized:
1.1  mrg 	beqz	a9, .Lmul_yexpzero	/* y is zero or subnormal */
1.1  mrg .Lmul_ynormalized:
1.1  mrg
1.1  mrg 	/* Add the exponents.  */
1.1  mrg 	add	a8, a8, a9
1.1  mrg
1.1  mrg 	/* Replace sign/exponent fields with explicit "1.0".  */
1.1  mrg 	movi	a10, 0xffffff
1.1  mrg 	or	a2, a2, a6
1.1  mrg 	and	a2, a2, a10
1.1  mrg 	or	a3, a3, a6
1.1  mrg 	and	a3, a3, a10
1.1  mrg
1.1  mrg 	/* Multiply 32x32 to 64 bits.  The result ends up in a2/a6.  */
1.1  mrg
1.1  mrg #if XCHAL_HAVE_MUL32_HIGH
1.1  mrg
1.1  mrg 	mull	a6, a2, a3
1.1  mrg 	muluh	a2, a2, a3
1.1  mrg
1.1  mrg #else
1.1  mrg
1.1  mrg 	/* Break the inputs into 16-bit chunks and compute 4 32-bit partial
1.1  mrg 	   products.  These partial products are:
1.1  mrg
1.1  mrg 		0 xl * yl
1.1  mrg
1.1  mrg 		1 xl * yh
1.1  mrg 		2 xh * yl
1.1  mrg
1.1  mrg 		3 xh * yh
1.1  mrg
1.1  mrg 	   If using the Mul16 or Mul32 multiplier options, these input
1.1  mrg 	   chunks must be stored in separate registers.  For Mac16, the
1.1  mrg 	   UMUL.AA.* opcodes can specify that the inputs come from either
1.1  mrg 	   half of the registers, so there is no need to shift them out
1.1  mrg 	   ahead of time.  If there is no multiply hardware, the 16-bit
1.1  mrg 	   chunks can be extracted when setting up the arguments to the
1.1  mrg 	   separate multiply function.  */
1.1  mrg
1.1  mrg #if __XTENSA_CALL0_ABI__ && XCHAL_NO_MUL
1.1  mrg 	/* Calling a separate multiply function will clobber a0 and requires
1.1  mrg 	   use of a8 as a temporary, so save those values now.  (The function
1.1  mrg 	   uses a custom ABI so nothing else needs to be saved.)  */
1.1  mrg 	s32i	a0, sp, 0
1.1  mrg 	s32i	a8, sp, 4
1.1  mrg #endif
1.1  mrg
1.1  mrg #if XCHAL_HAVE_MUL16 || XCHAL_HAVE_MUL32
1.1  mrg
1.1  mrg #define a2h a4
1.1  mrg #define a3h a5
1.1  mrg
1.1  mrg 	/* Get the high halves of the inputs into registers.  */
1.1  mrg 	srli	a2h, a2, 16
1.1  mrg 	srli	a3h, a3, 16
1.1  mrg
1.1  mrg #define a2l a2
1.1  mrg #define a3l a3
1.1  mrg
1.1  mrg #if XCHAL_HAVE_MUL32 && !XCHAL_HAVE_MUL16
1.1  mrg 	/* Clear the high halves of the inputs.  This does not matter
1.1  mrg 	   for MUL16 because the high bits are ignored.  */
1.1  mrg 	extui	a2, a2, 0, 16
1.1  mrg 	extui	a3, a3, 0, 16
1.1  mrg #endif
1.1  mrg #endif /* MUL16 || MUL32 */
1.1  mrg
1.1  mrg
1.1  mrg #if XCHAL_HAVE_MUL16
1.1  mrg
1.1  mrg #define do_mul(dst, xreg, xhalf, yreg, yhalf) \
1.1  mrg 	mul16u	dst, xreg ## xhalf, yreg ## yhalf
1.1  mrg
1.1  mrg #elif XCHAL_HAVE_MUL32
1.1  mrg
1.1  mrg #define do_mul(dst, xreg, xhalf, yreg, yhalf) \
1.1  mrg 	mull	dst, xreg ## xhalf, yreg ## yhalf
1.1  mrg
1.1  mrg #elif XCHAL_HAVE_MAC16
1.1  mrg
1.1  mrg /* The preprocessor insists on inserting a space when concatenating after
1.1  mrg    a period in the definition of do_mul below.  These macros are a workaround
1.1  mrg    using underscores instead of periods when doing the concatenation.  */
1.1  mrg #define umul_aa_ll umul.aa.ll
1.1  mrg #define umul_aa_lh umul.aa.lh
1.1  mrg #define umul_aa_hl umul.aa.hl
1.1  mrg #define umul_aa_hh umul.aa.hh
1.1  mrg
1.1  mrg #define do_mul(dst, xreg, xhalf, yreg, yhalf) \
1.1  mrg 	umul_aa_ ## xhalf ## yhalf	xreg, yreg; \
1.1  mrg 	rsr	dst, ACCLO
1.1  mrg
1.1  mrg #else /* no multiply hardware */
1.1  mrg
1.1  mrg #define set_arg_l(dst, src) \
1.1  mrg 	extui	dst, src, 0, 16
1.1  mrg #define set_arg_h(dst, src) \
1.1  mrg 	srli	dst, src, 16
1.1  mrg
1.1  mrg #if __XTENSA_CALL0_ABI__
1.1  mrg #define do_mul(dst, xreg, xhalf, yreg, yhalf) \
1.1  mrg 	set_arg_ ## xhalf (a13, xreg); \
1.1  mrg 	set_arg_ ## yhalf (a14, yreg); \
1.1  mrg 	call0	.Lmul_mulsi3; \
1.1  mrg 	mov	dst, a12
1.1  mrg #else
1.1  mrg #define do_mul(dst, xreg, xhalf, yreg, yhalf) \
1.1  mrg 	set_arg_ ## xhalf (a14, xreg); \
1.1  mrg 	set_arg_ ## yhalf (a15, yreg); \
1.1  mrg 	call12	.Lmul_mulsi3; \
1.1  mrg 	mov	dst, a14
1.1  mrg #endif /* __XTENSA_CALL0_ABI__ */
1.1  mrg
1.1  mrg #endif /* no multiply hardware */
1.1  mrg
1.1  mrg 	/* Add pp1 and pp2 into a6 with carry-out in a9.  (After the add,
1.1  mrg 	   a sum smaller than one of its addends means it wrapped.)  */
1.1  mrg 	do_mul(a6, a2, l, a3, h)	/* pp 1 */
1.1  mrg 	do_mul(a11, a2, h, a3, l)	/* pp 2 */
1.1  mrg 	movi	a9, 0
1.1  mrg 	add	a6, a6, a11
1.1  mrg 	bgeu	a6, a11, 1f
1.1  mrg 	addi	a9, a9, 1
1.1  mrg 1:
1.1  mrg 	/* Shift the high half of a9/a6 into position in a9.  Note that
1.1  mrg 	   this value can be safely incremented without any carry-outs.  */
1.1  mrg 	ssai	16
1.1  mrg 	src	a9, a9, a6
1.1  mrg
1.1  mrg 	/* Compute the low word into a6.  (SAR is still 16 from the SSAI
1.1  mrg 	   above, so the SLL moves the low half of pp1 + pp2 into the
1.1  mrg 	   upper half of a6.)  */
1.1  mrg 	do_mul(a11, a2, l, a3, l)	/* pp 0 */
1.1  mrg 	sll	a6, a6
1.1  mrg 	add	a6, a6, a11
1.1  mrg 	bgeu	a6, a11, 1f
1.1  mrg 	addi	a9, a9, 1
1.1  mrg 1:
1.1  mrg 	/* Compute the high word into a2.  */
1.1  mrg 	do_mul(a2, a2, h, a3, h)	/* pp 3 */
1.1  mrg 	add	a2, a2, a9
1.1  mrg
1.1  mrg #if __XTENSA_CALL0_ABI__ && XCHAL_NO_MUL
1.1  mrg 	/* Restore values saved on the stack during the multiplication.  */
1.1  mrg 	l32i	a0, sp, 0
1.1  mrg 	l32i	a8, sp, 4
1.1  mrg #endif
1.1  mrg #endif /* ! XCHAL_HAVE_MUL32_HIGH */
1.1  mrg
1.1  mrg 	/* Shift left by 9 bits, unless there was a carry-out from the
1.1  mrg 	   multiply, in which case, shift by 8 bits and increment the
1.1  mrg 	   exponent.  (The carry-out shows up as a nonzero value at or
1.1  mrg 	   above bit 15 of the high word a2.)  */
1.1  mrg 	movi	a4, 9
1.1  mrg 	srli	a5, a2, 24 - 9
1.1  mrg 	beqz	a5, 1f
1.1  mrg 	addi	a4, a4, -1
1.1  mrg 	addi	a8, a8, 1
1.1  mrg 1:	ssl	a4
1.1  mrg 	src	a2, a2, a6
1.1  mrg 	sll	a6, a6
1.1  mrg
1.1  mrg 	/* Subtract the extra bias from the exponent sum (plus one to account
1.1  mrg 	   for the explicit "1.0" of the mantissa that will be added to the
1.1  mrg 	   exponent in the final result).  */
1.1  mrg 	movi	a4, 0x80
1.1  mrg 	sub	a8, a8, a4
1.1  mrg
1.1  mrg 	/* Check for over/underflow.  The value in a8 is one less than the
1.1  mrg 	   final exponent, so values in the range 0..fd are OK here.  The
1.1  mrg 	   comparison is unsigned, so a negative a8 (underflow) also takes
1.1  mrg 	   the branch and is sorted out at .Lmul_overflow.  */
1.1  mrg 	movi	a4, 0xfe
1.1  mrg 	bgeu	a8, a4, .Lmul_overflow
1.1  mrg
1.1  mrg .Lmul_round:
1.1  mrg 	/* Round.  The msb of a6 is the first bit below the mantissa: round
1.1  mrg 	   up when it is set, and fix up the tie case separately.  */
1.1  mrg 	bgez	a6, .Lmul_rounded
1.1  mrg 	addi	a2, a2, 1
1.1  mrg 	slli	a6, a6, 1
1.1  mrg 	beqz	a6, .Lmul_exactlyhalf
1.1  mrg
1.1  mrg .Lmul_rounded:
1.1  mrg 	/* Add the exponent to the mantissa.  */
1.1  mrg 	slli	a8, a8, 23
1.1  mrg 	add	a2, a2, a8
1.1  mrg
1.1  mrg .Lmul_addsign:
1.1  mrg 	/* Add the sign bit.  */
1.1  mrg 	srli	a7, a7, 31
1.1  mrg 	slli	a7, a7, 31
1.1  mrg 	or	a2, a2, a7
1.1  mrg
1.1  mrg .Lmul_done:
1.1  mrg #if __XTENSA_CALL0_ABI__
1.1  mrg 	l32i	a12, sp, 16
1.1  mrg 	l32i	a13, sp, 20
1.1  mrg 	l32i	a14, sp, 24
1.1  mrg 	l32i	a15, sp, 28
1.1  mrg 	addi	sp, sp, 32
1.1  mrg #endif
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lmul_exactlyhalf:
1.1  mrg 	/* Round down to the nearest even value.  */
1.1  mrg 	srli	a2, a2, 1
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	j	.Lmul_rounded
1.1  mrg
1.1  mrg .Lmul_overflow:
1.1  mrg 	bltz	a8, .Lmul_underflow
1.1  mrg 	/* Return +/- Infinity.  */
1.1  mrg 	movi	a8, 0xff
1.1  mrg 	slli	a2, a8, 23
1.1  mrg 	j	.Lmul_addsign
1.1  mrg
1.1  mrg .Lmul_underflow:
1.1  mrg 	/* Create a subnormal value, where the exponent field contains zero,
1.1  mrg 	   but the effective exponent is 1.  The value of a8 is one less than
1.1  mrg 	   the actual exponent, so just negate it to get the shift amount.  */
1.1  mrg 	neg	a8, a8
1.1  mrg 	mov	a9, a6		/* remember the bits already below the mantissa */
1.1  mrg 	ssr	a8
1.1  mrg 	bgeui	a8, 32, .Lmul_flush_to_zero
1.1  mrg
1.1  mrg 	/* Shift a2 right.  Any bits that are shifted out of a2 are saved
1.1  mrg 	   in a6 (combined with the shifted-out bits currently in a6) for
1.1  mrg 	   rounding the result.  */
1.1  mrg 	sll	a6, a2
1.1  mrg 	srl	a2, a2
1.1  mrg
1.1  mrg 	/* Set the exponent to zero.  */
1.1  mrg 	movi	a8, 0
1.1  mrg
1.1  mrg 	/* Pack any nonzero bits shifted out into a6.  (They are folded
1.1  mrg 	   into bit 0 as a sticky bit.)  */
1.1  mrg 	beqz	a9, .Lmul_round
1.1  mrg 	movi	a9, 1
1.1  mrg 	or	a6, a6, a9
1.1  mrg 	j	.Lmul_round
1.1  mrg
1.1  mrg .Lmul_flush_to_zero:
1.1  mrg 	/* Return zero with the appropriate sign bit.  */
1.1  mrg 	srli	a2, a7, 31
1.1  mrg 	slli	a2, a2, 31
1.1  mrg 	j	.Lmul_done
1.1  mrg
1.1  mrg #if XCHAL_NO_MUL
1.1  mrg
1.1  mrg 	/* For Xtensa processors with no multiply hardware, this simplified
1.1  mrg 	   version of _mulsi3 is used for multiplying 16-bit chunks of
1.1  mrg 	   the floating-point mantissas.  When using CALL0, this function
1.1  mrg 	   uses a custom ABI: the inputs are passed in a13 and a14, the
1.1  mrg 	   result is returned in a12, and a8 and a15 are clobbered.
1.1  mrg
1.1  mrg 	   In the other (non-CALL0) variant the body reads its inputs from
1.1  mrg 	   a2 and a3 and leaves the product in a2, using a4-a6 as
1.1  mrg 	   temporaries; the do_mul macro that calls it with CALL12 passes
1.1  mrg 	   the inputs in its own a14/a15 and reads the result from a14.
1.1  mrg
1.1  mrg 	   The body is a shift-and-add loop that consumes four bits of
1.1  mrg 	   src1 per iteration and stops as soon as src1 is zero; both
1.1  mrg 	   source registers are modified.
1.1  mrg 	   NOTE(review): do_addx2/do_addx4/do_addx8 are defined outside
1.1  mrg 	   this view; presumably they compute tmp1 = src2 * 2/4/8 + dst
1.1  mrg 	   -- confirm against their definitions.  */
1.1  mrg 	.align	4
1.1  mrg .Lmul_mulsi3:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	.macro mul_mulsi3_body dst, src1, src2, tmp1, tmp2
1.1  mrg 	movi	\dst, 0
1.1  mrg 1:	add	\tmp1, \src2, \dst
1.1  mrg 	extui	\tmp2, \src1, 0, 1
1.1  mrg 	movnez	\dst, \tmp1, \tmp2
1.1  mrg
1.1  mrg 	do_addx2 \tmp1, \src2, \dst, \tmp1
1.1  mrg 	extui	\tmp2, \src1, 1, 1
1.1  mrg 	movnez	\dst, \tmp1, \tmp2
1.1  mrg
1.1  mrg 	do_addx4 \tmp1, \src2, \dst, \tmp1
1.1  mrg 	extui	\tmp2, \src1, 2, 1
1.1  mrg 	movnez	\dst, \tmp1, \tmp2
1.1  mrg
1.1  mrg 	do_addx8 \tmp1, \src2, \dst, \tmp1
1.1  mrg 	extui	\tmp2, \src1, 3, 1
1.1  mrg 	movnez	\dst, \tmp1, \tmp2
1.1  mrg
1.1  mrg 	srli	\src1, \src1, 4
1.1  mrg 	slli	\src2, \src2, 4
1.1  mrg 	bnez	\src1, 1b
1.1  mrg 	.endm
1.1  mrg #if __XTENSA_CALL0_ABI__
1.1  mrg 	mul_mulsi3_body a12, a13, a14, a15, a8
1.1  mrg #else
1.1  mrg 	/* The result will be written into a2, so save that argument in a4.  */
1.1  mrg 	mov	a4, a2
1.1  mrg 	mul_mulsi3_body a2, a4, a3, a5, a6
1.1  mrg #endif
1.1  mrg 	leaf_return
1.1  mrg #endif /* XCHAL_NO_MUL */
1.1  mrg #endif /* L_mulsf3 */
1.1  mrg
1.1  mrg #ifdef L_divsf3
1.1  mrg
1.1  mrg 	/* Division */
1.1  mrg __divsf3_aux:
1.1  mrg
1.1  mrg 	/* Handle unusual cases (zeros, subnormals, NaNs and Infinities).
1.1  mrg 	   (This code is placed before the start of the function just to
1.1  mrg 	   keep it in range of the limited branch displacements.)
1.1  mrg
1.1  mrg 	   Register state when these stubs are entered, as set up by
1.1  mrg 	   __divsf3: a2 = x (dividend), a3 = y (divisor), a6 = 0x7f800000
1.1  mrg 	   (exponent mask), a7 = x ^ y (bit 31 is the sign of the result),
1.1  mrg 	   and a8/a9 = the exponents of x/y once they have been extracted.
1.1  mrg 	   The result is left in a2.  */
1.1  mrg
1.1  mrg .Ldiv_yexpzero:
1.1  mrg 	/* Clear the sign bit of y.  */
1.1  mrg 	slli	a3, a3, 1
1.1  mrg 	srli	a3, a3, 1
1.1  mrg
1.1  mrg 	/* Check for division by zero.  */
1.1  mrg 	beqz	a3, .Ldiv_yzero
1.1  mrg
1.1  mrg 	/* Normalize y.  Adjust the exponent in a9.
1.1  mrg 	   NOTE(review): do_nsau is defined outside this view; presumably
1.1  mrg 	   it sets a10 to the number of leading zero bits in a3, using a4
1.1  mrg 	   and a5 as temporaries -- confirm.  Subtracting 8 then gives
1.1  mrg 	   the left shift that moves the leading one to bit 23.  */
1.1  mrg 	do_nsau	a10, a3, a4, a5
1.1  mrg 	addi	a10, a10, -8
1.1  mrg 	ssl	a10
1.1  mrg 	sll	a3, a3
1.1  mrg 	movi	a9, 1
1.1  mrg 	sub	a9, a9, a10	/* a9 = 1 - shift count */
1.1  mrg 	j	.Ldiv_ynormalized
1.1  mrg
1.1  mrg .Ldiv_yzero:
1.1  mrg 	/* y is zero.  Return NaN if x is also zero; otherwise, infinity.  */
1.1  mrg 	slli	a4, a2, 1
1.1  mrg 	srli	a4, a4, 1	/* a4 = x without its sign bit */
1.1  mrg 	srli	a2, a7, 31
1.1  mrg 	slli	a2, a2, 31
1.1  mrg 	or	a2, a2, a6	/* a2 = Infinity with the sign of the result */
1.1  mrg 	bnez	a4, 1f
1.1  mrg 	movi	a4, 0x400000	/* make it a quiet NaN */
1.1  mrg 	or	a2, a2, a4
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Ldiv_xexpzero:
1.1  mrg 	/* Clear the sign bit of x.  */
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	srli	a2, a2, 1
1.1  mrg
1.1  mrg 	/* If x is zero, return zero.  */
1.1  mrg 	beqz	a2, .Ldiv_return_zero
1.1  mrg
1.1  mrg 	/* Normalize x.  Adjust the exponent in a8.  (Same sequence as
1.1  mrg 	   for y above.)  */
1.1  mrg 	do_nsau	a10, a2, a4, a5
1.1  mrg 	addi	a10, a10, -8
1.1  mrg 	ssl	a10
1.1  mrg 	sll	a2, a2
1.1  mrg 	movi	a8, 1
1.1  mrg 	sub	a8, a8, a10	/* a8 = 1 - shift count */
1.1  mrg 	j	.Ldiv_xnormalized
1.1  mrg
1.1  mrg .Ldiv_return_zero:
1.1  mrg 	/* Return zero with the appropriate sign bit.  */
1.1  mrg 	srli	a2, a7, 31
1.1  mrg 	slli	a2, a2, 31
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Ldiv_xnan_or_inf:
1.1  mrg 	/* Set the sign bit of the result.  (XORing the sign bit of y into
1.1  mrg 	   x leaves sign(x) ^ sign(y) in bit 31 of a2.)  */
1.1  mrg 	srli	a7, a3, 31
1.1  mrg 	slli	a7, a7, 31
1.1  mrg 	xor	a2, a2, a7
1.1  mrg 	/* If y is NaN or Inf, return NaN.  */
1.1  mrg 	bnall	a3, a6, 1f
1.1  mrg 	movi	a4, 0x400000	/* make it a quiet NaN */
1.1  mrg 	or	a2, a2, a4
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Ldiv_ynan_or_inf:
1.1  mrg 	/* If y is Infinity, return zero.  */
1.1  mrg 	slli	a8, a3, 9	/* a8 = mantissa bits of y; zero means Infinity */
1.1  mrg 	beqz	a8, .Ldiv_return_zero
1.1  mrg 	/* y is NaN; return it.  */
1.1  mrg 	mov	a2, a3
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__divsf3
1.1  mrg 	.type	__divsf3, @function
1.1  mrg __divsf3:	/* Single-precision division: returns x / y in a2, with x
1.1  mrg 		   passed in a2 and y in a3.  Register roles below:
1.1  mrg 		   a6 = exponent mask, a7 = sign of the result (msb),
1.1  mrg 		   a8/a9 = exponents of x/y, a10 = quotient.  Zeros,
1.1  mrg 		   subnormals, NaNs and Infinities branch to the
1.1  mrg 		   .Ldiv_* handlers placed ahead of this entry point.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg
1.1  mrg 	/* Get the sign of the result.  */
1.1  mrg 	xor	a7, a2, a3
1.1  mrg
1.1  mrg 	/* Check for NaN and infinity.  (ball branches when every bit set
1.1  mrg 	   in a6 is also set in the operand, i.e. the exponent field is
1.1  mrg 	   all ones.)  */
1.1  mrg 	ball	a2, a6, .Ldiv_xnan_or_inf
1.1  mrg 	ball	a3, a6, .Ldiv_ynan_or_inf
1.1  mrg
1.1  mrg 	/* Extract the exponents.  */
1.1  mrg 	extui	a8, a2, 23, 8
1.1  mrg 	extui	a9, a3, 23, 8
1.1  mrg
1.1  mrg 	beqz	a9, .Ldiv_yexpzero	/* y is zero or subnormal */
1.1  mrg .Ldiv_ynormalized:
1.1  mrg 	beqz	a8, .Ldiv_xexpzero	/* x is zero or subnormal */
1.1  mrg .Ldiv_xnormalized:
1.1  mrg
1.1  mrg 	/* Subtract the exponents.  */
1.1  mrg 	sub	a8, a8, a9
1.1  mrg
1.1  mrg 	/* Replace sign/exponent fields with explicit "1.0".  OR-ing in a6
1.1  mrg 	   sets bit 23 (among others); the 0xffffff mask then clears
1.1  mrg 	   everything above bit 23.  */
1.1  mrg 	movi	a10, 0xffffff
1.1  mrg 	or	a2, a2, a6
1.1  mrg 	and	a2, a2, a10
1.1  mrg 	or	a3, a3, a6
1.1  mrg 	and	a3, a3, a10
1.1  mrg
1.1  mrg 	/* The first digit of the mantissa division must be a one.
1.1  mrg 	   Shift x (and adjust the exponent) as needed to make this true.
1.1  mrg 	   The shift is skipped only when y < x.  */
1.1  mrg 	bltu	a3, a2, 1f
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	addi	a8, a8, -1
1.1  mrg 1:
1.1  mrg 	/* Do the first subtraction and shift.  */
1.1  mrg 	sub	a2, a2, a3
1.1  mrg 	slli	a2, a2, 1
1.1  mrg
1.1  mrg 	/* Put the quotient into a10.  It starts with the leading one
1.1  mrg 	   produced by the subtraction above.  */
1.1  mrg 	movi	a10, 1
1.1  mrg
1.1  mrg 	/* Divide one bit at a time for 23 bits.  With XCHAL_HAVE_LOOPS the
1.1  mrg 	   loop instruction repeats the body up to .Ldiv_loopend a9 times;
1.1  mrg 	   otherwise a9 is counted down by hand at the end of the body.  */
1.1  mrg 	movi	a9, 23
1.1  mrg #if XCHAL_HAVE_LOOPS
1.1  mrg 	loop	a9, .Ldiv_loopend
1.1  mrg #endif
1.1  mrg .Ldiv_loop:
1.1  mrg 	/* Shift the quotient << 1.  */
1.1  mrg 	slli	a10, a10, 1
1.1  mrg
1.1  mrg 	/* Is this digit a 0 or 1?  */
1.1  mrg 	bltu	a2, a3, 1f
1.1  mrg
1.1  mrg 	/* Output a 1 and subtract.  */
1.1  mrg 	addi	a10, a10, 1
1.1  mrg 	sub	a2, a2, a3
1.1  mrg
1.1  mrg 	/* Shift the dividend << 1.  */
1.1  mrg 1:	slli	a2, a2, 1
1.1  mrg
1.1  mrg #if !XCHAL_HAVE_LOOPS
1.1  mrg 	addi	a9, a9, -1
1.1  mrg 	bnez	a9, .Ldiv_loop
1.1  mrg #endif
1.1  mrg .Ldiv_loopend:
1.1  mrg
1.1  mrg 	/* Add the exponent bias (less one to account for the explicit "1.0"
1.1  mrg 	   of the mantissa that will be added to the exponent in the final
1.1  mrg 	   result).  */
1.1  mrg 	addi	a8, a8, 0x7e
1.1  mrg
1.1  mrg 	/* Check for over/underflow.  The value in a8 is one less than the
1.1  mrg 	   final exponent, so values in the range 0..fd are OK here.  The
1.1  mrg 	   comparison is unsigned, so a negative a8 (underflow) also takes
1.1  mrg 	   the branch and is sorted out at .Ldiv_overflow.  */
1.1  mrg 	movi	a4, 0xfe
1.1  mrg 	bgeu	a8, a4, .Ldiv_overflow
1.1  mrg
1.1  mrg .Ldiv_round:
1.1  mrg 	/* Round.  The remainder (<< 1) is in a2.  Less than the divisor
1.1  mrg 	   means less than half: keep the quotient.  Otherwise round up,
1.1  mrg 	   with the exact tie handled separately.  */
1.1  mrg 	bltu	a2, a3, .Ldiv_rounded
1.1  mrg 	addi	a10, a10, 1
1.1  mrg 	beq	a2, a3, .Ldiv_exactlyhalf
1.1  mrg
1.1  mrg .Ldiv_rounded:
1.1  mrg 	/* Add the exponent to the mantissa.  */
1.1  mrg 	slli	a8, a8, 23
1.1  mrg 	add	a2, a10, a8
1.1  mrg
1.1  mrg .Ldiv_addsign:
1.1  mrg 	/* Add the sign bit.  */
1.1  mrg 	srli	a7, a7, 31
1.1  mrg 	slli	a7, a7, 31
1.1  mrg 	or	a2, a2, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Ldiv_overflow:
1.1  mrg 	bltz	a8, .Ldiv_underflow
1.1  mrg 	/* Return +/- Infinity.  */
1.1  mrg 	addi	a8, a4, 1	/* 0xff */
1.1  mrg 	slli	a2, a8, 23
1.1  mrg 	j	.Ldiv_addsign
1.1  mrg
1.1  mrg .Ldiv_exactlyhalf:
1.1  mrg 	/* Remainder is exactly half the divisor.  Round even.  */
1.1  mrg 	srli	a10, a10, 1
1.1  mrg 	slli	a10, a10, 1
1.1  mrg 	j	.Ldiv_rounded
1.1  mrg
1.1  mrg .Ldiv_underflow:
1.1  mrg 	/* Create a subnormal value, where the exponent field contains zero,
1.1  mrg 	   but the effective exponent is 1.  The value of a8 is one less than
1.1  mrg 	   the actual exponent, so just negate it to get the shift amount.
1.1  mrg 	   A shift of 32 or more leaves nothing of the quotient.  */
1.1  mrg 	neg	a8, a8
1.1  mrg 	ssr	a8
1.1  mrg 	bgeui	a8, 32, .Ldiv_flush_to_zero
1.1  mrg
1.1  mrg 	/* Shift a10 right.  Any bits that are shifted out of a10 are
1.1  mrg 	   saved in a6 for rounding the result.  (With the shift register
1.1  mrg 	   set up by ssr for a right shift by a8, sll shifts left by
1.1  mrg 	   32 - a8, so a6 receives exactly the bits that srl drops.)  */
1.1  mrg 	sll	a6, a10
1.1  mrg 	srl	a10, a10
1.1  mrg
1.1  mrg 	/* Set the exponent to zero.  */
1.1  mrg 	movi	a8, 0
1.1  mrg
1.1  mrg 	/* Pack any nonzero remainder (in a2) into a6.  */
1.1  mrg 	beqz	a2, 1f
1.1  mrg 	movi	a9, 1
1.1  mrg 	or	a6, a6, a9
1.1  mrg
1.1  mrg 	/* Round a10 based on the bits shifted out into a6.  msb clear:
1.1  mrg 	   below half, keep.  msb set: round up, then clear the lsb again
1.1  mrg 	   if nothing else was set (exact tie, round to even).  */
1.1  mrg 1:	bgez	a6, .Ldiv_rounded
1.1  mrg 	addi	a10, a10, 1
1.1  mrg 	slli	a6, a6, 1
1.1  mrg 	bnez	a6, .Ldiv_rounded
1.1  mrg 	srli	a10, a10, 1
1.1  mrg 	slli	a10, a10, 1
1.1  mrg 	j	.Ldiv_rounded
1.1  mrg
1.1  mrg .Ldiv_flush_to_zero:
1.1  mrg 	/* Return zero with the appropriate sign bit.  */
1.1  mrg 	srli	a2, a7, 31
1.1  mrg 	slli	a2, a2, 31
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_divsf3 */
1.1  mrg
1.1  mrg #ifdef L_cmpsf2
1.1  mrg
1.1  mrg 	/* Equal and Not Equal
1.1  mrg
1.1  mrg 	   __eqsf2 and its alias __nesf2 compare x (a2) with y (a3) and
1.1  mrg 	   return 0 in a2 when the operands are equal and 1 when they are
1.1  mrg 	   not.  +0 and -0 compare equal; a NaN never compares equal, not
1.1  mrg 	   even to itself.  May clobber a3, a6 and a7.  */
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__eqsf2
1.1  mrg 	.global	__nesf2
1.1  mrg 	.set	__nesf2, __eqsf2
1.1  mrg 	.type	__eqsf2, @function
1.1  mrg __eqsf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	bne	a2, a3, 4f
1.1  mrg
1.1  mrg 	/* The values are equal but NaN != NaN.  Check the exponent.  */
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, 3f
1.1  mrg
1.1  mrg 	/* Equal.  */
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 	/* Identical bit patterns with an all-ones exponent: Infinity if
1.1  mrg 	   the mantissa is zero (equal), NaN otherwise (not equal).  */
1.1  mrg 3:	slli	a7, a2, 9
1.1  mrg 	j	5f
1.1  mrg
1.1  mrg 	/* Different bit patterns: still equal if x and y are zeros with
1.1  mrg 	   different signs, i.e. (x | y) without the sign bit is zero.  */
1.1  mrg 4:	or	a7, a2, a3
1.1  mrg 	slli	a7, a7, 1
1.1  mrg
1.1  mrg 	/* Equal if a7 == 0, where a7 is either abs(x | y) or the mantissa
1.1  mrg 	   of x when exponent(x) = 0xff and x == y.  */
1.1  mrg 5:	movi	a2, 0
1.1  mrg 	movi	a3, 1
1.1  mrg 	movnez	a2, a3, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg
1.1  mrg 	/* Greater Than
1.1  mrg
1.1  mrg 	   __gtsf2 compares x (a2) with y (a3).  If either operand is a
1.1  mrg 	   NaN it returns 0 in a2.  Otherwise it continues at .Lle_cmp
1.1  mrg 	   (the ordered comparison that follows __lesf2), which returns 1
1.1  mrg 	   when x > y and 0 when x <= y.  */
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__gtsf2
1.1  mrg 	.type	__gtsf2, @function
1.1  mrg __gtsf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, 2f		/* x is NaN or Infinity */
1.1  mrg 1:	bnall	a3, a6, .Lle_cmp	/* exponent of y is not all ones */
1.1  mrg
1.1  mrg 	/* Check if y is a NaN.  (A zero mantissa means Infinity, which
1.1  mrg 	   is compared like any other value.)  */
1.1  mrg 	slli	a7, a3, 9
1.1  mrg 	beqz	a7, .Lle_cmp
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 	/* Check if x is a NaN.  If it is an Infinity instead, go back and
1.1  mrg 	   examine y.  */
1.1  mrg 2:	slli	a7, a2, 9
1.1  mrg 	beqz	a7, 1b
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg
1.1  mrg 	/* Less Than or Equal
1.1  mrg
1.1  mrg 	   __lesf2 compares x (a2) with y (a3) and returns, in a2, 0 when
1.1  mrg 	   x <= y and 1 otherwise; 1 is also returned when either operand
1.1  mrg 	   is a NaN.  The ordered comparison at .Lle_cmp is shared with
1.1  mrg 	   __gtsf2.  */
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__lesf2
1.1  mrg 	.type	__lesf2, @function
1.1  mrg __lesf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, 2f		/* x is NaN or Infinity */
1.1  mrg 1:	bnall	a3, a6, .Lle_cmp	/* exponent of y is not all ones */
1.1  mrg
1.1  mrg 	/* Check if y is a NaN.  */
1.1  mrg 	slli	a7, a3, 9
1.1  mrg 	beqz	a7, .Lle_cmp
1.1  mrg 	movi	a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 	/* Check if x is a NaN.  If it is an Infinity instead, go back and
1.1  mrg 	   examine y.  */
1.1  mrg 2:	slli	a7, a2, 9
1.1  mrg 	beqz	a7, 1b
1.1  mrg 	movi	a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lle_cmp:
1.1  mrg 	/* Neither operand is a NaN here.  Returns 0 if x <= y, else 1.
1.1  mrg
1.1  mrg 	   Check if x and y have different signs.  */
1.1  mrg 	xor	a7, a2, a3
1.1  mrg 	bltz	a7, .Lle_diff_signs
1.1  mrg
1.1  mrg 	/* Check if x is negative.  */
1.1  mrg 	bltz	a2, .Lle_xneg
1.1  mrg
1.1  mrg 	/* Check if x <= y.  Both are non-negative, so the unsigned order
1.1  mrg 	   of the bit patterns is the order of the values.  */
1.1  mrg 	bltu	a3, a2, 5f
1.1  mrg 4:	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lle_xneg:
1.1  mrg 	/* Check if y <= x as bit patterns.  Both values are negative, so
1.1  mrg 	   the larger bit pattern is the smaller value and this means
1.1  mrg 	   x <= y.  */
1.1  mrg 	bgeu	a2, a3, 4b
1.1  mrg 5:	movi	a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lle_diff_signs:
1.1  mrg 	bltz	a2, 4b			/* x negative, y not: x <= y */
1.1  mrg
1.1  mrg 	/* Check if both x and y are zero.  x is non-negative and y is
1.1  mrg 	   negative here, so x > y unless they are +0 and -0; a7 (x | y
1.1  mrg 	   without the sign bit) is zero only in that case.  */
1.1  mrg 	or	a7, a2, a3
1.1  mrg 	slli	a7, a7, 1
1.1  mrg 	movi	a2, 1
1.1  mrg 	movi	a3, 0
1.1  mrg 	moveqz	a2, a3, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg
1.1  mrg 	/* Greater Than or Equal
1.1  mrg
1.1  mrg 	   __gesf2 compares x (a2) with y (a3).  If either operand is a
1.1  mrg 	   NaN it returns -1 in a2.  Otherwise it continues at .Llt_cmp
1.1  mrg 	   (the ordered comparison that follows __ltsf2), which returns 0
1.1  mrg 	   when x >= y and -1 when x < y.  */
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__gesf2
1.1  mrg 	.type	__gesf2, @function
1.1  mrg __gesf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, 2f		/* x is NaN or Infinity */
1.1  mrg 1:	bnall	a3, a6, .Llt_cmp	/* exponent of y is not all ones */
1.1  mrg
1.1  mrg 	/* Check if y is a NaN.  (A zero mantissa means Infinity, which
1.1  mrg 	   is compared like any other value.)  */
1.1  mrg 	slli	a7, a3, 9
1.1  mrg 	beqz	a7, .Llt_cmp
1.1  mrg 	movi	a2, -1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 	/* Check if x is a NaN.  If it is an Infinity instead, go back and
1.1  mrg 	   examine y.  */
1.1  mrg 2:	slli	a7, a2, 9
1.1  mrg 	beqz	a7, 1b
1.1  mrg 	movi	a2, -1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg
1.1  mrg 	/* Less Than
1.1  mrg
1.1  mrg 	   __ltsf2 compares x (a2) with y (a3) and returns, in a2, -1 when
1.1  mrg 	   x < y and 0 otherwise; 0 is also returned when either operand
1.1  mrg 	   is a NaN.  The ordered comparison at .Llt_cmp is shared with
1.1  mrg 	   __gesf2.  */
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__ltsf2
1.1  mrg 	.type	__ltsf2, @function
1.1  mrg __ltsf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, 2f		/* x is NaN or Infinity */
1.1  mrg 1:	bnall	a3, a6, .Llt_cmp	/* exponent of y is not all ones */
1.1  mrg
1.1  mrg 	/* Check if y is a NaN.  */
1.1  mrg 	slli	a7, a3, 9
1.1  mrg 	beqz	a7, .Llt_cmp
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 	/* Check if x is a NaN.  If it is an Infinity instead, go back and
1.1  mrg 	   examine y.  */
1.1  mrg 2:	slli	a7, a2, 9
1.1  mrg 	beqz	a7, 1b
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Llt_cmp:
1.1  mrg 	/* Neither operand is a NaN here.  Returns -1 if x < y, else 0.
1.1  mrg
1.1  mrg 	   Check if x and y have different signs.  */
1.1  mrg 	xor	a7, a2, a3
1.1  mrg 	bltz	a7, .Llt_diff_signs
1.1  mrg
1.1  mrg 	/* Check if x is negative.  */
1.1  mrg 	bltz	a2, .Llt_xneg
1.1  mrg
1.1  mrg 	/* Check if x < y.  Both are non-negative, so the unsigned order
1.1  mrg 	   of the bit patterns is the order of the values.  */
1.1  mrg 	bgeu	a2, a3, 5f
1.1  mrg 4:	movi	a2, -1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Llt_xneg:
1.1  mrg 	/* Check if y < x as bit patterns.  Both values are negative, so
1.1  mrg 	   the larger bit pattern is the smaller value and this means
1.1  mrg 	   x < y.  */
1.1  mrg 	bltu	a3, a2, 4b
1.1  mrg 5:	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Llt_diff_signs:
1.1  mrg 	bgez	a2, 5b			/* x non-negative, y negative: not < */
1.1  mrg
1.1  mrg 	/* x is negative and y is not, so x < y unless they are -0 and +0.
1.1  mrg 	   a7 (x | y without the sign bit) is nonzero whenever at least
1.1  mrg 	   one operand is nonzero; only then is -1 returned.  */
1.1  mrg 	or	a7, a2, a3
1.1  mrg 	slli	a7, a7, 1
1.1  mrg 	movi	a2, 0
1.1  mrg 	movi	a3, -1
1.1  mrg 	movnez	a2, a3, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg
1.1  mrg 	/* Unordered
1.1  mrg
1.1  mrg 	   __unordsf2 returns 1 in a2 when x (a2) or y (a3) is a NaN, and
1.1  mrg 	   0 when both operands are ordered.  Uses a6 and a7 as scratch.  */
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__unordsf2
1.1  mrg 	.type	__unordsf2, @function
1.1  mrg __unordsf2:
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* An all-ones exponent field marks a NaN or an Infinity; only
1.1  mrg 	   those operands need a look at the mantissa.  */
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, .Lunord_xexpmax
1.1  mrg .Lunord_checky:
1.1  mrg 	ball	a3, a6, .Lunord_yexpmax
1.1  mrg .Lunord_ordered:
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lunord_xexpmax:
1.1  mrg 	/* x is a NaN only if its mantissa is nonzero; an Infinity still
1.1  mrg 	   requires y to be examined.  */
1.1  mrg 	slli	a7, a2, 9
1.1  mrg 	beqz	a7, .Lunord_checky
1.1  mrg .Lunord_nan:
1.1  mrg 	movi	a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lunord_yexpmax:
1.1  mrg 	/* Same test for y.  */
1.1  mrg 	slli	a7, a3, 9
1.1  mrg 	bnez	a7, .Lunord_nan
1.1  mrg 	j	.Lunord_ordered
1.1  mrg
1.1  mrg #endif /* L_cmpsf2 */
1.1  mrg
1.1  mrg #ifdef L_fixsfsi
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__fixsfsi
1.1  mrg 	.type	__fixsfsi, @function
1.1  mrg __fixsfsi:
1.1  mrg 	/* Convert the single-precision value in a2 to a signed 32-bit
1.1  mrg 	   integer returned in a2.  Fraction bits are dropped.  Values
1.1  mrg 	   that do not fit, and Infinities, saturate according to their
1.1  mrg 	   sign; NaN gives 0x7fffffff.  Uses a4-a7 as scratch.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* a6 = exponent mask.  An all-ones exponent is NaN or Infinity.  */
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, .Lfixsfsi_nan_or_inf
1.1  mrg
1.1  mrg 	/* a4 = exponent - 0x7e, the number of integer bits in |x|.
1.1  mrg 	   Below 1 the result is zero; 32 or more cannot be represented.  */
1.1  mrg 	extui	a4, a2, 23, 8
1.1  mrg 	addi	a4, a4, -0x7e
1.1  mrg 	blti	a4, 1, .Lfixsfsi_zero
1.1  mrg 	bgei	a4, 32, .Lfixsfsi_maxint
1.1  mrg
1.1  mrg 	/* Set up the right shift by 32 - a4 for the srl below.  */
1.1  mrg 	ssl	a4
1.1  mrg
1.1  mrg 	/* a7 = x with all exponent bits set (its msb is still the sign).
1.1  mrg 	   Shifting it left by 8 puts the explicit "1.0" at bit 31; the
1.1  mrg 	   srl then leaves just the integer part in a5.  */
1.1  mrg 	or	a7, a2, a6
1.1  mrg 	slli	a5, a7, 8
1.1  mrg 	srl	a5, a5
1.1  mrg
1.1  mrg 	/* a2 = (sign of x set) ? -a5 : a5.  */
1.1  mrg 	neg	a2, a5
1.1  mrg 	movgez	a2, a5, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixsfsi_zero:
1.1  mrg 	/* |x| < 1.  */
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixsfsi_nan_or_inf:
1.1  mrg 	/* A zero mantissa means Infinity, which saturates by its sign.  */
1.1  mrg 	slli	a4, a2, 9
1.1  mrg 	beqz	a4, .Lfixsfsi_maxint
1.1  mrg
1.1  mrg 	/* NaN: clear a2 so the code below picks +maxint.  */
1.1  mrg 	movi	a2, 0
1.1  mrg
1.1  mrg .Lfixsfsi_maxint:
1.1  mrg 	/* a2 = (a2 < 0) ? 0x80000000 : 0x7fffffff.  */
1.1  mrg 	slli	a5, a6, 8	/* 0x80000000 */
1.1  mrg 	addi	a4, a5, -1	/* 0x7fffffff */
1.1  mrg 	movltz	a4, a5, a2
1.1  mrg 	mov	a2, a4
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_fixsfsi */
1.1  mrg
1.1  mrg #ifdef L_fixsfdi
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__fixsfdi
1.1  mrg 	.type	__fixsfdi, @function
1.1  mrg __fixsfdi:	/* Convert the single-precision value in a2 to a signed
1.1  mrg 		   64-bit integer returned in the xh:xl register pair
1.1  mrg 		   (a2 and a3; which is which depends on __XTENSA_EB__).
1.1  mrg 		   Fraction bits are dropped.  Values that do not fit,
1.1  mrg 		   and Infinities, saturate according to their sign;
1.1  mrg 		   NaN gives the largest positive value.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* Check for NaN and Infinity.  */
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, .Lfixsfdi_nan_or_inf
1.1  mrg
1.1  mrg 	/* Extract the exponent and check if 0 < (exp - 0x7e) < 64.  */
1.1  mrg 	extui	a4, a2, 23, 8
1.1  mrg 	addi	a4, a4, -0x7e
1.1  mrg 	bgei	a4, 64, .Lfixsfdi_maxint
1.1  mrg 	blti	a4, 1, .Lfixsfdi_zero
1.1  mrg
1.1  mrg 	/* Add explicit "1.0" and shift << 8.  The sign of x stays in the
1.1  mrg 	   msb of a7, since xh and xl overwrite a2 and a3 from here on.  */
1.1  mrg 	or	a7, a2, a6
1.1  mrg 	slli	xh, a7, 8
1.1  mrg
1.1  mrg 	/* Shift back to the right, based on the exponent.  With fewer than
1.1  mrg 	   32 integer bits the whole result lands in the low word.  */
1.1  mrg 	ssl	a4		/* shift by 64 - a4 */
1.1  mrg 	bgei	a4, 32, .Lfixsfdi_smallshift
1.1  mrg 	srl	xl, xh
1.1  mrg 	movi	xh, 0
1.1  mrg
1.1  mrg .Lfixsfdi_shifted:
1.1  mrg 	/* Negate the result if sign != 0.  This is a 64-bit negation:
1.1  mrg 	   both words are negated and one is borrowed from the high word
1.1  mrg 	   when the low word is nonzero.  */
1.1  mrg 	bgez	a7, 1f
1.1  mrg 	neg	xl, xl
1.1  mrg 	neg	xh, xh
1.1  mrg 	beqz	xl, 1f
1.1  mrg 	addi	xh, xh, -1
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Lfixsfdi_smallshift:
1.1  mrg 	movi	xl, 0	/* NOTE(review): looks redundant, sll overwrites xl */
1.1  mrg 	sll	xl, xh	/* bits of xh that move down into the low word */
1.1  mrg 	srl	xh, xh
1.1  mrg 	j	.Lfixsfdi_shifted
1.1  mrg
1.1  mrg .Lfixsfdi_nan_or_inf:
1.1  mrg 	/* Handle Infinity and NaN.  A zero mantissa means Infinity.  */
1.1  mrg 	slli	a4, a2, 9
1.1  mrg 	beqz	a4, .Lfixsfdi_maxint
1.1  mrg
1.1  mrg 	/* Translate NaN to +maxint.  */
1.1  mrg 	movi	a2, 0
1.1  mrg
1.1  mrg .Lfixsfdi_maxint:
1.1  mrg 	/* a2 still holds the input (or 0 for a NaN) on every path that
1.1  mrg 	   gets here, so its sign selects the saturation value.  */
1.1  mrg 	slli	a7, a6, 8	/* 0x80000000 */
1.1  mrg 	bgez	a2, 1f
1.1  mrg 	mov	xh, a7
1.1  mrg 	movi	xl, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg 1:	addi	xh, a7, -1	/* 0x7fffffff */
1.1  mrg 	movi	xl, -1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixsfdi_zero:
1.1  mrg 	movi	xh, 0
1.1  mrg 	movi	xl, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_fixsfdi */
1.1  mrg
1.1  mrg #ifdef L_fixunssfsi
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__fixunssfsi
1.1  mrg 	.type	__fixunssfsi, @function
1.1  mrg __fixunssfsi:
1.1  mrg 	/* Convert the single-precision value in a2 to an unsigned 32-bit
1.1  mrg 	   integer returned in a2.  Fraction bits are dropped.  In-range
1.1  mrg 	   negative inputs give the two's complement of their magnitude.
1.1  mrg 	   Too-large values and Infinities give 0xffffffff when positive
1.1  mrg 	   and 0x80000000 when negative; NaN gives 0xffffffff.  Uses a4-a7
1.1  mrg 	   as scratch.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* a6 = exponent mask.  An all-ones exponent is NaN or Infinity.  */
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, .Lfixunssfsi_nan_or_inf
1.1  mrg
1.1  mrg 	/* a4 = exponent - 0x7f.  Negative: |x| < 1, the result is zero.
1.1  mrg 	   32 or more: the value cannot be represented.  */
1.1  mrg 	extui	a4, a2, 23, 8
1.1  mrg 	addi	a4, a4, -0x7f
1.1  mrg 	bltz	a4, .Lfixunssfsi_zero
1.1  mrg 	bgei	a4, 32, .Lfixunssfsi_maxint
1.1  mrg
1.1  mrg 	/* a7 = x with all exponent bits set (its msb is still the sign);
1.1  mrg 	   a5 = mantissa with the explicit "1.0" at bit 31.  */
1.1  mrg 	or	a7, a2, a6
1.1  mrg 	slli	a5, a7, 8
1.1  mrg
1.1  mrg 	/* a4 = number of integer bits.  With all 32 of them there is
1.1  mrg 	   nothing to shift out, which is handled separately.  */
1.1  mrg 	addi	a4, a4, 1
1.1  mrg 	beqi	a4, 32, .Lfixunssfsi_bigexp
1.1  mrg 	ssl	a4		/* shift by 32 - a4 */
1.1  mrg 	srl	a5, a5
1.1  mrg
1.1  mrg 	/* a2 = (sign of x set) ? -a5 : a5.  */
1.1  mrg 	neg	a2, a5
1.1  mrg 	movgez	a2, a5, a7
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfsi_zero:
1.1  mrg 	/* |x| < 1.  */
1.1  mrg 	movi	a2, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfsi_bigexp:
1.1  mrg 	/* Unsigned maximum exponent: a5 already is the result for a
1.1  mrg 	   non-negative input; a negative one gives 0x80000000.  */
1.1  mrg 	slli	a4, a6, 8	/* 0x80000000 */
1.1  mrg 	movltz	a5, a4, a2
1.1  mrg 	mov	a2, a5
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfsi_nan_or_inf:
1.1  mrg 	/* A zero mantissa means Infinity, which saturates by its sign.  */
1.1  mrg 	slli	a4, a2, 9
1.1  mrg 	beqz	a4, .Lfixunssfsi_maxint
1.1  mrg
1.1  mrg 	/* Translate NaN to 0xffffffff.  */
1.1  mrg 	movi	a2, -1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfsi_maxint:
1.1  mrg 	/* a2 = (a2 < 0) ? 0x80000000 : 0xffffffff.  */
1.1  mrg 	movi	a4, -1		/* 0xffffffff */
1.1  mrg 	slli	a5, a6, 8	/* 0x80000000 */
1.1  mrg 	movltz	a4, a5, a2
1.1  mrg 	mov	a2, a4
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_fixunssfsi */
1.1  mrg
1.1  mrg #ifdef L_fixunssfdi
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__fixunssfdi
1.1  mrg 	.type	__fixunssfdi, @function
1.1  mrg __fixunssfdi:	/* Convert the single-precision value in a2 to an
1.1  mrg 		   unsigned 64-bit integer returned in the xh:xl pair
1.1  mrg 		   (a2 and a3; which is which depends on __XTENSA_EB__).
1.1  mrg 		   Fraction bits are dropped.  In-range negative inputs
1.1  mrg 		   give the two's complement of their magnitude.
1.1  mrg 		   Too-large values and Infinities give all ones when
1.1  mrg 		   positive and 0x80000000:00000000 when negative; NaN
1.1  mrg 		   gives all ones.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* Check for NaN and Infinity.  */
1.1  mrg 	movi	a6, 0x7f800000
1.1  mrg 	ball	a2, a6, .Lfixunssfdi_nan_or_inf
1.1  mrg
1.1  mrg 	/* Extract the exponent and check if 0 <= (exp - 0x7f) < 64.  */
1.1  mrg 	extui	a4, a2, 23, 8
1.1  mrg 	addi	a4, a4, -0x7f
1.1  mrg 	bgei	a4, 64, .Lfixunssfdi_maxint
1.1  mrg 	bltz	a4, .Lfixunssfdi_zero
1.1  mrg
1.1  mrg 	/* Add explicit "1.0" and shift << 8.  The sign of x stays in the
1.1  mrg 	   msb of a7, since xh and xl overwrite a2 and a3 from here on.  */
1.1  mrg 	or	a7, a2, a6
1.1  mrg 	slli	xh, a7, 8
1.1  mrg
1.1  mrg 	/* Shift back to the right, based on the exponent.  a4 becomes the
1.1  mrg 	   number of integer bits; with all 64 of them no shift is needed,
1.1  mrg 	   and with fewer than 32 the result lands in the low word.  */
1.1  mrg 	addi	a4, a4, 1
1.1  mrg 	beqi	a4, 64, .Lfixunssfdi_bigexp
1.1  mrg 	ssl	a4		/* shift by 64 - a4 */
1.1  mrg 	bgei	a4, 32, .Lfixunssfdi_smallshift
1.1  mrg 	srl	xl, xh
1.1  mrg 	movi	xh, 0
1.1  mrg
1.1  mrg .Lfixunssfdi_shifted:
1.1  mrg 	/* Negate the result if sign != 0.  This is a 64-bit negation:
1.1  mrg 	   both words are negated and one is borrowed from the high word
1.1  mrg 	   when the low word is nonzero.  */
1.1  mrg 	bgez	a7, 1f
1.1  mrg 	neg	xl, xl
1.1  mrg 	neg	xh, xh
1.1  mrg 	beqz	xl, 1f
1.1  mrg 	addi	xh, xh, -1
1.1  mrg 1:	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfdi_smallshift:
1.1  mrg 	movi	xl, 0		/* low half of the xh:xl funnel shift input */
1.1  mrg 	src	xl, xh, xl	/* bits of xh that move down into the low word */
1.1  mrg 	srl	xh, xh
1.1  mrg 	j	.Lfixunssfdi_shifted
1.1  mrg
1.1  mrg .Lfixunssfdi_nan_or_inf:
1.1  mrg 	/* Handle Infinity and NaN.  A zero mantissa means Infinity.  */
1.1  mrg 	slli	a4, a2, 9
1.1  mrg 	beqz	a4, .Lfixunssfdi_maxint
1.1  mrg
1.1  mrg 	/* Translate NaN to 0xffffffff.... */
1.1  mrg 1:	movi	xh, -1
1.1  mrg 	movi	xl, -1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfdi_maxint:
1.1  mrg 	bgez	a2, 1b		/* a2 still holds the input: positive gives all ones */
1.1  mrg 2:	slli	xh, a6, 8	/* 0x80000000 */
1.1  mrg 	movi	xl, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfdi_zero:
1.1  mrg 	movi	xh, 0
1.1  mrg 	movi	xl, 0
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfixunssfdi_bigexp:
1.1  mrg 	/* Handle unsigned maximum exponent case.  A negative input gives
1.1  mrg 	   0x80000000:00000000; otherwise xh already holds the mantissa
1.1  mrg 	   with its leading one at bit 31 and only xl needs clearing.  */
1.1  mrg 	bltz	a7, 2b
1.1  mrg 	movi	xl, 0
1.1  mrg 	leaf_return		/* no shift needed */
1.1  mrg
1.1  mrg #endif /* L_fixunssfdi */
1.1  mrg
1.1  mrg #ifdef L_floatsisf
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__floatunsisf
1.1  mrg 	.type	__floatunsisf, @function
1.1  mrg __floatunsisf:	/* Convert the unsigned 32-bit integer in a2 to single
1.1  mrg 		   precision, returned in a2.  Zero is returned as is;
1.1  mrg 		   everything else joins the __floatsisf code below
1.1  mrg 		   with the sign (a7) forced to zero.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg 	beqz	a2, .Lfloatsisf_return
1.1  mrg
1.1  mrg 	/* Set the sign to zero and jump to the floatsisf code.  */
1.1  mrg 	movi	a7, 0
1.1  mrg 	j	.Lfloatsisf_normalize
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__floatsisf
1.1  mrg 	.type	__floatsisf, @function
1.1  mrg __floatsisf:	/* Convert the signed 32-bit integer in a2 to single
1.1  mrg 		   precision, returned in a2, rounding to nearest with
1.1  mrg 		   ties going to the even mantissa.  a7 carries the
1.1  mrg 		   sign; a4-a6 are scratch.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* Check for zero.  */
1.1  mrg 	beqz	a2, .Lfloatsisf_return
1.1  mrg
1.1  mrg 	/* Save the sign.  */
1.1  mrg 	extui	a7, a2, 31, 1
1.1  mrg
1.1  mrg 	/* Get the absolute value.  */
1.1  mrg #if XCHAL_HAVE_ABS
1.1  mrg 	abs	a2, a2
1.1  mrg #else
1.1  mrg 	neg	a4, a2
1.1  mrg 	movltz	a2, a4, a2
1.1  mrg #endif
1.1  mrg
1.1  mrg .Lfloatsisf_normalize:
1.1  mrg 	/* Normalize with the first 1 bit in the msb.
1.1  mrg 	   NOTE(review): do_nsau is a macro defined outside this chunk;
1.1  mrg 	   presumably it leaves the number of leading zero bits of a2 in
1.1  mrg 	   a4 and uses a5/a6 as scratch -- confirm against its definition.  */
1.1  mrg 	do_nsau	a4, a2, a5, a6
1.1  mrg 	ssl	a4
1.1  mrg 	sll	a5, a2
1.1  mrg
1.1  mrg 	/* Shift the mantissa into position, with rounding bits in a6.
1.1  mrg 	   The leading one ends up at bit 23 of a2; the 8 bits that do not
1.1  mrg 	   fit are moved to the top of a6.  */
1.1  mrg 	srli	a2, a5, 8
1.1  mrg 	slli	a6, a5, (32 - 8)
1.1  mrg
1.1  mrg 	/* Set the exponent.  The bias is one short (0x7e) because the
1.1  mrg 	   explicit leading one at bit 23 adds one to the exponent field.  */
1.1  mrg 	movi	a5, 0x9d	/* 0x7e + 31 */
1.1  mrg 	sub	a5, a5, a4
1.1  mrg 	slli	a5, a5, 23
1.1  mrg 	add	a2, a2, a5
1.1  mrg
1.1  mrg 	/* Add the sign.  */
1.1  mrg 	slli	a7, a7, 31
1.1  mrg 	or	a2, a2, a7
1.1  mrg
1.1  mrg 	/* Round up if the leftover fraction is >= 1/2.  (A clear msb in
1.1  mrg 	   a6 means it is below 1/2 and a2 is returned unchanged.)  */
1.1  mrg 	bgez	a6, .Lfloatsisf_return
1.1  mrg 	addi	a2, a2, 1	/* Overflow to the exponent is OK.  */
1.1  mrg
1.1  mrg 	/* Check if the leftover fraction is exactly 1/2.  */
1.1  mrg 	slli	a6, a6, 1
1.1  mrg 	beqz	a6, .Lfloatsisf_exactlyhalf
1.1  mrg
1.1  mrg .Lfloatsisf_return:
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg .Lfloatsisf_exactlyhalf:
1.1  mrg 	/* Round down to the nearest even value.  */
1.1  mrg 	srli	a2, a2, 1
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_floatsisf */
1.1  mrg
1.1  mrg #ifdef L_floatdisf
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__floatundisf
1.1  mrg 	.type	__floatundisf, @function
1.1  mrg __floatundisf:	/* Convert the unsigned 64-bit integer in the xh:xl pair
1.1  mrg 		   (a2 and a3; which is which depends on __XTENSA_EB__)
1.1  mrg 		   to single precision, returned in a2.  Nonzero inputs
1.1  mrg 		   join the __floatdisf code below with the sign (a7)
1.1  mrg 		   forced to zero.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* Check for zero.  Both words are zero then, so a2 already holds
1.1  mrg 	   the result.  */
1.1  mrg 	or	a4, xh, xl
1.1  mrg 	beqz	a4, 2f
1.1  mrg
1.1  mrg 	/* Set the sign to zero and jump to the floatdisf code.  */
1.1  mrg 	movi	a7, 0
1.1  mrg 	j	.Lfloatdisf_normalize
1.1  mrg
1.1  mrg 	.align	4
1.1  mrg 	.global	__floatdisf
1.1  mrg 	.type	__floatdisf, @function
1.1  mrg __floatdisf:	/* Convert the signed 64-bit integer in the xh:xl pair to
1.1  mrg 		   single precision, returned in a2, rounding to nearest
1.1  mrg 		   with ties going to the even mantissa.  a7 carries the
1.1  mrg 		   sign; a4-a6 are scratch.  */
1.1  mrg 	leaf_entry sp, 16
1.1  mrg
1.1  mrg 	/* Check for zero.  Both words are zero then, so a2 already holds
1.1  mrg 	   the result.  */
1.1  mrg 	or	a4, xh, xl
1.1  mrg 	beqz	a4, 2f
1.1  mrg
1.1  mrg 	/* Save the sign.  */
1.1  mrg 	extui	a7, xh, 31, 1
1.1  mrg
1.1  mrg 	/* Get the absolute value.  For a negative input both words are
1.1  mrg 	   negated and one is borrowed from the high word when the low
1.1  mrg 	   word is nonzero.  */
1.1  mrg 	bgez	xh, .Lfloatdisf_normalize
1.1  mrg 	neg	xl, xl
1.1  mrg 	neg	xh, xh
1.1  mrg 	beqz	xl, .Lfloatdisf_normalize
1.1  mrg 	addi	xh, xh, -1
1.1  mrg
1.1  mrg .Lfloatdisf_normalize:
1.1  mrg 	/* Normalize with the first 1 bit in the msb of xh.  The pair is
1.1  mrg 	   shifted left as one 64-bit value: src fills the low end of xh
1.1  mrg 	   with the bits leaving the top of xl.
1.1  mrg 	   NOTE(review): do_nsau is a macro defined outside this chunk;
1.1  mrg 	   presumably it leaves the number of leading zero bits of xh in
1.1  mrg 	   a4 and uses a5/a6 as scratch -- confirm against its definition.  */
1.1  mrg 	beqz	xh, .Lfloatdisf_bigshift
1.1  mrg 	do_nsau	a4, xh, a5, a6
1.1  mrg 	ssl	a4
1.1  mrg 	src	xh, xh, xl
1.1  mrg 	sll	xl, xl
1.1  mrg
1.1  mrg .Lfloatdisf_shifted:
1.1  mrg 	/* Shift the mantissa into position, with rounding bits in a6.
1.1  mrg 	   After the 8-bit right shift xh holds the mantissa with its
1.1  mrg 	   leading one at bit 23, a6 the next 32 bits below it, and a5 the
1.1  mrg 	   8 bits below those.  Any nonzero bit in a5 is folded into the
1.1  mrg 	   lsb of a6 so that it still counts when testing for a tie.  */
1.1  mrg 	ssai	8
1.1  mrg 	sll	a5, xl
1.1  mrg 	src	a6, xh, xl
1.1  mrg 	srl	xh, xh
1.1  mrg 	beqz	a5, 1f
1.1  mrg 	movi	a5, 1
1.1  mrg 	or	a6, a6, a5
1.1  mrg 1:
1.1  mrg 	/* Set the exponent.  The bias is one short (0x7e) because the
1.1  mrg 	   explicit leading one at bit 23 adds one to the exponent field.  */
1.1  mrg 	movi	a5, 0xbd	/* 0x7e + 63 */
1.1  mrg 	sub	a5, a5, a4
1.1  mrg 	slli	a5, a5, 23
1.1  mrg 	add	a2, xh, a5
1.1  mrg
1.1  mrg 	/* Add the sign.  */
1.1  mrg 	slli	a7, a7, 31
1.1  mrg 	or	a2, a2, a7
1.1  mrg
1.1  mrg 	/* Round up if the leftover fraction is >= 1/2.  (A clear msb in
1.1  mrg 	   a6 means it is below 1/2 and a2 is returned unchanged.)  */
1.1  mrg 	bgez	a6, 2f
1.1  mrg 	addi	a2, a2, 1	/* Overflow to the exponent is OK.  */
1.1  mrg
1.1  mrg 	/* Check if the leftover fraction is exactly 1/2.  */
1.1  mrg 	slli	a6, a6, 1
1.1  mrg 	beqz	a6, .Lfloatdisf_exactlyhalf
1.1  mrg 2:	leaf_return
1.1  mrg
1.1  mrg .Lfloatdisf_bigshift:
1.1  mrg 	/* xh is zero.  Normalize with first 1 bit of xl in the msb of xh.
1.1  mrg 	   The total shift count kept in a4 is 32 more than the count
1.1  mrg 	   within xl.
1.1  mrg 	   NOTE(review): do_nsau is defined outside this chunk; presumably
1.1  mrg 	   a4 = leading zero count of xl, a5/a6 scratch -- confirm.  */
1.1  mrg 	do_nsau	a4, xl, a5, a6
1.1  mrg 	ssl	a4
1.1  mrg 	sll	xh, xl
1.1  mrg 	movi	xl, 0
1.1  mrg 	addi	a4, a4, 32
1.1  mrg 	j	.Lfloatdisf_shifted
1.1  mrg
1.1  mrg .Lfloatdisf_exactlyhalf:
1.1  mrg 	/* Round down to the nearest even value.  */
1.1  mrg 	srli	a2, a2, 1
1.1  mrg 	slli	a2, a2, 1
1.1  mrg 	leaf_return
1.1  mrg
1.1  mrg #endif /* L_floatdisf */