modf.S revision 1.2 1 1.2 eeh /* $NetBSD: modf.S,v 1.2 2000/07/23 07:12:22 eeh Exp $ */
2 1.1 eeh
3 1.1 eeh /*
4 1.1 eeh * Copyright (c) 1992, 1993
5 1.1 eeh * The Regents of the University of California. All rights reserved.
6 1.1 eeh *
7 1.1 eeh * This software was developed by the Computer Systems Engineering group
8 1.1 eeh * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
9 1.1 eeh * contributed to Berkeley.
10 1.1 eeh *
11 1.1 eeh * Redistribution and use in source and binary forms, with or without
12 1.1 eeh * modification, are permitted provided that the following conditions
13 1.1 eeh * are met:
14 1.1 eeh * 1. Redistributions of source code must retain the above copyright
15 1.1 eeh * notice, this list of conditions and the following disclaimer.
16 1.1 eeh * 2. Redistributions in binary form must reproduce the above copyright
17 1.1 eeh * notice, this list of conditions and the following disclaimer in the
18 1.1 eeh * documentation and/or other materials provided with the distribution.
19 1.1 eeh * 3. All advertising materials mentioning features or use of this software
20 1.1 eeh * must display the following acknowledgement:
21 1.1 eeh * This product includes software developed by the University of
22 1.1 eeh * California, Berkeley and its contributors.
23 1.1 eeh * 4. Neither the name of the University nor the names of its contributors
24 1.1 eeh * may be used to endorse or promote products derived from this software
25 1.1 eeh * without specific prior written permission.
26 1.1 eeh *
27 1.1 eeh * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28 1.1 eeh * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 1.1 eeh * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 1.1 eeh * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31 1.1 eeh * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 1.1 eeh * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 1.1 eeh * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 1.1 eeh * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 1.1 eeh * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 1.1 eeh * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37 1.1 eeh * SUCH DAMAGE.
38 1.1 eeh *
39 1.1 eeh * from: Header: modf.s,v 1.3 92/06/20 00:00:54 torek Exp
40 1.1 eeh */
41 1.1 eeh
42 1.1 eeh #include <machine/asm.h>
43 1.1 eeh #if defined(LIBC_SCCS) && !defined(lint)
44 1.1 eeh #if 0
45 1.1 eeh .asciz "@(#)modf.s 8.1 (Berkeley) 6/4/93"
46 1.1 eeh #else
47 1.2 eeh RCSID("$NetBSD: modf.S,v 1.2 2000/07/23 07:12:22 eeh Exp $")
48 1.1 eeh #endif
49 1.1 eeh #endif /* LIBC_SCCS and not lint */
50 1.1 eeh
51 1.1 eeh #include <machine/fsr.h>
52 1.1 eeh
53 1.1 eeh /*
54 1.1 eeh * double modf(double val, double *iptr)
55 1.1 eeh *
56 1.1 eeh * Returns the fractional part of `val', storing the integer part of
57 1.1 eeh * `val' in *iptr. Both *iptr and the return value have the same sign
58 1.1 eeh * as `val'.
59 1.1 eeh *
60 1.1 eeh * Method:
61 1.1 eeh *
62 1.1 eeh * We use the fpu's normalization hardware to compute the integer portion
63 1.1 eeh * of the double precision argument. Sun IEEE double precision numbers
64 1.1 eeh * have 52 bits of mantissa, 11 bits of exponent, and one bit of sign,
65 1.1 eeh * with the sign occupying bit 31 of word 0, and the exponent bits 30:20
66 1.1 eeh * of word 0. Thus, values >= 2^52 are by definition integers.
67 1.1 eeh *
68 1.1 eeh * If we take a value that is in the range [+0..2^52) and add 2^52, all
69 1.1 eeh * of the fractional bits fall out and all of the integer bits are summed
70 1.1 eeh * with 2^52. If we then subtract 2^52, we get those integer bits back.
71 1.1 eeh * This must be done with rounding set to `towards 0' or `towards -inf'.
72 1.1 eeh * `Toward -inf' fails when the value is 0 (we get -0 back)....
73 1.1 eeh *
74 1.1 eeh * Note that this method will work anywhere, but is machine dependent in
75 1.1 eeh * various aspects.
76 1.1 eeh *
77 1.1 eeh * Stack usage:
78 1.2 eeh * 4@[%fp + BIAS - 4] saved %fsr
79 1.2 eeh * 4@[%fp + BIAS - 8] new %fsr with rounding set to `towards 0'
80 1.2 eeh * 8@[%fp + BIAS - 16] space for moving between %i and %f registers
81 1.1 eeh * Register usage:
82 1.1 eeh * %i0:%i1 double val;
83 1.1 eeh * %l0 scratch
84 1.1 eeh * %l1 sign bit (0x80000000)
85 1.1 eeh * %i2 double *iptr;
86 1.1 eeh * %f2:f3 `magic number' 2^52, in fpu registers
87 1.1 eeh * %f4:f5 double v, in fpu registers
88 1.1 eeh */
89 1.1 eeh
90 1.1 eeh .align 8
91 1.1 eeh Lmagic:
92 1.1 eeh .word 0x43300000 ! sign = 0, exponent = 52 + 1023, mantissa = 0
93 1.1 eeh .word 0 ! (i.e., .double 0r4503599627370496e+00)
94 1.1 eeh
95 1.1 eeh L0:
96 1.1 eeh .word 0 ! 0.0
97 1.1 eeh .word 0
98 1.1 eeh
/*
 * double modf(double val, double *iptr)
 *
 * Splits val into an integer part, stored through iptr, and a
 * fractional part, returned in %f0:f1.
 *
 * In:    %i0:%i1  val (high word in %i0, low word in %i1)
 *        %i2      iptr
 * Out:   %f0:f1   fractional part
 *        *iptr    integer part
 * Uses:  %l0, %l3-%l6, %g1 scratch; %l1 sign-bit mask;
 *        %f2:f3 = 2^52; %f4:f5 = |val|, later the integer part
 * Stack: 16 bytes below %fp + BIAS (two %fsr slots at -4 and -8, and
 *        an 8-byte slot at -16 for moving data between integer and
 *        fpu registers)
 *
 * NOTE(review): the argument registers above are the ones this file
 * documents and uses throughout; confirm they match the calling
 * convention of every ABI this file is built for.
 *
 * NOTE(review): on the Lbig path the returned fraction is always +0.0
 * (the L0 constant), also for negative or NaN input; confirm that this
 * is acceptable to callers.
 */
ENTRY(modf)
	save	%sp, -CC64FSZ-16, %sp	! register window + 16 scratch bytes

	/*
	 * First, compute v = abs(val) by clearing the sign bit, and get
	 * it into the fpu by bouncing both words through the stack.
	 * The load of 2^52 is interleaved with the two stores.
	 */
	sethi	%hi(0x80000000), %l1	! %l1 = sign-bit mask
	andn	%i0, %l1, %l0		! %l0 = high word with sign cleared
	st	%l0, [%fp + BIAS - 16]
#ifdef PIC
	PICCY_SET(Lmagic, %l0, %o7)
	ldd	[%l0], %f2		! %f2:f3 = 2^52
#else
	sethi	%hi(Lmagic), %l0
	ldd	[%l0 + %lo(Lmagic)], %f2	! %f2:f3 = 2^52
#endif
	st	%i1, [%fp + BIAS - 12]	! low word is used unchanged
	ldd	[%fp + BIAS - 16], %f4	! %f4:f5 = v

	/*
	 * Is v >= 2^52, or is the comparison unordered?  If so there are
	 * no fraction bits to strip and Lbig handles it.  The common
	 * case falls through.
	 */
	fcmped	%f4, %f2
	 nop				! fpop2 delay
	fbuge	Lbig			! if >= (or unordered), go out
	 nop

	/*
	 * v < 2^52, so add 2^52, then subtract 2^52, with the rounding
	 * direction forced towards zero.  Every other %fsr field,
	 * including the trap enables, is left as the caller had it.
	 */
	st	%fsr, [%fp + BIAS - 4]	! spill the current %fsr
	set	FSR_RD, %l3		! %l3 = rounding direction mask
	ld	[%fp + BIAS - 4], %l5	! %l5 = current %fsr
	set	FSR_RD_RZ << FSR_RD_SHIFT, %l4
	andn	%l5, %l3, %l6		! drop the current rounding direction
	or	%l6, %l4, %l6		! round towards zero, please
	and	%l5, %l3, %l5		! %l5 = original rounding direction only
	st	%l6, [%fp + BIAS - 8]
	ld	[%fp + BIAS - 8], %fsr

	faddd	%f4, %f2, %f4		! %f4:f5 += 2^52 (fraction bits fall off)
	fsubd	%f4, %f2, %f4		! %f4:f5 -= 2^52 (integer bits remain)

	/*
	 * Put the original rounding direction back.  The %fsr is read
	 * again first so that whatever the two operations above
	 * accrued in it is kept.
	 */
	st	%fsr, [%fp + BIAS - 4]
	ld	[%fp + BIAS - 4], %l6
	andn	%l6, %l3, %l6		! %l6 = %fsr & ~FSR_RD;
	or	%l5, %l6, %l5		! %l5 |= %l6;
	st	%l5, [%fp + BIAS - 4]
	ld	[%fp + BIAS - 4], %fsr	! restore %fsr, leaving accrued stuff

	/*
	 * Give the integer part the sign of val.  This needs another
	 * round trip through memory, so it is skipped when val has its
	 * sign bit clear.
	 */
	btst	%l1, %i0
	be	1f
	 nop
	st	%f4, [%fp + BIAS - 16]
	ld	[%fp + BIAS - 16], %g1
	or	%l1, %g1, %g1		! set the sign bit in the high word
	st	%g1, [%fp + BIAS - 16]
	ld	[%fp + BIAS - 16], %f4
1:

	/*
	 * %f4:f5 is now the integer portion of the argument.  Store it
	 * in *iptr, then return val minus the integer portion.
	 */
	std	%f4, [%i2]		! *iptr = %f4:f5;
	std	%i0, [%fp + BIAS - 16]
	ldd	[%fp + BIAS - 16], %f0	! %f0:f1 = val;
	fsubd	%f0, %f4, %f0		! %f0:f1 -= %f4:f5;
	ret
	 restore

Lbig:
	/*
	 * We get here if the comparison of v to 2^52 came out greater,
	 * equal or unordered.  The integer part is then the original
	 * value and the fractional part is 0.
	 *
	 * val is still only in %i0:%i1 at this point (%f0:f1 is not
	 * loaded on this path), so *iptr is written from the integer
	 * registers, high word first.
	 */
	st	%i0, [%i2]		! *iptr = val; (high word)
	st	%i1, [%i2 + 4]		!              (low word)
#ifdef PIC
	PICCY_SET(L0, %l0, %o7)
	ldd	[%l0], %f0		! return 0.0;
#else
	sethi	%hi(L0), %l0
	ldd	[%l0 + %lo(L0)], %f0	! return 0.0;
#endif
	ret
	 restore
202