1 1.18 isaki /* $NetBSD: fpu_log.c,v 1.18 2014/01/04 13:23:22 isaki Exp $ */ 2 1.1 briggs 3 1.1 briggs /* 4 1.1 briggs * Copyright (c) 1995 Ken Nakata 5 1.1 briggs * All rights reserved. 6 1.1 briggs * 7 1.1 briggs * Redistribution and use in source and binary forms, with or without 8 1.1 briggs * modification, are permitted provided that the following conditions 9 1.1 briggs * are met: 10 1.1 briggs * 1. Redistributions of source code must retain the above copyright 11 1.1 briggs * notice, this list of conditions and the following disclaimer. 12 1.1 briggs * 2. Redistributions in binary form must reproduce the above copyright 13 1.1 briggs * notice, this list of conditions and the following disclaimer in the 14 1.1 briggs * documentation and/or other materials provided with the distribution. 15 1.1 briggs * 3. Neither the name of the author nor the names of its contributors 16 1.1 briggs * may be used to endorse or promote products derived from this software 17 1.1 briggs * without specific prior written permission. 18 1.1 briggs * 19 1.1 briggs * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 20 1.1 briggs * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 1.1 briggs * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 1.1 briggs * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 23 1.1 briggs * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 1.1 briggs * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 1.1 briggs * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 1.1 briggs * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 1.1 briggs * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 1.1 briggs * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 1.1 briggs * SUCH DAMAGE. 30 1.1 briggs * 31 1.1 briggs * @(#)fpu_log.c 10/8/95 32 1.1 briggs */ 33 1.8 lukem 34 1.8 lukem #include <sys/cdefs.h> 35 1.18 isaki __KERNEL_RCSID(0, "$NetBSD: fpu_log.c,v 1.18 2014/01/04 13:23:22 isaki Exp $"); 36 1.1 briggs 37 1.1 briggs #include <sys/types.h> 38 1.3 briggs #include <sys/systm.h> 39 1.1 briggs 40 1.1 briggs #include "fpu_emulate.h" 41 1.1 briggs 42 1.15 isaki static uint32_t logA6[] = { 0x3FC2499A, 0xB5E4040B }; 43 1.15 isaki static uint32_t logA5[] = { 0xBFC555B5, 0x848CB7DB }; 44 1.15 isaki static uint32_t logA4[] = { 0x3FC99999, 0x987D8730 }; 45 1.15 isaki static uint32_t logA3[] = { 0xBFCFFFFF, 0xFF6F7E97 }; 46 1.15 isaki static uint32_t logA2[] = { 0x3FD55555, 0x555555A4 }; 47 1.15 isaki static uint32_t logA1[] = { 0xBFE00000, 0x00000008 }; 48 1.15 isaki 49 1.15 isaki static uint32_t logB5[] = { 0x3F175496, 0xADD7DAD6 }; 50 1.15 isaki static uint32_t logB4[] = { 0x3F3C71C2, 0xFE80C7E0 }; 51 1.15 isaki static uint32_t logB3[] = { 0x3F624924, 0x928BCCFF }; 52 1.15 isaki static uint32_t logB2[] = { 0x3F899999, 0x999995EC }; 53 1.15 isaki static uint32_t logB1[] = { 0x3FB55555, 0x55555555 }; 54 1.1 briggs 55 1.1 briggs /* sfpn = shortened fp number; can represent only positive numbers */ 56 1.1 briggs static struct sfpn { 57 1.13 isaki int sp_exp; 58 1.15 isaki uint32_t sp_m0, sp_m1; 59 1.1 briggs } logtbl[] = { 60 1.13 isaki { 0x3FFE - 0x3fff, 0xFE03F80FU, 0xE03F80FEU }, 61 1.13 isaki { 0x3FF7 - 0x3fff, 0xFF015358U, 0x833C47E2U }, 62 1.13 isaki { 0x3FFE - 0x3fff, 0xFA232CF2U, 0x52138AC0U }, 63 1.13 isaki { 0x3FF9 - 0x3fff, 0xBDC8D83EU, 0xAD88D549U }, 64 1.13 isaki { 0x3FFE - 0x3fff, 0xF6603D98U, 0x0F6603DAU }, 65 1.13 isaki { 0x3FFA - 0x3fff, 0x9CF43DCFU, 0xF5EAFD48U }, 66 1.13 isaki { 0x3FFE - 0x3fff, 0xF2B9D648U, 0x0F2B9D65U }, 67 1.13 isaki { 0x3FFA - 0x3fff, 0xDA16EB88U, 0xCB8DF614U }, 68 1.13 isaki { 0x3FFE - 0x3fff, 0xEF2EB71FU, 0xC4345238U }, 69 1.13 isaki { 0x3FFB - 0x3fff, 0x8B29B775U, 0x1BD70743U }, 70 1.13 isaki { 0x3FFE - 0x3fff, 0xEBBDB2A5U, 0xC1619C8CU }, 71 1.13 isaki { 0x3FFB - 0x3fff, 0xA8D839F8U, 0x30C1FB49U }, 72 1.13 isaki { 0x3FFE - 0x3fff, 0xE865AC7BU, 0x7603A197U }, 73 1.13 isaki { 0x3FFB - 0x3fff, 0xC61A2EB1U, 0x8CD907ADU }, 74 1.13 isaki { 0x3FFE - 0x3fff, 0xE525982AU, 0xF70C880EU }, 75 1.13 isaki { 0x3FFB - 0x3fff, 0xE2F2A47AU, 0xDE3A18AFU }, 76 1.13 isaki { 0x3FFE - 0x3fff, 0xE1FC780EU, 0x1FC780E2U }, 77 1.13 isaki { 0x3FFB - 0x3fff, 0xFF64898EU, 0xDF55D551U }, 78 1.13 isaki { 0x3FFE - 0x3fff, 0xDEE95C4CU, 0xA037BA57U }, 79 1.13 isaki { 0x3FFC - 0x3fff, 0x8DB956A9U, 0x7B3D0148U }, 80 1.13 isaki { 0x3FFE - 0x3fff, 0xDBEB61EEU, 0xD19C5958U }, 81 1.13 isaki { 0x3FFC - 0x3fff, 0x9B8FE100U, 0xF47BA1DEU }, 82 1.13 isaki { 0x3FFE - 0x3fff, 0xD901B203U, 0x6406C80EU }, 83 1.13 isaki { 0x3FFC - 0x3fff, 0xA9372F1DU, 0x0DA1BD17U }, 84 1.13 isaki { 0x3FFE - 0x3fff, 0xD62B80D6U, 0x2B80D62CU }, 85 1.13 isaki { 0x3FFC - 0x3fff, 0xB6B07F38U, 0xCE90E46BU }, 86 1.13 isaki { 0x3FFE - 0x3fff, 0xD3680D36U, 0x80D3680DU }, 87 1.13 isaki { 0x3FFC - 0x3fff, 0xC3FD0329U, 0x06488481U }, 88 1.13 isaki { 0x3FFE - 0x3fff, 0xD0B69FCBU, 0xD2580D0BU }, 89 1.13 isaki { 0x3FFC - 0x3fff, 0xD11DE0FFU, 0x15AB18CAU }, 90 1.13 isaki { 0x3FFE - 0x3fff, 0xCE168A77U, 0x25080CE1U }, 91 1.13 isaki { 0x3FFC - 0x3fff, 0xDE1433A1U, 0x6C66B150U }, 92 1.13 isaki { 0x3FFE - 0x3fff, 0xCB8727C0U, 0x65C393E0U }, 93 1.13 isaki { 0x3FFC - 0x3fff, 0xEAE10B5AU, 0x7DDC8ADDU }, 94 1.13 isaki { 0x3FFE - 0x3fff, 0xC907DA4EU, 0x871146ADU }, 95 1.13 isaki { 0x3FFC - 0x3fff, 0xF7856E5EU, 0xE2C9B291U }, 96 1.13 isaki { 0x3FFE - 0x3fff, 0xC6980C69U, 0x80C6980CU }, 97 1.13 isaki { 0x3FFD - 0x3fff, 0x82012CA5U, 0xA68206D7U }, 98 1.13 isaki { 0x3FFE - 0x3fff, 0xC4372F85U, 0x5D824CA6U }, 99 1.13 isaki { 0x3FFD - 0x3fff, 0x882C5FCDU, 0x7256A8C5U }, 100 1.13 isaki { 0x3FFE - 0x3fff, 0xC1E4BBD5U, 0x95F6E947U }, 101 1.13 isaki { 0x3FFD - 0x3fff, 0x8E44C60BU, 0x4CCFD7DEU }, 102 1.13 isaki { 0x3FFE - 0x3fff, 0xBFA02FE8U, 0x0BFA02FFU }, 103 1.13 isaki { 0x3FFD - 0x3fff, 0x944AD09EU, 0xF4351AF6U }, 104 1.13 isaki { 0x3FFE - 0x3fff, 0xBD691047U, 0x07661AA3U }, 105 1.13 isaki { 0x3FFD - 0x3fff, 0x9A3EECD4U, 0xC3EAA6B2U }, 106 1.13 isaki { 0x3FFE - 0x3fff, 0xBB3EE721U, 0xA54D880CU }, 107 1.13 isaki { 0x3FFD - 0x3fff, 0xA0218434U, 0x353F1DE8U }, 108 1.13 isaki { 0x3FFE - 0x3fff, 0xB92143FAU, 0x36F5E02EU }, 109 1.13 isaki { 0x3FFD - 0x3fff, 0xA5F2FCABU, 0xBBC506DAU }, 110 1.13 isaki { 0x3FFE - 0x3fff, 0xB70FBB5AU, 0x19BE3659U }, 111 1.13 isaki { 0x3FFD - 0x3fff, 0xABB3B8BAU, 0x2AD362A5U }, 112 1.13 isaki { 0x3FFE - 0x3fff, 0xB509E68AU, 0x9B94821FU }, 113 1.13 isaki { 0x3FFD - 0x3fff, 0xB1641795U, 0xCE3CA97BU }, 114 1.13 isaki { 0x3FFE - 0x3fff, 0xB30F6352U, 0x8917C80BU }, 115 1.13 isaki { 0x3FFD - 0x3fff, 0xB7047551U, 0x5D0F1C61U }, 116 1.13 isaki { 0x3FFE - 0x3fff, 0xB11FD3B8U, 0x0B11FD3CU }, 117 1.13 isaki { 0x3FFD - 0x3fff, 0xBC952AFEU, 0xEA3D13E1U }, 118 1.13 isaki { 0x3FFE - 0x3fff, 0xAF3ADDC6U, 0x80AF3ADEU }, 119 1.13 isaki { 0x3FFD - 0x3fff, 0xC2168ED0U, 0xF458BA4AU }, 120 1.13 isaki { 0x3FFE - 0x3fff, 0xAD602B58U, 0x0AD602B6U }, 121 1.13 isaki { 0x3FFD - 0x3fff, 0xC788F439U, 0xB3163BF1U }, 122 1.13 isaki { 0x3FFE - 0x3fff, 0xAB8F69E2U, 0x8359CD11U }, 123 1.13 isaki { 0x3FFD - 0x3fff, 0xCCECAC08U, 0xBF04565DU }, 124 1.13 isaki { 0x3FFE - 0x3fff, 0xA9C84A47U, 0xA07F5638U }, 125 1.13 isaki { 0x3FFD - 0x3fff, 0xD2420487U, 0x2DD85160U }, 126 1.13 isaki { 0x3FFE - 0x3fff, 0xA80A80A8U, 0x0A80A80BU }, 127 1.13 isaki { 0x3FFD - 0x3fff, 0xD7894992U, 0x3BC3588AU }, 128 1.13 isaki { 0x3FFE - 0x3fff, 0xA655C439U, 0x2D7B73A8U }, 129 1.13 isaki { 0x3FFD - 0x3fff, 0xDCC2C4B4U, 0x9887DACCU }, 130 1.13 isaki { 0x3FFE - 0x3fff, 0xA4A9CF1DU, 0x96833751U }, 131 1.13 isaki { 0x3FFD - 0x3fff, 0xE1EEBD3EU, 0x6D6A6B9EU }, 132 1.13 isaki { 0x3FFE - 0x3fff, 0xA3065E3FU, 0xAE7CD0E0U }, 133 1.13 isaki { 0x3FFD - 0x3fff, 0xE70D785CU, 0x2F9F5BDCU }, 134 1.13 isaki { 0x3FFE - 0x3fff, 0xA16B312EU, 0xA8FC377DU }, 135 1.13 isaki { 0x3FFD - 0x3fff, 0xEC1F392CU, 0x5179F283U }, 136 1.13 isaki { 0x3FFE - 0x3fff, 0x9FD809FDU, 0x809FD80AU }, 137 1.13 isaki { 0x3FFD - 0x3fff, 0xF12440D3U, 0xE36130E6U }, 138 1.13 isaki { 0x3FFE - 0x3fff, 0x9E4CAD23U, 0xDD5F3A20U }, 139 1.13 isaki { 0x3FFD - 0x3fff, 0xF61CCE92U, 0x346600BBU }, 140 1.13 isaki { 0x3FFE - 0x3fff, 0x9CC8E160U, 0xC3FB19B9U }, 141 1.13 isaki { 0x3FFD - 0x3fff, 0xFB091FD3U, 0x8145630AU }, 142 1.13 isaki { 0x3FFE - 0x3fff, 0x9B4C6F9EU, 0xF03A3CAAU }, 143 1.13 isaki { 0x3FFD - 0x3fff, 0xFFE97042U, 0xBFA4C2ADU }, 144 1.13 isaki { 0x3FFE - 0x3fff, 0x99D722DAU, 0xBDE58F06U }, 145 1.13 isaki { 0x3FFE - 0x3fff, 0x825EFCEDU, 0x49369330U }, 146 1.13 isaki { 0x3FFE - 0x3fff, 0x9868C809U, 0x868C8098U }, 147 1.13 isaki { 0x3FFE - 0x3fff, 0x84C37A7AU, 0xB9A905C9U }, 148 1.13 isaki { 0x3FFE - 0x3fff, 0x97012E02U, 0x5C04B809U }, 149 1.13 isaki { 0x3FFE - 0x3fff, 0x87224C2EU, 0x8E645FB7U }, 150 1.13 isaki { 0x3FFE - 0x3fff, 0x95A02568U, 0x095A0257U }, 151 1.13 isaki { 0x3FFE - 0x3fff, 0x897B8CACU, 0x9F7DE298U }, 152 1.13 isaki { 0x3FFE - 0x3fff, 0x94458094U, 0x45809446U }, 153 1.13 isaki { 0x3FFE - 0x3fff, 0x8BCF55DEU, 0xC4CD05FEU }, 154 1.13 isaki { 0x3FFE - 0x3fff, 0x92F11384U, 0x0497889CU }, 155 1.13 isaki { 0x3FFE - 0x3fff, 0x8E1DC0FBU, 0x89E125E5U }, 156 1.13 isaki { 0x3FFE - 0x3fff, 0x91A2B3C4U, 0xD5E6F809U }, 157 1.13 isaki { 0x3FFE - 0x3fff, 0x9066E68CU, 0x955B6C9BU }, 158 1.13 isaki { 0x3FFE - 0x3fff, 0x905A3863U, 0x3E06C43BU }, 159 1.13 isaki { 0x3FFE - 0x3fff, 0x92AADE74U, 0xC7BE59E0U }, 160 1.13 isaki { 0x3FFE - 0x3fff, 0x8F1779D9U, 0xFDC3A219U }, 161 1.13 isaki { 0x3FFE - 0x3fff, 0x94E9BFF6U, 0x15845643U }, 162 1.13 isaki { 0x3FFE - 0x3fff, 0x8DDA5202U, 0x37694809U }, 163 1.13 isaki { 0x3FFE - 0x3fff, 0x9723A1B7U, 0x20134203U }, 164 1.13 isaki { 0x3FFE - 0x3fff, 0x8CA29C04U, 0x6514E023U }, 165 1.13 isaki { 0x3FFE - 0x3fff, 0x995899C8U, 0x90EB8990U }, 166 1.13 isaki { 0x3FFE - 0x3fff, 0x8B70344AU, 0x139BC75AU }, 167 1.13 isaki { 0x3FFE - 0x3fff, 0x9B88BDAAU, 0x3A3DAE2FU }, 168 1.13 isaki { 0x3FFE - 0x3fff, 0x8A42F870U, 0x5669DB46U }, 169 1.13 isaki { 0x3FFE - 0x3fff, 0x9DB4224FU, 0xFFE1157CU }, 170 1.13 isaki { 0x3FFE - 0x3fff, 0x891AC73AU, 0xE9819B50U }, 171 1.13 isaki { 0x3FFE - 0x3fff, 0x9FDADC26U, 0x8B7A12DAU }, 172 1.13 isaki { 0x3FFE - 0x3fff, 0x87F78087U, 0xF78087F8U }, 173 1.13 isaki { 0x3FFE - 0x3fff, 0xA1FCFF17U, 0xCE733BD4U }, 174 1.13 isaki { 0x3FFE - 0x3fff, 0x86D90544U, 0x7A34ACC6U }, 175 1.13 isaki { 0x3FFE - 0x3fff, 0xA41A9E8FU, 0x5446FB9FU }, 176 1.13 isaki { 0x3FFE - 0x3fff, 0x85BF3761U, 0x2CEE3C9BU }, 177 1.13 isaki { 0x3FFE - 0x3fff, 0xA633CD7EU, 0x6771CD8BU }, 178 1.13 isaki { 0x3FFE - 0x3fff, 0x84A9F9C8U, 0x084A9F9DU }, 179 1.13 isaki { 0x3FFE - 0x3fff, 0xA8489E60U, 0x0B435A5EU }, 180 1.13 isaki { 0x3FFE - 0x3fff, 0x83993052U, 0x3FBE3368U }, 181 1.13 isaki { 0x3FFE - 0x3fff, 0xAA59233CU, 0xCCA4BD49U }, 182 1.13 isaki { 0x3FFE - 0x3fff, 0x828CBFBEU, 0xB9A020A3U }, 183 1.13 isaki { 0x3FFE - 0x3fff, 0xAC656DAEU, 0x6BCC4985U }, 184 1.13 isaki { 0x3FFE - 0x3fff, 0x81848DA8U, 0xFAF0D277U }, 185 1.13 isaki { 0x3FFE - 0x3fff, 0xAE6D8EE3U, 0x60BB2468U }, 186 1.13 isaki { 0x3FFE - 0x3fff, 0x80808080U, 0x80808081U }, 187 1.13 isaki { 0x3FFE - 0x3fff, 0xB07197A2U, 0x3C46C654U }, 188 1.1 briggs }; 189 1.1 briggs 190 1.10 dsl static struct fpn *__fpu_logn(struct fpemu *fe); 191 1.1 briggs 192 1.1 briggs /* 193 1.1 briggs * natural log - algorithm taken from Motorola FPSP, 194 1.1 briggs * except this doesn't bother to check for invalid input. 195 1.1 briggs */ 196 1.1 briggs static struct fpn * 197 1.12 dsl __fpu_logn(struct fpemu *fe) 198 1.1 briggs { 199 1.13 isaki static struct fpn X, F, U, V, W, KLOG2; 200 1.13 isaki struct fpn *d; 201 1.13 isaki int i, k; 202 1.13 isaki 203 1.13 isaki CPYFPN(&X, &fe->fe_f2); 204 1.13 isaki 205 1.13 isaki /* see if |X-1| < 1/16 approx. */ 206 1.13 isaki if ((-1 == X.fp_exp && (0xf07d0000U >> (31 - FP_LG)) <= X.fp_mant[0]) || 207 1.13 isaki (0 == X.fp_exp && X.fp_mant[0] <= (0x88410000U >> (31 - FP_LG)))) { 208 1.13 isaki /* log near 1 */ 209 1.6 briggs #if FPE_DEBUG 210 1.13 isaki printf("__fpu_logn: log near 1\n"); 211 1.6 briggs #endif 212 1.1 briggs 213 1.16 isaki fpu_const(&fe->fe_f1, FPU_CONST_1); 214 1.13 isaki /* X+1 */ 215 1.13 isaki d = fpu_add(fe); 216 1.13 isaki CPYFPN(&V, d); 217 1.13 isaki 218 1.13 isaki CPYFPN(&fe->fe_f1, &X); 219 1.16 isaki fpu_const(&fe->fe_f2, FPU_CONST_1); 220 1.13 isaki fe->fe_f2.fp_sign = 1; /* -1.0 */ 221 1.13 isaki /* X-1 */ 222 1.13 isaki d = fpu_add(fe); 223 1.13 isaki CPYFPN(&fe->fe_f1, d); 224 1.13 isaki /* 2(X-1) */ 225 1.13 isaki fe->fe_f1.fp_exp++; /* *= 2 */ 226 1.13 isaki CPYFPN(&fe->fe_f2, &V); 227 1.13 isaki /* U=2(X-1)/(X+1) */ 228 1.13 isaki d = fpu_div(fe); 229 1.13 isaki CPYFPN(&U, d); 230 1.13 isaki CPYFPN(&fe->fe_f1, d); 231 1.13 isaki CPYFPN(&fe->fe_f2, d); 232 1.13 isaki /* V=U*U */ 233 1.13 isaki d = fpu_mul(fe); 234 1.13 isaki CPYFPN(&V, d); 235 1.13 isaki CPYFPN(&fe->fe_f1, d); 236 1.13 isaki CPYFPN(&fe->fe_f2, d); 237 1.13 isaki /* W=V*V */ 238 1.13 isaki d = fpu_mul(fe); 239 1.13 isaki CPYFPN(&W, d); 240 1.13 isaki 241 1.13 isaki /* calculate U+U*V*([B1+W*(B3+W*B5)]+[V*(B2+W*B4)]) */ 242 1.13 isaki 243 1.13 isaki /* B1+W*(B3+W*B5) part */ 244 1.13 isaki CPYFPN(&fe->fe_f1, d); 245 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logB5); 246 1.13 isaki /* W*B5 */ 247 1.13 isaki d = fpu_mul(fe); 248 1.13 isaki CPYFPN(&fe->fe_f1, d); 249 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logB3); 250 1.13 isaki /* B3+W*B5 */ 251 1.13 isaki d = fpu_add(fe); 252 1.13 isaki CPYFPN(&fe->fe_f1, d); 253 1.13 isaki CPYFPN(&fe->fe_f2, &W); 254 1.13 isaki /* W*(B3+W*B5) */ 255 1.13 isaki d = fpu_mul(fe); 256 1.13 isaki CPYFPN(&fe->fe_f1, d); 257 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logB1); 258 1.13 isaki /* B1+W*(B3+W*B5) */ 259 1.13 isaki d = fpu_add(fe); 260 1.13 isaki CPYFPN(&X, d); 261 1.13 isaki 262 1.13 isaki /* [V*(B2+W*B4)] part */ 263 1.13 isaki CPYFPN(&fe->fe_f1, &W); 264 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logB4); 265 1.13 isaki /* W*B4 */ 266 1.13 isaki d = fpu_mul(fe); 267 1.13 isaki CPYFPN(&fe->fe_f1, d); 268 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logB2); 269 1.13 isaki /* B2+W*B4 */ 270 1.13 isaki d = fpu_add(fe); 271 1.13 isaki CPYFPN(&fe->fe_f1, d); 272 1.13 isaki CPYFPN(&fe->fe_f2, &V); 273 1.13 isaki /* V*(B2+W*B4) */ 274 1.13 isaki d = fpu_mul(fe); 275 1.13 isaki CPYFPN(&fe->fe_f1, d); 276 1.13 isaki CPYFPN(&fe->fe_f2, &X); 277 1.13 isaki /* B1+W*(B3+W*B5)+V*(B2+W*B4) */ 278 1.13 isaki d = fpu_add(fe); 279 1.13 isaki CPYFPN(&fe->fe_f1, d); 280 1.13 isaki CPYFPN(&fe->fe_f2, &V); 281 1.13 isaki /* V*(B1+W*(B3+W*B5)+V*(B2+W*B4)) */ 282 1.13 isaki d = fpu_mul(fe); 283 1.13 isaki CPYFPN(&fe->fe_f1, d); 284 1.13 isaki CPYFPN(&fe->fe_f2, &U); 285 1.13 isaki /* U*V*(B1+W*(B3+W*B5)+V*(B2+W*B4)) */ 286 1.13 isaki d = fpu_mul(fe); 287 1.13 isaki CPYFPN(&fe->fe_f1, d); 288 1.13 isaki CPYFPN(&fe->fe_f2, &U); 289 1.13 isaki /* U+U*V*(B1+W*(B3+W*B5)+V*(B2+W*B4)) */ 290 1.13 isaki d = fpu_add(fe); 291 1.13 isaki } else /* the usual case */ { 292 1.6 briggs #if FPE_DEBUG 293 1.13 isaki printf("__fpu_logn: the usual case. X=(%d,%08x,%08x...)\n", 294 1.14 isaki X.fp_exp, X.fp_mant[0], X.fp_mant[1]); 295 1.6 briggs #endif 296 1.1 briggs 297 1.13 isaki k = X.fp_exp; 298 1.13 isaki /* X <- Y */ 299 1.13 isaki X.fp_exp = fe->fe_f2.fp_exp = 0; 300 1.13 isaki 301 1.13 isaki /* get the most significant 7 bits of X */ 302 1.13 isaki F.fp_class = FPC_NUM; 303 1.13 isaki F.fp_sign = 0; 304 1.13 isaki F.fp_exp = X.fp_exp; 305 1.13 isaki F.fp_mant[0] = X.fp_mant[0] & (0xfe000000U >> (31 - FP_LG)); 306 1.13 isaki F.fp_mant[0] |= (0x01000000U >> (31 - FP_LG)); 307 1.13 isaki F.fp_mant[1] = F.fp_mant[2] = 0; 308 1.13 isaki F.fp_sticky = 0; 309 1.1 briggs 310 1.6 briggs #if FPE_DEBUG 311 1.13 isaki printf("__fpu_logn: X=Y*2^k=(%d,%08x,%08x...)*2^%d\n", 312 1.14 isaki fe->fe_f2.fp_exp, fe->fe_f2.fp_mant[0], 313 1.14 isaki fe->fe_f2.fp_mant[1], k); 314 1.13 isaki printf("__fpu_logn: F=(%d,%08x,%08x...)\n", 315 1.14 isaki F.fp_exp, F.fp_mant[0], F.fp_mant[1]); 316 1.6 briggs #endif 317 1.1 briggs 318 1.13 isaki /* index to the table */ 319 1.13 isaki i = (F.fp_mant[0] >> (FP_LG - 7)) & 0x7e; 320 1.1 briggs 321 1.6 briggs #if FPE_DEBUG 322 1.13 isaki printf("__fpu_logn: index to logtbl i=%d(%x)\n", i, i); 323 1.6 briggs #endif 324 1.1 briggs 325 1.13 isaki CPYFPN(&fe->fe_f1, &F); 326 1.13 isaki /* -F */ 327 1.13 isaki fe->fe_f1.fp_sign = 1; 328 1.13 isaki /* Y-F */ 329 1.13 isaki d = fpu_add(fe); 330 1.13 isaki CPYFPN(&fe->fe_f1, d); 331 1.13 isaki 332 1.13 isaki /* fe_f2 = 1/F */ 333 1.13 isaki fe->fe_f2.fp_class = FPC_NUM; 334 1.14 isaki fe->fe_f2.fp_sign = fe->fe_f2.fp_sticky = fe->fe_f2.fp_mant[2] 335 1.14 isaki = 0; 336 1.13 isaki fe->fe_f2.fp_exp = logtbl[i].sp_exp; 337 1.13 isaki fe->fe_f2.fp_mant[0] = (logtbl[i].sp_m0 >> (31 - FP_LG)); 338 1.13 isaki fe->fe_f2.fp_mant[1] = (logtbl[i].sp_m0 << (FP_LG + 1)) | 339 1.14 isaki (logtbl[i].sp_m1 >> (31 - FP_LG)); 340 1.15 isaki fe->fe_f2.fp_mant[2] = 341 1.15 isaki (uint32_t)(logtbl[i].sp_m1 << (FP_LG + 1)); 342 1.1 briggs 343 1.6 briggs #if FPE_DEBUG 344 1.13 isaki printf("__fpu_logn: 1/F=(%d,%08x,%08x...)\n", fe->fe_f2.fp_exp, 345 1.14 isaki fe->fe_f2.fp_mant[0], fe->fe_f2.fp_mant[1]); 346 1.6 briggs #endif 347 1.1 briggs 348 1.13 isaki /* U = (Y-F) * (1/F) */ 349 1.13 isaki d = fpu_mul(fe); 350 1.13 isaki CPYFPN(&U, d); 351 1.13 isaki 352 1.13 isaki /* KLOG2 = K * ln(2) */ 353 1.13 isaki /* fe_f1 == (fpn)k */ 354 1.13 isaki fpu_explode(fe, &fe->fe_f1, FTYPE_LNG, &k); 355 1.16 isaki (void)fpu_const(&fe->fe_f2, FPU_CONST_LN_2); 356 1.6 briggs #if FPE_DEBUG 357 1.14 isaki printf("__fpu_logn: fp(k)=(%d,%08x,%08x...)\n", 358 1.14 isaki fe->fe_f1.fp_exp, 359 1.14 isaki fe->fe_f1.fp_mant[0], fe->fe_f1.fp_mant[1]); 360 1.14 isaki printf("__fpu_logn: ln(2)=(%d,%08x,%08x...)\n", 361 1.14 isaki fe->fe_f2.fp_exp, 362 1.14 isaki fe->fe_f2.fp_mant[0], fe->fe_f2.fp_mant[1]); 363 1.6 briggs #endif 364 1.13 isaki /* K * LOGOF2 */ 365 1.13 isaki d = fpu_mul(fe); 366 1.13 isaki CPYFPN(&KLOG2, d); 367 1.13 isaki 368 1.13 isaki /* V=U*U */ 369 1.13 isaki CPYFPN(&fe->fe_f1, &U); 370 1.13 isaki CPYFPN(&fe->fe_f2, &U); 371 1.13 isaki d = fpu_mul(fe); 372 1.13 isaki CPYFPN(&V, d); 373 1.13 isaki 374 1.13 isaki /* 375 1.13 isaki * approximation of LOG(1+U) by 376 1.13 isaki * (U+V*(A1+V*(A3+V*A5)))+(U*V*(A2+V*(A4+V*A6))) 377 1.13 isaki */ 378 1.13 isaki 379 1.13 isaki /* (U+V*(A1+V*(A3+V*A5))) part */ 380 1.13 isaki CPYFPN(&fe->fe_f1, d); 381 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logA5); 382 1.13 isaki /* V*A5 */ 383 1.13 isaki d = fpu_mul(fe); 384 1.13 isaki 385 1.13 isaki CPYFPN(&fe->fe_f1, d); 386 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logA3); 387 1.13 isaki /* A3+V*A5 */ 388 1.13 isaki d = fpu_add(fe); 389 1.13 isaki 390 1.13 isaki CPYFPN(&fe->fe_f1, d); 391 1.13 isaki CPYFPN(&fe->fe_f2, &V); 392 1.13 isaki /* V*(A3+V*A5) */ 393 1.13 isaki d = fpu_mul(fe); 394 1.13 isaki 395 1.13 isaki CPYFPN(&fe->fe_f1, d); 396 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logA1); 397 1.13 isaki /* A1+V*(A3+V*A5) */ 398 1.13 isaki d = fpu_add(fe); 399 1.13 isaki 400 1.13 isaki CPYFPN(&fe->fe_f1, d); 401 1.13 isaki CPYFPN(&fe->fe_f2, &V); 402 1.13 isaki /* V*(A1+V*(A3+V*A5)) */ 403 1.13 isaki d = fpu_mul(fe); 404 1.13 isaki 405 1.13 isaki CPYFPN(&fe->fe_f1, d); 406 1.13 isaki CPYFPN(&fe->fe_f2, &U); 407 1.13 isaki /* U+V*(A1+V*(A3+V*A5)) */ 408 1.13 isaki d = fpu_add(fe); 409 1.13 isaki 410 1.13 isaki CPYFPN(&X, d); 411 1.13 isaki 412 1.13 isaki /* (U*V*(A2+V*(A4+V*A6))) part */ 413 1.13 isaki CPYFPN(&fe->fe_f1, &V); 414 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logA6); 415 1.13 isaki /* V*A6 */ 416 1.13 isaki d = fpu_mul(fe); 417 1.13 isaki CPYFPN(&fe->fe_f1, d); 418 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logA4); 419 1.13 isaki /* A4+V*A6 */ 420 1.13 isaki d = fpu_add(fe); 421 1.13 isaki CPYFPN(&fe->fe_f1, d); 422 1.13 isaki CPYFPN(&fe->fe_f2, &V); 423 1.13 isaki /* V*(A4+V*A6) */ 424 1.13 isaki d = fpu_mul(fe); 425 1.13 isaki CPYFPN(&fe->fe_f1, d); 426 1.13 isaki fpu_explode(fe, &fe->fe_f2, FTYPE_DBL, logA2); 427 1.13 isaki /* A2+V*(A4+V*A6) */ 428 1.13 isaki d = fpu_add(fe); 429 1.13 isaki CPYFPN(&fe->fe_f1, d); 430 1.13 isaki CPYFPN(&fe->fe_f2, &V); 431 1.13 isaki /* V*(A2+V*(A4+V*A6)) */ 432 1.13 isaki d = fpu_mul(fe); 433 1.13 isaki CPYFPN(&fe->fe_f1, d); 434 1.13 isaki CPYFPN(&fe->fe_f2, &U); 435 1.13 isaki /* U*V*(A2+V*(A4+V*A6)) */ 436 1.13 isaki d = fpu_mul(fe); 437 1.13 isaki CPYFPN(&fe->fe_f1, d); 438 1.13 isaki i++; 439 1.13 isaki /* fe_f2 = logtbl[i+1] (== LOG(F)) */ 440 1.13 isaki fe->fe_f2.fp_class = FPC_NUM; 441 1.14 isaki fe->fe_f2.fp_sign = fe->fe_f2.fp_sticky = fe->fe_f2.fp_mant[2] 442 1.14 isaki = 0; 443 1.13 isaki fe->fe_f2.fp_exp = logtbl[i].sp_exp; 444 1.13 isaki fe->fe_f2.fp_mant[0] = (logtbl[i].sp_m0 >> (31 - FP_LG)); 445 1.13 isaki fe->fe_f2.fp_mant[1] = (logtbl[i].sp_m0 << (FP_LG + 1)) | 446 1.14 isaki (logtbl[i].sp_m1 >> (31 - FP_LG)); 447 1.13 isaki fe->fe_f2.fp_mant[2] = (logtbl[i].sp_m1 << (FP_LG + 1)); 448 1.1 briggs 449 1.6 briggs #if FPE_DEBUG 450 1.14 isaki printf("__fpu_logn: ln(F)=(%d,%08x,%08x,...)\n", 451 1.14 isaki fe->fe_f2.fp_exp, 452 1.14 isaki fe->fe_f2.fp_mant[0], fe->fe_f2.fp_mant[1]); 453 1.6 briggs #endif 454 1.1 briggs 455 1.13 isaki /* LOG(F)+U*V*(A2+V*(A4+V*A6)) */ 456 1.13 isaki d = fpu_add(fe); 457 1.13 isaki CPYFPN(&fe->fe_f1, d); 458 1.13 isaki CPYFPN(&fe->fe_f2, &X); 459 1.13 isaki /* LOG(F)+U+V*(A1+V*(A3+V*A5))+U*V*(A2+V*(A4+V*A6)) */ 460 1.13 isaki d = fpu_add(fe); 461 1.1 briggs 462 1.6 briggs #if FPE_DEBUG 463 1.13 isaki printf("__fpu_logn: ln(Y)=(%c,%d,%08x,%08x,%08x)\n", 464 1.14 isaki d->fp_sign ? '-' : '+', d->fp_exp, 465 1.14 isaki d->fp_mant[0], d->fp_mant[1], d->fp_mant[2]); 466 1.6 briggs #endif 467 1.1 briggs 468 1.13 isaki CPYFPN(&fe->fe_f1, d); 469 1.13 isaki CPYFPN(&fe->fe_f2, &KLOG2); 470 1.13 isaki /* K*LOGOF2+LOG(F)+U+V*(A1+V*(A3+V*A5))+U*V*(A2+V*(A4+V*A6)) */ 471 1.13 isaki d = fpu_add(fe); 472 1.13 isaki } 473 1.1 briggs 474 1.13 isaki return d; 475 1.1 briggs } 476 1.1 briggs 477 1.1 briggs struct fpn * 478 1.11 dsl fpu_log10(struct fpemu *fe) 479 1.1 briggs { 480 1.13 isaki struct fpn *fp = &fe->fe_f2; 481 1.15 isaki uint32_t fpsr; 482 1.1 briggs 483 1.13 isaki fpsr = fe->fe_fpsr & ~FPSR_EXCP; /* clear all exceptions */ 484 1.1 briggs 485 1.13 isaki if (fp->fp_class >= FPC_NUM) { 486 1.13 isaki if (fp->fp_sign) { /* negative number or Inf */ 487 1.13 isaki fp = fpu_newnan(fe); 488 1.13 isaki fpsr |= FPSR_OPERR; 489 1.13 isaki } else if (fp->fp_class == FPC_NUM) { 490 1.13 isaki /* the real work here */ 491 1.13 isaki fp = __fpu_logn(fe); 492 1.13 isaki if (fp != &fe->fe_f1) 493 1.13 isaki CPYFPN(&fe->fe_f1, fp); 494 1.16 isaki (void)fpu_const(&fe->fe_f2, FPU_CONST_LN_10); 495 1.13 isaki fp = fpu_div(fe); 496 1.13 isaki } /* else if fp == +Inf, return +Inf */ 497 1.13 isaki } else if (fp->fp_class == FPC_ZERO) { 498 1.13 isaki /* return -Inf */ 499 1.13 isaki fp->fp_class = FPC_INF; 500 1.13 isaki fp->fp_sign = 1; 501 1.13 isaki fpsr |= FPSR_DZ; 502 1.13 isaki } else if (fp->fp_class == FPC_SNAN) { 503 1.13 isaki fpsr |= FPSR_SNAN; 504 1.13 isaki fp = fpu_newnan(fe); 505 1.13 isaki } else { 506 1.13 isaki fp = fpu_newnan(fe); 507 1.13 isaki } 508 1.1 briggs 509 1.13 isaki fe->fe_fpsr = fpsr; 510 1.1 briggs 511 1.13 isaki return fp; 512 1.1 briggs } 513 1.1 briggs 514 1.1 briggs struct fpn * 515 1.11 dsl fpu_log2(struct fpemu *fe) 516 1.1 briggs { 517 1.13 isaki struct fpn *fp = &fe->fe_f2; 518 1.15 isaki uint32_t fpsr; 519 1.1 briggs 520 1.13 isaki fpsr = fe->fe_fpsr & ~FPSR_EXCP; /* clear all exceptions */ 521 1.1 briggs 522 1.13 isaki if (fp->fp_class >= FPC_NUM) { 523 1.13 isaki if (fp->fp_sign) { /* negative number or Inf */ 524 1.13 isaki fp = fpu_newnan(fe); 525 1.13 isaki fpsr |= FPSR_OPERR; 526 1.13 isaki } else if (fp->fp_class == FPC_NUM) { 527 1.13 isaki /* the real work here */ 528 1.13 isaki if (fp->fp_mant[0] == FP_1 && fp->fp_mant[1] == 0 && 529 1.14 isaki fp->fp_mant[2] == 0) { 530 1.13 isaki /* fp == 2.0 ^ exp <--> log2(fp) == exp */ 531 1.14 isaki fpu_explode(fe, &fe->fe_f3, FTYPE_LNG, 532 1.14 isaki &fp->fp_exp); 533 1.13 isaki fp = &fe->fe_f3; 534 1.13 isaki } else { 535 1.13 isaki fp = __fpu_logn(fe); 536 1.13 isaki if (fp != &fe->fe_f1) 537 1.13 isaki CPYFPN(&fe->fe_f1, fp); 538 1.16 isaki (void)fpu_const(&fe->fe_f2, FPU_CONST_LN_2); 539 1.13 isaki fp = fpu_div(fe); 540 1.13 isaki } 541 1.13 isaki } /* else if fp == +Inf, return +Inf */ 542 1.13 isaki } else if (fp->fp_class == FPC_ZERO) { 543 1.13 isaki /* return -Inf */ 544 1.13 isaki fp->fp_class = FPC_INF; 545 1.13 isaki fp->fp_sign = 1; 546 1.13 isaki fpsr |= FPSR_DZ; 547 1.13 isaki } else if (fp->fp_class == FPC_SNAN) { 548 1.13 isaki fpsr |= FPSR_SNAN; 549 1.13 isaki fp = fpu_newnan(fe); 550 1.13 isaki } else { 551 1.13 isaki fp = fpu_newnan(fe); 552 1.13 isaki } 553 1.1 briggs 554 1.13 isaki fe->fe_fpsr = fpsr; 555 1.13 isaki return fp; 556 1.1 briggs } 557 1.1 briggs 558 1.1 briggs struct fpn * 559 1.11 dsl fpu_logn(struct fpemu *fe) 560 1.1 briggs { 561 1.13 isaki struct fpn *fp = &fe->fe_f2; 562 1.15 isaki uint32_t fpsr; 563 1.1 briggs 564 1.13 isaki fpsr = fe->fe_fpsr & ~FPSR_EXCP; /* clear all exceptions */ 565 1.1 briggs 566 1.13 isaki if (fp->fp_class >= FPC_NUM) { 567 1.13 isaki if (fp->fp_sign) { /* negative number or Inf */ 568 1.13 isaki fp = fpu_newnan(fe); 569 1.13 isaki fpsr |= FPSR_OPERR; 570 1.13 isaki } else if (fp->fp_class == FPC_NUM) { 571 1.13 isaki /* the real work here */ 572 1.13 isaki fp = __fpu_logn(fe); 573 1.13 isaki } /* else if fp == +Inf, return +Inf */ 574 1.13 isaki } else if (fp->fp_class == FPC_ZERO) { 575 1.13 isaki /* return -Inf */ 576 1.13 isaki fp->fp_class = FPC_INF; 577 1.13 isaki fp->fp_sign = 1; 578 1.13 isaki fpsr |= FPSR_DZ; 579 1.13 isaki } else if (fp->fp_class == FPC_SNAN) { 580 1.13 isaki fpsr |= FPSR_SNAN; 581 1.13 isaki fp = fpu_newnan(fe); 582 1.13 isaki } else { 583 1.13 isaki fp = fpu_newnan(fe); 584 1.13 isaki } 585 1.1 briggs 586 1.13 isaki fe->fe_fpsr = fpsr; 587 1.1 briggs 588 1.13 isaki return fp; 589 1.1 briggs } 590 1.1 briggs 591 1.1 briggs struct fpn * 592 1.11 dsl fpu_lognp1(struct fpemu *fe) 593 1.1 briggs { 594 1.13 isaki struct fpn *fp; 595 1.1 briggs 596 1.18 isaki /* if src is +0/-0, return +0/-0 */ 597 1.18 isaki if (ISZERO(&fe->fe_f2)) 598 1.18 isaki return &fe->fe_f2; 599 1.18 isaki 600 1.13 isaki /* build a 1.0 */ 601 1.16 isaki fp = fpu_const(&fe->fe_f1, FPU_CONST_1); 602 1.13 isaki /* fp = 1.0 + f2 */ 603 1.13 isaki fp = fpu_add(fe); 604 1.13 isaki 605 1.13 isaki /* copy the result to the src opr */ 606 1.17 isaki CPYFPN(&fe->fe_f2, fp); 607 1.1 briggs 608 1.13 isaki return fpu_logn(fe); 609 1.1 briggs } 610