[b5440cf] | 1 | /*
|
---|
[df4ed85] | 2 | * Copyright (c) 2005 Josef Cejka
|
---|
[c67aff2] | 3 | * Copyright (c) 2011 Petr Koupy
|
---|
[b5440cf] | 4 | * All rights reserved.
|
---|
| 5 | *
|
---|
| 6 | * Redistribution and use in source and binary forms, with or without
|
---|
| 7 | * modification, are permitted provided that the following conditions
|
---|
| 8 | * are met:
|
---|
| 9 | *
|
---|
| 10 | * - Redistributions of source code must retain the above copyright
|
---|
| 11 | * notice, this list of conditions and the following disclaimer.
|
---|
| 12 | * - Redistributions in binary form must reproduce the above copyright
|
---|
| 13 | * notice, this list of conditions and the following disclaimer in the
|
---|
| 14 | * documentation and/or other materials provided with the distribution.
|
---|
| 15 | * - The name of the author may not be used to endorse or promote products
|
---|
| 16 | * derived from this software without specific prior written permission.
|
---|
| 17 | *
|
---|
| 18 | * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
|
---|
| 19 | * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
---|
| 20 | * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
---|
| 21 | * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
|
---|
| 22 | * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
|
---|
| 23 | * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
---|
| 24 | * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
---|
| 25 | * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
---|
| 26 | * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
|
---|
| 27 | * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
---|
| 28 | */
|
---|
| 29 |
|
---|
[750636a] | 30 | /** @addtogroup softfloat
|
---|
[846848a6] | 31 | * @{
|
---|
| 32 | */
|
---|
[c67aff2] | 33 | /** @file Division functions.
|
---|
[846848a6] | 34 | */
|
---|
| 35 |
|
---|
[2416085] | 36 | #include "add.h"
|
---|
| 37 | #include "div.h"
|
---|
| 38 | #include "comparison.h"
|
---|
| 39 | #include "mul.h"
|
---|
| 40 | #include "common.h"
|
---|
[b5440cf] | 41 |
|
---|
[88d5c1e] | 42 | /** Divide two single-precision floats.
|
---|
| 43 | *
|
---|
[c67aff2] | 44 | * @param a Nominator.
|
---|
| 45 | * @param b Denominator.
|
---|
[88d5c1e] | 46 | *
|
---|
[c67aff2] | 47 | * @return Result of division.
|
---|
[88d5c1e] | 48 | *
|
---|
[c67aff2] | 49 | */
|
---|
[88d5c1e] | 50 | float32 div_float32(float32 a, float32 b)
|
---|
[12c6f2d] | 51 | {
|
---|
[1266543] | 52 | float32 result;
|
---|
[aa59fa0] | 53 | int32_t aexp, bexp, cexp;
|
---|
| 54 | uint64_t afrac, bfrac, cfrac;
|
---|
[a35b458] | 55 |
|
---|
[1266543] | 56 | result.parts.sign = a.parts.sign ^ b.parts.sign;
|
---|
[a35b458] | 57 |
|
---|
[88d5c1e] | 58 | if (is_float32_nan(a)) {
|
---|
| 59 | if (is_float32_signan(a)) {
|
---|
| 60 | // FIXME: SigNaN
|
---|
[1266543] | 61 | }
|
---|
[88d5c1e] | 62 | /* NaN */
|
---|
[1266543] | 63 | return a;
|
---|
| 64 | }
|
---|
[a35b458] | 65 |
|
---|
[88d5c1e] | 66 | if (is_float32_nan(b)) {
|
---|
| 67 | if (is_float32_signan(b)) {
|
---|
| 68 | // FIXME: SigNaN
|
---|
[1266543] | 69 | }
|
---|
[88d5c1e] | 70 | /* NaN */
|
---|
[1266543] | 71 | return b;
|
---|
| 72 | }
|
---|
[a35b458] | 73 |
|
---|
[88d5c1e] | 74 | if (is_float32_infinity(a)) {
|
---|
| 75 | if (is_float32_infinity(b)) {
|
---|
[1266543] | 76 | /*FIXME: inf / inf */
|
---|
[88d5c1e] | 77 | result.bin = FLOAT32_NAN;
|
---|
[1266543] | 78 | return result;
|
---|
| 79 | }
|
---|
| 80 | /* inf / num */
|
---|
| 81 | result.parts.exp = a.parts.exp;
|
---|
| 82 | result.parts.fraction = a.parts.fraction;
|
---|
| 83 | return result;
|
---|
| 84 | }
|
---|
[a35b458] | 85 |
|
---|
[88d5c1e] | 86 | if (is_float32_infinity(b)) {
|
---|
| 87 | if (is_float32_zero(a)) {
|
---|
[1266543] | 88 | /* FIXME 0 / inf */
|
---|
| 89 | result.parts.exp = 0;
|
---|
| 90 | result.parts.fraction = 0;
|
---|
| 91 | return result;
|
---|
| 92 | }
|
---|
| 93 | /* FIXME: num / inf*/
|
---|
| 94 | result.parts.exp = 0;
|
---|
| 95 | result.parts.fraction = 0;
|
---|
| 96 | return result;
|
---|
| 97 | }
|
---|
[a35b458] | 98 |
|
---|
[88d5c1e] | 99 | if (is_float32_zero(b)) {
|
---|
| 100 | if (is_float32_zero(a)) {
|
---|
[1266543] | 101 | /*FIXME: 0 / 0*/
|
---|
[88d5c1e] | 102 | result.bin = FLOAT32_NAN;
|
---|
[1266543] | 103 | return result;
|
---|
| 104 | }
|
---|
| 105 | /* FIXME: division by zero */
|
---|
| 106 | result.parts.exp = 0;
|
---|
| 107 | result.parts.fraction = 0;
|
---|
| 108 | return result;
|
---|
| 109 | }
|
---|
[a35b458] | 110 |
|
---|
[1266543] | 111 | afrac = a.parts.fraction;
|
---|
| 112 | aexp = a.parts.exp;
|
---|
| 113 | bfrac = b.parts.fraction;
|
---|
| 114 | bexp = b.parts.exp;
|
---|
[a35b458] | 115 |
|
---|
[1266543] | 116 | /* denormalized numbers */
|
---|
| 117 | if (aexp == 0) {
|
---|
| 118 | if (afrac == 0) {
|
---|
[c67aff2] | 119 | result.parts.exp = 0;
|
---|
| 120 | result.parts.fraction = 0;
|
---|
| 121 | return result;
|
---|
[1266543] | 122 | }
|
---|
[a35b458] | 123 |
|
---|
[1266543] | 124 | /* normalize it*/
|
---|
| 125 | afrac <<= 1;
|
---|
[88d5c1e] | 126 | /* afrac is nonzero => it must stop */
|
---|
[c67aff2] | 127 | while (!(afrac & FLOAT32_HIDDEN_BIT_MASK)) {
|
---|
[1266543] | 128 | afrac <<= 1;
|
---|
| 129 | aexp--;
|
---|
| 130 | }
|
---|
| 131 | }
|
---|
[a35b458] | 132 |
|
---|
[1266543] | 133 | if (bexp == 0) {
|
---|
| 134 | bfrac <<= 1;
|
---|
[88d5c1e] | 135 | /* bfrac is nonzero => it must stop */
|
---|
[c67aff2] | 136 | while (!(bfrac & FLOAT32_HIDDEN_BIT_MASK)) {
|
---|
[1266543] | 137 | bfrac <<= 1;
|
---|
| 138 | bexp--;
|
---|
| 139 | }
|
---|
| 140 | }
|
---|
[a35b458] | 141 |
|
---|
[88d5c1e] | 142 | afrac = (afrac | FLOAT32_HIDDEN_BIT_MASK) << (32 - FLOAT32_FRACTION_SIZE - 1);
|
---|
| 143 | bfrac = (bfrac | FLOAT32_HIDDEN_BIT_MASK) << (32 - FLOAT32_FRACTION_SIZE);
|
---|
[a35b458] | 144 |
|
---|
[c67aff2] | 145 | if (bfrac <= (afrac << 1)) {
|
---|
[1266543] | 146 | afrac >>= 1;
|
---|
| 147 | aexp++;
|
---|
| 148 | }
|
---|
[a35b458] | 149 |
|
---|
[1266543] | 150 | cexp = aexp - bexp + FLOAT32_BIAS - 2;
|
---|
[a35b458] | 151 |
|
---|
[1266543] | 152 | cfrac = (afrac << 32) / bfrac;
|
---|
[1b20da0] | 153 | if ((cfrac & 0x3F) == 0) {
|
---|
[c67aff2] | 154 | cfrac |= (bfrac * cfrac != afrac << 32);
|
---|
[1266543] | 155 | }
|
---|
[a35b458] | 156 |
|
---|
[1266543] | 157 | /* pack and round */
|
---|
[a35b458] | 158 |
|
---|
[e6a40ac] | 159 | /* find first nonzero digit and shift result and detect possibly underflow */
|
---|
[c67aff2] | 160 | while ((cexp > 0) && (cfrac) && (!(cfrac & (FLOAT32_HIDDEN_BIT_MASK << 7)))) {
|
---|
[1266543] | 161 | cexp--;
|
---|
| 162 | cfrac <<= 1;
|
---|
[c67aff2] | 163 | /* TODO: fix underflow */
|
---|
| 164 | }
|
---|
[a35b458] | 165 |
|
---|
[1266543] | 166 | cfrac += (0x1 << 6); /* FIXME: 7 is not sure*/
|
---|
[a35b458] | 167 |
|
---|
[1266543] | 168 | if (cfrac & (FLOAT32_HIDDEN_BIT_MASK << 7)) {
|
---|
| 169 | ++cexp;
|
---|
| 170 | cfrac >>= 1;
|
---|
[88d5c1e] | 171 | }
|
---|
[a35b458] | 172 |
|
---|
[1266543] | 173 | /* check overflow */
|
---|
[c67aff2] | 174 | if (cexp >= FLOAT32_MAX_EXPONENT) {
|
---|
[1266543] | 175 | /* FIXME: overflow, return infinity */
|
---|
| 176 | result.parts.exp = FLOAT32_MAX_EXPONENT;
|
---|
| 177 | result.parts.fraction = 0;
|
---|
| 178 | return result;
|
---|
| 179 | }
|
---|
[a35b458] | 180 |
|
---|
[1266543] | 181 | if (cexp < 0) {
|
---|
| 182 | /* FIXME: underflow */
|
---|
| 183 | result.parts.exp = 0;
|
---|
| 184 | if ((cexp + FLOAT32_FRACTION_SIZE) < 0) {
|
---|
| 185 | result.parts.fraction = 0;
|
---|
| 186 | return result;
|
---|
| 187 | }
|
---|
| 188 | cfrac >>= 1;
|
---|
| 189 | while (cexp < 0) {
|
---|
[c67aff2] | 190 | cexp++;
|
---|
[1266543] | 191 | cfrac >>= 1;
|
---|
[88d5c1e] | 192 | }
|
---|
[1266543] | 193 | } else {
|
---|
[c67aff2] | 194 | result.parts.exp = (uint32_t) cexp;
|
---|
[1266543] | 195 | }
|
---|
[a35b458] | 196 |
|
---|
[1b20da0] | 197 | result.parts.fraction = ((cfrac >> 6) & (~FLOAT32_HIDDEN_BIT_MASK));
|
---|
[a35b458] | 198 |
|
---|
[88d5c1e] | 199 | return result;
|
---|
[12c6f2d] | 200 | }
|
---|
[b5440cf] | 201 |
|
---|
[88d5c1e] | 202 | /** Divide two double-precision floats.
|
---|
[c67aff2] | 203 | *
|
---|
| 204 | * @param a Nominator.
|
---|
| 205 | * @param b Denominator.
|
---|
[88d5c1e] | 206 | *
|
---|
[c67aff2] | 207 | * @return Result of division.
|
---|
[88d5c1e] | 208 | *
|
---|
[c67aff2] | 209 | */
|
---|
[1b20da0] | 210 | float64 div_float64(float64 a, float64 b)
|
---|
[e6a40ac] | 211 | {
|
---|
| 212 | float64 result;
|
---|
[aa59fa0] | 213 | int64_t aexp, bexp, cexp;
|
---|
[1b20da0] | 214 | uint64_t afrac, bfrac, cfrac;
|
---|
[aa59fa0] | 215 | uint64_t remlo, remhi;
|
---|
[c67aff2] | 216 | uint64_t tmplo, tmphi;
|
---|
[a35b458] | 217 |
|
---|
[e6a40ac] | 218 | result.parts.sign = a.parts.sign ^ b.parts.sign;
|
---|
[a35b458] | 219 |
|
---|
[88d5c1e] | 220 | if (is_float64_nan(a)) {
|
---|
| 221 | if (is_float64_signan(b)) {
|
---|
| 222 | // FIXME: SigNaN
|
---|
[f1f95f2] | 223 | return b;
|
---|
| 224 | }
|
---|
[a35b458] | 225 |
|
---|
[88d5c1e] | 226 | if (is_float64_signan(a)) {
|
---|
| 227 | // FIXME: SigNaN
|
---|
[e6a40ac] | 228 | }
|
---|
[88d5c1e] | 229 | /* NaN */
|
---|
[e6a40ac] | 230 | return a;
|
---|
| 231 | }
|
---|
[a35b458] | 232 |
|
---|
[88d5c1e] | 233 | if (is_float64_nan(b)) {
|
---|
| 234 | if (is_float64_signan(b)) {
|
---|
| 235 | // FIXME: SigNaN
|
---|
[e6a40ac] | 236 | }
|
---|
[88d5c1e] | 237 | /* NaN */
|
---|
[e6a40ac] | 238 | return b;
|
---|
| 239 | }
|
---|
[a35b458] | 240 |
|
---|
[88d5c1e] | 241 | if (is_float64_infinity(a)) {
|
---|
| 242 | if (is_float64_infinity(b) || is_float64_zero(b)) {
|
---|
| 243 | // FIXME: inf / inf
|
---|
| 244 | result.bin = FLOAT64_NAN;
|
---|
[e6a40ac] | 245 | return result;
|
---|
| 246 | }
|
---|
| 247 | /* inf / num */
|
---|
| 248 | result.parts.exp = a.parts.exp;
|
---|
| 249 | result.parts.fraction = a.parts.fraction;
|
---|
| 250 | return result;
|
---|
| 251 | }
|
---|
[a35b458] | 252 |
|
---|
[88d5c1e] | 253 | if (is_float64_infinity(b)) {
|
---|
| 254 | if (is_float64_zero(a)) {
|
---|
[e6a40ac] | 255 | /* FIXME 0 / inf */
|
---|
| 256 | result.parts.exp = 0;
|
---|
| 257 | result.parts.fraction = 0;
|
---|
| 258 | return result;
|
---|
| 259 | }
|
---|
| 260 | /* FIXME: num / inf*/
|
---|
| 261 | result.parts.exp = 0;
|
---|
| 262 | result.parts.fraction = 0;
|
---|
| 263 | return result;
|
---|
| 264 | }
|
---|
[a35b458] | 265 |
|
---|
[88d5c1e] | 266 | if (is_float64_zero(b)) {
|
---|
| 267 | if (is_float64_zero(a)) {
|
---|
[e6a40ac] | 268 | /*FIXME: 0 / 0*/
|
---|
[88d5c1e] | 269 | result.bin = FLOAT64_NAN;
|
---|
[e6a40ac] | 270 | return result;
|
---|
| 271 | }
|
---|
| 272 | /* FIXME: division by zero */
|
---|
| 273 | result.parts.exp = 0;
|
---|
| 274 | result.parts.fraction = 0;
|
---|
| 275 | return result;
|
---|
| 276 | }
|
---|
[a35b458] | 277 |
|
---|
[e6a40ac] | 278 | afrac = a.parts.fraction;
|
---|
| 279 | aexp = a.parts.exp;
|
---|
| 280 | bfrac = b.parts.fraction;
|
---|
| 281 | bexp = b.parts.exp;
|
---|
[a35b458] | 282 |
|
---|
[e6a40ac] | 283 | /* denormalized numbers */
|
---|
| 284 | if (aexp == 0) {
|
---|
| 285 | if (afrac == 0) {
|
---|
[f1f95f2] | 286 | result.parts.exp = 0;
|
---|
| 287 | result.parts.fraction = 0;
|
---|
| 288 | return result;
|
---|
[e6a40ac] | 289 | }
|
---|
[a35b458] | 290 |
|
---|
[e6a40ac] | 291 | /* normalize it*/
|
---|
[f1f95f2] | 292 | aexp++;
|
---|
[1b20da0] | 293 | /* afrac is nonzero => it must stop */
|
---|
[c67aff2] | 294 | while (!(afrac & FLOAT64_HIDDEN_BIT_MASK)) {
|
---|
[e6a40ac] | 295 | afrac <<= 1;
|
---|
| 296 | aexp--;
|
---|
| 297 | }
|
---|
| 298 | }
|
---|
[a35b458] | 299 |
|
---|
[e6a40ac] | 300 | if (bexp == 0) {
|
---|
[f1f95f2] | 301 | bexp++;
|
---|
[1b20da0] | 302 | /* bfrac is nonzero => it must stop */
|
---|
[c67aff2] | 303 | while (!(bfrac & FLOAT64_HIDDEN_BIT_MASK)) {
|
---|
[e6a40ac] | 304 | bfrac <<= 1;
|
---|
| 305 | bexp--;
|
---|
| 306 | }
|
---|
| 307 | }
|
---|
[a35b458] | 308 |
|
---|
[88d5c1e] | 309 | afrac = (afrac | FLOAT64_HIDDEN_BIT_MASK) << (64 - FLOAT64_FRACTION_SIZE - 2);
|
---|
| 310 | bfrac = (bfrac | FLOAT64_HIDDEN_BIT_MASK) << (64 - FLOAT64_FRACTION_SIZE - 1);
|
---|
[a35b458] | 311 |
|
---|
[c67aff2] | 312 | if (bfrac <= (afrac << 1)) {
|
---|
[e6a40ac] | 313 | afrac >>= 1;
|
---|
| 314 | aexp++;
|
---|
| 315 | }
|
---|
[a35b458] | 316 |
|
---|
[1b20da0] | 317 | cexp = aexp - bexp + FLOAT64_BIAS - 2;
|
---|
[a35b458] | 318 |
|
---|
[c67aff2] | 319 | cfrac = div128est(afrac, 0x0ll, bfrac);
|
---|
[a35b458] | 320 |
|
---|
[c67aff2] | 321 | if ((cfrac & 0x1FF) <= 2) {
|
---|
| 322 | mul64(bfrac, cfrac, &tmphi, &tmplo);
|
---|
| 323 | sub128(afrac, 0x0ll, tmphi, tmplo, &remhi, &remlo);
|
---|
[a35b458] | 324 |
|
---|
[aa59fa0] | 325 | while ((int64_t) remhi < 0) {
|
---|
[e6a40ac] | 326 | cfrac--;
|
---|
[c67aff2] | 327 | add128(remhi, remlo, 0x0ll, bfrac, &remhi, &remlo);
|
---|
[e6a40ac] | 328 | }
|
---|
[c67aff2] | 329 | cfrac |= (remlo != 0);
|
---|
[e6a40ac] | 330 | }
|
---|
[a35b458] | 331 |
|
---|
[e979fea] | 332 | /* round and shift */
|
---|
[88d5c1e] | 333 | result = finish_float64(cexp, cfrac, result.parts.sign);
|
---|
[e979fea] | 334 | return result;
|
---|
[e6a40ac] | 335 | }
|
---|
| 336 |
|
---|
[88d5c1e] | 337 | /** Divide two quadruple-precision floats.
|
---|
[c67aff2] | 338 | *
|
---|
| 339 | * @param a Nominator.
|
---|
| 340 | * @param b Denominator.
|
---|
[88d5c1e] | 341 | *
|
---|
[c67aff2] | 342 | * @return Result of division.
|
---|
[88d5c1e] | 343 | *
|
---|
[c67aff2] | 344 | */
|
---|
[88d5c1e] | 345 | float128 div_float128(float128 a, float128 b)
|
---|
[e6a40ac] | 346 | {
|
---|
[c67aff2] | 347 | float128 result;
|
---|
| 348 | int64_t aexp, bexp, cexp;
|
---|
| 349 | uint64_t afrac_hi, afrac_lo, bfrac_hi, bfrac_lo, cfrac_hi, cfrac_lo;
|
---|
| 350 | uint64_t shift_out;
|
---|
| 351 | uint64_t rem_hihi, rem_hilo, rem_lohi, rem_lolo;
|
---|
| 352 | uint64_t tmp_hihi, tmp_hilo, tmp_lohi, tmp_lolo;
|
---|
[a35b458] | 353 |
|
---|
[c67aff2] | 354 | result.parts.sign = a.parts.sign ^ b.parts.sign;
|
---|
[a35b458] | 355 |
|
---|
[88d5c1e] | 356 | if (is_float128_nan(a)) {
|
---|
| 357 | if (is_float128_signan(b)) {
|
---|
| 358 | // FIXME: SigNaN
|
---|
[c67aff2] | 359 | return b;
|
---|
| 360 | }
|
---|
[a35b458] | 361 |
|
---|
[88d5c1e] | 362 | if (is_float128_signan(a)) {
|
---|
| 363 | // FIXME: SigNaN
|
---|
[c67aff2] | 364 | }
|
---|
[88d5c1e] | 365 | /* NaN */
|
---|
[c67aff2] | 366 | return a;
|
---|
[e6a40ac] | 367 | }
|
---|
[a35b458] | 368 |
|
---|
[88d5c1e] | 369 | if (is_float128_nan(b)) {
|
---|
| 370 | if (is_float128_signan(b)) {
|
---|
| 371 | // FIXME: SigNaN
|
---|
[e6a40ac] | 372 | }
|
---|
[88d5c1e] | 373 | /* NaN */
|
---|
[c67aff2] | 374 | return b;
|
---|
[e6a40ac] | 375 | }
|
---|
[a35b458] | 376 |
|
---|
[88d5c1e] | 377 | if (is_float128_infinity(a)) {
|
---|
| 378 | if (is_float128_infinity(b) || is_float128_zero(b)) {
|
---|
| 379 | // FIXME: inf / inf
|
---|
| 380 | result.bin.hi = FLOAT128_NAN_HI;
|
---|
| 381 | result.bin.lo = FLOAT128_NAN_LO;
|
---|
[c67aff2] | 382 | return result;
|
---|
| 383 | }
|
---|
| 384 | /* inf / num */
|
---|
| 385 | result.parts.exp = a.parts.exp;
|
---|
| 386 | result.parts.frac_hi = a.parts.frac_hi;
|
---|
| 387 | result.parts.frac_lo = a.parts.frac_lo;
|
---|
| 388 | return result;
|
---|
| 389 | }
|
---|
[a35b458] | 390 |
|
---|
[88d5c1e] | 391 | if (is_float128_infinity(b)) {
|
---|
| 392 | if (is_float128_zero(a)) {
|
---|
| 393 | // FIXME 0 / inf
|
---|
[c67aff2] | 394 | result.parts.exp = 0;
|
---|
| 395 | result.parts.frac_hi = 0;
|
---|
| 396 | result.parts.frac_lo = 0;
|
---|
| 397 | return result;
|
---|
| 398 | }
|
---|
[88d5c1e] | 399 | // FIXME: num / inf
|
---|
[c67aff2] | 400 | result.parts.exp = 0;
|
---|
| 401 | result.parts.frac_hi = 0;
|
---|
| 402 | result.parts.frac_lo = 0;
|
---|
| 403 | return result;
|
---|
| 404 | }
|
---|
[a35b458] | 405 |
|
---|
[88d5c1e] | 406 | if (is_float128_zero(b)) {
|
---|
| 407 | if (is_float128_zero(a)) {
|
---|
| 408 | // FIXME: 0 / 0
|
---|
| 409 | result.bin.hi = FLOAT128_NAN_HI;
|
---|
| 410 | result.bin.lo = FLOAT128_NAN_LO;
|
---|
[c67aff2] | 411 | return result;
|
---|
| 412 | }
|
---|
[88d5c1e] | 413 | // FIXME: division by zero
|
---|
[c67aff2] | 414 | result.parts.exp = 0;
|
---|
| 415 | result.parts.frac_hi = 0;
|
---|
| 416 | result.parts.frac_lo = 0;
|
---|
| 417 | return result;
|
---|
| 418 | }
|
---|
[a35b458] | 419 |
|
---|
[c67aff2] | 420 | afrac_hi = a.parts.frac_hi;
|
---|
| 421 | afrac_lo = a.parts.frac_lo;
|
---|
| 422 | aexp = a.parts.exp;
|
---|
| 423 | bfrac_hi = b.parts.frac_hi;
|
---|
| 424 | bfrac_lo = b.parts.frac_lo;
|
---|
| 425 | bexp = b.parts.exp;
|
---|
[a35b458] | 426 |
|
---|
[c67aff2] | 427 | /* denormalized numbers */
|
---|
| 428 | if (aexp == 0) {
|
---|
| 429 | if (eq128(afrac_hi, afrac_lo, 0x0ll, 0x0ll)) {
|
---|
| 430 | result.parts.exp = 0;
|
---|
| 431 | result.parts.frac_hi = 0;
|
---|
| 432 | result.parts.frac_lo = 0;
|
---|
| 433 | return result;
|
---|
| 434 | }
|
---|
[a35b458] | 435 |
|
---|
[c67aff2] | 436 | /* normalize it*/
|
---|
| 437 | aexp++;
|
---|
| 438 | /* afrac is nonzero => it must stop */
|
---|
| 439 | and128(afrac_hi, afrac_lo,
|
---|
| 440 | FLOAT128_HIDDEN_BIT_MASK_HI, FLOAT128_HIDDEN_BIT_MASK_LO,
|
---|
| 441 | &tmp_hihi, &tmp_lolo);
|
---|
| 442 | while (!lt128(0x0ll, 0x0ll, tmp_hihi, tmp_lolo)) {
|
---|
| 443 | lshift128(afrac_hi, afrac_lo, 1, &afrac_hi, &afrac_lo);
|
---|
| 444 | aexp--;
|
---|
| 445 | }
|
---|
| 446 | }
|
---|
[a35b458] | 447 |
|
---|
[c67aff2] | 448 | if (bexp == 0) {
|
---|
| 449 | bexp++;
|
---|
| 450 | /* bfrac is nonzero => it must stop */
|
---|
| 451 | and128(bfrac_hi, bfrac_lo,
|
---|
| 452 | FLOAT128_HIDDEN_BIT_MASK_HI, FLOAT128_HIDDEN_BIT_MASK_LO,
|
---|
| 453 | &tmp_hihi, &tmp_lolo);
|
---|
| 454 | while (!lt128(0x0ll, 0x0ll, tmp_hihi, tmp_lolo)) {
|
---|
| 455 | lshift128(bfrac_hi, bfrac_lo, 1, &bfrac_hi, &bfrac_lo);
|
---|
| 456 | bexp--;
|
---|
| 457 | }
|
---|
| 458 | }
|
---|
[a35b458] | 459 |
|
---|
[c67aff2] | 460 | or128(afrac_hi, afrac_lo,
|
---|
| 461 | FLOAT128_HIDDEN_BIT_MASK_HI, FLOAT128_HIDDEN_BIT_MASK_LO,
|
---|
| 462 | &afrac_hi, &afrac_lo);
|
---|
| 463 | lshift128(afrac_hi, afrac_lo,
|
---|
| 464 | (128 - FLOAT128_FRACTION_SIZE - 1), &afrac_hi, &afrac_lo);
|
---|
| 465 | or128(bfrac_hi, bfrac_lo,
|
---|
| 466 | FLOAT128_HIDDEN_BIT_MASK_HI, FLOAT128_HIDDEN_BIT_MASK_LO,
|
---|
| 467 | &bfrac_hi, &bfrac_lo);
|
---|
| 468 | lshift128(bfrac_hi, bfrac_lo,
|
---|
| 469 | (128 - FLOAT128_FRACTION_SIZE - 1), &bfrac_hi, &bfrac_lo);
|
---|
[a35b458] | 470 |
|
---|
[c67aff2] | 471 | if (le128(bfrac_hi, bfrac_lo, afrac_hi, afrac_lo)) {
|
---|
| 472 | rshift128(afrac_hi, afrac_lo, 1, &afrac_hi, &afrac_lo);
|
---|
| 473 | aexp++;
|
---|
| 474 | }
|
---|
[a35b458] | 475 |
|
---|
[c67aff2] | 476 | cexp = aexp - bexp + FLOAT128_BIAS - 2;
|
---|
[a35b458] | 477 |
|
---|
[c67aff2] | 478 | cfrac_hi = div128est(afrac_hi, afrac_lo, bfrac_hi);
|
---|
[a35b458] | 479 |
|
---|
[c67aff2] | 480 | mul128(bfrac_hi, bfrac_lo, 0x0ll, cfrac_hi,
|
---|
| 481 | &tmp_lolo /* dummy */, &tmp_hihi, &tmp_hilo, &tmp_lohi);
|
---|
[a35b458] | 482 |
|
---|
[7c3fb9b] | 483 | /*
|
---|
| 484 | * sub192(afrac_hi, afrac_lo, 0,
|
---|
[c67aff2] | 485 | * tmp_hihi, tmp_hilo, tmp_lohi
|
---|
[7c3fb9b] | 486 | * &rem_hihi, &rem_hilo, &rem_lohi);
|
---|
| 487 | */
|
---|
[c67aff2] | 488 | sub128(afrac_hi, afrac_lo, tmp_hihi, tmp_hilo, &rem_hihi, &rem_hilo);
|
---|
| 489 | if (tmp_lohi > 0) {
|
---|
| 490 | sub128(rem_hihi, rem_hilo, 0x0ll, 0x1ll, &rem_hihi, &rem_hilo);
|
---|
| 491 | }
|
---|
| 492 | rem_lohi = -tmp_lohi;
|
---|
[a35b458] | 493 |
|
---|
[c67aff2] | 494 | while ((int64_t) rem_hihi < 0) {
|
---|
| 495 | --cfrac_hi;
|
---|
[7c3fb9b] | 496 | /*
|
---|
| 497 | * add192(rem_hihi, rem_hilo, rem_lohi,
|
---|
[c67aff2] | 498 | * 0, bfrac_hi, bfrac_lo,
|
---|
[7c3fb9b] | 499 | * &rem_hihi, &rem_hilo, &rem_lohi);
|
---|
| 500 | */
|
---|
[c67aff2] | 501 | add128(rem_hilo, rem_lohi, bfrac_hi, bfrac_lo, &rem_hilo, &rem_lohi);
|
---|
| 502 | if (lt128(rem_hilo, rem_lohi, bfrac_hi, bfrac_lo)) {
|
---|
| 503 | ++rem_hihi;
|
---|
| 504 | }
|
---|
| 505 | }
|
---|
[a35b458] | 506 |
|
---|
[c67aff2] | 507 | cfrac_lo = div128est(rem_hilo, rem_lohi, bfrac_lo);
|
---|
[a35b458] | 508 |
|
---|
[c67aff2] | 509 | if ((cfrac_lo & 0x3FFF) <= 4) {
|
---|
| 510 | mul128(bfrac_hi, bfrac_lo, 0x0ll, cfrac_lo,
|
---|
[88d5c1e] | 511 | &tmp_hihi /* dummy */, &tmp_hilo, &tmp_lohi, &tmp_lolo);
|
---|
[a35b458] | 512 |
|
---|
[7c3fb9b] | 513 | /*
|
---|
| 514 | * sub192(rem_hilo, rem_lohi, 0,
|
---|
[c67aff2] | 515 | * tmp_hilo, tmp_lohi, tmp_lolo,
|
---|
[7c3fb9b] | 516 | * &rem_hilo, &rem_lohi, &rem_lolo);
|
---|
| 517 | */
|
---|
[c67aff2] | 518 | sub128(rem_hilo, rem_lohi, tmp_hilo, tmp_lohi, &rem_hilo, &rem_lohi);
|
---|
| 519 | if (tmp_lolo > 0) {
|
---|
| 520 | sub128(rem_hilo, rem_lohi, 0x0ll, 0x1ll, &rem_hilo, &rem_lohi);
|
---|
| 521 | }
|
---|
| 522 | rem_lolo = -tmp_lolo;
|
---|
[a35b458] | 523 |
|
---|
[c67aff2] | 524 | while ((int64_t) rem_hilo < 0) {
|
---|
| 525 | --cfrac_lo;
|
---|
[7c3fb9b] | 526 | /*
|
---|
| 527 | * add192(rem_hilo, rem_lohi, rem_lolo,
|
---|
[c67aff2] | 528 | * 0, bfrac_hi, bfrac_lo,
|
---|
[7c3fb9b] | 529 | * &rem_hilo, &rem_lohi, &rem_lolo);
|
---|
| 530 | */
|
---|
[c67aff2] | 531 | add128(rem_lohi, rem_lolo, bfrac_hi, bfrac_lo, &rem_lohi, &rem_lolo);
|
---|
| 532 | if (lt128(rem_lohi, rem_lolo, bfrac_hi, bfrac_lo)) {
|
---|
| 533 | ++rem_hilo;
|
---|
| 534 | }
|
---|
| 535 | }
|
---|
[a35b458] | 536 |
|
---|
[1433ecda] | 537 | cfrac_lo |= ((rem_hilo | rem_lohi | rem_lolo) != 0);
|
---|
[c67aff2] | 538 | }
|
---|
[a35b458] | 539 |
|
---|
[c67aff2] | 540 | shift_out = cfrac_lo << (64 - (128 - FLOAT128_FRACTION_SIZE - 1));
|
---|
| 541 | rshift128(cfrac_hi, cfrac_lo, (128 - FLOAT128_FRACTION_SIZE - 1),
|
---|
| 542 | &cfrac_hi, &cfrac_lo);
|
---|
[a35b458] | 543 |
|
---|
[88d5c1e] | 544 | result = finish_float128(cexp, cfrac_hi, cfrac_lo, result.parts.sign, shift_out);
|
---|
[e6a40ac] | 545 | return result;
|
---|
| 546 | }
|
---|
| 547 |
|
---|
[c0c38c7c] | 548 | #ifdef float32_t
|
---|
| 549 |
|
---|
| 550 | float32_t __divsf3(float32_t a, float32_t b)
|
---|
| 551 | {
|
---|
| 552 | float32_u ua;
|
---|
| 553 | ua.val = a;
|
---|
[a35b458] | 554 |
|
---|
[c0c38c7c] | 555 | float32_u ub;
|
---|
| 556 | ub.val = b;
|
---|
[a35b458] | 557 |
|
---|
[c0c38c7c] | 558 | float32_u res;
|
---|
| 559 | res.data = div_float32(ua.data, ub.data);
|
---|
[a35b458] | 560 |
|
---|
[c0c38c7c] | 561 | return res.val;
|
---|
| 562 | }
|
---|
| 563 |
|
---|
| 564 | float32_t __aeabi_fdiv(float32_t a, float32_t b)
|
---|
| 565 | {
|
---|
| 566 | float32_u ua;
|
---|
| 567 | ua.val = a;
|
---|
[a35b458] | 568 |
|
---|
[c0c38c7c] | 569 | float32_u ub;
|
---|
| 570 | ub.val = b;
|
---|
[a35b458] | 571 |
|
---|
[c0c38c7c] | 572 | float32_u res;
|
---|
| 573 | res.data = div_float32(ua.data, ub.data);
|
---|
[a35b458] | 574 |
|
---|
[c0c38c7c] | 575 | return res.val;
|
---|
| 576 | }
|
---|
| 577 |
|
---|
| 578 | #endif
|
---|
| 579 |
|
---|
| 580 | #ifdef float64_t
|
---|
| 581 |
|
---|
| 582 | float64_t __divdf3(float64_t a, float64_t b)
|
---|
| 583 | {
|
---|
| 584 | float64_u ua;
|
---|
| 585 | ua.val = a;
|
---|
[a35b458] | 586 |
|
---|
[c0c38c7c] | 587 | float64_u ub;
|
---|
| 588 | ub.val = b;
|
---|
[a35b458] | 589 |
|
---|
[c0c38c7c] | 590 | float64_u res;
|
---|
| 591 | res.data = div_float64(ua.data, ub.data);
|
---|
[a35b458] | 592 |
|
---|
[c0c38c7c] | 593 | return res.val;
|
---|
| 594 | }
|
---|
| 595 |
|
---|
| 596 | float64_t __aeabi_ddiv(float64_t a, float64_t b)
|
---|
| 597 | {
|
---|
| 598 | float64_u ua;
|
---|
| 599 | ua.val = a;
|
---|
[a35b458] | 600 |
|
---|
[c0c38c7c] | 601 | float64_u ub;
|
---|
| 602 | ub.val = b;
|
---|
[a35b458] | 603 |
|
---|
[c0c38c7c] | 604 | float64_u res;
|
---|
| 605 | res.data = div_float64(ua.data, ub.data);
|
---|
[a35b458] | 606 |
|
---|
[c0c38c7c] | 607 | return res.val;
|
---|
| 608 | }
|
---|
| 609 |
|
---|
| 610 | #endif
|
---|
| 611 |
|
---|
| 612 | #ifdef float128_t
|
---|
| 613 |
|
---|
| 614 | float128_t __divtf3(float128_t a, float128_t b)
|
---|
| 615 | {
|
---|
| 616 | float128_u ua;
|
---|
| 617 | ua.val = a;
|
---|
[a35b458] | 618 |
|
---|
[c0c38c7c] | 619 | float128_u ub;
|
---|
| 620 | ub.val = b;
|
---|
[a35b458] | 621 |
|
---|
[c0c38c7c] | 622 | float128_u res;
|
---|
| 623 | res.data = div_float128(ua.data, ub.data);
|
---|
[a35b458] | 624 |
|
---|
[c0c38c7c] | 625 | return res.val;
|
---|
| 626 | }
|
---|
| 627 |
|
---|
| 628 | void _Qp_div(float128_t *c, float128_t *a, float128_t *b)
|
---|
| 629 | {
|
---|
| 630 | *c = __divtf3(*a, *b);
|
---|
| 631 | }
|
---|
| 632 |
|
---|
| 633 | #endif
|
---|
| 634 |
|
---|
[231a60a] | 635 | /** @}
|
---|
[846848a6] | 636 | */
|
---|