OpenXM_contrib/gmp/mpfr/sub1.c - annotate

Return to sub1.c CVS log
Up to [local] / OpenXM_contrib / gmp / mpfr
Annotation of OpenXM_contrib/gmp/mpfr/sub1.c, Revision 1.1.1.1

1.1       ohara       1: /* mpfr_sub1 -- internal function to perform a "real" subtraction
                      2:
                      3: Copyright 2001 Free Software Foundation.
                      4: Contributed by the Spaces project, INRIA Lorraine.
                      5:
                      6: This file is part of the MPFR Library.
                      7:
                      8: The MPFR Library is free software; you can redistribute it and/or modify
                      9: it under the terms of the GNU Lesser General Public License as published by
                     10: the Free Software Foundation; either version 2.1 of the License, or (at your
                     11: option) any later version.
                     12:
                     13: The MPFR Library is distributed in the hope that it will be useful, but
                     14: WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
                     15: or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
                     16: License for more details.
                     17:
                     18: You should have received a copy of the GNU Lesser General Public License
                     19: along with the MPFR Library; see the file COPYING.LIB.  If not, write to
                     20: the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
                     21: MA 02111-1307, USA. */
                     22:
                     23: #include "gmp.h"
                     24: #include "gmp-impl.h"
                     25: #include "mpfr.h"
                     26: #include "mpfr-impl.h"
                     27:
                     28: /* Set |a| to | |b| - |c| | rounded in mode rnd_mode; b and c are swapped
                     29:    internally when |b| < |c|, and a is set to zero when mpfr_cmp2 returns 0.
                     30:    Sign of a: sign * sign(b) if sub is nonzero (sign = mpfr_cmp2 result), else
                     31:    the sign of the operand larger in absolute value.  Returns 0 iff exact,
                     32:    a negative value if a is less than the exact value, positive otherwise. */
                     33:
                     34: int
                     35: mpfr_sub1 (mpfr_ptr a, mpfr_srcptr b, mpfr_srcptr c, mp_rnd_t rnd_mode,
                     36:            int sub)
                     37: {
                     38:   int sign;
                     39:   mp_exp_unsigned_t diff_exp;
                     40:   mp_prec_t cancel, cancel1;
                     41:   mp_size_t cancel2, an, bn, cn, cn0;
                     42:   mp_limb_t *ap, *bp, *cp;
                     43:   mp_limb_t carry, bb, cc, borrow = 0;
                     44:   int inexact = 0, shift_b, shift_c, is_exact = 1, down = 0, add_exp = 0;
                     45:   int sh, k;
                     46:   TMP_DECL(marker);
                     47:
                     48:   TMP_MARK(marker);
                     49:   ap = MPFR_MANT(a);
                     50:   an = 1 + (MPFR_PREC(a) - 1) / BITS_PER_MP_LIMB;
                     51:
                     52:   sign = mpfr_cmp2 (b, c, &cancel); /* sign of |b| - |c|; also sets cancel */
                     53:   if (sign == 0)
                     54:     {
                     55:       if (rnd_mode == GMP_RNDD)
                     56:         MPFR_SET_NEG(a);
                     57:       else
                     58:         MPFR_SET_POS(a);
                     59:       MPFR_SET_ZERO(a);
                     60:       MPFR_RET(0);
                     61:     }
                     62:
                     63:   /* If subtraction: sign(a) = sign * sign(b) */
                     64:   if (sub && MPFR_SIGN(a) != sign * MPFR_SIGN(b))
                     65:     MPFR_CHANGE_SIGN(a);
                     66:
                     67:   if (sign < 0) /* swap b and c so that |b| > |c| */
                     68:     {
                     69:       mpfr_srcptr t;
                     70:       t = b; b = c; c = t;
                     71:     }
                     72:
                     73:   /* If addition: sign(a) = sign of the larger argument in absolute value */
                     74:   if (!sub)
                     75:     MPFR_SET_SAME_SIGN(a, b);
                     76:
                     77:   diff_exp = (mp_exp_unsigned_t) MPFR_EXP(b) - MPFR_EXP(c);
                     78:
                     79:   /* reserve a space to store b aligned with the result, i.e. shifted by
                     80:      (-cancel) % BITS_PER_MP_LIMB to the right */
                     81:   bn = 1 + (MPFR_PREC(b) - 1) / BITS_PER_MP_LIMB;
                     82:   shift_b = cancel % BITS_PER_MP_LIMB;
                     83:   if (shift_b)
                     84:     shift_b = BITS_PER_MP_LIMB - shift_b;
                     85:   cancel1 = (cancel + shift_b) / BITS_PER_MP_LIMB;
                     86:   /* the high cancel1 limbs from b should not be taken into account */
                     87:   if (shift_b == 0)
                     88:     bp = MPFR_MANT(b); /* no need of an extra space */
                     89:   else
                     90:     {
                     91:       bp = TMP_ALLOC ((bn + 1) * BYTES_PER_MP_LIMB);
                     92:       bp[0] = mpn_rshift (bp + 1, MPFR_MANT(b), bn++, shift_b);
                     93:     }
                     94:
                     95:   /* reserve a space to store c aligned with the result, i.e. shifted by
                     96:      (diff_exp-cancel) % BITS_PER_MP_LIMB to the right */
                     97:   cn = 1 + (MPFR_PREC(c) - 1) / BITS_PER_MP_LIMB;
                     98:   shift_c = diff_exp - (cancel % BITS_PER_MP_LIMB);
                     99:   shift_c = (shift_c + BITS_PER_MP_LIMB) % BITS_PER_MP_LIMB;
                    100:   if (shift_c == 0)
                    101:     cp = MPFR_MANT(c);
                    102:   else
                    103:     {
                    104:       cp = TMP_ALLOC ((cn + 1) * BYTES_PER_MP_LIMB);
                    105:       cp[0] = mpn_rshift (cp + 1, MPFR_MANT(c), cn++, shift_c);
                    106:     }
                    107:
                    108: #ifdef DEBUG
                    109:   printf("shift_b=%u shift_c=%u\n", shift_b, shift_c);
                    110: #endif
                    111:
                    112:   /* ensure ap != bp and ap != cp */
                    113:   if (ap == bp)
                    114:     {
                    115:       bp = (mp_ptr) TMP_ALLOC(bn * BYTES_PER_MP_LIMB);
                    116:       MPN_COPY (bp, ap, bn);
                    117:       /* ap == cp cannot occur since we would have b=c, which is detected
                    118:         in mpfr_add or mpfr_sub */
                    119:     }
                    120:   else if (ap == cp)
                    121:     {
                    122:       cp = (mp_ptr) TMP_ALLOC (cn * BYTES_PER_MP_LIMB);
                    123:       MPN_COPY(cp, ap, cn);
                    124:     }
                    125:
                    126:   /* here we have shift_c = (diff_exp - cancel) % BITS_PER_MP_LIMB,
                    127:      thus we want cancel2 = ceil((cancel - diff_exp) / BITS_PER_MP_LIMB) */
                    128:
                    129:   cancel2 = (long int) (cancel - (diff_exp - shift_c)) / BITS_PER_MP_LIMB;
                    130:   /* the high cancel2 limbs from c should not be taken into account */
                    131: #ifdef DEBUG
                    132:   printf("cancel=%u cancel1=%u cancel2=%d\n", cancel, cancel1, cancel2);
                    133: #endif
                    134:
                    135:   /*               ap[an-1]        ap[0]
                    136:              <----------------+-----------|---->
                    137:              <----------PREC(a)----------><-sh->
                    138:  cancel1
                    139:  limbs        bp[bn-cancel1-1]
                    140:  <--...-----><----------------+-----------+----------->
                    141:   cancel2
                    142:   limbs       cp[cn-cancel2-1]                                    cancel2 >= 0
                    143:     <--...--><----------------+----------------+---------------->
                    144:                 (-cancel2)                                        cancel2 < 0
                    145:                    limbs      <----------------+---------------->
                    146:   */
                    147:
                    148:   /* first part: put in ap[0..an-1] the value of high(b) - high(c),
                    149:      where high(b) consists of the high an+cancel1 limbs of b,
                    150:      and high(c) consists of the high an+cancel2 limbs of c.
                    151:    */
                    152:
                    153:   /* copy high(b) into a */
                    154:   if (an + cancel1 <= bn) /* a: <----------------+-----------|---->
                    155:                         b: <-----------------------------------------> */
                    156:       MPN_COPY (ap, bp + bn - (an + cancel1), an);
                    157:   else  /* a: <----------------+-----------|---->
                    158:        b: <-------------------------> */
                    159:     if (cancel1 < bn) /* otherwise b does not overlap with a */
                    160:       {
                    161:        MPN_ZERO (ap, an + cancel1 - bn);
                    162:        MPN_COPY (ap + an + cancel1 - bn, bp, bn - cancel1);
                    163:       }
                    164:     else
                    165:       MPN_ZERO (ap, an);
                    166:
                    167: #ifdef DEBUG
                    168:   printf("after copying high(b), a="); mpfr_print_binary(a); putchar('\n');
                    169: #endif
                    170:
                    171:   /* subtract high(c) */
                    172:   if (an + cancel2 > 0) /* otherwise c does not overlap with a */
                    173:     {
                    174:       mp_limb_t *ap2;
                    175:
                    176:       if (cancel2 >= 0)
                    177:        {
                    178:          if (an + cancel2 <= cn) /* a: <----------------------------->
                    179:                              c: <-----------------------------------------> */
                    180:            mpn_sub_n (ap, ap, cp + cn - (an + cancel2), an);
                    181:          else /* a: <---------------------------->
                    182:              c: <-------------------------> */
                    183:            {
                    184:              ap2 = ap + an + cancel2 - cn;
                    185:              if (cn > cancel2)
                    186:                mpn_sub_n (ap2, ap2, cp, cn - cancel2);
                    187:            }
                    188:        }
                    189:       else /* cancel2 < 0 */
                    190:        {
                    191:          if (an + cancel2 <= cn) /* a: <----------------------------->
                    192:                                          c: <-----------------------------> */
                    193:              borrow = mpn_sub_n (ap, ap, cp + cn - (an + cancel2), an + cancel2);
                    194:          else /* a: <---------------------------->
                    195:                        c: <----------------> */
                    196:            {
                    197:              ap2 = ap + an + cancel2 - cn;
                    198:              borrow = mpn_sub_n (ap2, ap2, cp, cn);
                    199:            }
                    200:          ap2 = ap + an + cancel2;
                    201:          mpn_sub_1 (ap2, ap2, -cancel2, borrow);
                    202:        }
                    203:     }
                    204:
                    205: #ifdef DEBUG
                    206:   printf("after subtracting high(c), a="); mpfr_print_binary(a); putchar('\n');
                    207: #endif
                    208:
                    209:   /* now perform rounding */
                    210:   sh = an * BITS_PER_MP_LIMB - MPFR_PREC(a); /* last unused bits from a */
                    211:   carry = ap[0] & ((MP_LIMB_T_ONE << sh) - MP_LIMB_T_ONE);
                    212:   ap[0] -= carry;
                    213:
                    214:   if (rnd_mode == GMP_RNDN)
                    215:     {
                    216:       if (sh)
                    217:        {
                    218:          is_exact = (carry == 0);
                    219:          /* can decide except when carry = 2^(sh-1) [middle]
                    220:             or carry = 0 [truncate, but cannot decide inexact flag] */
                    221:          down = (carry < (MP_LIMB_T_ONE << (sh - 1)));
                    222:          if (carry > (MP_LIMB_T_ONE << (sh - 1)))
                    223:            goto add_one_ulp;
                    224:          else if ((0 < carry) && down)
                    225:            {
                    226:              inexact = -1; /* result is smaller than exact value */
                    227:              goto truncate;
                    228:            }
                    229:        }
                    230:     }
                    231:   else /* directed rounding: set rnd_mode to RNDZ iff towards zero */
                    232:     {
                    233:       if (((rnd_mode == GMP_RNDD) && (MPFR_SIGN(a) > 0)) ||
                    234:          ((rnd_mode == GMP_RNDU) && (MPFR_SIGN(a) < 0)))
                    235:        rnd_mode = GMP_RNDZ;
                    236:
                    237:       if (carry)
                    238:        {
                    239:          if (rnd_mode == GMP_RNDZ)
                    240:            {
                    241:              inexact = -1;
                    242:              goto truncate;
                    243:            }
                    244:          else /* round away */
                    245:            goto add_one_ulp;
                    246:        }
                    247:     }
                    248:
                    249:   /* we have to consider the low (bn - (an+cancel1)) limbs from b,
                    250:      and the (cn - (an+cancel2)) limbs from c. */
                    251:   bn -= an + cancel1;
                    252:   cn0 = cn;
                    253:   cn -= (long int) an + cancel2;
                    254: #ifdef DEBUG
                    255:   printf("last %d bits from a are %lu, bn=%ld, cn=%ld\n", sh, carry, bn, cn);
                    256: #endif
                    257:
                    258:   for (k = 0; (bn > 0) || (cn > 0); k = 1) /* k == 0 only on the first pass */
                    259:     {
                    260:       bb = (bn > 0) ? bp[--bn] : 0;
                    261:       if ((cn > 0) && (cn-- <= cn0))
                    262:        cc = cp[cn];
                    263:       else
                    264:        cc = 0;
                    265:
                    266:       if (down == 0)
                    267:        down = (bb < cc);
                    268:
                    269:       if ((rnd_mode == GMP_RNDN) && !k && sh == 0)
                    270:        {
                    271:          mp_limb_t half = GMP_LIMB_HIGHBIT;
                    272:
                    273:          is_exact = (bb == cc);
                    274:
                    275:          /* add one ulp if bb > cc + half
                    276:             truncate if cc - half < bb < cc + half
                    277:             sub one ulp if bb < cc - half
                    278:          */
                    279:
                    280:          if (down)
                    281:            {
                    282:              if (cc >= half)
                    283:                cc -= half;
                    284:              else
                    285:                bb += half;
                    286:            }
                    287:          else /* bb >= cc */
                    288:            {
                    289:              if (cc < half)
                    290:                cc += half;
                    291:              else
                    292:                bb -= half;
                    293:            }
                    294:        }
                    295:
                    296: #ifdef DEBUG
                    297:       printf("    bb=%lu cc=%lu down=%d is_exact=%d\n", bb, cc, down, is_exact);
                    298: #endif
                    299:       if (bb < cc)
                    300:        {
                    301:          if (rnd_mode == GMP_RNDZ)
                    302:            goto sub_one_ulp;
                    303:          else if (rnd_mode != GMP_RNDN) /* round away */
                    304:            {
                    305:              inexact = 1;
                    306:              goto truncate;
                    307:            }
                    308:          else /* round to nearest */
                    309:            {
                    310:              if (is_exact && sh == 0)
                    311:                {
                    312:                  inexact = 0;
                    313:                  goto truncate;
                    314:                }
                    315:              else if (down && sh == 0)
                    316:                goto sub_one_ulp;
                    317:              else
                    318:                {
                    319:                  inexact = (is_exact) ? 1 : -1;
                    320:                  goto truncate;
                    321:                }
                    322:            }
                    323:        }
                    324:       else if (bb > cc)
                    325:        {
                    326:          if (rnd_mode == GMP_RNDZ)
                    327:            {
                    328:              inexact = -1;
                    329:              goto truncate;
                    330:            }
                    331:          else if (rnd_mode != GMP_RNDN) /* round away */
                    332:              goto add_one_ulp;
                    333:          else /* round to nearest */
                    334:            {
                    335:              if (is_exact)
                    336:                {
                    337:                  inexact = -1;
                    338:                  goto truncate;
                    339:                }
                    340:              else if (down)
                    341:                {
                    342:                  inexact = 1;
                    343:                  goto truncate;
                    344:                }
                    345:              else
                    346:                goto add_one_ulp;
                    347:            }
                    348:        }
                    349:     }
                    350:
                    351:   if ((rnd_mode == GMP_RNDN) && !is_exact)
                    352:     {
                    353:       /* even rounding rule */
                    354:       if ((ap[0] >> sh) & 1)
                    355:        {
                    356:          if (down) goto sub_one_ulp;
                    357:          else goto add_one_ulp;
                    358:        }
                    359:       else
                    360:        inexact = (down) ? 1 : -1;
                    361:     }
                    362:   else
                    363:     inexact = 0;
                    364:   goto truncate;
                    365:
                    366:  sub_one_ulp: /* subtract one unit in last place from a */
                    367:   mpn_sub_1 (ap, ap, an, MP_LIMB_T_ONE << sh);
                    368:   inexact = -1;
                    369:   goto end_of_sub;
                    370:
                    371:  add_one_ulp: /* add one unit in last place to a */
                    372:   if (mpn_add_1 (ap, ap, an, MP_LIMB_T_ONE << sh)) /* result is a power of 2 */
                    373:     {
                    374:       ap[an-1] = GMP_LIMB_HIGHBIT;
                    375:       add_exp = 1;
                    376:     }
                    377:   inexact = 1; /* result larger than exact value */
                    378:
                    379:  truncate:
                    380:   if ((ap[an-1] >> (BITS_PER_MP_LIMB - 1)) == 0) /* case 1 - epsilon */
                    381:     {
                    382:       ap[an-1] = GMP_LIMB_HIGHBIT;
                    383:       add_exp = 1;
                    384:     }
                    385:
                    386:  end_of_sub:
                    387:   /* we have to set MPFR_EXP(a) to MPFR_EXP(b) - cancel + add_exp, taking
                    388:      care of underflows/overflows in that computation, and of the allowed
                    389:      exponent range */
                    390:   if (cancel)
                    391:     {
                    392:       mp_exp_t exp_b;
                    393:
                    394:       cancel -= add_exp; /* still valid as unsigned long */
                    395:       exp_b = MPFR_EXP(b); /* save it in case a equals b */
                    396:       MPFR_EXP(a) = MPFR_EXP(b) - cancel;
                    397:       if ((MPFR_EXP(a) > exp_b) /* underflow in type mp_exp_t */
                    398:          || (MPFR_EXP(a) < __mpfr_emin))
                    399:        {
                    400:          TMP_FREE(marker);
                    401:          return mpfr_set_underflow (a, rnd_mode, MPFR_SIGN(a));
                    402:        }
                    403:     }
                    404:   else /* cancel = 0: MPFR_EXP(a) <- MPFR_EXP(b) + add_exp */
                    405:     {
                    406:       /* in case cancel = 0, add_exp can still be 1, in case b is just
                    407:         below a power of two, c is very small, prec(a) < prec(b),
                    408:         and rnd=away or nearest */
                    409:       if (add_exp && MPFR_EXP(b) == __mpfr_emax)
                    410:        {
                    411:          TMP_FREE(marker);
                    412:          return mpfr_set_overflow (a, rnd_mode, MPFR_SIGN(a));
                    413:        }
                    414:       MPFR_EXP(a) = MPFR_EXP(b) + add_exp;
                    415:     }
                    416:   TMP_FREE(marker);
                    417: #ifdef DEBUG
                    418:   printf ("result is a="); mpfr_print_binary(a); putchar('\n');
                    419: #endif
                    420:   /* check that result is msb-normalized */
                    421:   MPFR_ASSERTN(ap[an-1] > ~ap[an-1]);
                    422:   return inexact * MPFR_SIGN(a);
                    423: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>