OpenXM_contrib/gmp/mpz/aorsmul_i.c - annotate

Return to aorsmul_i.c CVS log
Up to [local] / OpenXM_contrib / gmp / mpz
Annotation of OpenXM_contrib/gmp/mpz/aorsmul_i.c, Revision 1.1

1.1     ! ohara       1: /* mpz_addmul_ui, mpz_submul_ui - add or subtract small multiple.
        !             2:
        !             3:    THE mpz_aorsmul_1 FUNCTION IN THIS FILE IS FOR INTERNAL USE ONLY AND IS
        !             4:    ALMOST CERTAIN TO BE SUBJECT TO INCOMPATIBLE CHANGES OR DISAPPEAR
        !             5:    COMPLETELY IN FUTURE GNU MP RELEASES.
        !             6:
        !             7: Copyright 2001, 2002 Free Software Foundation, Inc.
        !             8:
        !             9: This file is part of the GNU MP Library.
        !            10:
        !            11: The GNU MP Library is free software; you can redistribute it and/or modify
        !            12: it under the terms of the GNU Lesser General Public License as published by
        !            13: the Free Software Foundation; either version 2.1 of the License, or (at your
        !            14: option) any later version.
        !            15:
        !            16: The GNU MP Library is distributed in the hope that it will be useful, but
        !            17: WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
        !            18: or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
        !            19: License for more details.
        !            20:
        !            21: You should have received a copy of the GNU Lesser General Public License
        !            22: along with the GNU MP Library; see the file COPYING.LIB.  If not, write to
        !            23: the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
        !            24: MA 02111-1307, USA. */
        !            25:
        !            26: #include "gmp.h"
        !            27: #include "gmp-impl.h"
        !            28:
        !            29:
        !            30: #if HAVE_NATIVE_mpn_mul_1c
        !            31: #define MPN_MUL_1C(cout, dst, src, size, n, cin)        \
        !            32:   do {                                                  \
        !            33:     (cout) = mpn_mul_1c (dst, src, size, n, cin);       \
        !            34:   } while (0)
        !            35: #else
        !            36: #define MPN_MUL_1C(cout, dst, src, size, n, cin)        \
        !            37:   do {                                                  \
        !            38:     mp_limb_t __cy;                                     \
        !            39:     __cy = mpn_mul_1 (dst, src, size, n);               \
        !            40:     (cout) = __cy + mpn_add_1 (dst, dst, size, cin);    \
        !            41:   } while (0)
        !            42: #endif
        !            43:
        !            44:
        !            45: /* sub>=0 means an addmul w += x*y, sub<0 means a submul w -= x*y.
        !            46:
        !            47:    All that's needed to account for negative w or x is to flip "sub".
        !            48:
        !            49:    The final w will retain its sign, unless an underflow occurs in a submul
        !            50:    of absolute values, in which case it's flipped.
        !            51:
        !            52:    If x has more limbs than w, then mpn_submul_1 followed by mpn_com_n is
        !            53:    used.  The alternative would be mpn_mul_1 into temporary space followed
        !            54:    by mpn_sub_n.  Avoiding temporary space seem good, and submul+com stands
        !            55:    a chance of being faster since it involves only one set of carry
        !            56:    propagations, not two.  Note that doing an addmul_1 with a
        !            57:    twos-complement negative y doesn't work, because it effectively adds an
        !            58:    extra x * 2^BITS_PER_MP_LIMB.  */
        !            59:
        !            60: void
        !            61: mpz_aorsmul_1 (mpz_ptr w, mpz_srcptr x, mp_limb_t y, mp_size_t sub)
        !            62: {
        !            63:   mp_size_t  xsize, wsize, wsize_signed, new_wsize, min_size, dsize;
        !            64:   mp_srcptr  xp;
        !            65:   mp_ptr     wp;
        !            66:   mp_limb_t  cy;
        !            67:
        !            68:   /* w unaffected if x==0 or y==0 */
        !            69:   xsize = SIZ (x);
        !            70:   if (xsize == 0 || y == 0)
        !            71:     return;
        !            72:
        !            73:   sub ^= xsize;
        !            74:   xsize = ABS (xsize);
        !            75:
        !            76:   wsize_signed = SIZ (w);
        !            77:   if (wsize_signed == 0)
        !            78:     {
        !            79:       /* nothing to add to, just set x*y, "sub" gives the sign */
        !            80:       MPZ_REALLOC (w, xsize+1);
        !            81:       wp = PTR (w);
        !            82:       cy = mpn_mul_1 (wp, PTR(x), xsize, y);
        !            83:       wp[xsize] = cy;
        !            84:       xsize += (cy != 0);
        !            85:       SIZ (w) = (sub >= 0 ? xsize : -xsize);
        !            86:       return;
        !            87:     }
        !            88:
        !            89:   sub ^= wsize_signed;
        !            90:   wsize = ABS (wsize_signed);
        !            91:
        !            92:   new_wsize = MAX (wsize, xsize);
        !            93:   MPZ_REALLOC (w, new_wsize+1);
        !            94:   wp = PTR (w);
        !            95:   xp = PTR (x);
        !            96:   min_size = MIN (wsize, xsize);
        !            97:
        !            98:   if (sub >= 0)
        !            99:     {
        !           100:       /* addmul of absolute values */
        !           101:
        !           102:       cy = mpn_addmul_1 (wp, xp, min_size, y);
        !           103:       wp += min_size;
        !           104:       xp += min_size;
        !           105:
        !           106:       dsize = xsize - wsize;
        !           107: #if HAVE_NATIVE_mpn_mul_1c
        !           108:       if (dsize > 0)
        !           109:         cy = mpn_mul_1c (wp, xp, dsize, y, cy);
        !           110:       else if (dsize < 0)
        !           111:         {
        !           112:           dsize = -dsize;
        !           113:           cy = mpn_add_1 (wp, wp, dsize, cy);
        !           114:         }
        !           115: #else
        !           116:       if (dsize != 0)
        !           117:         {
        !           118:           mp_limb_t  cy2;
        !           119:           if (dsize > 0)
        !           120:             cy2 = mpn_mul_1 (wp, xp, dsize, y);
        !           121:           else
        !           122:             {
        !           123:               dsize = -dsize;
        !           124:               cy2 = 0;
        !           125:             }
        !           126:           cy = cy2 + mpn_add_1 (wp, wp, dsize, cy);
        !           127:         }
        !           128: #endif
        !           129:
        !           130:       wp[dsize] = cy;
        !           131:       new_wsize += (cy != 0);
        !           132:     }
        !           133:   else
        !           134:     {
        !           135:       /* submul of absolute values */
        !           136:
        !           137:       cy = mpn_submul_1 (wp, xp, min_size, y);
        !           138:       if (wsize >= xsize)
        !           139:         {
        !           140:           /* if w bigger than x, then propagate borrow through it */
        !           141:           if (wsize != xsize)
        !           142:             cy = mpn_sub_1 (wp+xsize, wp+xsize, wsize-xsize, cy);
        !           143:
        !           144:           if (cy != 0)
        !           145:             {
        !           146:               /* Borrow out of w, take twos complement negative to get
        !           147:                  absolute value, flip sign of w.  */
        !           148:               wp[new_wsize] = ~-cy;  /* extra limb is 0-cy */
        !           149:               mpn_com_n (wp, wp, new_wsize);
        !           150:               new_wsize++;
        !           151:               MPN_INCR_U (wp, new_wsize, CNST_LIMB(1));
        !           152:               wsize_signed = -wsize_signed;
        !           153:             }
        !           154:         }
        !           155:       else /* wsize < xsize */
        !           156:         {
        !           157:           /* x bigger than w, so want x*y-w.  Submul has given w-x*y, so
        !           158:              take twos complement and use an mpn_mul_1 for the rest.  */
        !           159:
        !           160:           mp_limb_t  cy2;
        !           161:
        !           162:           /* -(-cy*b^n + w-x*y) = (cy-1)*b^n + ~(w-x*y) + 1 */
        !           163:           mpn_com_n (wp, wp, wsize);
        !           164:           cy += mpn_add_1 (wp, wp, wsize, CNST_LIMB(1));
        !           165:           cy -= 1;
        !           166:
        !           167:           /* If cy-1 == -1 then hold that -1 for latter.  mpn_submul_1 never
        !           168:              returns cy==MP_LIMB_T_MAX so that value always indicates a -1. */
        !           169:           cy2 = (cy == MP_LIMB_T_MAX);
        !           170:           cy += cy2;
        !           171:           MPN_MUL_1C (cy, wp+wsize, xp+wsize, xsize-wsize, y, cy);
        !           172:           wp[new_wsize] = cy;
        !           173:           new_wsize += (cy != 0);
        !           174:
        !           175:           /* Apply any -1 from above.  The value at wp+wsize is non-zero
        !           176:              because y!=0 and the high limb of x will be non-zero.  */
        !           177:           if (cy2)
        !           178:             MPN_DECR_U (wp+wsize, new_wsize-wsize, CNST_LIMB(1));
        !           179:
        !           180:           wsize_signed = -wsize_signed;
        !           181:         }
        !           182:
        !           183:       /* submul can produce high zero limbs due to cancellation, both when w
        !           184:          has more limbs or x has more  */
        !           185:       MPN_NORMALIZE (wp, new_wsize);
        !           186:     }
        !           187:
        !           188:   SIZ (w) = (wsize_signed >= 0 ? new_wsize : -new_wsize);
        !           189:
        !           190:   ASSERT (new_wsize == 0 || PTR(w)[new_wsize-1] != 0);
        !           191: }
        !           192:
        !           193:
        !           194: void
        !           195: mpz_addmul_ui (mpz_ptr w, mpz_srcptr x, unsigned long y)
        !           196: {
        !           197:   mpz_aorsmul_1 (w, x, (mp_limb_t) y & GMP_NUMB_MASK, (mp_size_t) 0);
        !           198: #if GMP_NAIL_BITS != 0
        !           199:   if (y > GMP_NUMB_MAX && SIZ(x) != 0)
        !           200:     {
        !           201:       mpz_t t;
        !           202:       mp_ptr tp;
        !           203:       mp_size_t xn;
        !           204:       TMP_DECL (mark);
        !           205:       TMP_MARK (mark);
        !           206:       xn = SIZ (x);
        !           207:       MPZ_TMP_INIT (t, ABS (xn) + 1);
        !           208:       tp = PTR (t);
        !           209:       tp[0] = 0;
        !           210:       MPN_COPY (tp + 1, PTR(x), ABS (xn));
        !           211:       SIZ(t) = xn >= 0 ? xn + 1 : xn - 1;
        !           212:       mpz_aorsmul_1 (w, t, (mp_limb_t) y >> GMP_NUMB_BITS, (mp_size_t) 0);
        !           213:       TMP_FREE (mark);
        !           214:     }
        !           215: #endif
        !           216: }
        !           217:
        !           218: void
        !           219: mpz_submul_ui (mpz_ptr w, mpz_srcptr x, unsigned long y)
        !           220: {
        !           221:   mpz_aorsmul_1 (w, x, (mp_limb_t) y & GMP_NUMB_MASK, (mp_size_t) -1);
        !           222: #if GMP_NAIL_BITS != 0
        !           223:   if (y > GMP_NUMB_MAX && SIZ(x) != 0)
        !           224:     {
        !           225:       mpz_t t;
        !           226:       mp_ptr tp;
        !           227:       mp_size_t xn;
        !           228:       TMP_DECL (mark);
        !           229:       TMP_MARK (mark);
        !           230:       xn = SIZ (x);
        !           231:       MPZ_TMP_INIT (t, ABS (xn) + 1);
        !           232:       tp = PTR (t);
        !           233:       tp[0] = 0;
        !           234:       MPN_COPY (tp + 1, PTR(x), ABS (xn));
        !           235:       SIZ(t) = xn >= 0 ? xn + 1 : xn - 1;
        !           236:       mpz_aorsmul_1 (w, t, (mp_limb_t) y >> GMP_NUMB_BITS, (mp_size_t) -1);
        !           237:       TMP_FREE (mark);
        !           238:     }
        !           239: #endif
        !           240: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>