OpenXM_contrib/gmp/tune/modlinv.c - annotate

Return to modlinv.c CVS log
Up to [local] / OpenXM_contrib / gmp / tune
Annotation of OpenXM_contrib/gmp/tune/modlinv.c, Revision 1.1.1.1

1.1       ohara       1: /* Alternate implementations of modlimb_invert to compare speeds. */
                      2:
                      3: /*
                      4: Copyright 2000, 2002 Free Software Foundation, Inc.
                      5:
                      6: This file is part of the GNU MP Library.
                      7:
                      8: The GNU MP Library is free software; you can redistribute it and/or modify
                      9: it under the terms of the GNU Lesser General Public License as published by
                     10: the Free Software Foundation; either version 2.1 of the License, or (at your
                     11: option) any later version.
                     12:
                     13: The GNU MP Library is distributed in the hope that it will be useful, but
                     14: WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
                     15: or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
                     16: License for more details.
                     17:
                     18: You should have received a copy of the GNU Lesser General Public License
                     19: along with the GNU MP Library; see the file COPYING.LIB.  If not, write to
                     20: the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
                     21: MA 02111-1307, USA.
                     22: */
                     23:
                     24: #include <stdio.h>
                     25: #include "gmp.h"
                     26: #include "gmp-impl.h"
                     27: #include "longlong.h"
                     28: #include "speed.h"
                     29:
                     30:
                     31: /* Like the standard version in gmp-impl.h, but with the expressions using a
                     32:    "1-" form.  This has the same number of steps, but "1-" is on the
                     33:    dependent chain, whereas the "2*" in the standard version isn't.
                     34:    Depending on the CPU this should be the same or a touch slower.  */
                     35:
                     36: #if BITS_PER_MP_LIMB <= 32
                     37: #define modlimb_invert_mul1(inv,n)                              \
                     38:   do {                                                          \
                     39:     mp_limb_t  __n = (n);                                       \
                     40:     mp_limb_t  __inv;                                           \
                     41:     ASSERT ((__n & 1) == 1);                                    \
                     42:     __inv = modlimb_invert_table[(__n&0xFF)/2]; /*  8 */        \
                     43:     __inv = (1 - __n * __inv) * __inv + __inv;  /* 16 */        \
                     44:     __inv = (1 - __n * __inv) * __inv + __inv;  /* 32 */        \
                     45:     ASSERT (__inv * __n == 1);                                  \
                     46:     (inv) = __inv;                                              \
                     47:   } while (0)
                     48: #endif
                     49:
                     50: #if BITS_PER_MP_LIMB > 32 && BITS_PER_MP_LIMB <= 64
                     51: #define modlimb_invert_mul1(inv,n)                              \
                     52:   do {                                                          \
                     53:     mp_limb_t  __n = (n);                                       \
                     54:     mp_limb_t  __inv;                                           \
                     55:     ASSERT ((__n & 1) == 1);                                    \
                     56:     __inv = modlimb_invert_table[(__n&0xFF)/2]; /*  8 */        \
                     57:     __inv = (1 - __n * __inv) * __inv + __inv;  /* 16 */        \
                     58:     __inv = (1 - __n * __inv) * __inv + __inv;  /* 32 */        \
                     59:     __inv = (1 - __n * __inv) * __inv + __inv;  /* 64 */        \
                     60:     ASSERT (__inv * __n == 1);                                  \
                     61:     (inv) = __inv;                                              \
                     62:   } while (0)
                     63: #endif
                     64:
                     65:
                     66: /* The loop based version used in GMP 3.0 and earlier.  Usually slower than
                     67:    multiplying, due to the number of steps that must be performed.  Much
                     68:    slower when the processor has a good multiply.  */
                     69:
                     70: #define modlimb_invert_loop(inv,n)              \
                     71:   do {                                          \
                     72:     mp_limb_t  __v = (n);                       \
                     73:     mp_limb_t  __v_orig = __v;                  \
                     74:     mp_limb_t  __make_zero = 1;                 \
                     75:     mp_limb_t  __two_i = 1;                     \
                     76:     mp_limb_t  __v_inv = 0;                     \
                     77:                                                 \
                     78:     ASSERT ((__v & 1) == 1);                    \
                     79:                                                 \
                     80:     do                                          \
                     81:       {                                         \
                     82:         while ((__two_i & __make_zero) == 0)    \
                     83:           __two_i <<= 1, __v <<= 1;             \
                     84:         __v_inv += __two_i;                     \
                     85:         __make_zero -= __v;                     \
                     86:       }                                         \
                     87:     while (__make_zero);                        \
                     88:                                                 \
                     89:     ASSERT (__v_orig * __v_inv == 1);           \
                     90:     (inv) = __v_inv;                            \
                     91:   } while (0)
                     92:
                     93:
                     94: /* Another loop based version with conditionals, but doing a fixed number of
                     95:    steps. */
                     96:
                     97: #define modlimb_invert_cond(inv,n)              \
                     98:   do {                                          \
                     99:     mp_limb_t  __n = (n);                       \
                    100:     mp_limb_t  __rem = (1 - __n) >> 1;          \
                    101:     mp_limb_t  __inv = GMP_LIMB_HIGHBIT;       \
                    102:     int        __count;                         \
                    103:                                                 \
                    104:     ASSERT ((__n & 1) == 1);                    \
                    105:                                                 \
                    106:     __count = BITS_PER_MP_LIMB-1;               \
                    107:     do                                          \
                    108:       {                                         \
                    109:         __inv >>= 1;                            \
                    110:         if (__rem & 1)                          \
                    111:           {                                     \
                    112:             __inv |= GMP_LIMB_HIGHBIT;         \
                    113:             __rem -= __n;                       \
                    114:           }                                     \
                    115:         __rem >>= 1;                            \
                    116:       }                                         \
                    117:     while (-- __count);                         \
                    118:                                                 \
                    119:     ASSERT (__inv * __n == 1);                  \
                    120:     (inv) = __inv;                              \
                    121:   } while (0)
                    122:
                    123:
                    124: /* Another loop based bitwise version, but purely arithmetic, no
                    125:    conditionals. */
                    126:
                    127: #define modlimb_invert_arith(inv,n)                                     \
                    128:   do {                                                                  \
                    129:     mp_limb_t  __n = (n);                                               \
                    130:     mp_limb_t  __rem = (1 - __n) >> 1;                                  \
                    131:     mp_limb_t  __inv = GMP_LIMB_HIGHBIT;                               \
                    132:     mp_limb_t  __lowbit;                                                \
                    133:     int        __count;                                                 \
                    134:                                                                         \
                    135:     ASSERT ((__n & 1) == 1);                                            \
                    136:                                                                         \
                    137:     __count = BITS_PER_MP_LIMB-1;                                       \
                    138:     do                                                                  \
                    139:       {                                                                 \
                    140:         __lowbit = __rem & 1;                                           \
                    141:         __inv = (__inv >> 1) | (__lowbit << (BITS_PER_MP_LIMB-1));      \
                    142:         __rem = (__rem - (__n & -__lowbit)) >> 1;                       \
                    143:       }                                                                 \
                    144:     while (-- __count);                                                 \
                    145:                                                                         \
                    146:     ASSERT (__inv * __n == 1);                                          \
                    147:     (inv) = __inv;                                                      \
                    148:   } while (0)
                    149:
                    150:
                    151: double
                    152: speed_modlimb_invert_mul1 (struct speed_params *s)
                    153: {
                    154:   SPEED_ROUTINE_MODLIMB_INVERT (modlimb_invert_mul1);
                    155: }
                    156: double
                    157: speed_modlimb_invert_loop (struct speed_params *s)
                    158: {
                    159:   SPEED_ROUTINE_MODLIMB_INVERT (modlimb_invert_loop);
                    160: }
                    161: double
                    162: speed_modlimb_invert_cond (struct speed_params *s)
                    163: {
                    164:   SPEED_ROUTINE_MODLIMB_INVERT (modlimb_invert_cond);
                    165: }
                    166: double
                    167: speed_modlimb_invert_arith (struct speed_params *s)
                    168: {
                    169:   SPEED_ROUTINE_MODLIMB_INVERT (modlimb_invert_arith);
                    170: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>