[BACK]Return to addmul_1.c CVS log [TXT][DIR] Up to [local] / OpenXM_contrib / gmp / mpn / tests

Annotation of OpenXM_contrib/gmp/mpn/tests/addmul_1.c, Revision 1.1.1.1

#include <stdio.h>
#include <stdlib.h>
#include "gmp.h"
#include "gmp-impl.h"
#include "longlong.h"
                      5:
                      6: #ifndef USG
                      7: #include <sys/time.h>
                      8: #include <sys/resource.h>
                      9:
                     /* Return the user-mode CPU time consumed so far by the calling
                        process, in milliseconds, as reported by getrusage().

                        Returns 0 if getrusage() fails, so the caller never receives a value
                        computed from an uninitialized struct rusage.  */
                     unsigned long
                     cputime (void)
                     {
                       struct rusage rus;

                       /* RUSAGE_SELF selects the calling process; the code previously
                          passed a bare 0 here.  */
                       if (getrusage (RUSAGE_SELF, &rus) != 0)
                         return 0;

                       /* Seconds and microseconds are both scaled to milliseconds.  */
                       return rus.ru_utime.tv_sec * 1000 + rus.ru_utime.tv_usec / 1000;
                     }
                     18: #else
                     19: #include <time.h>
                     20:
                     #ifndef CLOCKS_PER_SEC
                     #define CLOCKS_PER_SEC 1000000
                     #endif

                     /* Convert a clock() tick count CL to whole milliseconds.

                        The conversion is done in floating point at run time instead of being
                        selected with `#if CLOCKS_PER_SEC >= 10000': the C standard only
                        requires CLOCKS_PER_SEC to be an expression of type clock_t, and some
                        C libraries define it with a cast, which cannot be evaluated by the
                        preprocessor.  This form also stays accurate when CLOCKS_PER_SEC is
                        not a multiple of 1000.  */
                     #define CLOCK_TO_MILLISEC(cl) \
                       ((unsigned long) ((double) (cl) * 1000.0 / (double) CLOCKS_PER_SEC))

                     /* Return the processor time used by the program so far, in
                        milliseconds, based on clock().  Returns 0 when clock() reports that
                        the time is unavailable.  */
                     unsigned long
                     cputime (void)
                     {
                       clock_t ticks = clock ();

                       /* clock() returns (clock_t) -1 when it cannot supply a value.  */
                       if (ticks == (clock_t) -1)
                         return 0;

                       return CLOCK_TO_MILLISEC (ticks);
                     }
                     36: #endif
                     37:
                     /* Postfix "mega" multiplier: `20 M' expands to `20 * 1000000'.
                        Because the expansion starts with an operator, every use must be
                        wrapped in parentheses so that it behaves as a single operand.  */
                     #define M * 1000000

                     /* CLOCK is the assumed processor clock rate, in cycles per second,
                        chosen per target architecture.  It can be overridden by defining
                        CLOCK before this point (for example on the compiler command line).
                        Targets that are not listed stop the build with an #error.  */
                     #ifndef CLOCK
                     #if defined (__m88k__)
                     /* Parenthesized like every other entry so that expressions such as
                        `x / CLOCK' associate correctly.  */
                     #define CLOCK (20 M)
                     #elif defined (__i386__)
                     #define CLOCK (16.666667 M)
                     #elif defined (__m68k__)
                     #define CLOCK (20 M)
                     #elif defined (_IBMR2)
                     #define CLOCK (25 M)
                     #elif defined (__sparc__)
                     #define CLOCK (20 M)
                     #elif defined (__sun__)
                     #define CLOCK (20 M)
                     #elif defined (__mips)
                     #define CLOCK (40 M)
                     #elif defined (__hppa__)
                     #define CLOCK (50 M)
                     #elif defined (__alpha)
                     #define CLOCK (133 M)
                     #else
                     #error "Don't know CLOCK of your machine"
                     #endif
                     #endif
                     63:
                     /* Benchmark sizing knobs, each overridable from the command line.

                        OPS   - target number of limb operations per timed run.
                        SIZE  - number of limbs in each operand.
                        TIMES - number of repetitions of the timed call.

                        If TIMES is not supplied it is derived from OPS and SIZE; if it is
                        supplied, OPS is recomputed from SIZE and TIMES so the two stay
                        consistent.  All derived macros are fully parenthesized so they can
                        be used safely inside larger expressions.  */
                     #ifndef OPS
                     #define OPS 20000000
                     #endif
                     #ifndef SIZE
                     #define SIZE 496
                     #endif
                     #ifndef TIMES
                     #define TIMES ((OPS) / (SIZE))
                     #else
                     #undef OPS
                     #define OPS ((SIZE) * (TIMES))
                     #endif
                     76:
                     77: mp_limb_t
                     78: refmpn_addmul_1 (res_ptr, s1_ptr, s1_size, s2_limb)
                     79:      register mp_ptr res_ptr;
                     80:      register mp_srcptr s1_ptr;
                     81:      mp_size_t s1_size;
                     82:      register mp_limb_t s2_limb;
                     83: {
                     84:   register mp_limb_t cy_limb;
                     85:   register mp_size_t j;
                     86:   register mp_limb_t prod_high, prod_low;
                     87:   register mp_limb_t x;
                     88:
                     89:   /* The loop counter and index J goes from -SIZE to -1.  This way
                     90:      the loop becomes faster.  */
                     91:   j = -s1_size;
                     92:
                     93:   /* Offset the base pointers to compensate for the negative indices.  */
                     94:   res_ptr -= j;
                     95:   s1_ptr -= j;
                     96:
                     97:   cy_limb = 0;
                     98:   do
                     99:     {
                    100:       umul_ppmm (prod_high, prod_low, s1_ptr[j], s2_limb);
                    101:
                    102:       prod_low += cy_limb;
                    103:       cy_limb = (prod_low < cy_limb) + prod_high;
                    104:
                    105:       x = res_ptr[j];
                    106:       prod_low = x + prod_low;
                    107:       cy_limb += (prod_low < x);
                    108:       res_ptr[j] = prod_low;
                    109:     }
                    110:   while (++j != 0);
                    111:
                    112:   return cy_limb;
                    113: }
                    114:
                    115: main (argc, argv)
                    116:      int argc;
                    117:      char **argv;
                    118: {
                    119:   mp_limb_t s1[SIZE];
                    120:   mp_limb_t dx[SIZE+2];
                    121:   mp_limb_t dy[SIZE+2];
                    122:   mp_limb_t cyx, cyy;
                    123:   int i;
                    124:   long t0, t;
                    125:   int test;
                    126:   mp_limb_t xlimb;
                    127:   mp_size_t size;
                    128:   double cyc;
                    129:
                    130:   for (test = 0; ; test++)
                    131:     {
                    132: #ifdef RANDOM
                    133:       size = (random () % SIZE + 1);
                    134: #else
                    135:       size = SIZE;
                    136: #endif
                    137:
                    138:       mpn_random2 (s1, size);
                    139:       mpn_random2 (dy+1, size);
                    140:
                    141:       if (random () % 0x100 == 0)
                    142:        xlimb = 0;
                    143:       else
                    144:        mpn_random2 (&xlimb, 1);
                    145:
                    146:       dy[size+1] = 0x12345678;
                    147:       dy[0] = 0x87654321;
                    148:
                    149: #if defined (PRINT) || defined (XPRINT)
                    150:       printf ("xlimb=%*lX\n", (int) (2 * sizeof(mp_limb_t)), xlimb);
                    151: #endif
                    152: #ifdef PRINT
                    153:       mpn_print (dy+1, size);
                    154:       mpn_print (s1, size);
                    155: #endif
                    156:
                    157:       MPN_COPY (dx, dy, size+2);
                    158:       t0 = cputime();
                    159:       for (i = 0; i < TIMES; i++)
                    160:        cyx = refmpn_addmul_1 (dx+1, s1, size, xlimb);
                    161:       t = cputime() - t0;
                    162: #if TIMES != 1
                    163:       cyc = ((double) t * CLOCK) / (OPS * 1000.0);
                    164:       printf ("refmpn_addmul_1: %5ldms (%.2f cycles/limb) [%.2f Gb/s]\n",
                    165:              t,
                    166:              cyc,
                    167:              CLOCK/cyc*BITS_PER_MP_LIMB*BITS_PER_MP_LIMB);
                    168: #endif
                    169:
                    170:       MPN_COPY (dx, dy, size+2);
                    171:       t0 = cputime();
                    172:       for (i = 0; i < TIMES; i++)
                    173:        cyy = mpn_addmul_1 (dx+1, s1, size, xlimb);
                    174:       t = cputime() - t0;
                    175: #if TIMES != 1
                    176:       cyc = ((double) t * CLOCK) / (OPS * 1000.0);
                    177:       printf ("mpn_addmul_1:    %5ldms (%.2f cycles/limb) [%.2f Gb/s]\n",
                    178:              t,
                    179:              cyc,
                    180:              CLOCK/cyc*BITS_PER_MP_LIMB*BITS_PER_MP_LIMB);
                    181: #endif
                    182:
                    183:       MPN_COPY (dx, dy, size+2);
                    184:       cyx = refmpn_addmul_1 (dx+1, s1, size, xlimb);
                    185:       cyy = mpn_addmul_1 (dy+1, s1, size, xlimb);
                    186:
                    187: #ifdef PRINT
                    188:       printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
                    189:       mpn_print (dx+1, size);
                    190:       printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
                    191:       mpn_print (dy+1, size);
                    192: #endif
                    193:
                    194: #ifndef NOCHECK
                    195:       if (cyx != cyy || mpn_cmp (dx, dy, size+2) != 0
                    196:          || dx[size+1] != 0x12345678 || dx[0] != 0x87654321)
                    197:        {
                    198: #ifndef PRINT
                    199:          printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
                    200:          mpn_print (dx+1, size);
                    201:          printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
                    202:          mpn_print (dy+1, size);
                    203: #endif
                    204:          abort();
                    205:        }
                    206: #endif
                    207:     }
                    208: }
                    209:
                    210: mpn_print (mp_ptr p, mp_size_t size)
                    211: {
                    212:   mp_size_t i;
                    213:
                    214:   for (i = size - 1; i >= 0; i--)
                    215:     {
                    216:       printf ("%0*lX", (int) (2 * sizeof(mp_limb_t)), p[i]);
                    217: #ifdef SPACE
                    218:       if (i != 0)
                    219:        printf (" ");
                    220: #endif
                    221:     }
                    222:   puts ("");
                    223: }

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>