[BACK]Return to submul_1.c CVS log [TXT][DIR] Up to [local] / OpenXM / src / kan96xx / gmp-2.0.2-ssh-2 / mpn / tests

Annotation of OpenXM/src/kan96xx/gmp-2.0.2-ssh-2/mpn/tests/submul_1.c, Revision 1.1

#include <stdio.h>
#include <stdlib.h>
#include "gmp.h"
#include "gmp-impl.h"
#include "longlong.h"
        !             5:
        !             6: #ifndef USG
        !             7: #include <sys/time.h>
        !             8: #include <sys/resource.h>
        !             9:
        /* Return the user CPU time consumed by the calling process so far,
           in milliseconds, as reported by getrusage().  Returns 0 when the
           resource usage cannot be obtained, so callers never see a value
           computed from an uninitialised structure.  */
        unsigned long
        cputime (void)
        {
          struct rusage rus;

          if (getrusage (RUSAGE_SELF, &rus) != 0)
            return 0;

          /* Seconds scaled up to milliseconds, microseconds scaled down.  */
          return (unsigned long) rus.ru_utime.tv_sec * 1000UL
                 + (unsigned long) rus.ru_utime.tv_usec / 1000UL;
        }
        !            18: #else
        !            19: #include <time.h>
        !            20:
        #ifndef CLOCKS_PER_SEC
        #define CLOCKS_PER_SEC 1000000
        #endif

        /* Convert a clock() tick count to milliseconds.  The conversion is
           an ordinary expression rather than an #if on CLOCKS_PER_SEC,
           because CLOCKS_PER_SEC is allowed to expand to something (such as
           a cast) that the preprocessor cannot evaluate.  Going through
           double also avoids overflowing the tick count when multiplying
           by 1000.  */
        #define CLOCK_TO_MILLISEC(cl) \
          ((unsigned long) ((double) (cl) * 1000.0 / (double) CLOCKS_PER_SEC))

        /* Return the processor time used by the program so far, in
           milliseconds, based on clock().  Returns 0 when clock() reports
           that the time is not available.  */
        unsigned long
        cputime (void)
        {
          clock_t ticks = clock ();

          if (ticks == (clock_t) -1)
            return 0;

          return CLOCK_TO_MILLISEC (ticks);
        }
        !            36: #endif
        !            37:
        !            38: #define M * 1000000
        !            39:
        !            40: #ifndef CLOCK
        !            41: #if defined (__m88k__)
        !            42: #define CLOCK 20 M
        !            43: #elif defined (__i386__)
        !            44: #define CLOCK (16.666667 M)
        !            45: #elif defined (__m68k__)
        !            46: #define CLOCK (20 M)
        !            47: #elif defined (_IBMR2)
        !            48: #define CLOCK (25 M)
        !            49: #elif defined (__sparc__)
        !            50: #define CLOCK (20 M)
        !            51: #elif defined (__sun__)
        !            52: #define CLOCK (20 M)
        !            53: #elif defined (__mips)
        !            54: #define CLOCK (40 M)
        !            55: #elif defined (__hppa__)
        !            56: #define CLOCK (50 M)
        !            57: #elif defined (__alpha)
        !            58: #define CLOCK (133 M)
        !            59: #else
        !            60: #error "Don't know CLOCK of your machine"
        !            61: #endif
        !            62: #endif
        !            63:
        /* Benchmark sizing.
           OPS   - approximate total number of limb operations per timed run.
           SIZE  - number of limbs in each operand.
           TIMES - number of repetitions of the routine per timed run.
           If TIMES is not given it is derived from OPS and SIZE; if it is
           given, OPS is recomputed from SIZE and TIMES instead.  The derived
           macros are fully parenthesised so they can be used safely inside
           larger expressions.  */
        #ifndef OPS
        #define OPS 20000000
        #endif
        #ifndef SIZE
        #define SIZE 496
        #endif
        #ifndef TIMES
        #define TIMES ((OPS) / (SIZE))
        #else
        #undef OPS
        #define OPS ((SIZE) * (TIMES))
        #endif
        !            76:
        !            77: mp_limb_t
        !            78: refmpn_submul_1 (res_ptr, s1_ptr, s1_size, s2_limb)
        !            79:      register mp_ptr res_ptr;
        !            80:      register mp_srcptr s1_ptr;
        !            81:      mp_size_t s1_size;
        !            82:      register mp_limb_t s2_limb;
        !            83: {
        !            84:   register mp_limb_t cy_limb;
        !            85:   register mp_size_t j;
        !            86:   register mp_limb_t prod_high, prod_low;
        !            87:   register mp_limb_t x;
        !            88:
        !            89:   /* The loop counter and index J goes from -SIZE to -1.  This way
        !            90:      the loop becomes faster.  */
        !            91:   j = -s1_size;
        !            92:
        !            93:   /* Offset the base pointers to compensate for the negative indices.  */
        !            94:   res_ptr -= j;
        !            95:   s1_ptr -= j;
        !            96:
        !            97:   cy_limb = 0;
        !            98:   do
        !            99:     {
        !           100:       umul_ppmm (prod_high, prod_low, s1_ptr[j], s2_limb);
        !           101:
        !           102:       prod_low += cy_limb;
        !           103:       cy_limb = (prod_low < cy_limb) + prod_high;
        !           104:
        !           105:       x = res_ptr[j];
        !           106:       prod_low = x - prod_low;
        !           107:       cy_limb += (prod_low > x);
        !           108:       res_ptr[j] = prod_low;
        !           109:     }
        !           110:   while (++j != 0);
        !           111:
        !           112:   return cy_limb;
        !           113: }
        !           114:
        !           115: main (argc, argv)
        !           116:      int argc;
        !           117:      char **argv;
        !           118: {
        !           119:   mp_limb_t s1[SIZE];
        !           120:   mp_limb_t dx[SIZE+2];
        !           121:   mp_limb_t dy[SIZE+2];
        !           122:   mp_limb_t cyx, cyy;
        !           123:   int i;
        !           124:   long t0, t;
        !           125:   int test;
        !           126:   mp_limb_t xlimb;
        !           127:   mp_size_t size;
        !           128:
        !           129:   for (test = 0; ; test++)
        !           130:     {
        !           131: #ifdef RANDOM
        !           132:       size = (random () % SIZE + 1);
        !           133: #else
        !           134:       size = SIZE;
        !           135: #endif
        !           136:
        !           137:       mpn_random2 (s1, size);
        !           138:       mpn_random2 (dy+1, size);
        !           139:
        !           140:       if (random () % 0x100 == 0)
        !           141:        xlimb = 0;
        !           142:       else
        !           143:        mpn_random2 (&xlimb, 1);
        !           144:
        !           145:       dy[size+1] = 0x12345678;
        !           146:       dy[0] = 0x87654321;
        !           147:
        !           148: #if defined (PRINT) || defined (XPRINT)
        !           149:       printf ("xlimb=%*lX\n", (int) (2 * sizeof(mp_limb_t)), xlimb);
        !           150: #endif
        !           151: #ifdef PRINT
        !           152:       mpn_print (dy+1, size);
        !           153:       mpn_print (s1, size);
        !           154: #endif
        !           155:
        !           156:       MPN_COPY (dx, dy, size+2);
        !           157:       t0 = cputime();
        !           158:       for (i = 0; i < TIMES; i++)
        !           159:        cyx = refmpn_submul_1 (dx+1, s1, size, xlimb);
        !           160:       t = cputime() - t0;
        !           161: #if TIMES != 1
        !           162:       printf ("refmpn_submul_1: %5ldms (%.2f cycles/limb)\n",
        !           163:              t,
        !           164:              ((double) t * CLOCK) / (OPS * 1000.0));
        !           165: #endif
        !           166:
        !           167:       MPN_COPY (dx, dy, size+2);
        !           168:       t0 = cputime();
        !           169:       for (i = 0; i < TIMES; i++)
        !           170:        cyy = mpn_submul_1 (dx+1, s1, size, xlimb);
        !           171:       t = cputime() - t0;
        !           172: #if TIMES != 1
        !           173:       printf ("mpn_submul_1:    %5ldms (%.2f cycles/limb)\n",
        !           174:              t,
        !           175:              ((double) t * CLOCK) / (OPS * 1000.0));
        !           176: #endif
        !           177:
        !           178:       MPN_COPY (dx, dy, size+2);
        !           179:       cyx = refmpn_submul_1 (dx+1, s1, size, xlimb);
        !           180:       cyy = mpn_submul_1 (dy+1, s1, size, xlimb);
        !           181:
        !           182: #ifdef PRINT
        !           183:       printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
        !           184:       mpn_print (dx+1, size);
        !           185:       printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
        !           186:       mpn_print (dy+1, size);
        !           187: #endif
        !           188:
        !           189: #ifndef NOCHECK
        !           190:       if (cyx != cyy || mpn_cmp (dx, dy, size+2) != 0
        !           191:          || dx[size+1] != 0x12345678 || dx[0] != 0x87654321)
        !           192:        {
        !           193: #ifndef PRINT
        !           194:          printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
        !           195:          mpn_print (dx+1, size);
        !           196:          printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
        !           197:          mpn_print (dy+1, size);
        !           198: #endif
        !           199:          abort();
        !           200:        }
        !           201: #endif
        !           202:     }
        !           203: }
        !           204:
        !           205: mpn_print (mp_ptr p, mp_size_t size)
        !           206: {
        !           207:   mp_size_t i;
        !           208:
        !           209:   for (i = size - 1; i >= 0; i--)
        !           210:     {
        !           211:       printf ("%0*lX", (int) (2 * sizeof(mp_limb_t)), p[i]);
        !           212: #ifdef SPACE
        !           213:       if (i != 0)
        !           214:        printf (" ");
        !           215: #endif
        !           216:     }
        !           217:   puts ("");
        !           218: }

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>