Annotation of OpenXM_contrib/gmp/mpn/tests/submul_1.c, Revision 1.1
1.1 ! maekawa 1: #include <stdio.h>
! 2: #include "gmp.h"
! 3: #include "gmp-impl.h"
! 4: #include "longlong.h"
! 5:
! 6: #ifndef USG
! 7: #include <sys/time.h>
! 8: #include <sys/resource.h>
! 9:
/* Return the user-mode CPU time consumed so far by this process, in
   milliseconds.

   Returns 0 if getrusage fails, so callers never read an indeterminate
   rusage structure.  */
unsigned long
cputime (void)
{
  struct rusage rus;

  if (getrusage (RUSAGE_SELF, &rus) != 0)
    return 0;

  /* Do the conversion in unsigned long: the result type is unsigned long
     anyway, and unsigned arithmetic wraps instead of overflowing a signed
     time_t.  */
  return (unsigned long) rus.ru_utime.tv_sec * 1000UL
         + (unsigned long) rus.ru_utime.tv_usec / 1000UL;
}
! 18: #else
! 19: #include <time.h>
! 20:
#ifndef CLOCKS_PER_SEC
#define CLOCKS_PER_SEC 1000000
#endif

/* Convert a clock() tick count CL to milliseconds.

   For tick rates of at least 10000 per second the count is divided by the
   number of ticks per millisecond; for slower clocks it is scaled up first
   so that precision is not lost.

   The choice is made in an ordinary expression rather than with #if,
   because CLOCKS_PER_SEC is not guaranteed to be usable in preprocessor
   arithmetic (some C libraries define it with a cast).  Only one arm of
   the conditional is evaluated, so CL is evaluated once.  */
#define CLOCK_TO_MILLISEC(cl) \
  (CLOCKS_PER_SEC >= 10000 \
   ? (cl) / (CLOCKS_PER_SEC / 1000) \
   : (cl) * 1000 / CLOCKS_PER_SEC)

/* Return the processor time used so far by this program, in milliseconds,
   as reported by clock().  Returns 0 if clock() reports failure.  */
unsigned long
cputime (void)
{
  clock_t ticks = clock ();

  /* clock() signals "not available" with (clock_t) -1.  */
  if (ticks == (clock_t) -1)
    return 0;

  return (unsigned long) CLOCK_TO_MILLISEC (ticks);
}
! 36: #endif
! 37:
! 38: #define M * 1000000
! 39:
! 40: #ifndef CLOCK
! 41: #if defined (__m88k__)
! 42: #define CLOCK 20 M
! 43: #elif defined (__i386__)
! 44: #define CLOCK (16.666667 M)
! 45: #elif defined (__m68k__)
! 46: #define CLOCK (20 M)
! 47: #elif defined (_IBMR2)
! 48: #define CLOCK (25 M)
! 49: #elif defined (__sparc__)
! 50: #define CLOCK (20 M)
! 51: #elif defined (__sun__)
! 52: #define CLOCK (20 M)
! 53: #elif defined (__mips)
! 54: #define CLOCK (40 M)
! 55: #elif defined (__hppa__)
! 56: #define CLOCK (50 M)
! 57: #elif defined (__alpha)
! 58: #define CLOCK (133 M)
! 59: #else
! 60: #error "Don't know CLOCK of your machine"
! 61: #endif
! 62: #endif
! 63:
/* Workload parameters, each overridable from the compiler command line:

     OPS    total number of limb operations per timing run
     SIZE   number of limbs in each operand
     TIMES  number of calls per timing run

   If TIMES is not given it is derived from OPS and SIZE; if it is given,
   OPS is recomputed from SIZE and TIMES.  The derived definitions are
   parenthesized so they expand as a single operand in any expression.  */
#ifndef OPS
#define OPS 20000000
#endif
#ifndef SIZE
#define SIZE 496
#endif
#ifndef TIMES
#define TIMES (OPS / SIZE)
#else
#undef OPS
#define OPS ((SIZE) * (TIMES))
#endif
! 76:
! 77: mp_limb_t
! 78: refmpn_submul_1 (res_ptr, s1_ptr, s1_size, s2_limb)
! 79: register mp_ptr res_ptr;
! 80: register mp_srcptr s1_ptr;
! 81: mp_size_t s1_size;
! 82: register mp_limb_t s2_limb;
! 83: {
! 84: register mp_limb_t cy_limb;
! 85: register mp_size_t j;
! 86: register mp_limb_t prod_high, prod_low;
! 87: register mp_limb_t x;
! 88:
! 89: /* The loop counter and index J goes from -SIZE to -1. This way
! 90: the loop becomes faster. */
! 91: j = -s1_size;
! 92:
! 93: /* Offset the base pointers to compensate for the negative indices. */
! 94: res_ptr -= j;
! 95: s1_ptr -= j;
! 96:
! 97: cy_limb = 0;
! 98: do
! 99: {
! 100: umul_ppmm (prod_high, prod_low, s1_ptr[j], s2_limb);
! 101:
! 102: prod_low += cy_limb;
! 103: cy_limb = (prod_low < cy_limb) + prod_high;
! 104:
! 105: x = res_ptr[j];
! 106: prod_low = x - prod_low;
! 107: cy_limb += (prod_low > x);
! 108: res_ptr[j] = prod_low;
! 109: }
! 110: while (++j != 0);
! 111:
! 112: return cy_limb;
! 113: }
! 114:
! 115: main (argc, argv)
! 116: int argc;
! 117: char **argv;
! 118: {
! 119: mp_limb_t s1[SIZE];
! 120: mp_limb_t dx[SIZE+2];
! 121: mp_limb_t dy[SIZE+2];
! 122: mp_limb_t cyx, cyy;
! 123: int i;
! 124: long t0, t;
! 125: int test;
! 126: mp_limb_t xlimb;
! 127: mp_size_t size;
! 128:
! 129: for (test = 0; ; test++)
! 130: {
! 131: #ifdef RANDOM
! 132: size = (random () % SIZE + 1);
! 133: #else
! 134: size = SIZE;
! 135: #endif
! 136:
! 137: mpn_random2 (s1, size);
! 138: mpn_random2 (dy+1, size);
! 139:
! 140: if (random () % 0x100 == 0)
! 141: xlimb = 0;
! 142: else
! 143: mpn_random2 (&xlimb, 1);
! 144:
! 145: dy[size+1] = 0x12345678;
! 146: dy[0] = 0x87654321;
! 147:
! 148: #if defined (PRINT) || defined (XPRINT)
! 149: printf ("xlimb=%*lX\n", (int) (2 * sizeof(mp_limb_t)), xlimb);
! 150: #endif
! 151: #ifdef PRINT
! 152: mpn_print (dy+1, size);
! 153: mpn_print (s1, size);
! 154: #endif
! 155:
! 156: MPN_COPY (dx, dy, size+2);
! 157: t0 = cputime();
! 158: for (i = 0; i < TIMES; i++)
! 159: cyx = refmpn_submul_1 (dx+1, s1, size, xlimb);
! 160: t = cputime() - t0;
! 161: #if TIMES != 1
! 162: printf ("refmpn_submul_1: %5ldms (%.2f cycles/limb)\n",
! 163: t,
! 164: ((double) t * CLOCK) / (OPS * 1000.0));
! 165: #endif
! 166:
! 167: MPN_COPY (dx, dy, size+2);
! 168: t0 = cputime();
! 169: for (i = 0; i < TIMES; i++)
! 170: cyy = mpn_submul_1 (dx+1, s1, size, xlimb);
! 171: t = cputime() - t0;
! 172: #if TIMES != 1
! 173: printf ("mpn_submul_1: %5ldms (%.2f cycles/limb)\n",
! 174: t,
! 175: ((double) t * CLOCK) / (OPS * 1000.0));
! 176: #endif
! 177:
! 178: MPN_COPY (dx, dy, size+2);
! 179: cyx = refmpn_submul_1 (dx+1, s1, size, xlimb);
! 180: cyy = mpn_submul_1 (dy+1, s1, size, xlimb);
! 181:
! 182: #ifdef PRINT
! 183: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
! 184: mpn_print (dx+1, size);
! 185: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
! 186: mpn_print (dy+1, size);
! 187: #endif
! 188:
! 189: #ifndef NOCHECK
! 190: if (cyx != cyy || mpn_cmp (dx, dy, size+2) != 0
! 191: || dx[size+1] != 0x12345678 || dx[0] != 0x87654321)
! 192: {
! 193: #ifndef PRINT
! 194: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
! 195: mpn_print (dx+1, size);
! 196: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
! 197: mpn_print (dy+1, size);
! 198: #endif
! 199: abort();
! 200: }
! 201: #endif
! 202: }
! 203: }
! 204:
! 205: mpn_print (mp_ptr p, mp_size_t size)
! 206: {
! 207: mp_size_t i;
! 208:
! 209: for (i = size - 1; i >= 0; i--)
! 210: {
! 211: printf ("%0*lX", (int) (2 * sizeof(mp_limb_t)), p[i]);
! 212: #ifdef SPACE
! 213: if (i != 0)
! 214: printf (" ");
! 215: #endif
! 216: }
! 217: puts ("");
! 218: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>