Annotation of OpenXM_contrib/gmp/mpn/tests/submul_1.c, Revision 1.1.1.1
#include <stdio.h>
#include <stdlib.h>
#include "gmp.h"
#include "gmp-impl.h"
#include "longlong.h"
5:
6: #ifndef USG
7: #include <sys/time.h>
8: #include <sys/resource.h>
9:
/* Return the user CPU time consumed by this process so far, in
   milliseconds, as reported by getrusage.  Returns 0 if getrusage
   fails, so that the usage record is never read uninitialised.  */
unsigned long
cputime (void)
{
  struct rusage rus;

  if (getrusage (RUSAGE_SELF, &rus) != 0)
    return 0;

  /* Seconds scaled up to milliseconds plus microseconds scaled down.  */
  return rus.ru_utime.tv_sec * 1000 + rus.ru_utime.tv_usec / 1000;
}
18: #else
19: #include <time.h>
20:
#ifndef CLOCKS_PER_SEC
#define CLOCKS_PER_SEC 1000000
#endif

/* Convert a clock() tick count to milliseconds.

   The choice between the two formulas is made in an ordinary constant
   expression rather than with #if: CLOCKS_PER_SEC is only required to be
   an expression of type clock_t and may contain a cast, which the
   preprocessor cannot evaluate.  For fine-grained clocks the divisor is
   scaled first so the tick count is not multiplied (avoiding overflow);
   for coarse clocks the tick count is multiplied first to keep
   precision.  */
#define CLOCK_TO_MILLISEC(cl)				\
  (CLOCKS_PER_SEC >= 10000				\
   ? (cl) / (CLOCKS_PER_SEC / 1000)			\
   : (cl) * 1000 / CLOCKS_PER_SEC)

/* Return the processor time used by the program so far, in
   milliseconds, as reported by clock.  Returns 0 when clock reports
   that the time is unavailable.  */
unsigned long
cputime (void)
{
  clock_t ticks = clock ();

  if (ticks == (clock_t) -1)
    return 0;

  return (unsigned long) CLOCK_TO_MILLISEC (ticks);
}
36: #endif
37:
38: #define M * 1000000
39:
40: #ifndef CLOCK
41: #if defined (__m88k__)
42: #define CLOCK 20 M
43: #elif defined (__i386__)
44: #define CLOCK (16.666667 M)
45: #elif defined (__m68k__)
46: #define CLOCK (20 M)
47: #elif defined (_IBMR2)
48: #define CLOCK (25 M)
49: #elif defined (__sparc__)
50: #define CLOCK (20 M)
51: #elif defined (__sun__)
52: #define CLOCK (20 M)
53: #elif defined (__mips)
54: #define CLOCK (40 M)
55: #elif defined (__hppa__)
56: #define CLOCK (50 M)
57: #elif defined (__alpha)
58: #define CLOCK (133 M)
59: #else
60: #error "Don't know CLOCK of your machine"
61: #endif
62: #endif
63:
/* Benchmark sizing.
   OPS   - total number of limb operations per timing run.
   SIZE  - number of limbs in each operand (and the array dimension).
   TIMES - how many times each routine is called per timing run.
   If TIMES is not supplied it is derived from OPS and SIZE; if it is
   supplied, OPS is recomputed from it instead.  All derived values are
   fully parenthesised so they can be used inside larger expressions.  */
#ifndef OPS
#define OPS 20000000
#endif
#ifndef SIZE
#define SIZE 496
#endif
#ifndef TIMES
#define TIMES ((OPS) / (SIZE))
#else
#undef OPS
#define OPS ((SIZE) * (TIMES))
#endif
76:
77: mp_limb_t
78: refmpn_submul_1 (res_ptr, s1_ptr, s1_size, s2_limb)
79: register mp_ptr res_ptr;
80: register mp_srcptr s1_ptr;
81: mp_size_t s1_size;
82: register mp_limb_t s2_limb;
83: {
84: register mp_limb_t cy_limb;
85: register mp_size_t j;
86: register mp_limb_t prod_high, prod_low;
87: register mp_limb_t x;
88:
89: /* The loop counter and index J goes from -SIZE to -1. This way
90: the loop becomes faster. */
91: j = -s1_size;
92:
93: /* Offset the base pointers to compensate for the negative indices. */
94: res_ptr -= j;
95: s1_ptr -= j;
96:
97: cy_limb = 0;
98: do
99: {
100: umul_ppmm (prod_high, prod_low, s1_ptr[j], s2_limb);
101:
102: prod_low += cy_limb;
103: cy_limb = (prod_low < cy_limb) + prod_high;
104:
105: x = res_ptr[j];
106: prod_low = x - prod_low;
107: cy_limb += (prod_low > x);
108: res_ptr[j] = prod_low;
109: }
110: while (++j != 0);
111:
112: return cy_limb;
113: }
114:
115: main (argc, argv)
116: int argc;
117: char **argv;
118: {
119: mp_limb_t s1[SIZE];
120: mp_limb_t dx[SIZE+2];
121: mp_limb_t dy[SIZE+2];
122: mp_limb_t cyx, cyy;
123: int i;
124: long t0, t;
125: int test;
126: mp_limb_t xlimb;
127: mp_size_t size;
128:
129: for (test = 0; ; test++)
130: {
131: #ifdef RANDOM
132: size = (random () % SIZE + 1);
133: #else
134: size = SIZE;
135: #endif
136:
137: mpn_random2 (s1, size);
138: mpn_random2 (dy+1, size);
139:
140: if (random () % 0x100 == 0)
141: xlimb = 0;
142: else
143: mpn_random2 (&xlimb, 1);
144:
145: dy[size+1] = 0x12345678;
146: dy[0] = 0x87654321;
147:
148: #if defined (PRINT) || defined (XPRINT)
149: printf ("xlimb=%*lX\n", (int) (2 * sizeof(mp_limb_t)), xlimb);
150: #endif
151: #ifdef PRINT
152: mpn_print (dy+1, size);
153: mpn_print (s1, size);
154: #endif
155:
156: MPN_COPY (dx, dy, size+2);
157: t0 = cputime();
158: for (i = 0; i < TIMES; i++)
159: cyx = refmpn_submul_1 (dx+1, s1, size, xlimb);
160: t = cputime() - t0;
161: #if TIMES != 1
162: printf ("refmpn_submul_1: %5ldms (%.2f cycles/limb)\n",
163: t,
164: ((double) t * CLOCK) / (OPS * 1000.0));
165: #endif
166:
167: MPN_COPY (dx, dy, size+2);
168: t0 = cputime();
169: for (i = 0; i < TIMES; i++)
170: cyy = mpn_submul_1 (dx+1, s1, size, xlimb);
171: t = cputime() - t0;
172: #if TIMES != 1
173: printf ("mpn_submul_1: %5ldms (%.2f cycles/limb)\n",
174: t,
175: ((double) t * CLOCK) / (OPS * 1000.0));
176: #endif
177:
178: MPN_COPY (dx, dy, size+2);
179: cyx = refmpn_submul_1 (dx+1, s1, size, xlimb);
180: cyy = mpn_submul_1 (dy+1, s1, size, xlimb);
181:
182: #ifdef PRINT
183: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
184: mpn_print (dx+1, size);
185: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
186: mpn_print (dy+1, size);
187: #endif
188:
189: #ifndef NOCHECK
190: if (cyx != cyy || mpn_cmp (dx, dy, size+2) != 0
191: || dx[size+1] != 0x12345678 || dx[0] != 0x87654321)
192: {
193: #ifndef PRINT
194: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyx);
195: mpn_print (dx+1, size);
196: printf ("%*lX ", (int) (2 * sizeof(mp_limb_t)), cyy);
197: mpn_print (dy+1, size);
198: #endif
199: abort();
200: }
201: #endif
202: }
203: }
204:
205: mpn_print (mp_ptr p, mp_size_t size)
206: {
207: mp_size_t i;
208:
209: for (i = size - 1; i >= 0; i--)
210: {
211: printf ("%0*lX", (int) (2 * sizeof(mp_limb_t)), p[i]);
212: #ifdef SPACE
213: if (i != 0)
214: printf (" ");
215: #endif
216: }
217: puts ("");
218: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>