Annotation of OpenXM_contrib2/asir2000/engine/nd.c, Revision 1.86
1.86 ! noro 1: /* $OpenXM: OpenXM_contrib2/asir2000/engine/nd.c,v 1.85 2003/10/28 03:23:40 noro Exp $ */
1.2 noro 2:
1.1 noro 3: #include "ca.h"
1.74 noro 4: #include "parse.h"
5: #include "ox.h"
1.1 noro 6: #include "inline.h"
1.64 noro 7: #include <time.h>
1.1 noro 8:
9: #if defined(__GNUC__)
10: #define INLINE inline
11: #elif defined(VISUAL)
12: #define INLINE __inline
13: #else
14: #define INLINE
15: #endif
16:
1.61 noro 17: typedef unsigned int UINT;
18:
1.47 noro 19: #define USE_GEOBUCKET 1
1.65 noro 20: #define USE_UNROLL 1
1.28 noro 21:
1.1 noro 22: #define REDTAB_LEN 32003
23:
1.40 noro 24: /* GeoBucket for polynomial addition */
25:
1.1 noro 26: typedef struct oPGeoBucket {
27: int m; /* NOTE(review): presumably the index of the highest bucket in use - confirm against add_pbucket() */
28: struct oND *body[32]; /* the buckets themselves: at most 32 ND polynomials */
29: } *PGeoBucket;
30:
1.40 noro 31: /* distributed polynomial; linked list rep. */
1.1 noro 32: typedef struct oND {
33: struct oNM *body; /* first monomial of the list; _ND_alloc/MKND/FREEND also use this field as the free-list link */
34: int nv; /* filled from the first argument of MKND; presumably the number of variables - confirm */
1.31 noro 35: int len; /* filled from the len argument of MKND; presumably the number of monomials - confirm */
1.1 noro 36: int sugar; /* read and written through SG() */
37: } *ND;
38:
1.40 noro 39: /* distributed polynomial; array rep. */
1.3 noro 40: typedef struct oNDV {
41: struct oNMV *body; /* monomial array; elements are stepped over with NMV_ADV (nmv_adv bytes each) */
42: int nv; /* filled from the first argument of MKNDV; presumably the number of variables - confirm */
1.31 noro 43: int len; /* filled from the l argument of MKNDV; presumably the number of monomials - confirm */
1.3 noro 44: int sugar; /* read and written through SG() */
45: } *NDV;
46:
1.69 noro 47: typedef union oNDC {
48: int m; /* accessed through CM()/HCM(); presumably a coefficient modulo a small prime - confirm */
49: Q z; /* accessed through CQ()/HCQ() */
50: P p; /* accessed through CP()/HCP() */
51: } *NDC;
52:
1.40 noro 53: /* monomial; linked list rep. */
1.1 noro 54: typedef struct oNM {
55: struct oNM *next; /* next monomial; also the link of _nm_free_list */
1.69 noro 56: union oNDC c; /* coefficient */
1.61 noro 57: UINT dl[1]; /* packed exponent vector; _NM_alloc reserves nd_wpd words here, not 1 */
1.1 noro 58: } *NM;
59:
1.40 noro 60: /* monomial; array rep. */
1.3 noro 61: typedef struct oNMV {
1.69 noro 62: union oNDC c; /* coefficient */
1.61 noro 63: UINT dl[1]; /* packed exponent vector; declared with one word, but array elements are nmv_adv bytes apart (see NMV_ADV), so do not use sizeof(struct oNMV) as the stride */
1.3 noro 64: } *NMV;
65:
1.40 noro 66: /* history of reducer */
1.13 noro 67: typedef struct oRHist {
68: struct oRHist *next; /* next entry of the list */
69: int index; /* NOTE(review): presumably the index of the reducer in nd_ps - confirm */
1.34 noro 70: int sugar; /* read and written through SG() */
1.61 noro 71: UINT dl[1]; /* packed exponent vector; NEWRHist reserves nd_wpd words here, not 1 */
1.13 noro 72: } *RHist;
73:
1.40 noro 74: /* S-pair list */
1.1 noro 75: typedef struct oND_pairs {
76: struct oND_pairs *next; /* next pair; also the link of _ndp_free_list */
77: int i1,i2; /* NOTE(review): presumably the indices of the two basis elements forming the pair - confirm */
1.34 noro 78: int sugar; /* read and written through SG() */
1.61 noro 79: UINT lcm[1]; /* packed exponent vector accessed through LCM(); _NDP_alloc reserves nd_wpd words here, not 1 */
1.1 noro 80: } *ND_pairs;
81:
1.42 noro 82: /* index and shift count for each exponent */
83: typedef struct oEPOS {
84: int i; /* index of the word of the exponent vector that holds this exponent (see GET_EXP) */
85: int s; /* right shift that brings this exponent to the low bits of that word (see GET_EXP) */
86: } *EPOS;
87:
1.43 noro 88: typedef struct oBlockMask {
89: int n; /* number of blocks; ndl_weight_mask and ndl_block_compare loop over 0..n-1 */
90: struct order_pair *order_pair; /* per-block order description; ndl_block_compare reads order_pair[j].order */
1.61 noro 91: UINT **mask; /* mask[k][i] is ANDed with word i of an exponent vector to keep only block k */
1.43 noro 92: } *BlockMask;
93:
1.45 noro 94: typedef struct oBaseSet {
95: int len; /* NOTE(review): presumably the number of entries in ps and bound - confirm */
96: NDV *ps; /* array of polynomials in array representation */
1.61 noro 97: UINT **bound; /* NOTE(review): presumably one exponent bound vector per entry of ps, like nd_bound - confirm */
1.45 noro 98: } *BaseSet;
99:
1.63 noro 100: typedef struct oNM_ind_pair
101: {
102: NM mul; /* monomial part of the pair; set by MKNM_ind_pair */
1.76 noro 103: int index,sugar; /* both set by MKNM_ind_pair; NOTE(review): index presumably refers to an entry of nd_ps - confirm */
1.63 noro 104: } *NM_ind_pair;
105:
1.67 noro 106: typedef struct oIndArray
107: {
108: char width; /* NOTE(review): presumably selects which member of index is valid (byte/short/int entries) - confirm */
109: int head; /* NOTE(review): meaning not visible here; see nm_ind_pair_to_vect_compress() */
110: union {
111: unsigned char *c; /* index list stored as bytes */
112: unsigned short *s; /* index list stored as shorts */
113: unsigned int *i; /* index list stored as ints */
114: } index;
115: } *IndArray;
1.63 noro 116:
1.61 noro 117: int (*ndl_compare_function)(UINT *a1,UINT *a2);
1.32 noro 118:
1.74 noro 119: static int ndv_alloc;
1.69 noro 120: static int nd_f4_nsp=0x7fffffff;
1.42 noro 121: static double nd_scale=2;
1.61 noro 122: static UINT **nd_bound;
1.42 noro 123: static struct order_spec *nd_ord;
124: static EPOS nd_epos;
1.43 noro 125: static BlockMask nd_blockmask;
1.42 noro 126: static int nd_nvar;
127: static int nd_isrlex;
128: static int nd_epw,nd_bpe,nd_wpd,nd_exporigin;
1.61 noro 129: static UINT nd_mask[32];
130: static UINT nd_mask0,nd_mask1;
1.42 noro 131:
132: static NM _nm_free_list;
133: static ND _nd_free_list;
134: static ND_pairs _ndp_free_list;
1.20 noro 135:
136: static NDV *nd_ps;
1.53 noro 137: static NDV *nd_ps_trace;
1.42 noro 138: static RHist *nd_psh;
139: static int nd_psn,nd_pslen;
1.20 noro 140:
1.42 noro 141: static RHist *nd_red;
1.1 noro 142:
1.42 noro 143: static int nd_found,nd_create,nd_notfirst;
144: static int nm_adv;
145: static int nmv_adv;
146: static int nd_dcomp;
1.77 noro 147: static int nd_demand;
1.1 noro 148:
1.74 noro 149: extern struct order_spec dp_current_spec;
1.77 noro 150: extern char *Demand;
1.61 noro 151: extern VL CO;
1.77 noro 152: extern int Top,Reverse,DP_Print,dp_nelim,do_weyl,NoSugar;
1.58 noro 153: extern int *current_weyl_weight_vector;
1.1 noro 154:
1.40 noro 155: /* fundamental macros */
1.34 noro 156: #define TD(d) (d[0])
1.1 noro 157: #define HDL(d) ((d)->body->dl)
1.34 noro 158: #define HTD(d) (TD(HDL(d)))
1.14 noro 159: #define HCM(d) ((d)->body->c.m)
1.16 noro 160: #define HCQ(d) ((d)->body->c.z)
1.61 noro 161: #define HCP(d) ((d)->body->c.p)
1.14 noro 162: #define CM(a) ((a)->c.m)
1.16 noro 163: #define CQ(a) ((a)->c.z)
1.61 noro 164: #define CP(a) ((a)->c.p)
1.14 noro 165: #define DL(a) ((a)->dl)
166: #define SG(a) ((a)->sugar)
167: #define LEN(a) ((a)->len)
1.33 noro 168: #define LCM(a) ((a)->lcm)
/*
 * Access to the packed exponent of variable a in the exponent vector d/r.
 * nd_epos[a] gives the word index and the shift, nd_mask0 the field mask.
 * GET_EXP      : extract the exponent.
 * GET_EXP_MASK : same, after ANDing the word with the mask vector m.
 * PUT_EXP      : OR the value e into the field; the field is not cleared
 *                first, so it must be zero beforehand.
 * XOR_EXP      : XOR the value e into the field; with e equal to the
 *                current value this clears it (see ndl_dehomogenize).
 */
1.42 noro 169: #define GET_EXP(d,a) (((d)[nd_epos[a].i]>>nd_epos[a].s)&nd_mask0)
1.60 noro 170: #define GET_EXP_MASK(d,a,m) ((((d)[nd_epos[a].i]&(m)[nd_epos[a].i])>>nd_epos[a].s)&nd_mask0)
1.42 noro 171: #define PUT_EXP(r,a,e) ((r)[nd_epos[a].i] |= ((e)<<nd_epos[a].s))
1.45 noro 172: #define XOR_EXP(r,a,e) ((r)[nd_epos[a].i] ^= ((e)<<nd_epos[a].s))
1.1 noro 173:
1.61 noro 174: #define GET_EXP_OLD(d,a) (((d)[oepos[a].i]>>oepos[a].s)&omask0)
175: #define PUT_EXP_OLD(r,a,e) ((r)[oepos[a].i] |= ((e)<<oepos[a].s))
176:
1.40 noro 177: /* macros for term comparison */
1.34 noro 178: #define TD_DL_COMPARE(d1,d2)\
1.41 noro 179: (TD(d1)>TD(d2)?1:(TD(d1)<TD(d2)?-1:ndl_lex_compare(d1,d2)))
1.43 noro 180: #if 0
1.34 noro 181: #define DL_COMPARE(d1,d2)\
1.43 noro 182: (nd_dcomp>0?TD_DL_COMPARE(d1,d2)\
183: :(nd_dcomp==0?ndl_lex_compare(d1,d2)\
184: :(nd_blockmask?ndl_block_compare(d1,d2)\
1.45 noro 185: :(*ndl_compare_function)(d1,d2))))
1.43 noro 186: #else
187: #define DL_COMPARE(d1,d2)\
1.45 noro 188: (nd_dcomp>0?TD_DL_COMPARE(d1,d2):(*ndl_compare_function)(d1,d2))
1.43 noro 189: #endif
1.34 noro 190:
1.40 noro 191: /* allocators */
1.15 noro 192: #define NEWRHist(r) \
1.61 noro 193: ((r)=(RHist)MALLOC(sizeof(struct oRHist)+(nd_wpd-1)*sizeof(UINT)))
/*
 * Free-list allocators.  Each macro refills its free list when it is
 * empty and then pops the first cell into its argument.
 * NEWND_pairs / NEWNM pop through NEXT(); MKND pops through BDY() and
 * then stores n, len and m into the new ND.
 * CAUTION: these expand to several statements that are not wrapped in
 * do { } while (0); use them only as a full statement inside braces,
 * never as the unbraced body of an if/else/for/while.
 */
1.34 noro 194: #define NEWND_pairs(m) \
195: if(!_ndp_free_list)_NDP_alloc();\
196: (m)=_ndp_free_list; _ndp_free_list = NEXT(_ndp_free_list)
197: #define NEWNM(m)\
198: if(!_nm_free_list)_NM_alloc();\
199: (m)=_nm_free_list; _nm_free_list = NEXT(_nm_free_list)
200: #define MKND(n,m,len,d)\
201: if(!_nd_free_list)_ND_alloc();\
202: (d)=_nd_free_list; _nd_free_list = (ND)BDY(_nd_free_list);\
203: NV(d)=(n); LEN(d)=(len); BDY(d)=(m)
1.40 noro 204: #define NEWNDV(d) ((d)=(NDV)MALLOC(sizeof(struct oNDV)))
205: #define MKNDV(n,m,l,d) NEWNDV(d); NV(d)=(n); BDY(d)=(m); LEN(d) = l;
1.63 noro 206: #define NEWNM_ind_pair(p)\
207: ((p)=(NM_ind_pair)MALLOC(sizeof(struct oNM_ind_pair)))
1.1 noro 208:
1.40 noro 209: /* allocate and link a new object */
1.13 noro 210: #define NEXTRHist(r,c) \
211: if(!(r)){NEWRHist(r);(c)=(r);}else{NEWRHist(NEXT(c));(c)=NEXT(c);}
1.1 noro 212: #define NEXTNM(r,c) \
213: if(!(r)){NEWNM(r);(c)=(r);}else{NEWNM(NEXT(c));(c)=NEXT(c);}
214: #define NEXTNM2(r,c,s) \
215: if(!(r)){(c)=(r)=(s);}else{NEXT(c)=(s);(c)=(s);}
1.40 noro 216: #define NEXTND_pairs(r,c) \
217: if(!(r)){NEWND_pairs(r);(c)=(r);}else{NEWND_pairs(NEXT(c));(c)=NEXT(c);}
1.76 noro 218: #define MKNM_ind_pair(p,m,i,s) (NEWNM_ind_pair(p),(p)->mul=(m),(p)->index=(i),(p)->sugar = (s))
1.34 noro 219:
1.40 noro 220: /* deallocators */
/*
 * Push the cell m back on the matching free list (NM, ND_pairs, ND).
 * FREEND links through BDY(), the other two through NEXT().
 * CAUTION: each macro expands to two statements without do { } while (0);
 * do not use them as the unbraced body of an if/else/for/while.
 */
1.1 noro 221: #define FREENM(m) NEXT(m)=_nm_free_list; _nm_free_list=(m)
222: #define FREENDP(m) NEXT(m)=_ndp_free_list; _ndp_free_list=(m)
223: #define FREEND(m) BDY(m)=(NM)_nd_free_list; _nd_free_list=(m)
224:
1.40 noro 225: /* macro for increasing pointer to NMV */
226: #define NMV_ADV(m) (m = (NMV)(((char *)m)+nmv_adv))
1.61 noro 227: #define NMV_OADV(m) (m = (NMV)(((char *)m)+oadv))
228: #define NDV_NADV(m) (m = (NMV)(((char *)m)+newadv))
1.56 noro 229: #define NMV_PREV(m) (m = (NMV)(((char *)m)-nmv_adv))
1.61 noro 230: #define NMV_OPREV(m) (m = (NMV)(((char *)m)-oadv))
231:
1.40 noro 232: /* external functions */
1.71 noro 233: #if 1
1.40 noro 234: void GC_gcollect();
1.71 noro 235: #endif
1.40 noro 236: NODE append_one(NODE,int);
1.1 noro 237:
1.40 noro 238: /* manipulation of coefficients */
1.20 noro 239: void nd_removecont(int mod,ND p);
1.21 noro 240: void nd_removecont2(ND p1,ND p2);
1.40 noro 241: void removecont_array(Q *c,int n);
242:
243: /* GeoBucket functions */
1.25 noro 244: ND normalize_pbucket(int mod,PGeoBucket g);
245: int head_pbucket(int mod,PGeoBucket g);
1.26 noro 246: int head_pbucket_q(PGeoBucket g);
1.63 noro 247: void add_pbucket_symbolic(PGeoBucket g,ND d);
1.31 noro 248: void add_pbucket(int mod,PGeoBucket g,ND d);
1.25 noro 249: void free_pbucket(PGeoBucket b);
1.26 noro 250: void mulq_pbucket(PGeoBucket g,Q c);
1.63 noro 251: NM remove_head_pbucket_symbolic(PGeoBucket g);
1.25 noro 252: PGeoBucket create_pbucket();
1.20 noro 253:
1.40 noro 254: /* manipulation of pairs and bases */
1.39 noro 255: int nd_newps(int mod,ND a,ND aq);
1.40 noro 256: ND_pairs nd_newpairs( NODE g, int t );
1.1 noro 257: ND_pairs nd_minp( ND_pairs d, ND_pairs *prest );
1.63 noro 258: ND_pairs nd_minsugarp( ND_pairs d, ND_pairs *prest );
1.1 noro 259: NODE update_base(NODE nd,int ndp);
1.40 noro 260: ND_pairs update_pairs( ND_pairs d, NODE /* of index */ g, int t);
261: ND_pairs equivalent_pairs( ND_pairs d1, ND_pairs *prest );
262: ND_pairs crit_B( ND_pairs d, int s );
263: ND_pairs crit_M( ND_pairs d1 );
264: ND_pairs crit_F( ND_pairs d1 );
1.1 noro 265: int crit_2( int dp1, int dp2 );
1.77 noro 266: int ndv_newps(int m,NDV a,NDV aq);
1.40 noro 267:
268: /* top level functions */
1.63 noro 269: void nd_gr(LIST f,LIST v,int m,int f4,struct order_spec *ord,LIST *rp);
1.52 noro 270: void nd_gr_trace(LIST f,LIST v,int trace,int homo,struct order_spec *ord,LIST *rp);
1.63 noro 271: NODE nd_f4(int m);
1.77 noro 272: NODE nd_gb(int m,int ishomo,int checkonly);
1.82 noro 273: NODE nd_gb_trace(int m,int ishomo);
1.40 noro 274:
275: /* ndl functions */
1.61 noro 276: int ndl_weight(UINT *d);
277: void ndl_weight_mask(UINT *d);
278: void ndl_homogenize(UINT *d,UINT *r,int obpe,EPOS oepos,int weight);
279: void ndl_dehomogenize(UINT *p);
280: void ndl_reconstruct(UINT *d,UINT *r,int obpe,EPOS oepos);
281: INLINE int ndl_reducible(UINT *d1,UINT *d2);
282: INLINE int ndl_lex_compare(UINT *d1,UINT *d2);
283: INLINE int ndl_block_compare(UINT *d1,UINT *d2);
284: INLINE int ndl_equal(UINT *d1,UINT *d2);
285: INLINE void ndl_copy(UINT *d1,UINT *d2);
286: INLINE void ndl_zero(UINT *d);
287: INLINE void ndl_add(UINT *d1,UINT *d2,UINT *d);
288: INLINE void ndl_addto(UINT *d1,UINT *d2);
289: INLINE void ndl_sub(UINT *d1,UINT *d2,UINT *d);
290: INLINE int ndl_hash_value(UINT *d);
1.45 noro 291:
292: /* normal forms */
1.63 noro 293: INLINE int ndl_find_reducer(UINT *g);
1.53 noro 294: int nd_sp(int mod,int trace,ND_pairs p,ND *nf);
1.69 noro 295: int nd_nf(int mod,ND g,NDV *ps,int full,NDC dn,ND *nf);
1.53 noro 296: int nd_nf_pbucket(int mod,ND g,NDV *ps,int full,ND *nf);
1.40 noro 297:
298: /* finalizers */
1.61 noro 299: NODE ndv_reducebase(NODE x);
300: NODE ndv_reduceall(int m,NODE f);
1.40 noro 301:
302: /* allocators */
303: void nd_free_private_storage();
304: void _NM_alloc();
305: void _ND_alloc();
1.1 noro 306: void nd_free(ND p);
1.40 noro 307: void nd_free_redlist();
308:
309: /* printing */
1.61 noro 310: void ndl_print(UINT *dl);
1.1 noro 311: void nd_print(ND p);
1.16 noro 312: void nd_print_q(ND p);
1.1 noro 313: void ndp_print(ND_pairs d);
1.40 noro 314:
315:
316: /* setup, reconstruct */
317: void nd_init_ord(struct order_spec *spec);
318: ND_pairs nd_reconstruct(int mod,int trace,ND_pairs ndp);
1.61 noro 319: void ndv_setup(int mod,int trace,NODE f);
320: void nd_setup_parameters(int nvar,int max);
1.43 noro 321: BlockMask nd_create_blockmask(struct order_spec *ord);
1.57 noro 322: EPOS nd_create_epos(struct order_spec *ord);
1.48 noro 323: int nd_get_exporigin(struct order_spec *ord);
1.61 noro 324: void ndv_mod(int mod,NDV p);
325: NDV ndv_dup(int mod,NDV p);
1.63 noro 326: ND nd_dup(ND p);
1.40 noro 327:
328: /* ND functions */
1.61 noro 329: int ndv_check_candidate(NODE input,int obpe,int oadv,EPOS oepos,NODE cand);
1.40 noro 330: void nd_mul_c(int mod,ND p,int mul);
331: void nd_mul_c_q(ND p,Q mul);
1.61 noro 332: void nd_mul_c_p(VL vl,ND p,P mul);
1.40 noro 333: ND nd_remove_head(ND p);
1.69 noro 334: ND nd_separate_head(ND p,ND *head);
1.1 noro 335: int nd_length(ND p);
1.61 noro 336: void nd_append_red(UINT *d,int i);
337: UINT *ndv_compute_bound(NDV p);
1.6 noro 338: ND nd_copy(ND p);
1.63 noro 339: ND nd_merge(ND p1,ND p2);
1.40 noro 340: ND nd_add(int mod,ND p1,ND p2);
341: ND nd_add_q(ND p1,ND p2);
1.71 noro 342: ND nd_add_sf(ND p1,ND p2);
1.41 noro 343: INLINE int nd_length(ND p);
1.74 noro 344: NODE nd_f4_red(int m,ND_pairs sp0,UINT *s0vect,int col,NODE rp0);
345: NODE nd_f4_red_dist(int m,ND_pairs sp0,UINT *s0vect,int col,NODE rp0);
1.4 noro 346:
1.40 noro 347: /* NDV functions */
1.55 noro 348: ND weyl_ndv_mul_nm(int mod,NM m0,NDV p);
349: void weyl_mul_nm_nmv(int n,int mod,NM m0,NMV m1,NM *tab,int tlen);
1.19 noro 350: void ndv_mul_c(int mod,NDV p,int mul);
1.40 noro 351: void ndv_mul_c_q(NDV p,Q mul);
1.63 noro 352: ND ndv_mul_nm_symbolic(NM m0,NDV p);
1.61 noro 353: ND ndv_mul_nm(int mod,NM m0,NDV p);
1.43 noro 354: void ndv_realloc(NDV p,int obpe,int oadv,EPOS oepos);
1.61 noro 355: NDV ndv_dup_realloc(NDV p,int obpe,int oadv,EPOS oepos);
356: void ndv_homogenize(NDV p,int obpe,int oadv,EPOS eops);
1.45 noro 357: void ndv_dehomogenize(NDV p,struct order_spec *spec);
1.40 noro 358: void ndv_removecont(int mod,NDV p);
359: void ndv_print(NDV p);
360: void ndv_print_q(NDV p);
361: void ndv_free(NDV p);
1.77 noro 362: void ndv_save(NDV p,int index);
363: NDV ndv_load(int index);
1.40 noro 364:
365: /* converters */
1.61 noro 366: ND ptond(VL vl,VL dvl,P p);
367: NDV ptondv(VL vl,VL dvl,P p);
368: P ndvtop(int mod,VL vl,VL dvl,NDV p);
1.16 noro 369: NDV ndtondv(int mod,ND p);
1.23 noro 370: ND ndvtond(int mod,NDV p);
1.63 noro 371: int nm_ind_pair_to_vect(int m,UINT *s0,int n,NM_ind_pair pair,UINT *r);
1.67 noro 372: IndArray nm_ind_pair_to_vect_compress(int m,UINT *s0,int n,NM_ind_pair pair);
1.63 noro 373: int nd_to_vect(int mod,UINT *s0,int n,ND d,UINT *r);
1.1 noro 374:
1.76 noro 375: /* elimination */
376: int nd_gauss_elim_mod(int **mat0,int *sugar,int row,int col,int md,int *colstat);
377: int nd_gauss_elim_sf(int **mat0,int *sugar,int row,int col,int md,int *colstat);
378:
1.1 noro 379: void nd_free_private_storage()
380: {
381: _nm_free_list = 0;
1.5 noro 382: _ndp_free_list = 0;
1.71 noro 383: #if 0
1.1 noro 384: GC_gcollect();
1.71 noro 385: #endif
1.1 noro 386: }
387:
388: void _NM_alloc()
389: {
390: NM p;
391: int i;
392:
1.11 noro 393: for ( i = 0; i < 1024; i++ ) {
1.61 noro 394: p = (NM)GC_malloc(sizeof(struct oNM)+(nd_wpd-1)*sizeof(UINT));
1.1 noro 395: p->next = _nm_free_list; _nm_free_list = p;
396: }
397: }
398:
399: void _ND_alloc()
400: {
401: ND p;
402: int i;
403:
404: for ( i = 0; i < 1024; i++ ) {
405: p = (ND)GC_malloc(sizeof(struct oND));
406: p->body = (NM)_nd_free_list; _nd_free_list = p;
407: }
408: }
409:
410: void _NDP_alloc()
411: {
412: ND_pairs p;
413: int i;
414:
1.11 noro 415: for ( i = 0; i < 1024; i++ ) {
1.1 noro 416: p = (ND_pairs)GC_malloc(sizeof(struct oND_pairs)
1.61 noro 417: +(nd_wpd-1)*sizeof(UINT));
1.1 noro 418: p->next = _ndp_free_list; _ndp_free_list = p;
419: }
420: }
421:
1.30 noro 422: INLINE int nd_length(ND p)
1.1 noro 423: {
424: NM m;
425: int i;
426:
427: if ( !p )
428: return 0;
429: else {
430: for ( i = 0, m = BDY(p); m; m = NEXT(m), i++ );
431: return i;
432: }
433: }
434:
1.61 noro 435: INLINE int ndl_reducible(UINT *d1,UINT *d2)
1.1 noro 436: {
1.61 noro 437: UINT u1,u2;
1.1 noro 438: int i,j;
439:
1.34 noro 440: if ( TD(d1) < TD(d2) ) return 0;
1.65 noro 441: #if USE_UNROLL
1.1 noro 442: switch ( nd_bpe ) {
1.62 noro 443: case 3:
444: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
445: u1 = d1[i]; u2 = d2[i];
446: if ( (u1&0x38000000) < (u2&0x38000000) ) return 0;
447: if ( (u1& 0x7000000) < (u2& 0x7000000) ) return 0;
448: if ( (u1& 0xe00000) < (u2& 0xe00000) ) return 0;
449: if ( (u1& 0x1c0000) < (u2& 0x1c0000) ) return 0;
450: if ( (u1& 0x38000) < (u2& 0x38000) ) return 0;
451: if ( (u1& 0x7000) < (u2& 0x7000) ) return 0;
452: if ( (u1& 0xe00) < (u2& 0xe00) ) return 0;
453: if ( (u1& 0x1c0) < (u2& 0x1c0) ) return 0;
454: if ( (u1& 0x38) < (u2& 0x38) ) return 0;
455: if ( (u1& 0x7) < (u2& 0x7) ) return 0;
456: }
457: return 1;
458: break;
1.1 noro 459: case 4:
1.41 noro 460: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 461: u1 = d1[i]; u2 = d2[i];
462: if ( (u1&0xf0000000) < (u2&0xf0000000) ) return 0;
1.62 noro 463: if ( (u1& 0xf000000) < (u2& 0xf000000) ) return 0;
464: if ( (u1& 0xf00000) < (u2& 0xf00000) ) return 0;
465: if ( (u1& 0xf0000) < (u2& 0xf0000) ) return 0;
466: if ( (u1& 0xf000) < (u2& 0xf000) ) return 0;
467: if ( (u1& 0xf00) < (u2& 0xf00) ) return 0;
468: if ( (u1& 0xf0) < (u2& 0xf0) ) return 0;
469: if ( (u1& 0xf) < (u2& 0xf) ) return 0;
1.1 noro 470: }
471: return 1;
472: break;
473: case 6:
1.41 noro 474: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 475: u1 = d1[i]; u2 = d2[i];
476: if ( (u1&0x3f000000) < (u2&0x3f000000) ) return 0;
1.62 noro 477: if ( (u1& 0xfc0000) < (u2& 0xfc0000) ) return 0;
478: if ( (u1& 0x3f000) < (u2& 0x3f000) ) return 0;
479: if ( (u1& 0xfc0) < (u2& 0xfc0) ) return 0;
480: if ( (u1& 0x3f) < (u2& 0x3f) ) return 0;
1.1 noro 481: }
482: return 1;
483: break;
484: case 8:
1.41 noro 485: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 486: u1 = d1[i]; u2 = d2[i];
487: if ( (u1&0xff000000) < (u2&0xff000000) ) return 0;
1.62 noro 488: if ( (u1& 0xff0000) < (u2& 0xff0000) ) return 0;
489: if ( (u1& 0xff00) < (u2& 0xff00) ) return 0;
490: if ( (u1& 0xff) < (u2& 0xff) ) return 0;
1.1 noro 491: }
492: return 1;
493: break;
494: case 16:
1.41 noro 495: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 496: u1 = d1[i]; u2 = d2[i];
497: if ( (u1&0xffff0000) < (u2&0xffff0000) ) return 0;
1.62 noro 498: if ( (u1& 0xffff) < (u2& 0xffff) ) return 0;
1.1 noro 499: }
500: return 1;
501: break;
502: case 32:
1.41 noro 503: for ( i = nd_exporigin; i < nd_wpd; i++ )
1.1 noro 504: if ( d1[i] < d2[i] ) return 0;
505: return 1;
506: break;
507: default:
1.41 noro 508: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 509: u1 = d1[i]; u2 = d2[i];
510: for ( j = 0; j < nd_epw; j++ )
511: if ( (u1&nd_mask[j]) < (u2&nd_mask[j]) ) return 0;
512: }
513: return 1;
514: }
1.65 noro 515: #else
516: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
517: u1 = d1[i]; u2 = d2[i];
518: for ( j = 0; j < nd_epw; j++ )
519: if ( (u1&nd_mask[j]) < (u2&nd_mask[j]) ) return 0;
520: }
521: return 1;
522: #endif
1.1 noro 523: }
524:
1.61 noro 525: /*
526: * If the current order is a block order,
527: * then the last block is length 1 and contains
528: * the homo variable. Otherwise, the original
529: * order is either 0 or 2.
530: */
531:
532: void ndl_homogenize(UINT *d,UINT *r,int obpe,EPOS oepos,int weight)
1.23 noro 533: {
1.61 noro 534: int w,i,e,n,omask0;
535:
536: omask0 = (1<<obpe)-1;
537: n = nd_nvar-1;
538: ndl_zero(r);
539: for ( i = 0; i < n; i++ ) {
540: e = GET_EXP_OLD(d,i);
541: PUT_EXP(r,i,e);
542: }
543: w = TD(d);
544: PUT_EXP(r,nd_nvar-1,weight-w);
545: TD(r) = weight;
546: if ( nd_blockmask ) ndl_weight_mask(r);
547: }
548:
549: void ndl_dehomogenize(UINT *d)
550: {
551: UINT mask;
552: UINT h;
1.31 noro 553: int i,bits;
1.23 noro 554:
1.44 noro 555: if ( nd_blockmask ) {
556: h = GET_EXP(d,nd_nvar-1);
1.45 noro 557: XOR_EXP(d,nd_nvar-1,h);
1.44 noro 558: TD(d) -= h;
559: d[nd_exporigin-1] -= h;
560: } else {
561: if ( nd_isrlex ) {
562: if ( nd_bpe == 32 ) {
563: h = d[nd_exporigin];
564: for ( i = nd_exporigin+1; i < nd_wpd; i++ )
565: d[i-1] = d[i];
566: d[i-1] = 0;
567: TD(d) -= h;
568: } else {
569: bits = nd_epw*nd_bpe;
570: mask = bits==32?0xffffffff:((1<<(nd_epw*nd_bpe))-1);
571: h = (d[nd_exporigin]>>((nd_epw-1)*nd_bpe))&nd_mask0;
572: for ( i = nd_exporigin; i < nd_wpd; i++ )
573: d[i] = ((d[i]<<nd_bpe)&mask)
574: |(i+1<nd_wpd?((d[i+1]>>((nd_epw-1)*nd_bpe))&nd_mask0):0);
575: TD(d) -= h;
576: }
1.45 noro 577: } else {
578: h = GET_EXP(d,nd_nvar-1);
579: XOR_EXP(d,nd_nvar-1,h);
580: TD(d) -= h;
581: }
1.44 noro 582: }
1.23 noro 583: }
584:
1.61 noro 585: void ndl_lcm(UINT *d1,unsigned *d2,UINT *d)
1.1 noro 586: {
1.61 noro 587: UINT t1,t2,u,u1,u2;
1.43 noro 588: int i,j,l;
1.1 noro 589:
1.65 noro 590: #if USE_UNROLL
1.1 noro 591: switch ( nd_bpe ) {
1.62 noro 592: case 3:
593: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
594: u1 = d1[i]; u2 = d2[i];
595: t1 = (u1&0x38000000); t2 = (u2&0x38000000); u = t1>t2?t1:t2;
596: t1 = (u1& 0x7000000); t2 = (u2& 0x7000000); u |= t1>t2?t1:t2;
597: t1 = (u1& 0xe00000); t2 = (u2& 0xe00000); u |= t1>t2?t1:t2;
598: t1 = (u1& 0x1c0000); t2 = (u2& 0x1c0000); u |= t1>t2?t1:t2;
599: t1 = (u1& 0x38000); t2 = (u2& 0x38000); u |= t1>t2?t1:t2;
600: t1 = (u1& 0x7000); t2 = (u2& 0x7000); u |= t1>t2?t1:t2;
601: t1 = (u1& 0xe00); t2 = (u2& 0xe00); u |= t1>t2?t1:t2;
602: t1 = (u1& 0x1c0); t2 = (u2& 0x1c0); u |= t1>t2?t1:t2;
603: t1 = (u1& 0x38); t2 = (u2& 0x38); u |= t1>t2?t1:t2;
604: t1 = (u1& 0x7); t2 = (u2& 0x7); u |= t1>t2?t1:t2;
605: d[i] = u;
606: }
607: break;
1.1 noro 608: case 4:
1.41 noro 609: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 610: u1 = d1[i]; u2 = d2[i];
611: t1 = (u1&0xf0000000); t2 = (u2&0xf0000000); u = t1>t2?t1:t2;
1.62 noro 612: t1 = (u1& 0xf000000); t2 = (u2& 0xf000000); u |= t1>t2?t1:t2;
613: t1 = (u1& 0xf00000); t2 = (u2& 0xf00000); u |= t1>t2?t1:t2;
614: t1 = (u1& 0xf0000); t2 = (u2& 0xf0000); u |= t1>t2?t1:t2;
615: t1 = (u1& 0xf000); t2 = (u2& 0xf000); u |= t1>t2?t1:t2;
616: t1 = (u1& 0xf00); t2 = (u2& 0xf00); u |= t1>t2?t1:t2;
617: t1 = (u1& 0xf0); t2 = (u2& 0xf0); u |= t1>t2?t1:t2;
618: t1 = (u1& 0xf); t2 = (u2& 0xf); u |= t1>t2?t1:t2;
1.1 noro 619: d[i] = u;
620: }
621: break;
622: case 6:
1.41 noro 623: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 624: u1 = d1[i]; u2 = d2[i];
625: t1 = (u1&0x3f000000); t2 = (u2&0x3f000000); u = t1>t2?t1:t2;
1.62 noro 626: t1 = (u1& 0xfc0000); t2 = (u2& 0xfc0000); u |= t1>t2?t1:t2;
627: t1 = (u1& 0x3f000); t2 = (u2& 0x3f000); u |= t1>t2?t1:t2;
628: t1 = (u1& 0xfc0); t2 = (u2& 0xfc0); u |= t1>t2?t1:t2;
629: t1 = (u1& 0x3f); t2 = (u2& 0x3f); u |= t1>t2?t1:t2;
1.1 noro 630: d[i] = u;
631: }
632: break;
633: case 8:
1.41 noro 634: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 635: u1 = d1[i]; u2 = d2[i];
636: t1 = (u1&0xff000000); t2 = (u2&0xff000000); u = t1>t2?t1:t2;
1.62 noro 637: t1 = (u1& 0xff0000); t2 = (u2& 0xff0000); u |= t1>t2?t1:t2;
638: t1 = (u1& 0xff00); t2 = (u2& 0xff00); u |= t1>t2?t1:t2;
639: t1 = (u1& 0xff); t2 = (u2& 0xff); u |= t1>t2?t1:t2;
1.1 noro 640: d[i] = u;
641: }
642: break;
643: case 16:
1.41 noro 644: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 645: u1 = d1[i]; u2 = d2[i];
646: t1 = (u1&0xffff0000); t2 = (u2&0xffff0000); u = t1>t2?t1:t2;
1.62 noro 647: t1 = (u1& 0xffff); t2 = (u2& 0xffff); u |= t1>t2?t1:t2;
1.1 noro 648: d[i] = u;
649: }
650: break;
651: case 32:
1.41 noro 652: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 653: u1 = d1[i]; u2 = d2[i];
654: d[i] = u1>u2?u1:u2;
655: }
656: break;
657: default:
1.41 noro 658: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 659: u1 = d1[i]; u2 = d2[i];
660: for ( j = 0, u = 0; j < nd_epw; j++ ) {
661: t1 = (u1&nd_mask[j]); t2 = (u2&nd_mask[j]); u |= t1>t2?t1:t2;
662: }
663: d[i] = u;
664: }
665: break;
666: }
1.65 noro 667: #else
668: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
669: u1 = d1[i]; u2 = d2[i];
670: for ( j = 0, u = 0; j < nd_epw; j++ ) {
671: t1 = (u1&nd_mask[j]); t2 = (u2&nd_mask[j]); u |= t1>t2?t1:t2;
672: }
673: d[i] = u;
674: }
675: #endif
1.39 noro 676: TD(d) = ndl_weight(d);
1.61 noro 677: if ( nd_blockmask ) ndl_weight_mask(d);
1.57 noro 678: }
679:
1.61 noro 680: int ndl_weight(UINT *d)
1.1 noro 681: {
1.61 noro 682: UINT t,u;
1.1 noro 683: int i,j;
684:
1.60 noro 685: if ( current_dl_weight_vector )
686: for ( i = 0, t = 0; i < nd_nvar; i++ ) {
687: u = GET_EXP(d,i);
688: t += MUL_WEIGHT(u,i);
689: }
690: else
691: for ( t = 0, i = nd_exporigin; i < nd_wpd; i++ ) {
692: u = d[i];
693: for ( j = 0; j < nd_epw; j++, u>>=nd_bpe )
694: t += (u&nd_mask0);
695: }
1.1 noro 696: return t;
697: }
698:
1.61 noro 699: void ndl_weight_mask(UINT *d)
1.43 noro 700: {
1.61 noro 701: UINT t,u;
702: UINT *mask;
703: int i,j,k,l;
1.43 noro 704:
1.61 noro 705: l = nd_blockmask->n;
706: for ( k = 0; k < l; k++ ) {
707: mask = nd_blockmask->mask[k];
708: if ( current_dl_weight_vector )
709: for ( i = 0, t = 0; i < nd_nvar; i++ ) {
710: u = GET_EXP_MASK(d,i,mask);
711: t += MUL_WEIGHT(u,i);
712: }
713: else
714: for ( t = 0, i = nd_exporigin; i < nd_wpd; i++ ) {
715: u = d[i]&mask[i];
716: for ( j = 0; j < nd_epw; j++, u>>=nd_bpe )
717: t += (u&nd_mask0);
718: }
719: d[k+1] = t;
720: }
1.43 noro 721: }
722:
1.61 noro 723: int ndl_lex_compare(UINT *d1,UINT *d2)
1.1 noro 724: {
725: int i;
726:
1.41 noro 727: d1 += nd_exporigin;
728: d2 += nd_exporigin;
729: for ( i = nd_exporigin; i < nd_wpd; i++, d1++, d2++ )
1.1 noro 730: if ( *d1 > *d2 )
1.32 noro 731: return nd_isrlex ? -1 : 1;
1.1 noro 732: else if ( *d1 < *d2 )
1.32 noro 733: return nd_isrlex ? 1 : -1;
1.1 noro 734: return 0;
735: }
736:
1.61 noro 737: int ndl_block_compare(UINT *d1,UINT *d2)
1.43 noro 738: {
739: int i,l,j,ord_o,ord_l;
740: struct order_pair *op;
1.61 noro 741: UINT t1,t2,m;
742: UINT *mask;
1.43 noro 743:
744: l = nd_blockmask->n;
745: op = nd_blockmask->order_pair;
746: for ( j = 0; j < l; j++ ) {
747: mask = nd_blockmask->mask[j];
748: ord_o = op[j].order;
749: if ( ord_o < 2 )
1.44 noro 750: if ( (t1=d1[j+1]) > (t2=d2[j+1]) ) return 1;
751: else if ( t1 < t2 ) return -1;
1.43 noro 752: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.44 noro 753: m = mask[i];
754: t1 = d1[i]&m;
755: t2 = d2[i]&m;
1.43 noro 756: if ( t1 > t2 )
757: return !ord_o ? -1 : 1;
758: else if ( t1 < t2 )
759: return !ord_o ? 1 : -1;
760: }
761: }
762: return 0;
763: }
764:
1.58 noro 765: /* TDH -> WW -> TD-> RL */
766:
1.61 noro 767: int ndl_ww_lex_compare(UINT *d1,UINT *d2)
1.58 noro 768: {
769: int i,m,e1,e2;
770:
771: if ( TD(d1) > TD(d2) ) return 1;
772: else if ( TD(d1) < TD(d2) ) return -1;
773: m = nd_nvar>>1;
774: for ( i = 0, e1 = e2 = 0; i < m; i++ ) {
775: e1 += current_weyl_weight_vector[i]*(GET_EXP(d1,m+i)-GET_EXP(d1,i));
776: e2 += current_weyl_weight_vector[i]*(GET_EXP(d2,m+i)-GET_EXP(d2,i));
777: }
778: if ( e1 > e2 ) return 1;
779: else if ( e1 < e2 ) return -1;
780: return ndl_lex_compare(d1,d2);
781: }
782:
1.61 noro 783: INLINE int ndl_equal(UINT *d1,UINT *d2)
1.1 noro 784: {
785: int i;
786:
1.81 noro 787: switch ( nd_wpd ) {
788: case 2:
789: if ( TD(d2) != TD(d1) ) return 0;
790: if ( d2[1] != d1[1] ) return 0;
791: return 1;
792: break;
793: case 3:
794: if ( TD(d2) != TD(d1) ) return 0;
795: if ( d2[1] != d1[1] ) return 0;
796: if ( d2[2] != d1[2] ) return 0;
797: return 1;
798: break;
799: default:
800: for ( i = 0; i < nd_wpd; i++ )
801: if ( *d1++ != *d2++ ) return 0;
802: return 1;
803: break;
804: }
1.1 noro 805: }
806:
1.61 noro 807: INLINE void ndl_copy(UINT *d1,UINT *d2)
1.6 noro 808: {
809: int i;
810:
811: switch ( nd_wpd ) {
1.41 noro 812: case 2:
1.34 noro 813: TD(d2) = TD(d1);
814: d2[1] = d1[1];
1.6 noro 815: break;
1.41 noro 816: case 3:
1.34 noro 817: TD(d2) = TD(d1);
1.6 noro 818: d2[1] = d1[1];
1.34 noro 819: d2[2] = d1[2];
1.6 noro 820: break;
821: default:
1.41 noro 822: for ( i = 0; i < nd_wpd; i++ )
1.6 noro 823: d2[i] = d1[i];
824: break;
825: }
826: }
827:
1.61 noro 828: INLINE void ndl_zero(UINT *d)
829: {
830: int i;
831: for ( i = 0; i < nd_wpd; i++ ) d[i] = 0;
832: }
833:
834: INLINE void ndl_add(UINT *d1,UINT *d2,UINT *d)
1.1 noro 835: {
836: int i;
837:
1.43 noro 838: #if 1
1.6 noro 839: switch ( nd_wpd ) {
1.41 noro 840: case 2:
841: TD(d) = TD(d1)+TD(d2);
1.34 noro 842: d[1] = d1[1]+d2[1];
1.6 noro 843: break;
1.41 noro 844: case 3:
845: TD(d) = TD(d1)+TD(d2);
1.6 noro 846: d[1] = d1[1]+d2[1];
1.34 noro 847: d[2] = d1[2]+d2[2];
1.6 noro 848: break;
849: default:
1.43 noro 850: for ( i = 0; i < nd_wpd; i++ ) d[i] = d1[i]+d2[i];
1.6 noro 851: break;
852: }
1.43 noro 853: #else
854: for ( i = 0; i < nd_wpd; i++ ) d[i] = d1[i]+d2[i];
855: #endif
1.6 noro 856: }
857:
1.55 noro 858: /* d1 += d2 */
1.61 noro 859: INLINE void ndl_addto(UINT *d1,UINT *d2)
1.55 noro 860: {
861: int i;
862:
863: #if 1
864: switch ( nd_wpd ) {
865: case 2:
866: TD(d1) += TD(d2);
867: d1[1] += d2[1];
868: break;
869: case 3:
870: TD(d1) += TD(d2);
871: d1[1] += d2[1];
872: d1[2] += d2[2];
873: break;
874: default:
875: for ( i = 0; i < nd_wpd; i++ ) d1[i] += d2[i];
876: break;
877: }
878: #else
879: for ( i = 0; i < nd_wpd; i++ ) d1[i] += d2[i];
880: #endif
881: }
882:
1.61 noro 883: INLINE void ndl_sub(UINT *d1,UINT *d2,UINT *d)
1.6 noro 884: {
885: int i;
886:
1.43 noro 887: for ( i = 0; i < nd_wpd; i++ ) d[i] = d1[i]-d2[i];
1.1 noro 888: }
889:
1.61 noro 890: int ndl_disjoint(UINT *d1,UINT *d2)
1.1 noro 891: {
1.61 noro 892: UINT t1,t2,u,u1,u2;
1.1 noro 893: int i,j;
894:
1.65 noro 895: #if USE_UNROLL
1.1 noro 896: switch ( nd_bpe ) {
1.62 noro 897: case 3:
898: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
899: u1 = d1[i]; u2 = d2[i];
900: t1 = u1&0x38000000; t2 = u2&0x38000000; if ( t1&&t2 ) return 0;
901: t1 = u1& 0x7000000; t2 = u2& 0x7000000; if ( t1&&t2 ) return 0;
902: t1 = u1& 0xe00000; t2 = u2& 0xe00000; if ( t1&&t2 ) return 0;
903: t1 = u1& 0x1c0000; t2 = u2& 0x1c0000; if ( t1&&t2 ) return 0;
904: t1 = u1& 0x38000; t2 = u2& 0x38000; if ( t1&&t2 ) return 0;
905: t1 = u1& 0x7000; t2 = u2& 0x7000; if ( t1&&t2 ) return 0;
906: t1 = u1& 0xe00; t2 = u2& 0xe00; if ( t1&&t2 ) return 0;
907: t1 = u1& 0x1c0; t2 = u2& 0x1c0; if ( t1&&t2 ) return 0;
908: t1 = u1& 0x38; t2 = u2& 0x38; if ( t1&&t2 ) return 0;
909: t1 = u1& 0x7; t2 = u2& 0x7; if ( t1&&t2 ) return 0;
910: }
911: return 1;
912: break;
1.1 noro 913: case 4:
1.41 noro 914: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 915: u1 = d1[i]; u2 = d2[i];
916: t1 = u1&0xf0000000; t2 = u2&0xf0000000; if ( t1&&t2 ) return 0;
1.62 noro 917: t1 = u1& 0xf000000; t2 = u2& 0xf000000; if ( t1&&t2 ) return 0;
918: t1 = u1& 0xf00000; t2 = u2& 0xf00000; if ( t1&&t2 ) return 0;
919: t1 = u1& 0xf0000; t2 = u2& 0xf0000; if ( t1&&t2 ) return 0;
920: t1 = u1& 0xf000; t2 = u2& 0xf000; if ( t1&&t2 ) return 0;
921: t1 = u1& 0xf00; t2 = u2& 0xf00; if ( t1&&t2 ) return 0;
922: t1 = u1& 0xf0; t2 = u2& 0xf0; if ( t1&&t2 ) return 0;
923: t1 = u1& 0xf; t2 = u2& 0xf; if ( t1&&t2 ) return 0;
1.1 noro 924: }
925: return 1;
926: break;
927: case 6:
1.41 noro 928: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 929: u1 = d1[i]; u2 = d2[i];
930: t1 = u1&0x3f000000; t2 = u2&0x3f000000; if ( t1&&t2 ) return 0;
1.62 noro 931: t1 = u1& 0xfc0000; t2 = u2& 0xfc0000; if ( t1&&t2 ) return 0;
932: t1 = u1& 0x3f000; t2 = u2& 0x3f000; if ( t1&&t2 ) return 0;
933: t1 = u1& 0xfc0; t2 = u2& 0xfc0; if ( t1&&t2 ) return 0;
934: t1 = u1& 0x3f; t2 = u2& 0x3f; if ( t1&&t2 ) return 0;
1.1 noro 935: }
936: return 1;
937: break;
938: case 8:
1.41 noro 939: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 940: u1 = d1[i]; u2 = d2[i];
941: t1 = u1&0xff000000; t2 = u2&0xff000000; if ( t1&&t2 ) return 0;
1.62 noro 942: t1 = u1& 0xff0000; t2 = u2& 0xff0000; if ( t1&&t2 ) return 0;
943: t1 = u1& 0xff00; t2 = u2& 0xff00; if ( t1&&t2 ) return 0;
944: t1 = u1& 0xff; t2 = u2& 0xff; if ( t1&&t2 ) return 0;
1.1 noro 945: }
946: return 1;
947: break;
948: case 16:
1.41 noro 949: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 950: u1 = d1[i]; u2 = d2[i];
951: t1 = u1&0xffff0000; t2 = u2&0xffff0000; if ( t1&&t2 ) return 0;
1.62 noro 952: t1 = u1& 0xffff; t2 = u2& 0xffff; if ( t1&&t2 ) return 0;
1.1 noro 953: }
954: return 1;
955: break;
956: case 32:
1.41 noro 957: for ( i = nd_exporigin; i < nd_wpd; i++ )
1.1 noro 958: if ( d1[i] && d2[i] ) return 0;
959: return 1;
960: break;
961: default:
1.41 noro 962: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.1 noro 963: u1 = d1[i]; u2 = d2[i];
964: for ( j = 0; j < nd_epw; j++ ) {
965: if ( (u1&nd_mask0) && (u2&nd_mask0) ) return 0;
966: u1 >>= nd_bpe; u2 >>= nd_bpe;
967: }
968: }
969: return 1;
970: break;
971: }
1.65 noro 972: #else
973: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
974: u1 = d1[i]; u2 = d2[i];
975: for ( j = 0; j < nd_epw; j++ ) {
976: if ( (u1&nd_mask0) && (u2&nd_mask0) ) return 0;
977: u1 >>= nd_bpe; u2 >>= nd_bpe;
978: }
979: }
980: return 1;
981: #endif
1.1 noro 982: }
983:
1.61 noro 984: int ndl_check_bound2(int index,UINT *d2)
1.1 noro 985: {
1.61 noro 986: UINT u2;
987: UINT *d1;
1.5 noro 988: int i,j,ind,k;
1.1 noro 989:
1.5 noro 990: d1 = nd_bound[index];
991: ind = 0;
1.65 noro 992: #if USE_UNROLL
1.5 noro 993: switch ( nd_bpe ) {
1.62 noro 994: case 3:
995: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
996: u2 = d2[i];
997: if ( d1[ind++]+((u2>>27)&0x7) >= 0x8 ) return 1;
998: if ( d1[ind++]+((u2>>24)&0x7) >= 0x8 ) return 1;
999: if ( d1[ind++]+((u2>>21)&0x7) >= 0x8 ) return 1;
1000: if ( d1[ind++]+((u2>>18)&0x7) >= 0x8 ) return 1;
1001: if ( d1[ind++]+((u2>>15)&0x7) >= 0x8 ) return 1;
1002: if ( d1[ind++]+((u2>>12)&0x7) >= 0x8 ) return 1;
1003: if ( d1[ind++]+((u2>>9)&0x7) >= 0x8 ) return 1;
1004: if ( d1[ind++]+((u2>>6)&0x7) >= 0x8 ) return 1;
1005: if ( d1[ind++]+((u2>>3)&0x7) >= 0x8 ) return 1;
1006: if ( d1[ind++]+(u2&0x7) >= 0x8 ) return 1;
1007: }
1008: return 0;
1009: break;
1.5 noro 1010: case 4:
1.41 noro 1011: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.5 noro 1012: u2 = d2[i];
1013: if ( d1[ind++]+((u2>>28)&0xf) >= 0x10 ) return 1;
1014: if ( d1[ind++]+((u2>>24)&0xf) >= 0x10 ) return 1;
1015: if ( d1[ind++]+((u2>>20)&0xf) >= 0x10 ) return 1;
1016: if ( d1[ind++]+((u2>>16)&0xf) >= 0x10 ) return 1;
1017: if ( d1[ind++]+((u2>>12)&0xf) >= 0x10 ) return 1;
1018: if ( d1[ind++]+((u2>>8)&0xf) >= 0x10 ) return 1;
1019: if ( d1[ind++]+((u2>>4)&0xf) >= 0x10 ) return 1;
1020: if ( d1[ind++]+(u2&0xf) >= 0x10 ) return 1;
1021: }
1022: return 0;
1023: break;
1024: case 6:
1.41 noro 1025: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.5 noro 1026: u2 = d2[i];
1027: if ( d1[ind++]+((u2>>24)&0x3f) >= 0x40 ) return 1;
1028: if ( d1[ind++]+((u2>>18)&0x3f) >= 0x40 ) return 1;
1029: if ( d1[ind++]+((u2>>12)&0x3f) >= 0x40 ) return 1;
1030: if ( d1[ind++]+((u2>>6)&0x3f) >= 0x40 ) return 1;
1031: if ( d1[ind++]+(u2&0x3f) >= 0x40 ) return 1;
1032: }
1033: return 0;
1034: break;
1035: case 8:
1.41 noro 1036: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.5 noro 1037: u2 = d2[i];
1038: if ( d1[ind++]+((u2>>24)&0xff) >= 0x100 ) return 1;
1039: if ( d1[ind++]+((u2>>16)&0xff) >= 0x100 ) return 1;
1040: if ( d1[ind++]+((u2>>8)&0xff) >= 0x100 ) return 1;
1041: if ( d1[ind++]+(u2&0xff) >= 0x100 ) return 1;
1042: }
1043: return 0;
1044: break;
1045: case 16:
1.41 noro 1046: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.5 noro 1047: u2 = d2[i];
1048: if ( d1[ind++]+((u2>>16)&0xffff) > 0x10000 ) return 1;
1049: if ( d1[ind++]+(u2&0xffff) > 0x10000 ) return 1;
1050: }
1051: return 0;
1052: break;
1053: case 32:
1.41 noro 1054: for ( i = nd_exporigin; i < nd_wpd; i++ )
1.5 noro 1055: if ( d1[i]+d2[i]<d1[i] ) return 1;
1056: return 0;
1057: break;
1058: default:
1.41 noro 1059: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1.5 noro 1060: u2 = d2[i];
1061: k = (nd_epw-1)*nd_bpe;
1062: for ( j = 0; j < nd_epw; j++, k -= nd_bpe )
1063: if ( d1[ind++]+((u2>>k)&nd_mask0) > nd_mask0 ) return 1;
1064: }
1065: return 0;
1066: break;
1067: }
1.65 noro 1068: #else
1069: for ( i = nd_exporigin; i < nd_wpd; i++ ) {
1070: u2 = d2[i];
1071: k = (nd_epw-1)*nd_bpe;
1072: for ( j = 0; j < nd_epw; j++, k -= nd_bpe )
1073: if ( d1[ind++]+((u2>>k)&nd_mask0) > nd_mask0 ) return 1;
1074: }
1075: return 0;
1076: #endif
1.1 noro 1077: }
1078:
1.61 noro 1079: INLINE int ndl_hash_value(UINT *d)
1.1 noro 1080: {
1081: int i;
1082: int r;
1083:
1.34 noro 1084: r = 0;
1.41 noro 1085: for ( i = 0; i < nd_wpd; i++ )
1.1 noro 1086: r = ((r<<16)+d[i])%REDTAB_LEN;
1087: return r;
1088: }
1089:
1.63 noro 1090: INLINE int ndl_find_reducer(UINT *dg)
1.1 noro 1091: {
1.13 noro 1092: RHist r;
1.6 noro 1093: int d,k,i;
1.1 noro 1094:
1.63 noro 1095: d = ndl_hash_value(dg);
1.13 noro 1096: for ( r = nd_red[d], k = 0; r; r = NEXT(r), k++ ) {
1.34 noro 1097: if ( ndl_equal(dg,DL(r)) ) {
1.1 noro 1098: if ( k > 0 ) nd_notfirst++;
1099: nd_found++;
1.13 noro 1100: return r->index;
1.1 noro 1101: }
1102: }
1.13 noro 1103: if ( Reverse )
1104: for ( i = nd_psn-1; i >= 0; i-- ) {
1105: r = nd_psh[i];
1.34 noro 1106: if ( ndl_reducible(dg,DL(r)) ) {
1.13 noro 1107: nd_create++;
1.34 noro 1108: nd_append_red(dg,i);
1.13 noro 1109: return i;
1110: }
1111: }
1112: else
1113: for ( i = 0; i < nd_psn; i++ ) {
1114: r = nd_psh[i];
1.34 noro 1115: if ( ndl_reducible(dg,DL(r)) ) {
1.13 noro 1116: nd_create++;
1.34 noro 1117: nd_append_red(dg,i);
1.13 noro 1118: return i;
1119: }
1.1 noro 1120: }
1.6 noro 1121: return -1;
1.1 noro 1122: }
1123:
1.63 noro 1124: ND nd_merge(ND p1,ND p2)
1125: {
1126: int n,c;
1127: int t,can,td1,td2;
1128: ND r;
1129: NM m1,m2,mr0,mr,s;
1130:
1131: if ( !p1 ) return p2;
1132: else if ( !p2 ) return p1;
1133: else {
1134: can = 0;
1135: for ( n = NV(p1), m1 = BDY(p1), m2 = BDY(p2), mr0 = 0; m1 && m2; ) {
1136: c = DL_COMPARE(DL(m1),DL(m2));
1137: switch ( c ) {
1138: case 0:
1139: s = m1; m1 = NEXT(m1);
1140: can++; NEXTNM2(mr0,mr,s);
1141: s = m2; m2 = NEXT(m2); FREENM(s);
1142: break;
1143: case 1:
1144: s = m1; m1 = NEXT(m1); NEXTNM2(mr0,mr,s);
1145: break;
1146: case -1:
1147: s = m2; m2 = NEXT(m2); NEXTNM2(mr0,mr,s);
1148: break;
1149: }
1150: }
1151: if ( !mr0 )
1152: if ( m1 ) mr0 = m1;
1153: else if ( m2 ) mr0 = m2;
1154: else return 0;
1155: else if ( m1 ) NEXT(mr) = m1;
1156: else if ( m2 ) NEXT(mr) = m2;
1157: else NEXT(mr) = 0;
1158: BDY(p1) = mr0;
1159: SG(p1) = MAX(SG(p1),SG(p2));
1160: LEN(p1) = LEN(p1)+LEN(p2)-can;
1161: FREEND(p2);
1162: return p1;
1163: }
1164: }
1165:
1.31 noro 1166: ND nd_add(int mod,ND p1,ND p2)
1.1 noro 1167: {
1168: int n,c;
1.34 noro 1169: int t,can,td1,td2;
1.1 noro 1170: ND r;
1171: NM m1,m2,mr0,mr,s;
1172:
1.34 noro 1173: if ( !p1 ) return p2;
1174: else if ( !p2 ) return p1;
1.71 noro 1175: else if ( mod == -1 ) return nd_add_sf(p1,p2);
1.34 noro 1176: else if ( !mod ) return nd_add_q(p1,p2);
1.1 noro 1177: else {
1.30 noro 1178: can = 0;
1.1 noro 1179: for ( n = NV(p1), m1 = BDY(p1), m2 = BDY(p2), mr0 = 0; m1 && m2; ) {
1.34 noro 1180: c = DL_COMPARE(DL(m1),DL(m2));
1.1 noro 1181: switch ( c ) {
1182: case 0:
1.19 noro 1183: t = ((CM(m1))+(CM(m2))) - mod;
1.34 noro 1184: if ( t < 0 ) t += mod;
1.1 noro 1185: s = m1; m1 = NEXT(m1);
1186: if ( t ) {
1.34 noro 1187: can++; NEXTNM2(mr0,mr,s); CM(mr) = (t);
1.1 noro 1188: } else {
1.34 noro 1189: can += 2; FREENM(s);
1.1 noro 1190: }
1191: s = m2; m2 = NEXT(m2); FREENM(s);
1192: break;
1193: case 1:
1194: s = m1; m1 = NEXT(m1); NEXTNM2(mr0,mr,s);
1195: break;
1196: case -1:
1197: s = m2; m2 = NEXT(m2); NEXTNM2(mr0,mr,s);
1198: break;
1199: }
1200: }
1201: if ( !mr0 )
1.34 noro 1202: if ( m1 ) mr0 = m1;
1203: else if ( m2 ) mr0 = m2;
1204: else return 0;
1205: else if ( m1 ) NEXT(mr) = m1;
1206: else if ( m2 ) NEXT(mr) = m2;
1207: else NEXT(mr) = 0;
1.1 noro 1208: BDY(p1) = mr0;
1.14 noro 1209: SG(p1) = MAX(SG(p1),SG(p2));
1.31 noro 1210: LEN(p1) = LEN(p1)+LEN(p2)-can;
1.1 noro 1211: FREEND(p2);
1212: return p1;
1213: }
1214: }
1215:
1.31 noro 1216: ND nd_add_q(ND p1,ND p2)
1.17 noro 1217: {
1.30 noro 1218: int n,c,can;
1.17 noro 1219: ND r;
1220: NM m1,m2,mr0,mr,s;
1221: Q t;
1222:
1.34 noro 1223: if ( !p1 ) return p2;
1224: else if ( !p2 ) return p1;
1.31 noro 1225: else {
1.30 noro 1226: can = 0;
1.17 noro 1227: for ( n = NV(p1), m1 = BDY(p1), m2 = BDY(p2), mr0 = 0; m1 && m2; ) {
1.34 noro 1228: c = DL_COMPARE(DL(m1),DL(m2));
1.17 noro 1229: switch ( c ) {
1230: case 0:
1231: addq(CQ(m1),CQ(m2),&t);
1232: s = m1; m1 = NEXT(m1);
1233: if ( t ) {
1.34 noro 1234: can++; NEXTNM2(mr0,mr,s); CQ(mr) = (t);
1.17 noro 1235: } else {
1.34 noro 1236: can += 2; FREENM(s);
1.17 noro 1237: }
1238: s = m2; m2 = NEXT(m2); FREENM(s);
1239: break;
1240: case 1:
1241: s = m1; m1 = NEXT(m1); NEXTNM2(mr0,mr,s);
1242: break;
1243: case -1:
1244: s = m2; m2 = NEXT(m2); NEXTNM2(mr0,mr,s);
1245: break;
1246: }
1247: }
1248: if ( !mr0 )
1.34 noro 1249: if ( m1 ) mr0 = m1;
1250: else if ( m2 ) mr0 = m2;
1251: else return 0;
1252: else if ( m1 ) NEXT(mr) = m1;
1253: else if ( m2 ) NEXT(mr) = m2;
1254: else NEXT(mr) = 0;
1.17 noro 1255: BDY(p1) = mr0;
1256: SG(p1) = MAX(SG(p1),SG(p2));
1.31 noro 1257: LEN(p1) = LEN(p1)+LEN(p2)-can;
1.17 noro 1258: FREEND(p2);
1259: return p1;
1260: }
1261: }
1262:
1.71 noro 1263: ND nd_add_sf(ND p1,ND p2)
1264: {
1265: int n,c,can;
1266: ND r;
1267: NM m1,m2,mr0,mr,s;
1268: int t;
1269:
1270: if ( !p1 ) return p2;
1271: else if ( !p2 ) return p1;
1272: else {
1273: can = 0;
1274: for ( n = NV(p1), m1 = BDY(p1), m2 = BDY(p2), mr0 = 0; m1 && m2; ) {
1275: c = DL_COMPARE(DL(m1),DL(m2));
1276: switch ( c ) {
1277: case 0:
1278: t = _addsf(CM(m1),CM(m2));
1279: s = m1; m1 = NEXT(m1);
1280: if ( t ) {
1281: can++; NEXTNM2(mr0,mr,s); CM(mr) = (t);
1282: } else {
1283: can += 2; FREENM(s);
1284: }
1285: s = m2; m2 = NEXT(m2); FREENM(s);
1286: break;
1287: case 1:
1288: s = m1; m1 = NEXT(m1); NEXTNM2(mr0,mr,s);
1289: break;
1290: case -1:
1291: s = m2; m2 = NEXT(m2); NEXTNM2(mr0,mr,s);
1292: break;
1293: }
1294: }
1295: if ( !mr0 )
1296: if ( m1 ) mr0 = m1;
1297: else if ( m2 ) mr0 = m2;
1298: else return 0;
1299: else if ( m1 ) NEXT(mr) = m1;
1300: else if ( m2 ) NEXT(mr) = m2;
1301: else NEXT(mr) = 0;
1302: BDY(p1) = mr0;
1303: SG(p1) = MAX(SG(p1),SG(p2));
1304: LEN(p1) = LEN(p1)+LEN(p2)-can;
1305: FREEND(p2);
1306: return p1;
1307: }
1308: }
1309:
1.1 noro 1310: /* ret=1 : success, ret=0 : overflow */
/*
 * nd_nf(mod,g,ps,full,dn,rp) : reduce g and store the result in *rp.
 *
 * While g is non-zero, ndl_find_reducer() is asked for a reducer of the
 * head term of g.  If one is found, a multiple of it is added to g so that
 * the head term changes.  If none is found and full is 0, g itself is
 * returned; if full is non-zero the head term is moved to the tail of the
 * result d and the loop continues with the rest of g.
 *
 * mod selects the coefficient arithmetic: -1 uses the _mulsf/_invsf/
 * _chsgnsf helpers, any other non-zero value uses invm()/DMAR modulo mod,
 * and 0 uses Q coefficients.
 * dn, when non-null, is initialised to 1 (dn->m if mod is non-zero, dn->z
 * otherwise); in the mod == 0 case it is then multiplied by every cred
 * applied to d and g and divided by the factor removed by nd_removecont2().
 *
 * When ndl_check_bound2() reports an overflow, g and d are freed, *rp is
 * left untouched and 0 is returned.
 */
1.69 noro 1311: int nd_nf(int mod,ND g,NDV *ps,int full,NDC dn,ND *rp)
1.1 noro 1312: {
1.11 noro 1313: ND d;
1.1 noro 1314: NM m,mrd,tail;
1.7 noro 1315: NM mul;
1.10 noro 1316: int n,sugar,psugar,sugar0,stat,index;
1.30 noro 1317: int c,c1,c2,dummy;
1.17 noro 1318: RHist h;
1.11 noro 1319: NDV p,red;
1.69 noro 1320: Q cg,cred,gcd,tq,qq;
1.21 noro 1321: double hmag;
1.1 noro 1322:
1.69 noro 1323: if ( dn ) {
1324: if ( mod )
1325: dn->m = 1;
1326: else
1327: dn->z = ONE;
1328: }
1.1 noro 1329: if ( !g ) {
1330: *rp = 0;
1331: return 1;
1332: }
/* mod == 0 only: threshold on the head coefficient magnitude that triggers nd_removecont2() below */
1.34 noro 1333: if ( !mod ) hmag = ((double)p_mag((P)HCQ(g)))*nd_scale;
1.21 noro 1334:
1.14 noro 1335: sugar0 = sugar = SG(g);
1.1 noro 1336: n = NV(g);
/* scratch monomial: struct oNM already holds one exponent word, hence nd_wpd-1 extra */
1.61 noro 1337: mul = (NM)ALLOCA(sizeof(struct oNM)+(nd_wpd-1)*sizeof(UINT));
1.1 noro 1338: for ( d = 0; g; ) {
1.63 noro 1339: index = ndl_find_reducer(HDL(g));
1.6 noro 1340: if ( index >= 0 ) {
1.17 noro 1341: h = nd_psh[index];
/* exponent vector of the multiplier: head of g minus head of the reducer */
1342: ndl_sub(HDL(g),DL(h),DL(mul));
1.14 noro 1343: if ( ndl_check_bound2(index,DL(mul)) ) {
1.6 noro 1344: nd_free(g); nd_free(d);
1345: return 0;
1346: }
1.77 noro 1347: if ( nd_demand )
1348: p = ndv_load(index);
1349: else
1350: p = ps[index];
/* coefficient of the multiplier, per coefficient domain */
1.71 noro 1351: if ( mod == -1 )
1352: CM(mul) = _mulsf(_invsf(HCM(p)),_chsgnsf(HCM(g)));
1353: else if ( mod ) {
/* presumably c = c1*c2 mod mod, i.e. -HC(g)/HC(p) -- confirm against the DMAR definition */
1.19 noro 1354: c1 = invm(HCM(p),mod); c2 = mod-HCM(g);
1355: DMAR(c1,c2,0,mod,c); CM(mul) = c;
1.16 noro 1356: } else {
/* mod == 0: d and g are both scaled by cred, the multiplier gets -cg */
1.17 noro 1357: igcd_cofactor(HCQ(g),HCQ(p),&gcd,&cg,&cred);
1.16 noro 1358: chsgnq(cg,&CQ(mul));
1.20 noro 1359: nd_mul_c_q(d,cred); nd_mul_c_q(g,cred);
1.69 noro 1360: if ( dn ) {
1361: mulq(dn->z,cred,&tq); dn->z = tq;
1362: }
1.16 noro 1363: }
1.55 noro 1364: g = nd_add(mod,g,ndv_mul_nm(mod,mul,p));
1.34 noro 1365: sugar = MAX(sugar,SG(p)+TD(DL(mul)));
1.22 noro 1366: if ( !mod && hmag && g && ((double)(p_mag((P)HCQ(g))) > hmag) ) {
/* remember the old head coefficient so dn can be divided by the removed factor */
1.69 noro 1367: tq = HCQ(g);
1.21 noro 1368: nd_removecont2(d,g);
1.69 noro 1369: if ( dn ) {
1370: divq(tq,HCQ(g),&qq); divq(dn->z,qq,&tq); dn->z = tq;
1371: }
1.21 noro 1372: hmag = ((double)p_mag((P)HCQ(g)))*nd_scale;
1373: }
1.1 noro 1374: } else if ( !full ) {
/* head term has no reducer and only head reduction was requested */
1375: *rp = g;
1376: return 1;
1377: } else {
/* detach the head term of g and append it to the result d */
1378: m = BDY(g);
1379: if ( NEXT(m) ) {
1.34 noro 1380: BDY(g) = NEXT(m); NEXT(m) = 0; LEN(g)--;
1.1 noro 1381: } else {
1382: FREEND(g); g = 0;
1383: }
1384: if ( d ) {
1.34 noro 1385: NEXT(tail)=m; tail=m; LEN(d)++;
1.1 noro 1386: } else {
1.34 noro 1387: MKND(n,m,1,d); tail = BDY(d);
1.1 noro 1388: }
1389: }
1390: }
1.34 noro 1391: if ( d ) SG(d) = sugar;
1.1 noro 1392: *rp = d;
1393: return 1;
1394: }
1.28 noro 1395:
/*
 * nd_nf_pbucket(mod,g,ps,full,rp) : reduce g like nd_nf(), but keep the
 * polynomial being reduced in a PGeoBucket.
 *
 * g is put into a fresh bucket.  On every pass the current head is located
 * with head_pbucket() (mod != 0) or head_pbucket_q() (mod == 0); a negative
 * index means the bucket is empty, and the accumulated result d is stored
 * in *rp.  If the head has a reducer, the head is removed from its slot
 * and the reducer multiple, minus its own head, is added to the bucket.
 * Otherwise, with full == 0 the bucket is collapsed by normalize_pbucket()
 * and returned; with full != 0 the head term is appended to d.
 *
 * return 1 : done, result in *rp
 * return 0 : ndl_check_bound2() reported an overflow; d and the bucket are
 *            freed and *rp is set to 0
 */
1.53 noro 1396: int nd_nf_pbucket(int mod,ND g,NDV *ps,int full,ND *rp)
1.25 noro 1397: {
1398: int hindex,index;
1399: NDV p;
1400: ND u,d,red;
1401: NODE l;
1.31 noro 1402: NM mul,m,mrd,tail;
1.25 noro 1403: int sugar,psugar,n,h_reducible;
1404: PGeoBucket bucket;
1405: int c,c1,c2;
1.26 noro 1406: Q cg,cred,gcd,zzz;
1.25 noro 1407: RHist h;
1.28 noro 1408: double hmag,gmag;
/* count: reductions performed; hcount: those performed while d was still empty (printed when DP_Print > 3) */
1.77 noro 1409: int count = 0;
1410: int hcount = 0;
1.25 noro 1411:
1412: if ( !g ) {
1413: *rp = 0;
1414: return 1;
1415: }
1416: sugar = SG(g);
1417: n = NV(g);
1.34 noro 1418: if ( !mod ) hmag = ((double)p_mag((P)HCQ(g)))*nd_scale;
1.25 noro 1419: bucket = create_pbucket();
1.31 noro 1420: add_pbucket(mod,bucket,g);
1.25 noro 1421: d = 0;
/* scratch monomial: struct oNM already holds one exponent word, hence nd_wpd-1 extra */
1.61 noro 1422: mul = (NM)ALLOCA(sizeof(struct oNM)+(nd_wpd-1)*sizeof(UINT));
1.25 noro 1423: while ( 1 ) {
1.26 noro 1424: hindex = mod?head_pbucket(mod,bucket):head_pbucket_q(bucket);
1.25 noro 1425: if ( hindex < 0 ) {
/* bucket exhausted: d is the result */
1.77 noro 1426: if ( DP_Print > 3 ) printf("(%d %d)",count,hcount);
1.34 noro 1427: if ( d ) SG(d) = sugar;
1.25 noro 1428: *rp = d;
1429: return 1;
1430: }
1431: g = bucket->body[hindex];
1.63 noro 1432: index = ndl_find_reducer(HDL(g));
1.25 noro 1433: if ( index >= 0 ) {
1.77 noro 1434: count++;
1435: if ( !d ) hcount++;
1.25 noro 1436: h = nd_psh[index];
1437: ndl_sub(HDL(g),DL(h),DL(mul));
1438: if ( ndl_check_bound2(index,DL(mul)) ) {
1.26 noro 1439: nd_free(d);
1.25 noro 1440: free_pbucket(bucket);
1441: *rp = 0;
1442: return 0;
1443: }
1.53 noro 1444: p = ps[index];
1.71 noro 1445: if ( mod == -1 )
1446: CM(mul) = _mulsf(_invsf(HCM(p)),_chsgnsf(HCM(g)));
1447: else if ( mod ) {
1.25 noro 1448: c1 = invm(HCM(p),mod); c2 = mod-HCM(g);
1449: DMAR(c1,c2,0,mod,c); CM(mul) = c;
1450: } else {
/* mod == 0: scale d and every bucket slot by cred, then re-read the head slot */
1451: igcd_cofactor(HCQ(g),HCQ(p),&gcd,&cg,&cred);
1452: chsgnq(cg,&CQ(mul));
1.26 noro 1453: nd_mul_c_q(d,cred);
1454: mulq_pbucket(bucket,cred);
1455: g = bucket->body[hindex];
1.28 noro 1456: gmag = (double)p_mag((P)HCQ(g));
1.25 noro 1457: }
1.55 noro 1458: red = ndv_mul_nm(mod,mul,p);
/* drop the head of both the slot and the reducer multiple before adding the latter to the bucket */
1.25 noro 1459: bucket->body[hindex] = nd_remove_head(g);
1460: red = nd_remove_head(red);
1.31 noro 1461: add_pbucket(mod,bucket,red);
1.34 noro 1462: psugar = SG(p)+TD(DL(mul));
1463: sugar = MAX(sugar,psugar);
/* gmag is assigned only in the mod == 0 branch above; the !mod test guards its use */
1.28 noro 1464: if ( !mod && hmag && (gmag > hmag) ) {
1465: g = normalize_pbucket(mod,bucket);
1466: if ( !g ) {
1.34 noro 1467: if ( d ) SG(d) = sugar;
1.28 noro 1468: *rp = d;
1469: return 1;
1470: }
1471: nd_removecont2(d,g);
1472: hmag = ((double)p_mag((P)HCQ(g)))*nd_scale;
1.31 noro 1473: add_pbucket(mod,bucket,g);
1.28 noro 1474: }
1.25 noro 1475: } else if ( !full ) {
/* head has no reducer and only head reduction was requested */
1476: g = normalize_pbucket(mod,bucket);
1.34 noro 1477: if ( g ) SG(g) = sugar;
1.25 noro 1478: *rp = g;
1479: return 1;
1480: } else {
/* move the irreducible head term from its slot to the tail of d */
1481: m = BDY(g);
1482: if ( NEXT(m) ) {
1.34 noro 1483: BDY(g) = NEXT(m); NEXT(m) = 0; LEN(g)--;
1.25 noro 1484: } else {
1485: FREEND(g); g = 0;
1486: }
1487: bucket->body[hindex] = g;
1488: NEXT(m) = 0;
1489: if ( d ) {
1.34 noro 1490: NEXT(tail)=m; tail=m; LEN(d)++;
1.25 noro 1491: } else {
1.34 noro 1492: MKND(n,m,1,d); tail = BDY(d);
1.25 noro 1493: }
1494: }
1495: }
1496: }
1.27 noro 1497:
1.61 noro 1498: /* input : list of NDV, cand : list of NDV */
1.28 noro 1499:
1.61 noro 1500: int ndv_check_candidate(NODE input,int obpe,int oadv,EPOS oepos,NODE cand)
1.28 noro 1501: {
1502: int n,i,stat;
1503: ND nf,d;
1.61 noro 1504: NDV r;
1.45 noro 1505: NODE t,s;
1.69 noro 1506: union oNDC dn;
1.45 noro 1507:
1.61 noro 1508: ndv_setup(0,0,cand);
1.31 noro 1509: n = length(cand);
1.28 noro 1510:
1511: /* membercheck : list is a subset of Id(cand) ? */
1512: for ( t = input; t; t = NEXT(t) ) {
1.45 noro 1513: again:
1.61 noro 1514: if ( nd_bpe > obpe )
1515: r = ndv_dup_realloc((NDV)BDY(t),obpe,oadv,oepos);
1516: else
1517: r = (NDV)BDY(t);
1518: d = ndvtond(0,r);
1.69 noro 1519: stat = nd_nf(0,d,nd_ps,0,0,&nf);
1.45 noro 1520: if ( !stat ) {
1521: nd_reconstruct(0,0,0);
1522: goto again;
1523: } else if ( nf ) return 0;
1.71 noro 1524: if ( DP_Print ) { printf("."); fflush(stdout); }
1.28 noro 1525: }
1.71 noro 1526: if ( DP_Print ) { printf("\n"); }
1.28 noro 1527: /* gbcheck : cand is a GB of Id(cand) ? */
1.77 noro 1528: if ( !nd_gb(0,0,1) ) return 0;
1.28 noro 1529: /* XXX */
1.23 noro 1530: return 1;
1531: }
1.1 noro 1532:
1533: ND nd_remove_head(ND p)
1534: {
1535: NM m;
1536:
1537: m = BDY(p);
1538: if ( !NEXT(m) ) {
1.34 noro 1539: FREEND(p); p = 0;
1.31 noro 1540: } else {
1.34 noro 1541: BDY(p) = NEXT(m); LEN(p)--;
1.31 noro 1542: }
1.1 noro 1543: FREENM(m);
1544: return p;
1545: }
1546:
1.69 noro 1547: ND nd_separate_head(ND p,ND *head)
1548: {
1549: NM m,m0;
1550: ND r;
1551:
1552: m = BDY(p);
1553: if ( !NEXT(m) ) {
1554: *head = p; p = 0;
1555: } else {
1556: m0 = m;
1557: BDY(p) = NEXT(m); LEN(p)--;
1558: NEXT(m0) = 0;
1559: MKND(NV(p),m0,1,r);
1560: *head = r;
1561: }
1562: return p;
1563: }
1564:
1.1 noro 1565: PGeoBucket create_pbucket()
1566: {
1567: PGeoBucket g;
1568:
1569: g = CALLOC(1,sizeof(struct oPGeoBucket));
1570: g->m = -1;
1571: return g;
1572: }
1573:
1.25 noro 1574: void free_pbucket(PGeoBucket b) {
1575: int i;
1576:
1.26 noro 1577: for ( i = 0; i <= b->m; i++ )
1.25 noro 1578: if ( b->body[i] ) {
1579: nd_free(b->body[i]);
1580: b->body[i] = 0;
1581: }
1582: GC_free(b);
1583: }
1584:
1.63 noro 1585: void add_pbucket_symbolic(PGeoBucket g,ND d)
1586: {
1587: int l,i,k,m;
1588:
1589: if ( !d )
1590: return;
1591: l = LEN(d);
1592: for ( k = 0, m = 1; l > m; k++, m <<= 1 );
1593: /* 2^(k-1) < l <= 2^k (=m) */
1594: d = nd_merge(g->body[k],d);
1595: for ( ; d && LEN(d) > m; k++, m <<= 1 ) {
1596: g->body[k] = 0;
1597: d = nd_merge(g->body[k+1],d);
1598: }
1599: g->body[k] = d;
1600: g->m = MAX(g->m,k);
1601: }
1602:
1.31 noro 1603: void add_pbucket(int mod,PGeoBucket g,ND d)
1.1 noro 1604: {
1.31 noro 1605: int l,i,k,m;
1.1 noro 1606:
1.31 noro 1607: if ( !d )
1608: return;
1609: l = LEN(d);
1.29 noro 1610: for ( k = 0, m = 1; l > m; k++, m <<= 1 );
1611: /* 2^(k-1) < l <= 2^k (=m) */
1.31 noro 1612: d = nd_add(mod,g->body[k],d);
1613: for ( ; d && LEN(d) > m; k++, m <<= 1 ) {
1.1 noro 1614: g->body[k] = 0;
1.31 noro 1615: d = nd_add(mod,g->body[k+1],d);
1.1 noro 1616: }
1617: g->body[k] = d;
1618: g->m = MAX(g->m,k);
1619: }
1620:
1.26 noro 1621: void mulq_pbucket(PGeoBucket g,Q c)
1622: {
1623: int k;
1624:
1625: for ( k = 0; k <= g->m; k++ )
1626: nd_mul_c_q(g->body[k],c);
1627: }
1628:
1.63 noro 1629: NM remove_head_pbucket_symbolic(PGeoBucket g)
1630: {
1631: int j,i,k,c;
1632: NM head;
1633:
1634: k = g->m;
1635: j = -1;
1636: for ( i = 0; i <= k; i++ ) {
1637: if ( !g->body[i] ) continue;
1638: if ( j < 0 ) j = i;
1639: else {
1640: c = DL_COMPARE(HDL(g->body[i]),HDL(g->body[j]));
1641: if ( c > 0 )
1642: j = i;
1643: else if ( c == 0 )
1644: g->body[i] = nd_remove_head(g->body[i]);
1645: }
1646: }
1647: if ( j < 0 ) return 0;
1648: else {
1649: head = BDY(g->body[j]);
1650: if ( !NEXT(head) ) {
1651: FREEND(g->body[j]);
1652: g->body[j] = 0;
1653: } else {
1654: BDY(g->body[j]) = NEXT(head);
1655: LEN(g->body[j])--;
1656: }
1657: return head;
1658: }
1659: }
1660:
/*
 * head_pbucket(mod,g) : locate the head term of the bucket g when the
 * coefficients are machine integers (CM/HCM).
 *
 * Slots 0..g->m are scanned; j tracks the slot whose head exponent vector
 * is the greatest seen so far under DL_COMPARE and sum the coefficient
 * accumulated for that exponent vector.  A slot with an equal head has its
 * coefficient added to sum (_addsf when mod == -1, addition modulo mod
 * otherwise) and loses its head.
 * After the scan, a non-zero sum is stored as the head coefficient of slot
 * j and j is returned; a zero sum removes that head and the scan restarts.
 *
 * return : slot index holding the head term, or -1 if all slots are empty
 */
1.19 noro 1661: int head_pbucket(int mod,PGeoBucket g)
1.1 noro 1662: {
1663: int j,i,c,k,nv,sum;
1.61 noro 1664: UINT *di,*dj;
1.1 noro 1665: ND gi,gj;
1666:
1667: k = g->m;
1668: while ( 1 ) {
1669: j = -1;
1670: for ( i = 0; i <= k; i++ ) {
1671: if ( !(gi = g->body[i]) )
1672: continue;
1673: if ( j < 0 ) {
/* first non-empty slot becomes the initial candidate */
1674: j = i;
1675: gj = g->body[j];
1676: dj = HDL(gj);
1.14 noro 1677: sum = HCM(gj);
1.1 noro 1678: } else {
1.34 noro 1679: c = DL_COMPARE(HDL(gi),dj);
1.1 noro 1680: if ( c > 0 ) {
/* slot i has a greater head: settle the old candidate (store its sum, or drop its head if the sum is 0) and switch to i */
1.34 noro 1681: if ( sum ) HCM(gj) = sum;
1682: else g->body[j] = nd_remove_head(gj);
1.1 noro 1683: j = i;
1684: gj = g->body[j];
1685: dj = HDL(gj);
1.14 noro 1686: sum = HCM(gj);
1.1 noro 1687: } else if ( c == 0 ) {
/* same exponent vector: fold the coefficient into sum and drop the head of slot i */
1.71 noro 1688: if ( mod == -1 )
1689: sum = _addsf(sum,HCM(gi));
1690: else {
1691: sum = sum+HCM(gi)-mod;
1692: if ( sum < 0 ) sum += mod;
1693: }
1.1 noro 1694: g->body[i] = nd_remove_head(gi);
1695: }
1696: }
1697: }
1.34 noro 1698: if ( j < 0 ) return -1;
1.1 noro 1699: else if ( sum ) {
1.14 noro 1700: HCM(gj) = sum;
1.26 noro 1701: return j;
1.31 noro 1702: } else
/* the head cancelled completely: remove it and rescan */
1.26 noro 1703: g->body[j] = nd_remove_head(gj);
1704: }
1705: }
1706:
/*
 * head_pbucket_q(g) : locate the head term of the bucket g when the
 * coefficients are Q values (CQ/HCQ).
 *
 * Slots 0..g->m are scanned; j tracks the slot whose head exponent vector
 * is the greatest seen so far under DL_COMPARE and sum the coefficient
 * accumulated for it.  A slot with an equal head has its coefficient
 * added to sum with addq() and loses its head.
 * After the scan, a non-zero sum is stored as the head coefficient of slot
 * j and j is returned; a zero sum removes that head and the scan restarts.
 *
 * return : slot index holding the head term, or -1 if all slots are empty
 */
1707: int head_pbucket_q(PGeoBucket g)
1708: {
1709: int j,i,c,k,nv;
1710: Q sum,t;
1711: ND gi,gj;
1712:
1713: k = g->m;
1714: while ( 1 ) {
1715: j = -1;
1716: for ( i = 0; i <= k; i++ ) {
1.34 noro 1717: if ( !(gi = g->body[i]) ) continue;
1.26 noro 1718: if ( j < 0 ) {
/* first non-empty slot becomes the initial candidate */
1719: j = i;
1720: gj = g->body[j];
1721: sum = HCQ(gj);
1722: } else {
1723: nv = NV(gi);
1.34 noro 1724: c = DL_COMPARE(HDL(gi),HDL(gj));
1.26 noro 1725: if ( c > 0 ) {
/* slot i has a greater head: settle the old candidate (store its sum, or drop its head if the sum is 0) and switch to i */
1.34 noro 1726: if ( sum ) HCQ(gj) = sum;
1727: else g->body[j] = nd_remove_head(gj);
1.26 noro 1728: j = i;
1729: gj = g->body[j];
1730: sum = HCQ(gj);
1731: } else if ( c == 0 ) {
/* same exponent vector: fold the coefficient into sum and drop the head of slot i */
1732: addq(sum,HCQ(gi),&t);
1733: sum = t;
1734: g->body[i] = nd_remove_head(gi);
1735: }
1736: }
1737: }
1.34 noro 1738: if ( j < 0 ) return -1;
1.26 noro 1739: else if ( sum ) {
1740: HCQ(gj) = sum;
1.1 noro 1741: return j;
1.31 noro 1742: } else
/* the head cancelled completely: remove it and rescan */
1.1 noro 1743: g->body[j] = nd_remove_head(gj);
1744: }
1745: }
1746:
1.25 noro 1747: ND normalize_pbucket(int mod,PGeoBucket g)
1.1 noro 1748: {
1.31 noro 1749: int i;
1.1 noro 1750: ND r,t;
1751:
1752: r = 0;
1.28 noro 1753: for ( i = 0; i <= g->m; i++ ) {
1.31 noro 1754: r = nd_add(mod,r,g->body[i]);
1.28 noro 1755: g->body[i] = 0;
1756: }
1757: g->m = -1;
1.1 noro 1758: return r;
1759: }
1760:
1.27 noro 1761: /* return value = 0 => input is not a GB */
1762:
/*
 * nd_gb(m,ishomo,checkonly) : main pair-processing loop over the global
 * basis nd_ps[0..nd_psn-1].
 *
 * The pair list d and the index list g are first built by calling
 * update_pairs()/update_base() for every existing index.  Then, until d is
 * empty, the pair chosen by nd_minp() is turned into a polynomial by
 * nd_sp() and reduced (nd_nf_pbucket() when USE_GEOBUCKET and m != 0,
 * nd_nf() otherwise).  A non-zero remainder is registered with
 * ndv_newps() and pairs/base are updated for the new index.
 * Whenever nd_sp() or the reduction reports failure (status 0), the pair
 * is pushed back, nd_reconstruct() is called and the step is retried.
 *
 * ishomo   : when the sugar of the selected pair changes, the most recent
 *            basis elements whose sugar equals the previous value are
 *            re-reduced (tail reduction) before continuing.
 * checkonly: return 0 as soon as a non-zero remainder is found.
 *
 * return : the list g with each index replaced by the corresponding NDV
 *          (loaded with ndv_load() when nd_demand is set), or 0 as above.
 */
1.77 noro 1763: NODE nd_gb(int m,int ishomo,int checkonly)
1.1 noro 1764: {
1765: int i,nh,sugar,stat;
1.23 noro 1766: NODE r,g,t;
1.1 noro 1767: ND_pairs d;
1768: ND_pairs l;
1.77 noro 1769: ND h,nf,s,head;
1.63 noro 1770: NDV nfv;
1.85 noro 1771: Q q,num,den;
1.69 noro 1772: union oNDC dn;
1.1 noro 1773:
1.23 noro 1774: g = 0; d = 0;
1775: for ( i = 0; i < nd_psn; i++ ) {
1.1 noro 1776: d = update_pairs(d,g,i);
1777: g = update_base(g,i);
1778: }
1779: sugar = 0;
1780: while ( d ) {
1781: again:
1782: l = nd_minp(d,&d);
1.14 noro 1783: if ( SG(l) != sugar ) {
1.77 noro 1784: if ( ishomo ) {
/* re-reduce the tails of the trailing basis elements whose sugar equals the previous sugar value */
1.85 noro 1785: for ( i = nd_psn-1; i >= 0 && SG(nd_psh[i]) == sugar; i-- ) {
1.82 noro 1786: if ( nd_demand )
1787: nfv = ndv_load(i);
1788: else
1789: nfv = nd_ps[i];
1790: s = ndvtond(m,nfv);
1.77 noro 1791: s = nd_separate_head(s,&head);
/* NOTE(review): the status returned by nd_nf() (0 = overflow) is not checked here */
1792: nd_nf(m,s,nd_ps,1,&dn,&nf);
1.85 noro 1793: if ( !m ) {
/* mod == 0: scale head by the numerator of dn and nf by its denominator before recombining them */
1794: NTOQ(NM(dn.z),SGN(dn.z),num);
1795: mulq(HCQ(head),num,&q); HCQ(head) = q;
1796: if ( DN(dn.z) ) {
1797: NTOQ(DN(dn.z),1,den);
1798: nd_mul_c_q(nf,den);
1799: }
1800: }
1.77 noro 1801: nf = nd_add(m,head,nf);
1.82 noro 1802: ndv_free(nfv);
1.77 noro 1803: nd_removecont(m,nf);
1.82 noro 1804: nfv = ndtondv(m,nf);
1805: nd_free(nf);
1806: nd_bound[i] = ndv_compute_bound(nfv);
1807: if ( nd_demand ) {
1808: ndv_save(nfv,i);
1809: ndv_free(nfv);
1810: } else
1811: nd_ps[i] = nfv;
1.77 noro 1812: }
1813: }
1.14 noro 1814: sugar = SG(l);
1.71 noro 1815: if ( DP_Print ) fprintf(asir_out,"%d",sugar);
1.1 noro 1816: }
1.53 noro 1817: stat = nd_sp(m,0,l,&h);
1.1 noro 1818: if ( !stat ) {
/* failure: put the pair back, rebuild the representation and retry */
1819: NEXT(l) = d; d = l;
1.20 noro 1820: d = nd_reconstruct(m,0,d);
1.1 noro 1821: goto again;
1822: }
1.41 noro 1823: #if USE_GEOBUCKET
1.69 noro 1824: stat = m?nd_nf_pbucket(m,h,nd_ps,!Top,&nf):nd_nf(m,h,nd_ps,!Top,0,&nf);
1.41 noro 1825: #else
1.69 noro 1826: stat = nd_nf(m,h,nd_ps,!Top,0,&nf);
1.41 noro 1827: #endif
1.1 noro 1828: if ( !stat ) {
/* failure: put the pair back, rebuild the representation and retry */
1829: NEXT(l) = d; d = l;
1.20 noro 1830: d = nd_reconstruct(m,0,d);
1.1 noro 1831: goto again;
1832: } else if ( nf ) {
1.27 noro 1833: if ( checkonly ) return 0;
1.71 noro 1834: if ( DP_Print ) { printf("+"); fflush(stdout); }
1.63 noro 1835: nd_removecont(m,nf);
1836: nfv = ndtondv(m,nf); nd_free(nf);
1.77 noro 1837: nh = ndv_newps(m,nfv,0);
1.1 noro 1838: d = update_pairs(d,g,nh);
1839: g = update_base(g,nh);
1840: FREENDP(l);
1841: } else {
1.71 noro 1842: if ( DP_Print ) { printf("."); fflush(stdout); }
1.1 noro 1843: FREENDP(l);
1844: }
1845: }
/* replace the indices stored in g by the polynomials themselves */
1.77 noro 1846: if ( nd_demand )
1847: for ( t = g; t; t = NEXT(t) )
1848: BDY(t) = (pointer)ndv_load((int)BDY(t));
1849: else
1850: for ( t = g; t; t = NEXT(t) )
1851: BDY(t) = (pointer)nd_ps[(int)BDY(t)];
1.1 noro 1852: return g;
1853: }
1854:
/*
 * nd_gb_trace(m,ishomo) : pair-processing loop that maintains two bases in
 * parallel: nd_ps[] with coefficients modulo m and nd_ps_trace[] with Q
 * coefficients.
 *
 * Each selected pair is first processed modulo m (nd_sp + nd_nf_pbucket or
 * nd_nf).  Only when that remainder is non-zero is the corresponding
 * remainder nfq computed (nd_sp(0,1,..) + nd_nf over nd_ps_trace), unless
 * nd_demand is set and ndv_load(nd_psn) already supplies one.  Both
 * remainders are then registered together with ndv_newps().
 * A failure status from nd_sp()/nd_nf*() pushes the pair back, calls
 * nd_reconstruct(m,1,d) and retries.
 *
 * ishomo : when the sugar of the selected pair changes, the trailing basis
 *          elements whose sugar equals the previous value are re-reduced
 *          in both nd_ps and nd_ps_trace.
 *
 * return : the list g with each index replaced by the element of
 *          nd_ps_trace (or ndv_load() when nd_demand is set); 0 when m
 *          divides the head coefficient of some nfq.
 */
1.82 noro 1855: NODE nd_gb_trace(int m,int ishomo)
1.20 noro 1856: {
1857: int i,nh,sugar,stat;
1.23 noro 1858: NODE r,g,t;
1.20 noro 1859: ND_pairs d;
1860: ND_pairs l;
1.82 noro 1861: ND h,nf,nfq,s,head;
1.63 noro 1862: NDV nfv,nfqv;
1.85 noro 1863: Q q,den,num;
1.69 noro 1864: union oNDC dn;
1.20 noro 1865:
1.23 noro 1866: g = 0; d = 0;
1867: for ( i = 0; i < nd_psn; i++ ) {
1.20 noro 1868: d = update_pairs(d,g,i);
1869: g = update_base(g,i);
1870: }
1871: sugar = 0;
1872: while ( d ) {
1873: again:
1874: l = nd_minp(d,&d);
1875: if ( SG(l) != sugar ) {
1.82 noro 1876: if ( ishomo ) {
1.85 noro 1877: for ( i = nd_psn-1; i >= 0 && SG(nd_psh[i]) == sugar; i-- ) {
1.82 noro 1878: /* for nd_ps */
1879: s = ndvtond(m,nd_ps[i]);
1880: s = nd_separate_head(s,&head);
/* NOTE(review): the status returned by nd_nf_pbucket() (0 = overflow) is not checked here */
1881: nd_nf_pbucket(m,s,nd_ps,1,&nf);
1882: nf = nd_add(m,head,nf);
1883: ndv_free(nd_ps[i]);
1884: nd_ps[i] = ndtondv(m,nf);
1885: nd_free(nf);
1886:
1887: /* for nd_ps_trace */
1888: if ( nd_demand )
1889: nfv = ndv_load(i);
1890: else
1891: nfv = nd_ps_trace[i];
1892: s = ndvtond(0,nfv);
1893: s = nd_separate_head(s,&head);
/* NOTE(review): the status returned by nd_nf() (0 = overflow) is not checked here */
1894: nd_nf(0,s,nd_ps_trace,1,&dn,&nf);
/* scale head by the numerator of dn and nf by its denominator before recombining them */
1.85 noro 1895: NTOQ(NM(dn.z),SGN(dn.z),num);
1896: mulq(HCQ(head),num,&q); HCQ(head) = q;
1897: if ( DN(dn.z) ) {
1898: NTOQ(DN(dn.z),1,den);
1899: nd_mul_c_q(nf,den);
1900: }
1.82 noro 1901: nf = nd_add(0,head,nf);
1902: ndv_free(nfv);
1903: nd_removecont(0,nf);
1904: nfv = ndtondv(0,nf);
1905: nd_free(nf);
1906: nd_bound[i] = ndv_compute_bound(nfv);
1907: if ( nd_demand ) {
1908: ndv_save(nfv,i);
1909: ndv_free(nfv);
1910: } else
1911: nd_ps_trace[i] = nfv;
1912: }
1913: }
1.20 noro 1914: sugar = SG(l);
1.71 noro 1915: if ( DP_Print ) fprintf(asir_out,"%d",sugar);
1.20 noro 1916: }
1.53 noro 1917: stat = nd_sp(m,0,l,&h);
1.20 noro 1918: if ( !stat ) {
/* failure: put the pair back, rebuild the representation and retry */
1919: NEXT(l) = d; d = l;
1920: d = nd_reconstruct(m,1,d);
1921: goto again;
1922: }
1.41 noro 1923: #if USE_GEOBUCKET
1.53 noro 1924: stat = nd_nf_pbucket(m,h,nd_ps,!Top,&nf);
1.41 noro 1925: #else
1.69 noro 1926: stat = nd_nf(m,h,nd_ps,!Top,0,&nf);
1.41 noro 1927: #endif
1.20 noro 1928: if ( !stat ) {
/* failure: put the pair back, rebuild the representation and retry */
1929: NEXT(l) = d; d = l;
1930: d = nd_reconstruct(m,1,d);
1931: goto again;
1932: } else if ( nf ) {
/* non-zero modulo m: obtain the remainder over Q as well */
1.77 noro 1933: if ( nd_demand ) {
/* NOTE(review): loads slot nd_psn, i.e. the index the new element would get -- confirm what ndv_load() returns when nothing was saved there */
1934: nfqv = ndv_load(nd_psn);
1935: nfq = ndvtond(0,nfqv);
1936: } else
1937: nfq = 0;
1938: if ( !nfq ) {
1939: if ( !nd_sp(0,1,l,&h) || !nd_nf(0,h,nd_ps_trace,!Top,0,&nfq) ) {
1940: NEXT(l) = d; d = l;
1941: d = nd_reconstruct(m,1,d);
1942: goto again;
1943: }
1.70 noro 1944: }
1.20 noro 1945: if ( nfq ) {
1.70 noro 1946: /* m|HC(nfq) => failure */
1.63 noro 1947: if ( !rem(NM(HCQ(nfq)),m) ) return 0;
1948:
1.71 noro 1949: if ( DP_Print ) { printf("+"); fflush(stdout); }
1.63 noro 1950: nd_removecont(m,nf); nfv = ndtondv(m,nf); nd_free(nf);
1951: nd_removecont(0,nfq); nfqv = ndtondv(0,nfq); nd_free(nfq);
1.77 noro 1952: nh = ndv_newps(0,nfv,nfqv);
1.20 noro 1953: d = update_pairs(d,g,nh);
1954: g = update_base(g,nh);
1955: } else {
/* remainder is non-zero modulo m but zero over Q */
1.71 noro 1956: if ( DP_Print ) { printf("*"); fflush(stdout); }
1.20 noro 1957: }
1958: } else {
1.71 noro 1959: if ( DP_Print ) { printf("."); fflush(stdout); }
1.20 noro 1960: }
1961: FREENDP(l);
1962: }
/* replace the indices stored in g by the polynomials themselves */
1.77 noro 1963: if ( nd_demand )
1964: for ( t = g; t; t = NEXT(t) )
1965: BDY(t) = (pointer)ndv_load((int)BDY(t));
1966: else
1967: for ( t = g; t; t = NEXT(t) )
1968: BDY(t) = (pointer)nd_ps_trace[(int)BDY(t)];
1.20 noro 1969: return g;
1970: }
1971:
1.23 noro 1972: int ndv_compare(NDV *p1,NDV *p2)
1973: {
1.34 noro 1974: return DL_COMPARE(HDL(*p1),HDL(*p2));
1.23 noro 1975: }
1976:
1977: int ndv_compare_rev(NDV *p1,NDV *p2)
1978: {
1.34 noro 1979: return -DL_COMPARE(HDL(*p1),HDL(*p2));
1.23 noro 1980: }
1981:
1.61 noro 1982: NODE ndv_reduceall(int m,NODE f)
1.23 noro 1983: {
1.69 noro 1984: int i,n,stat;
1985: ND nf,g,head;
1.23 noro 1986: NODE t,a0,a;
1.69 noro 1987: union oNDC dn;
1988: NDV *w;
1.85 noro 1989: Q q,num,den;
1.23 noro 1990:
1.69 noro 1991: n = length(f);
1992: #if 0
1993: w = (NDV *)ALLOCA(n*sizeof(NDV));
1994: for ( i = 0, t = f; i < n; i++, t = NEXT(t) ) w[i] = (NDV)BDY(t);
1995: qsort(w,n,sizeof(NDV),
1996: (int (*)(const void *,const void *))ndv_compare);
1997: for ( t = f, i = 0; t; i++, t = NEXT(t) ) BDY(t) = (pointer)w[i];
1998: #endif
1999: ndv_setup(m,0,f);
2000: for ( i = 0; i < n; ) {
2001: g = ndvtond(m,nd_ps[i]);
2002: g = nd_separate_head(g,&head);
2003: stat = nd_nf(m,g,nd_ps,1,&dn,&nf);
1.50 noro 2004: if ( !stat )
1.69 noro 2005: nd_reconstruct(m,0,0);
2006: else {
1.71 noro 2007: if ( DP_Print ) { printf("."); fflush(stdout); }
1.85 noro 2008: if ( !m ) {
2009: NTOQ(NM(dn.z),SGN(dn.z),num);
2010: mulq(HCQ(head),num,&q); HCQ(head) = q;
2011: if ( DN(dn.z) ) {
2012: NTOQ(DN(dn.z),1,den);
2013: nd_mul_c_q(nf,den);
2014: }
2015: }
1.69 noro 2016: nf = nd_add(m,head,nf);
2017: ndv_free(nd_ps[i]);
1.24 noro 2018: nd_removecont(m,nf);
1.69 noro 2019: nd_ps[i] = ndtondv(m,nf); nd_free(nf);
2020: nd_bound[i] = ndv_compute_bound(nd_ps[i]);
1.50 noro 2021: i++;
1.23 noro 2022: }
2023: }
1.71 noro 2024: if ( DP_Print ) { printf("\n"); }
1.23 noro 2025: for ( a0 = 0, i = 0; i < n; i++ ) {
2026: NEXTNODE(a0,a);
1.69 noro 2027: BDY(a) = (pointer)nd_ps[i];
1.23 noro 2028: }
2029: NEXT(a) = 0;
2030: return a0;
2031: }
2032:
1.1 noro 2033: ND_pairs update_pairs( ND_pairs d, NODE /* of index */ g, int t)
2034: {
2035: ND_pairs d1,nd,cur,head,prev,remove;
2036:
2037: if ( !g ) return d;
2038: d = crit_B(d,t);
2039: d1 = nd_newpairs(g,t);
2040: d1 = crit_M(d1);
2041: d1 = crit_F(d1);
1.55 noro 2042: if ( do_weyl )
2043: head = d1;
2044: else {
2045: prev = 0; cur = head = d1;
2046: while ( cur ) {
2047: if ( crit_2( cur->i1,cur->i2 ) ) {
2048: remove = cur;
2049: if ( !prev ) head = cur = NEXT(cur);
2050: else cur = NEXT(prev) = NEXT(cur);
2051: FREENDP(remove);
2052: } else {
2053: prev = cur; cur = NEXT(cur);
2054: }
1.1 noro 2055: }
2056: }
2057: if ( !d )
2058: return head;
2059: else {
2060: nd = d;
1.34 noro 2061: while ( NEXT(nd) ) nd = NEXT(nd);
1.1 noro 2062: NEXT(nd) = head;
2063: return d;
2064: }
2065: }
2066:
2067: ND_pairs nd_newpairs( NODE g, int t )
2068: {
2069: NODE h;
1.61 noro 2070: UINT *dl;
1.34 noro 2071: int ts,s;
1.1 noro 2072: ND_pairs r,r0;
2073:
1.20 noro 2074: dl = DL(nd_psh[t]);
1.34 noro 2075: ts = SG(nd_psh[t]) - TD(dl);
1.1 noro 2076: for ( r0 = 0, h = g; h; h = NEXT(h) ) {
2077: NEXTND_pairs(r0,r);
2078: r->i1 = (int)BDY(h);
2079: r->i2 = t;
1.20 noro 2080: ndl_lcm(DL(nd_psh[r->i1]),dl,r->lcm);
1.34 noro 2081: s = SG(nd_psh[r->i1])-TD(DL(nd_psh[r->i1]));
2082: SG(r) = MAX(s,ts) + TD(LCM(r));
1.1 noro 2083: }
2084: NEXT(r) = 0;
2085: return r0;
2086: }
2087:
2088: ND_pairs crit_B( ND_pairs d, int s )
2089: {
2090: ND_pairs cur,head,prev,remove;
1.61 noro 2091: UINT *t,*tl,*lcm;
1.1 noro 2092: int td,tdl;
2093:
2094: if ( !d ) return 0;
1.20 noro 2095: t = DL(nd_psh[s]);
1.1 noro 2096: prev = 0;
2097: head = cur = d;
1.61 noro 2098: lcm = (UINT *)ALLOCA(nd_wpd*sizeof(UINT));
1.1 noro 2099: while ( cur ) {
2100: tl = cur->lcm;
2101: if ( ndl_reducible(tl,t)
1.20 noro 2102: && (ndl_lcm(DL(nd_psh[cur->i1]),t,lcm),!ndl_equal(lcm,tl))
2103: && (ndl_lcm(DL(nd_psh[cur->i2]),t,lcm),!ndl_equal(lcm,tl)) ) {
1.1 noro 2104: remove = cur;
2105: if ( !prev ) {
2106: head = cur = NEXT(cur);
2107: } else {
2108: cur = NEXT(prev) = NEXT(cur);
2109: }
2110: FREENDP(remove);
2111: } else {
1.34 noro 2112: prev = cur; cur = NEXT(cur);
1.1 noro 2113: }
2114: }
2115: return head;
2116: }
2117:
/*
 * Filter the list d1 of new pairs by comparing their lcm's pairwise.
 * The first element e of the remaining list is compared with every
 * later element d2:
 *   - equal lcm's: d2 is kept;
 *   - TD(lcm(d2)) > TD(lcm(e)) and ndl_reducible(lcm(d2),lcm(e)):
 *     d2 is dropped from the list (it is only unlinked here, FREENDP
 *     is not called on it);
 *   - otherwise, if ndl_reducible(lcm(e),lcm(d2)): e itself is discarded
 *     (label delit) and all remaining elements are kept.
 * Kept elements are pushed onto d3, so the order of the list is not
 * preserved.  Surviving e's are accumulated in dd, which is returned.
 * NOTE(review): ndl_reducible(a,b) presumably tests divisibility of a
 * by b - confirm against its definition.
 */
2118: ND_pairs crit_M( ND_pairs d1 )
2119: {
2120: ND_pairs e,d2,d3,dd,p;
1.61 noro 2121: UINT *id,*jd;
1.1 noro 2122:
2123: for ( dd = 0, e = d1; e; e = d3 ) {
/* e is the last remaining element: nothing to compare with, keep it */
2124: if ( !(d2 = NEXT(e)) ) {
2125: NEXT(e) = dd;
2126: return e;
2127: }
1.34 noro 2128: id = LCM(e);
/* d3 collects the elements that stay in the list for the next round */
1.1 noro 2129: for ( d3 = 0; d2; d2 = p ) {
1.34 noro 2130: p = NEXT(d2);
2131: jd = LCM(d2);
/* the two inner else's below bind as: if(eq) ; else if(td>) { if(red) continue; else ; } else if(red') goto delit; */
2132: if ( ndl_equal(jd,id) )
2133: ;
2134: else if ( TD(jd) > TD(id) )
1.1 noro 2135: if ( ndl_reducible(jd,id) ) continue;
2136: else ;
1.34 noro 2137: else if ( ndl_reducible(id,jd) ) goto delit;
/* keep d2 */
1.1 noro 2138: NEXT(d2) = d3;
2139: d3 = d2;
2140: }
/* e survived the whole scan: move it to the result list */
2141: NEXT(e) = dd;
2142: dd = e;
2143: continue;
2144: /**/
/* e is discarded: keep d2 and every element not yet scanned, then free e */
2145: delit: NEXT(d2) = d3;
2146: d3 = d2;
2147: for ( ; p; p = d2 ) {
2148: d2 = NEXT(p);
2149: NEXT(p) = d3;
2150: d3 = p;
2151: }
2152: FREENDP(e);
2153: }
2154: return dd;
2155: }
2156:
2157: ND_pairs crit_F( ND_pairs d1 )
2158: {
2159: ND_pairs rest, head,remove;
2160: ND_pairs last, p, r, w;
2161: int s;
2162:
2163: for ( head = last = 0, p = d1; NEXT(p); ) {
2164: r = w = equivalent_pairs(p,&rest);
1.14 noro 2165: s = SG(r);
1.1 noro 2166: w = NEXT(w);
2167: while ( w ) {
2168: if ( crit_2(w->i1,w->i2) ) {
2169: r = w;
2170: w = NEXT(w);
2171: while ( w ) {
2172: remove = w;
2173: w = NEXT(w);
2174: FREENDP(remove);
2175: }
2176: break;
1.14 noro 2177: } else if ( SG(w) < s ) {
1.1 noro 2178: FREENDP(r);
2179: r = w;
1.14 noro 2180: s = SG(r);
1.1 noro 2181: w = NEXT(w);
2182: } else {
2183: remove = w;
2184: w = NEXT(w);
2185: FREENDP(remove);
2186: }
2187: }
2188: if ( last ) NEXT(last) = r;
2189: else head = r;
2190: NEXT(last = r) = 0;
2191: p = rest;
2192: if ( !p ) return head;
2193: }
2194: if ( !last ) return p;
2195: NEXT(last) = p;
2196: return head;
2197: }
2198:
2199: int crit_2( int dp1, int dp2 )
2200: {
1.20 noro 2201: return ndl_disjoint(DL(nd_psh[dp1]),DL(nd_psh[dp2]));
1.1 noro 2202: }
2203:
1.40 noro 2204: ND_pairs equivalent_pairs( ND_pairs d1, ND_pairs *prest )
1.1 noro 2205: {
2206: ND_pairs w,p,r,s;
1.61 noro 2207: UINT *d;
1.1 noro 2208:
2209: w = d1;
1.34 noro 2210: d = LCM(w);
1.1 noro 2211: s = NEXT(w);
2212: NEXT(w) = 0;
2213: for ( r = 0; s; s = p ) {
2214: p = NEXT(s);
1.34 noro 2215: if ( ndl_equal(d,LCM(s)) ) {
1.39 noro 2216: NEXT(s) = w; w = s;
1.1 noro 2217: } else {
1.39 noro 2218: NEXT(s) = r; r = s;
1.1 noro 2219: }
2220: }
2221: *prest = r;
2222: return w;
2223: }
2224:
2225: NODE update_base(NODE nd,int ndp)
2226: {
1.61 noro 2227: UINT *dl, *dln;
1.1 noro 2228: NODE last, p, head;
2229:
1.20 noro 2230: dl = DL(nd_psh[ndp]);
1.1 noro 2231: for ( head = last = 0, p = nd; p; ) {
1.20 noro 2232: dln = DL(nd_psh[(int)BDY(p)]);
1.34 noro 2233: if ( ndl_reducible( dln, dl ) ) {
1.1 noro 2234: p = NEXT(p);
2235: if ( last ) NEXT(last) = p;
2236: } else {
2237: if ( !last ) head = p;
2238: p = NEXT(last = p);
2239: }
2240: }
2241: head = append_one(head,ndp);
2242: return head;
2243: }
2244:
2245: ND_pairs nd_minp( ND_pairs d, ND_pairs *prest )
2246: {
2247: ND_pairs m,ml,p,l;
1.61 noro 2248: UINT *lcm;
1.33 noro 2249: int s,td,len,tlen,c,c1;
1.1 noro 2250:
2251: if ( !(p = NEXT(m = d)) ) {
2252: *prest = p;
2253: NEXT(m) = 0;
2254: return m;
2255: }
1.14 noro 2256: s = SG(m);
1.77 noro 2257: if ( !NoSugar ) {
2258: for ( ml = 0, l = m; p; p = NEXT(l = p) )
2259: if ( (SG(p) < s)
2260: || ((SG(p) == s) && (DL_COMPARE(LCM(p),LCM(m)) < 0)) ) {
2261: ml = l; m = p; s = SG(m);
2262: }
2263: } else {
2264: for ( ml = 0, l = m; p; p = NEXT(l = p) )
2265: if ( DL_COMPARE(LCM(p),LCM(m)) < 0 ) {
2266: ml = l; m = p; s = SG(m);
2267: }
2268: }
1.1 noro 2269: if ( !ml ) *prest = NEXT(m);
2270: else {
2271: NEXT(ml) = NEXT(m);
2272: *prest = d;
2273: }
2274: NEXT(m) = 0;
2275: return m;
2276: }
2277:
1.63 noro 2278: ND_pairs nd_minsugarp( ND_pairs d, ND_pairs *prest )
2279: {
1.69 noro 2280: int msugar,i;
1.63 noro 2281: ND_pairs t,dm0,dm,dr0,dr;
2282:
2283: for ( msugar = SG(d), t = NEXT(d); t; t = NEXT(t) )
2284: if ( SG(t) < msugar ) msugar = SG(t);
2285: dm0 = 0; dr0 = 0;
1.69 noro 2286: for ( i = 0, t = d; t; t = NEXT(t) )
2287: if ( i < nd_f4_nsp && SG(t) == msugar ) {
1.63 noro 2288: if ( dm0 ) NEXT(dm) = t;
2289: else dm0 = t;
2290: dm = t;
1.69 noro 2291: i++;
1.63 noro 2292: } else {
2293: if ( dr0 ) NEXT(dr) = t;
2294: else dr0 = t;
2295: dr = t;
2296: }
2297: NEXT(dm) = 0;
2298: if ( dr0 ) NEXT(dr) = 0;
2299: *prest = dr0;
2300: return dm0;
2301: }
2302:
1.77 noro 2303: int ndv_newps(int m,NDV a,NDV aq)
1.1 noro 2304: {
1.3 noro 2305: int len;
1.13 noro 2306: RHist r;
1.20 noro 2307: NDV b;
1.3 noro 2308:
1.1 noro 2309: if ( nd_psn == nd_pslen ) {
2310: nd_pslen *= 2;
1.11 noro 2311: nd_ps = (NDV *)REALLOC((char *)nd_ps,nd_pslen*sizeof(NDV));
1.53 noro 2312: nd_ps_trace = (NDV *)REALLOC((char *)nd_ps_trace,nd_pslen*sizeof(NDV));
1.13 noro 2313: nd_psh = (RHist *)REALLOC((char *)nd_psh,nd_pslen*sizeof(RHist));
1.61 noro 2314: nd_bound = (UINT **)
2315: REALLOC((char *)nd_bound,nd_pslen*sizeof(UINT *));
1.1 noro 2316: }
1.39 noro 2317: NEWRHist(r); nd_psh[nd_psn] = r;
1.63 noro 2318: nd_ps[nd_psn] = a;
1.39 noro 2319: if ( aq ) {
1.63 noro 2320: nd_ps_trace[nd_psn] = aq;
2321: nd_bound[nd_psn] = ndv_compute_bound(aq);
1.39 noro 2322: SG(r) = SG(aq); ndl_copy(HDL(aq),DL(r));
1.53 noro 2323: } else {
1.63 noro 2324: nd_bound[nd_psn] = ndv_compute_bound(a);
1.53 noro 2325: SG(r) = SG(a); ndl_copy(HDL(a),DL(r));
1.39 noro 2326: }
1.77 noro 2327: if ( nd_demand ) {
2328: if ( aq ) {
2329: ndv_save(nd_ps_trace[nd_psn],nd_psn);
2330: nd_ps_trace[nd_psn] = 0;
2331: } else {
2332: ndv_save(nd_ps[nd_psn],nd_psn);
2333: nd_ps[nd_psn] = 0;
2334: }
2335: }
1.1 noro 2336: return nd_psn++;
2337: }
2338:
1.61 noro 2339: void ndv_setup(int mod,int trace,NODE f)
1.1 noro 2340: {
1.5 noro 2341: int i,j,td,len,max;
1.1 noro 2342: NODE s,s0,f0;
1.61 noro 2343: UINT *d;
1.13 noro 2344: RHist r;
1.69 noro 2345: NDV *w;
1.61 noro 2346: NDV a,am;
1.11 noro 2347:
2348: nd_found = 0; nd_notfirst = 0; nd_create = 0;
1.1 noro 2349:
1.69 noro 2350: for ( nd_psn = 0, s = f; s; s = NEXT(s) ) if ( BDY(s) ) nd_psn++;
2351: w = (NDV *)ALLOCA(nd_psn*sizeof(NDV));
2352: for ( i = 0, s = f; s; s = NEXT(s) ) if ( BDY(s) ) w[i++] = BDY(s);
2353: qsort(w,nd_psn,sizeof(NDV),
2354: (int (*)(const void *,const void *))ndv_compare);
2355: nd_pslen = 2*nd_psn;
1.11 noro 2356: nd_ps = (NDV *)MALLOC(nd_pslen*sizeof(NDV));
1.53 noro 2357: nd_ps_trace = (NDV *)MALLOC(nd_pslen*sizeof(NDV));
1.13 noro 2358: nd_psh = (RHist *)MALLOC(nd_pslen*sizeof(RHist));
1.61 noro 2359: nd_bound = (UINT **)MALLOC(nd_pslen*sizeof(UINT *));
1.57 noro 2360:
1.11 noro 2361: if ( !nd_red )
1.13 noro 2362: nd_red = (RHist *)MALLOC(REDTAB_LEN*sizeof(RHist));
1.71 noro 2363: for ( i = 0; i < REDTAB_LEN; i++ ) nd_red[i] = 0;
1.69 noro 2364: for ( i = 0; i < nd_psn; i++ ) {
1.39 noro 2365: if ( trace ) {
1.69 noro 2366: a = nd_ps_trace[i] = ndv_dup(0,w[i]);
1.61 noro 2367: ndv_removecont(0,a);
2368: am = nd_ps[i] = ndv_dup(mod,a);
2369: ndv_mod(mod,am);
2370: ndv_removecont(mod,am);
2371: } else {
1.69 noro 2372: a = nd_ps[i] = ndv_dup(mod,w[i]);
1.61 noro 2373: ndv_removecont(mod,a);
1.39 noro 2374: }
1.61 noro 2375: NEWRHist(r); SG(r) = HTD(a); ndl_copy(HDL(a),DL(r));
1.57 noro 2376: nd_bound[i] = ndv_compute_bound(a);
1.20 noro 2377: nd_psh[i] = r;
1.77 noro 2378: if ( nd_demand ) {
2379: if ( trace ) {
2380: ndv_save(nd_ps_trace[i],i);
2381: nd_ps_trace[i] = 0;
2382: } else {
2383: ndv_save(nd_ps[i],i);
2384: nd_ps[i] = 0;
2385: }
2386: }
1.20 noro 2387: }
2388: }
2389:
1.63 noro 2390: void nd_gr(LIST f,LIST v,int m,int f4,struct order_spec *ord,LIST *rp)
1.1 noro 2391: {
1.61 noro 2392: VL tv,fv,vv,vc;
1.1 noro 2393: NODE fd,fd0,r,r0,t,x,s,xx;
1.61 noro 2394: int e,max,nvar;
1.69 noro 2395: NDV b;
1.77 noro 2396: int ishomo;
1.1 noro 2397:
1.78 noro 2398: if ( !m && Demand ) nd_demand = 1;
2399: else nd_demand = 0;
2400:
1.74 noro 2401: ndv_alloc = 0;
1.1 noro 2402: get_vars((Obj)f,&fv); pltovl(v,&vv);
1.74 noro 2403: for ( nvar = 0, tv = vv; tv; tv = NEXT(tv), nvar++ );
1.32 noro 2404: nd_init_ord(ord);
1.61 noro 2405: for ( t = BDY(f), max = 0; t; t = NEXT(t) )
2406: for ( tv = vv; tv; tv = NEXT(tv) ) {
2407: e = getdeg(tv->v,(P)BDY(t));
2408: max = MAX(e,max);
2409: }
2410: nd_setup_parameters(nvar,max);
1.77 noro 2411: ishomo = 1;
1.1 noro 2412: for ( fd0 = 0, t = BDY(f); t; t = NEXT(t) ) {
1.61 noro 2413: b = (pointer)ptondv(CO,vv,(P)BDY(t));
1.77 noro 2414: if ( ishomo )
2415: ishomo = ishomo && ndv_ishomo(b);
1.69 noro 2416: if ( m ) ndv_mod(m,b);
1.61 noro 2417: if ( b ) { NEXTNODE(fd0,fd); BDY(fd) = (pointer)b; }
1.1 noro 2418: }
2419: if ( fd0 ) NEXT(fd) = 0;
1.61 noro 2420: ndv_setup(m,0,fd0);
1.77 noro 2421: x = f4?nd_f4(m):nd_gb(m,ishomo,0);
1.82 noro 2422: nd_demand = 0;
1.61 noro 2423: x = ndv_reducebase(x);
2424: x = ndv_reduceall(m,x);
1.23 noro 2425: for ( r0 = 0, t = x; t; t = NEXT(t) ) {
1.1 noro 2426: NEXTNODE(r0,r);
1.61 noro 2427: BDY(r) = ndvtop(m,CO,vv,BDY(t));
1.20 noro 2428: }
2429: if ( r0 ) NEXT(r) = 0;
2430: MKLIST(*rp,r0);
1.74 noro 2431: fprintf(asir_out,"ndv_alloc=%d\n",ndv_alloc);
1.20 noro 2432: }
2433:
/*
 * Groebner basis computation using nd_gb_trace() with a modulus m.
 *   f     : list of input polynomials
 *   v     : list of variables
 *   trace : selects the modulus: if |trace| > 1 it is used as the
 *           modulus itself, otherwise primes are taken from
 *           get_lprime(); a negative value additionally disables the
 *           final check of the candidate (nocheck)
 *   homo  : if set and the input is not homogeneous (per ndv_ishomo),
 *           the input is homogenized with one extra variable
 *   ord   : term order
 *   rp    : receives the result list; set to 0 on failure when the
 *           modulus was given explicitly (trace > 1)
 * When the modulus comes from get_lprime(), the computation is retried
 * with the next prime whenever nd_gb_trace() fails or
 * ndv_check_candidate() rejects the candidate.
 */
1.52 noro 2434: void nd_gr_trace(LIST f,LIST v,int trace,int homo,struct order_spec *ord,LIST *rp)
1.20 noro 2435: {
2436: struct order_spec ord1;
1.61 noro 2437: VL tv,fv,vv,vc;
1.27 noro 2438: NODE fd,fd0,in0,in,r,r0,t,s,cand;
1.61 noro 2439: int m,nocheck,nvar,mindex,e,max;
2440: NDV c;
2441: NMV a;
1.27 noro 2442: P p;
1.61 noro 2443: EPOS oepos;
1.82 noro 2444: int obpe,oadv,wmax,i,len,cbpe,ishomo;
1.20 noro 2445:
2446: get_vars((Obj)f,&fv); pltovl(v,&vv);
/* nvar = number of variables in vv */
1.74 noro 2447: for ( nvar = 0, tv = vv; tv; tv = NEXT(tv), nvar++ );
1.52 noro 2448: nocheck = 0;
2449: mindex = 0;
2450:
1.78 noro 2451: if ( Demand ) nd_demand = 1;
2452: else nd_demand = 0;
2453:
1.52 noro 2454: /* setup modulus */
2455: if ( trace < 0 ) {
2456: trace = -trace;
2457: nocheck = 1;
2458: }
2459: m = trace > 1 ? trace : get_lprime(mindex);
/* max = largest degree of any input in any single variable */
1.61 noro 2460: for ( t = BDY(f), max = 0; t; t = NEXT(t) )
2461: for ( tv = vv; tv; tv = NEXT(tv) ) {
2462: e = getdeg(tv->v,(P)BDY(t));
2463: max = MAX(e,max);
1.23 noro 2464: }
1.61 noro 2465: nd_init_ord(ord);
2466: nd_setup_parameters(nvar,max);
/* remember the exponent layout of the original (non-homogenized) input */
2467: obpe = nd_bpe; oadv = nmv_adv; oepos = nd_epos;
1.82 noro 2468: ishomo = 1;
/* in0: converted inputs (kept for the final check), fd0: working copies */
/* NOTE(review): ndv_ishomo(c) is called before c is tested for null - confirm it accepts a null argument */
1.61 noro 2469: for ( in0 = 0, fd0 = 0, t = BDY(f); t; t = NEXT(t) ) {
2470: c = ptondv(CO,vv,(P)BDY(t));
1.82 noro 2471: if ( ishomo )
2472: ishomo = ishomo && ndv_ishomo(c);
1.61 noro 2473: if ( c ) {
2474: NEXTNODE(in0,in); BDY(in) = (pointer)c;
2475: NEXTNODE(fd0,fd); BDY(fd) = (pointer)ndv_dup(0,c);
1.23 noro 2476: }
1.61 noro 2477: }
2478: if ( in0 ) NEXT(in) = 0;
2479: if ( fd0 ) NEXT(fd) = 0;
/* homogenization: wmax = largest total degree over all terms; switch to the homogenized order with nvar+1 variables */
1.82 noro 2480: if ( !ishomo && homo ) {
1.61 noro 2481: for ( t = in0, wmax = 0; t; t = NEXT(t) ) {
2482: c = (NDV)BDY(t); len = LEN(c);
2483: for ( a = BDY(c), i = 0; i < len; i++, NMV_ADV(a) )
2484: wmax = MAX(TD(DL(a)),wmax);
2485: }
2486: homogenize_order(ord,nvar,&ord1);
2487: nd_init_ord(&ord1);
2488: nd_setup_parameters(nvar+1,wmax);
2489: for ( t = fd0; t; t = NEXT(t) )
2490: ndv_homogenize((NDV)BDY(t),obpe,oadv,oepos);
1.27 noro 2491: }
/* one iteration per modulus tried */
1.52 noro 2492: while ( 1 ) {
1.77 noro 2493: if ( Demand )
2494: nd_demand = 1;
1.61 noro 2495: ndv_setup(m,1,fd0);
1.82 noro 2496: cand = nd_gb_trace(m,ishomo || homo);
1.52 noro 2497: if ( !cand ) {
2498: /* failure */
1.61 noro 2499: if ( trace > 1 ) { *rp = 0; return; }
2500: else m = get_lprime(++mindex);
1.52 noro 2501: continue;
2502: }
1.82 noro 2503: if ( !ishomo && homo ) {
1.27 noro 2504: /* dehomogenization */
1.61 noro 2505: for ( t = cand; t; t = NEXT(t) ) ndv_dehomogenize((NDV)BDY(t),ord);
1.45 noro 2506: nd_init_ord(ord);
1.61 noro 2507: nd_setup_parameters(nvar,0);
1.27 noro 2508: }
1.77 noro 2509: nd_demand = 0;
1.61 noro 2510: cand = ndv_reducebase(cand);
2511: cand = ndv_reduceall(0,cand);
/* remember nd_bpe of the candidate; it is restored after the loop */
1.78 noro 2512: cbpe = nd_bpe;
1.61 noro 2513: if ( nocheck )
2514: break;
2515: if ( ndv_check_candidate(in0,obpe,oadv,oepos,cand) )
1.52 noro 2516: /* success */
2517: break;
2518: else if ( trace > 1 ) {
2519: /* failure */
2520: *rp = 0; return;
1.61 noro 2521: } else {
1.52 noro 2522: /* try the next modulus */
2523: m = get_lprime(++mindex);
1.61 noro 2524: /* reset the parameters */
1.82 noro 2525: if ( !ishomo && homo ) {
1.61 noro 2526: nd_init_ord(&ord1);
2527: nd_setup_parameters(nvar+1,wmax);
2528: } else {
2529: nd_init_ord(ord);
2530: nd_setup_parameters(nvar,max);
2531: }
2532: }
1.52 noro 2533: }
1.27 noro 2534: /* dp->p */
1.61 noro 2535: nd_bpe = cbpe;
1.73 noro 2536: nd_setup_parameters(nd_nvar,0);
/* the candidate list is converted in place and returned as the result */
1.61 noro 2537: for ( r = cand; r; r = NEXT(r) ) BDY(r) = (pointer)ndvtop(0,CO,vv,BDY(r));
1.27 noro 2538: MKLIST(*rp,cand);
1.1 noro 2539: }
2540:
1.61 noro 2541: void dltondl(int n,DL dl,UINT *r)
1.1 noro 2542: {
1.61 noro 2543: UINT *d;
1.57 noro 2544: int i,j,l,s,ord_l;
1.43 noro 2545: struct order_pair *op;
1.1 noro 2546:
2547: d = dl->d;
1.41 noro 2548: for ( i = 0; i < nd_wpd; i++ ) r[i] = 0;
1.43 noro 2549: if ( nd_blockmask ) {
2550: l = nd_blockmask->n;
2551: op = nd_blockmask->order_pair;
2552: for ( j = 0, s = 0; j < l; j++ ) {
2553: ord_l = op[j].length;
1.57 noro 2554: for ( i = 0; i < ord_l; i++, s++ ) PUT_EXP(r,s,d[s]);
1.43 noro 2555: }
2556: TD(r) = ndl_weight(r);
1.61 noro 2557: ndl_weight_mask(r);
1.43 noro 2558: } else {
1.56 noro 2559: for ( i = 0; i < n; i++ ) PUT_EXP(r,i,d[i]);
1.43 noro 2560: TD(r) = ndl_weight(r);
2561: }
1.1 noro 2562: }
2563:
1.61 noro 2564: DL ndltodl(int n,UINT *ndl)
1.1 noro 2565: {
2566: DL dl;
2567: int *d;
1.57 noro 2568: int i,j,l,s,ord_l;
1.43 noro 2569: struct order_pair *op;
1.1 noro 2570:
2571: NEWDL(dl,n);
1.34 noro 2572: dl->td = TD(ndl);
1.1 noro 2573: d = dl->d;
1.43 noro 2574: if ( nd_blockmask ) {
2575: l = nd_blockmask->n;
2576: op = nd_blockmask->order_pair;
2577: for ( j = 0, s = 0; j < l; j++ ) {
2578: ord_l = op[j].length;
1.57 noro 2579: for ( i = 0; i < ord_l; i++, s++ ) d[s] = GET_EXP(ndl,s);
1.43 noro 2580: }
2581: } else {
1.56 noro 2582: for ( i = 0; i < n; i++ ) d[i] = GET_EXP(ndl,i);
1.43 noro 2583: }
1.1 noro 2584: return dl;
2585: }
2586:
1.61 noro 2587: void ndl_print(UINT *dl)
1.1 noro 2588: {
2589: int n;
1.57 noro 2590: int i,j,l,ord_l,s,s0;
1.43 noro 2591: struct order_pair *op;
1.1 noro 2592:
2593: n = nd_nvar;
2594: printf("<<");
1.43 noro 2595: if ( nd_blockmask ) {
2596: l = nd_blockmask->n;
2597: op = nd_blockmask->order_pair;
2598: for ( j = 0, s = s0 = 0; j < l; j++ ) {
2599: ord_l = op[j].length;
1.57 noro 2600: for ( i = 0; i < ord_l; i++, s++ )
2601: printf(s==n-1?"%d":"%d,",GET_EXP(dl,s));
1.43 noro 2602: }
2603: } else {
1.56 noro 2604: for ( i = 0; i < n; i++ ) printf(i==n-1?"%d":"%d,",GET_EXP(dl,i));
1.43 noro 2605: }
1.1 noro 2606: printf(">>");
2607: }
2608:
2609: void nd_print(ND p)
2610: {
2611: NM m;
2612:
2613: if ( !p )
2614: printf("0\n");
2615: else {
2616: for ( m = BDY(p); m; m = NEXT(m) ) {
1.71 noro 2617: if ( CM(m) & 0x80000000 ) printf("+@_%d*",IFTOF(CM(m)));
2618: else printf("+%d*",CM(m));
1.14 noro 2619: ndl_print(DL(m));
1.1 noro 2620: }
2621: printf("\n");
2622: }
2623: }
2624:
1.16 noro 2625: void nd_print_q(ND p)
2626: {
2627: NM m;
2628:
2629: if ( !p )
2630: printf("0\n");
2631: else {
2632: for ( m = BDY(p); m; m = NEXT(m) ) {
2633: printf("+");
1.74 noro 2634: printexpr(CO,(Obj)CQ(m));
1.16 noro 2635: printf("*");
2636: ndl_print(DL(m));
2637: }
2638: printf("\n");
2639: }
2640: }
2641:
1.1 noro 2642: void ndp_print(ND_pairs d)
2643: {
2644: ND_pairs t;
2645:
1.34 noro 2646: for ( t = d; t; t = NEXT(t) ) printf("%d,%d ",t->i1,t->i2);
1.1 noro 2647: printf("\n");
2648: }
2649:
1.20 noro 2650: void nd_removecont(int mod,ND p)
1.16 noro 2651: {
2652: int i,n;
2653: Q *w;
2654: Q dvr,t;
2655: NM m;
1.21 noro 2656: struct oVECT v;
2657: N q,r;
1.16 noro 2658:
1.71 noro 2659: if ( mod == -1 ) nd_mul_c(mod,p,_invsf(HCM(p)));
2660: else if ( mod ) nd_mul_c(mod,p,invm(HCM(p),mod));
1.20 noro 2661: else {
2662: for ( m = BDY(p), n = 0; m; m = NEXT(m), n++ );
2663: w = (Q *)ALLOCA(n*sizeof(Q));
1.21 noro 2664: v.len = n;
2665: v.body = (pointer *)w;
1.34 noro 2666: for ( m = BDY(p), i = 0; i < n; m = NEXT(m), i++ ) w[i] = CQ(m);
1.21 noro 2667: removecont_array(w,n);
2668: for ( m = BDY(p), i = 0; i < n; m = NEXT(m), i++ ) CQ(m) = w[i];
1.16 noro 2669: }
2670: }
2671:
1.21 noro 2672: void nd_removecont2(ND p1,ND p2)
2673: {
2674: int i,n1,n2,n;
2675: Q *w;
2676: Q dvr,t;
2677: NM m;
2678: struct oVECT v;
2679: N q,r;
2680:
2681: if ( !p1 ) {
2682: nd_removecont(0,p2); return;
2683: } else if ( !p2 ) {
2684: nd_removecont(0,p1); return;
2685: }
2686: n1 = nd_length(p1);
2687: n2 = nd_length(p2);
2688: n = n1+n2;
2689: w = (Q *)ALLOCA(n*sizeof(Q));
2690: v.len = n;
2691: v.body = (pointer *)w;
1.34 noro 2692: for ( m = BDY(p1), i = 0; i < n1; m = NEXT(m), i++ ) w[i] = CQ(m);
2693: for ( m = BDY(p2); i < n; m = NEXT(m), i++ ) w[i] = CQ(m);
1.21 noro 2694: removecont_array(w,n);
2695: for ( m = BDY(p1), i = 0; i < n1; m = NEXT(m), i++ ) CQ(m) = w[i];
2696: for ( m = BDY(p2); i < n; m = NEXT(m), i++ ) CQ(m) = w[i];
2697: }
2698:
1.20 noro 2699: void ndv_removecont(int mod,NDV p)
1.16 noro 2700: {
2701: int i,len;
2702: Q *w;
2703: Q dvr,t;
2704: NMV m;
2705:
1.71 noro 2706: if ( mod == -1 )
2707: ndv_mul_c(mod,p,_invsf(HCM(p)));
2708: else if ( mod )
1.20 noro 2709: ndv_mul_c(mod,p,invm(HCM(p),mod));
2710: else {
2711: len = p->len;
2712: w = (Q *)ALLOCA(len*sizeof(Q));
1.34 noro 2713: for ( m = BDY(p), i = 0; i < len; NMV_ADV(m), i++ ) w[i] = CQ(m);
1.20 noro 2714: sortbynm(w,len);
2715: qltozl(w,len,&dvr);
2716: for ( m = BDY(p), i = 0; i < len; NMV_ADV(m), i++ ) {
2717: divq(CQ(m),dvr,&t); CQ(m) = t;
2718: }
1.16 noro 2719: }
1.21 noro 2720: }
2721:
1.61 noro 2722: void ndv_homogenize(NDV p,int obpe,int oadv,EPOS oepos)
2723: {
2724: int len,i,max;
2725: NMV m,mr0,mr,t;
2726:
2727: len = p->len;
2728: for ( m = BDY(p), i = 0, max = 0; i < len; NMV_OADV(m), i++ )
2729: max = MAX(max,TD(DL(m)));
2730: mr0 = nmv_adv>oadv?(NMV)REALLOC(BDY(p),len*nmv_adv):BDY(p);
2731: m = (NMV)((char *)mr0+(len-1)*oadv);
2732: mr = (NMV)((char *)mr0+(len-1)*nmv_adv);
2733: t = (NMV)ALLOCA(nmv_adv);
2734: for ( i = 0; i < len; i++, NMV_OPREV(m), NMV_PREV(mr) ) {
2735: ndl_homogenize(DL(m),DL(t),obpe,oepos,max);
2736: CQ(mr) = CQ(m);
2737: ndl_copy(DL(t),DL(mr));
2738: }
2739: NV(p)++;
2740: BDY(p) = mr0;
2741: }
2742:
1.45 noro 2743: void ndv_dehomogenize(NDV p,struct order_spec *ord)
1.23 noro 2744: {
1.45 noro 2745: int i,j,adj,len,newnvar,newwpd,newadv,newexporigin;
1.23 noro 2746: Q *w;
2747: Q dvr,t;
2748: NMV m,r;
2749:
2750: len = p->len;
2751: newnvar = nd_nvar-1;
1.48 noro 2752: newexporigin = nd_get_exporigin(ord);
1.45 noro 2753: newwpd = newnvar/nd_epw+(newnvar%nd_epw?1:0)+newexporigin;
1.23 noro 2754: for ( m = BDY(p), i = 0; i < len; NMV_ADV(m), i++ )
1.34 noro 2755: ndl_dehomogenize(DL(m));
1.23 noro 2756: if ( newwpd != nd_wpd ) {
1.61 noro 2757: newadv = sizeof(struct oNMV)+(newwpd-1)*sizeof(UINT);
2758: for ( m = r = BDY(p), i = 0; i < len; NMV_ADV(m), NDV_NADV(r), i++ ) {
1.45 noro 2759: CQ(r) = CQ(m);
2760: for ( j = 0; j < newexporigin; j++ ) DL(r)[j] = DL(m)[j];
2761: adj = nd_exporigin-newexporigin;
2762: for ( ; j < newwpd; j++ ) DL(r)[j] = DL(m)[j+adj];
1.23 noro 2763: }
2764: }
2765: NV(p)--;
2766: }
2767:
1.21 noro 2768: void removecont_array(Q *c,int n)
2769: {
2770: struct oVECT v;
2771: Q d0,d1,a,u,u1,gcd;
2772: int i;
2773: N qn,rn,gn;
2774: Q *q,*r;
2775:
2776: q = (Q *)ALLOCA(n*sizeof(Q));
2777: r = (Q *)ALLOCA(n*sizeof(Q));
2778: v.id = O_VECT; v.len = n; v.body = (pointer *)c;
2779: igcdv_estimate(&v,&d0);
2780: for ( i = 0; i < n; i++ ) {
2781: divn(NM(c[i]),NM(d0),&qn,&rn);
2782: NTOQ(qn,SGN(c[i])*SGN(d0),q[i]);
2783: NTOQ(rn,SGN(c[i]),r[i]);
2784: }
1.34 noro 2785: for ( i = 0; i < n; i++ ) if ( r[i] ) break;
1.21 noro 2786: if ( i < n ) {
2787: v.id = O_VECT; v.len = n; v.body = (pointer *)r;
2788: igcdv(&v,&d1);
2789: gcdn(NM(d0),NM(d1),&gn); NTOQ(gn,1,gcd);
2790: divsn(NM(d0),gn,&qn); NTOQ(qn,1,a);
2791: for ( i = 0; i < n; i++ ) {
2792: mulq(a,q[i],&u);
2793: if ( r[i] ) {
2794: divsn(NM(r[i]),gn,&qn); NTOQ(qn,SGN(r[i]),u1);
2795: addq(u,u1,&q[i]);
2796: } else
2797: q[i] = u;
2798: }
2799: }
1.34 noro 2800: for ( i = 0; i < n; i++ ) c[i] = q[i];
1.16 noro 2801: }
2802:
1.19 noro 2803: void nd_mul_c(int mod,ND p,int mul)
1.1 noro 2804: {
2805: NM m;
2806: int c,c1;
2807:
1.34 noro 2808: if ( !p ) return;
1.71 noro 2809: if ( mod == -1 )
2810: for ( m = BDY(p); m; m = NEXT(m) )
2811: CM(m) = _mulsf(CM(m),mul);
2812: else
2813: for ( m = BDY(p); m; m = NEXT(m) ) {
2814: c1 = CM(m); DMAR(c1,mul,0,mod,c); CM(m) = c;
2815: }
1.1 noro 2816: }
2817:
1.16 noro 2818: void nd_mul_c_q(ND p,Q mul)
2819: {
2820: NM m;
2821: Q c;
2822:
1.34 noro 2823: if ( !p ) return;
1.16 noro 2824: for ( m = BDY(p); m; m = NEXT(m) ) {
2825: mulq(CQ(m),mul,&c); CQ(m) = c;
2826: }
2827: }
2828:
1.61 noro 2829: void nd_mul_c_p(VL vl,ND p,P mul)
2830: {
2831: NM m;
2832: P c;
2833:
2834: if ( !p ) return;
2835: for ( m = BDY(p); m; m = NEXT(m) ) {
2836: mulp(vl,CP(m),mul,&c); CP(m) = c;
2837: }
2838: }
2839:
1.1 noro 2840: void nd_free(ND p)
2841: {
2842: NM t,s;
2843:
1.34 noro 2844: if ( !p ) return;
1.1 noro 2845: t = BDY(p);
2846: while ( t ) {
2847: s = NEXT(t);
2848: FREENM(t);
2849: t = s;
2850: }
2851: FREEND(p);
2852: }
2853:
1.23 noro 2854: void ndv_free(NDV p)
2855: {
2856: GC_free(BDY(p));
2857: }
2858:
1.61 noro 2859: void nd_append_red(UINT *d,int i)
1.1 noro 2860: {
1.13 noro 2861: RHist m,m0;
1.1 noro 2862: int h;
2863:
1.13 noro 2864: NEWRHist(m);
1.34 noro 2865: h = ndl_hash_value(d);
1.13 noro 2866: m->index = i;
1.14 noro 2867: ndl_copy(d,DL(m));
1.1 noro 2868: NEXT(m) = nd_red[h];
2869: nd_red[h] = m;
2870: }
2871:
1.61 noro 2872: UINT *ndv_compute_bound(NDV p)
1.1 noro 2873: {
1.61 noro 2874: UINT *d1,*d2,*t;
2875: UINT u;
1.57 noro 2876: int i,j,k,l,len,ind;
1.45 noro 2877: NMV m;
1.1 noro 2878:
2879: if ( !p )
2880: return 0;
1.61 noro 2881: d1 = (UINT *)ALLOCA(nd_wpd*sizeof(UINT));
2882: d2 = (UINT *)ALLOCA(nd_wpd*sizeof(UINT));
1.45 noro 2883: len = LEN(p);
2884: m = BDY(p); ndl_copy(DL(m),d1); NMV_ADV(m);
2885: for ( i = 1; i < len; i++, NMV_ADV(m) ) {
1.14 noro 2886: ndl_lcm(DL(m),d1,d2);
1.1 noro 2887: t = d1; d1 = d2; d2 = t;
2888: }
1.12 noro 2889: l = nd_nvar+31;
1.61 noro 2890: t = (UINT *)MALLOC_ATOMIC(l*sizeof(UINT));
1.57 noro 2891: for ( i = nd_exporigin, ind = 0; i < nd_wpd; i++ ) {
2892: u = d1[i];
2893: k = (nd_epw-1)*nd_bpe;
2894: for ( j = 0; j < nd_epw; j++, k -= nd_bpe, ind++ )
2895: t[ind] = (u>>k)&nd_mask0;
2896: }
2897: for ( ; ind < l; ind++ ) t[ind] = 0;
1.1 noro 2898: return t;
2899: }
2900:
1.48 noro 2901: int nd_get_exporigin(struct order_spec *ord)
2902: {
1.51 noro 2903: switch ( ord->id ) {
1.41 noro 2904: case 0:
1.48 noro 2905: return 1;
1.41 noro 2906: case 1:
2907: /* block order */
1.43 noro 2908: /* d[0]:weight d[1]:w0,...,d[nd_exporigin-1]:w(n-1) */
1.48 noro 2909: return ord->ord.block.length+1;
1.41 noro 2910: case 2:
1.52 noro 2911: error("nd_get_exporigin : matrix order is not supported yet.");
1.41 noro 2912: }
1.48 noro 2913: }
2914:
1.61 noro 2915: void nd_setup_parameters(int nvar,int max) {
1.79 noro 2916: int i,j,n,elen,ord_o,ord_l,l,s,wpd;
1.57 noro 2917: struct order_pair *op;
1.48 noro 2918:
1.73 noro 2919: nd_nvar = nvar;
1.79 noro 2920: if ( max ) {
1.83 noro 2921: /* XXX */
2922: if ( do_weyl ) nd_bpe = 32;
2923: else if ( max < 2 ) nd_bpe = 1;
1.79 noro 2924: else if ( max < 4 ) nd_bpe = 2;
2925: else if ( max < 8 ) nd_bpe = 3;
2926: else if ( max < 16 ) nd_bpe = 4;
2927: else if ( max < 32 ) nd_bpe = 5;
2928: else if ( max < 64 ) nd_bpe = 6;
2929: else if ( max < 256 ) nd_bpe = 8;
2930: else if ( max < 1024 ) nd_bpe = 10;
2931: else if ( max < 65536 ) nd_bpe = 16;
2932: else nd_bpe = 32;
2933: }
1.61 noro 2934: nd_epw = (sizeof(UINT)*8)/nd_bpe;
1.48 noro 2935: elen = nd_nvar/nd_epw+(nd_nvar%nd_epw?1:0);
2936: nd_exporigin = nd_get_exporigin(nd_ord);
1.79 noro 2937: wpd = nd_exporigin+elen;
2938: if ( wpd != nd_wpd ) {
2939: nd_free_private_storage();
2940: nd_wpd = wpd;
2941: }
1.1 noro 2942: if ( nd_bpe < 32 ) {
2943: nd_mask0 = (1<<nd_bpe)-1;
2944: } else {
2945: nd_mask0 = 0xffffffff;
2946: }
2947: bzero(nd_mask,sizeof(nd_mask));
2948: nd_mask1 = 0;
2949: for ( i = 0; i < nd_epw; i++ ) {
2950: nd_mask[nd_epw-i-1] = (nd_mask0<<(i*nd_bpe));
2951: nd_mask1 |= (1<<(nd_bpe-1))<<(i*nd_bpe);
2952: }
1.61 noro 2953: nm_adv = sizeof(struct oNM)+(nd_wpd-1)*sizeof(UINT);
2954: nmv_adv = sizeof(struct oNMV)+(nd_wpd-1)*sizeof(UINT);
1.57 noro 2955: nd_epos = nd_create_epos(nd_ord);
1.43 noro 2956: nd_blockmask = nd_create_blockmask(nd_ord);
1.1 noro 2957: }
2958:
/*
 * Enlarge the number of bits per exponent (nd_bpe) to the next value in
 * the sequence 2,3,4,5,6,8,10,16,32 and convert all exponent data to
 * the new layout: the basis polynomials nd_ps (and nd_ps_trace when
 * trace is set), the pair list d, the reducer hash table nd_red and the
 * head-term histories nd_psh.
 * Returns the converted copy of the pair list d.  error() is called if
 * nd_bpe is already 32 or more.  The parameter mod is not used in the
 * body.
 */
1.20 noro 2959: ND_pairs nd_reconstruct(int mod,int trace,ND_pairs d)
1.1 noro 2960: {
1.37 noro 2961: int i,obpe,oadv,h;
1.71 noro 2962: static NM prev_nm_free_list;
2963: static ND_pairs prev_ndp_free_list;
1.13 noro 2964: RHist mr0,mr;
2965: RHist r;
1.37 noro 2966: RHist *old_red;
1.71 noro 2967: ND_pairs s0,s,t;
1.43 noro 2968: EPOS oepos;
1.15 noro 2969:
/* remember the old layout; it is needed to read the existing data */
1.1 noro 2970: obpe = nd_bpe;
1.11 noro 2971: oadv = nmv_adv;
1.43 noro 2972: oepos = nd_epos;
1.63 noro 2973: if ( obpe < 2 ) nd_bpe = 2;
2974: else if ( obpe < 3 ) nd_bpe = 3;
1.62 noro 2975: else if ( obpe < 4 ) nd_bpe = 4;
1.63 noro 2976: else if ( obpe < 5 ) nd_bpe = 5;
1.34 noro 2977: else if ( obpe < 6 ) nd_bpe = 6;
2978: else if ( obpe < 8 ) nd_bpe = 8;
1.63 noro 2979: else if ( obpe < 10 ) nd_bpe = 10;
1.34 noro 2980: else if ( obpe < 16 ) nd_bpe = 16;
2981: else if ( obpe < 32 ) nd_bpe = 32;
2982: else error("nd_reconstruct : exponent too large");
1.5 noro 2983:
/* max == 0: keep the nd_bpe chosen above and recompute the derived parameters */
1.73 noro 2984: nd_setup_parameters(nd_nvar,0);
/* the current free lists are set aside in static variables and emptied, so that cells allocated below do not come from them */
/* NOTE(review): presumably because the old cells have the old size - confirm */
1.1 noro 2985: prev_nm_free_list = _nm_free_list;
2986: prev_ndp_free_list = _ndp_free_list;
2987: _nm_free_list = 0;
2988: _ndp_free_list = 0;
/* convert the basis polynomials, from the last index to the first */
1.53 noro 2989: for ( i = nd_psn-1; i >= 0; i-- ) ndv_realloc(nd_ps[i],obpe,oadv,oepos);
2990: if ( trace )
2991: for ( i = nd_psn-1; i >= 0; i-- )
2992: ndv_realloc(nd_ps_trace[i],obpe,oadv,oepos);
/* build a converted copy s0 of the pair list d */
1.1 noro 2993: s0 = 0;
2994: for ( t = d; t; t = NEXT(t) ) {
2995: NEXTND_pairs(s0,s);
2996: s->i1 = t->i1;
2997: s->i2 = t->i2;
1.14 noro 2998: SG(s) = SG(t);
1.61 noro 2999: ndl_reconstruct(LCM(t),LCM(s),obpe,oepos);
1.1 noro 3000: }
1.37 noro 3001:
/* rebuild the reducer hash table: move the chains to old_red, then re-insert converted copies under their new hash values */
3002: old_red = (RHist *)ALLOCA(REDTAB_LEN*sizeof(RHist));
1.6 noro 3003: for ( i = 0; i < REDTAB_LEN; i++ ) {
1.37 noro 3004: old_red[i] = nd_red[i];
3005: nd_red[i] = 0;
3006: }
3007: for ( i = 0; i < REDTAB_LEN; i++ )
3008: for ( r = old_red[i]; r; r = NEXT(r) ) {
3009: NEWRHist(mr);
1.13 noro 3010: mr->index = r->index;
1.20 noro 3011: SG(mr) = SG(r);
1.61 noro 3012: ndl_reconstruct(DL(r),DL(mr),obpe,oepos);
1.37 noro 3013: h = ndl_hash_value(DL(mr));
3014: NEXT(mr) = nd_red[h];
3015: nd_red[h] = mr;
1.6 noro 3016: }
/* drop the references to the old chains */
1.37 noro 3017: for ( i = 0; i < REDTAB_LEN; i++ ) old_red[i] = 0;
3018: old_red = 0;
/* replace every head-term history by a converted copy */
1.11 noro 3019: for ( i = 0; i < nd_psn; i++ ) {
1.20 noro 3020: NEWRHist(r); SG(r) = SG(nd_psh[i]);
1.61 noro 3021: ndl_reconstruct(DL(nd_psh[i]),DL(r),obpe,oepos);
1.13 noro 3022: nd_psh[i] = r;
1.11 noro 3023: }
1.1 noro 3024: if ( s0 ) NEXT(s) = 0;
/* the old free lists are no longer referenced from here */
3025: prev_nm_free_list = 0;
3026: prev_ndp_free_list = 0;
1.71 noro 3027: #if 0
1.1 noro 3028: GC_gcollect();
1.71 noro 3029: #endif
1.1 noro 3030: return s0;
3031: }
3032:
1.61 noro 3033: void ndl_reconstruct(UINT *d,UINT *r,int obpe,EPOS oepos)
1.1 noro 3034: {
1.57 noro 3035: int n,i,ei,oepw,omask0,j,s,ord_l,l;
1.43 noro 3036: struct order_pair *op;
1.1 noro 3037:
3038: n = nd_nvar;
1.61 noro 3039: oepw = (sizeof(UINT)*8)/obpe;
1.43 noro 3040: omask0 = (1<<obpe)-1;
1.34 noro 3041: TD(r) = TD(d);
1.41 noro 3042: for ( i = nd_exporigin; i < nd_wpd; i++ ) r[i] = 0;
1.43 noro 3043: if ( nd_blockmask ) {
3044: l = nd_blockmask->n;
3045: op = nd_blockmask->order_pair;
3046: for ( i = 1; i < nd_exporigin; i++ )
3047: r[i] = d[i];
3048: for ( j = 0, s = 0; j < l; j++ ) {
3049: ord_l = op[j].length;
1.57 noro 3050: for ( i = 0; i < ord_l; i++, s++ ) {
3051: ei = GET_EXP_OLD(d,s);
3052: PUT_EXP(r,s,ei);
3053: }
1.1 noro 3054: }
1.43 noro 3055: } else {
1.56 noro 3056: for ( i = 0; i < n; i++ ) {
3057: ei = GET_EXP_OLD(d,i);
3058: PUT_EXP(r,i,ei);
3059: }
1.1 noro 3060: }
3061: }
1.3 noro 3062:
1.6 noro 3063: ND nd_copy(ND p)
3064: {
3065: NM m,mr,mr0;
1.41 noro 3066: int c,n;
1.6 noro 3067: ND r;
3068:
3069: if ( !p )
3070: return 0;
3071: else {
3072: for ( mr0 = 0, m = BDY(p); m; m = NEXT(m) ) {
3073: NEXTNM(mr0,mr);
1.14 noro 3074: CM(mr) = CM(m);
3075: ndl_copy(DL(m),DL(mr));
1.6 noro 3076: }
3077: NEXT(mr) = 0;
1.31 noro 3078: MKND(NV(p),mr0,LEN(p),r);
1.14 noro 3079: SG(r) = SG(p);
1.6 noro 3080: return r;
3081: }
3082: }
3083:
1.53 noro 3084: int nd_sp(int mod,int trace,ND_pairs p,ND *rp)
1.11 noro 3085: {
3086: NM m;
3087: NDV p1,p2;
3088: ND t1,t2;
1.61 noro 3089: UINT *lcm;
1.31 noro 3090: int td;
1.11 noro 3091:
1.77 noro 3092: if ( !mod && nd_demand ) {
3093: p1 = ndv_load(p->i1); p2 = ndv_load(p->i2);
1.53 noro 3094: } else {
1.77 noro 3095: if ( trace ) {
3096: p1 = nd_ps_trace[p->i1]; p2 = nd_ps_trace[p->i2];
3097: } else {
3098: p1 = nd_ps[p->i1]; p2 = nd_ps[p->i2];
3099: }
1.20 noro 3100: }
1.34 noro 3101: lcm = LCM(p);
1.11 noro 3102: NEWNM(m);
1.20 noro 3103: CQ(m) = HCQ(p2);
1.34 noro 3104: ndl_sub(lcm,HDL(p1),DL(m));
1.56 noro 3105: if ( ndl_check_bound2(p->i1,DL(m)) )
3106: return 0;
1.55 noro 3107: t1 = ndv_mul_nm(mod,m,p1);
1.71 noro 3108: if ( mod == -1 ) CM(m) = _chsgnsf(HCM(p1));
3109: else if ( mod ) CM(m) = mod-HCM(p1);
1.34 noro 3110: else chsgnq(HCQ(p1),&CQ(m));
3111: ndl_sub(lcm,HDL(p2),DL(m));
1.14 noro 3112: if ( ndl_check_bound2(p->i2,DL(m)) ) {
1.11 noro 3113: nd_free(t1);
3114: return 0;
3115: }
1.55 noro 3116: t2 = ndv_mul_nm(mod,m,p2);
1.31 noro 3117: *rp = nd_add(mod,t1,t2);
1.11 noro 3118: FREENM(m);
3119: return 1;
3120: }
3121:
1.19 noro 3122: void ndv_mul_c(int mod,NDV p,int mul)
1.11 noro 3123: {
3124: NMV m;
3125: int c,c1,len,i;
3126:
1.34 noro 3127: if ( !p ) return;
1.14 noro 3128: len = LEN(p);
1.71 noro 3129: if ( mod == -1 )
3130: for ( m = BDY(p), i = 0; i < len; i++, NMV_ADV(m) )
3131: CM(m) = _mulsf(CM(m),mul);
3132: else
3133: for ( m = BDY(p), i = 0; i < len; i++, NMV_ADV(m) ) {
3134: c1 = CM(m); DMAR(c1,mul,0,mod,c); CM(m) = c;
3135: }
1.11 noro 3136: }
3137:
1.16 noro 3138: void ndv_mul_c_q(NDV p,Q mul)
3139: {
3140: NMV m;
3141: Q c;
3142: int len,i;
3143:
1.34 noro 3144: if ( !p ) return;
1.16 noro 3145: len = LEN(p);
3146: for ( m = BDY(p), i = 0; i < len; i++, NMV_ADV(m) ) {
3147: mulq(CQ(m),mul,&c); CQ(m) = c;
3148: }
3149: }
3150:
1.55 noro 3151: ND weyl_ndv_mul_nm(int mod,NM m0,NDV p) {
3152: int n2,i,j,l,n,tlen;
1.61 noro 3153: UINT *d0;
1.55 noro 3154: NM *tab,*psum;
3155: ND s,r;
3156: NM t;
3157: NMV m1;
3158:
3159: if ( !p ) return 0;
3160: n = NV(p); n2 = n>>1;
3161: d0 = DL(m0);
3162: l = LEN(p);
3163: for ( i = 0, tlen = 1; i < n2; i++ ) tlen *= (GET_EXP(d0,n2+i)+1);
3164: tab = (NM *)ALLOCA(tlen*sizeof(NM));
3165: psum = (NM *)ALLOCA(tlen*sizeof(NM));
3166: for ( i = 0; i < tlen; i++ ) psum[i] = 0;
1.56 noro 3167: m1 = (NMV)(((char *)BDY(p))+nmv_adv*(l-1));
3168: for ( i = l-1; i >= 0; i--, NMV_PREV(m1) ) {
1.55 noro 3169: /* m0(NM) * m1(NMV) => tab(NM) */
1.56 noro 3170: weyl_mul_nm_nmv(n,mod,m0,m1,tab,tlen);
1.55 noro 3171: for ( j = 0; j < tlen; j++ ) {
3172: if ( tab[j] ) {
3173: NEXT(tab[j]) = psum[j]; psum[j] = tab[j];
3174: }
3175: }
3176: }
3177: for ( i = tlen-1, r = 0; i >= 0; i-- )
3178: if ( psum[i] ) {
3179: for ( j = 0, t = psum[i]; t; t = NEXT(t), j++ );
3180: MKND(n,psum[i],j,s);
3181: r = nd_add(mod,r,s);
3182: }
1.56 noro 3183: if ( r ) SG(r) = SG(p)+TD(d0);
3184: return r;
1.55 noro 3185: }
3186:
1.56 noro 3187: /* product of monomials */
3188: /* XXX block order is not handled correctly */
3189:
/*
 * Multiply the monomial m0 by the monomial m1 and store the resulting
 * monomials in tab[0..tlen-1]; entries that are not produced are left 0.
 *
 *   n    : number of variables; n2 = n>>1.  Exponent slots 0..n2-1 and
 *          n2..2*n2-1 are paired (xi and Di in the comment below); an odd n
 *          is treated as having one extra (homogenizing) slot n-1.
 *   mod  : nonzero selects the CM()/DMAR coefficient path, 0 the Q path
 *   tab  : output table, cleared on entry
 *
 * If either monomial is null, tab is only cleared.
 * NOTE(review): mod == -1 would also take the DMAR path here; the visible
 * caller chain (ndv_mul_nm) rejects that case before getting here.
 */
1.55 noro 3190: void weyl_mul_nm_nmv(int n,int mod,NM m0,NMV m1,NM *tab,int tlen)
3191: {
1.56 noro 3192: int i,n2,j,s,curlen,homo,h,a,b,k,l,u,min;
1.61 noro 3193: UINT *d0,*d1,*d,*dt,*ctab;
1.56 noro 3194: Q *ctab_q;
3195: Q q,q1;
1.61 noro 3196: UINT c0,c1,c;
1.55 noro 3197: NM *p;
3198: NM m,t;
3199:
3200: for ( i = 0; i < tlen; i++ ) tab[i] = 0;
3201: if ( !m0 || !m1 ) return;
3202: d0 = DL(m0); d1 = DL(m1); n2 = n>>1;
/* first monomial: carries the product of the two coefficients and a zero
   exponent vector; it becomes tab[0] */
3203: NEWNM(m); d = DL(m);
1.56 noro 3204: if ( mod ) {
3205: c0 = CM(m0); c1 = CM(m1); DMAR(c0,c1,0,mod,c); CM(m) = c;
3206: } else
3207: mulq(CQ(m0),CQ(m1),&CQ(m));
1.55 noro 3208: for ( i = 0; i < nd_wpd; i++ ) d[i] = 0;
3209: homo = n&1 ? 1 : 0;
3210: if ( homo ) {
3211: /* offset of h-degree */
3212: h = GET_EXP(d0,n-1)+GET_EXP(d1,n-1);
3213: PUT_EXP(DL(m),n-1,h);
3214: TD(DL(m)) = h;
1.61 noro 3215: if ( nd_blockmask ) ndl_weight_mask(DL(m));
1.55 noro 3216: }
3217: tab[0] = m;
/* second monomial: scratch exponent vector d, released at the end */
3218: NEWNM(m); d = DL(m);
/* process one (xi,Di) pair per iteration; curlen is the number of table
   slots in use so far and grows by a factor k+1 per pair */
1.57 noro 3219: for ( i = 0, curlen = 1; i < n2; i++ ) {
1.55 noro 3220: a = GET_EXP(d0,i); b = GET_EXP(d1,n2+i);
3221: k = GET_EXP(d0,n2+i); l = GET_EXP(d1,i);
3222: /* xi^a*(Di^k*xi^l)*Di^b */
3223: a += l; b += k;
1.56 noro 3224: s = MUL_WEIGHT(a,i)+MUL_WEIGHT(b,n2+i);
/* k == 0 or l == 0: a single result term for this pair, so the existing
   entries are just updated in place */
1.55 noro 3225: if ( !k || !l ) {
3226: for ( j = 0; j < curlen; j++ )
1.56 noro 3227: if ( t = tab[j] ) {
3228: dt = DL(t);
3229: PUT_EXP(dt,i,a); PUT_EXP(dt,n2+i,b); TD(dt) += s;
1.61 noro 3230: if ( nd_blockmask ) ndl_weight_mask(dt);
1.55 noro 3231: }
3232: curlen *= k+1;
3233: continue;
3234: }
/* general case: min+1 terms, coefficient table filled by mkwcm()/mkwc()
   (presumably the expansion coefficients of Di^k*xi^l -- confirm there) */
3235: min = MIN(k,l);
1.56 noro 3236: if ( mod ) {
1.61 noro 3237: ctab = (UINT *)ALLOCA((min+1)*sizeof(UINT));
1.56 noro 3238: mkwcm(k,l,mod,ctab);
3239: } else {
3240: ctab_q = (Q *)ALLOCA((min+1)*sizeof(Q));
3241: mkwc(k,l,ctab_q);
3242: }
/* j runs downwards: for j > 0 new monomials are created from tab[0..curlen-1]
   into the block starting at tab+curlen*j; j == 0 comes last because it
   overwrites tab[0..curlen-1] in place */
1.57 noro 3243: for ( j = min; j >= 0; j-- ) {
1.56 noro 3244: for ( u = 0; u < nd_wpd; u++ ) d[u] = 0;
1.55 noro 3245: PUT_EXP(d,i,a-j); PUT_EXP(d,n2+i,b-j);
1.56 noro 3246: h = MUL_WEIGHT(a-j,i)+MUL_WEIGHT(b-j,n2+i);
1.55 noro 3247: if ( homo ) {
3248: TD(d) = s;
1.56 noro 3249: PUT_EXP(d,n-1,s-h);
1.55 noro 3250: } else TD(d) = h;
1.61 noro 3251: if ( nd_blockmask ) ndl_weight_mask(d);
1.56 noro 3252: if ( mod ) c = ctab[j];
3253: else q = ctab_q[j];
1.57 noro 3254: p = tab+curlen*j;
3255: if ( j == 0 ) {
3256: for ( u = 0; u < curlen; u++, p++ ) {
3257: if ( tab[u] ) {
3258: ndl_addto(DL(tab[u]),d);
3259: if ( mod ) {
3260: c0 = CM(tab[u]); DMAR(c0,c,0,mod,c1); CM(tab[u]) = c1;
3261: } else {
3262: mulq(CQ(tab[u]),q,&q1); CQ(tab[u]) = q1;
3263: }
3264: }
1.56 noro 3265: }
1.57 noro 3266: } else {
3267: for ( u = 0; u < curlen; u++, p++ ) {
3268: if ( tab[u] ) {
3269: NEWNM(t);
3270: ndl_add(DL(tab[u]),d,DL(t));
3271: if ( mod ) {
3272: c0 = CM(tab[u]); DMAR(c0,c,0,mod,c1); CM(t) = c1;
3273: } else
3274: mulq(CQ(tab[u]),q,&CQ(t));
3275: *p = t;
3276: }
1.55 noro 3277: }
3278: }
3279: }
3280: curlen *= k+1;
3281: }
/* release the scratch monomial */
3282: FREENM(m);
3283: }
3284:
1.63 noro 3285: ND ndv_mul_nm_symbolic(NM m0,NDV p)
3286: {
3287: NM mr,mr0;
3288: NMV m;
3289: UINT *d,*dt,*dm;
3290: int c,n,td,i,c1,c2,len;
3291: Q q;
3292: ND r;
3293:
3294: if ( !p ) return 0;
3295: else {
3296: n = NV(p); m = BDY(p);
3297: d = DL(m0);
3298: len = LEN(p);
3299: mr0 = 0;
3300: td = TD(d);
3301: c = CM(m0);
3302: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
3303: NEXTNM(mr0,mr);
3304: CM(mr) = 1;
3305: ndl_add(DL(m),d,DL(mr));
3306: }
3307: NEXT(mr) = 0;
3308: MKND(NV(p),mr0,len,r);
3309: SG(r) = SG(p) + TD(d);
3310: return r;
3311: }
3312: }
3313:
1.55 noro 3314: ND ndv_mul_nm(int mod,NM m0,NDV p)
1.9 noro 3315: {
3316: NM mr,mr0;
3317: NMV m;
1.61 noro 3318: UINT *d,*dt,*dm;
1.9 noro 3319: int c,n,td,i,c1,c2,len;
1.16 noro 3320: Q q;
1.9 noro 3321: ND r;
3322:
1.34 noro 3323: if ( !p ) return 0;
1.55 noro 3324: else if ( do_weyl )
1.71 noro 3325: if ( mod == -1 )
3326: error("ndv_mul_nm : not implemented (weyl)");
3327: else
3328: return weyl_ndv_mul_nm(mod,m0,p);
1.9 noro 3329: else {
3330: n = NV(p); m = BDY(p);
1.34 noro 3331: d = DL(m0);
1.14 noro 3332: len = LEN(p);
1.9 noro 3333: mr0 = 0;
1.34 noro 3334: td = TD(d);
1.71 noro 3335: if ( mod == -1 ) {
3336: c = CM(m0);
3337: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
3338: NEXTNM(mr0,mr);
3339: CM(mr) = _mulsf(CM(m),c);
3340: ndl_add(DL(m),d,DL(mr));
3341: }
3342: } else if ( mod ) {
1.16 noro 3343: c = CM(m0);
3344: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
3345: NEXTNM(mr0,mr);
3346: c1 = CM(m);
1.19 noro 3347: DMAR(c1,c,0,mod,c2);
1.16 noro 3348: CM(mr) = c2;
3349: ndl_add(DL(m),d,DL(mr));
3350: }
3351: } else {
3352: q = CQ(m0);
3353: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
3354: NEXTNM(mr0,mr);
3355: mulq(CQ(m),q,&CQ(mr));
3356: ndl_add(DL(m),d,DL(mr));
3357: }
1.4 noro 3358: }
1.9 noro 3359: NEXT(mr) = 0;
1.31 noro 3360: MKND(NV(p),mr0,len,r);
1.34 noro 3361: SG(r) = SG(p) + TD(d);
1.9 noro 3362: return r;
1.4 noro 3363: }
3364: }
3365:
1.43 noro 3366: void ndv_realloc(NDV p,int obpe,int oadv,EPOS oepos)
1.11 noro 3367: {
1.13 noro 3368: NMV m,mr,mr0,t;
3369: int len,i,k;
1.11 noro 3370:
1.61 noro 3371: if ( !p ) return;
3372: m = BDY(p); len = LEN(p);
3373: mr0 = nmv_adv>oadv?(NMV)REALLOC(BDY(p),len*nmv_adv):BDY(p);
3374: m = (NMV)((char *)mr0+(len-1)*oadv);
3375: mr = (NMV)((char *)mr0+(len-1)*nmv_adv);
3376: t = (NMV)ALLOCA(nmv_adv);
3377: for ( i = 0; i < len; i++, NMV_OPREV(m), NMV_PREV(mr) ) {
3378: CQ(t) = CQ(m);
3379: for ( k = 0; k < nd_wpd; k++ ) DL(t)[k] = 0;
3380: ndl_reconstruct(DL(m),DL(t),obpe,oepos);
3381: CQ(mr) = CQ(t);
3382: ndl_copy(DL(t),DL(mr));
3383: }
3384: BDY(p) = mr0;
3385: }
3386:
3387: NDV ndv_dup_realloc(NDV p,int obpe,int oadv,EPOS oepos)
3388: {
3389: NMV m,mr,mr0;
3390: int len,i;
3391: NDV r;
1.11 noro 3392:
1.61 noro 3393: if ( !p ) return 0;
3394: m = BDY(p); len = LEN(p);
3395: mr0 = mr = (NMV)MALLOC(len*nmv_adv);
3396: for ( i = 0; i < len; i++, NMV_OADV(m), NMV_ADV(mr) ) {
3397: ndl_zero(DL(mr));
3398: ndl_reconstruct(DL(m),DL(mr),obpe,oepos);
3399: CQ(mr) = CQ(m);
1.11 noro 3400: }
1.61 noro 3401: MKNDV(NV(p),mr0,len,r);
3402: SG(r) = SG(p);
3403: return r;
1.11 noro 3404: }
3405:
1.61 noro 3406: /* duplicate p */
3407:
3408: NDV ndv_dup(int mod,NDV p)
1.3 noro 3409: {
3410: NDV d;
1.61 noro 3411: NMV t,m,m0;
1.3 noro 3412: int i,len;
3413:
1.34 noro 3414: if ( !p ) return 0;
1.31 noro 3415: len = LEN(p);
1.34 noro 3416: m0 = m = (NMV)(mod?MALLOC_ATOMIC(len*nmv_adv):MALLOC(len*nmv_adv));
1.61 noro 3417: for ( t = BDY(p), i = 0; i < len; i++, NMV_ADV(t), NMV_ADV(m) ) {
1.14 noro 3418: ndl_copy(DL(t),DL(m));
1.16 noro 3419: CQ(m) = CQ(t);
1.3 noro 3420: }
3421: MKNDV(NV(p),m0,len,d);
1.23 noro 3422: SG(d) = SG(p);
3423: return d;
3424: }
3425:
1.63 noro 3426: ND nd_dup(ND p)
3427: {
3428: ND d;
3429: NM t,m,m0;
3430:
3431: if ( !p ) return 0;
3432: for ( m0 = 0, t = BDY(p); t; t = NEXT(t) ) {
3433: NEXTNM(m0,m);
3434: ndl_copy(DL(t),DL(m));
3435: CQ(m) = CQ(t);
3436: }
3437: if ( m0 ) NEXT(m) = 0;
3438: MKND(NV(p),m0,LEN(p),d);
3439: SG(d) = SG(p);
3440: return d;
3441: }
3442:
1.61 noro 3443: /* XXX if p->len == 0 then it represents 0 */
3444:
3445: void ndv_mod(int mod,NDV p)
3446: {
3447: NMV t,d;
3448: int r;
3449: int i,len,dlen;
1.71 noro 3450: Obj gfs;
1.61 noro 3451:
3452: if ( !p ) return;
3453: len = LEN(p);
3454: dlen = 0;
1.71 noro 3455: if ( mod == -1 )
3456: for ( t = d = BDY(p), i = 0; i < len; i++, NMV_ADV(t) ) {
3457: simp_ff((Obj)CP(t),&gfs);
3458: r = FTOIF(CONT((GFS)gfs));
1.61 noro 3459: CM(d) = r;
3460: ndl_copy(DL(t),DL(d));
3461: NMV_ADV(d);
3462: dlen++;
3463: }
1.71 noro 3464: else
3465: for ( t = d = BDY(p), i = 0; i < len; i++, NMV_ADV(t) ) {
3466: r = rem(NM(CQ(t)),mod);
3467: if ( r ) {
3468: if ( SGN(CQ(t)) < 0 )
3469: r = mod-r;
3470: CM(d) = r;
3471: ndl_copy(DL(t),DL(d));
3472: NMV_ADV(d);
3473: dlen++;
3474: }
3475: }
1.61 noro 3476: LEN(p) = dlen;
3477: }
3478:
3479: NDV ptondv(VL vl,VL dvl,P p)
3480: {
3481: ND nd;
3482:
3483: nd = ptond(vl,dvl,p);
3484: return ndtondv(0,nd);
3485: }
3486:
3487: ND ptond(VL vl,VL dvl,P p)
1.23 noro 3488: {
1.61 noro 3489: int n,i,j,k,e;
3490: VL tvl;
3491: V v;
3492: DCP dc;
3493: DCP *w;
3494: ND r,s,t,u;
3495: P x;
3496: int c;
3497: UINT *d;
1.23 noro 3498: NM m,m0;
1.61 noro 3499:
3500: if ( !p )
3501: return 0;
3502: else if ( NUM(p) ) {
3503: NEWNM(m);
3504: ndl_zero(DL(m));
3505: CQ(m) = (Q)p;
3506: NEXT(m) = 0;
3507: MKND(nd_nvar,m,1,r);
3508: SG(r) = 0;
3509: return r;
3510: } else {
3511: for ( dc = DC(p), k = 0; dc; dc = NEXT(dc), k++ );
3512: w = (DCP *)ALLOCA(k*sizeof(DCP));
3513: for ( dc = DC(p), j = 0; j < k; dc = NEXT(dc), j++ ) w[j] = dc;
3514: for ( i = 0, tvl = dvl, v = VR(p);
3515: vl && tvl->v != v; tvl = NEXT(tvl), i++ );
3516: if ( !tvl ) {
3517: for ( j = k-1, s = 0, MKV(v,x); j >= 0; j-- ) {
3518: t = ptond(vl,dvl,COEF(w[j]));
3519: pwrp(vl,x,DEG(w[j]),&p);
3520: nd_mul_c_p(CO,t,p); s = nd_add(0,s,t);
3521: }
3522: return s;
3523: } else {
3524: NEWNM(m0); d = DL(m0);
3525: for ( j = k-1, s = 0; j >= 0; j-- ) {
3526: ndl_zero(d); e = QTOS(DEG(w[j])); PUT_EXP(d,i,e);
3527: TD(d) = MUL_WEIGHT(e,i);
3528: if ( nd_blockmask) ndl_weight_mask(d);
3529: t = ptond(vl,dvl,COEF(w[j]));
3530: for ( m = BDY(t); m; m = NEXT(m) )
3531: ndl_addto(DL(m),d);
3532: SG(t) += TD(d);
3533: s = nd_add(0,s,t);
3534: }
3535: FREENM(m0);
3536: return s;
3537: }
3538: }
3539: }
3540:
3541: P ndvtop(int mod,VL vl,VL dvl,NDV p)
3542: {
3543: VL tvl;
3544: int len,n,j,i,e;
3545: NMV m;
3546: Q q;
3547: P c;
3548: UINT *d;
3549: P s,r,u,t,w;
1.71 noro 3550: GFS gfs;
1.23 noro 3551:
1.34 noro 3552: if ( !p ) return 0;
1.61 noro 3553: else {
3554: len = LEN(p);
3555: n = NV(p);
3556: m = (NMV)(((char *)BDY(p))+nmv_adv*(len-1));
3557: for ( j = len-1, s = 0; j >= 0; j--, NMV_PREV(m) ) {
1.71 noro 3558: if ( mod == -1 ) {
3559: e = IFTOF(CM(m)); MKGFS(e,gfs); c = (P)gfs;
3560: } else if ( mod ) {
1.61 noro 3561: STOQ(CM(m),q); c = (P)q;
3562: } else
3563: c = CP(m);
3564: d = DL(m);
3565: for ( i = 0, t = c, tvl = dvl; i < n; tvl = NEXT(tvl), i++ ) {
3566: MKV(tvl->v,r); e = GET_EXP(d,i); STOQ(e,q);
3567: pwrp(vl,r,q,&u); mulp(vl,t,u,&w); t = w;
3568: }
3569: addp(vl,s,t,&u); s = u;
3570: }
3571: return s;
1.23 noro 3572: }
1.3 noro 3573: }
3574:
1.61 noro 3575: NDV ndtondv(int mod,ND p)
1.11 noro 3576: {
3577: NDV d;
1.61 noro 3578: NMV m,m0;
3579: NM t;
3580: int i,len;
1.11 noro 3581:
1.34 noro 3582: if ( !p ) return 0;
1.61 noro 3583: len = LEN(p);
1.74 noro 3584: if ( mod )
3585: m0 = m = (NMV)GC_malloc_atomic_ignore_off_page(len*nmv_adv);
3586: else
3587: m0 = m = MALLOC(len*nmv_adv);
3588: ndv_alloc += nmv_adv*len;
1.61 noro 3589: for ( t = BDY(p), i = 0; t; t = NEXT(t), i++, NMV_ADV(m) ) {
3590: ndl_copy(DL(t),DL(m));
3591: CQ(m) = CQ(t);
1.11 noro 3592: }
1.61 noro 3593: MKNDV(NV(p),m0,len,d);
1.14 noro 3594: SG(d) = SG(p);
1.11 noro 3595: return d;
3596: }
3597:
1.61 noro 3598: ND ndvtond(int mod,NDV p)
1.11 noro 3599: {
1.61 noro 3600: ND d;
3601: NM m,m0;
1.11 noro 3602: NMV t;
1.61 noro 3603: int i,len;
1.11 noro 3604:
1.34 noro 3605: if ( !p ) return 0;
1.11 noro 3606: m0 = 0;
1.61 noro 3607: len = p->len;
3608: for ( t = BDY(p), i = 0; i < len; NMV_ADV(t), i++ ) {
3609: NEXTNM(m0,m);
3610: ndl_copy(DL(t),DL(m));
3611: CQ(m) = CQ(t);
1.11 noro 3612: }
3613: NEXT(m) = 0;
1.61 noro 3614: MKND(NV(p),m0,len,d);
1.14 noro 3615: SG(d) = SG(p);
1.11 noro 3616: return d;
3617: }
3618:
1.3 noro 3619: void ndv_print(NDV p)
3620: {
3621: NMV m;
3622: int i,len;
3623:
1.34 noro 3624: if ( !p ) printf("0\n");
1.3 noro 3625: else {
1.14 noro 3626: len = LEN(p);
1.3 noro 3627: for ( m = BDY(p), i = 0; i < len; i++, NMV_ADV(m) ) {
1.71 noro 3628: if ( CM(m) & 0x80000000 ) printf("+@_%d*",IFTOF(CM(m)));
3629: else printf("+%d*",CM(m));
1.16 noro 3630: ndl_print(DL(m));
3631: }
3632: printf("\n");
3633: }
3634: }
3635:
3636: void ndv_print_q(NDV p)
3637: {
3638: NMV m;
3639: int i,len;
3640:
1.34 noro 3641: if ( !p ) printf("0\n");
1.16 noro 3642: else {
3643: len = LEN(p);
3644: for ( m = BDY(p), i = 0; i < len; i++, NMV_ADV(m) ) {
3645: printf("+");
1.74 noro 3646: printexpr(CO,(Obj)CQ(m));
1.16 noro 3647: printf("*");
1.14 noro 3648: ndl_print(DL(m));
1.3 noro 3649: }
3650: printf("\n");
3651: }
1.25 noro 3652: }
3653:
1.61 noro 3654: NODE ndv_reducebase(NODE x)
1.27 noro 3655: {
3656: int len,i,j;
3657: NDV *w;
3658: NODE t,t0;
3659:
3660: len = length(x);
3661: w = (NDV *)ALLOCA(len*sizeof(NDV));
3662: for ( i = 0, t = x; i < len; i++, t = NEXT(t) ) w[i] = BDY(t);
3663: for ( i = 0; i < len; i++ ) {
3664: for ( j = 0; j < i; j++ ) {
3665: if ( w[i] && w[j] )
3666: if ( ndl_reducible(HDL(w[i]),HDL(w[j])) ) w[i] = 0;
3667: else if ( ndl_reducible(HDL(w[j]),HDL(w[i])) ) w[j] = 0;
3668: }
3669: }
3670: for ( i = len-1, t0 = 0; i >= 0; i-- ) {
3671: if ( w[i] ) { NEXTNODE(t0,t); BDY(t) = (pointer)w[i]; }
3672: }
3673: NEXT(t) = 0; x = t0;
3674: return x;
1.11 noro 3675: }
1.32 noro 3676:
1.43 noro 3677: /* XXX incomplete */
3678:
1.32 noro 3679: void nd_init_ord(struct order_spec *ord)
3680: {
1.43 noro 3681: switch ( ord->id ) {
1.32 noro 3682: case 0:
1.43 noro 3683: switch ( ord->ord.simple ) {
3684: case 0:
3685: nd_dcomp = 1;
3686: nd_isrlex = 1;
3687: break;
3688: case 1:
3689: nd_dcomp = 1;
3690: nd_isrlex = 0;
3691: break;
3692: case 2:
3693: nd_dcomp = 0;
3694: nd_isrlex = 0;
1.45 noro 3695: ndl_compare_function = ndl_lex_compare;
1.58 noro 3696: break;
3697: case 11:
3698: /* XXX */
3699: nd_dcomp = 0;
3700: nd_isrlex = 1;
3701: ndl_compare_function = ndl_ww_lex_compare;
1.43 noro 3702: break;
3703: default:
3704: error("nd_gr : unsupported order");
3705: }
1.32 noro 3706: break;
3707: case 1:
1.43 noro 3708: /* XXX */
3709: nd_dcomp = -1;
1.32 noro 3710: nd_isrlex = 0;
1.45 noro 3711: ndl_compare_function = ndl_block_compare;
1.34 noro 3712: break;
1.43 noro 3713: case 2:
3714: error("nd_init_ord : matrix order is not supported yet.");
1.32 noro 3715: break;
3716: }
1.41 noro 3717: nd_ord = ord;
1.32 noro 3718: }
3719:
1.43 noro 3720: BlockMask nd_create_blockmask(struct order_spec *ord)
3721: {
3722: int n,i,j,s,l;
1.61 noro 3723: UINT *t;
1.43 noro 3724: BlockMask bm;
3725:
3726: if ( !ord->id )
3727: return 0;
3728: n = ord->ord.block.length;
3729: bm = (BlockMask)MALLOC(sizeof(struct oBlockMask));
3730: bm->n = n;
3731: bm->order_pair = ord->ord.block.order_pair;
1.61 noro 3732: bm->mask = (UINT **)MALLOC(n*sizeof(UINT *));
1.43 noro 3733: for ( i = 0, s = 0; i < n; i++ ) {
1.61 noro 3734: bm->mask[i] = t = (UINT *)MALLOC_ATOMIC(nd_wpd*sizeof(UINT));
1.43 noro 3735: for ( j = 0; j < nd_wpd; j++ ) t[j] = 0;
3736: l = bm->order_pair[i].length;
3737: for ( j = 0; j < l; j++, s++ ) PUT_EXP(t,s,nd_mask0);
3738: }
3739: return bm;
1.57 noro 3740: }
3741:
3742: EPOS nd_create_epos(struct order_spec *ord)
3743: {
3744: int i,j,l,s,ord_l,ord_o;
3745: EPOS epos;
3746: struct order_pair *op;
3747:
3748: epos = (EPOS)MALLOC_ATOMIC(nd_nvar*sizeof(struct oEPOS));
3749: switch ( ord->id ) {
3750: case 0:
3751: if ( nd_isrlex ) {
3752: for ( i = 0; i < nd_nvar; i++ ) {
3753: epos[i].i = nd_exporigin + (nd_nvar-1-i)/nd_epw;
3754: epos[i].s = (nd_epw-((nd_nvar-1-i)%nd_epw)-1)*nd_bpe;
3755: }
3756: } else {
3757: for ( i = 0; i < nd_nvar; i++ ) {
3758: epos[i].i = nd_exporigin + i/nd_epw;
3759: epos[i].s = (nd_epw-(i%nd_epw)-1)*nd_bpe;
3760: }
3761: }
3762: break;
3763: case 1:
3764: /* block order */
3765: l = ord->ord.block.length;
3766: op = ord->ord.block.order_pair;
3767: for ( j = 0, s = 0; j < l; j++ ) {
3768: ord_o = op[j].order;
3769: ord_l = op[j].length;
3770: if ( !ord_o )
3771: for ( i = 0; i < ord_l; i++ ) {
3772: epos[s+i].i = nd_exporigin + (s+ord_l-i-1)/nd_epw;
3773: epos[s+i].s = (nd_epw-((s+ord_l-i-1)%nd_epw)-1)*nd_bpe;
3774: }
3775: else
3776: for ( i = 0; i < ord_l; i++ ) {
3777: epos[s+i].i = nd_exporigin + (s+i)/nd_epw;
3778: epos[s+i].s = (nd_epw-((s+i)%nd_epw)-1)*nd_bpe;
3779: }
3780: s += ord_l;
3781: }
3782: break;
3783: case 2:
3784: error("nd_create_epos : matrix order is not supported yet.");
3785: }
3786: return epos;
1.43 noro 3787: }
1.59 noro 3788:
3789: /* external interface */
3790:
3791: void nd_nf_p(P f,LIST g,LIST v,int m,struct order_spec *ord,P *rp)
3792: {
1.61 noro 3793: NODE t,in0,in;
1.59 noro 3794: ND nd,nf;
1.61 noro 3795: NDV ndv;
3796: VL vv,tv;
3797: int stat,nvar,max,e;
1.69 noro 3798: union oNDC dn;
1.59 noro 3799:
3800: pltovl(v,&vv);
1.74 noro 3801: for ( nvar = 0, tv = vv; tv; tv = NEXT(tv), nvar++ );
1.61 noro 3802:
3803: /* get the degree bound */
3804: for ( t = BDY(g), max = 0; t; t = NEXT(t) )
3805: for ( tv = vv; tv; tv = NEXT(tv) ) {
3806: e = getdeg(tv->v,(P)BDY(t));
3807: max = MAX(e,max);
3808: }
3809: for ( tv = vv; tv; tv = NEXT(tv) ) {
3810: e = getdeg(tv->v,f);
3811: max = MAX(e,max);
3812: }
3813:
1.59 noro 3814: nd_init_ord(ord);
1.61 noro 3815: nd_setup_parameters(nvar,max);
3816:
3817: /* conversion to ndv */
3818: for ( in0 = 0, t = BDY(g); t; t = NEXT(t) ) {
3819: NEXTNODE(in0,in);
3820: BDY(in) = (pointer)ptondv(CO,vv,(P)BDY(t));
1.69 noro 3821: if ( m ) ndv_mod(m,(NDV)BDY(in));
1.61 noro 3822: }
3823: NEXTNODE(in0,in);
3824: BDY(in) = (pointer)ptondv(CO,vv,f);
1.69 noro 3825: if ( m ) ndv_mod(m,(NDV)BDY(in));
1.61 noro 3826: NEXT(in) = 0;
3827:
3828: ndv_setup(m,0,in0);
1.59 noro 3829: nd_psn--;
3830: nd_scale=2;
3831: while ( 1 ) {
3832: nd = (pointer)ndvtond(m,nd_ps[nd_psn]);
1.69 noro 3833: stat = nd_nf(m,nd,nd_ps,1,0,&nf);
1.59 noro 3834: if ( !stat ) {
3835: nd_psn++;
3836: nd_reconstruct(m,0,0);
3837: nd_psn--;
3838: } else
3839: break;
3840: }
1.61 noro 3841: *rp = ndvtop(m,CO,vv,ndtondv(m,nf));
1.63 noro 3842: }
3843:
3844: int nd_to_vect(int mod,UINT *s0,int n,ND d,UINT *r)
3845: {
3846: NM m;
3847: UINT *t,*s;
3848: int i;
3849:
3850: for ( i = 0; i < n; i++ ) r[i] = 0;
3851: for ( i = 0, s = s0, m = BDY(d); m; m = NEXT(m) ) {
3852: t = DL(m);
3853: for ( ; !ndl_equal(t,s); s += nd_wpd, i++ );
3854: r[i] = CM(m);
3855: }
3856: for ( i = 0; !r[i]; i++ );
3857: return i;
3858: }
3859:
1.74 noro 3860: int ndv_to_vect(int mod,UINT *s0,int n,NDV d,UINT *r)
3861: {
3862: NMV m;
3863: UINT *t,*s;
3864: int i,j,len;
3865:
3866: for ( i = 0; i < n; i++ ) r[i] = 0;
3867: m = BDY(d);
3868: len = LEN(d);
3869: for ( i = j = 0, s = s0; j < len; j++, NMV_ADV(m)) {
3870: t = DL(m);
3871: for ( ; !ndl_equal(t,s); s += nd_wpd, i++ );
3872: r[i] = CM(m);
3873: }
3874: for ( i = 0; !r[i]; i++ );
3875: return i;
3876: }
3877:
1.63 noro 3878: int nm_ind_pair_to_vect(int mod,UINT *s0,int n,NM_ind_pair pair,UINT *r)
3879: {
3880: NM m;
3881: NMV mr;
3882: UINT *d,*t,*s;
3883: NDV p;
3884: int i,j,len;
3885:
3886: m = pair->mul;
3887: d = DL(m);
3888: p = nd_ps[pair->index];
3889: t = (UINT *)ALLOCA(nd_wpd*sizeof(UINT));
3890: for ( i = 0; i < n; i++ ) r[i] = 0;
3891: len = LEN(p);
3892: for ( i = j = 0, s = s0, mr = BDY(p); j < len; j++, NMV_ADV(mr) ) {
3893: ndl_add(d,DL(mr),t);
3894: for ( ; !ndl_equal(t,s); s += nd_wpd, i++ );
3895: r[i] = CM(mr);
3896: }
3897: for ( i = 0; !r[i]; i++ );
3898: return i;
3899: }
3900:
1.67 noro 3901: IndArray nm_ind_pair_to_vect_compress(int mod,UINT *s0,int n,NM_ind_pair pair)
1.64 noro 3902: {
3903: NM m;
3904: NMV mr;
3905: UINT *d,*t,*s;
3906: NDV p;
1.67 noro 3907: unsigned char *ivc;
3908: unsigned short *ivs;
1.81 noro 3909: UINT *v,*ivi,*s0v;
1.67 noro 3910: int i,j,len,prev,diff,cdiff;
3911: IndArray r;
1.64 noro 3912:
3913: m = pair->mul;
3914: d = DL(m);
3915: p = nd_ps[pair->index];
3916: len = LEN(p);
3917: t = (UINT *)ALLOCA(nd_wpd*sizeof(UINT));
1.67 noro 3918: v = (unsigned int *)ALLOCA(len*sizeof(unsigned int));
1.64 noro 3919: for ( i = j = 0, s = s0, mr = BDY(p); j < len; j++, NMV_ADV(mr) ) {
3920: ndl_add(d,DL(mr),t);
3921: for ( ; !ndl_equal(t,s); s += nd_wpd, i++ );
1.67 noro 3922: v[j] = i;
3923: }
1.81 noro 3924: r = (IndArray)MALLOC(sizeof(struct oIndArray));
1.67 noro 3925: r->head = v[0];
3926: diff = 0;
3927: for ( i = 1; i < len; i++ ) {
3928: cdiff = v[i]-v[i-1]; diff = MAX(cdiff,diff);
3929: }
3930: if ( diff < 256 ) {
3931: r->width = 1;
3932: ivc = (unsigned char *)MALLOC_ATOMIC(len*sizeof(unsigned char));
3933: r->index.c = ivc;
3934: for ( i = 1, ivc[0] = 0; i < len; i++ ) ivc[i] = v[i]-v[i-1];
3935: } else if ( diff < 65536 ) {
3936: r->width = 2;
3937: ivs = (unsigned short *)MALLOC_ATOMIC(len*sizeof(unsigned short));
3938: r->index.s = ivs;
3939: for ( i = 1, ivs[0] = 0; i < len; i++ ) ivs[i] = v[i]-v[i-1];
3940: } else {
3941: r->width = 4;
3942: ivi = (unsigned int *)MALLOC_ATOMIC(len*sizeof(unsigned int));
3943: r->index.i = ivi;
3944: for ( i = 1, ivi[0] = 0; i < len; i++ ) ivi[i] = v[i]-v[i-1];
1.64 noro 3945: }
1.67 noro 3946: return r;
1.64 noro 3947: }
3948:
1.65 noro 3949:
/*
 * Reduce the dense coefficient vector svect (col entries) modulo m by the
 * nred reducers described by imat[] (compressed column indices) and rp0[]
 * (index of the reducer polynomial in nd_ps and its sugar).
 *
 * For reducer i with head column k: if svect[k] mod m is nonzero, the
 * multiplier c = m - svect[k] is formed, svect[k] is set to 0, and
 * c * (coefficient of term j) is added to the column of term j for every
 * j >= 1.  Columns are recovered by accumulating the stored differences
 * starting from the head column.
 * NOTE(review): term 0 is skipped and its column simply zeroed, which
 * presumes the head coefficient of each reducer is 1 -- confirm.
 *
 * Returns the largest rp0[i]->sugar among the reducers actually used
 * (0 when none was used).
 */
1.76 noro 3950: int ndv_reduce_vect(int m,UINT *svect,int col,IndArray *imat,NM_ind_pair *rp0,int nred)
1.65 noro 3951: {
1.67 noro 3952: int i,j,k,len,pos,prev;
1.66 noro 3953: UINT c,c1,c2,c3,up,lo,dmy;
1.67 noro 3954: IndArray ivect;
3955: unsigned char *ivc;
3956: unsigned short *ivs;
3957: unsigned int *ivi;
1.65 noro 3958: NDV redv;
1.67 noro 3959: NMV mr;
1.65 noro 3960: NODE rp;
1.76 noro 3961: int maxrs;
1.65 noro 3962:
1.76 noro 3963: maxrs = 0;
1.74 noro 3964: for ( i = 0; i < nred; i++ ) {
1.65 noro 3965: ivect = imat[i];
/* the head entry may still be unreduced from earlier updates */
1.67 noro 3966: k = ivect->head; svect[k] %= m;
1.65 noro 3967: if ( c = svect[k] ) {
1.76 noro 3968: maxrs = MAX(maxrs,rp0[i]->sugar);
1.74 noro 3969: c = m-c; redv = nd_ps[rp0[i]->index];
1.67 noro 3970: len = LEN(redv); mr = BDY(redv);
3971: svect[k] = 0; prev = k;
/* the three cases are identical except for the element type of the
   difference array.
   NOTE(review): DMA presumably forms c1*c+c2 as a double word (up,lo) and
   DSAB reduces a double word modulo m -- confirm in inline.h.  An entry
   whose update did not overflow one word is stored unreduced (lo). */
3972: switch ( ivect->width ) {
3973: case 1:
3974: ivc = ivect->index.c;
3975: for ( j = 1, NMV_ADV(mr); j < len; j++, NMV_ADV(mr) ) {
3976: pos = prev+ivc[j]; c1 = CM(mr); c2 = svect[pos];
3977: prev = pos;
3978: DMA(c1,c,c2,up,lo);
3979: if ( up ) { DSAB(m,up,lo,dmy,c3); svect[pos] = c3;
3980: } else svect[pos] = lo;
3981: }
3982: break;
3983: case 2:
3984: ivs = ivect->index.s;
3985: for ( j = 1, NMV_ADV(mr); j < len; j++, NMV_ADV(mr) ) {
3986: pos = prev+ivs[j]; c1 = CM(mr); c2 = svect[pos];
3987: prev = pos;
3988: DMA(c1,c,c2,up,lo);
3989: if ( up ) { DSAB(m,up,lo,dmy,c3); svect[pos] = c3;
3990: } else svect[pos] = lo;
3991: }
3992: break;
3993: case 4:
3994: ivi = ivect->index.i;
3995: for ( j = 1, NMV_ADV(mr); j < len; j++, NMV_ADV(mr) ) {
3996: pos = prev+ivi[j]; c1 = CM(mr); c2 = svect[pos];
3997: prev = pos;
3998: DMA(c1,c,c2,up,lo);
3999: if ( up ) { DSAB(m,up,lo,dmy,c3); svect[pos] = c3;
4000: } else svect[pos] = lo;
4001: }
4002: break;
1.65 noro 4003: }
4004: }
4005: }
/* final pass: bring every entry that is still >= m into the range [0,m) */
1.66 noro 4006: for ( i = 0; i < col; i++ )
4007: if ( svect[i] >= (UINT)m ) svect[i] %= m;
1.76 noro 4008: return maxrs;
1.65 noro 4009: }
4010:
1.76 noro 4011: int ndv_reduce_vect_sf(int m,UINT *svect,int col,IndArray *imat,NM_ind_pair *rp0,int nred)
1.72 noro 4012: {
4013: int i,j,k,len,pos,prev;
4014: UINT c,c1,c2,c3,up,lo,dmy;
4015: IndArray ivect;
4016: unsigned char *ivc;
4017: unsigned short *ivs;
4018: unsigned int *ivi;
4019: NDV redv;
4020: NMV mr;
4021: NODE rp;
1.76 noro 4022: int maxrs;
1.72 noro 4023:
1.76 noro 4024: maxrs = 0;
1.74 noro 4025: for ( i = 0; i < nred; i++ ) {
1.72 noro 4026: ivect = imat[i];
4027: k = ivect->head; svect[k] %= m;
4028: if ( c = svect[k] ) {
1.76 noro 4029: maxrs = MAX(maxrs,rp0[i]->sugar);
1.74 noro 4030: c = _chsgnsf(c); redv = nd_ps[rp0[i]->index];
1.72 noro 4031: len = LEN(redv); mr = BDY(redv);
4032: svect[k] = 0; prev = k;
4033: switch ( ivect->width ) {
4034: case 1:
4035: ivc = ivect->index.c;
4036: for ( j = 1, NMV_ADV(mr); j < len; j++, NMV_ADV(mr) ) {
4037: pos = prev+ivc[j]; prev = pos;
4038: svect[pos] = _addsf(_mulsf(CM(mr),c),svect[pos]);
4039: }
4040: break;
4041: case 2:
4042: ivs = ivect->index.s;
4043: for ( j = 1, NMV_ADV(mr); j < len; j++, NMV_ADV(mr) ) {
4044: pos = prev+ivs[j]; prev = pos;
4045: svect[pos] = _addsf(_mulsf(CM(mr),c),svect[pos]);
4046: }
4047: break;
4048: case 4:
4049: ivi = ivect->index.i;
4050: for ( j = 1, NMV_ADV(mr); j < len; j++, NMV_ADV(mr) ) {
4051: pos = prev+ivi[j]; prev = pos;
4052: svect[pos] = _addsf(_mulsf(CM(mr),c),svect[pos]);
4053: }
4054: break;
4055: }
4056: }
4057: }
1.76 noro 4058: return maxrs;
1.72 noro 4059: }
4060:
1.65 noro 4061: NDV vect_to_ndv(UINT *vect,int spcol,int col,int *rhead,UINT *s0vect)
4062: {
4063: int j,k,len;
4064: UINT *p;
4065: UINT c;
4066: NDV r;
4067: NMV mr0,mr;
4068:
4069: for ( j = 0, len = 0; j < spcol; j++ ) if ( vect[j] ) len++;
4070: if ( !len ) return 0;
4071: else {
1.74 noro 4072: mr0 = (NMV)GC_malloc_atomic_ignore_off_page(nmv_adv*len);
4073: ndv_alloc += nmv_adv*len;
1.65 noro 4074: mr = mr0;
4075: p = s0vect;
4076: for ( j = k = 0; j < col; j++, p += nd_wpd )
4077: if ( !rhead[j] ) {
4078: if ( c = vect[k++] ) {
4079: ndl_copy(p,DL(mr)); CM(mr) = c; NMV_ADV(mr);
4080: }
4081: }
4082: MKNDV(nd_nvar,mr0,len,r);
4083: return r;
4084: }
4085: }
4086:
1.74 noro 4087: int nd_sp_f4(int m,ND_pairs l,PGeoBucket bucket)
1.65 noro 4088: {
4089: ND_pairs t;
4090: NODE sp0,sp;
4091: int stat;
4092: ND spol;
4093:
4094: for ( t = l; t; t = NEXT(t) ) {
4095: stat = nd_sp(m,0,t,&spol);
4096: if ( !stat ) return 0;
4097: if ( spol ) {
4098: add_pbucket_symbolic(bucket,spol);
4099: }
4100: }
1.68 noro 4101: return 1;
1.65 noro 4102: }
4103:
4104: int nd_symbolic_preproc(PGeoBucket bucket,UINT **s0vect,NODE *r)
4105: {
4106: NODE rp0,rp;
4107: NM mul,head,s0,s;
1.76 noro 4108: int index,col,i,sugar;
1.65 noro 4109: RHist h;
4110: UINT *s0v,*p;
4111: NM_ind_pair pair;
4112: ND red;
4113:
4114: s0 = 0; rp0 = 0; col = 0;
4115: while ( 1 ) {
4116: head = remove_head_pbucket_symbolic(bucket);
4117: if ( !head ) break;
4118: if ( !s0 ) s0 = head;
4119: else NEXT(s) = head;
4120: s = head;
4121: index = ndl_find_reducer(DL(head));
4122: if ( index >= 0 ) {
4123: h = nd_psh[index];
4124: NEWNM(mul);
4125: ndl_sub(DL(head),DL(h),DL(mul));
4126: if ( ndl_check_bound2(index,DL(mul)) ) return 0;
1.76 noro 4127: sugar = TD(DL(mul))+SG(nd_ps[index]);
4128: MKNM_ind_pair(pair,mul,index,sugar);
1.65 noro 4129: red = ndv_mul_nm_symbolic(mul,nd_ps[index]);
4130: add_pbucket_symbolic(bucket,nd_remove_head(red));
4131: NEXTNODE(rp0,rp); BDY(rp) = (pointer)pair;
4132: }
4133: col++;
4134: }
1.72 noro 4135: if ( rp0 ) NEXT(rp) = 0;
4136: NEXT(s) = 0;
1.65 noro 4137: s0v = (UINT *)MALLOC_ATOMIC(col*nd_wpd*sizeof(UINT));
4138: for ( i = 0, p = s0v, s = s0; i < col;
4139: i++, p += nd_wpd, s = NEXT(s) ) ndl_copy(DL(s),p);
4140: *s0vect = s0v;
4141: *r = rp0;
4142: return col;
4143: }
4144:
1.69 noro 4145: NODE nd_f4(int m)
4146: {
4147: int i,nh,stat,index;
4148: NODE r,g;
4149: ND_pairs d,l,t;
4150: ND spol,red;
4151: NDV nf,redv;
4152: NM s0,s;
1.84 noro 4153: NODE rp0,srp0,nflist;
1.69 noro 4154: int nsp,nred,col,rank,len,k,j,a;
4155: UINT c;
1.74 noro 4156: UINT **spmat;
1.69 noro 4157: UINT *s0vect,*svect,*p,*v;
4158: int *colstat;
4159: IndArray *imat;
4160: int *rhead;
4161: int spcol,sprow;
4162: int sugar;
4163: PGeoBucket bucket;
4164: struct oEGT eg0,eg1,eg_f4;
4165:
4166: if ( !m )
4167: error("nd_f4 : not implemented");
1.74 noro 4168: ndv_alloc = 0;
1.69 noro 4169: g = 0; d = 0;
4170: for ( i = 0; i < nd_psn; i++ ) {
4171: d = update_pairs(d,g,i);
4172: g = update_base(g,i);
4173: }
4174: while ( d ) {
4175: get_eg(&eg0);
4176: l = nd_minsugarp(d,&d);
4177: sugar = SG(l);
4178: bucket = create_pbucket();
1.74 noro 4179: stat = nd_sp_f4(m,l,bucket);
1.69 noro 4180: if ( !stat ) {
4181: for ( t = l; NEXT(t); t = NEXT(t) );
4182: NEXT(t) = d; d = l;
4183: d = nd_reconstruct(m,0,d);
4184: continue;
4185: }
1.86 ! noro 4186: if ( bucket->m < 0 ) continue;
1.69 noro 4187: col = nd_symbolic_preproc(bucket,&s0vect,&rp0);
4188: if ( !col ) {
4189: for ( t = l; NEXT(t); t = NEXT(t) );
4190: NEXT(t) = d; d = l;
4191: d = nd_reconstruct(m,0,d);
4192: continue;
4193: }
4194: get_eg(&eg1); init_eg(&eg_f4); add_eg(&eg_f4,&eg0,&eg1);
1.74 noro 4195: if ( DP_Print )
4196: fprintf(asir_out,"sugar=%d,symb=%fsec,",
4197: sugar,eg_f4.exectime+eg_f4.gctime);
4198: if ( 1 )
4199: nflist = nd_f4_red(m,l,s0vect,col,rp0);
4200: else
4201: nflist = nd_f4_red_dist(m,l,s0vect,col,rp0);
1.69 noro 4202: /* adding new bases */
1.74 noro 4203: for ( r = nflist; r; r = NEXT(r) ) {
4204: nf = (NDV)BDY(r);
1.69 noro 4205: ndv_removecont(m,nf);
1.77 noro 4206: nh = ndv_newps(m,nf,0);
1.69 noro 4207: d = update_pairs(d,g,nh);
4208: g = update_base(g,nh);
4209: }
4210: }
4211: for ( r = g; r; r = NEXT(r) ) BDY(r) = (pointer)nd_ps[(int)BDY(r)];
1.74 noro 4212: fprintf(asir_out,"ndv_alloc=%d\n",ndv_alloc);
1.69 noro 4213: return g;
4214: }
1.74 noro 4215:
4216: NODE nd_f4_red(int m,ND_pairs sp0,UINT *s0vect,int col,NODE rp0)
1.63 noro 4217: {
1.67 noro 4218: IndArray *imat;
1.74 noro 4219: int nsp,nred,spcol,sprow,a;
1.65 noro 4220: int *rhead;
1.74 noro 4221: int i,j,k,l,rank;
4222: NODE rp,r0,r;
4223: ND_pairs sp;
4224: ND spol;
4225: int **spmat;
4226: UINT *svect,*v;
4227: int *colstat;
1.80 noro 4228: struct oEGT eg0,eg1,eg2,eg_f4,eg_f4_1,eg_f4_2;
1.74 noro 4229: NM_ind_pair *rvect;
1.76 noro 4230: int maxrs;
4231: int *spsugar;
1.63 noro 4232:
1.74 noro 4233: get_eg(&eg0);
4234: for ( sp = sp0, nsp = 0; sp; sp = NEXT(sp), nsp++ );
4235: nred = length(rp0); spcol = col-nred;
4236: imat = (IndArray *)ALLOCA(nred*sizeof(IndArray));
4237: rhead = (int *)ALLOCA(col*sizeof(int));
4238: for ( i = 0; i < col; i++ ) rhead[i] = 0;
1.63 noro 4239:
1.74 noro 4240: /* construction of index arrays */
4241: rvect = (NM_ind_pair *)ALLOCA(nred*sizeof(NM_ind_pair));
4242: for ( rp = rp0, i = 0; rp; i++, rp = NEXT(rp) ) {
4243: rvect[i] = (NM_ind_pair)BDY(rp);
4244: imat[i] = nm_ind_pair_to_vect_compress(m,s0vect,col,rvect[i]);
4245: rhead[imat[i]->head] = 1;
4246: }
4247:
4248: /* elimination (1st step) */
4249: spmat = (int **)ALLOCA(nsp*sizeof(UINT *));
4250: svect = (UINT *)ALLOCA(col*sizeof(UINT));
1.76 noro 4251: spsugar = (int *)ALLOCA(nsp*sizeof(UINT));
1.74 noro 4252: for ( a = sprow = 0, sp = sp0; a < nsp; a++, sp = NEXT(sp) ) {
4253: nd_sp(m,0,sp,&spol);
1.75 noro 4254: if ( !spol ) continue;
1.74 noro 4255: nd_to_vect(m,s0vect,col,spol,svect);
1.76 noro 4256: if ( m == -1 )
4257: maxrs = ndv_reduce_vect_sf(m,svect,col,imat,rvect,nred);
4258: else
4259: maxrs = ndv_reduce_vect(m,svect,col,imat,rvect,nred);
1.74 noro 4260: for ( i = 0; i < col; i++ ) if ( svect[i] ) break;
4261: if ( i < col ) {
4262: spmat[sprow] = v = (UINT *)MALLOC_ATOMIC(spcol*sizeof(UINT));
4263: for ( j = k = 0; j < col; j++ )
4264: if ( !rhead[j] ) v[k++] = svect[j];
1.76 noro 4265: spsugar[sprow] = MAX(maxrs,SG(spol));
1.74 noro 4266: sprow++;
4267: }
1.76 noro 4268: nd_free(spol);
1.74 noro 4269: }
1.80 noro 4270: get_eg(&eg1); init_eg(&eg_f4_1); add_eg(&eg_f4_1,&eg0,&eg1);
4271: if ( DP_Print ) {
4272: fprintf(asir_out,"elim1=%fsec,",eg_f4_1.exectime+eg_f4_1.gctime);
4273: fflush(asir_out);
4274: }
1.74 noro 4275: /* free index arrays */
4276: for ( i = 0; i < nred; i++ ) GC_free(imat[i]->index.c);
4277:
4278: /* elimination (2nd step) */
4279: colstat = (int *)ALLOCA(spcol*sizeof(int));
4280: if ( m == -1 )
1.76 noro 4281: rank = nd_gauss_elim_sf(spmat,spsugar,sprow,spcol,m,colstat);
1.74 noro 4282: else
1.76 noro 4283: rank = nd_gauss_elim_mod(spmat,spsugar,sprow,spcol,m,colstat);
1.74 noro 4284: r0 = 0;
4285: for ( i = 0; i < rank; i++ ) {
4286: NEXTNODE(r0,r); BDY(r) =
4287: (pointer)vect_to_ndv(spmat[i],spcol,col,rhead,s0vect);
1.76 noro 4288: SG((NDV)BDY(r)) = spsugar[i];
1.74 noro 4289: GC_free(spmat[i]);
4290: }
4291: for ( ; i < sprow; i++ ) GC_free(spmat[i]);
1.80 noro 4292: get_eg(&eg2); init_eg(&eg_f4_2); add_eg(&eg_f4_2,&eg1,&eg2);
4293: init_eg(&eg_f4); add_eg(&eg_f4,&eg0,&eg2);
1.74 noro 4294: if ( DP_Print ) {
1.80 noro 4295: fprintf(asir_out,"elim2=%fsec\n",eg_f4_2.exectime+eg_f4_2.gctime);
1.74 noro 4296: fprintf(asir_out,"nsp=%d,nred=%d,spmat=(%d,%d),rank=%d ",
4297: nsp,nred,sprow,spcol,rank);
4298: fprintf(asir_out,"%fsec\n",eg_f4.exectime+eg_f4.gctime);
1.63 noro 4299: }
1.74 noro 4300: return r0;
4301: }
4302:
/* streams used by the nd_send_* and nd_recv_* helpers below */
FILE *nd_write;
FILE *nd_read;
4304:
4305: void nd_send_int(int a) {
4306: write_int(nd_write,&a);
4307: }
4308:
4309: void nd_send_intarray(int *p,int len) {
4310: write_intarray(nd_write,p,len);
4311: }
4312:
4313: int nd_recv_int() {
4314: int a;
4315:
4316: read_int(nd_read,&a);
4317: return a;
4318: }
4319:
4320: void nd_recv_intarray(int *p,int len) {
4321: read_intarray(nd_read,p,len);
4322: }
4323:
4324: void nd_send_ndv(NDV p) {
4325: int len,i;
4326: NMV m;
4327:
4328: if ( !p ) nd_send_int(0);
4329: else {
4330: len = LEN(p);
4331: nd_send_int(len);
4332: m = BDY(p);
4333: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
4334: nd_send_int(CM(m));
4335: nd_send_intarray(DL(m),nd_wpd);
1.68 noro 4336: }
1.74 noro 4337: }
4338: }
4339:
4340: void nd_send_nd(ND p) {
4341: int len,i;
4342: NM m;
4343:
4344: if ( !p ) nd_send_int(0);
4345: else {
4346: len = LEN(p);
4347: nd_send_int(len);
4348: m = BDY(p);
4349: for ( i = 0; i < len; i++, m = NEXT(m) ) {
4350: nd_send_int(CM(m));
4351: nd_send_intarray(DL(m),nd_wpd);
1.65 noro 4352: }
1.74 noro 4353: }
4354: }
1.65 noro 4355:
1.74 noro 4356: NDV nd_recv_ndv()
4357: {
4358: int len,i;
4359: NMV m,m0;
4360: NDV r;
1.65 noro 4361:
1.74 noro 4362: len = nd_recv_int();
4363: if ( !len ) return 0;
4364: else {
4365: m0 = m = (NMV)GC_malloc_atomic_ignore_off_page(nmv_adv*len);
4366: ndv_alloc += len*nmv_adv;
4367: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
4368: CM(m) = nd_recv_int();
4369: nd_recv_intarray(DL(m),nd_wpd);
1.71 noro 4370: }
1.74 noro 4371: MKNDV(nd_nvar,m0,len,r);
4372: return r;
4373: }
4374: }
1.65 noro 4375:
1.74 noro 4376: int ox_exec_f4_red(Q proc)
4377: {
4378: Obj obj;
4379: STRING fname;
4380: NODE arg;
4381: int s;
4382: extern int ox_need_conv,ox_file_io;
4383:
4384: MKSTR(fname,"nd_exec_f4_red");
4385: arg = mknode(2,proc,fname);
4386: Pox_cmo_rpc(arg,&obj);
4387: s = get_ox_server_id(QTOS(proc));
4388: nd_write = iofp[s].out;
4389: nd_read = iofp[s].in;
4390: ox_need_conv = ox_file_io = 0;
4391: return s;
4392: }
4393:
4394: NODE nd_f4_red_dist(int m,ND_pairs sp0,UINT *s0vect,int col,NODE rp0)
4395: {
4396: int nsp,nred;
4397: int i,rank,s;
4398: NODE rp,r0,r;
4399: ND_pairs sp;
4400: NM_ind_pair pair;
4401: NMV nmv;
4402: NM nm;
4403: NDV nf;
4404: Obj proc,dmy;
4405:
4406: ox_launch_main(0,0,&proc);
4407: s = ox_exec_f4_red((Q)proc);
4408:
4409: nd_send_int(m);
4410: nd_send_int(nd_nvar);
4411: nd_send_int(nd_bpe);
4412: nd_send_int(nd_wpd);
4413: nd_send_int(nmv_adv);
4414:
4415: saveobj(nd_write,dp_current_spec.obj); fflush(nd_write);
4416:
4417: nd_send_int(nd_psn);
4418: for ( i = 0; i < nd_psn; i++ ) nd_send_ndv(nd_ps[i]);
4419:
4420: for ( sp = sp0, nsp = 0; sp; sp = NEXT(sp), nsp++ );
4421: nd_send_int(nsp);
4422: for ( i = 0, sp = sp0; i < nsp; i++, sp = NEXT(sp) ) {
4423: nd_send_int(sp->i1); nd_send_int(sp->i2);
4424: }
4425:
4426: nd_send_int(col); nd_send_intarray(s0vect,col*nd_wpd);
4427:
4428: nred = length(rp0); nd_send_int(nred);
4429: for ( i = 0, rp = rp0; i < nred; i++, rp = NEXT(rp) ) {
4430: pair = (NM_ind_pair)BDY(rp);
4431: nd_send_int(pair->index);
4432: nd_send_intarray(pair->mul->dl,nd_wpd);
4433: }
4434: fflush(nd_write);
4435: rank = nd_recv_int();
4436: fprintf(asir_out,"rank=%d\n",rank);
4437: r0 = 0;
4438: for ( i = 0; i < rank; i++ ) {
4439: nf = nd_recv_ndv();
4440: NEXTNODE(r0,r); BDY(r) = (pointer)nf;
4441: }
4442: Pox_shutdown(mknode(1,proc),&dmy);
4443: return r0;
4444: }
4445:
4446: /* server side */
4447:
4448: void nd_exec_f4_red_dist()
4449: {
4450: int m,i,nsp,col,s0size,nred,spcol,j,k;
4451: NM_ind_pair *rp0;
4452: NDV nf;
4453: UINT *s0vect;
4454: IndArray *imat;
4455: int *rhead;
4456: int **spmat;
4457: UINT *svect,*v;
4458: ND_pairs *sp0;
4459: int *colstat;
4460: int a,sprow,rank;
4461: struct order_spec ord;
4462: Obj ordspec;
4463: ND spol;
1.76 noro 4464: int maxrs;
4465: int *spsugar;
1.74 noro 4466:
4467: nd_read = iofp[0].in;
4468: nd_write = iofp[0].out;
4469: m = nd_recv_int();
4470: nd_nvar = nd_recv_int();
4471: nd_bpe = nd_recv_int();
4472: nd_wpd = nd_recv_int();
4473: nmv_adv = nd_recv_int();
4474:
4475: loadobj(nd_read,&ordspec);
4476: create_order_spec(ordspec,&ord);
4477: nd_init_ord(&ord);
4478: nd_setup_parameters(nd_nvar,0);
4479:
4480: nd_psn = nd_recv_int();
4481: nd_ps = (NDV *)MALLOC(nd_psn*sizeof(NDV));
4482: nd_bound = (UINT **)MALLOC(nd_psn*sizeof(UINT *));
4483: for ( i = 0; i < nd_psn; i++ ) {
4484: nd_ps[i] = nd_recv_ndv();
4485: nd_bound[i] = ndv_compute_bound(nd_ps[i]);
4486: }
4487:
4488: nsp = nd_recv_int();
4489: sp0 = (ND_pairs *)MALLOC(nsp*sizeof(ND_pairs));
4490: for ( i = 0; i < nsp; i++ ) {
4491: NEWND_pairs(sp0[i]);
4492: sp0[i]->i1 = nd_recv_int(); sp0[i]->i2 = nd_recv_int();
4493: ndl_lcm(HDL(nd_ps[sp0[i]->i1]),HDL(nd_ps[sp0[i]->i2]),LCM(sp0[i]));
4494: }
4495:
4496: col = nd_recv_int();
4497: s0size = col*nd_wpd;
4498: s0vect = (UINT *)MALLOC(s0size*sizeof(UINT));
4499: nd_recv_intarray(s0vect,s0size);
4500:
4501: nred = nd_recv_int();
4502: rp0 = (NM_ind_pair *)MALLOC(nred*sizeof(NM_ind_pair));
4503: for ( i = 0; i < nred; i++ ) {
4504: rp0[i] = (NM_ind_pair)MALLOC(sizeof(struct oNM_ind_pair));
4505: rp0[i]->index = nd_recv_int();
4506: rp0[i]->mul = (NM)MALLOC(sizeof(struct oNM)+(nd_wpd-1)*sizeof(UINT));
4507: nd_recv_intarray(rp0[i]->mul->dl,nd_wpd);
4508: }
4509:
4510: spcol = col-nred;
4511: imat = (IndArray *)MALLOC(nred*sizeof(IndArray));
4512: rhead = (int *)MALLOC(col*sizeof(int));
4513: for ( i = 0; i < col; i++ ) rhead[i] = 0;
4514:
4515: /* construction of index arrays */
4516: for ( i = 0; i < nred; i++ ) {
4517: imat[i] = nm_ind_pair_to_vect_compress(m,s0vect,col,rp0[i]);
4518: rhead[imat[i]->head] = 1;
4519: }
4520:
4521: /* elimination (1st step) */
4522: spmat = (int **)MALLOC(nsp*sizeof(UINT *));
4523: svect = (UINT *)MALLOC(col*sizeof(UINT));
1.76 noro 4524: spsugar = (int *)ALLOCA(nsp*sizeof(UINT));
1.74 noro 4525: for ( a = sprow = 0; a < nsp; a++ ) {
4526: nd_sp(m,0,sp0[a],&spol);
1.75 noro 4527: if ( !spol ) continue;
1.74 noro 4528: nd_to_vect(m,s0vect,col,spol,svect);
1.76 noro 4529: if ( m == -1 )
4530: maxrs = ndv_reduce_vect_sf(m,svect,col,imat,rp0,nred);
4531: else
4532: maxrs = ndv_reduce_vect(m,svect,col,imat,rp0,nred);
1.74 noro 4533: for ( i = 0; i < col; i++ ) if ( svect[i] ) break;
4534: if ( i < col ) {
4535: spmat[sprow] = v = (UINT *)MALLOC(spcol*sizeof(UINT));
4536: for ( j = k = 0; j < col; j++ )
4537: if ( !rhead[j] ) v[k++] = svect[j];
1.76 noro 4538: spsugar[sprow] = MAX(maxrs,SG(spol));
1.74 noro 4539: sprow++;
4540: }
1.76 noro 4541: nd_free(spol);
1.74 noro 4542: }
4543: /* elimination (2nd step) */
4544: colstat = (int *)ALLOCA(spcol*sizeof(int));
4545: if ( m == -1 )
1.76 noro 4546: rank = nd_gauss_elim_sf(spmat,spsugar,sprow,spcol,m,colstat);
1.74 noro 4547: else
1.76 noro 4548: rank = nd_gauss_elim_mod(spmat,spsugar,sprow,spcol,m,colstat);
1.74 noro 4549: nd_send_int(rank);
4550: for ( i = 0; i < rank; i++ ) {
4551: nf = vect_to_ndv(spmat[i],spcol,col,rhead,s0vect);
4552: nd_send_ndv(nf);
1.63 noro 4553: }
1.74 noro 4554: fflush(nd_write);
1.76 noro 4555: }
4556:
4557: int nd_gauss_elim_mod(int **mat0,int *sugar,int row,int col,int md,int *colstat)
4558: {
4559: int i,j,k,l,inv,a,rank,s;
4560: unsigned int *t,*pivot,*pk;
4561: unsigned int **mat;
4562:
4563: mat = (unsigned int **)mat0;
4564: for ( rank = 0, j = 0; j < col; j++ ) {
4565: for ( i = rank; i < row; i++ )
4566: mat[i][j] %= md;
4567: for ( i = rank; i < row; i++ )
4568: if ( mat[i][j] )
4569: break;
4570: if ( i == row ) {
4571: colstat[j] = 0;
4572: continue;
4573: } else
4574: colstat[j] = 1;
4575: if ( i != rank ) {
4576: t = mat[i]; mat[i] = mat[rank]; mat[rank] = t;
4577: s = sugar[i]; sugar[i] = sugar[rank]; sugar[rank] = s;
4578: }
4579: pivot = mat[rank];
4580: s = sugar[rank];
4581: inv = invm(pivot[j],md);
4582: for ( k = j, pk = pivot+k; k < col; k++, pk++ )
4583: if ( *pk ) {
4584: if ( *pk >= (unsigned int)md )
4585: *pk %= md;
4586: DMAR(*pk,inv,0,md,*pk)
4587: }
4588: for ( i = rank+1; i < row; i++ ) {
4589: t = mat[i];
4590: if ( a = t[j] ) {
4591: sugar[i] = MAX(sugar[i],s);
4592: red_by_vect(md,t+j,pivot+j,md-a,col-j);
4593: }
4594: }
4595: rank++;
4596: }
4597: for ( j = col-1, l = rank-1; j >= 0; j-- )
4598: if ( colstat[j] ) {
4599: pivot = mat[l];
4600: s = sugar[l];
4601: for ( i = 0; i < l; i++ ) {
4602: t = mat[i];
4603: t[j] %= md;
4604: if ( a = t[j] ) {
4605: sugar[i] = MAX(sugar[i],s);
4606: red_by_vect(md,t+j,pivot+j,md-a,col-j);
4607: }
4608: }
4609: l--;
4610: }
4611: for ( j = 0, l = 0; l < rank; j++ )
4612: if ( colstat[j] ) {
4613: t = mat[l];
4614: for ( k = j; k < col; k++ )
4615: if ( t[k] >= (unsigned int)md )
4616: t[k] %= md;
4617: l++;
4618: }
4619: return rank;
4620: }
4621:
/*
 * In-place Gaussian elimination on the row x col matrix mat0 using the
 * _invsf/_mulsf/_chsgnsf coefficient operations.
 * sugar[i] accompanies row i: it is swapped together with the row and is
 * raised to the pivot row's value whenever the row is reduced by a pivot.
 * colstat[j] is set to 1 if column j received a pivot and to 0 otherwise.
 * md is only forwarded to red_by_vect_sf().
 * Returns the number of pivots found (the rank).
 */
int nd_gauss_elim_sf(int **mat0,int *sugar,int row,int col,int md,int *colstat)
{
	unsigned int **mat;
	unsigned int *cur,*prow,*pe;
	int r,c,e,lead,first,inv,coef,rank,psugar,tmp;

	mat = (unsigned int **)mat0;

	/* forward elimination */
	rank = 0;
	for ( c = 0; c < col; c++ ) {
		/* first remaining row with a nonzero entry in column c */
		first = rank;
		while ( first < row && !mat[first][c] )
			first++;
		if ( first == row ) {
			colstat[c] = 0;
			continue;
		}
		colstat[c] = 1;
		if ( first != rank ) {
			cur = mat[first]; mat[first] = mat[rank]; mat[rank] = cur;
			tmp = sugar[first]; sugar[first] = sugar[rank]; sugar[rank] = tmp;
		}
		prow = mat[rank];
		psugar = sugar[rank];
		inv = _invsf(prow[c]);
		/* scale the pivot row by the inverse of its leading entry */
		for ( e = c, pe = prow+c; e < col; e++, pe++ ) {
			if ( !*pe )
				continue;
			*pe = _mulsf(*pe,inv);
		}
		/* clear column c in the rows below the pivot */
		for ( r = rank+1; r < row; r++ ) {
			cur = mat[r];
			coef = cur[c];
			if ( coef ) {
				sugar[r] = MAX(sugar[r],psugar);
				red_by_vect_sf(md,cur+c,prow+c,_chsgnsf(coef),col-c);
			}
		}
		rank++;
	}

	/* back substitution: clear each pivot column in the rows above it */
	lead = rank-1;
	for ( c = col-1; c >= 0; c-- ) {
		if ( !colstat[c] )
			continue;
		prow = mat[lead];
		psugar = sugar[lead];
		for ( r = 0; r < lead; r++ ) {
			cur = mat[r];
			coef = cur[c];
			if ( coef ) {
				sugar[r] = MAX(sugar[r],psugar);
				red_by_vect_sf(md,cur+c,prow+c,_chsgnsf(coef),col-c);
			}
		}
		lead--;
	}
	return rank;
}
4672:
4673: int ndv_ishomo(NDV p)
4674: {
4675: NMV m;
4676: int len,h;
4677:
4678: if ( !p ) return 1;
4679: len = LEN(p);
4680: m = BDY(p);
4681: h = TD(DL(m));
4682: NMV_ADV(m);
4683: for ( len--; len; len--, NMV_ADV(m) )
4684: if ( TD(DL(m)) != h ) return 0;
4685: return 1;
4686: }
4687:
4688: void ndv_save(NDV p,int index)
4689: {
4690: FILE *s;
4691: char name[BUFSIZ];
4692: short id;
4693: int nv,sugar,len,n,i,td,e,j;
4694: NMV m;
4695: unsigned int *dl;
4696:
4697: sprintf(name,"%s/%d",Demand,index);
4698: s = fopen(name,"w");
4699: savevl(s,0);
4700: if ( !p ) {
4701: saveobj(s,0);
4702: return;
4703: }
4704: id = O_DP;
4705: nv = NV(p);
4706: sugar = SG(p);
4707: len = LEN(p);
4708: write_short(s,&id); write_int(s,&nv); write_int(s,&sugar);
4709: write_int(s,&len);
4710:
4711: for ( m = BDY(p), i = 0; i < len; i++, NMV_ADV(m) ) {
4712: saveobj(s,(Obj)CQ(m));
4713: dl = DL(m);
4714: td = TD(dl);
4715: write_int(s,&td);
4716: for ( j = 0; j < nv; j++ ) {
4717: e = GET_EXP(dl,j);
4718: write_int(s,&e);
4719: }
4720: }
4721: fclose(s);
4722: }
4723:
4724: NDV ndv_load(int index)
4725: {
4726: FILE *s;
4727: char name[BUFSIZ];
4728: short id;
4729: int nv,sugar,len,n,i,td,e,j;
4730: NDV d;
4731: NMV m0,m;
4732: unsigned int *dl;
4733: Obj obj;
4734:
4735: sprintf(name,"%s/%d",Demand,index);
4736: s = fopen(name,"r");
4737: if ( !s ) return 0;
4738:
4739: skipvl(s);
4740: read_short(s,&id);
4741: if ( !id ) return 0;
4742: read_int(s,&nv);
4743: read_int(s,&sugar);
4744: read_int(s,&len);
4745:
4746: m0 = m = MALLOC(len*nmv_adv);
4747: for ( i = 0; i < len; i++, NMV_ADV(m) ) {
4748: loadobj(s,&obj); CQ(m) = (Q)obj;
4749: dl = DL(m);
4750: ndl_zero(dl);
4751: read_int(s,&td); TD(dl) = td;
4752: for ( j = 0; j < nv; j++ ) {
4753: read_int(s,&e);
4754: PUT_EXP(dl,j,e);
4755: }
4756: if ( nd_blockmask ) ndl_weight_mask(dl);
4757: }
4758: fclose(s);
4759: MKNDV(nv,m0,len,d);
4760: SG(d) = sugar;
4761: return d;
1.59 noro 4762: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>