=================================================================== RCS file: /home/cvs/OpenXM_contrib2/asir2000/engine/nd.c,v retrieving revision 1.40 retrieving revision 1.44 diff -u -p -r1.40 -r1.44 --- OpenXM_contrib2/asir2000/engine/nd.c 2003/08/21 04:44:36 1.40 +++ OpenXM_contrib2/asir2000/engine/nd.c 2003/08/22 08:32:51 1.44 @@ -1,4 +1,4 @@ -/* $OpenXM: OpenXM_contrib2/asir2000/engine/nd.c,v 1.39 2003/08/21 03:13:01 noro Exp $ */ +/* $OpenXM: OpenXM_contrib2/asir2000/engine/nd.c,v 1.43 2003/08/22 07:12:49 noro Exp $ */ #include "ca.h" #include "inline.h" @@ -73,31 +73,46 @@ typedef struct oND_pairs { unsigned int lcm[1]; } *ND_pairs; +/* index and shift count for each exponent */ +typedef struct oEPOS { + int i; /* index */ + int s; /* shift */ +} *EPOS; + +typedef struct oBlockMask { + int n; + struct order_pair *order_pair; + unsigned int **mask; +} *BlockMask; + int (*nd_compare_function)(unsigned int *a1,unsigned int *a2); -double nd_scale=2; +static double nd_scale=2; static unsigned int **nd_bound; -int nd_nvar; -int nd_isrlex; -int nd_epw,nd_bpe,nd_wpd; -unsigned int nd_mask[32]; -unsigned int nd_mask0,nd_mask1; +static struct order_spec *nd_ord; +static EPOS nd_epos; +static BlockMask nd_blockmask; +static int nd_nvar; +static int nd_isrlex; +static int nd_epw,nd_bpe,nd_wpd,nd_exporigin; +static unsigned int nd_mask[32]; +static unsigned int nd_mask0,nd_mask1; -NM _nm_free_list; -ND _nd_free_list; -ND_pairs _ndp_free_list; +static NM _nm_free_list; +static ND _nd_free_list; +static ND_pairs _ndp_free_list; static NDV *nd_ps; static NDV *nd_psq; -RHist *nd_psh; -int nd_psn,nd_pslen; +static RHist *nd_psh; +static int nd_psn,nd_pslen; -RHist *nd_red; +static RHist *nd_red; -int nd_found,nd_create,nd_notfirst; -int nm_adv; -int nmv_adv; -int nd_dcomp; +static int nd_found,nd_create,nd_notfirst; +static int nm_adv; +static int nmv_adv; +static int nd_dcomp; extern int Top,Reverse,dp_nelim; @@ -113,16 +128,26 @@ extern int Top,Reverse,dp_nelim; #define SG(a) ((a)->sugar) #define LEN(a) ((a)->len) #define LCM(a) ((a)->lcm) +#define GET_EXP(d,a) (((d)[nd_epos[a].i]>>nd_epos[a].s)&nd_mask0) +#define PUT_EXP(r,a,e) ((r)[nd_epos[a].i] |= ((e)<TD(d2)?1:(TD(d1)TD(d2)?1:(TD(d1)0?TD_DL_COMPARE(d1,d2)\ + :(nd_dcomp==0?ndl_lex_compare(d1,d2)\ + :(nd_blockmask?ndl_block_compare(d1,d2)\ + :(*nd_compare_function)(d1,d2)))) +#else +#define DL_COMPARE(d1,d2)\ +(nd_dcomp>0?TD_DL_COMPARE(d1,d2):(*nd_compare_function)(d1,d2)) +#endif /* allocators */ #define NEWRHist(r) \ -((r)=(RHist)MALLOC(sizeof(struct oRHist)+nd_wpd*sizeof(unsigned int))) +((r)=(RHist)MALLOC(sizeof(struct oRHist)+(nd_wpd-1)*sizeof(unsigned int))) #define NEWND_pairs(m) \ if(!_ndp_free_list)_NDP_alloc();\ (m)=_ndp_free_list; _ndp_free_list = NEXT(_ndp_free_list) @@ -192,11 +217,12 @@ NODE nd_gb_trace(int m); /* ndl functions */ int ndl_weight(unsigned int *d); +int ndl_weight_mask(unsigned int *d,int i); void ndl_dehomogenize(unsigned int *p); -void ndl_reconstruct(int obpe,unsigned int *d,unsigned int *r); -INLINE int nd_length(ND p); +void ndl_reconstruct(int obpe,EPOS oepos,unsigned int *d,unsigned int *r); INLINE int ndl_reducible(unsigned int *d1,unsigned int *d2); INLINE int ndl_lex_compare(unsigned int *d1,unsigned int *d2); +INLINE int ndl_block_compare(unsigned int *d1,unsigned int *d2); INLINE int ndl_equal(unsigned int *d1,unsigned int *d2); INLINE void ndl_copy(unsigned int *d1,unsigned int *d2); INLINE void ndl_add(unsigned int *d1,unsigned int *d2,unsigned int *d); @@ -225,7 +251,6 @@ void nd_free_private_storage(); void _NM_alloc(); void _ND_alloc(); void nd_free(ND p); -void nd_realloc(ND p,int obpe); void nd_free_redlist(); /* printing */ @@ -241,6 +266,7 @@ ND_pairs nd_reconstruct(int mod,int trace,ND_pairs ndp void nd_reconstruct_direct(int mod,NDV *ps,int len); void nd_setup(int mod,int trace,NODE f); void nd_setup_parameters(); +BlockMask nd_create_blockmask(struct order_spec *ord); /* ND functions */ int nd_check_candidate(NODE input,NODE cand); @@ -254,11 +280,12 @@ unsigned int *dp_compute_bound(DP p); ND nd_copy(ND p); ND nd_add(int mod,ND p1,ND p2); ND nd_add_q(ND p1,ND p2); +INLINE int nd_length(ND p); /* NDV functions */ void ndv_mul_c(int mod,NDV p,int mul); void ndv_mul_c_q(NDV p,Q mul); -void ndv_realloc(NDV p,int obpe,int oadv); +void ndv_realloc(NDV p,int obpe,int oadv,EPOS oepos); ND ndv_mul_nm(int mod,NDV p,NM m0); void ndv_dehomogenize(NDV p); void ndv_removecont(int mod,NDV p); @@ -289,7 +316,7 @@ void _NM_alloc() int i; for ( i = 0; i < 1024; i++ ) { - p = (NM)GC_malloc(sizeof(struct oNM)+nd_wpd*sizeof(unsigned int)); + p = (NM)GC_malloc(sizeof(struct oNM)+(nd_wpd-1)*sizeof(unsigned int)); p->next = _nm_free_list; _nm_free_list = p; } } @@ -312,7 +339,7 @@ void _NDP_alloc() for ( i = 0; i < 1024; i++ ) { p = (ND_pairs)GC_malloc(sizeof(struct oND_pairs) - +nd_wpd*sizeof(unsigned int)); + +(nd_wpd-1)*sizeof(unsigned int)); p->next = _ndp_free_list; _ndp_free_list = p; } } @@ -338,7 +365,7 @@ INLINE int ndl_reducible(unsigned int *d1,unsigned int if ( TD(d1) < TD(d2) ) return 0; switch ( nd_bpe ) { case 4: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( (u1&0xf0000000) < (u2&0xf0000000) ) return 0; if ( (u1&0xf000000) < (u2&0xf000000) ) return 0; @@ -352,7 +379,7 @@ INLINE int ndl_reducible(unsigned int *d1,unsigned int return 1; break; case 6: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( (u1&0x3f000000) < (u2&0x3f000000) ) return 0; if ( (u1&0xfc0000) < (u2&0xfc0000) ) return 0; @@ -363,7 +390,7 @@ INLINE int ndl_reducible(unsigned int *d1,unsigned int return 1; break; case 8: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( (u1&0xff000000) < (u2&0xff000000) ) return 0; if ( (u1&0xff0000) < (u2&0xff0000) ) return 0; @@ -373,7 +400,7 @@ INLINE int ndl_reducible(unsigned int *d1,unsigned int return 1; break; case 16: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( (u1&0xffff0000) < (u2&0xffff0000) ) return 0; if ( (u1&0xffff) < (u2&0xffff) ) return 0; @@ -381,12 +408,12 @@ INLINE int ndl_reducible(unsigned int *d1,unsigned int return 1; break; case 32: - for ( i = 1; i <= nd_wpd; i++ ) + for ( i = nd_exporigin; i < nd_wpd; i++ ) if ( d1[i] < d2[i] ) return 0; return 1; break; default: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; for ( j = 0; j < nd_epw; j++ ) if ( (u1&nd_mask[j]) < (u2&nd_mask[j]) ) return 0; @@ -401,35 +428,40 @@ void ndl_dehomogenize(unsigned int *d) unsigned int h; int i,bits; - if ( nd_isrlex ) { - if ( nd_bpe == 32 ) { - h = d[1]; - for ( i = 2; i <= nd_wpd; i++ ) - d[i-1] = d[i]; - d[i-1] = 0; - TD(d) -= h; - } else { - bits = nd_epw*nd_bpe; - mask = bits==32?0xffffffff:((1<<(nd_epw*nd_bpe))-1); - h = (d[1]>>((nd_epw-1)*nd_bpe))&nd_mask0; - for ( i = 1; i <= nd_wpd; i++ ) - d[i] = ((d[i]<>((nd_epw-1)*nd_bpe))&nd_mask0):0); - TD(d) -= h; - } - } else - TD(d) -= ((d[(nd_nvar-1)/nd_epw+1]>> - ((nd_epw-((nd_nvar-1)%nd_epw)-1)*nd_bpe))&((1<>((nd_epw-1)*nd_bpe))&nd_mask0; + for ( i = nd_exporigin; i < nd_wpd; i++ ) + d[i] = ((d[i]<>((nd_epw-1)*nd_bpe))&nd_mask0):0); + TD(d) -= h; + } + } else + TD(d) -= GET_EXP(d,nd_nvar-1); + } } void ndl_lcm(unsigned int *d1,unsigned *d2,unsigned int *d) { unsigned int t1,t2,u,u1,u2; - int i,j; + int i,j,l; switch ( nd_bpe ) { case 4: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = (u1&0xf0000000); t2 = (u2&0xf0000000); u = t1>t2?t1:t2; t1 = (u1&0xf000000); t2 = (u2&0xf000000); u |= t1>t2?t1:t2; @@ -443,7 +475,7 @@ void ndl_lcm(unsigned int *d1,unsigned *d2,unsigned in } break; case 6: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = (u1&0x3f000000); t2 = (u2&0x3f000000); u = t1>t2?t1:t2; t1 = (u1&0xfc0000); t2 = (u2&0xfc0000); u |= t1>t2?t1:t2; @@ -454,7 +486,7 @@ void ndl_lcm(unsigned int *d1,unsigned *d2,unsigned in } break; case 8: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = (u1&0xff000000); t2 = (u2&0xff000000); u = t1>t2?t1:t2; t1 = (u1&0xff0000); t2 = (u2&0xff0000); u |= t1>t2?t1:t2; @@ -464,7 +496,7 @@ void ndl_lcm(unsigned int *d1,unsigned *d2,unsigned in } break; case 16: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = (u1&0xffff0000); t2 = (u2&0xffff0000); u = t1>t2?t1:t2; t1 = (u1&0xffff); t2 = (u2&0xffff); u |= t1>t2?t1:t2; @@ -472,13 +504,13 @@ void ndl_lcm(unsigned int *d1,unsigned *d2,unsigned in } break; case 32: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; d[i] = u1>u2?u1:u2; } break; default: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; for ( j = 0, u = 0; j < nd_epw; j++ ) { t1 = (u1&nd_mask[j]); t2 = (u2&nd_mask[j]); u |= t1>t2?t1:t2; @@ -488,6 +520,11 @@ void ndl_lcm(unsigned int *d1,unsigned *d2,unsigned in break; } TD(d) = ndl_weight(d); + if ( nd_blockmask ) { + l = nd_blockmask->n; + for ( j = 0; j < l; j++ ) + d[j+1] = ndl_weight_mask(d,j); + } } int ndl_weight(unsigned int *d) @@ -495,7 +532,7 @@ int ndl_weight(unsigned int *d) unsigned int t,u; int i,j; - for ( t = 0, i = 1; i <= nd_wpd; i++ ) { + for ( t = 0, i = nd_exporigin; i < nd_wpd; i++ ) { u = d[i]; for ( j = 0; j < nd_epw; j++, u>>=nd_bpe ) t += (u&nd_mask0); @@ -503,11 +540,28 @@ int ndl_weight(unsigned int *d) return t; } -INLINE int ndl_lex_compare(unsigned int *d1,unsigned int *d2) +int ndl_weight_mask(unsigned int *d,int index) { + unsigned int t,u; + unsigned int *mask; + int i,j; + + mask = nd_blockmask->mask[index]; + for ( t = 0, i = nd_exporigin; i < nd_wpd; i++ ) { + u = d[i]&mask[i]; + for ( j = 0; j < nd_epw; j++, u>>=nd_bpe ) + t += (u&nd_mask0); + } + return t; +} + +int ndl_lex_compare(unsigned int *d1,unsigned int *d2) +{ int i; - for ( i = 0; i < nd_wpd; i++, d1++, d2++ ) + d1 += nd_exporigin; + d2 += nd_exporigin; + for ( i = nd_exporigin; i < nd_wpd; i++, d1++, d2++ ) if ( *d1 > *d2 ) return nd_isrlex ? -1 : 1; else if ( *d1 < *d2 ) @@ -515,12 +569,39 @@ INLINE int ndl_lex_compare(unsigned int *d1,unsigned i return 0; } +int ndl_block_compare(unsigned int *d1,unsigned int *d2) +{ + int i,l,j,ord_o,ord_l; + struct order_pair *op; + unsigned int t1,t2,m; + unsigned int *mask; + + l = nd_blockmask->n; + op = nd_blockmask->order_pair; + for ( j = 0; j < l; j++ ) { + mask = nd_blockmask->mask[j]; + ord_o = op[j].order; + if ( ord_o < 2 ) + if ( (t1=d1[j+1]) > (t2=d2[j+1]) ) return 1; + else if ( t1 < t2 ) return -1; + for ( i = nd_exporigin; i < nd_wpd; i++ ) { + m = mask[i]; + t1 = d1[i]&m; + t2 = d2[i]&m; + if ( t1 > t2 ) + return !ord_o ? -1 : 1; + else if ( t1 < t2 ) + return !ord_o ? 1 : -1; + } + } + return 0; +} + INLINE int ndl_equal(unsigned int *d1,unsigned int *d2) { int i; - if ( *d1++ != *d2++ ) return 0; - for ( i = 1; i <= nd_wpd; i++ ) + for ( i = 0; i < nd_wpd; i++ ) if ( *d1++ != *d2++ ) return 0; return 1; @@ -531,17 +612,17 @@ INLINE void ndl_copy(unsigned int *d1,unsigned int *d2 int i; switch ( nd_wpd ) { - case 1: + case 2: TD(d2) = TD(d1); d2[1] = d1[1]; break; - case 2: + case 3: TD(d2) = TD(d1); d2[1] = d1[1]; d2[2] = d1[2]; break; default: - for ( i = 0; i <= nd_wpd; i++ ) + for ( i = 0; i < nd_wpd; i++ ) d2[i] = d1[i]; break; } @@ -551,28 +632,31 @@ INLINE void ndl_add(unsigned int *d1,unsigned int *d2, { int i; - TD(d) = TD(d1)+TD(d2); +#if 1 switch ( nd_wpd ) { - case 1: + case 2: + TD(d) = TD(d1)+TD(d2); d[1] = d1[1]+d2[1]; break; - case 2: + case 3: + TD(d) = TD(d1)+TD(d2); d[1] = d1[1]+d2[1]; d[2] = d1[2]+d2[2]; break; default: - for ( i = 1; i <= nd_wpd; i++ ) - d[i] = d1[i]+d2[i]; + for ( i = 0; i < nd_wpd; i++ ) d[i] = d1[i]+d2[i]; break; } +#else + for ( i = 0; i < nd_wpd; i++ ) d[i] = d1[i]+d2[i]; +#endif } INLINE void ndl_sub(unsigned int *d1,unsigned int *d2,unsigned int *d) { int i; - for ( i = 0; i <= nd_wpd; i++ ) - d[i] = d1[i]-d2[i]; + for ( i = 0; i < nd_wpd; i++ ) d[i] = d1[i]-d2[i]; } int ndl_disjoint(unsigned int *d1,unsigned int *d2) @@ -582,7 +666,7 @@ int ndl_disjoint(unsigned int *d1,unsigned int *d2) switch ( nd_bpe ) { case 4: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = u1&0xf0000000; t2 = u2&0xf0000000; if ( t1&&t2 ) return 0; t1 = u1&0xf000000; t2 = u2&0xf000000; if ( t1&&t2 ) return 0; @@ -596,7 +680,7 @@ int ndl_disjoint(unsigned int *d1,unsigned int *d2) return 1; break; case 6: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = u1&0x3f000000; t2 = u2&0x3f000000; if ( t1&&t2 ) return 0; t1 = u1&0xfc0000; t2 = u2&0xfc0000; if ( t1&&t2 ) return 0; @@ -607,7 +691,7 @@ int ndl_disjoint(unsigned int *d1,unsigned int *d2) return 1; break; case 8: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = u1&0xff000000; t2 = u2&0xff000000; if ( t1&&t2 ) return 0; t1 = u1&0xff0000; t2 = u2&0xff0000; if ( t1&&t2 ) return 0; @@ -617,7 +701,7 @@ int ndl_disjoint(unsigned int *d1,unsigned int *d2) return 1; break; case 16: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; t1 = u1&0xffff0000; t2 = u2&0xffff0000; if ( t1&&t2 ) return 0; t1 = u1&0xffff; t2 = u2&0xffff; if ( t1&&t2 ) return 0; @@ -625,12 +709,12 @@ int ndl_disjoint(unsigned int *d1,unsigned int *d2) return 1; break; case 32: - for ( i = 1; i <= nd_wpd; i++ ) + for ( i = nd_exporigin; i < nd_wpd; i++ ) if ( d1[i] && d2[i] ) return 0; return 1; break; default: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; for ( j = 0; j < nd_epw; j++ ) { if ( (u1&nd_mask0) && (u2&nd_mask0) ) return 0; @@ -652,7 +736,7 @@ int ndl_check_bound2(int index,unsigned int *d2) ind = 0; switch ( nd_bpe ) { case 4: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u2 = d2[i]; if ( d1[ind++]+((u2>>28)&0xf) >= 0x10 ) return 1; if ( d1[ind++]+((u2>>24)&0xf) >= 0x10 ) return 1; @@ -666,7 +750,7 @@ int ndl_check_bound2(int index,unsigned int *d2) return 0; break; case 6: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u2 = d2[i]; if ( d1[ind++]+((u2>>24)&0x3f) >= 0x40 ) return 1; if ( d1[ind++]+((u2>>18)&0x3f) >= 0x40 ) return 1; @@ -677,7 +761,7 @@ int ndl_check_bound2(int index,unsigned int *d2) return 0; break; case 8: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u2 = d2[i]; if ( d1[ind++]+((u2>>24)&0xff) >= 0x100 ) return 1; if ( d1[ind++]+((u2>>16)&0xff) >= 0x100 ) return 1; @@ -687,7 +771,7 @@ int ndl_check_bound2(int index,unsigned int *d2) return 0; break; case 16: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u2 = d2[i]; if ( d1[ind++]+((u2>>16)&0xffff) > 0x10000 ) return 1; if ( d1[ind++]+(u2&0xffff) > 0x10000 ) return 1; @@ -695,12 +779,12 @@ int ndl_check_bound2(int index,unsigned int *d2) return 0; break; case 32: - for ( i = 1; i <= nd_wpd; i++ ) + for ( i = nd_exporigin; i < nd_wpd; i++ ) if ( d1[i]+d2[i]>28)&0xf)+((u2>>28)&0xf) >= 0x10 ) return 1; if ( ((u1>>24)&0xf)+((u2>>24)&0xf) >= 0x10 ) return 1; @@ -732,7 +816,7 @@ int ndl_check_bound2_direct(unsigned int *d1,unsigned return 0; break; case 6: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( ((u1>>24)&0x3f)+((u2>>24)&0x3f) >= 0x40 ) return 1; if ( ((u1>>18)&0x3f)+((u2>>18)&0x3f) >= 0x40 ) return 1; @@ -743,7 +827,7 @@ int ndl_check_bound2_direct(unsigned int *d1,unsigned return 0; break; case 8: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( ((u1>>24)&0xff)+((u2>>24)&0xff) >= 0x100 ) return 1; if ( ((u1>>16)&0xff)+((u2>>16)&0xff) >= 0x100 ) return 1; @@ -753,7 +837,7 @@ int ndl_check_bound2_direct(unsigned int *d1,unsigned return 0; break; case 16: - for ( i = 1; i <= nd_wpd; i++ ) { + for ( i = nd_exporigin; i < nd_wpd; i++ ) { u1 = d1[i]; u2 = d2[i]; if ( ((u1>>16)&0xffff)+((u2>>16)&0xffff) > 0x10000 ) return 1; if ( (u2&0xffff)+(u2&0xffff) > 0x10000 ) return 1; @@ -761,12 +845,12 @@ int ndl_check_bound2_direct(unsigned int *d1,unsigned return 0; break; case 32: - for ( i = 1; i <= nd_wpd; i++ ) + for ( i = nd_exporigin; i < nd_wpd; i++ ) if ( d1[i]+d2[i]= 0 ) { @@ -1041,7 +1125,7 @@ int nd_nf_pbucket(int mod,ND g,int full,ND *rp) bucket = create_pbucket(); add_pbucket(mod,bucket,g); d = 0; - mul = (NM)ALLOCA(sizeof(struct oNM)+nd_wpd*sizeof(unsigned int)); + mul = (NM)ALLOCA(sizeof(struct oNM)+(nd_wpd-1)*sizeof(unsigned int)); while ( 1 ) { hindex = mod?head_pbucket(mod,bucket):head_pbucket_q(bucket); if ( hindex < 0 ) { @@ -1139,7 +1223,7 @@ int nd_nf_direct(int mod,ND g,NDV *ps,int len,int full sugar0 = sugar = SG(g); n = NV(g); - mul = (NM)ALLOCA(sizeof(struct oNM)+nd_wpd*sizeof(unsigned int)); + mul = (NM)ALLOCA(sizeof(struct oNM)+(nd_wpd-1)*sizeof(unsigned int)); for ( d = 0; g; ) { index = nd_find_reducer_direct(g,ps,len); if ( index >= 0 ) { @@ -1215,7 +1299,7 @@ int nd_nf_direct_pbucket(int mod,ND g,NDV *ps,int len, bucket = create_pbucket(); add_pbucket(mod,bucket,g); d = 0; - mul = (NM)ALLOCA(sizeof(struct oNM)+nd_wpd*sizeof(unsigned int)); + mul = (NM)ALLOCA(sizeof(struct oNM)+(nd_wpd-1)*sizeof(unsigned int)); while ( 1 ) { hindex = mod?head_pbucket(mod,bucket):head_pbucket_q(bucket); if ( hindex < 0 ) { @@ -1494,7 +1578,11 @@ again: d = nd_reconstruct(m,0,d); goto again; } +#if USE_GEOBUCKET stat = m?nd_nf_pbucket(m,h,!Top,&nf):nd_nf(m,h,!Top,&nf); +#else + stat = nd_nf(m,h,!Top,&nf); +#endif if ( !stat ) { NEXT(l) = d; d = l; d = nd_reconstruct(m,0,d); @@ -1545,7 +1633,11 @@ again: d = nd_reconstruct(m,1,d); goto again; } +#if USE_GEOBUCKET stat = nd_nf_pbucket(m,h,!Top,&nf); +#else + stat = nd_nf(m,h,!Top,&nf); +#endif if ( !stat ) { NEXT(l) = d; d = l; d = nd_reconstruct(m,1,d); @@ -1686,7 +1778,7 @@ ND_pairs crit_B( ND_pairs d, int s ) t = DL(nd_psh[s]); prev = 0; head = cur = d; - lcm = (unsigned int *)ALLOCA((nd_wpd+1)*sizeof(unsigned int)); + lcm = (unsigned int *)ALLOCA(nd_wpd*sizeof(unsigned int)); while ( cur ) { tl = cur->lcm; if ( ndl_reducible(tl,t) @@ -2055,36 +2147,69 @@ void nd_gr_trace(LIST f,LIST v,int m,int homo,struct o void dltondl(int n,DL dl,unsigned int *r) { unsigned int *d; - int i; + int i,j,l,s,ord_l,ord_o; + struct order_pair *op; d = dl->d; - for ( i = 0; i <= nd_wpd; i++ ) r[i] = 0; - if ( nd_isrlex ) - for ( i = 0; i < n; i++ ) - r[(n-1-i)/nd_epw+1] |= (d[i]<<((nd_epw-((n-1-i)%nd_epw)-1)*nd_bpe)); - else - for ( i = 0; i < n; i++ ) - r[i/nd_epw+1] |= d[i]<<((nd_epw-(i%nd_epw)-1)*nd_bpe); - TD(r) = ndl_weight(r); + for ( i = 0; i < nd_wpd; i++ ) r[i] = 0; + if ( nd_blockmask ) { + l = nd_blockmask->n; + op = nd_blockmask->order_pair; + for ( j = 0, s = 0; j < l; j++ ) { + ord_o = op[j].order; + ord_l = op[j].length; + if ( !ord_o ) + for ( i = 0; i < ord_l; i++ ) + PUT_EXP(r,s+ord_l-i-1,d[s+i]); + else + for ( i = 0; i < ord_l; i++ ) + PUT_EXP(r,s+i,d[s+i]); + s += ord_l; + } + TD(r) = ndl_weight(r); + for ( j = 0; j < l; j++ ) + r[j+1] = ndl_weight_mask(r,j); + } else { + if ( nd_isrlex ) + for ( i = 0; i < n; i++ ) PUT_EXP(r,n-1-i,d[i]); + else + for ( i = 0; i < n; i++ ) PUT_EXP(r,i,d[i]); + TD(r) = ndl_weight(r); + } } DL ndltodl(int n,unsigned int *ndl) { DL dl; int *d; - int i; + int i,j,l,s,ord_l,ord_o; + struct order_pair *op; NEWDL(dl,n); dl->td = TD(ndl); d = dl->d; - if ( nd_isrlex ) - for ( i = 0; i < n; i++ ) - d[i] = (ndl[(n-1-i)/nd_epw+1]>>((nd_epw-((n-1-i)%nd_epw)-1)*nd_bpe)) - &((1<>((nd_epw-(i%nd_epw)-1)*nd_bpe)) - &((1<n; + op = nd_blockmask->order_pair; + for ( j = 0, s = 0; j < l; j++ ) { + ord_o = op[j].order; + ord_l = op[j].length; + if ( !ord_o ) + for ( i = 0; i < ord_l; i++ ) + d[s+i] = GET_EXP(ndl,s+ord_l-i-1); + else + for ( i = 0; i < ord_l; i++ ) + d[s+i] = GET_EXP(ndl,s+i); + s += ord_l; + } + } else { + if ( nd_isrlex ) + for ( i = 0; i < n; i++ ) + d[i] = GET_EXP(ndl,n-1-i); + else + for ( i = 0; i < n; i++ ) + d[i] = GET_EXP(ndl,i); + } return dl; } @@ -2137,20 +2262,30 @@ DP ndtodp(int mod,ND p) void ndl_print(unsigned int *dl) { int n; - int i; + int i,j,l,ord_o,ord_l,s,s0; + struct order_pair *op; n = nd_nvar; printf("<<"); - if ( nd_isrlex ) - for ( i = 0; i < n; i++ ) - printf(i==n-1?"%d":"%d,", - (dl[(n-1-i)/nd_epw+1]>>((nd_epw-((n-1-i)%nd_epw)-1)*nd_bpe)) - &((1<>((nd_epw-(i%nd_epw)-1)*nd_bpe)) - &((1<n; + op = nd_blockmask->order_pair; + for ( j = 0, s = s0 = 0; j < l; j++ ) { + ord_o = op[j].order; + ord_l = op[j].length; + if ( !ord_o ) + for ( i = 0, s0 += ord_l; i < ord_l; i++, s++ ) + printf(s==n-1?"%d":"%d,",GET_EXP(dl,s0-i-1)); + else + for ( i = 0; i < ord_l; i++, s++ ) + printf(s==n-1?"%d":"%d,",GET_EXP(dl,s)); + } + } else { + if ( nd_isrlex ) + for ( i = 0; i < n; i++ ) printf(i==n-1?"%d":"%d,",GET_EXP(dl,n-1-i)); + else + for ( i = 0; i < n; i++ ) printf(i==n-1?"%d":"%d,",GET_EXP(dl,i)); + } printf(">>"); } @@ -2274,12 +2409,12 @@ void ndv_dehomogenize(NDV p) len = p->len; newnvar = nd_nvar-1; - newwpd = newnvar/nd_epw+(newnvar%nd_epw?1:0); + newwpd = newnvar/nd_epw+(newnvar%nd_epw?1:0)+nd_exporigin; for ( m = BDY(p), i = 0; i < len; NMV_ADV(m), i++ ) ndl_dehomogenize(DL(m)); if ( newwpd != nd_wpd ) { - d = (unsigned int *)ALLOCA((newwpd+1)*sizeof(unsigned int)); - newadv = sizeof(struct oNMV)+newwpd*sizeof(unsigned int); + d = (unsigned int *)ALLOCA(newwpd*sizeof(unsigned int)); + newadv = sizeof(struct oNMV)+(newwpd-1)*sizeof(unsigned int); for ( m = r = BDY(p), i = 0; i < len; NMV_ADV(m), NEWADV(r), i++ ) { CQ(r) = CQ(m); ndl_copy(DL(m),d); ndl_copy(d,DL(r)); } @@ -2421,18 +2556,36 @@ unsigned int *nd_compute_bound(ND p) } l = nd_nvar+31; t = (unsigned int *)MALLOC_ATOMIC(l*sizeof(unsigned int)); - for ( i = 0; i < l; i++ ) t[i] = 0; - for ( i = 0; i < nd_nvar; i++ ) - t[i] = (d1[i/nd_epw+1]>>((nd_epw-(i%nd_epw)-1)*nd_bpe))&nd_mask0; + for ( i = 0; i < nd_nvar; i++ ) t[i] = GET_EXP(d1,i); for ( ; i < l; i++ ) t[i] = 0; return t; } void nd_setup_parameters() { - int i; + int i,n,elen; nd_epw = (sizeof(unsigned int)*8)/nd_bpe; - nd_wpd = nd_nvar/nd_epw+(nd_nvar%nd_epw?1:0); + elen = nd_nvar/nd_epw+(nd_nvar%nd_epw?1:0); + + switch ( nd_ord->id ) { + case 0: + nd_exporigin = 1; + break; + case 1: + /* block order */ + /* d[0]:weight d[1]:w0,...,d[nd_exporigin-1]:w(n-1) */ + nd_exporigin = nd_ord->ord.block.length+1; + break; + case 2: + error("nd_setup_parameters : matrix order is not supported yet."); + break; + } + nd_wpd = nd_exporigin+elen; + nd_epos = (EPOS)MALLOC_ATOMIC(nd_nvar*sizeof(struct oEPOS)); + for ( i = 0; i < nd_nvar; i++ ) { + nd_epos[i].i = nd_exporigin + i/nd_epw; + nd_epos[i].s = (nd_epw-(i%nd_epw)-1)*nd_bpe; + } if ( nd_bpe < 32 ) { nd_mask0 = (1< realloc nd_ps and pd_psq */ - ND_pairs nd_reconstruct(int mod,int trace,ND_pairs d) { int i,obpe,oadv,h; @@ -2458,9 +2610,11 @@ ND_pairs nd_reconstruct(int mod,int trace,ND_pairs d) RHist r; RHist *old_red; ND_pairs s0,s,t,prev_ndp_free_list; + EPOS oepos; obpe = nd_bpe; oadv = nmv_adv; + oepos = nd_epos; if ( obpe < 4 ) nd_bpe = 4; else if ( obpe < 6 ) nd_bpe = 6; else if ( obpe < 8 ) nd_bpe = 8; @@ -2474,16 +2628,16 @@ ND_pairs nd_reconstruct(int mod,int trace,ND_pairs d) _nm_free_list = 0; _ndp_free_list = 0; if ( mod != 0 ) - for ( i = nd_psn-1; i >= 0; i-- ) ndv_realloc(nd_ps[i],obpe,oadv); + for ( i = nd_psn-1; i >= 0; i-- ) ndv_realloc(nd_ps[i],obpe,oadv,oepos); if ( !mod || trace ) - for ( i = nd_psn-1; i >= 0; i-- ) ndv_realloc(nd_psq[i],obpe,oadv); + for ( i = nd_psn-1; i >= 0; i-- ) ndv_realloc(nd_psq[i],obpe,oadv,oepos); s0 = 0; for ( t = d; t; t = NEXT(t) ) { NEXTND_pairs(s0,s); s->i1 = t->i1; s->i2 = t->i2; SG(s) = SG(t); - ndl_reconstruct(obpe,LCM(t),LCM(s)); + ndl_reconstruct(obpe,oepos,LCM(t),LCM(s)); } old_red = (RHist *)ALLOCA(REDTAB_LEN*sizeof(RHist)); @@ -2496,7 +2650,7 @@ ND_pairs nd_reconstruct(int mod,int trace,ND_pairs d) NEWRHist(mr); mr->index = r->index; SG(mr) = SG(r); - ndl_reconstruct(obpe,DL(r),DL(mr)); + ndl_reconstruct(obpe,oepos,DL(r),DL(mr)); h = ndl_hash_value(DL(mr)); NEXT(mr) = nd_red[h]; nd_red[h] = mr; @@ -2505,7 +2659,7 @@ ND_pairs nd_reconstruct(int mod,int trace,ND_pairs d) old_red = 0; for ( i = 0; i < nd_psn; i++ ) { NEWRHist(r); SG(r) = SG(nd_psh[i]); - ndl_reconstruct(obpe,DL(nd_psh[i]),DL(r)); + ndl_reconstruct(obpe,oepos,DL(nd_psh[i]),DL(r)); nd_psh[i] = r; } if ( s0 ) NEXT(s) = 0; @@ -2523,9 +2677,11 @@ void nd_reconstruct_direct(int mod,NDV *ps,int len) RHist r; RHist *old_red; ND_pairs s0,s,t,prev_ndp_free_list; + EPOS oepos; obpe = nd_bpe; oadv = nmv_adv; + oepos = nd_epos; if ( obpe < 4 ) nd_bpe = 4; else if ( obpe < 6 ) nd_bpe = 6; else if ( obpe < 8 ) nd_bpe = 8; @@ -2537,8 +2693,7 @@ void nd_reconstruct_direct(int mod,NDV *ps,int len) prev_nm_free_list = _nm_free_list; prev_ndp_free_list = _ndp_free_list; _nm_free_list = 0; _ndp_free_list = 0; - if ( mod != 0 ) - for ( i = len-1; i >= 0; i-- ) ndv_realloc(ps[i],obpe,oadv); + for ( i = len-1; i >= 0; i-- ) ndv_realloc(ps[i],obpe,oadv,oepos); old_red = (RHist *)ALLOCA(REDTAB_LEN*sizeof(RHist)); for ( i = 0; i < REDTAB_LEN; i++ ) { old_red[i] = nd_red[i]; @@ -2549,7 +2704,7 @@ void nd_reconstruct_direct(int mod,NDV *ps,int len) NEWRHist(mr); mr->index = r->index; SG(mr) = SG(r); - ndl_reconstruct(obpe,DL(r),DL(mr)); + ndl_reconstruct(obpe,oepos,DL(r),DL(mr)); h = ndl_hash_value(DL(mr)); NEXT(mr) = nd_red[h]; nd_red[h] = mr; @@ -2561,56 +2716,61 @@ void nd_reconstruct_direct(int mod,NDV *ps,int len) GC_gcollect(); } -void ndl_reconstruct(int obpe,unsigned int *d,unsigned int *r) +void ndl_reconstruct(int obpe,EPOS oepos,unsigned int *d,unsigned int *r) { - int n,i,ei,oepw,cepw,cbpe; + int n,i,ei,oepw,omask0,j,s,ord_l,ord_o,l; + struct order_pair *op; +#define GET_EXP_OLD(d,a) (((d)[oepos[a].i]>>oepos[a].s)&omask0) +#define PUT_EXP_OLD(r,a,e) ((r)[oepos[a].i] |= ((e)<>((oepw-((n-1-i)%oepw)-1)*obpe)) - &((1<n; + op = nd_blockmask->order_pair; + for ( i = 1; i < nd_exporigin; i++ ) + r[i] = d[i]; + for ( j = 0, s = 0; j < l; j++ ) { + ord_o = op[j].order; + ord_l = op[j].length; + if ( !ord_o ) + for ( i = 0; i < ord_l; i++ ) { + ei = GET_EXP_OLD(d,s+ord_l-i-1); + PUT_EXP(r,s+ord_l-i-1,ei); + } + else + for ( i = 0; i < ord_l; i++ ) { + ei = GET_EXP_OLD(d,s+i); + PUT_EXP(r,s+i,ei); + } + s += ord_l; } - else - for ( i = 0; i < n; i++ ) { - ei = (d[i/oepw+1]>>((oepw-(i%oepw)-1)*obpe)) - &((1<id ) - error("nd_gr : unsupported order"); - nd_dcomp = 0; - switch ( ord->ord.simple ) { + switch ( ord->id ) { case 0: - nd_dcomp = 1; - nd_isrlex = 1; + switch ( ord->ord.simple ) { + case 0: + nd_dcomp = 1; + nd_isrlex = 1; + break; + case 1: + nd_dcomp = 1; + nd_isrlex = 0; + break; + case 2: + nd_dcomp = 0; + nd_isrlex = 0; + break; + default: + error("nd_gr : unsupported order"); + } break; case 1: - nd_dcomp = 1; + /* XXX */ + nd_dcomp = -1; nd_isrlex = 0; + nd_compare_function = ndl_block_compare; break; - case 9: - /* td1->td->rlex */ - nd_dcomp = -dp_nelim; - nd_isrlex = 1; + case 2: + error("nd_init_ord : matrix order is not supported yet."); break; - default: - error("nd_gr : unsupported order"); } + nd_ord = ord; } +BlockMask nd_create_blockmask(struct order_spec *ord) +{ + int n,i,j,s,l; + unsigned int *t; + BlockMask bm; + + if ( !ord->id ) + return 0; + n = ord->ord.block.length; + bm = (BlockMask)MALLOC(sizeof(struct oBlockMask)); + bm->n = n; + bm->order_pair = ord->ord.block.order_pair; + bm->mask = (unsigned int **)MALLOC(n*sizeof(unsigned int *)); + for ( i = 0, s = 0; i < n; i++ ) { + bm->mask[i] = t + = (unsigned int *)MALLOC_ATOMIC(nd_wpd*sizeof(unsigned int)); + for ( j = 0; j < nd_wpd; j++ ) t[j] = 0; + l = bm->order_pair[i].length; + for ( j = 0; j < l; j++, s++ ) PUT_EXP(t,s,nd_mask0); + } + return bm; +}