=================================================================== RCS file: /home/cvs/OpenXM_contrib2/asir2000/engine/_distm.c,v retrieving revision 1.2 retrieving revision 1.5 diff -u -p -r1.2 -r1.5 --- OpenXM_contrib2/asir2000/engine/_distm.c 2000/08/21 08:31:27 1.2 +++ OpenXM_contrib2/asir2000/engine/_distm.c 2000/12/05 06:59:16 1.5 @@ -23,7 +23,7 @@ * shall be made on your publication or presentation in any form of the * results obtained by use of the SOFTWARE. * (4) In the event that you modify the SOFTWARE, you shall notify FLL by - * e-mail at risa-admin@flab.fujitsu.co.jp of the detailed specification + * e-mail at risa-admin@sec.flab.fujitsu.co.jp of the detailed specification * for such modification or the source code of the modified part of the * SOFTWARE. * @@ -45,54 +45,32 @@ * DEVELOPER SHALL HAVE NO LIABILITY IN CONNECTION WITH THE USE, * PERFORMANCE OR NON-PERFORMANCE OF THE SOFTWARE. * - * $OpenXM: OpenXM_contrib2/asir2000/engine/_distm.c,v 1.1 2000/07/13 05:50:39 noro Exp $ + * $OpenXM: OpenXM_contrib2/asir2000/engine/_distm.c,v 1.4 2000/11/07 06:06:39 noro Exp $ */ #include "ca.h" #include "inline.h" -#define NV(p) ((p)->nv) -#define C(p) ((p)->c) -#if 0 -#define ITOS(p) (((unsigned int)(p))>>1) -#define STOI(i) ((P)((((unsigned int)(i))<<1)|1)) -#else -#define ITOS(p) (((unsigned int)(p))&0x7fffffff) -#define STOI(i) ((P)((unsigned int)(i)|0x80000000)) -#endif - extern int (*cmpdl)(); extern int do_weyl; +void dpto_dp(); void _dptodp(); -void adddl_dup(); +void _adddl_dup(); +void adddl_destructive(); void _mulmdm_dup(); void _free_dp(); void _comm_mulmd_dup(); void _weyl_mulmd_dup(); void _weyl_mulmmm_dup(); void _weyl_mulmdm_dup(); +void _comm_mulmd_tab(); +void _comm_mulmd_tab_destructive(); MP _mp_free_list; DP _dp_free_list; DL _dl_free_list; int current_dl_length; -#define _NEWDL_NOINIT(d,n) if ((n)!= current_dl_length){_dl_free_list=0; current_dl_length=(n);} if(!_dl_free_list)_DL_alloc(); (d)=_dl_free_list; _dl_free_list = *((DL *)_dl_free_list) -#define _NEWDL(d,n) if ((n)!= current_dl_length){_dl_free_list=0; current_dl_length=(n);} if(!_dl_free_list)_DL_alloc(); (d)=_dl_free_list; _dl_free_list = *((DL *)_dl_free_list); bzero((d),(((n)+1)*sizeof(int))) -#define _NEWMP(m) if(!_mp_free_list)_MP_alloc(); (m)=_mp_free_list; _mp_free_list = NEXT(_mp_free_list) -#define _MKDP(n,m,d) if(!_dp_free_list)_DP_alloc(); (d)=_dp_free_list; _dp_free_list = (DP)BDY(_dp_free_list); (d)->nv=(n); BDY(d)=(m) - -#define _NEXTMP(r,c) \ -if(!(r)){_NEWMP(r);(c)=(r);}else{_NEWMP(NEXT(c));(c)=NEXT(c);} - -#define _NEXTMP2(r,c,s) \ -if(!(r)){(c)=(r)=(s);}else{NEXT(c)=(s);(c)=(s);} - -#define FREEDL(m) *((DL *)m)=_dl_free_list; _dl_free_list=(m) -#define FREEMP(m) NEXT(m)=_mp_free_list; _mp_free_list=(m) -#define FREEDP(m) BDY(m)=(MP)_dp_free_list; _dp_free_list=(m) - - void _DL_alloc() { int *p; @@ -159,9 +137,9 @@ DP p1,p2,*pr; if ( t ) { _NEXTMP2(mr0,mr,s); C(mr) = STOI(t); } else { - FREEDL(s->dl); FREEMP(s); + _FREEDL(s->dl); _FREEMP(s); } - s = m2; m2 = NEXT(m2); FREEDL(s->dl); FREEMP(s); + s = m2; m2 = NEXT(m2); _FREEDL(s->dl); _FREEMP(s); break; case 1: s = m1; m1 = NEXT(m1); _NEXTMP2(mr0,mr,s); @@ -188,7 +166,7 @@ DP p1,p2,*pr; _MKDP(NV(p1),mr0,*pr); if ( *pr ) (*pr)->sugar = MAX(p1->sugar,p2->sugar); - FREEDP(p1); FREEDP(p2); + _FREEDP(p1); _FREEDP(p2); } } @@ -249,16 +227,16 @@ DP p1,p2,*pr; if ( !p1 || !p2 ) *pr = 0; else { - for ( m = BDY(p2), l = 0; m; m = NEXT(m), l++ ); + for ( m = BDY(p1), l = 0; m; m = NEXT(m), l++ ); if ( l > wlen ) { if ( w ) GC_free(w); w = (MP *)MALLOC(l*sizeof(MP)); wlen = l; } - for ( m = BDY(p2), i = 0; i < l; m = NEXT(m), i++ ) + for ( m = BDY(p1), i = 0; i < l; m = NEXT(m), i++ ) w[i] = m; for ( s = 0, i = l-1; i >= 0; i-- ) { - _weyl_mulmdm_dup(mod,p1,w[i],&t); _addmd_destructive(mod,s,t,&u); s = u; + _weyl_mulmdm_dup(mod,w[i],p2,&t); _addmd_destructive(mod,s,t,&u); s = u; } bzero(w,l*sizeof(MP)); *pr = s; @@ -295,17 +273,22 @@ DP *pr; } } -void _weyl_mulmdm_dup(mod,p,m0,pr) +void _weyl_mulmmm_dup_bug(); + +void _weyl_mulmdm_dup(mod,m0,p,pr) int mod; -DP p; MP m0; +DP p; DP *pr; { DP r,t,t1; MP m; - int n,l,i; - static MP *w; + DL d0; + int n,n2,l,i,j,tlen; + static MP *w,*psum; + static struct cdlm *tab; static int wlen; + static int rtlen; if ( !p ) *pr = 0; @@ -318,143 +301,238 @@ DP *pr; } for ( m = BDY(p), i = 0; i < l; m = NEXT(m), i++ ) w[i] = m; - for ( r = 0, i = l-1, n = NV(p); i >= 0; i-- ) { - _weyl_mulmmm_dup(mod,w[i],m0,n,&t); - _addmd_destructive(mod,r,t,&t1); r = t1; + n = NV(p); n2 = n>>1; + d0 = m0->dl; + + for ( i = 0, tlen = 1; i < n2; i++ ) + tlen *= d0->d[n2+i]+1; + if ( tlen > rtlen ) { + if ( tab ) GC_free(tab); + if ( psum ) GC_free(psum); + rtlen = tlen; + tab = (struct cdlm *)MALLOC(rtlen*sizeof(struct cdlm)); + psum = (MP *)MALLOC(rtlen*sizeof(MP)); } - bzero(w,l*sizeof(MP)); + bzero(psum,tlen*sizeof(MP)); + for ( i = l-1; i >= 0; i-- ) { + bzero(tab,tlen*sizeof(struct cdlm)); + _weyl_mulmmm_dup(mod,m0,w[i],n,tab,tlen); + for ( j = 0; j < tlen; j++ ) { + if ( tab[j].c ) { + _NEWMP(m); m->dl = tab[j].d; + C(m) = STOI(tab[j].c); NEXT(m) = psum[j]; + psum[j] = m; + } + } + } + for ( j = tlen-1, r = 0; j >= 0; j-- ) + if ( psum[j] ) { + _MKDP(n,psum[j],t); _addmd_destructive(mod,r,t,&t1); r = t1; + } if ( r ) r->sugar = p->sugar + m0->dl->td; *pr = r; } } + /* m0 = x0^d0*x1^d1*... * dx0^d(n/2)*dx1^d(n/2+1)*... */ -void _weyl_mulmmm_dup(mod,m0,m1,n,pr) +void _weyl_mulmmm_dup(mod,m0,m1,n,rtab,rtablen) int mod; MP m0,m1; int n; -DP *pr; +struct cdlm *rtab; +int rtablen; { MP m,mr,mr0; DP r,t,t1; int c,c0,c1,cc; - DL d,d0,d1; - int i,j,a,b,k,l,n2,s,min,h; - static int *tab; + DL d,d0,d1,dt; + int i,j,a,b,k,l,n2,s,min,h,curlen; + struct cdlm *p; + static int *ctab; + static struct cdlm *tab; static int tablen; + static struct cdlm *tmptab; + static int tmptablen; - if ( !m0 || !m1 ) - *pr = 0; - else { - c0 = ITOS(C(m0)); c1 = ITOS(C(m1)); - c = dmar(c0,c1,0,mod); - d0 = m0->dl; d1 = m1->dl; - n2 = n>>1; + if ( !m0 || !m1 ) { + rtab[0].c = 0; + rtab[0].d = 0; + return; + } + c0 = ITOS(C(m0)); c1 = ITOS(C(m1)); + c = dmar(c0,c1,0,mod); + d0 = m0->dl; d1 = m1->dl; + n2 = n>>1; + curlen = 1; - _NEWDL(d,n); - if ( n & 1 ) - /* offset of h-degree */ - d->td = d->d[n-1] = d0->d[n-1]+d1->d[n-1]; - else - d->td = 0; - _NEWMP(mr); mr->c = STOI(c); mr->dl = d; NEXT(mr) = 0; - _MKDP(n,mr,r); r->sugar = d->td; + _NEWDL(d,n); + if ( n & 1 ) + /* offset of h-degree */ + d->td = d->d[n-1] = d0->d[n-1]+d1->d[n-1]; + else + d->td = 0; + rtab[0].c = c; + rtab[0].d = d; - /* homogenized computation; dx-xd=h^2 */ - for ( i = 0; i < n2; i++ ) { - a = d0->d[i]; b = d1->d[n2+i]; - k = d0->d[n2+i]; l = d1->d[i]; - /* degree of xi^a*(Di^k*xi^l)*Di^b */ - s = a+k+l+b; - /* compute xi^a*(Di^k*xi^l)*Di^b */ - min = MIN(k,l); + if ( rtablen > tmptablen ) { + if ( tmptab ) GC_free(tmptab); + tmptab = (struct cdlm *)MALLOC(rtablen*sizeof(struct cdlm)); + tmptablen = rtablen; + } - if ( min+1 > tablen ) { - if ( tab ) GC_free(tab); - tab = (int *)MALLOC((min+1)*sizeof(int)); - tablen = min+1; - } - mkwcm(k,l,mod,tab); - if ( n & 1 ) - for ( mr0 = 0, j = 0; j <= min; j++ ) { - _NEXTMP(mr0,mr); _NEWDL(d,n); - d->d[i] = l-j+a; d->d[n2+i] = k-j+b; - d->td = s; - d->d[n-1] = s-(d->d[i]+d->d[n2+i]); - mr->c = STOI(tab[j]); mr->dl = d; + for ( i = 0; i < n2; i++ ) { + a = d0->d[i]; b = d1->d[n2+i]; + k = d0->d[n2+i]; l = d1->d[i]; + if ( !k || !l ) { + a += l; + b += k; + s = a+b; + for ( j = 0, p = rtab; j < curlen; j++, p++ ) { + if ( p->c ) { + dt = p->d; + dt->d[i] = a; + dt->d[n2+i] = b; + dt->td += s; } - else - for ( mr0 = 0, s = 0, j = 0; j <= min; j++ ) { - _NEXTMP(mr0,mr); _NEWDL(d,n); - d->d[i] = l-j+a; d->d[n2+i] = k-j+b; - d->td = d->d[i]+d->d[n2+i]; /* XXX */ - s = MAX(s,d->td); /* XXX */ - mr->c = STOI(tab[j]); mr->dl = d; - } - bzero(tab,(min+1)*sizeof(int)); - if ( mr0 ) - NEXT(mr) = 0; - _MKDP(n,mr0,t); - if ( t ) - t->sugar = s; - _comm_mulmd_dup(mod,r,t,&t1); - _free_dp(r); _free_dp(t); - r = t1; + } + curlen *= k+1; + continue; } - *pr = r; + if ( k+1 > tablen ) { + if ( tab ) GC_free(tab); + if ( ctab ) GC_free(ctab); + tablen = k+1; + tab = (struct cdlm *)MALLOC(tablen*sizeof(struct cdlm)); + ctab = (int *)MALLOC(tablen*sizeof(int)); + } + /* degree of xi^a*(Di^k*xi^l)*Di^b */ + s = a+k+l+b; + /* compute xi^a*(Di^k*xi^l)*Di^b */ + min = MIN(k,l); + mkwcm(k,l,mod,ctab); + bzero(tab,(k+1)*sizeof(struct cdlm)); + /* n&1 != 0 => homogenized computation; dx-xd=h^2 */ + if ( n & 1 ) + for ( j = 0; j <= min; j++ ) { + _NEWDL(d,n); + d->d[i] = l-j+a; d->d[n2+i] = k-j+b; + d->td = s; + d->d[n-1] = s-(d->d[i]+d->d[n2+i]); + tab[j].d = d; + tab[j].c = ctab[j]; + } + else + for ( j = 0; j <= min; j++ ) { + _NEWDL(d,n); + d->d[i] = l-j+a; d->d[n2+i] = k-j+b; + d->td = d->d[i]+d->d[n2+i]; /* XXX */ + tab[j].d = d; + tab[j].c = ctab[j]; + } +#if 0 + _comm_mulmd_tab(mod,n,rtab,curlen,tab,k+1,tmptab); + for ( j = 0; j < curlen; j++ ) + if ( rtab[j].d ) { _FREEDL(rtab[j].d); } + for ( j = 0; j <= min; j++ ) + if ( tab[j].d ) { _FREEDL(tab[j].d); } + curlen *= k+1; + bcopy(tmptab,rtab,curlen*sizeof(struct cdlm)); +#else + _comm_mulmd_tab_destructive(mod,n,rtab,curlen,tab,k+1); + for ( j = 0; j <= min; j++ ) + if ( tab[j].d ) { _FREEDL(tab[j].d); } + curlen *= k+1; +#endif } } -void _dp_red_mod_destructive(p1,p2,mod,rp) -DP p1,p2; +/* direct product of two cdlm tables + rt[] = [ + t[0]*t1[0],...,t[n-1]*t1[0], + t[0]*t1[1],...,t[n-1]*t1[1], + ... + t[0]*t1[n1-1],...,t[n-1]*t1[n1-1] + ] +*/ + +void _comm_mulmd_tab(mod,nv,t,n,t1,n1,rt) int mod; -DP *rp; +int nv; +struct cdlm *t; +int n; +struct cdlm *t1; +int n1; +struct cdlm *rt; { - int i,n; - DL d1,d2,d; - MP m; - DP t,s; - int c,c1; + int i,j; + struct cdlm *p; + int c; + DL d; - n = p1->nv; d1 = BDY(p1)->dl; d2 = BDY(p2)->dl; - _NEWDL(d,n); d->td = d1->td - d2->td; - for ( i = 0; i < n; i++ ) - d->d[i] = d1->d[i]-d2->d[i]; - c = invm(ITOS(BDY(p2)->c),mod); c1 = dmar(c,ITOS(BDY(p1)->c),0,mod); - _NEWMP(m); m->dl = d; m->c = STOI(mod-c1); NEXT(m) = 0; - _MKDP(n,m,s); s->sugar = d->td; - _mulmd_dup(mod,s,p2,&t); _free_dp(s); - _addmd_destructive(mod,p1,t,rp); + bzero(rt,n*n1*sizeof(struct cdlm)); + for ( j = 0, p = rt; j < n1; j++ ) { + c = t1[j].c; + d = t1[j].d; + if ( !c ) + break; + for ( i = 0; i < n; i++, p++ ) { + if ( t[i].c ) { + p->c = dmar(t[i].c,c,0,mod); + _adddl_dup(nv,t[i].d,d,&p->d); + } + } + } } -void _dp_sp_mod_dup(p1,p2,mod,rp) -DP p1,p2; +void _comm_mulmd_tab_destructive(mod,nv,t,n,t1,n1) int mod; -DP *rp; +int nv; +struct cdlm *t; +int n; +struct cdlm *t1; +int n1; { - int i,n,td; - int *w; - DL d1,d2,d; - MP m; - DP t,s,u; + int i,j; + struct cdlm *p; + int c; + DL d; - n = p1->nv; d1 = BDY(p1)->dl; d2 = BDY(p2)->dl; - w = (int *)ALLOCA(n*sizeof(int)); - for ( i = 0, td = 0; i < n; i++ ) { - w[i] = MAX(d1->d[i],d2->d[i]); td += w[i]; + for ( j = 1, p = t+n; j < n1; j++ ) { + c = t1[j].c; + d = t1[j].d; + if ( !c ) + break; + for ( i = 0; i < n; i++, p++ ) { + if ( t[i].c ) { + p->c = dmar(t[i].c,c,0,mod); + _adddl_dup(nv,t[i].d,d,&p->d); + } + } } - _NEWDL(d,n); d->td = td - d1->td; + c = t1[0].c; + d = t1[0].d; + for ( i = 0, p = t; i < n; i++, p++ ) + if ( t[i].c ) { + p->c = dmar(t[i].c,c,0,mod); + /* t[i].d += d */ + adddl_destructive(nv,t[i].d,d); + } +} + +void dlto_dl(d,dr) +DL d; +DL *dr; +{ + int i,n; + DL t; + + n = current_dl_length; + _NEWDL(t,n); *dr = t; + t->td = d->td; for ( i = 0; i < n; i++ ) - d->d[i] = w[i] - d1->d[i]; - _NEWMP(m); m->dl = d; m->c = BDY(p2)->c; NEXT(m) = 0; - _MKDP(n,m,s); s->sugar = d->td; _mulmd_dup(mod,s,p1,&t); _free_dp(s); - _NEWDL(d,n); d->td = td - d2->td; - for ( i = 0; i < n; i++ ) - d->d[i] = w[i] - d2->d[i]; - _NEWMP(m); m->dl = d; m->c = STOI(mod - ITOS(BDY(p1)->c)); NEXT(m) = 0; - _MKDP(n,m,s); s->sugar = d->td; _mulmd_dup(mod,s,p2,&u); _free_dp(s); - _addmd_destructive(mod,t,u,rp); + t->d[i] = d->d[i]; } void _dltodl(d,dr) @@ -471,7 +549,7 @@ DL *dr; t->d[i] = d->d[i]; } -void adddl_dup(n,d1,d2,dr) +void _adddl_dup(n,d1,d2,dr) int n; DL d1,d2; DL *dr; @@ -479,12 +557,22 @@ DL *dr; DL dt; int i; - _NEWDL(dt,n); *dr = dt; + _NEWDL(dt,n); + *dr = dt; dt->td = d1->td + d2->td; for ( i = 0; i < n; i++ ) dt->d[i] = d1->d[i]+d2->d[i]; } +void _free_dlarray(a,n) +DL *a; +int n; +{ + int i; + + for ( i = 0; i < n; i++ ) { _FREEDL(a[i]); } +} + void _free_dp(f) DP f; { @@ -494,11 +582,32 @@ DP f; return; m = f->body; while ( m ) { - s = m; m = NEXT(m); FREEDL(s->dl); FREEMP(s); + s = m; m = NEXT(m); _FREEDL(s->dl); _FREEMP(s); } - FREEDP(f); + _FREEDP(f); } +void dpto_dp(p,r) +DP p; +DP *r; +{ + MP m,mr0,mr; + + if ( !p ) + *r = 0; + else { + current_dl_length = NV(p); + for ( m = BDY(p), mr0 = 0; m; m = NEXT(m) ) { + _NEXTMP(mr0,mr); + dlto_dl(m->dl,&mr->dl); + mr->c = m->c; + } + NEXT(mr) = 0; + _MKDP(p->nv,mr0,*r); + (*r)->sugar = p->sugar; + } +} + void _dptodp(p,r) DP p; DP *r; @@ -519,61 +628,55 @@ DP *r; } } -void _dp_nf_mod_destructive(b,g,ps,mod,full,rp) -NODE b; -DP g; -DP *ps; -int mod,full; -DP *rp; +/* + * destructive merge of two list + * + * p1, p2 : list of DL + * return : a merged list + */ + +NODE _symb_merge(m1,m2,n) +NODE m1,m2; +int n; { - DP u,p,d,s,t; - NODE l; - MP m,mr,mrd; - int sugar,psugar,n,h_reducible,i; + NODE top,prev,cur,m,t; - if ( !g ) { - *rp = 0; return; - } - sugar = g->sugar; - n = g->nv; - for ( d = 0; g; ) { - for ( h_reducible = 0, l = b; l; l = NEXT(l) ) { - if ( dp_redble(g,p = ps[(int)BDY(l)]) ) { - h_reducible = 1; - psugar = (BDY(g)->dl->td - BDY(p)->dl->td) + p->sugar; - _dp_red_mod_destructive(g,p,mod,&u); g = u; - sugar = MAX(sugar,psugar); - if ( !g ) { - if ( d ) - d->sugar = sugar; - _dptodp(d,rp); _free_dp(d); return; - } + if ( !m1 ) + return m2; + else if ( !m2 ) + return m1; + else { + switch ( (*cmpdl)(n,(DL)BDY(m1),(DL)BDY(m2)) ) { + case 0: + top = m1; _FREEDL((DL)BDY(m2)); m = NEXT(m2); break; - } + case 1: + top = m1; m = m2; + break; + case -1: + top = m2; m = m1; + break; } - if ( !h_reducible ) { - /* head term is not reducible */ - if ( !full ) { - if ( g ) - g->sugar = sugar; - _dptodp(g,rp); _free_dp(g); return; - } else { - m = BDY(g); - if ( NEXT(m) ) { - BDY(g) = NEXT(m); NEXT(m) = 0; - } else { - FREEDP(g); g = 0; - } - if ( d ) { - for ( mrd = BDY(d); NEXT(mrd); mrd = NEXT(mrd) ); - NEXT(mrd) = m; - } else { - _MKDP(n,m,d); - } + prev = top; cur = NEXT(top); + /* BDY(prev) > BDY(m) always holds */ + while ( cur && m ) { + switch ( (*cmpdl)(n,(DL)BDY(cur),(DL)BDY(m)) ) { + case 0: + _FREEDL(BDY(m)); m = NEXT(m); + prev = cur; cur = NEXT(cur); + break; + case 1: + t = NEXT(cur); NEXT(cur) = m; m = t; + prev = cur; cur = NEXT(cur); + break; + case -1: + NEXT(prev) = m; m = cur; + prev = NEXT(prev); cur = NEXT(prev); + break; } } + if ( !cur ) + NEXT(prev) = m; + return top; } - if ( d ) - d->sugar = sugar; - _dptodp(d,rp); _free_dp(d); }