📄 mainilutp.c

📁 数学算法的实现库。可以实现常见的线性计算。
💻 C
📖 第 1 页 / 共 2 页
字号:
上一页 12
    /* ------------------------------------------------------------------- */    fprintf(fo,"ILUTP     |");    /* set up paramaters for ILUTP */    /* n       = integer. The row dimension of the matrix A. The matrix      */    /* a,ja,ia = matrix stored in Compressed Sparse Row format.              */    /* lfil    = integer. The fill-in parameter. Each row of L and each row                 of U will have a maximum of lfil elements (excluding the 		 diagonal element). lfil must be .ge. 0.		 ** WARNING: THE MEANING OF LFIL HAS CHANGED WITH RESPECT TO		 EARLIER VERSIONS.                                           */    ipar[0]=n;    /* droptol = real*8. Sets the threshold for dropping small terms in the                 factorization. See below for details on dropping strategy.  */    fpar[0]=DROP_TOL;    /* permtol = tolerance ratio used to  determne whether or not to permute                 two columns.  At step i columns i and j are permuted when                  abs(a(i,j))*permtol .gt. abs(a(i,i))                 [0 --> never permute; good values 0.1 to 0.01]              */    fpar[1]=PERM_TOL;    /* mbloc   = if desired, permuting can be done only within the diagonal                 blocks of size mbloc. Useful for PDE problems with several                 degrees of freedom.. If feature not wanted take mbloc=n.    */    ipar[1]=n;    /* iwk     = integer. The lengths of arrays alu and jlu. If the arrays                 are not big enough to store the ILU factorizations, ilut		 will stop with an error message.                            */    ipar[2]=ELBOW*nz;    /* On return:       ===========       alu,jlu = matrix stored in Modified Sparse Row (MSR) format containing                 the L and U factors together. The diagonal (stored in		 alu(1:n) ) is inverted. Each i-th row of the alu,jlu matrix		 contains the i-th row of L (excluding the diagonal entry=1)		 followed by the i-th row of U.                              */    ilutmat.ja=(int *)  MALLOC((size_t)ipar[2]*sizeof(int),  "mainilutp:ilutmat.ja");    ilutmat.a =(FLOAT *)MALLOC((size_t)ipar[2]*sizeof(FLOAT),"mainilutp:ilutmat.a");    /* ju      = integer array of length n containing the pointers to                 the beginning of each row of U in the matrix alu,jlu.       */    ilutmat.ia=(int *)  MALLOC((size_t)(n+1)*sizeof(int),"mainilutp:ilutmat.ia");    /* iperm   = contains the permutation arrays.                  iperm(1:n) = old numbers of unknowns                 iperm(n+1:2*n) = reverse permutation = new unknowns.        */    invperm=(int *)MALLOC(2*(size_t)n*sizeof(int),"mainilutp:invperm");    /* ierr    = integer. Error message with the following meaning.                 ierr  = 0    --> successful return.		 ierr .gt. 0  --> zero pivot encountered at step number ierr.		 ierr  = -1   --> Error. input matrix may be wrong.                                  (The elimination process has generated a				  row in L or U whose length is .gt.  n.)                 ierr  = -2   --> The matrix L overflows the array alu.		 ierr  = -3   --> The matrix U overflows the array alu.		 ierr  = -4   --> Illegal value for lfil.		 ierr  = -5   --> zero row encountered.                      */    ipar[3]=0;    /* work arrays:       =============       jw      = integer work array of length 5*n.       w       = real work array of length n                                 */    ws=(int *)  MALLOC(5*(size_t)n*sizeof(int),"mainilutp:ws");    w =(FLOAT *)MALLOC((size_t)n*sizeof(FLOAT),"mainilutp:w");    printf("ILUTP2 PARAMETERS:\n");    printf("   droptol=%8.1e\n",fpar[0]);    printf("   permtol=%8.1e\n",fpar[1]);    printf("   lfil   =%d\n",   ipar[0]);    printf("   elbow space factor=%4d\n",  ELBOW);    /* perform ILUTP decomposition */    evaluate_time(&time_start,&systime);    ILUTP(&n,A.a,A.ja,A.ia,ipar,fpar,fpar+1,ipar+1,	  ilutmat.a,ilutmat.ja,ilutmat.ia,ipar+2,w,ws,invperm,ipar+3);    free(w);    free(ws);     for (i=0; i<A.ia[n]-1; i++)        A.ja[i] = invperm[A.ja[i]-1];     evaluate_time(&time_stop,&systime);    secnds=time_stop-time_start;    fprintf(fo,"   |");    nc=0;    for (i=0; i<n; i++)        nc+=ilutmat.ia[i]-ilutmat.ja[i];    tmp0=(1.0*nc)/n+.5;    tmp3=0;    for (i=0; i<n; i++)        tmp3+=ilutmat.ja[i+1]-ilutmat.ia[i];    tmp=(1.0*tmp3)/n;    printf("\nfill-in L: %5d(%4.1fav.), U: %5d(%4.1fav.), totally %5d(%4.1fav.)\n",	   nc,(1.0*nc)/n,tmp3,(1.0*tmp3)/n,tmp3+nc+n,(1.0*(tmp3+nc+n))/n);    printf("fill-in factor: %5.1f\n",(1.0*(tmp3+nc+n))/nz);    fprintf(fo,"%5.1f|",(1.0*(tmp3+nc+n))/nz);    printf("time: %8.1e [sec]\n\n",(double)secnds);    fprintf(fo,"%7.1le|",(double)secnds+secndsprep);    fflush(stdout);    switch (ipar[3])    {           case  0: /* perfect! */	            break;           case -1: /* Error. input matrix may be wrong.                       (The elimination process has generated a			row in L or U whose length is .gt.  n.) */	            printf("Error. input matrix may be wrong\n");		    break;           case -2: /* The matrix L overflows the array alu */	            printf("The matrix L overflows the array alu\n");		    break;           case -3: /* The matrix U overflows the array alu */	            printf("The matrix U overflows the array alu\n");		    break;           case -4: /* Illegal value for lfil */	            printf("Illegal value for lfil\n");		    break;           case -5: /* zero row encountered */	            printf("zero row encountered\n");		    break;           default: /* zero pivot encountered at step number ierr */	            printf("zero pivot encountered at step number %d\n",ipar[2]);		    break;    } /* end switch */    if (ipar[3]!=0)      {	printf("Iterative solver(s) cannot be applied\n\n");	fprintf(fo,"Iterative solver(s) cannot be applied\n");	fflush(fo);	exit(0);      }    /* --------------------   apply preconditioner   --------------------- */    /* initial solution */    if (rhstyp[1]=='G' || rhstyp[1]=='g') {       j=nrhs*n;       if (rhstyp[0]=='M' || rhstyp[0]=='m')	  j=n;       for (i=0; i<n; i++,j++)	   sol[i]=rhs[j];    }    else      for (i=0; i<n; i++)#if defined _DOUBLE_REAL_ || defined _SINGLE_REAL_	  sol[i]=0;#else	  sol[i].r=sol[i].i=0;#endif        // rescale initial solution    for (i=0; i<n; i++) {  #if defined _DOUBLE_REAL_ || defined _SINGLE_REAL_        sol[i]/=colscale[i];#else	val=sol[i].r;	nrm=1.0/(colscale[i].r*colscale[i].r+colscale[i].i*colscale[i].i);	sol[i].r=( val*colscale[i].r+sol[i].i*colscale[i].i)*nrm;	sol[i].i=(-val*colscale[i].i+sol[i].i*colscale[i].r)*nrm;#endif    } // end for i    // reorder solution    for (i=0; i<n; i++)         param.dbuff[invq[i]-1]=sol[i];    i=1;    COPY(&n,param.dbuff,&i,sol,&i);        /* init solver */    ipar[0]=0;    /* right preconditioning */    ipar[1]=2;    if (ipar[1]==0)      printf("no preconditioning\n");    else if (ipar[1]==1)      printf("left preconditioning\n");    else if (ipar[1]==2)      printf("right preconditioning\n");    else if (ipar[1]==3)      printf("both sides preconditioning\n");        /* stopping criteria, residual norm */    ipar[2]=3;    /* number of restart length for GMRES,FOM,... */    ipar[4]=30;    /* maximum number of iteration steps */    ipar[5]=1.1*n+10;    ipar[5]=MIN(ipar[5],MAX_IT);    /* init with zeros */    ipar[6]=ipar[7]=ipar[8]=ipar[9]=ipar[10]=ipar[11]=ipar[12]=ipar[13]=0;    /* relative error tolerance */    fpar[0]=1e-8;    /* absolute error tolerance */    fpar[1]=0;    /* init with zeros */    fpar[2]=fpar[3]=fpar[4]=fpar[5]=fpar[6]=fpar[7]=fpar[8]=fpar[9]=fpar[10]=0;        /* allocate memory for iterative solver depending on our choice */    i=ipar[4];    switch (SOLVER) {    case  1:   /* cg */      i=5*n;      printf("use CG as iterative solver\n");      break;    case  2:   /* cgnr */      i=5*n;      printf("use CGNR as iterative solver\n");      break;    case  3:   /* bcg */      printf("use BCG as iterative solver\n");      i=7*n;      break;    case  4:   /* dbcg */      i=11*n;      printf("use DBCG as iterative solver\n");      break;    case  5:   /* bcgstab */      i=8*n;      printf("use BCGSTAB as iterative solver\n");      break;    case  6:   /* tfqmr */      i=11*n;      printf("use TFQMR as iterative solver\n");      break;    case  7:   /* fom */      i=(n+3)*(i+2)+(i+1)*i/2;      printf("use FOM(%d) as iterative solver\n",ipar[4]);      break;    case  8:   /* gmres */      i=(n+3)*(i+2)+(i+1)*i/2;      printf("use GMRES(%d) as iterative solver\n",ipar[4]);      break;    case  9:   /* fgmres */      i=2*n*(i+1)+((i+1)*i)/2+3*i+2;      printf("use FGMRES(%d) as iterative solver\n",ipar[4]);      break;    case 10:   /* dqgmres */      i=n+(i+1)*(2*n+4);      printf("use DQGMRES(%d) as iterative solver\n",ipar[4]);      break;    } /* end switch */    w=(FLOAT *)MALLOC((size_t)i*sizeof(FLOAT),"main:w");     ipar[3]=i;    // init buffer for column sumns    rbuff=(REALS *)dbuff;    for (i=0; i<n; i++)       rbuff[i]=0.0;    // val = maximum row sum    val=0.0;    for (i=0; i<n; i++) {        j=1;	k=A.ia[i+1]-A.ia[i];	val=MAX(val,ASUM(&k,A.a+A.ia[i]-1,&j));	for (j=A.ia[i]-1; j<A.ia[i+1]-1; j++) {	  k=A.ja[j]-1;	  rbuff[k]+=FABS(A.a[j]);	} // end for j    } // end for i    vb=0;    for (i=0; i<n; i++)      vb=MAX(vb,rbuff[i]);    fpar[11]=sqrt((double)val*vb);        /* start iterative solver */    evaluate_time(&time_start,&systime);    flag=-1;    while (flag) {      /* which solver do we use? */      switch (SOLVER) {/*      case  1:   // cg 	PCG(&n,rhs,sol,ipar,fpar,w);	break;      case  2:   // cgnr	cgnr(&n,rhs,sol,ipar,fpar,w);	break;      case  3:   // bcg	bcg(&n,rhs,sol,ipar,fpar,w);	break;      case  4:   // dbcg 	dbcg(&n,rhs,sol,ipar,fpar,w);	break;      case  5:   // bcgstab	bcgstab(&n,rhs,sol,ipar,fpar,w);	break;      case  6:   // tfqmr	tfqmr(&n,rhs,sol,ipar,fpar,w);	break;      case  7:   // fom	fom(&n,rhs,sol,ipar,fpar,w);	break;*/      case  8:   // gmres	GMRES(&n,rhs,sol,ipar,fpar,w);	break;      case  9:   // fgmres	FGMRES(&n,rhs,sol,ipar,fpar,w);	break;/*      case 10:   // dqgmres	dqgmres(&n,rhs,sol,ipar,fpar,w);	break;*/      } /* end switch */      /* what is needed for the solver? */      w--;      switch (ipar[0]) {      case  1:   // apply matrix vector multiplication	// printf("apply matrix vector multiplication\n");fflush(stdout);	CSRMATVEC(A,w+ipar[7],w+ipar[8]);	break;      case  2:   /* apply transposed matrix vector multiplication */	CSRMATTVEC(A,w+ipar[7],w+ipar[8]);	break;      case  3:   /* (no) left preconditioner solver */	i=1;	if (ipar[1]==1) {	   LUSOL(&n, w+ipar[7],param.dbuff, ilutmat.a,ilutmat.ja,ilutmat.ia);	   w+=ipar[8]-1;	   for (i=0; i<n; i++)	       w[invperm[i]]=param.dbuff[i];	   w-=ipar[8]-1;	} // end if	else	   COPY(&n,w+ipar[7],&i,w+ipar[8],&i);	break;      case  4:   /* (no) left preconditioner transposed solver */	i=1;	if (ipar[1]==1) {	   w+=ipar[7]-1;	   for (i=0; i<n; i++)	       param.dbuff[i]=w[invperm[i]];	   w-=ipar[7]-1;	   LUTSOL(&n, param.dbuff,w+ipar[8], ilutmat.a,ilutmat.ja,ilutmat.ia);	} // end if	else	   COPY(&n,w+ipar[7],&i,w+ipar[8],&i);	break;      case  5:   /* (no) right preconditioner solver */	i=1;	if (ipar[1]==2) {	   // printf("apply right preconditioning\n");fflush(stdout);	   LUSOL(&n, w+ipar[7],param.dbuff, ilutmat.a,ilutmat.ja,ilutmat.ia);	   w+=ipar[8]-1;	   for (i=0; i<n; i++)	       w[invperm[i]]=param.dbuff[i];	   w-=ipar[8]-1;	} // end if	else	   COPY(&n,w+ipar[7],&i,w+ipar[8],&i);	break;      case  6:   /* (no) right preconditioner transposed solver */	i=1;	if (ipar[1]==2) {	   w+=ipar[7]-1;	   for (i=0; i<n; i++)	       param.dbuff[i]=w[invperm[i]];	   w-=ipar[7]-1;	   LUTSOL(&n, param.dbuff,w+ipar[8], ilutmat.a,ilutmat.ja,ilutmat.ia);	} // end if	else	   COPY(&n,w+ipar[7],&i,w+ipar[8],&i);	break;      case 10:   /* call my own stopping test routine */	break;      default:   /* the iterative solver terminated with code=ipar[0] */	flag=0;	break;      } /* end switch */      w++;    } /* end while */    // reorder solution back    for (i=0; i<n; i++)         param.dbuff[i]=sol[invq[i]-1];    i=1;    COPY(&n,param.dbuff,&i,sol,&i);    // rescale solution    for (i=0; i<n; i++) {  #if defined _DOUBLE_REAL_ || defined _SINGLE_REAL_        sol[i]*=colscale[i];#else	val=sol[i].r;	sol[i].r=val*colscale[i].r-sol[i].i*colscale[i].i;	sol[i].i=val*colscale[i].i+sol[i].i*colscale[i].r;#endif    } // end for i    evaluate_time(&time_stop,&systime);    secnds=time_stop-time_start;    /* why did the iterative solver stop? */    switch (ipar[0]) {    case  0:  /* everything is fine */      break;    case -1:  /* too many iterations */      printf("number of iteration steps exceeds its limit\n");      break;    case -2:  /* not enough work space */      printf("not enough work space provided\n");      break;    case -3:  /* not enough work space */      printf("algorithm breaks down ");      /* Arnoldi-type solvers */      if (SOLVER>=7) {	switch (ipar[11]) {	case -1:  	  printf("due to zero input vector");	  break;	case -2:  	  printf("since input vector contains abnormal numbers");	  break;	case -3:  	  printf("since input vector is a linear combination of others");	  break;	case -4:  	  printf("since triangular system in GMRES/FOM/etc. has null rank");	  break;	} /* end switch */      } /* end if */      printf("\n");      break;    default:  /* unknown */      printf("solver exited with error code %d\n",ipar[0]);      break;    } /* end switch */    printf("number of iteration steps: %d\n",ipar[6]);    printf("time: %8.1le [sec]\n\n", (double)secnds);    if (ipar[6]>=MAX_IT) {       fprintf(fo,"  inf  |");       fprintf(fo," inf\n");    }    else        if (ipar[0]!=0) {	  fprintf(fo,"  NaN  |");	  fprintf(fo," NaN\n");       }       else {	  fprintf(fo,"%7.1le|",(double)secnds);	  fprintf(fo," %3d\n",ipar[6]);       }    fflush(fo);        printf("residual norms:\n");    printf("initial: %8.1le\n",fpar[2]);    printf("target:  %8.1le\n",fpar[3]);    printf("current: %8.1le\n",fpar[5]);    printf("convergence rate: %8.1le\n",fpar[6]);    if (nrhs==0) {       for (i=0; i<n; i++) #if defined _DOUBLE_REAL_ || defined _SINGLE_REAL_	   sol[i]-=1;#else	   sol[i].r-=1;#endif       i=1;       printf("rel. error in the solution: %8.1le\n\n",NRM(&n,sol,&i)/sqrt(1.0*n));    }    else        if (rhstyp[2]=='X' || rhstyp[2]=='x') {	 j=nrhs*n;	 if (rhstyp[1]=='G' || rhstyp[1]=='g') 	    j*=2;	 for (i=0; i<n; i++,j++) {#if defined _DOUBLE_REAL_ || defined _SINGLE_REAL_	     sol[i]-=rhs[j];#else	     sol[i].r-=rhs[j].r;	     sol[i].i-=rhs[j].i;#endif	 } // end for i	 j-=n;	 i=1;	 printf("rel. error in the solution: %8.1le\n\n",NRM(&n,sol,&i)/NRM(&n,rhs+j,&i));       }    free(w);    printf("\n\n");    /* ------------------   END apply preconditioner   ------------------- */    free(ilutmat.ia);    free(ilutmat.ja);    free(ilutmat.a);    /* ------------------------------------------------------------------- */    /* ------------------------   END MAIN part   ------------------------ */    /* ------------------------------------------------------------------- */    free(A.ia);    free(A.ja);    free(A.a);} /* end main */
上一页 12
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -