📄 misc_core.c

📁 A sparse variant of the Levenberg-Marquardt algorithm implemented by levmar has been applied to bund
💻 C
📖 第 1 页 / 共 2 页
字号:
上一页 12
	return rank;}#else // no LAPACK/* * This function computes the inverse of A in B. A and B can coincide * * The function employs LAPACK-free LU decomposition of A to solve m linear * systems A*B_i=I_i, where B_i and I_i are the i-th columns of B and I. * * A and B are mxm * * The function returns 0 in case of error, 1 if successful * */static int LEVMAR_LUINVERSE(LM_REAL *A, LM_REAL *B, int m){void *buf=NULL;int buf_sz=0;register int i, j, k, l;int *idx, maxi=-1, idx_sz, a_sz, x_sz, work_sz, tot_sz;LM_REAL *a, *x, *work, max, sum, tmp;  /* calculate required memory size */  idx_sz=m;  a_sz=m*m;  x_sz=m;  work_sz=m;  tot_sz=(a_sz + x_sz + work_sz)*sizeof(LM_REAL) + idx_sz*sizeof(int); /* should be arranged in that order for proper doubles alignment */  buf_sz=tot_sz;  buf=(void *)malloc(tot_sz);  if(!buf){    fprintf(stderr, RCAT("memory allocation in ", LEVMAR_LUINVERSE) "() failed!\n");    return 0; /* error */  }  a=buf;  x=a+a_sz;  work=x+x_sz;  idx=(int *)(work+work_sz);  /* avoid destroying A by copying it to a */  for(i=0; i<a_sz; ++i) a[i]=A[i];  /* compute the LU decomposition of a row permutation of matrix a; the permutation itself is saved in idx[] */	for(i=0; i<m; ++i){		max=0.0;		for(j=0; j<m; ++j)			if((tmp=FABS(a[i*m+j]))>max)        max=tmp;		  if(max==0.0){        fprintf(stderr, RCAT("Singular matrix A in ", LEVMAR_LUINVERSE) "()!\n");        free(buf);        return 0;      }		  work[i]=LM_CNST(1.0)/max;	}	for(j=0; j<m; ++j){		for(i=0; i<j; ++i){			sum=a[i*m+j];			for(k=0; k<i; ++k)        sum-=a[i*m+k]*a[k*m+j];			a[i*m+j]=sum;		}		max=0.0;		for(i=j; i<m; ++i){			sum=a[i*m+j];			for(k=0; k<j; ++k)        sum-=a[i*m+k]*a[k*m+j];			a[i*m+j]=sum;			if((tmp=work[i]*FABS(sum))>=max){				max=tmp;				maxi=i;			}		}		if(j!=maxi){			for(k=0; k<m; ++k){				tmp=a[maxi*m+k];				a[maxi*m+k]=a[j*m+k];				a[j*m+k]=tmp;			}			work[maxi]=work[j];		}		idx[j]=maxi;		if(a[j*m+j]==0.0)      a[j*m+j]=LM_REAL_EPSILON;		if(j!=m-1){			tmp=LM_CNST(1.0)/(a[j*m+j]);			for(i=j+1; i<m; ++i)        a[i*m+j]*=tmp;		}	}  /* The decomposition has now replaced a. Solve the m linear systems using   * forward and back substitution   */  for(l=0; l<m; ++l){    for(i=0; i<m; ++i) x[i]=0.0;    x[l]=LM_CNST(1.0);	  for(i=k=0; i<m; ++i){		  j=idx[i];		  sum=x[j];		  x[j]=x[i];		  if(k!=0)			  for(j=k-1; j<i; ++j)          sum-=a[i*m+j]*x[j];		  else        if(sum!=0.0)			    k=i+1;		  x[i]=sum;	  }	  for(i=m-1; i>=0; --i){		  sum=x[i];		  for(j=i+1; j<m; ++j)        sum-=a[i*m+j]*x[j];		  x[i]=sum/a[i*m+i];	  }    for(i=0; i<m; ++i)      B[i*m+l]=x[i];  }  free(buf);  return 1;}#endif /* HAVE_LAPACK *//* * This function computes in C the covariance matrix corresponding to a least * squares fit. JtJ is the approximate Hessian at the solution (i.e. J^T*J, where * J is the Jacobian at the solution), sumsq is the sum of squared residuals * (i.e. goodnes of fit) at the solution, m is the number of parameters (variables) * and n the number of observations. JtJ can coincide with C. *  * if JtJ is of full rank, C is computed as sumsq/(n-m)*(JtJ)^-1 * otherwise and if LAPACK is available, C=sumsq/(n-r)*(JtJ)^+ * where r is JtJ's rank and ^+ denotes the pseudoinverse * The diagonal of C is made up from the estimates of the variances * of the estimated regression coefficients. * See the documentation of routine E04YCF from the NAG fortran lib * * The function returns the rank of JtJ if successful, 0 on error * * A and C are mxm * */int LEVMAR_COVAR(LM_REAL *JtJ, LM_REAL *C, LM_REAL sumsq, int m, int n){register int i;int rnk;LM_REAL fact;#ifdef HAVE_LAPACK   rnk=LEVMAR_PSEUDOINVERSE(JtJ, C, m);   if(!rnk) return 0;#else#ifdef _MSC_VER#pragma message("LAPACK not available, LU will be used for matrix inversion when computing the covariance; this might be unstable at times")#else#warning LAPACK not available, LU will be used for matrix inversion when computing the covariance; this might be unstable at times#endif // _MSC_VER   rnk=LEVMAR_LUINVERSE(JtJ, C, m);   if(!rnk) return 0;   rnk=m; /* assume full rank */#endif /* HAVE_LAPACK */   fact=sumsq/(LM_REAL)(n-rnk);   for(i=0; i<m*m; ++i)     C[i]*=fact;   return rnk;}/*  standard deviation of the best-fit parameter i. *  covar is the mxm covariance matrix of the best-fit parameters (see also LEVMAR_COVAR()). * *  The standard deviation is computed as \sigma_{i} = \sqrt{C_{ii}}  */LM_REAL LEVMAR_STDDEV(LM_REAL *covar, int m, int i){   return (LM_REAL)sqrt(covar[i*m+i]);}/* Pearson's correlation coefficient of the best-fit parameters i and j. * covar is the mxm covariance matrix of the best-fit parameters (see also LEVMAR_COVAR()). * * The coefficient is computed as \rho_{ij} = C_{ij} / sqrt(C_{ii} C_{jj}) */LM_REAL LEVMAR_CORCOEF(LM_REAL *covar, int m, int i, int j){   return (LM_REAL)(covar[i*m+j]/sqrt(covar[i*m+i]*covar[j*m+j]));}/* coefficient of determination. * see  http://en.wikipedia.org/wiki/Coefficient_of_determination */LM_REAL LEVMAR_R2(void (*func)(LM_REAL *p, LM_REAL *hx, int m, int n, void *adata),                  LM_REAL *p, LM_REAL *x, int m, int n, void *adata){register int i;register LM_REAL tmp;LM_REAL SSerr,  // sum of squared errors, i.e. residual sum of squares \sum_i (x_i-hx_i)^2         SStot, // \sum_i (x_i-xavg)^2        *hx, xavg;  if((hx=(LM_REAL *)malloc(n*sizeof(LM_REAL)))==NULL){    fprintf(stderr, RCAT("memory allocation request failed in ", LEVMAR_R2) "()\n");    exit(1);  }  /* hx=f(p) */  (*func)(p, hx, m, n, adata);  for(i=0, tmp=0.0; i<n; ++i)    tmp+=x[i];  xavg=tmp/(LM_REAL)n;    for(i=0, SSerr=SStot=0.0; i<n; ++i){    tmp=x[i]-hx[i];    SSerr+=tmp*tmp;    tmp=x[i]-xavg;    SStot+=tmp*tmp;  }  free(hx);  return LM_CNST(1.0) - SSerr/SStot;}/* check box constraints for consistency */int LEVMAR_BOX_CHECK(LM_REAL *lb, LM_REAL *ub, int m){register int i;  if(!lb || !ub) return 1;  for(i=0; i<m; ++i)    if(lb[i]>ub[i]) return 0;  return 1;}#ifdef HAVE_LAPACK/* compute the Cholesky decomposition of C in W, s.t. C=W^t W and W is upper triangular */int LEVMAR_CHOLESKY(LM_REAL *C, LM_REAL *W, int m){register int i, j;int info;  /* copy weights array C to W so that LAPACK won't destroy it;   * C is assumed symmetric, hence no transposition is needed   */  for(i=0, j=m*m; i<j; ++i)    W[i]=C[i];  /* Cholesky decomposition */  POTF2("U", (int *)&m, W, (int *)&m, (int *)&info);  /* error treatment */  if(info!=0){		if(info<0){      fprintf(stderr, "LAPACK error: illegal value for argument %d of dpotf2 in %s\n", -info, LCAT(LEVMAR_CHOLESKY, "()"));		}		else{			fprintf(stderr, "LAPACK error: the leading minor of order %d is not positive definite,\n%s()\n", info,						RCAT("and the Cholesky factorization could not be completed in ", LEVMAR_CHOLESKY));		}    return LM_ERROR;  }  /* the decomposition is in the upper part of W (in column-major order!).   * copying it to the lower part and zeroing the upper transposes   * W in row-major order   */  for(i=0; i<m; i++)    for(j=0; j<i; j++){      W[i+j*m]=W[j+i*m];      W[j+i*m]=0.0;    }  return 0;}#endif /* HAVE_LAPACK *//* Compute e=x-y for two n-vectors x and y and return the squared L2 norm of e. * e can coincide with either x or y; x can be NULL, in which case it is assumed * to be equal to the zero vector. * Uses loop unrolling and blocking to reduce bookkeeping overhead & pipeline * stalls and increase instruction-level parallelism; see http://www.abarnett.demon.co.uk/tutorial.html */LM_REAL LEVMAR_L2NRMXMY(LM_REAL *e, LM_REAL *x, LM_REAL *y, int n){const int blocksize=8, bpwr=3; /* 8=2^3 */register int i;int j1, j2, j3, j4, j5, j6, j7;int blockn;register LM_REAL sum0=0.0, sum1=0.0, sum2=0.0, sum3=0.0;  /* n may not be divisible by blocksize,    * go as near as we can first, then tidy up.   */   blockn = (n>>bpwr)<<bpwr; /* (n / blocksize) * blocksize; */  /* unroll the loop in blocks of `blocksize'; looping downwards gains some more speed */  if(x){    for(i=blockn-1; i>0; i-=blocksize){              e[i ]=x[i ]-y[i ]; sum0+=e[i ]*e[i ];      j1=i-1; e[j1]=x[j1]-y[j1]; sum1+=e[j1]*e[j1];      j2=i-2; e[j2]=x[j2]-y[j2]; sum2+=e[j2]*e[j2];      j3=i-3; e[j3]=x[j3]-y[j3]; sum3+=e[j3]*e[j3];      j4=i-4; e[j4]=x[j4]-y[j4]; sum0+=e[j4]*e[j4];      j5=i-5; e[j5]=x[j5]-y[j5]; sum1+=e[j5]*e[j5];      j6=i-6; e[j6]=x[j6]-y[j6]; sum2+=e[j6]*e[j6];      j7=i-7; e[j7]=x[j7]-y[j7]; sum3+=e[j7]*e[j7];    }   /*    * There may be some left to do.    * This could be done as a simple for() loop,     * but a switch is faster (and more interesting)     */     i=blockn;    if(i<n){       /* Jump into the case at the place that will allow       * us to finish off the appropriate number of items.        */       switch(n - i){         case 7 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;        case 6 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;        case 5 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;        case 4 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;        case 3 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;        case 2 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;        case 1 : e[i]=x[i]-y[i]; sum0+=e[i]*e[i]; ++i;      }    }  }  else{ /* x==0 */    for(i=blockn-1; i>0; i-=blocksize){              e[i ]=-y[i ]; sum0+=e[i ]*e[i ];      j1=i-1; e[j1]=-y[j1]; sum1+=e[j1]*e[j1];      j2=i-2; e[j2]=-y[j2]; sum2+=e[j2]*e[j2];      j3=i-3; e[j3]=-y[j3]; sum3+=e[j3]*e[j3];      j4=i-4; e[j4]=-y[j4]; sum0+=e[j4]*e[j4];      j5=i-5; e[j5]=-y[j5]; sum1+=e[j5]*e[j5];      j6=i-6; e[j6]=-y[j6]; sum2+=e[j6]*e[j6];      j7=i-7; e[j7]=-y[j7]; sum3+=e[j7]*e[j7];    }   /*    * There may be some left to do.    * This could be done as a simple for() loop,     * but a switch is faster (and more interesting)     */     i=blockn;    if(i<n){       /* Jump into the case at the place that will allow       * us to finish off the appropriate number of items.        */       switch(n - i){         case 7 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;        case 6 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;        case 5 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;        case 4 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;        case 3 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;        case 2 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;        case 1 : e[i]=-y[i]; sum0+=e[i]*e[i]; ++i;      }    }  }  return sum0+sum1+sum2+sum3;}/* undefine everything. THIS MUST REMAIN AT THE END OF THE FILE */#undef LEVMAR_PSEUDOINVERSE#undef LEVMAR_LUINVERSE#undef LEVMAR_BOX_CHECK#undef LEVMAR_CHOLESKY#undef LEVMAR_COVAR#undef LEVMAR_STDDEV#undef LEVMAR_CORCOEF#undef LEVMAR_R2#undef LEVMAR_CHKJAC#undef LEVMAR_FDIF_FORW_JAC_APPROX#undef LEVMAR_FDIF_CENT_JAC_APPROX#undef LEVMAR_TRANS_MAT_MAT_MULT#undef LEVMAR_L2NRMXMY
上一页 12
💿 文件大小 77 K
👤 上传用户 gdmichael
📂 所属分类其他
🏷️ 相关标签

#Levenberg-Marquardt #implemented #algorithm #applied
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -