📄 optimization.java
System.err.println("alpha: " + Utils.doubleToString(alpha,10,7)); } if(alpha <= m_Zero){ // Zero m_IsZeroStep = true; if (m_Debug) System.err.println("Alpha too small, try again"); return x; } alam = alpha; // Always try full feasible newton step if(alam > 1.0) alam = 1.0; // Iteration of one newton step, if necessary, backtracking is done double initF=fold, // Initial function value hi=alam, lo=alam, newSlope=0, fhi=m_f, flo=m_f;// Variables used for beta condition double[] newGrad; // Gradient on the new variable values kloop: for (k=0;;k++) { if(m_Debug) System.err.println("\nIteration: " + k); for (i=0;i<len;i++){ if(!isFixed[i]){ x[i] = xold[i]+alam*direct[i]; // Compute xnew if(!Double.isNaN(nwsBounds[0][i]) && (x[i]<nwsBounds[0][i])){ x[i] = nwsBounds[0][i]; //Rounding error } else if(!Double.isNaN(nwsBounds[1][i]) && (x[i]>nwsBounds[1][i])){ x[i] = nwsBounds[1][i]; //Rounding error } } } m_f = objectiveFunction(x); // Compute fnew while(Double.isInfinite(m_f)){ // Avoid infinity if(m_Debug) System.err.println("Too large m_f. Shrink step by half."); alam *= 0.5; // Shrink by half if(alam <= m_Epsilon){ if(m_Debug) System.err.println("Wrong starting points, change them!"); return x; } for (i=0;i<len;i++) if(!isFixed[i]) x[i] = xold[i]+alam*direct[i]; m_f = objectiveFunction(x); initF = Double.POSITIVE_INFINITY; } if(m_Debug) { System.err.println("obj. function: " + Utils.doubleToString(m_f, 10, 7)); System.err.println("threshold: " + Utils.doubleToString(fold+m_ALF*alam*m_Slope,10,7)); } if(m_f<=fold+m_ALF*alam*m_Slope){// Alpha condition: sufficient function decrease if(m_Debug) System.err.println("Sufficient function decrease (alpha condition): "); newGrad = evaluateGradient(x); for(newSlope=0.0,i=0; i<len; i++) if(!isFixed[i]) newSlope += newGrad[i]*direct[i]; if(newSlope >= m_BETA*m_Slope){ // Beta condition: ensure pos. defnty. if(m_Debug) System.err.println("Increasing derivatives (beta condition): "); if((fixedOne!=-1) && (alam>=alpha)){ // Has bounds and over if(direct[fixedOne] > 0){ x[fixedOne] = nwsBounds[1][fixedOne]; // Avoid rounding error nwsBounds[1][fixedOne]=Double.NaN; //Add cons. to working set } else{ x[fixedOne] = nwsBounds[0][fixedOne]; // Avoid rounding error nwsBounds[0][fixedOne]=Double.NaN; //Add cons. to working set } if(m_Debug) System.err.println("Fix variable " +fixedOne+" to bound "+ x[fixedOne]+ " from value "+ xold[fixedOne]); isFixed[fixedOne]=true; // Fix the variable wsBdsIndx.addElement(new Integer(fixedOne)); } return x; } else if(k==0){ // First time: increase alam // Search for the smallest value not complying with alpha condition double upper = Math.min(alpha,maxalam); if(m_Debug) System.err.println("Alpha condition holds, increase alpha... "); while((alam>=upper) || (m_f>fold+m_ALF*alam*m_Slope)){ lo = alam; flo = m_f; alam *= 2.0; if(alam>=upper) alam=upper; for (i=0;i<len;i++) if(!isFixed[i]) x[i] = xold[i]+alam*direct[i]; m_f = objectiveFunction(x); newGrad = evaluateGradient(x); for(newSlope=0.0,i=0; i<len; i++) if(!isFixed[i]) newSlope += newGrad[i]*direct[i]; if(newSlope >= m_BETA*m_Slope){ if (m_Debug) System.err.println("Increasing derivatives (beta condition): "); if((fixedOne!=-1) && (alam>=alpha)){ // Has bounds and over if(direct[fixedOne] > 0){ x[fixedOne] = nwsBounds[1][fixedOne]; // Avoid rounding error nwsBounds[1][fixedOne]=Double.NaN; //Add cons. to working set } else{ x[fixedOne] = nwsBounds[0][fixedOne]; // Avoid rounding error nwsBounds[0][fixedOne]=Double.NaN; //Add cons. 
to working set } if(m_Debug) System.err.println("Fix variable " +fixedOne+" to bound "+ x[fixedOne]+ " from value "+ xold[fixedOne]); isFixed[fixedOne]=true; // Fix the variable wsBdsIndx.addElement(new Integer(fixedOne)); } return x; } } hi = alam; fhi = m_f; break kloop; } else{ if(m_Debug) System.err.println("Alpha condition holds."); hi = alam2; lo = alam; flo = m_f; break kloop; } } else if (alam < alamin) { // No feasible lambda found if(initF<fold){ alam = Math.min(1.0,alpha); for (i=0;i<len;i++) if(!isFixed[i]) x[i] = xold[i]+alam*direct[i]; //Still take Alpha if (m_Debug) System.err.println("No feasible lambda: still take"+ " alpha="+alam); if((fixedOne!=-1) && (alam>=alpha)){ // Has bounds and over if(direct[fixedOne] > 0){ x[fixedOne] = nwsBounds[1][fixedOne]; // Avoid rounding error nwsBounds[1][fixedOne]=Double.NaN; //Add cons. to working set } else{ x[fixedOne] = nwsBounds[0][fixedOne]; // Avoid rounding error nwsBounds[0][fixedOne]=Double.NaN; //Add cons. to working set } if(m_Debug) System.err.println("Fix variable " +fixedOne+" to bound "+ x[fixedOne]+ " from value "+ xold[fixedOne]); isFixed[fixedOne]=true; // Fix the variable wsBdsIndx.addElement(new Integer(fixedOne)); } } else{ // Convergence on delta(x) for(i=0;i<len;i++) x[i]=xold[i]; m_f=fold; if (m_Debug) System.err.println("Cannot find feasible lambda"); } return x; } else { // Backtracking by polynomial interpolation if(k==0){ // First time backtrack: quadratic interpolation if(!Double.isInfinite(initF)) initF = m_f; // lambda = -g'(0)/(2*g''(0)) tmplam = -0.5*alam*m_Slope/((m_f-fold)/alam-m_Slope); } else { // Subsequent backtrack: cubic interpolation rhs1 = m_f-fold-alam*m_Slope; rhs2 = fhi-fold-alam2*m_Slope; a=(rhs1/(alam*alam)-rhs2/(alam2*alam2))/(alam-alam2); b=(-alam2*rhs1/(alam*alam)+alam*rhs2/(alam2*alam2))/(alam-alam2); if (a == 0.0) tmplam = -m_Slope/(2.0*b); else { disc=b*b-3.0*a*m_Slope; if (disc < 0.0) disc = 0.0; tmplam=(-b+Math.sqrt(disc))/(3.0*a); } if (m_Debug) System.err.print("newstuff: \n" + "a: " + Utils.doubleToString(a,10,7)+ "\n" + "b: " + Utils.doubleToString(b,10,7)+ "\n" + "disc: " + Utils.doubleToString(disc,10,7)+ "\n" + "tmplam: " + tmplam + "\n" + "alam: " + Utils.doubleToString(alam,10,7)+ "\n"); if (tmplam>0.5*alam) tmplam=0.5*alam; // lambda <= 0.5*lambda_old } } alam2=alam; fhi=m_f; alam=Math.max(tmplam,0.1*alam); // lambda >= 0.1*lambda_old if(alam>alpha){ throw new Exception("Sth. wrong in lnsrch:"+ "Lambda infeasible!(lambda="+alam+ ", alpha="+alpha+", upper="+tmplam+ "|"+(-alpha*m_Slope/(2.0*((m_f-fold)/alpha-m_Slope)))+ ", m_f="+m_f+", fold="+fold+ ", slope="+m_Slope); } } // Endfor(k=0;;k++) // Quadratic interpolation between lamda values between lo and hi. // If cannot find a value satisfying beta condition, use lo. 
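  // The increment chosen below is the stationary point of the quadratic q(t)
  // fitted to q(0) = flo, q'(0) = newSlope and q(ldiff) = fhi, with t measured
  // from lo:
  //   t* = -0.5*newSlope*ldiff^2 / (fhi - flo - newSlope*ldiff),
  // i.e. the minimiser whenever the fit is convex. The increment is then
  // floored at 0.2*ldiff so each trial point moves a meaningful distance
  // away from lo.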
  double ldiff = hi - lo, lincr;
  if (m_Debug)
    System.err.println("Last stage of searching for beta condition (alam between "
                       + Utils.doubleToString(lo,10,7) + " and "
                       + Utils.doubleToString(hi,10,7) + ")...");

  while ((newSlope < m_BETA*m_Slope) && (ldiff >= alamin)) {
    lincr = -0.5*newSlope*ldiff*ldiff / (fhi - flo - newSlope*ldiff);
    if (lincr < 0.2*ldiff)
      lincr = 0.2*ldiff;
    alam = lo + lincr;

    for (i = 0; i < len; i++)
      if (!isFixed[i])
        x[i] = xold[i] + alam*direct[i];
    m_f = objectiveFunction(x);

    if (m_f > fold + m_ALF*alam*m_Slope) {
      // Alpha condition fails, shrink lambda_upper
      ldiff = lincr;
      fhi = m_f;
    } else { // Alpha condition holds
      newGrad = evaluateGradient(x);
      for (newSlope = 0.0, i = 0; i < len; i++)
        if (!isFixed[i])
          newSlope += newGrad[i]*direct[i];

      if (newSlope < m_BETA*m_Slope) {
        // Beta condition fails, shrink lambda_lower
        lo = alam;
        ldiff -= lincr;
        flo = m_f;
      }
    }
  }

  if (newSlope < m_BETA*m_Slope) { // Cannot satisfy beta condition, take lo
    if (m_Debug)
      System.err.println("Beta condition cannot be satisfied, take alpha condition");
    alam = lo;
    for (i = 0; i < len; i++)
      if (!isFixed[i])
        x[i] = xold[i] + alam*direct[i];
    m_f = flo;
  } else if (m_Debug) {
    System.err.println("Both alpha and beta conditions are satisfied. alam="
                       + Utils.doubleToString(alam,10,7));
  }

  if ((fixedOne != -1) && (alam >= alpha)) { // Has bounds and over
    if (direct[fixedOne] > 0) {
      x[fixedOne] = nwsBounds[1][fixedOne]; // Avoid rounding error
      nwsBounds[1][fixedOne] = Double.NaN;  // Add cons. to working set
    } else {
      x[fixedOne] = nwsBounds[0][fixedOne]; // Avoid rounding error
      nwsBounds[0][fixedOne] = Double.NaN;  // Add cons. to working set
    }
    if (m_Debug)
      System.err.println("Fix variable " + fixedOne
                         + " to bound " + x[fixedOne]
                         + " from value " + xold[fixedOne]);
    isFixed[fixedOne] = true; // Fix the variable
    wsBdsIndx.addElement(new Integer(fixedOne));
  }

  return x;
}

/**
 * Main algorithm. For descriptions see "Practical Optimization".
 *
 * @param initX initial point of x, assuming no value is on the bound!
 * @param constraints the bound constraints of each variable;
 *        constraints[0] is the lower bounds and
 *        constraints[1] is the upper bounds
 * @return the solution of x, null if the number of iterations is not enough
 * @exception Exception if an error occurs
 */
public double[] findArgmin(double[] initX, double[][] constraints)
  throws Exception {
  int l = initX.length;

  // Initially all variables are free; all bounds are non-working-set constraints
  boolean[] isFixed = new boolean[l];
  double[][] nwsBounds = new double[2][l];
  // Record indices of fixed variables, simply for efficiency
  FastVector wsBdsIndx = new FastVector();
  // Vectors used to record the variable indices to be freed
  FastVector toFree = null, oldToFree = null;

  // Initial value of obj. function, gradient and inverse of the Hessian
  m_f = objectiveFunction(initX);

  double sum = 0;
  double[] grad = evaluateGradient(initX), oldGrad, oldX,
           deltaGrad = new double[l], deltaX = new double[l],
           direct = new double[l], x = new double[l];
  Matrix L = new Matrix(l, l), // Lower triangle of Cholesky factor
         D = new Matrix(l, l); // Diagonal of Cholesky factor

  for (int i = 0; i < l; i++) {
    L.setRow(i, new double[l]);
    L.setElement(i, i, 1.0);
    D.setRow(i, new double[l]);
    D.setElement(i, i, 1.0);
    direct[i] = -grad[i];
    sum += grad[i]*grad[i];
    x[i] = initX[i];
    nwsBounds[0][i] = constraints[0][i];
    nwsBounds[1][i] = constraints[1][i];
    isFixed[i] = false;
  }

  double stpmax = m_STPMX*Math.max(Math.sqrt(sum), l);

iterates:
  for (int step = 0; step < m_MAXITS; step++) {
    if (m_Debug)
      System.err.println("\nIteration # " + step + ":");

    // Try at most one feasible newton step, i.e. 0 < lambda <= alpha
    oldX = x;
    oldGrad = grad; // Also update grad

    if (m_Debug)
      System.err.println("Line search ... ");
    m_IsZeroStep = false;
    x = lnsrch(x, grad, direct, stpmax, isFixed, nwsBounds, wsBdsIndx);
    if (m_Debug)
      System.err.println("Line search finished.");

    if (m_IsZeroStep) { // Zero step, simply delete rows/cols of D and L
      for (int f = 0; f < wsBdsIndx.size(); f++) {
        int idx = ((Integer)wsBdsIndx.elementAt(f)).intValue();
        L.setRow(idx, new double[l]);
        L.setColumn(idx, new double[l]);
        D.setElement(idx, idx, 0.0);
      }
      grad = evaluateGradient(x);
      step--;
    } else {
      // Check convergence on x
      boolean finish = false;
      double test = 0.0;
      for (int h = 0; h < l; h++) {
        deltaX[h] = x[h] - oldX[h];
        double tmp = Math.abs(deltaX[h]) / Math.max(Math.abs(x[h]), 1.0);
        if (tmp > test)
          test = tmp;
      }

      if (test < m_Zero) {
        if (m_Debug)
          System.err.println("\nDeltaX converge: " + test);
        finish = true;
      }

      // Check zero gradient
      grad = evaluateGradient(x);