
📄 logistic.java

📁 A collection of data mining algorithms written in Java, covering clustering, classification, preprocessing, and more
💻 JAVA
📖 Page 1 of 2
     * @return the value of the objective function
     */
    protected double objectiveFunction(double[] x) {
      double nll = 0;                // -LogLikelihood
      int dim = m_NumPredictors + 1; // Number of variables per class

      for (int i = 0; i < cls.length; i++) { // ith instance
        double[] exp = new double[m_NumClasses - 1];
        int index;
        for (int offset = 0; offset < m_NumClasses - 1; offset++) {
          index = offset * dim;
          for (int j = 0; j < dim; j++)
            exp[offset] += m_Data[i][j] * x[index + j];
        }
        double max = exp[Utils.maxIndex(exp)];
        double denom = Math.exp(-max);
        double num;
        if (cls[i] == m_NumClasses - 1) { // Class of this instance
          num = -max;
        } else {
          num = exp[cls[i]] - max;
        }
        for (int offset = 0; offset < m_NumClasses - 1; offset++) {
          denom += Math.exp(exp[offset] - max);
        }

        nll -= weights[i] * (num - Math.log(denom)); // Weighted NLL
      }

      // Ridge: note that intercepts NOT included
      for (int offset = 0; offset < m_NumClasses - 1; offset++) {
        for (int r = 1; r < dim; r++)
          nll += m_Ridge * x[offset * dim + r] * x[offset * dim + r];
      }

      return nll;
    }
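    /*
     * Written out, with beta_c denoting the coefficient block x[c*dim .. c*dim+dim-1]
     * and beta_{K-1} fixed at zero as the reference class, the quantity above is
     *
     *   nll(beta) = - sum_i w_i * ( beta_{y_i}.a_i - log sum_{c=0}^{K-1} exp(beta_c.a_i) )
     *               + m_Ridge * sum_{c=0}^{K-2} sum_{r=1}^{dim-1} beta_{c,r}^2
     *
     * where a_i is row i of m_Data (with a leading 1 for the intercept). The
     * intercepts (r = 0) are excluded from the ridge penalty, and subtracting
     * `max` before exponentiating is the usual log-sum-exp guard against
     * floating-point overflow.
     */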
    /**
     * Evaluates the gradient vector
     * @param x the current values of variables
     * @return the gradient vector
     */
    protected double[] evaluateGradient(double[] x) {
      double[] grad = new double[x.length];
      int dim = m_NumPredictors + 1; // Number of variables per class

      for (int i = 0; i < cls.length; i++) { // ith instance
        double[] num = new double[m_NumClasses - 1]; // numerator of [-log(1+sum(exp))]'
        int index;
        for (int offset = 0; offset < m_NumClasses - 1; offset++) { // Which part of x
          double exp = 0.0;
          index = offset * dim;
          for (int j = 0; j < dim; j++)
            exp += m_Data[i][j] * x[index + j];
          num[offset] = exp;
        }
        double max = num[Utils.maxIndex(num)];
        double denom = Math.exp(-max); // Denominator of [-log(1+sum(exp))]'
        for (int offset = 0; offset < m_NumClasses - 1; offset++) {
          num[offset] = Math.exp(num[offset] - max);
          denom += num[offset];
        }
        Utils.normalize(num, denom);

        // Update denominator of the gradient of -log(Posterior)
        double firstTerm;
        for (int offset = 0; offset < m_NumClasses - 1; offset++) { // Which part of x
          index = offset * dim;
          firstTerm = weights[i] * num[offset];
          for (int q = 0; q < dim; q++) {
            grad[index + q] += firstTerm * m_Data[i][q];
          }
        }

        if (cls[i] != m_NumClasses - 1) { // Not the last class
          for (int p = 0; p < dim; p++) {
            grad[cls[i] * dim + p] -= weights[i] * m_Data[i][p];
          }
        }
      }

      // Ridge: note that intercepts NOT included
      for (int offset = 0; offset < m_NumClasses - 1; offset++) {
        for (int r = 1; r < dim; r++)
          grad[offset * dim + r] += 2 * m_Ridge * x[offset * dim + r];
      }

      return grad;
    }
  }
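  /*
   * The gradient above is the exact derivative of the penalized objective:
   * for class c < K-1 and component j,
   *
   *   d nll / d beta_{c,j} = sum_i w_i * ( P(c | a_i) - [y_i == c] ) * a_{i,j}
   *                          + 2 * m_Ridge * beta_{c,j}   (penalty term for j >= 1 only)
   *
   * where P(c | a_i) is the normalized softmax weight stored in num[c].
   */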
  /**
   * Returns default capabilities of the classifier.
   *
   * @return the capabilities of this classifier
   */
  public Capabilities getCapabilities() {
    Capabilities result = super.getCapabilities();

    // attributes
    result.enable(Capability.NOMINAL_ATTRIBUTES);
    result.enable(Capability.NUMERIC_ATTRIBUTES);
    result.enable(Capability.DATE_ATTRIBUTES);
    result.enable(Capability.MISSING_VALUES);

    // class
    result.enable(Capability.NOMINAL_CLASS);
    result.enable(Capability.MISSING_CLASS_VALUES);

    return result;
  }

  /**
   * Builds the classifier
   *
   * @param train the training data to be used for generating the
   * boosted classifier.
   * @throws Exception if the classifier could not be built successfully
   */
  public void buildClassifier(Instances train) throws Exception {
    // can classifier handle the data?
    getCapabilities().testWithFail(train);

    // remove instances with missing class
    train = new Instances(train);
    train.deleteWithMissingClass();

    // Replace missing values
    m_ReplaceMissingValues = new ReplaceMissingValues();
    m_ReplaceMissingValues.setInputFormat(train);
    train = Filter.useFilter(train, m_ReplaceMissingValues);

    // Remove useless attributes
    m_AttFilter = new RemoveUseless();
    m_AttFilter.setInputFormat(train);
    train = Filter.useFilter(train, m_AttFilter);

    // Transform attributes
    m_NominalToBinary = new NominalToBinary();
    m_NominalToBinary.setInputFormat(train);
    train = Filter.useFilter(train, m_NominalToBinary);

    // Extract data
    m_ClassIndex = train.classIndex();
    m_NumClasses = train.numClasses();

    int nK = m_NumClasses - 1;              // Only K-1 class labels needed
    int nR = m_NumPredictors = train.numAttributes() - 1;
    int nC = train.numInstances();

    m_Data = new double[nC][nR + 1];        // Data values
    int[] Y = new int[nC];                  // Class labels
    double[] xMean = new double[nR + 1];    // Attribute means
    double[] xSD = new double[nR + 1];      // Attribute stddevs
    double[] sY = new double[nK + 1];       // Number of instances per class
    double[] weights = new double[nC];      // Weights of instances
    double totWeights = 0;                  // Total weight of the instances
    m_Par = new double[nR + 1][nK];         // Optimized parameter values

    if (m_Debug) {
      System.out.println("Extracting data...");
    }

    for (int i = 0; i < nC; i++) {
      // initialize X[][]
      Instance current = train.instance(i);
      Y[i] = (int) current.classValue(); // Class value starts from 0
      weights[i] = current.weight();     // Dealing with weights
      totWeights += weights[i];

      m_Data[i][0] = 1;
      int j = 1;
      for (int k = 0; k <= nR; k++) {
        if (k != m_ClassIndex) {
          double x = current.value(k);
          m_Data[i][j] = x;
          xMean[j] += weights[i] * x;
          xSD[j] += weights[i] * x * x;
          j++;
        }
      }

      // Class count
      sY[Y[i]]++;
    }

    if ((totWeights <= 1) && (nC > 1))
      throw new Exception("Sum of weights of instances less than 1, please reweight!");

    xMean[0] = 0;
    xSD[0] = 1;
    for (int j = 1; j <= nR; j++) {
      xMean[j] = xMean[j] / totWeights;
      if (totWeights > 1)
        xSD[j] = Math.sqrt(Math.abs(xSD[j] - totWeights * xMean[j] * xMean[j]) / (totWeights - 1));
      else
        xSD[j] = 0;
    }

    if (m_Debug) {
      // Output stats about input data
      System.out.println("Descriptives...");
      for (int m = 0; m <= nK; m++)
        System.out.println(sY[m] + " cases have class " + m);
      System.out.println("\n Variable     Avg       SD    ");
      for (int j = 1; j <= nR; j++)
        System.out.println(Utils.doubleToString(j, 8, 4)
                           + Utils.doubleToString(xMean[j], 10, 4)
                           + Utils.doubleToString(xSD[j], 10, 4));
    }

    // Normalise input data
    for (int i = 0; i < nC; i++) {
      for (int j = 0; j <= nR; j++) {
        if (xSD[j] != 0) {
          m_Data[i][j] = (m_Data[i][j] - xMean[j]) / xSD[j];
        }
      }
    }

    if (m_Debug) {
      System.out.println("\nIteration History...");
    }

    double x[] = new double[(nR + 1) * nK];
    double[][] b = new double[2][x.length]; // Boundary constraints, N/A here

    // Initialize
    for (int p = 0; p < nK; p++) {
      int offset = p * (nR + 1);
      x[offset] = Math.log(sY[p] + 1.0) - Math.log(sY[nK] + 1.0); // Null model
      b[0][offset] = Double.NaN;
      b[1][offset] = Double.NaN;
      for (int q = 1; q <= nR; q++) {
        x[offset + q] = 0.0;
        b[0][offset + q] = Double.NaN;
        b[1][offset + q] = Double.NaN;
      }
    }

    OptEng opt = new OptEng();
    opt.setDebug(m_Debug);
    opt.setWeights(weights);
    opt.setClassLabels(Y);

    if (m_MaxIts == -1) { // Search until convergence
      x = opt.findArgmin(x, b);
      while (x == null) {
        x = opt.getVarbValues();
        if (m_Debug)
          System.out.println("200 iterations finished, not enough!");
        x = opt.findArgmin(x, b);
      }
      if (m_Debug)
        System.out.println(" -------------<Converged>--------------");
    } else {
      opt.setMaxIteration(m_MaxIts);
      x = opt.findArgmin(x, b);
      if (x == null) // Not enough, but use the current value
        x = opt.getVarbValues();
    }

    m_LL = -opt.getMinFunction(); // Log-likelihood

    // Don't need data matrix anymore
    m_Data = null;

    // Convert coefficients back to non-normalized attribute units
    for (int i = 0; i < nK; i++) {
      m_Par[0][i] = x[i * (nR + 1)];
      for (int j = 1; j <= nR; j++) {
        m_Par[j][i] = x[i * (nR + 1) + j];
        if (xSD[j] != 0) {
          m_Par[j][i] /= xSD[j];
          m_Par[0][i] -= m_Par[j][i] * xMean[j];
        }
      }
    }
  }

  /**
   * Computes the distribution for a given instance
   *
   * @param instance the instance for which distribution is computed
   * @return the distribution
   * @throws Exception if the distribution can't be computed successfully
   */
  public double[] distributionForInstance(Instance instance) throws Exception {

    m_ReplaceMissingValues.input(instance);
    instance = m_ReplaceMissingValues.output();
    m_AttFilter.input(instance);
    instance = m_AttFilter.output();
    m_NominalToBinary.input(instance);
    instance = m_NominalToBinary.output();

    // Extract the predictor columns into an array
    double[] instDat = new double[m_NumPredictors + 1];
    int j = 1;
    instDat[0] = 1;
    for (int k = 0; k <= m_NumPredictors; k++) {
      if (k != m_ClassIndex) {
        instDat[j++] = instance.value(k);
      }
    }

    double[] distribution = evaluateProbability(instDat);
    return distribution;
  }

  /**
   * Compute the posterior distribution using optimized parameter values
   * and the testing instance.
   * @param data the testing instance
   * @return the posterior probability distribution
   */
  private double[] evaluateProbability(double[] data) {
    double[] prob = new double[m_NumClasses],
             v = new double[m_NumClasses];

    // Log-posterior before normalizing
    for (int j = 0; j < m_NumClasses - 1; j++) {
      for (int k = 0; k <= m_NumPredictors; k++) {
        v[j] += m_Par[k][j] * data[k];
      }
    }
    v[m_NumClasses - 1] = 0;

    // Do so to avoid scaling problems
    for (int m = 0; m < m_NumClasses; m++) {
      double sum = 0;
      for (int n = 0; n < m_NumClasses - 1; n++)
        sum += Math.exp(v[n] - v[m]);
      prob[m] = 1 / (sum + Math.exp(-v[m]));
    }

    return prob;
  }
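  /*
   * evaluateProbability is an overflow-safe softmax over the K class scores,
   * with v[K-1] = 0 for the reference class. Each entry equals
   *
   *   prob[m] = exp(v_m) / ( exp(v_0) + ... + exp(v_{K-2}) + 1 )
   *
   * but is computed as 1 / ( sum_n exp(v_n - v_m) + exp(-v_m) ), so the dominant
   * class stays well-conditioned and negligible classes round down to zero
   * instead of overflowing a shared numerator.
   */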
  /**
   * Gets a string describing the classifier.
   *
   * @return a string describing the classifier built.
   */
  public String toString() {

    String result = "Logistic Regression with ridge parameter of " + m_Ridge;
    if (m_Par == null) {
      return result + ": No model built yet.";
    }

    result += "\nCoefficients...\n"
      + "Variable      Coeff.\n";
    for (int j = 1; j <= m_NumPredictors; j++) {
      result += Utils.doubleToString(j, 8, 0);
      for (int k = 0; k < m_NumClasses - 1; k++)
        result += " " + Utils.doubleToString(m_Par[j][k], 12, 4);
      result += "\n";
    }

    result += "Intercept ";
    for (int k = 0; k < m_NumClasses - 1; k++)
      result += " " + Utils.doubleToString(m_Par[0][k], 10, 4);
    result += "\n";

    result += "\nOdds Ratios...\n"
      + "Variable         O.R.\n";
    for (int j = 1; j <= m_NumPredictors; j++) {
      result += Utils.doubleToString(j, 8, 0);
      for (int k = 0; k < m_NumClasses - 1; k++) {
        double ORc = Math.exp(m_Par[j][k]);
        result += " " + ((ORc > 1e10) ? "" + ORc : Utils.doubleToString(ORc, 12, 4));
      }
      result += "\n";
    }

    return result;
  }

  /**
   * Main method for testing this class.
   *
   * @param argv should contain the command line arguments to the
   * scheme (see Evaluation)
   */
  public static void main(String[] argv) {
    try {
      System.out.println(Evaluation.evaluateModel(new Logistic(), argv));
    } catch (Exception e) {
      e.printStackTrace();
      System.err.println(e.getMessage());
    }
  }
}
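For readers who want to try the classifier outside of Evaluation.evaluateModel, the sketch below shows one plausible way to drive it through the surrounding Weka 3 API. It is not part of logistic.java: the ARFF path "iris.arff" is a placeholder, and setRidge() is assumed as the setter for the m_Ridge field referenced above.

import java.io.BufferedReader;
import java.io.FileReader;

import weka.core.Instances;

public class LogisticDemo {
  public static void main(String[] args) throws Exception {
    // Load a dataset; "iris.arff" is a placeholder path.
    Instances data = new Instances(new BufferedReader(new FileReader("iris.arff")));
    data.setClassIndex(data.numAttributes() - 1); // last attribute is the class

    Logistic model = new Logistic();
    model.setRidge(1e-8);        // assumed setter for the m_Ridge penalty above
    model.buildClassifier(data); // runs the optimization shown in buildClassifier()

    // Posterior class probabilities for the first training instance
    double[] dist = model.distributionForInstance(data.instance(0));
    for (int c = 0; c < dist.length; c++)
      System.out.println("class " + c + ": " + dist[c]);

    System.out.println(model); // coefficients and odds ratios via toString()
  }
}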
