maxenttrainer.java

来自「mallet是自然语言处理、机器学习领域的一个开源项目。」· Java 代码 · 共 747 行 · 第 1/3 页
JAVA
747 行
/* Copyright (C) 2002 Univ. of Massachusetts Amherst, Computer Science Dept.   This file is part of "MALLET" (MAchine Learning for LanguagE Toolkit).   http://www.cs.umass.edu/~mccallum/mallet   This software is provided under the terms of the Common Public License,   version 1.0, as published by http://www.opensource.org.  For further   information, see the file `LICENSE' included with this distribution. */package edu.umass.cs.mallet.base.classify;import edu.umass.cs.mallet.base.classify.Classifier;import edu.umass.cs.mallet.base.types.Instance;import edu.umass.cs.mallet.base.types.InstanceList;import edu.umass.cs.mallet.base.types.MatrixOps;import edu.umass.cs.mallet.base.types.Instance;import edu.umass.cs.mallet.base.types.Alphabet;import edu.umass.cs.mallet.base.types.Label;import edu.umass.cs.mallet.base.types.LabelAlphabet;import edu.umass.cs.mallet.base.types.FeatureVector;import edu.umass.cs.mallet.base.types.RankedFeatureVector;import edu.umass.cs.mallet.base.types.Labeling;import edu.umass.cs.mallet.base.types.LabelVector;import edu.umass.cs.mallet.base.types.Vector;import edu.umass.cs.mallet.base.types.FeatureSelection;import edu.umass.cs.mallet.base.types.FeatureInducer;import edu.umass.cs.mallet.base.types.ExpGain;import edu.umass.cs.mallet.base.types.GradientGain;import edu.umass.cs.mallet.base.types.InfoGain;import edu.umass.cs.mallet.base.util.MalletLogger;import edu.umass.cs.mallet.base.util.Maths;import edu.umass.cs.mallet.base.maximize.Maximizable;import edu.umass.cs.mallet.base.maximize.Maximizer;import edu.umass.cs.mallet.base.maximize.tests.*;import edu.umass.cs.mallet.base.maximize.LimitedMemoryBFGS;import edu.umass.cs.mallet.base.pipe.Pipe;import edu.umass.cs.mallet.base.util.CommandOption;import edu.umass.cs.mallet.base.util.MalletProgressMessageLogger;import java.util.logging.*;import java.util.*;import java.io.*;// Does not currently handle instances that are labeled with distributions// instead of a single label./** * The trainer for a Maximum Entropy classifier.   @author Andrew McCallum <a href="mailto:mccallum@cs.umass.edu">mccallum@cs.umass.edu</a> */public class MaxEntTrainer extends ClassifierTrainer implements Boostable, Serializable //implements CommandOption.ListProviding{	private static Logger logger = MalletLogger.getLogger(MaxEntTrainer.class.getName());	private static Logger progressLogger = MalletProgressMessageLogger.getLogger(MaxEntTrainer.class.getName()+"-pl");	int numGetValueCalls = 0;	int numGetValueGradientCalls = 0;	int numIterations = 10;  public static final String EXP_GAIN = "exp";  public static final String GRADIENT_GAIN = "grad";  public static final String INFORMATION_GAIN = "info";	// xxx Why does TestMaximizable fail when this variance is very small?	static final double DEFAULT_GAUSSIAN_PRIOR_VARIANCE = 1;	static final double DEFAULT_HYPERBOLIC_PRIOR_SLOPE = 0.2;	static final double DEFAULT_HYPERBOLIC_PRIOR_SHARPNESS = 10.0;	static final Class DEFAULT_MAXIMIZER_CLASS = LimitedMemoryBFGS.class;    // CPAL    boolean usingMultiConditionalTraining = false;    boolean usingHyperbolicPrior = false;	double gaussianPriorVariance = DEFAULT_GAUSSIAN_PRIOR_VARIANCE;	double hyperbolicPriorSlope = DEFAULT_HYPERBOLIC_PRIOR_SLOPE;	double hyperbolicPriorSharpness = DEFAULT_HYPERBOLIC_PRIOR_SHARPNESS;	Class maximizerClass = DEFAULT_MAXIMIZER_CLASS;    // CPAL    static CommandOption.Boolean usingMultiConditionalTrainingOption =    new CommandOption.Boolean (MaxEntTrainer.class, "useMCTraining", "true|false", false, false,                                                        "Use MultiConditional Training", null);    static CommandOption.Boolean usingHyperbolicPriorOption =	new CommandOption.Boolean (MaxEntTrainer.class, "useHyperbolicPrior", "true|false", false, false,														 "Use hyperbolic (close to L1 penalty) prior over parameters", null);	static CommandOption.Double gaussianPriorVarianceOption =	new CommandOption.Double (MaxEntTrainer.class, "gaussianPriorVariance", "FLOAT", true, 10.0,														"Variance of the gaussian prior over parameters", null);	static CommandOption.Double hyperbolicPriorSlopeOption =	new CommandOption.Double (MaxEntTrainer.class, "hyperbolicPriorSlope", "FLOAT", true, 0.2,														"Slope of the (L1 penalty) hyperbolic prior over parameters", null);	static CommandOption.Double hyperbolicPriorSharpnessOption =	new CommandOption.Double (MaxEntTrainer.class, "hyperbolicPriorSharpness", "FLOAT", true, 10.0,														"Sharpness of the (L1 penalty) hyperbolic prior over parameters", null);	static final CommandOption.List commandOptions =	new CommandOption.List (		"Maximum Entropy Classifier",		new CommandOption[] {			usingHyperbolicPriorOption,			gaussianPriorVarianceOption,			hyperbolicPriorSlopeOption,			hyperbolicPriorSharpnessOption,            usingMultiConditionalTrainingOption,   // CPAL        });	public static CommandOption.List getCommandOptionList ()	{		return commandOptions;	}	/*	public MaxEntTrainer(Maximizer.ByGradient maximizer)	{		this.maximizerByGradient = maximizer;		this.usingHyperbolicPrior = false;	}	*/	public MaxEntTrainer (CommandOption.List col)	{		this.usingHyperbolicPrior = usingHyperbolicPriorOption.value;		this.gaussianPriorVariance = gaussianPriorVarianceOption.value;		this.hyperbolicPriorSlope = hyperbolicPriorSlopeOption.value;		this.hyperbolicPriorSharpness = hyperbolicPriorSharpnessOption.value;        this.usingMultiConditionalTraining = usingMultiConditionalTrainingOption.value;    }	public MaxEntTrainer ()	{		this (false);	}	public MaxEntTrainer (boolean useHyperbolicPrior)	{		this.usingHyperbolicPrior = useHyperbolicPrior;	}    /** Constructs a trainer with a parameter to avoid overtraining.  1.0 is     * usually a reasonable default value. */	public MaxEntTrainer (double gaussianPriorVariance)	{		this.usingHyperbolicPrior = false;		this.gaussianPriorVariance = gaussianPriorVariance;	}    // CPAL - added this to do MultiConditionalTraining    public MaxEntTrainer (double gaussianPriorVariance, boolean useMultiConditionalTraining )    {        this.usingHyperbolicPrior = false;        this.usingMultiConditionalTraining = useMultiConditionalTraining;        this.gaussianPriorVariance = gaussianPriorVariance;    }    public MaxEntTrainer (double hyperbolicPriorSlope,												double hyperbolicPriorSharpness)	{		this.usingHyperbolicPrior = true;		this.hyperbolicPriorSlope = hyperbolicPriorSlope;		this.hyperbolicPriorSharpness = hyperbolicPriorSharpness;	}	public Maximizable.ByGradient getMaximizableTrainer (InstanceList ilist)	{		if (ilist == null)			return new MaximizableTrainer ();		return new MaximizableTrainer (ilist, null);	}  /**   * Specifies the maximum number of iterations to run during a single call   * to <code>train</code> or <code>trainWithFeatureInduction</code>.  Not   * currently functional.   * @return This trainer   */  // XXX Since we maximize before using numIterations, this doesn't work.  // Is that a bug?  If so, should the default numIterations be higher?	public MaxEntTrainer setNumIterations (int i)	{		numIterations = i;		return this;	}	public MaxEntTrainer setUseHyperbolicPrior (boolean useHyperbolicPrior)	{		this.usingHyperbolicPrior = useHyperbolicPrior;		return this;	}    /**     * Sets a parameter to prevent overtraining.  A smaller variance for the prior     * means that feature weights are expected to hover closer to 0, so extra     * evidence is required to set a higher weight.     * @return This trainer     */	public MaxEntTrainer setGaussianPriorVariance (double gaussianPriorVariance)	{		this.usingHyperbolicPrior = false;		this.gaussianPriorVariance = gaussianPriorVariance;		return this;	}	public MaxEntTrainer setHyperbolicPriorSlope(double hyperbolicPriorSlope)	{		this.usingHyperbolicPrior = true;		this.hyperbolicPriorSlope = hyperbolicPriorSlope;		return this;	}	public MaxEntTrainer setHyperbolicPriorSharpness (double hyperbolicPriorSharpness)	{		this.usingHyperbolicPrior = true;		this.hyperbolicPriorSharpness = hyperbolicPriorSharpness;		return this;	}	public Classifier train (InstanceList trainingSet,													 InstanceList validationSet,													 InstanceList testSet,													 ClassifierEvaluating evaluator,													 Classifier initialClassifier)	{		logger.fine ("trainingSet.size() = "+trainingSet.size());		MaximizableTrainer mt = new MaximizableTrainer (trainingSet, (MaxEnt)initialClassifier);		Maximizer.ByGradient maximizer = new LimitedMemoryBFGS();		maximizer.maximize (mt); // XXX given the loop below, this seems wrong.		logger.info("MaxEnt ngetValueCalls:"+getValueCalls()+"\nMaxEnt ngetValueGradientCalls:"+getValueGradientCalls());//		boolean converged;////	 	for (int i = 0; i < numIterations; i++) {//			converged = maximizer.maximize (mt, 1);//			if (converged)//			 	break;//			else if (evaluator != null)//			 	if (!evaluator.evaluate (mt.getClassifier(), converged, i, mt.getValue(),//				 												 trainingSet, validationSet, testSet))//				 	break;//		}//		TestMaximizable.testValueAndGradient (mt);		progressLogger.info("\n"); //  progess messages are on one line; move on.		return mt.getClassifier ();	}  /**
maxenttrainer.java - 源码说明

本页面展示了「mallet是自然语言处理、机器学习领域的一个开源项目。」中的 maxenttrainer.java 源码文件，采用 Java 编程语言编写，共 747 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与mallet相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?