venuepipe.java

来自「mallet是自然语言处理、机器学习领域的一个开源项目。」· Java 代码 · 共 61 行

JAVA
61
字号
package edu.umass.cs.mallet.projects.seg_plus_coref.coreference;import com.wcohen.secondstring.*;import edu.umass.cs.mallet.base.types.*;import edu.umass.cs.mallet.base.classify.*;import edu.umass.cs.mallet.base.pipe.*;import edu.umass.cs.mallet.base.pipe.iterator.*;import edu.umass.cs.mallet.base.util.*;import java.util.*;import java.lang.*;import java.io.*;public class VenuePipe extends Pipe{	StringDistance distMetric;	double threshold = 0.5;	public VenuePipe(double threshold)	{		this.threshold = threshold;	}	public VenuePipe(StringDistance dm) 	{		this.distMetric = dm;	}	public Instance pipe (Instance carrier) 	{		NodePair pair = (NodePair)carrier.getData();		Citation s1 = (Citation)pair.getObject1();		Citation s2 = (Citation)pair.getObject2();		String ss1 = s1.getField(Citation.venue);		String ss2 = s2.getField(Citation.venue);		if(!ss1.equals("") && !ss2.equals("")){			double dist = distMetric.score(ss1, ss2);				pair.setFeatureValue( "VenueSimilarity"+getFeatureNameFromScore( dist ), 1.0 );		}		return carrier;	}	private String getFeatureNameFromScore (double dist) {		if (dist >= 0.9)			return "HIGH";		else if (dist > 0.75)			return "MED";		else if (dist > 0.5)			return "WEAK";		else if (dist > 0.3)			return "MIN";		else 			return "NONE";	}}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?