urlporttaghandler.java
来自「spam source codejasen-0.9jASEN - java An」· Java 代码 · 共 190 行
JAVA
190 行
/*
* @(#)URLPortTagHandler.java 9/11/2004
*
* Copyright (c) 2004, 2005 jASEN.org
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* 1. Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the distribution.
*
* 3. The names of the authors may not be used to endorse or promote products
* derived from this software without specific prior written permission.
*
* 4. Any modification or additions to the software must be contributed back
* to the project.
*
* 5. Any investigation or reverse engineering of source code or binary to
* enable emails to bypass the filters, and hence inflict spam and or viruses
* onto users who use or do not use jASEN could subject the perpetrator to
* criminal and or civil liability.
*
* THIS SOFTWARE IS PROVIDED "AS IS" AND ANY EXPRESSED OR IMPLIED WARRANTIES,
* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
* FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL JASEN.ORG,
* OR ANY CONTRIBUTORS TO THIS SOFTWARE BE LIABLE FOR ANY DIRECT, INDIRECT,
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
* OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
* EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
*/
package org.jasen.core.parsers.handlers;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import javax.swing.text.AttributeSet;
import javax.swing.text.html.HTML.Attribute;
import javax.swing.text.html.HTML.Tag;
import org.jasen.interfaces.HTMLTagHandlerResult;
/**
* <P>
* Looks for tcp port references at the end of url domains.
* </P>
* @author Jason Polites
*/
public class URLPortTagHandler extends SrcCgiTagHandler
{
public String PORT_URL_REGEX = "(?:http|ftp):\\/\\/.*?:(\\d+.*?)";
/**
*
*/
public URLPortTagHandler() {
super ();
}
/*
* (non-Javadoc)
* @see org.jasen.interfaces.HTMLTagHandler#handleTag(javax.swing.text.html.HTML.Tag, javax.swing.text.AttributeSet, org.jasen.interfaces.HTMLTagHandlerResult)
*/
public int handleTag(Tag tag, AttributeSet attributes, HTMLTagHandlerResult result) {
// The following tags can have remote source attributes:
// IMG (src, longdesc, usemap, ismap)
// FRAME (src)
// IFRAME (src)
// BODY (background)
// BGSOUND (src)
// APPLET (codebase, code, archive)
// OBJECT (data, usemap)
// INS (cite)
// SCRIPT (src)
// LINK (href)
// A
// FORM
// TODO Work out how to re-use SrcCgiHandler for this...
String port = null;
String url = null;
if(tag.equals(Tag.IMG)) {
url = (String)attributes.getAttribute(Attribute.SRC);
port = getPortFromUrl(url);
}
else if(tag.equals(Tag.A)) {
url = (String)attributes.getAttribute(Attribute.HREF);
port = getPortFromUrl(url);
}
else if(tag.equals(Tag.FORM)) {
url = (String)attributes.getAttribute(Attribute.ACTION);
port = getPortFromUrl(url);
}
else if(tag.equals(Tag.BODY)) {
url = (String)attributes.getAttribute(Attribute.BACKGROUND);
port = getPortFromUrl(url);
}
else if(tag.equals(Tag.LINK)) {
url = (String)attributes.getAttribute(Attribute.HREF);
port = getPortFromUrl(url);
}
else if(tag.equals(Tag.OBJECT)) {
url = (String)attributes.getAttribute(Attribute.DATA);
port = getPortFromUrl(url);
if(port == null) {
url = (String)attributes.getAttribute(Attribute.USEMAP);
port = getPortFromUrl(url);
}
}
else if(tag.equals(Tag.FRAME)) {
url = (String)attributes.getAttribute(Attribute.SRC);
port = getPortFromUrl(url);
}
else if(tag.equals(Tag.APPLET)) {
url = (String)attributes.getAttribute(Attribute.CODE);
port = getPortFromUrl(url);
if(port == null) {
url = (String)attributes.getAttribute(Attribute.ARCHIVE);
port = getPortFromUrl(url);
}
if(port == null) {
url = (String)attributes.getAttribute(Attribute.CODEBASE);
port = getPortFromUrl(url);
}
}
else if(tag.equals(Tag.SCRIPT)) {
url = (String)attributes.getAttribute(Attribute.SRC);
port = getPortFromUrl(url);
}
else if (tag.toString().equalsIgnoreCase("iframe")) {
url = (String)attributes.getAttribute(Attribute.SRC);
port = getPortFromUrl(url);
}
else if (tag.toString().equalsIgnoreCase("bgsound")) {
url = (String)attributes.getAttribute(Attribute.SRC);
port = getPortFromUrl(url);
}
if(port == null) {
return NOMATCH;
}
else
{
if(result != null && result instanceof URLPortTagHandlerResult) {
((URLPortTagHandlerResult)result).setPort(port);
}
return MATCH;
}
}
/**
* Returns the tcp port appended to the given url as a String, or null if no port reference exists
* @param url
* @return
*/
protected String getPortFromUrl(String url) {
String port = null;
if(url != null) {
Pattern p = Pattern.compile(PORT_URL_REGEX);
Matcher m = p.matcher(url);
if(m.find()) {
port = m.group(1);
}
}
return port;
}
}
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?