srccgitaghandler.java

来自「spam source codejasen-0.9jASEN - java An」· Java 代码 · 共 167 行

JAVA
167
字号
/*
 * @(#)SrcCgiTagHandler.java	30/10/2004
 *
 * Copyright (c) 2004, 2005  jASEN.org
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   1. Redistributions of source code must retain the above copyright notice,
 *      this list of conditions and the following disclaimer.
 *
 *   2. Redistributions in binary form must reproduce the above copyright
 *      notice, this list of conditions and the following disclaimer in
 *      the documentation and/or other materials provided with the distribution.
 *
 *   3. The names of the authors may not be used to endorse or promote products
 *      derived from this software without specific prior written permission.
 *
 *   4. Any modification or additions to the software must be contributed back
 *      to the project.
 *
 *   5. Any investigation or reverse engineering of source code or binary to
 *      enable emails to bypass the filters, and hence inflict spam and or viruses
 *      onto users who use or do not use jASEN could subject the perpetrator to
 *      criminal and or civil liability.
 *
 * THIS SOFTWARE IS PROVIDED "AS IS" AND ANY EXPRESSED OR IMPLIED WARRANTIES,
 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL JASEN.ORG,
 * OR ANY CONTRIBUTORS TO THIS SOFTWARE BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
 * OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 */
package org.jasen.core.parsers.handlers;

import java.util.regex.Pattern;

import javax.swing.text.AttributeSet;
import javax.swing.text.html.HTML.Attribute;
import javax.swing.text.html.HTML.Tag;

import org.jasen.interfaces.HTMLTagHandler;
import org.jasen.interfaces.HTMLTagHandlerResult;

/**
 * <P>
 *  Flags HTML tags whose remote-source attribute (for example <code>src</code>,
 *  <code>href</code> or <code>background</code>) contains a match for
 *  {@link #CGI_URL_REGEX}. With the default expression that is an
 *  <code>http://</code> or <code>ftp://</code> URL which carries a query
 *  marker (<code>?</code>).
 * </P>
 * @author Jason Polites
 */
public class SrcCgiTagHandler implements HTMLTagHandler
{
    /**
     * Regular expression searched for (unanchored) in every inspected attribute value.
     * The default matches <code>http://</code> or <code>ftp://</code> followed, with no
     * line terminator in between, by a <code>?</code>.
     * <p>
     * Kept as a public, non-final instance field so that existing code which reads or
     * reassigns it keeps working; a reassigned value is honoured on the next call.
     */
    public String CGI_URL_REGEX = "(?:http|ftp):\\/\\/.*\\?";

    // Attributes inspected per tag, in the order in which they are tested.
    private static final Attribute[] SRC_ATTRIBUTES = { Attribute.SRC };
    private static final Attribute[] BODY_ATTRIBUTES = { Attribute.BACKGROUND };
    private static final Attribute[] LINK_ATTRIBUTES = { Attribute.HREF };
    private static final Attribute[] OBJECT_ATTRIBUTES = { Attribute.DATA, Attribute.USEMAP };
    private static final Attribute[] APPLET_ATTRIBUTES = {
        Attribute.CODE, Attribute.ARCHIVE, Attribute.CODEBASE
    };
    private static final Attribute[] NO_ATTRIBUTES = {};

    /**
     * Compiled form of the most recently used {@link #CGI_URL_REGEX} value.
     * Declared volatile so that introducing this cache does not make a handler
     * shared between threads any less safe than compiling on every call was.
     */
    private volatile Pattern cachedPattern;

    /**
     * Creates a handler that uses the default {@link #CGI_URL_REGEX}.
     */
    public SrcCgiTagHandler() {
        super ();
    }

    /**
     * Tests the remote-source attributes of the given tag against {@link #CGI_URL_REGEX}.
     * <p>
     * Inspected attributes: IMG, FRAME, IFRAME, SCRIPT and BGSOUND (src);
     * BODY (background); LINK (href); OBJECT (data, usemap);
     * APPLET (code, archive, codebase). Other URL-bearing attributes such as
     * IMG longdesc/usemap or INS cite are not inspected.
     *
     * @param tag the tag being handled; <code>null</code> yields NOMATCH
     * @param attributes the attributes of the tag; <code>null</code> yields NOMATCH
     * @param result not used by this handler
     * @return MATCH if any inspected attribute value contains a match for the
     *         expression, NOMATCH otherwise
     * @see org.jasen.interfaces.HTMLTagHandler#handleTag(javax.swing.text.html.HTML.Tag, javax.swing.text.AttributeSet, org.jasen.interfaces.HTMLTagHandlerResult)
     */
    public int handleTag(Tag tag, AttributeSet attributes, HTMLTagHandlerResult result) {

        // Nothing to inspect: report "no match" instead of failing with a NullPointerException.
        if (tag == null || attributes == null) {
            return NOMATCH;
        }

        Attribute[] candidates = candidateAttributes(tag);

        // Stop at the first attribute that matches; later ones cannot change the outcome.
        for (int i = 0; i < candidates.length; i++) {
            if (hasCgiRef(stringValue(attributes, candidates[i]))) {
                return MATCH;
            }
        }

        return NOMATCH;
    }

    /**
     * Returns the attributes to inspect for the given tag, or an empty array
     * when the tag is not one this handler looks at.
     */
    private static Attribute[] candidateAttributes(Tag tag) {
        if (tag.equals(Tag.IMG) || tag.equals(Tag.FRAME) || tag.equals(Tag.SCRIPT)) {
            return SRC_ATTRIBUTES;
        }
        if (tag.equals(Tag.BODY)) {
            return BODY_ATTRIBUTES;
        }
        if (tag.equals(Tag.LINK)) {
            return LINK_ATTRIBUTES;
        }
        if (tag.equals(Tag.OBJECT)) {
            return OBJECT_ATTRIBUTES;
        }
        if (tag.equals(Tag.APPLET)) {
            return APPLET_ATTRIBUTES;
        }

        // IFRAME and BGSOUND are recognised by name because HTML.Tag declares
        // no constant for them.
        String name = tag.toString();
        if ("iframe".equalsIgnoreCase(name) || "bgsound".equalsIgnoreCase(name)) {
            return SRC_ATTRIBUTES;
        }

        return NO_ATTRIBUTES;
    }

    /**
     * Reads an attribute as a String. getAttribute is declared to return Object,
     * so a value of any other type is treated as absent rather than being cast
     * blindly (which would raise a ClassCastException).
     */
    private static String stringValue(AttributeSet attributes, Attribute key) {
        Object value = attributes.getAttribute(key);
        return (value instanceof String) ? (String) value : null;
    }

    /**
     * Returns true if the url provided contains a match for {@link #CGI_URL_REGEX}.
     * @param url the attribute value to test; may be null
     * @return true on a match; false if there is none or url is null
     */
    private boolean hasCgiRef(String url) {
        if (url == null) {
            return false;
        }

        return cgiPattern().matcher(url).find();
    }

    /**
     * Returns the compiled {@link #CGI_URL_REGEX}, recompiling only when the
     * field's value differs from the one the cached pattern was built from.
     */
    private Pattern cgiPattern() {
        String regex = CGI_URL_REGEX;
        Pattern pattern = cachedPattern;

        if (pattern == null || !pattern.pattern().equals(regex)) {
            pattern = Pattern.compile(regex);
            cachedPattern = pattern;
        }

        return pattern;
    }

}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?