⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 uri.java

📁 Light in the box 抓取程序。 使用HttpClient
💻 JAVA
📖 第 1 页 / 共 5 页
字号:
        authority.or(server);
        authority.or(reg_name);
    }

    /**
     * BitSet for scheme.
     * <p><blockquote><pre>
     * scheme        = alpha *( alpha | digit | "+" | "-" | "." )
     * </pre></blockquote><p>
     * The set is the union of alpha and digit plus '+', '-' and '.'.
     */
    protected static final BitSet scheme = new BitSet(256);
    // Static initializer for scheme
    static {
        scheme.or(alpha);
        scheme.or(digit);
        scheme.set('+');
        scheme.set('-');
        scheme.set('.');
    }

    /**
     * BitSet for rel_segment.
     * <p><blockquote><pre>
     * rel_segment   = 1*( unreserved | escaped |
     *                     ";" | "@" | "&amp;" | "=" | "+" | "$" | "," )
     * </pre></blockquote><p>
     * The set is the union of unreserved and escaped plus the seven
     * punctuation characters listed in the production.
     */
    protected static final BitSet rel_segment = new BitSet(256);
    // Static initializer for rel_segment
    static {
        rel_segment.or(unreserved);
        rel_segment.or(escaped);
        rel_segment.set(';');
        rel_segment.set('@');
        rel_segment.set('&');
        rel_segment.set('=');
        rel_segment.set('+');
        rel_segment.set('$');
        rel_segment.set(',');
    }

    /**
     * BitSet for rel_path.
     * <p><blockquote><pre>
     * rel_path      = rel_segment [ abs_path ]
     * </pre></blockquote><p>
     * The set is the union of rel_segment and abs_path.
     */
    protected static final BitSet rel_path = new BitSet(256);
    // Static initializer for rel_path
    static {
        rel_path.or(rel_segment);
        rel_path.or(abs_path);
    }

    /**
     * BitSet for net_path.
     * <p><blockquote><pre>
     * net_path      = "//" authority [ abs_path ]
     * </pre></blockquote><p>
     * The set is '/' plus the union of authority and abs_path.
     */
    protected static final BitSet net_path = new BitSet(256);
    // Static initializer for net_path
    static {
        // A single bit covers both slashes of the leading "//".
        net_path.set('/');
        net_path.or(authority);
        net_path.or(abs_path);
    }

    /**
     * BitSet for hier_part.
     * <p><blockquote><pre>
     * hier_part     = ( net_path | abs_path ) [ "?" query ]
     * </pre></blockquote><p>
     * The set is the union of net_path, abs_path and query.
     */
    protected static final BitSet hier_part = new BitSet(256);
    // Static initializer for hier_part
    static {
        hier_part.or(net_path);
        hier_part.or(abs_path);
        // hier_part.set('?'); already included
        hier_part.or(query);
    }

    /**
     * BitSet for relativeURI.
     * <p><blockquote><pre>
     * relativeURI   = ( net_path | abs_path | rel_path ) [ "?" query ]
     * </pre></blockquote><p>
     * The set is the union of net_path, abs_path, rel_path and query.
     */
    protected static final BitSet relativeURI = new BitSet(256);
    // Static initializer for relativeURI
    static {
        relativeURI.or(net_path);
        relativeURI.or(abs_path);
        relativeURI.or(rel_path);
        // relativeURI.set('?'); already included
        relativeURI.or(query);
    }

    /**
     * BitSet for absoluteURI.
     * <p><blockquote><pre>
     * absoluteURI   = scheme ":" ( hier_part | opaque_part )
     * </pre></blockquote><p>
     * The set is ':' plus the union of scheme, hier_part and opaque_part.
     */
    protected static final BitSet absoluteURI = new BitSet(256);
    // Static initializer for absoluteURI
    static {
        absoluteURI.or(scheme);
        absoluteURI.set(':');
        absoluteURI.or(hier_part);
        absoluteURI.or(opaque_part);
    }

    /**
     * BitSet for URI-reference.
     * <p><blockquote><pre>
     * URI-reference = [ absoluteURI | relativeURI ] [ "#" fragment ]
     * </pre></blockquote><p>
     * The set is '#' plus the union of absoluteURI, relativeURI and fragment.
     */
    protected static final BitSet URI_reference = new BitSet(256);
    // Static initializer for URI_reference
    static {
        URI_reference.or(absoluteURI);
        URI_reference.or(relativeURI);
        URI_reference.set('#');
        URI_reference.or(fragment);
    }

    // ---------------------------- Characters disallowed within the URI syntax
    // Excluded US-ASCII Characters are like control, space, delims and unwise

    /**
     * BitSet for control: the code points 0x00 through 0x1F, and 0x7F.
     */
    public static final BitSet control = new BitSet(256);
    // Static initializer for control
    static {
        for (int i = 0; i <= 0x1F; i++) {
            control.set(i);
        }
        control.set(0x7F);
    }

    /**
     * BitSet for space: the single code point 0x20.
     */
    public static final BitSet space = new BitSet(256);
    // Static initializer for space
    static {
        space.set(0x20);
    }

    /**
     * BitSet for delims: '&lt;', '&gt;', '#', '%' and '"'.
     */
    public static final BitSet delims = new BitSet(256);
    // Static initializer for delims
    static {
        delims.set('<');
        delims.set('>');
        delims.set('#');
        delims.set('%');
        delims.set('"');
    }

    /**
     * BitSet for unwise: '{', '}', '|', '\', '^', '[', ']' and '`'.
     */
    public static final BitSet unwise = new BitSet(256);
    // Static initializer for unwise
    static {
        unwise.set('{');
        unwise.set('}');
        unwise.set('|');
        unwise.set('\\');
        unwise.set('^');
        unwise.set('[');
        unwise.set(']');
        unwise.set('`');
    }

    /**
     * Disallowed rel_path before escaping.
     * Computed as uric with every character of rel_path removed.
     */
    public static final BitSet disallowed_rel_path = new BitSet(256);
    // Static initializer for disallowed_rel_path
    static {
        disallowed_rel_path.or(uric);
        disallowed_rel_path.andNot(rel_path);
    }

    /**
     * Disallowed opaque_part before escaping.
     * Computed as uric with every character of opaque_part removed.
     */
    public static final BitSet disallowed_opaque_part = new BitSet(256);
    // Static initializer for disallowed_opaque_part
    static {
        disallowed_opaque_part.or(uric);
        disallowed_opaque_part.andNot(opaque_part);
    }

    // ----------------------- Characters allowed within and for each component

    /**
     * Those characters that are allowed for the authority component.
     * This is the authority set with '%' cleared.
     */
    public static final BitSet allowed_authority = new BitSet(256);
    // Static initializer for allowed_authority
    static {
        allowed_authority.or(authority);
        allowed_authority.clear('%');
    }

    /**
     * Those characters that are allowed for the opaque_part.
     * This is the opaque_part set with '%' cleared.
     */
    public static final BitSet allowed_opaque_part = new BitSet(256);
    // Static initializer for allowed_opaque_part
    static {
        allowed_opaque_part.or(opaque_part);
        allowed_opaque_part.clear('%');
    }

    /**
     * Those characters that are allowed for the reg_name.
     * This is the reg_name set with '%' cleared.
     */
    public static final BitSet allowed_reg_name = new BitSet(256);
    // Static initializer for allowed_reg_name
    static {
        allowed_reg_name.or(reg_name);
        // allowed_reg_name.andNot(percent);
        allowed_reg_name.clear('%');
    }

    /**
     * Those characters that are allowed for the userinfo component.
     * This is the userinfo set with '%' cleared.
     */
    public static final BitSet allowed_userinfo = new BitSet(256);
    // Static initializer for allowed_userinfo
    static {
        allowed_userinfo.or(userinfo);
        // allowed_userinfo.andNot(percent);
        allowed_userinfo.clear('%');
    }

    /**
     * Those characters that are allowed for within the userinfo component.
     * This is the within_userinfo set with '%' cleared.
     */
    public static final BitSet allowed_within_userinfo = new BitSet(256);
    // Static initializer for allowed_within_userinfo
    static {
        allowed_within_userinfo.or(within_userinfo);
        allowed_within_userinfo.clear('%');
    }

    /**
     * Those characters that are allowed for the IPv6reference component.
     * The characters '[', ']' in IPv6reference should be excluded.
     */
    public static final BitSet allowed_IPv6reference = new BitSet(256);
    // Static initializer for allowed_IPv6reference
    static {
        allowed_IPv6reference.or(IPv6reference);
        // allowed_IPv6reference.andNot(unwise);
        allowed_IPv6reference.clear('[');
        allowed_IPv6reference.clear(']');
    }

    /**
     * Those characters that are allowed for the host component.
     * The characters '[', ']' in IPv6reference should be excluded; this is
     * achieved by merging allowed_IPv6reference rather than IPv6reference.
     */
    public static final BitSet allowed_host = new BitSet(256);
    // Static initializer for allowed_host
    static {
        allowed_host.or(hostname);
        allowed_host.or(allowed_IPv6reference);
    }

    /**
     * Those characters that are allowed within the authority component.
     * This is the union of server and reg_name with the characters
     * ';', ':', '@', '?' and '/' cleared.
     */
    public static final BitSet allowed_within_authority = new BitSet(256);
    // Static initializer for allowed_within_authority
    static {
        allowed_within_authority.or(server);
        allowed_within_authority.or(reg_name);
        allowed_within_authority.clear(';');
        allowed_within_authority.clear(':');
        allowed_within_authority.clear('@');
        allowed_within_authority.clear('?');
        allowed_within_authority.clear('/');
    }

    /**
     * Those characters that are allowed for the abs_path.
     * This is the abs_path set with the members of percent removed and
     * '+' cleared.
     */
    public static final BitSet allowed_abs_path = new BitSet(256);
    // Static initializer for allowed_abs_path
    static {
        allowed_abs_path.or(abs_path);
        // allowed_abs_path.set('/');  // already included
        // NOTE(review): 'percent' is declared outside this section; presumably
        // it holds only '%', matching the clear('%') used by the sibling
        // tables - confirm.
        allowed_abs_path.andNot(percent);
        allowed_abs_path.clear('+');
    }

    /**
     * Those characters that are allowed for the rel_path.
     * This is the rel_path set with '%' and '+' cleared.
     */
    public static final BitSet allowed_rel_path = new BitSet(256);
    // Static initializer for allowed_rel_path
    static {
        allowed_rel_path.or(rel_path);
        allowed_rel_path.clear('%');
        allowed_rel_path.clear('+');
    }

    /**
     * Those characters that are allowed within the path.
     * This is the abs_path set with '/', ';', '=' and '?' cleared.
     */
    public static final BitSet allowed_within_path = new BitSet(256);
    // Static initializer for allowed_within_path
    static {
        allowed_within_path.or(abs_path);
        allowed_within_path.clear('/');
        allowed_within_path.clear(';');
        allowed_within_path.clear('=');
        allowed_within_path.clear('?');
    }

    /**
     * Those characters that are allowed for the query component.
     * This is the uric set with '%' cleared.
     */
    public static final BitSet allowed_query = new BitSet(256);
    // Static initializer for allowed_query
    static {
        allowed_query.or(uric);
        allowed_query.clear('%');
    }

    /**
     * Those characters that are allowed within the query component.
     * This is allowed_query with every member of reserved removed.
     */
    public static final BitSet allowed_within_query = new BitSet(256);
    // Static initializer for allowed_within_query
    static {
        allowed_within_query.or(allowed_query);
        allowed_within_query.andNot(reserved); // excluded 'reserved'
    }

    /**
     * Those characters that are allowed for the fragment component.
     * This is the uric set with '%' cleared.
     */
    public static final BitSet allowed_fragment = new BitSet(256);
    // Static initializer for allowed_fragment
    static {
        allowed_fragment.or(uric);
        allowed_fragment.clear('%');
    }

    // ------------------------------------------- Flags for this URI-reference

    // TODO: Figure out what all these variables are for and provide javadoc

    // URI-reference = [ absoluteURI | relativeURI ] [ "#" fragment ]
    // absoluteURI   = scheme ":" ( hier_part | opaque_part )
    protected boolean _is_hier_part;
    protected boolean _is_opaque_part;
    // relativeURI   = ( net_path | abs_path | rel_path ) [ "?" query ]
    // hier_part     = ( net_path | abs_path ) [ "?" query ]
    protected boolean _is_net_path;
    protected boolean _is_abs_path;
    protected boolean _is_rel_path;
    // net_path      = "//" authority [ abs_path ]
    // authority     = server | reg_name
    protected boolean _is_reg_name;
    protected boolean _is_server;  // = _has_server
    // server        = [ [ userinfo "@" ] hostport ]
    // host          = hostname | IPv4address | IPv6reference
    protected boolean _is_hostname;
    protected boolean _is_IPv4address;
    protected boolean _is_IPv6reference;

    // ------------------------------------------ Character and escape encoding

    /**

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -