⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 urlutils.cxx

📁 PTypes (C++ Portable Types Library) is a simple alternative to the STL that includes multithreading
💻 CXX
字号:
/* * *  C++ Portable Types Library (PTypes) *  Version 1.7.5   Released 9-Mar-2003 * *  Copyright (c) 2001, 2002, 2003 Hovik Melikyan * *  http://www.melikyan.com/ptypes/ *  http://ptypes.sourceforge.net/ * */#include <stdlib.h>#include <ptypes.h>#include <pinet.h>#include "urlutils.h"USING_PTYPESchar* opt_anonymous_username = "ftp";char* opt_anonymous_password = "unknown@";char* opt_default_urlscheme = "http";static cset schemechars("0-9A-Za-z~-.");static cset unsafechars("~00-~20%:/@?#;\\<>+\"'~7F-~FF");static cset unsafepathchars(unsafechars - '/');static cset unsafeparamchars(unsafechars + '.');static cset pathtermchars("~00#?;");bool isurl(const string& s){    const char* p = pconst(s);    const char* b = p;    while (*p & schemechars)        p++;    return p > b && *p == ':';}static string urlencode(const string& s, const cset& unsafe) {    static const char hexchars[17] = "0123456789ABCDEF";    int numunsafe = 0;    int numsp = 0;    const char* p;    for (p = s; *p != 0; p++)        if (*p == ' ')            numsp++;        else if (*p & unsafe)            numunsafe++;    if (numunsafe == 0 && numsp == 0)        return s;    else {        string ret;        setlength(ret, length(s) + numunsafe * 2);        p = s;        char* d = unique(ret);        for (; *p != 0; p++, d++) {            if (*p == ' ')                *d = '+';            else if (*p & unsafe) {                *d++ = '%';                *d++ = hexchars[*p >> 4];                *d = hexchars[*p & 0x0f];            }            else                *d = *p;        }        return ret;    }}string urlencodepath(const string& path){    return urlencode(path, unsafepathchars);}static int urldefport(const string& scheme) {    if (scheme == "http")        return 80;    else if (scheme == "https")        return 443;    else if (scheme == "ftp")        return 21;    else        return 0;}urlrec::urlrec()    : scheme(), username(), password(), pwdset(false), host(),      port(0), path(), proto(), query(), fragment() {}void urlclear(urlrec& u) {    clear(u.scheme);    clear(u.username);    clear(u.password);    u.pwdset = false;    clear(u.host);    u.port = 0;    clear(u.path);    clear(u.proto);    clear(u.query);    clear(u.fragment);}// urlcreate:// NOTES: if scheme is empty, opt_DefaultUrlScheme is taken; for ftp scheme // leading '/' in the path component is significant; for all other schemes // the leading '/' is ignored.string urlcreate(const urlrec& u) {    string ret;    string s, p;    // scheme    if (isempty(u.scheme))        s = opt_default_urlscheme;    else        s = lowercase(u.scheme);    if (s[length(s) - 1] == ':')        setlength(s, length(s) - 1);    ret = s + "://";    // username and password    if (!isempty(u.username)) {        ret += urlencode(u.username, unsafechars);        if (u.pwdset)            ret += ':' + urlencode(u.password, unsafechars);        ret += '@';    }    // host name and port number    ret += u.host;    if (u.port != 0 && u.port != urldefport(s))        ret += ':' + itostring(u.port);    // path    ret += '/';    p = u.path;    if (!isempty(p) && p[0] == '/') {        if (s == "ftp")            ret += "%2F";        del(p, 0, 1);    }    ret += urlencode(p, unsafepathchars);    // params    if (!isempty(u.proto))        ret += ';' + urlencode(u.proto, unsafeparamchars);    if (!isempty(u.query))        ret += '?' + urlencode(u.query, unsafeparamchars);    if (!isempty(u.fragment))        ret += '#' + urlencode(u.fragment, unsafeparamchars);    return ret;}// urlcrack:// Note: no "friendly" URL's! If the URL is invalid the result is undefined.static int xchartoint(char c) {    if (c >= 'a')        return c - 'a' + 10;    else if (c >= 'A')        return c - 'A' + 10;    else        return c - '0';}static void assignurlstr(string& s, const char* p, const char* end) {    if (p >= end)        clear(s);    else {        setlength(s, end - p);        char* d = unique(s);        for (; p < end; p++, d++) {            if (*p == '+')                *d = ' ';            else if (*p == '%') {                if (++p == end) break;                *d = char(xchartoint(*p) << 4);                if (++p == end) break;                *d |= char(xchartoint(*p));            }            else                *d = *p;        }        setlength(s, d - pconst(s));    }}static void crackpath(const char* p, urlrec& u) {    const char* end = p;    while (!(*end & pathtermchars))  // [#0, '?', '#', ';']        end++;    assignurlstr(u.path, p, end);    // leading '/'    if (u.scheme == "http" || u.scheme == "https")    {        if (isempty(u.path))            u.path = '/';        else if (*pconst(u.path) != '/' && *pconst(u.path) != '~')            ins('/', u.path, 0);    }    // parameters    while (*end != 0)    {        char paramtype = *end;        p = ++end;        while (!(*end & pathtermchars))            end++;        switch(paramtype)        {        case ';':            assignurlstr(u.proto, p, end);            break;        case '?':            assignurlstr(u.query, p, end);            break;        case '#':            assignurlstr(u.fragment, p, end);            break;        }    }}void urlcrack(const string& s, urlrec& u) {    urlclear(u);    const char* t;    const char* p = s;    const char* end = p;    // scheme    while (*end & schemechars)        end++;    if (*end != ':' || *(end + 1) != '/' || *(end + 2) != '/')        return;   // invalid scheme: we don't want to generate errors    assignurlstr(u.scheme, p, end);    u.scheme = lowercase(u.scheme);    end += 3;  // skip '://'    // hostname and possibly username:password    p = end;    while (*end != 0 && *end != '/' && *end != '@')        end++;    // username and possibly password    if (*end == '@') {        t = p;        while (*t != ':' && *t != '@')            t++;        // password        if (*t == ':') {            assignurlstr(u.password, t + 1, end);            u.pwdset = true;        }        // username        assignurlstr(u.username, p, t);        end++;        p = end;        while (*end != 0 && *end != '/')            end++;    }    else if (u.scheme == "ftp") {        u.username = opt_anonymous_username;        u.password = opt_anonymous_password;        u.pwdset = true;    }    // hostname and possibly port number    t = p;    while (*t != 0 && *t != ':' && *t != '/')        t++;    assign(u.host, p, t - p);    // port    if (*t == ':') {        string s;        assign(s, t + 1, end - t - 1);        u.port = atoi(s);    }    // path    if (*end == '/')        end++;    crackpath(end, u);}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -