📄 bsd_glob.c
字号:
/* * Copyright (c) 1989, 1993 * The Regents of the University of California. All rights reserved. * * This code is derived from software contributed to Berkeley by * Guido van Rossum. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. Neither the name of the University nor the names of its contributors * may be used to endorse or promote products derived from this software * without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. */#if defined(LIBC_SCCS) && !defined(lint)static char sccsid[] = "@(#)glob.c 8.3 (Berkeley) 10/13/93";#endif /* LIBC_SCCS and not lint *//* * glob(3) -- a superset of the one defined in POSIX 1003.2. * * The [!...] convention to negate a range is supported (SysV, Posix, ksh). * * Optional extra services, controlled by flags not defined by POSIX: * * GLOB_QUOTE: * Escaping convention: \ inhibits any special meaning the following * character might have (except \ at end of string is retained). * GLOB_MAGCHAR: * Set in gl_flags if pattern contained a globbing character. * GLOB_NOMAGIC: * Same as GLOB_NOCHECK, but it will only append pattern if it did * not contain any magic characters. [Used in csh style globbing] * GLOB_ALTDIRFUNC: * Use alternately specified directory access functions. * GLOB_TILDE: * expand ~user/foo to the /home/dir/of/user/foo * GLOB_BRACE: * expand {1,2}{a,b} to 1a 1b 2a 2b * gl_matchc: * Number of matches in the current invocation of glob. * GLOB_ALPHASORT: * sort alphabetically like csh (case doesn't matter) instead of in ASCII * order */#include <EXTERN.h>#include <perl.h>#include <XSUB.h>#include "bsd_glob.h"#ifdef I_PWD# include <pwd.h>#else#ifdef HAS_PASSWD struct passwd *getpwnam(char *); struct passwd *getpwuid(Uid_t);#endif#endif#ifndef MAXPATHLEN# ifdef PATH_MAX# define MAXPATHLEN PATH_MAX# ifdef MACOS_TRADITIONAL# define MAXPATHLEN 255# else# define MAXPATHLEN 1024# endif# endif#endif#define BG_DOLLAR '$'#define BG_DOT '.'#define BG_EOS '\0'#define BG_LBRACKET '['#define BG_NOT '!'#define BG_QUESTION '?'#define BG_QUOTE '\\'#define BG_RANGE '-'#define BG_RBRACKET ']'#ifdef MACOS_TRADITIONAL# define BG_SEP ':'#else# define BG_SEP '/'#endif#ifdef DOSISH#define BG_SEP2 '\\'#endif#define BG_STAR '*'#define BG_TILDE '~'#define BG_UNDERSCORE '_'#define BG_LBRACE '{'#define BG_RBRACE '}'#define BG_SLASH '/'#define BG_COMMA ','#ifndef GLOB_DEBUG#define M_QUOTE 0x8000#define M_PROTECT 0x4000#define M_MASK 0xffff#define M_ASCII 0x00fftypedef U16 Char;#else#define M_QUOTE 0x80#define M_PROTECT 0x40#define M_MASK 0xff#define M_ASCII 0x7ftypedef U8 Char;#endif /* !GLOB_DEBUG */#define CHAR(c) ((Char)((c)&M_ASCII))#define META(c) ((Char)((c)|M_QUOTE))#define M_ALL META('*')#define M_END META(']')#define M_NOT META('!')#define M_ONE META('?')#define M_RNG META('-')#define M_SET META('[')#define ismeta(c) (((c)&M_QUOTE) != 0)static int compare(const void *, const void *);static int ci_compare(const void *, const void *);static void g_Ctoc(const Char *, char *);static int g_lstat(Char *, Stat_t *, glob_t *);static DIR *g_opendir(Char *, glob_t *);static Char *g_strchr(Char *, int);#ifdef notdefstatic Char *g_strcat(Char *, const Char *);#endifstatic int g_stat(Char *, Stat_t *, glob_t *);static int glob0(const Char *, glob_t *);static int glob1(Char *, glob_t *);static int glob2(Char *, Char *, Char *, glob_t *);static int glob3(Char *, Char *, Char *, Char *, glob_t *);static int globextend(const Char *, glob_t *);static const Char * globtilde(const Char *, Char *, glob_t *);static int globexp1(const Char *, glob_t *);static int globexp2(const Char *, const Char *, glob_t *, int *);static int match(Char *, Char *, Char *, int);#ifdef GLOB_DEBUGstatic void qprintf(const char *, Char *);#endif /* GLOB_DEBUG */#ifdef PERL_IMPLICIT_CONTEXTstatic Direntry_t * my_readdir(DIR*);static Direntry_t *my_readdir(DIR *d){ return PerlDir_read(d);}#else#define my_readdir readdir#endifintbsd_glob(const char *pattern, int flags, int (*errfunc)(const char *, int), glob_t *pglob){ const U8 *patnext; int c; Char *bufnext, *bufend, patbuf[MAXPATHLEN+1]; patnext = (U8 *) pattern; if (!(flags & GLOB_APPEND)) { pglob->gl_pathc = 0; pglob->gl_pathv = NULL; if (!(flags & GLOB_DOOFFS)) pglob->gl_offs = 0; } pglob->gl_flags = flags & ~GLOB_MAGCHAR; pglob->gl_errfunc = errfunc; pglob->gl_matchc = 0; bufnext = patbuf; bufend = bufnext + MAXPATHLEN;#ifdef DOSISH /* Nasty hack to treat patterns like "C:*" correctly. In this * case, the * should match any file in the current directory * on the C: drive. However, the glob code does not treat the * colon specially, so it looks for files beginning "C:" in * the current directory. To fix this, change the pattern to * add an explicit "./" at the start (just after the drive * letter and colon - ie change to "C:./*"). */ if (isalpha(pattern[0]) && pattern[1] == ':' && pattern[2] != BG_SEP && pattern[2] != BG_SEP2 && bufend - bufnext > 4) { *bufnext++ = pattern[0]; *bufnext++ = ':'; *bufnext++ = '.'; *bufnext++ = BG_SEP; patnext += 2; }#endif if (flags & GLOB_QUOTE) { /* Protect the quoted characters. */ while (bufnext < bufend && (c = *patnext++) != BG_EOS) if (c == BG_QUOTE) {#ifdef DOSISH /* To avoid backslashitis on Win32, * we only treat \ as a quoting character * if it precedes one of the * metacharacters []-{}~\ */ if ((c = *patnext++) != '[' && c != ']' && c != '-' && c != '{' && c != '}' && c != '~' && c != '\\') {#else if ((c = *patnext++) == BG_EOS) {#endif c = BG_QUOTE; --patnext; } *bufnext++ = c | M_PROTECT; } else *bufnext++ = c; } else while (bufnext < bufend && (c = *patnext++) != BG_EOS) *bufnext++ = c; *bufnext = BG_EOS; if (flags & GLOB_BRACE) return globexp1(patbuf, pglob); else return glob0(patbuf, pglob);}/* * Expand recursively a glob {} pattern. When there is no more expansion * invoke the standard globbing routine to glob the rest of the magic * characters */static int globexp1(const Char *pattern, glob_t *pglob){ const Char* ptr = pattern; int rv; /* Protect a single {}, for find(1), like csh */ if (pattern[0] == BG_LBRACE && pattern[1] == BG_RBRACE && pattern[2] == BG_EOS) return glob0(pattern, pglob); while ((ptr = (const Char *) g_strchr((Char *) ptr, BG_LBRACE)) != NULL) if (!globexp2(ptr, pattern, pglob, &rv)) return rv; return glob0(pattern, pglob);}/* * Recursive brace globbing helper. Tries to expand a single brace. * If it succeeds then it invokes globexp1 with the new pattern. * If it fails then it tries to glob the rest of the pattern and returns. */static int globexp2(const Char *ptr, const Char *pattern, glob_t *pglob, int *rv){ int i; Char *lm, *ls; const Char *pe, *pm, *pl; Char patbuf[MAXPATHLEN + 1]; /* copy part up to the brace */ for (lm = patbuf, pm = pattern; pm != ptr; *lm++ = *pm++) continue; ls = lm; /* Find the balanced brace */ for (i = 0, pe = ++ptr; *pe; pe++) if (*pe == BG_LBRACKET) { /* Ignore everything between [] */ for (pm = pe++; *pe != BG_RBRACKET && *pe != BG_EOS; pe++) continue; if (*pe == BG_EOS) { /* * We could not find a matching BG_RBRACKET. * Ignore and just look for BG_RBRACE */ pe = pm; } } else if (*pe == BG_LBRACE) i++; else if (*pe == BG_RBRACE) { if (i == 0) break; i--; } /* Non matching braces; just glob the pattern */ if (i != 0 || *pe == BG_EOS) { *rv = glob0(patbuf, pglob); return 0; } for (i = 0, pl = pm = ptr; pm <= pe; pm++) switch (*pm) { case BG_LBRACKET: /* Ignore everything between [] */ for (pl = pm++; *pm != BG_RBRACKET && *pm != BG_EOS; pm++) continue; if (*pm == BG_EOS) { /* * We could not find a matching BG_RBRACKET. * Ignore and just look for BG_RBRACE */ pm = pl; } break; case BG_LBRACE: i++; break; case BG_RBRACE: if (i) { i--; break; } /* FALLTHROUGH */ case BG_COMMA: if (i && *pm == BG_COMMA) break; else { /* Append the current string */ for (lm = ls; (pl < pm); *lm++ = *pl++) continue; /* * Append the rest of the pattern after the * closing brace */ for (pl = pe + 1; (*lm++ = *pl++) != BG_EOS;) continue; /* Expand the current pattern */#ifdef GLOB_DEBUG qprintf("globexp2:", patbuf);#endif /* GLOB_DEBUG */ *rv = globexp1(patbuf, pglob); /* move after the comma, to the next string */ pl = pm + 1; } break; default: break; } *rv = 0; return 0;}/* * expand tilde from the passwd file. */static const Char *globtilde(const Char *pattern, Char *patbuf, glob_t *pglob){ struct passwd *pwd; char *h; const Char *p; Char *b; if (*pattern != BG_TILDE || !(pglob->gl_flags & GLOB_TILDE)) return pattern; /* Copy up to the end of the string or / */ for (p = pattern + 1, h = (char *) patbuf; *p && *p != BG_SLASH; *h++ = *p++) continue; *h = BG_EOS; if (((char *) patbuf)[0] == BG_EOS) { /* * handle a plain ~ or ~/ by expanding $HOME * first and then trying the password file */ if ((h = getenv("HOME")) == NULL) {#ifdef HAS_PASSWD if ((pwd = getpwuid(getuid())) == NULL) return pattern; else h = pwd->pw_dir;#else return pattern;#endif } } else { /* * Expand a ~user */#ifdef HAS_PASSWD if ((pwd = getpwnam((char*) patbuf)) == NULL) return pattern; else h = pwd->pw_dir;#else return pattern;#endif } /* Copy the home directory */ for (b = patbuf; *h; *b++ = *h++) continue; /* Append the rest of the pattern */ while ((*b++ = *p++) != BG_EOS) continue; return patbuf;}/* * The main glob() routine: compiles the pattern (optionally processing * quotes), calls glob1() to do the real pattern matching, and finally * sorts the list (unless unsorted operation is requested). Returns 0 * if things went well, nonzero if errors occurred. It is not an error * to find no matches. */static intglob0(const Char *pattern, glob_t *pglob){ const Char *qpat, *qpatnext; int c, err, oldflags, oldpathc; Char *bufnext, patbuf[MAXPATHLEN+1];#ifdef MACOS_TRADITIONAL if ( (*pattern == BG_TILDE) && (pglob->gl_flags & GLOB_TILDE) ) { return(globextend(pattern, pglob)); }#endif qpat = globtilde(pattern, patbuf, pglob); qpatnext = qpat; oldflags = pglob->gl_flags; oldpathc = pglob->gl_pathc; bufnext = patbuf; /* We don't need to check for buffer overflow any more. */ while ((c = *qpatnext++) != BG_EOS) { switch (c) { case BG_LBRACKET: c = *qpatnext; if (c == BG_NOT) ++qpatnext; if (*qpatnext == BG_EOS || g_strchr((Char *) qpatnext+1, BG_RBRACKET) == NULL) { *bufnext++ = BG_LBRACKET; if (c == BG_NOT) --qpatnext; break; }
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -