newlib-cygwin/winsup/cygwin/glob.cc

1021 lines
24 KiB
C++
Raw Normal View History

2000-02-18 03:38:33 +08:00
/*
* Copyright (c) 1989, 1993
* The Regents of the University of California. All rights reserved.
*
* This code is derived from software contributed to Berkeley by
* Guido van Rossum.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 4. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#ifdef __CYGWIN__
#include "winsup.h"
#endif
#if defined(LIBC_SCCS) && !defined(lint)
static char sccsid[] = "@(#)glob.c 8.3 (Berkeley) 10/13/93";
#endif /* LIBC_SCCS and not lint */
#include <sys/cdefs.h>
__FBSDID("$FreeBSD: src/lib/libc/gen/glob.c,v 1.28 2010/05/12 17:44:00 gordon Exp $");
2000-02-18 03:38:33 +08:00
/*
* glob(3) -- a superset of the one defined in POSIX 1003.2.
*
* The [!...] convention to negate a range is supported (SysV, Posix, ksh).
*
* Optional extra services, controlled by flags not defined by POSIX:
*
* GLOB_QUOTE:
* Escaping convention: \ inhibits any special meaning the following
* character might have (except \ at end of string is retained).
* GLOB_MAGCHAR:
* Set in gl_flags if pattern contained a globbing character.
* GLOB_NOMAGIC:
* Same as GLOB_NOCHECK, but it will only append pattern if it did
* not contain any magic characters. [Used in csh style globbing]
* GLOB_ALTDIRFUNC:
* Use alternately specified directory access functions.
* GLOB_TILDE:
* expand ~user/foo to the /home/dir/of/user/foo
* GLOB_BRACE:
* expand {1,2}{a,b} to 1a 1b 2a 2b
 *
* gl_matchc:
* Number of matches in the current invocation of glob.
*/
/*
* Some notes on multibyte character support:
* 1. Patterns with illegal byte sequences match nothing - even if
* GLOB_NOCHECK is specified.
* 2. Illegal byte sequences in filenames are handled by treating them as
* single-byte characters with a value of the first byte of the sequence
* cast to wint_t.
* 3. State-dependent encodings are not currently supported.
*/
#include <sys/param.h>
#include <sys/stat.h>
2000-02-18 03:38:33 +08:00
#include <ctype.h>
2000-02-18 03:38:33 +08:00
#include <dirent.h>
#include <errno.h>
2000-02-18 03:38:33 +08:00
#include <glob.h>
#include <limits.h>
2000-02-18 03:38:33 +08:00
#include <pwd.h>
#include <stdint.h>
#include <stdio.h>
2000-02-18 03:38:33 +08:00
#include <stdlib.h>
#include <string.h>
2000-02-18 03:38:33 +08:00
#include <unistd.h>
#include <wchar.h>
#include "collate.h"
#ifdef __CYGWIN__
#include <wctype.h>
#include "path.h"
#include "fhandler.h"
#include "dtable.h"
#include "cygheap.h"
#include "cygwin/version.h"
Switch to 32/64 datatypes: * Makefile.in (OBSOLETE_FUNCTIONS): Add open acl aclcheck aclfrommode aclfrompbits aclfromtext aclsort acltomode acltopbits acltotext chown facl fchown fgetpos fopen freopen fseeko fsetpos fstat ftello ftruncate getegid geteuid getgid getgrent getgrgid getgrnam getgroups getpwuid getpwuid_r getuid initgroups lchown lseek lstat mknod mmap seekdir setegid seteuid setgid setgroups setregid setreuid setuid stat telldir truncate. (NEW_FUNCTIONS): Add _open64 acl32 aclcheck32 aclfrommode32 aclfrompbits32 aclfromtext32 aclsort32 acltomode32 acltopbits32 acltotext32 chown32 facl32 fchown32 fgetpos64 fopen64 freopen64 fseeko64 fsetpos64 fstat64 ftello64 ftruncate64 getegid32 geteuid32 getgid32 getgrent32 getgrgid32 getgrnam32 getgroups32 getpwuid32 getpwuid_r32 getuid32 initgroups32 lchown32 lseek64 lstat64 mknod32 mmap64 seekdir64 setegid32 seteuid32 setgid32 setgroups32 setregid32 setreuid32 setuid32 stat64 telldir64 truncate64 to substitute the above. * cygserver_shm.h (class client_request_shm): Change uid_t and gid_t members to __uid32_t and __gid32_t. * cygwin.din: Add symbols acl32 aclcheck32 aclfrommode32 aclfrompbits32 aclfromtext32 aclsort32 acltomode32 acltopbits32 acltotext32 facl32 fgetpos64 fopen64 freopen64 fseeko64 fsetpos64 _fstat64 ftello64 _lseek64 mknod32 _open64. * glob.c: Include perprocess.h. (globtilde): Call getpwuid32 and getuid32 instead of getpwuid and getuid. (g_lstat): Check for applications API version to call the appropriate typed gl_lstat function. (g_stat): Ditto for gl_stat. * shm.cc (client_request_shm::client_request_shm): Call geteuid32 and getegid32 instead of geteuid and getegid throughout. * syscalls.cc (_open64): New alias for open. (_lseek64): New alias for lseek64. (_fstat64): New alias for fseek64. (mknod32): New function. (mknod): Calls mknod32 now. * winsup.h: Make function declarations for getuid32, geteuid32, and getpwuid32 accessible for plain C sources. Add declarations for getegid32 and getpwnam. 
* include/cygwin/version.h: Bum API minor number to 78. * include/sys/cygwin.h: Guard C++ specific members of struct per_process against inclusion in plain C sources. * include/sys/mman.h (mman): Add guard to avoid type clash when compiling Cygwin.
2003-03-10 05:51:00 +08:00
#define CCHAR(c) (ignore_case_with_glob ? towlower (CHAR (c)) : CHAR (c))
#define Cchar(c) (ignore_case_with_glob ? towlower (c) : (c))
#endif
/* Size, in Chars, of the fixed-size pattern and path work buffers. */
#undef MAXPATHLEN
#define MAXPATHLEN	8192

/* Literal characters the pattern compiler looks for. */
#define	DOLLAR		'$'
#define	DOT		'.'
#define	COLON		':'
#define	EQUALS		'='
#define	EOS		'\0'
#define	LBRACKET	'['
#define	NOT		'!'
#define	QUESTION	'?'
#define	QUOTE		'\\'
#define	RANGE		'-'
#define	RBRACKET	']'
#define	SEP		'/'
#define	STAR		'*'
#define	TILDE		'~'
#define	UNDERSCORE	'_'
#define	LBRACE		'{'
#define	RBRACE		'}'
#define	SLASH		'/'
#define	COMMA		','

/*
 * A Char carries one character in its low bits (M_CHAR) plus two flag bits:
 * M_QUOTE marks a compiled meta character, M_PROTECT marks a character that
 * was backslash-quoted in the user's pattern.  M_MASK covers character and
 * both flags.
 */
#ifndef DEBUG

#define	M_QUOTE		0x8000000000ULL
#define	M_PROTECT	0x4000000000ULL
#define	M_MASK		0xffffffffffULL
#define	M_CHAR		0x00ffffffffULL

typedef uint_fast64_t Char;

#else

#define	M_QUOTE		0x80
#define	M_PROTECT	0x40
#define	M_MASK		0xff
#define	M_CHAR		0x7f

typedef char Char;

#endif

/* Strip the flag bits, leaving only the character value. */
#define	CHAR(c)		((Char)((c)&M_CHAR))
/* Turn a literal character into its compiled meta form. */
#define	META(c)		((Char)((c)|M_QUOTE))
#define	M_ALL		META('*')
#define	M_END		META(']')
#define	M_NOT		META('!')
#define	M_ONE		META('?')
#define	M_RNG		META('-')
#define	M_SET		META('[')
#define	M_NAMED		META(':')
#define	M_EQUIV		META('=')
/* True if c is a compiled meta character. */
#define	ismeta(c)	(((c)&M_QUOTE) != 0)
/* Forward declarations of the file-local helpers defined below. */
static int	 compare(const void *, const void *);
static int	 g_Ctoc(const Char *, char *, size_t);
static int	 g_lstat(Char *, struct stat *, glob_t *);
static DIR	*g_opendir(Char *, glob_t *);
static const Char *g_strchr(const Char *, wint_t);
#ifdef notdef
static Char	*g_strcat(Char *, const Char *);
#endif
static int	 g_stat(Char *, struct stat *, glob_t *);
static int	 glob0(const Char *, glob_t *, size_t *);
static int	 glob1(Char *, glob_t *, size_t *);
static int	 glob2(Char *, Char *, Char *, Char *, glob_t *, size_t *);
static int	 glob3(Char *, Char *, Char *, Char *, Char *, glob_t *, size_t *);
static int	 globextend(const Char *, glob_t *, size_t *);
static const Char *
		 globtilde(const Char *, Char *, size_t, glob_t *);
static int	 globexp1(const Char *, glob_t *, size_t *);
static int	 globexp2(const Char *, const Char *, glob_t *, int *, size_t *);
static int	 match(Char *, Char *, Char *);
#ifdef DEBUG
static void	 qprintf(const char *, Char *);
#endif
/*
 * Parse a "[:name:]", "[.name.]" or "[=name=]" expression starting at cptr.
 *
 * cptr is passed by reference and is updated:
 *   - not pointing at such an expression: cptr is left untouched and
 *     LBRACKET is returned;
 *   - expression not terminated before EOS: cptr is left on the EOS and
 *     EOS is returned;
 *   - otherwise cptr is left on the closing RBRACKET of the expression and
 *     the delimiter (COLON, DOT or EQUALS) is returned.
 *
 * If classbuf is non-NULL the text between the delimiters is stored there
 * (flag bits stripped, NUL terminated).  If it does not fit in classbufsize
 * elements, cptr is still advanced but LBRACKET is returned.
 */
static inline Char
check_classes_expr(const Char *&cptr, wint_t *classbuf = NULL,
		   size_t classbufsize = 0)
{
	const Char *delim;
	const Char *scan;
	int usable = 1;

	if (*cptr != LBRACKET)
		return LBRACKET;
	if (cptr[1] != COLON && cptr[1] != DOT && cptr[1] != EQUALS)
		return LBRACKET;

	/* Walk forward until "<delim>]" or the end of the pattern. */
	delim = cptr + 1;
	scan = delim;
	do {
		++scan;
	} while (*scan != EOS && (*scan != *delim || scan[1] != RBRACKET));

	if (*scan == EOS) {
		cptr = scan;
		return EOS;
	}

	if (classbuf) {
		const Char *text = delim + 1;
		size_t textlen = scan - text;

		if (textlen >= classbufsize) {
			usable = 0;
		} else {
			size_t n = 0;

			while (n < textlen) {
				classbuf[n] = CHAR(text[n]);
				++n;
			}
			classbuf[n] = '\0';
		}
	}

	/* Leave cptr on the closing RBRACKET of the class expression. */
	cptr = scan + 1;
	return usable ? *delim : LBRACKET;
}
2000-02-18 03:38:33 +08:00
int
glob(const char *__restrict pattern, int flags, int (*errfunc)(const char *, int), glob_t *__restrict pglob)
2000-02-18 03:38:33 +08:00
{
const char *patnext;
size_t limit;
Char *bufnext, *bufend, patbuf[MAXPATHLEN], prot;
mbstate_t mbs;
wint_t wc;
size_t clen;
patnext = pattern;
2000-02-18 03:38:33 +08:00
if (!(flags & GLOB_APPEND)) {
pglob->gl_pathc = 0;
pglob->gl_pathv = NULL;
if (!(flags & GLOB_DOOFFS))
pglob->gl_offs = 0;
}
if (flags & GLOB_LIMIT) {
limit = pglob->gl_matchc;
if (limit == 0)
limit = ARG_MAX;
} else
limit = 0;
2000-02-18 03:38:33 +08:00
pglob->gl_flags = flags & ~GLOB_MAGCHAR;
pglob->gl_errfunc = errfunc;
pglob->gl_matchc = 0;
bufnext = patbuf;
bufend = bufnext + MAXPATHLEN - 1;
if (flags & GLOB_NOESCAPE) {
memset(&mbs, 0, sizeof(mbs));
while (bufend - bufnext >= MB_CUR_MAX) {
clen = mbrtowi(&wc, patnext, MB_LEN_MAX, &mbs);
if (clen == (size_t)-1 || clen == (size_t)-2)
return (GLOB_NOMATCH);
else if (clen == 0)
break;
*bufnext++ = wc;
patnext += clen;
}
} else {
2000-02-18 03:38:33 +08:00
/* Protect the quoted characters. */
memset(&mbs, 0, sizeof(mbs));
while (bufend - bufnext >= MB_CUR_MAX) {
if (*patnext == QUOTE) {
if (*++patnext == EOS) {
*bufnext++ = QUOTE | M_PROTECT;
continue;
2000-02-18 03:38:33 +08:00
}
prot = M_PROTECT;
} else
prot = 0;
clen = mbrtowi(&wc, patnext, MB_LEN_MAX, &mbs);
if (clen == (size_t)-1 || clen == (size_t)-2)
return (GLOB_NOMATCH);
else if (clen == 0)
break;
*bufnext++ = wc | prot;
patnext += clen;
}
2000-02-18 03:38:33 +08:00
}
*bufnext = EOS;
if (flags & GLOB_BRACE)
return globexp1(patbuf, pglob, &limit);
2000-02-18 03:38:33 +08:00
else
return glob0(patbuf, pglob, &limit);
2000-02-18 03:38:33 +08:00
}
/*
* Expand recursively a glob {} pattern. When there is no more expansion
* invoke the standard globbing routine to glob the rest of the magic
* characters
*/
static int
globexp1(const Char *pattern, glob_t *pglob, size_t *limit)
2000-02-18 03:38:33 +08:00
{
const Char* ptr = pattern;
int rv;
/* Protect a single {}, for find(1), like csh */
if (pattern[0] == LBRACE && pattern[1] == RBRACE && pattern[2] == EOS)
return glob0(pattern, pglob, limit);
2000-02-18 03:38:33 +08:00
while ((ptr = g_strchr(ptr, LBRACE)) != NULL)
if (!globexp2(ptr, pattern, pglob, &rv, limit))
2000-02-18 03:38:33 +08:00
return rv;
return glob0(pattern, pglob, limit);
2000-02-18 03:38:33 +08:00
}
/*
* Recursive brace globbing helper. Tries to expand a single brace.
* If it succeeds then it invokes globexp1 with the new pattern.
* If it fails then it tries to glob the rest of the pattern and returns.
*/
static int
globexp2(const Char *ptr, const Char *pattern, glob_t *pglob, int *rv, size_t *limit)
2000-02-18 03:38:33 +08:00
{
int i;
Char *lm, *ls;
const Char *pe, *pm, *pm1, *pl;
Char patbuf[MAXPATHLEN];
2000-02-18 03:38:33 +08:00
/* copy part up to the brace */
for (lm = patbuf, pm = pattern; pm != ptr; *lm++ = *pm++)
continue;
*lm = EOS;
2000-02-18 03:38:33 +08:00
ls = lm;
/* Find the balanced brace */
for (i = 0, pe = ++ptr; *pe; pe++)
if (*pe == LBRACKET) {
/* Ignore everything between [] */
for (pm = pe++; *pe != RBRACKET && *pe != EOS; pe++) {
if (check_classes_expr (pe) == EOS)
break;
}
2000-02-18 03:38:33 +08:00
if (*pe == EOS) {
/*
2000-02-18 03:38:33 +08:00
* We could not find a matching RBRACKET.
* Ignore and just look for RBRACE
*/
pe = pm;
}
}
else if (*pe == LBRACE)
i++;
else if (*pe == RBRACE) {
if (i == 0)
break;
i--;
}
/* Non matching braces; just glob the pattern */
if (i != 0 || *pe == EOS) {
*rv = glob0(patbuf, pglob, limit);
2000-02-18 03:38:33 +08:00
return 0;
}
for (i = 0, pl = pm = ptr; pm <= pe; pm++)
switch (*pm) {
case LBRACKET:
/* Ignore everything between [] */
for (pm1 = pm++; *pm != RBRACKET && *pm != EOS; pm++) {
if (check_classes_expr (pm) == EOS)
break;
}
2000-02-18 03:38:33 +08:00
if (*pm == EOS) {
/*
2000-02-18 03:38:33 +08:00
* We could not find a matching RBRACKET.
* Ignore and just look for RBRACE
*/
pm = pm1;
2000-02-18 03:38:33 +08:00
}
break;
case LBRACE:
i++;
break;
case RBRACE:
if (i) {
i--;
break;
}
fallthrough;
2000-02-18 03:38:33 +08:00
case COMMA:
if (i && *pm == COMMA)
break;
else {
/* Append the current string */
for (lm = ls; (pl < pm); *lm++ = *pl++)
continue;
/*
2000-02-18 03:38:33 +08:00
* Append the rest of the pattern after the
* closing brace
*/
for (pl = pe + 1; (*lm++ = *pl++) != EOS;)
continue;
/* Expand the current pattern */
#ifdef DEBUG
qprintf("globexp2:", patbuf);
#endif
*rv = globexp1(patbuf, pglob, limit);
2000-02-18 03:38:33 +08:00
/* move after the comma, to the next string */
pl = pm + 1;
}
break;
default:
break;
}
*rv = 0;
return 0;
}
/*
 * Expand a leading tilde using $HOME or the passwd database.
 *
 * pattern     compiled pattern, possibly starting with TILDE
 * patbuf      work buffer of patbuf_len Chars receiving the expansion
 * pglob       consulted for GLOB_TILDE
 *
 * Returns pattern unchanged if it does not start with a tilde, GLOB_TILDE
 * is not set, or no home directory can be determined; otherwise returns
 * patbuf holding the home directory followed by the rest of the pattern.
 */
static const Char *
globtilde(const Char *pattern, Char *patbuf, size_t patbuf_len, glob_t *pglob)
{
	struct passwd *pwd;
	char *h;
	const Char *p;
	Char *b, *eb;
	mbstate_t mbs;
	wint_t wc;
	size_t clen;

	if (*pattern != TILDE || !(pglob->gl_flags & GLOB_TILDE))
		return pattern;

	/*
	 * Copy up to the end of the string or /
	 * (patbuf is used as scratch space for the narrow user name here)
	 */
	eb = &patbuf[patbuf_len - 1];
	for (p = pattern + 1, h = (char *) patbuf;
	    h < (char *)eb && *p && *p != SLASH; *h++ = *p++)
		continue;

	*h = EOS;

	if (((char *) patbuf)[0] == EOS) {
		/*
		 * handle a plain ~ or ~/ by expanding $HOME first (iff
		 * we're not running setuid or setgid) and then trying
		 * the password file
		 */
		if (issetugid() != 0 ||
		    (h = getenv("HOME")) == NULL) {
			if (((h = getlogin()) != NULL &&
			     (pwd = getpwnam(h)) != NULL) ||
			    (pwd = getpwuid(getuid())) != NULL)
				h = pwd->pw_dir;
			else
				return pattern;
		}
	}
	else {
		/*
		 * Expand a ~user
		 */
		if ((pwd = getpwnam((char*) patbuf)) == NULL)
			return pattern;
		else
			h = pwd->pw_dir;
	}

	/*
	 * Copy the home directory.  It is a multibyte string, so decode it
	 * the same way glob() decodes the pattern and glob3() decodes file
	 * names.  Copying raw bytes would sign-extend bytes >= 0x80 into the
	 * M_QUOTE/M_PROTECT bits and break the later conversion back to a
	 * path.  Undecodable bytes are taken one at a time, as in glob3().
	 */
	memset(&mbs, 0, sizeof(mbs));
	for (b = patbuf; b < eb && *h; h += clen) {
		clen = mbrtowi(&wc, h, MB_LEN_MAX, &mbs);
		if (clen == (size_t)-1 || clen == (size_t)-2) {
			wc = *h;
			clen = 1;
			memset(&mbs, 0, sizeof(mbs));
		}
		*b++ = wc;
	}

	/* Append the rest of the pattern */
	while (b < eb && (*b++ = *p++) != EOS)
		continue;
	*b = EOS;

	return patbuf;
}
/*
 * Narrow a wint_t string into a char string, one element per element,
 * up to and including the first element that narrows to NUL.
 */
static void
wcitoascii(char *dst, wint_t *src)
{
	for (;;) {
		char narrowed = *src++;

		*dst++ = narrowed;
		if (!narrowed)
			break;
	}
}
2000-02-18 03:38:33 +08:00
/*
* The main glob() routine: compiles the pattern (optionally processing
* quotes), calls glob1() to do the real pattern matching, and finally
* sorts the list (unless unsorted operation is requested). Returns 0
* if things went well, nonzero if errors occurred.
2000-02-18 03:38:33 +08:00
*/
static int
glob0(const Char *pattern, glob_t *pglob, size_t *limit)
2000-02-18 03:38:33 +08:00
{
const Char *qpatnext, *qpatrbsrch;
int err;
size_t oldpathc;
Char *bufnext, c, patbuf[MAXPATHLEN];
2000-02-18 03:38:33 +08:00
qpatnext = globtilde(pattern, patbuf, MAXPATHLEN, pglob);
2000-02-18 03:38:33 +08:00
oldpathc = pglob->gl_pathc;
bufnext = patbuf;
/* We don't need to check for buffer overflow any more. */
while ((c = *qpatnext++) != EOS) {
switch (c) {
case LBRACKET:
c = *qpatnext;
if (c == NOT)
++qpatnext;
for (qpatrbsrch = qpatnext;
*qpatrbsrch != RBRACKET && *qpatrbsrch != EOS;
++qpatrbsrch) {
if (check_classes_expr (qpatrbsrch) == EOS)
break;
}
if (*qpatrbsrch == EOS) {
2000-02-18 03:38:33 +08:00
*bufnext++ = LBRACKET;
if (c == NOT)
--qpatnext;
break;
}
*bufnext++ = M_SET;
if (c == NOT)
*bufnext++ = M_NOT;
c = *qpatnext;
2000-02-18 03:38:33 +08:00
do {
wint_t wclass[64];
Char ctype;
ctype = check_classes_expr(qpatnext, wclass,
64);
if (ctype) {
wctype_t type;
if (ctype == COLON) {
char cclass[64];
/* No worries, char classes are
ASCII-only anyway */
wcitoascii (cclass, wclass);
if ((type = wctype (cclass))) {
*bufnext++ = M_NAMED;
*bufnext++ = CHAR (type);
}
} else if (ctype == EQUALS &&
wclass[0] && !wclass[1]) {
*bufnext++ = M_EQUIV;
*bufnext++ = CHAR (wclass[0]);
}
/* TODO: [. is ignored yet */
qpatnext++;
continue;
}
2000-02-18 03:38:33 +08:00
*bufnext++ = CHAR(c);
if (*qpatnext == RANGE &&
(c = qpatnext[1]) != RBRACKET) {
*bufnext++ = M_RNG;
*bufnext++ = CHAR(c);
qpatnext += 2;
}
} while ((c = *qpatnext++) != RBRACKET);
pglob->gl_flags |= GLOB_MAGCHAR;
*bufnext++ = M_END;
break;
case QUESTION:
pglob->gl_flags |= GLOB_MAGCHAR;
*bufnext++ = M_ONE;
break;
case STAR:
pglob->gl_flags |= GLOB_MAGCHAR;
/* collapse adjacent stars to one,
2000-02-18 03:38:33 +08:00
* to avoid exponential behavior
*/
if (bufnext == patbuf || bufnext[-1] != M_ALL)
*bufnext++ = M_ALL;
break;
default:
*bufnext++ = CHAR(c);
break;
}
}
*bufnext = EOS;
#ifdef DEBUG
qprintf("glob0:", patbuf);
#endif
if ((err = glob1(patbuf, pglob, limit)) != 0)
2000-02-18 03:38:33 +08:00
return(err);
/*
* If there was no match we are going to append the pattern
2000-02-18 03:38:33 +08:00
* if GLOB_NOCHECK was specified or if GLOB_NOMAGIC was specified
* and the pattern did not contain any magic characters
* GLOB_NOMAGIC is there just for compatibility with csh.
*/
if (pglob->gl_pathc == oldpathc) {
if (((pglob->gl_flags & GLOB_NOCHECK) ||
((pglob->gl_flags & GLOB_NOMAGIC) &&
!(pglob->gl_flags & GLOB_MAGCHAR))))
return(globextend(pattern, pglob, limit));
else
return(GLOB_NOMATCH);
}
if (!(pglob->gl_flags & GLOB_NOSORT))
2000-02-18 03:38:33 +08:00
qsort(pglob->gl_pathv + pglob->gl_offs + oldpathc,
pglob->gl_pathc - oldpathc, sizeof(char *), compare);
return(0);
}
/*
 * qsort() comparison callback for the result vector: p and q each point
 * at a char * element; the strings are ordered with strcmp().
 */
static int
compare(const void *p, const void *q)
{
	return(strcmp(*(char * const *)p, *(char * const *)q));
}
/*
 * Start matching a compiled pattern: provides the path work buffer and
 * enters glob2() with an empty path.  Returns 0 without doing anything
 * for an empty pattern, otherwise the result of glob2().
 */
static int
glob1(Char *pattern, glob_t *pglob, size_t *limit)
{
	Char pathbuf[MAXPATHLEN];

	/* A null pathname is invalid -- POSIX 1003.1 sect. 2.4. */
	if (*pattern == EOS)
		return(0);
	return(glob2(pathbuf, pathbuf, pathbuf + MAXPATHLEN - 1,
	    pattern, pglob, limit));
}
/*
 * The functions glob2 and glob3 are mutually recursive; there is one level
 * of recursion for each segment in the pattern that contains one or more
 * meta characters.
 *
 * pathbuf       start of the path built so far
 * pathend       where the next segment is to be written
 * pathend_last  last usable element of the path buffer
 * pattern       remaining compiled pattern
 *
 * Returns 0, GLOB_ABORTED if the path does not fit into the buffer, or
 * the result of globextend()/glob3().
 */
static int
glob2(Char *pathbuf, Char *pathend, Char *pathend_last, Char *pattern,
      glob_t *pglob, size_t *limit)
{
	struct stat sb;
	Char *p, *q;
	int anymeta;

	/*
	 * Loop over pattern segments until end of pattern or until
	 * segment with meta character found.
	 */
	for (anymeta = 0;;) {
		if (*pattern == EOS) {		/* End of pattern? */
			*pathend = EOS;
			/* A path that cannot be lstat'ed is not a match. */
			if (g_lstat(pathbuf, &sb, pglob))
				return(0);

			/*
			 * GLOB_MARK: append a slash to directories and to
			 * symlinks that resolve to directories.
			 */
			if (((pglob->gl_flags & GLOB_MARK) &&
			    pathend[-1] != SEP) && (S_ISDIR(sb.st_mode)
			    || (S_ISLNK(sb.st_mode) &&
			    (g_stat(pathbuf, &sb, pglob) == 0) &&
			    S_ISDIR(sb.st_mode)))) {
				if (pathend + 1 > pathend_last)
					return (GLOB_ABORTED);
				*pathend++ = SEP;
				*pathend = EOS;
			}
			++pglob->gl_matchc;
			return(globextend(pathbuf, pglob, limit));
		}

		/* Find end of next segment, copy tentatively to pathend. */
		q = pathend;
		p = pattern;
		while (*p != EOS && *p != SEP) {
			if (ismeta(*p))
				anymeta = 1;
			if (q + 1 > pathend_last)
				return (GLOB_ABORTED);
			*q++ = *p++;
		}

		if (!anymeta) {		/* No expansion, do next segment. */
			pathend = q;
			pattern = p;
			while (*pattern == SEP) {
				if (pathend + 1 > pathend_last)
					return (GLOB_ABORTED);
				*pathend++ = *pattern++;
			}
		} else			/* Need expansion, recurse. */
			return(glob3(pathbuf, pathend, pathend_last, pattern, p,
			    pglob, limit));
	}
	/* NOTREACHED */
}
/*
 * Expand one pattern segment containing meta characters: read the
 * directory named by pathbuf (up to pathend), and for every entry that
 * matches [pattern, restpattern) continue with glob2() on restpattern.
 *
 * Returns 0, GLOB_ABORTED, or the first non-zero result of glob2().
 */
static int
glob3(Char *pathbuf, Char *pathend, Char *pathend_last,
      Char *pattern, Char *restpattern,
      glob_t *pglob, size_t *limit)
{
	struct dirent *dp;
	DIR *dirp;
	int err;
	char buf[MAXPATHLEN];

	/*
	 * The readdirfunc declaration can't be prototyped, because it is
	 * assigned, below, to two functions which are prototyped in glob.h
	 * and dirent.h as taking pointers to differently typed opaque
	 * structures.
	 * CYGWIN: Needs prototype and subsequently wild casting to avoid
	 * compiler error.
	 */
	struct dirent *(*readdirfunc)(void *);

	if (pathend > pathend_last)
		return (GLOB_ABORTED);
	*pathend = EOS;
	errno = 0;

	if ((dirp = g_opendir(pathbuf, pglob)) == NULL) {
		/* TODO: don't call for ENOENT or ENOTDIR? */
		/*
		 * NOTE(review): GLOB_ERR is only honoured when an errfunc
		 * is installed; confirm whether that is intended.
		 */
		if (pglob->gl_errfunc) {
			if (g_Ctoc(pathbuf, buf, sizeof(buf)))
				return (GLOB_ABORTED);
			if (pglob->gl_errfunc(buf, errno) ||
			    pglob->gl_flags & GLOB_ERR)
				return (GLOB_ABORTED);
		}
		return(0);
	}

	err = 0;

	/* Search directory for matching names. */
	if (pglob->gl_flags & GLOB_ALTDIRFUNC)
		readdirfunc = pglob->gl_readdir;
	else
		readdirfunc = (dirent*(*)(void*)) readdir;
	while ((dp = (*readdirfunc)(dirp))) {
		char *sc;
		Char *dc;
		wint_t wc;
		size_t clen;
		mbstate_t mbs;
		int terminated;

		/* Initial DOT must be matched literally. */
		if (dp->d_name[0] == DOT && *pattern != DOT)
			continue;
		memset(&mbs, 0, sizeof(mbs));
		dc = pathend;
		sc = dp->d_name;
		terminated = 0;
		while (dc < pathend_last) {
			clen = mbrtowi(&wc, sc, MB_LEN_MAX, &mbs);
			if (clen == (size_t)-1 || clen == (size_t)-2) {
				/* Undecodable byte: take it as is. */
				wc = *sc;
				clen = 1;
				memset(&mbs, 0, sizeof(mbs));
			}
			if ((*dc++ = wc) == EOS) {
				terminated = 1;
				break;
			}
			sc += clen;
		}
		/*
		 * A name that did not fit was copied without its EOS.  It
		 * must neither be matched (match() would run off the buffer)
		 * nor reported in truncated form, so skip it.
		 */
		if (!terminated || !match(pathend, pattern, restpattern)) {
			*pathend = EOS;
			continue;
		}
		/* dc is one past the EOS; glob2() continues on the EOS. */
		err = glob2(pathbuf, --dc, pathend_last, restpattern,
		    pglob, limit);
		if (err)
			break;
	}

	if (pglob->gl_flags & GLOB_ALTDIRFUNC)
		(*pglob->gl_closedir)(dirp);
	else
		closedir(dirp);
	return(err);
}
/*
* Extend the gl_pathv member of a glob_t structure to accomodate a new item,
2000-02-18 03:38:33 +08:00
* add the new item, and update gl_pathc.
*
* This assumes the BSD realloc, which only copies the block when its size
* crosses a power-of-two boundary; for v7 realloc, this would cause quadratic
* behavior.
*
* Return 0 if new item added, error code if memory couldn't be allocated.
*
* Invariant of the glob_t structure:
* Either gl_pathc is zero and gl_pathv is NULL; or gl_pathc > 0 and
* gl_pathv points to (gl_offs + gl_pathc + 1) items.
*/
static int
globextend(const Char *path, glob_t *pglob, size_t *limit)
2000-02-18 03:38:33 +08:00
{
char **pathv;
size_t i, newsize, len;
2000-02-18 03:38:33 +08:00
char *copy;
const Char *p;
if (*limit && pglob->gl_pathc > *limit) {
errno = 0;
return (GLOB_NOSPACE);
}
2000-02-18 03:38:33 +08:00
newsize = sizeof(*pathv) * (2 + pglob->gl_pathc + pglob->gl_offs);
pathv = pglob->gl_pathv ?
(char **) realloc((char *)pglob->gl_pathv, newsize) :
(char **) malloc(newsize);
if (pathv == NULL) {
if (pglob->gl_pathv) {
free(pglob->gl_pathv);
pglob->gl_pathv = NULL;
}
2000-02-18 03:38:33 +08:00
return(GLOB_NOSPACE);
}
2000-02-18 03:38:33 +08:00
if (pglob->gl_pathv == NULL && pglob->gl_offs > 0) {
/* first time around -- clear initial gl_offs items */
pathv += pglob->gl_offs;
for (i = pglob->gl_offs + 1; --i > 0; )
2000-02-18 03:38:33 +08:00
*--pathv = NULL;
}
pglob->gl_pathv = pathv;
for (p = path; *p++;)
continue;
len = MB_CUR_MAX * (size_t)(p - path); /* XXX overallocation */
if ((copy = (char *) malloc(len)) != NULL) {
if (g_Ctoc(path, copy, len)) {
free(copy);
return (GLOB_NOSPACE);
}
2000-02-18 03:38:33 +08:00
pathv[pglob->gl_offs + pglob->gl_pathc++] = copy;
}
pathv[pglob->gl_offs + pglob->gl_pathc] = NULL;
return(copy == NULL ? GLOB_NOSPACE : 0);
}
/*
 * pattern matching function for filenames.  Each occurrence of the *
 * pattern causes a recursion level.
 *
 * name    EOS-terminated candidate name
 * pat     start of the compiled pattern segment
 * patend  end (exclusive) of the compiled pattern segment
 *
 * Returns 1 if the whole name matches [pat, patend), 0 otherwise.
 */
static int
match(Char *name, Char *pat, Char *patend)
{
	int ok, negate_range;
	Char c, k;

	while (pat < patend) {
		c = *pat++;
		switch (c & M_MASK) {
		case M_ALL:
			/* A trailing star matches whatever is left. */
			if (pat == patend)
				return(1);
			/* Try the rest of the pattern at every position. */
			do
			    if (match(name, pat, patend))
				    return(1);
			while (*name++ != EOS);
			return(0);
		case M_ONE:
			if (*name++ == EOS)
				return(0);
			break;
		case M_SET:
			ok = 0;
			if ((k = *name++) == EOS)
				return(0);
			if ((negate_range = ((*pat & M_MASK) == M_NOT)) != EOS)
				++pat;
			/*
			 * Walk the set members up to M_END.  M_NAMED and
			 * M_EQUIV are followed by one operand; a member
			 * followed by M_RNG is the low end of a range.
			 */
			while (((c = *pat++) & M_MASK) != M_END)
				if ((c & M_MASK) == M_NAMED) {
					if (iswctype (k, *pat++))
						ok = 1;
				} else if ((c & M_MASK) == M_EQUIV) {
					if (is_unicode_equiv (k, *pat++))
						ok = 1;
				} else if ((*pat & M_MASK) == M_RNG) {
#ifdef __CYGWIN__
					if ((!__get_current_collate_locale ()->lcid) ?
#else
					if (__collate_load_error ?
#endif
					    CCHAR(c) <= CCHAR(k) && CCHAR(k) <= CCHAR(pat[1]) :
					       __wcollate_range_cmp(CCHAR(c), CCHAR(k)) <= 0
					    && __wcollate_range_cmp(CCHAR(k), CCHAR(pat[1])) <= 0
					   )
						ok = 1;
					pat += 2;
				} else if (c == k)
					ok = 1;
			if (ok == negate_range)
				return(0);
			break;
		default:
			if (Cchar(*name++) != Cchar(c))
				return(0);
			break;
		}
	}
	return(*name == EOS);
}
/* Free allocated data belonging to a glob_t structure. */
void
globfree(glob_t *pglob)
2000-02-18 03:38:33 +08:00
{
size_t i;
char **pp;
2000-02-18 03:38:33 +08:00
if (pglob->gl_pathv != NULL) {
pp = pglob->gl_pathv + pglob->gl_offs;
for (i = pglob->gl_pathc; i--; ++pp)
if (*pp)
free(*pp);
free(pglob->gl_pathv);
pglob->gl_pathv = NULL;
2000-02-18 03:38:33 +08:00
}
}
/*
 * Open the directory named by the Char string str; an empty string means
 * ".".  Uses pglob->gl_opendir when GLOB_ALTDIRFUNC is set, opendir()
 * otherwise.  Returns NULL if the name cannot be converted to a multibyte
 * string that fits the local buffer, or if the open itself fails.
 */
static DIR *
g_opendir(Char *str, glob_t *pglob)
{
	char buf[MAXPATHLEN];

	if (!*str)
		strcpy(buf, ".");
	else {
		if (g_Ctoc(str, buf, sizeof(buf)))
			return (NULL);
	}

	if (pglob->gl_flags & GLOB_ALTDIRFUNC)
		return (DIR *) ((*pglob->gl_opendir)((const char *) buf));

	return(opendir(buf));
}
2013-04-23 17:44:36 +08:00
#define CYGWIN_gl_stat(sfptr) ((*pglob->sfptr) (buf, sb))
2000-02-18 03:38:33 +08:00
/*
 * lstat() the path given as a Char string.  Uses pglob->gl_lstat when
 * GLOB_ALTDIRFUNC is set.  Returns -1 with errno set to ENAMETOOLONG if
 * the path cannot be converted into the local buffer.
 */
static int
g_lstat(Char *fn, struct stat *sb, glob_t *pglob)
{
	char buf[MAXPATHLEN];

	if (g_Ctoc(fn, buf, sizeof(buf))) {
		errno = ENAMETOOLONG;
		return (-1);
	}
	if (pglob->gl_flags & GLOB_ALTDIRFUNC)
		return CYGWIN_gl_stat (gl_lstat);
	return(lstat(buf, sb));
}
/*
 * stat() the path given as a Char string.  Uses pglob->gl_stat when
 * GLOB_ALTDIRFUNC is set.  Returns -1 with errno set to ENAMETOOLONG if
 * the path cannot be converted into the local buffer.
 */
static int
g_stat(Char *fn, struct stat *sb, glob_t *pglob)
{
	char buf[MAXPATHLEN];

	if (g_Ctoc(fn, buf, sizeof(buf))) {
		errno = ENAMETOOLONG;
		return (-1);
	}
	if (pglob->gl_flags & GLOB_ALTDIRFUNC)
		return CYGWIN_gl_stat (gl_stat);
	return(stat(buf, sb));
}
/*
 * strchr() for Char strings: returns a pointer to the first element of
 * str equal to ch (the terminating EOS included), or NULL if there is none.
 */
static const Char *
g_strchr(const Char *str, wint_t ch)
{

	do {
		if (*str == ch)
			return (str);
	} while (*str++);
	return (NULL);
}
/*
 * Convert the Char string str into a multibyte string in buf, which holds
 * len bytes.  Returns 0 on success (terminator included) and 1 if a
 * character cannot be converted or fewer than MB_CUR_MAX bytes are left
 * before the terminator has been written.
 *
 * NOTE(review): input is decoded with mbrtowi() elsewhere in this file but
 * encoded with wcrtomb() here; confirm this round-trips where wchar_t is
 * narrower than wint_t.
 */
static int
g_Ctoc(const Char *str, char *buf, size_t len)
{
	mbstate_t mbs;
	size_t clen;

	memset(&mbs, 0, sizeof(mbs));
	while (len >= (size_t) MB_CUR_MAX) {
		clen = wcrtomb(buf, *str, &mbs);
		if (clen == (size_t)-1)
			return (1);
		/* The terminator has just been written: done. */
		if (*str == L'\0')
			return (0);
		str++;
		buf += clen;
		len -= clen;
	}
	return (1);
}
#ifdef DEBUG
static void
qprintf(const char *str, Char *s)
2000-02-18 03:38:33 +08:00
{
Char *p;
2000-02-18 03:38:33 +08:00
(void)printf("%s:\n", str);
for (p = s; *p; p++)
(void)printf("%c", CHAR(*p));
(void)printf("\n");
for (p = s; *p; p++)
(void)printf("%c", *p & M_PROTECT ? '"' : ' ');
(void)printf("\n");
for (p = s; *p; p++)
(void)printf("%c", ismeta(*p) ? '_' : ' ');
(void)printf("\n");
}
#endif