Annotation of embedaddon/rsync/lib/wildmatch.c, revision 1.1
1.1 ! misho 1: /*
! 2: ** Do shell-style pattern matching for ?, \, [], and * characters.
! 3: ** It is 8bit clean.
! 4: **
! 5: ** Written by Rich $alz, mirror!rs, Wed Nov 26 19:03:17 EST 1986.
! 6: ** Rich $alz is now <rsalz@bbn.com>.
! 7: **
! 8: ** Modified by Wayne Davison to special-case '/' matching, to make '**'
! 9: ** work differently than '*', and to fix the character-class code.
! 10: */
! 11:
! 12: #include "rsync.h"
! 13:
/* Characters that, when they directly follow '[', invert a character class.
 * NEGATE_CLASS2 is optional: the matcher only tests for it when defined. */
#define NEGATE_CLASS	'!'
#define NEGATE_CLASS2	'^'

/* Result codes used by the matcher.  The two ABORT_* values are negative
 * so they can never be confused with FALSE/TRUE; they are parenthesized so
 * that they expand safely inside any larger expression. */
#define FALSE 0
#define TRUE 1
#define ABORT_ALL (-1)
#define ABORT_TO_STARSTAR (-2)

/* True when the "len" bytes starting at "class" spell exactly the string
 * literal "litmatch".  The length and first-byte checks are cheap filters
 * in front of the strncmp() call.  Every macro argument is parenthesized
 * so that a compound expression (e.g. "cond ? a : b") is cast and compared
 * as a whole. */
#define CC_EQ(class, len, litmatch) ((len) == sizeof (litmatch)-1 \
		    && *(class) == *(litmatch) \
		    && strncmp((char*)(class), (litmatch), (len)) == 0)

/* ISASCII() guards the <ctype.h> classifiers below.  It collapses to a
 * constant 1 when STDC_HEADERS is defined or when isascii is not available
 * as a macro; otherwise it defers to isascii(). */
#if defined STDC_HEADERS || !defined isascii
# define ISASCII(c) 1
#else
# define ISASCII(c) isascii(c)
#endif

/* Fallback for systems without an isblank macro: space or tab. */
#ifdef isblank
# define ISBLANK(c) (ISASCII(c) && isblank(c))
#else
# define ISBLANK(c) ((c) == ' ' || (c) == '\t')
#endif

/* Fallback for systems without an isgraph macro: printable, not space. */
#ifdef isgraph
# define ISGRAPH(c) (ISASCII(c) && isgraph(c))
#else
# define ISGRAPH(c) (ISASCII(c) && isprint(c) && !isspace(c))
#endif

/* Guarded wrappers, one per POSIX-style [:class:] name handled by the
 * matcher. */
#define ISPRINT(c) (ISASCII(c) && isprint(c))
#define ISDIGIT(c) (ISASCII(c) && isdigit(c))
#define ISALNUM(c) (ISASCII(c) && isalnum(c))
#define ISALPHA(c) (ISASCII(c) && isalpha(c))
#define ISCNTRL(c) (ISASCII(c) && iscntrl(c))
#define ISLOWER(c) (ISASCII(c) && islower(c))
#define ISPUNCT(c) (ISASCII(c) && ispunct(c))
#define ISSPACE(c) (ISASCII(c) && isspace(c))
#define ISUPPER(c) (ISASCII(c) && isupper(c))
#define ISXDIGIT(c) (ISASCII(c) && isxdigit(c))

/* Test instrumentation: counts how many times the matcher is entered. */
#ifdef WILD_TEST_ITERATIONS
int wildmatch_iteration_count;
#endif

/* When non-zero, upper-case text characters are lower-cased before being
 * compared with the pattern. */
static int force_lower_case = 0;
! 61:
! 62: /* Match pattern "p" against a virtually-joined string consisting
! 63: * of "text" followed by any strings in the NULL-terminated array "a".
 *
 * Returns TRUE on a full match and FALSE on an ordinary mismatch.
 * ABORT_ALL is returned when the text runs out while pattern remains,
 * when no position after a '*' can match, or when a character class is
 * malformed.  ABORT_TO_STARSTAR is returned when a single '*' would have
 * to advance past a '/'; an enclosing "**" swallows that code and keeps
 * trying further positions. */
! 64: static int dowild(const uchar *p, const uchar *text, const uchar*const *a)
! 65: {
! 66: uchar p_ch;
! 67:
! 68: #ifdef WILD_TEST_ITERATIONS
! 69: wildmatch_iteration_count++;
! 70: #endif
! 71:
/* Each "continue" below advances both p and text by one position. */
! 72: for ( ; (p_ch = *p) != '\0'; text++, p++) {
! 73: int matched, special;
! 74: uchar t_ch, prev_ch;
/* The current text segment is used up: step to the next string in "a".
 * Running out of text entirely is only tolerated when the pattern
 * character is '*'; in that case t_ch stays '\0'. */
! 75: while ((t_ch = *text) == '\0') {
! 76: if (*a == NULL) {
! 77: if (p_ch != '*')
! 78: return ABORT_ALL;
! 79: break;
! 80: }
! 81: text = *a++;
! 82: }
/* Only the text character is case-folded; the pattern is compared as-is. */
! 83: if (force_lower_case && ISUPPER(t_ch))
! 84: t_ch = tolower(t_ch);
! 85: switch (p_ch) {
! 86: case '\\':
! 87: /* Literal match with following character. Note that the test
! 88: * in "default" handles the p[1] == '\0' failure case. */
! 89: p_ch = *++p;
! 90: /* FALLTHROUGH */
! 91: default:
! 92: if (t_ch != p_ch)
! 93: return FALSE;
! 94: continue;
! 95: case '?':
! 96: /* Match anything but '/'. */
! 97: if (t_ch == '/')
! 98: return FALSE;
! 99: continue;
! 100: case '*':
/* Collapse a run of stars.  Two or more ("**") set "special", which
 * allows the wildcard to match across '/' characters. */
! 101: if (*++p == '*') {
! 102: while (*++p == '*') {}
! 103: special = TRUE;
! 104: } else
! 105: special = FALSE;
! 106: if (*p == '\0') {
! 107: /* Trailing "**" matches everything. Trailing "*" matches
! 108: * only if there are no more slash characters. */
! 109: if (!special) {
! 110: do {
! 111: if (strchr((char*)text, '/') != NULL)
! 112: return FALSE;
! 113: } while ((text = *a++) != NULL);
! 114: }
! 115: return TRUE;
! 116: }
/* Try the remainder of the pattern at each successive text position,
 * moving on to the next segment whenever the current one ends. */
! 117: while (1) {
! 118: if (t_ch == '\0') {
! 119: if ((text = *a++) == NULL)
! 120: break;
! 121: t_ch = *text;
! 122: continue;
! 123: }
/* Any non-FALSE result is final for a single '*'.  For "**" every
 * result except ABORT_TO_STARSTAR is final.  After a plain FALSE, a
 * single '*' sitting on a '/' must stop, because it may not cross it. */
! 124: if ((matched = dowild(p, text, a)) != FALSE) {
! 125: if (!special || matched != ABORT_TO_STARSTAR)
! 126: return matched;
! 127: } else if (!special && t_ch == '/')
! 128: return ABORT_TO_STARSTAR;
! 129: t_ch = *++text;
! 130: }
! 131: return ABORT_ALL;
! 132: case '[':
! 133: p_ch = *++p;
! 134: #ifdef NEGATE_CLASS2
! 135: if (p_ch == NEGATE_CLASS2)
! 136: p_ch = NEGATE_CLASS;
! 137: #endif
/* Within this case "special" is reused as the class-negation flag. */
! 138: /* Assign literal TRUE/FALSE because of "matched" comparison. */
! 139: special = p_ch == NEGATE_CLASS? TRUE : FALSE;
! 140: if (special) {
! 141: /* Inverted character class. */
! 142: p_ch = *++p;
! 143: }
/* prev_ch remembers the previous class member so that "x-y" can form a
 * range; 0 means there is no usable range start. */
! 144: prev_ch = 0;
! 145: matched = FALSE;
! 146: do {
/* The pattern ended before the closing ']'. */
! 147: if (!p_ch)
! 148: return ABORT_ALL;
! 149: if (p_ch == '\\') {
! 150: p_ch = *++p;
! 151: if (!p_ch)
! 152: return ABORT_ALL;
! 153: if (t_ch == p_ch)
! 154: matched = TRUE;
/* A '-' forms a range only when it has a start character before it and
 * something other than the closing ']' after it. */
! 155: } else if (p_ch == '-' && prev_ch && p[1] && p[1] != ']') {
! 156: p_ch = *++p;
! 157: if (p_ch == '\\') {
! 158: p_ch = *++p;
! 159: if (!p_ch)
! 160: return ABORT_ALL;
! 161: }
! 162: if (t_ch <= p_ch && t_ch >= prev_ch)
! 163: matched = TRUE;
! 164: p_ch = 0; /* This makes "prev_ch" get set to 0. */
! 165: } else if (p_ch == '[' && p[1] == ':') {
! 166: const uchar *s;
! 167: int i;
/* "s" marks the start of the class name; "p" scans ahead to the next ']'. */
! 168: for (s = p += 2; (p_ch = *p) && p_ch != ']'; p++) {} /*SHARED ITERATOR*/
! 169: if (!p_ch)
! 170: return ABORT_ALL;
/* "i" is the length of the name, excluding the ':' expected just before ']'. */
! 171: i = p - s - 1;
! 172: if (i < 0 || p[-1] != ':') {
! 173: /* Didn't find ":]", so treat like a normal set. */
! 174: p = s - 2;
! 175: p_ch = '[';
! 176: if (t_ch == p_ch)
! 177: matched = TRUE;
! 178: continue;
! 179: }
! 180: if (CC_EQ(s,i, "alnum")) {
! 181: if (ISALNUM(t_ch))
! 182: matched = TRUE;
! 183: } else if (CC_EQ(s,i, "alpha")) {
! 184: if (ISALPHA(t_ch))
! 185: matched = TRUE;
! 186: } else if (CC_EQ(s,i, "blank")) {
! 187: if (ISBLANK(t_ch))
! 188: matched = TRUE;
! 189: } else if (CC_EQ(s,i, "cntrl")) {
! 190: if (ISCNTRL(t_ch))
! 191: matched = TRUE;
! 192: } else if (CC_EQ(s,i, "digit")) {
! 193: if (ISDIGIT(t_ch))
! 194: matched = TRUE;
! 195: } else if (CC_EQ(s,i, "graph")) {
! 196: if (ISGRAPH(t_ch))
! 197: matched = TRUE;
! 198: } else if (CC_EQ(s,i, "lower")) {
! 199: if (ISLOWER(t_ch))
! 200: matched = TRUE;
! 201: } else if (CC_EQ(s,i, "print")) {
! 202: if (ISPRINT(t_ch))
! 203: matched = TRUE;
! 204: } else if (CC_EQ(s,i, "punct")) {
! 205: if (ISPUNCT(t_ch))
! 206: matched = TRUE;
! 207: } else if (CC_EQ(s,i, "space")) {
! 208: if (ISSPACE(t_ch))
! 209: matched = TRUE;
! 210: } else if (CC_EQ(s,i, "upper")) {
! 211: if (ISUPPER(t_ch))
! 212: matched = TRUE;
! 213: } else if (CC_EQ(s,i, "xdigit")) {
! 214: if (ISXDIGIT(t_ch))
! 215: matched = TRUE;
! 216: } else /* malformed [:class:] string */
! 217: return ABORT_ALL;
! 218: p_ch = 0; /* This makes "prev_ch" get set to 0. */
! 219: } else if (t_ch == p_ch)
! 220: matched = TRUE;
/* Record the member just handled, then step to the next one until the
 * closing ']' is reached. */
! 221: } while (prev_ch = p_ch, (p_ch = *++p) != ']');
/* Fail when the membership result equals the negation flag; a class
 * never matches '/', whether negated or not. */
! 222: if (matched == special || t_ch == '/')
! 223: return FALSE;
! 224: continue;
! 225: }
! 226: }
! 227:
/* The pattern is exhausted: succeed only if no text remains in the
 * current segment or in any later one. */
! 228: do {
! 229: if (*text)
! 230: return FALSE;
! 231: } while ((text = *a++) != NULL);
! 232:
! 233: return TRUE;
! 234: }
! 235:
! 236: /* Match literal string "s" against the a virtually-joined string consisting
! 237: * of "text" and any strings in array "a". */
! 238: static int doliteral(const uchar *s, const uchar *text, const uchar*const *a)
! 239: {
! 240: for ( ; *s != '\0'; text++, s++) {
! 241: while (*text == '\0') {
! 242: if ((text = *a++) == NULL)
! 243: return FALSE;
! 244: }
! 245: if (*text != *s)
! 246: return FALSE;
! 247: }
! 248:
! 249: do {
! 250: if (*text)
! 251: return FALSE;
! 252: } while ((text = *a++) != NULL);
! 253:
! 254: return TRUE;
! 255: }
! 256:
! 257: /* Return the last "count" path elements from the concatenated string.
! 258: * We return a string pointer to the start of the string, and update the
! 259: * array pointer-pointer to point to any remaining string elements. */
! 260: static const uchar *trailing_N_elements(const uchar*const **a_ptr, int count)
! 261: {
! 262: const uchar*const *a = *a_ptr;
! 263: const uchar*const *first_a = a;
! 264:
! 265: while (*a)
! 266: a++;
! 267:
! 268: while (a != first_a) {
! 269: const uchar *s = *--a;
! 270: s += strlen((char*)s);
! 271: while (--s >= *a) {
! 272: if (*s == '/' && !--count) {
! 273: *a_ptr = a+1;
! 274: return s+1;
! 275: }
! 276: }
! 277: }
! 278:
! 279: if (count == 1) {
! 280: *a_ptr = a+1;
! 281: return *a;
! 282: }
! 283:
! 284: return NULL;
! 285: }
! 286:
! 287: /* Match the "pattern" against the "text" string. */
! 288: int wildmatch(const char *pattern, const char *text)
! 289: {
! 290: static const uchar *nomore[1]; /* A NULL pointer. */
! 291: #ifdef WILD_TEST_ITERATIONS
! 292: wildmatch_iteration_count = 0;
! 293: #endif
! 294: return dowild((const uchar*)pattern, (const uchar*)text, nomore) == TRUE;
! 295: }
! 296:
! 297: /* Match the "pattern" against the forced-to-lower-case "text" string. */
! 298: int iwildmatch(const char *pattern, const char *text)
! 299: {
! 300: static const uchar *nomore[1]; /* A NULL pointer. */
! 301: int ret;
! 302: #ifdef WILD_TEST_ITERATIONS
! 303: wildmatch_iteration_count = 0;
! 304: #endif
! 305: force_lower_case = 1;
! 306: ret = dowild((const uchar*)pattern, (const uchar*)text, nomore) == TRUE;
! 307: force_lower_case = 0;
! 308: return ret;
! 309: }
! 310:
! 311: /* Match pattern "p" against the a virtually-joined string consisting
! 312: * of all the pointers in array "texts" (which has a NULL pointer at the
! 313: * end). The int "where" can be 0 (normal matching), > 0 (match only
! 314: * the trailing N slash-separated filename components of "texts"), or < 0
! 315: * (match the "pattern" at the start or after any slash in "texts"). */
! 316: int wildmatch_array(const char *pattern, const char*const *texts, int where)
! 317: {
! 318: const uchar *p = (const uchar*)pattern;
! 319: const uchar*const *a = (const uchar*const*)texts;
! 320: const uchar *text;
! 321: int matched;
! 322:
! 323: #ifdef WILD_TEST_ITERATIONS
! 324: wildmatch_iteration_count = 0;
! 325: #endif
! 326:
! 327: if (where > 0)
! 328: text = trailing_N_elements(&a, where);
! 329: else
! 330: text = *a++;
! 331: if (!text)
! 332: return FALSE;
! 333:
! 334: if ((matched = dowild(p, text, a)) != TRUE && where < 0
! 335: && matched != ABORT_ALL) {
! 336: while (1) {
! 337: if (*text == '\0') {
! 338: if ((text = (uchar*)*a++) == NULL)
! 339: return FALSE;
! 340: continue;
! 341: }
! 342: if (*text++ == '/' && (matched = dowild(p, text, a)) != FALSE
! 343: && matched != ABORT_TO_STARSTAR)
! 344: break;
! 345: }
! 346: }
! 347: return matched == TRUE;
! 348: }
! 349:
! 350: /* Match literal string "s" against the a virtually-joined string consisting
! 351: * of all the pointers in array "texts" (which has a NULL pointer at the
! 352: * end). The int "where" can be 0 (normal matching), or > 0 (match
! 353: * only the trailing N slash-separated filename components of "texts"). */
! 354: int litmatch_array(const char *string, const char*const *texts, int where)
! 355: {
! 356: const uchar *s = (const uchar*)string;
! 357: const uchar*const *a = (const uchar* const*)texts;
! 358: const uchar *text;
! 359:
! 360: if (where > 0)
! 361: text = trailing_N_elements(&a, where);
! 362: else
! 363: text = *a++;
! 364: if (!text)
! 365: return FALSE;
! 366:
! 367: return doliteral(s, text, a) == TRUE;
! 368: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>