Annotation of embedaddon/pcre/pcre_xclass.c, revision 1.1
1.1 ! misho 1: /*************************************************
! 2: * Perl-Compatible Regular Expressions *
! 3: *************************************************/
! 4:
! 5: /* PCRE is a library of functions to support regular expressions whose syntax
! 6: and semantics are as close as possible to those of the Perl 5 language.
! 7:
! 8: Written by Philip Hazel
! 9: Copyright (c) 1997-2010 University of Cambridge
! 10:
! 11: -----------------------------------------------------------------------------
! 12: Redistribution and use in source and binary forms, with or without
! 13: modification, are permitted provided that the following conditions are met:
! 14:
! 15: * Redistributions of source code must retain the above copyright notice,
! 16: this list of conditions and the following disclaimer.
! 17:
! 18: * Redistributions in binary form must reproduce the above copyright
! 19: notice, this list of conditions and the following disclaimer in the
! 20: documentation and/or other materials provided with the distribution.
! 21:
! 22: * Neither the name of the University of Cambridge nor the names of its
! 23: contributors may be used to endorse or promote products derived from
! 24: this software without specific prior written permission.
! 25:
! 26: THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
! 27: AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
! 28: IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
! 29: ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
! 30: LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
! 31: CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
! 32: SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
! 33: INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
! 34: CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
! 35: ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
! 36: POSSIBILITY OF SUCH DAMAGE.
! 37: -----------------------------------------------------------------------------
! 38: */
! 39:
! 40:
! 41: /* This module contains an internal function that is used to match an extended
! 42: class. It is used by both pcre_exec() and pcre_def_exec(). */
! 43:
! 44:
! 45: #ifdef HAVE_CONFIG_H
! 46: #include "config.h"
! 47: #endif
! 48:
! 49: #include "pcre_internal.h"
! 50:
! 51:
! 52: /*************************************************
! 53: * Match character against an XCLASS *
! 54: *************************************************/
! 55:
! 56: /* This function is called to match a character against an extended class that
! 57: might contain values > 255 and/or Unicode properties.
! 58:
! 59: Arguments:
! 60: c the character
! 61: data points to the flag byte of the XCLASS data
! 62:
! 63: Returns: TRUE if character matches, else FALSE
! 64: */
! 65:
! 66: BOOL
! 67: _pcre_xclass(int c, const uschar *data)
! 68: {
! 69: int t;
! 70: BOOL negated = (*data & XCL_NOT) != 0;
! 71:
! 72: /* Character values < 256 are matched against a bitmap, if one is present. If
! 73: not, we still carry on, because there may be ranges that start below 256 in the
! 74: additional data. */
! 75:
! 76: if (c < 256)
! 77: {
! 78: if ((*data & XCL_MAP) != 0 && (data[1 + c/8] & (1 << (c&7))) != 0)
! 79: return !negated; /* char found */
! 80: }
! 81:
! 82: /* First skip the bit map if present. Then match against the list of Unicode
! 83: properties or large chars or ranges that end with a large char. We won't ever
! 84: encounter XCL_PROP or XCL_NOTPROP when UCP support is not compiled. */
! 85:
! 86: if ((*data++ & XCL_MAP) != 0) data += 32;
! 87:
! 88: while ((t = *data++) != XCL_END)
! 89: {
! 90: int x, y;
! 91: if (t == XCL_SINGLE)
! 92: {
! 93: GETCHARINC(x, data);
! 94: if (c == x) return !negated;
! 95: }
! 96: else if (t == XCL_RANGE)
! 97: {
! 98: GETCHARINC(x, data);
! 99: GETCHARINC(y, data);
! 100: if (c >= x && c <= y) return !negated;
! 101: }
! 102:
! 103: #ifdef SUPPORT_UCP
! 104: else /* XCL_PROP & XCL_NOTPROP */
! 105: {
! 106: const ucd_record *prop = GET_UCD(c);
! 107:
! 108: switch(*data)
! 109: {
! 110: case PT_ANY:
! 111: if (t == XCL_PROP) return !negated;
! 112: break;
! 113:
! 114: case PT_LAMP:
! 115: if ((prop->chartype == ucp_Lu || prop->chartype == ucp_Ll ||
! 116: prop->chartype == ucp_Lt) == (t == XCL_PROP)) return !negated;
! 117: break;
! 118:
! 119: case PT_GC:
! 120: if ((data[1] == _pcre_ucp_gentype[prop->chartype]) == (t == XCL_PROP))
! 121: return !negated;
! 122: break;
! 123:
! 124: case PT_PC:
! 125: if ((data[1] == prop->chartype) == (t == XCL_PROP)) return !negated;
! 126: break;
! 127:
! 128: case PT_SC:
! 129: if ((data[1] == prop->script) == (t == XCL_PROP)) return !negated;
! 130: break;
! 131:
! 132: case PT_ALNUM:
! 133: if ((_pcre_ucp_gentype[prop->chartype] == ucp_L ||
! 134: _pcre_ucp_gentype[prop->chartype] == ucp_N) == (t == XCL_PROP))
! 135: return !negated;
! 136: break;
! 137:
! 138: case PT_SPACE: /* Perl space */
! 139: if ((_pcre_ucp_gentype[prop->chartype] == ucp_Z ||
! 140: c == CHAR_HT || c == CHAR_NL || c == CHAR_FF || c == CHAR_CR)
! 141: == (t == XCL_PROP))
! 142: return !negated;
! 143: break;
! 144:
! 145: case PT_PXSPACE: /* POSIX space */
! 146: if ((_pcre_ucp_gentype[prop->chartype] == ucp_Z ||
! 147: c == CHAR_HT || c == CHAR_NL || c == CHAR_VT ||
! 148: c == CHAR_FF || c == CHAR_CR) == (t == XCL_PROP))
! 149: return !negated;
! 150: break;
! 151:
! 152: case PT_WORD:
! 153: if ((_pcre_ucp_gentype[prop->chartype] == ucp_L ||
! 154: _pcre_ucp_gentype[prop->chartype] == ucp_N || c == CHAR_UNDERSCORE)
! 155: == (t == XCL_PROP))
! 156: return !negated;
! 157: break;
! 158:
! 159: /* This should never occur, but compilers may mutter if there is no
! 160: default. */
! 161:
! 162: default:
! 163: return FALSE;
! 164: }
! 165:
! 166: data += 2;
! 167: }
! 168: #endif /* SUPPORT_UCP */
! 169: }
! 170:
! 171: return negated; /* char did not match */
! 172: }
! 173:
! 174: /* End of pcre_xclass.c */
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>