Annotation of embedaddon/php/ext/pcre/pcrelib/pcre_xclass.c, revision 1.1

1.1     ! misho       1: /*************************************************
        !             2: *      Perl-Compatible Regular Expressions       *
        !             3: *************************************************/
        !             4: 
        !             5: /* PCRE is a library of functions to support regular expressions whose syntax
        !             6: and semantics are as close as possible to those of the Perl 5 language.
        !             7: 
        !             8:                        Written by Philip Hazel
        !             9:            Copyright (c) 1997-2010 University of Cambridge
        !            10: 
        !            11: -----------------------------------------------------------------------------
        !            12: Redistribution and use in source and binary forms, with or without
        !            13: modification, are permitted provided that the following conditions are met:
        !            14: 
        !            15:     * Redistributions of source code must retain the above copyright notice,
        !            16:       this list of conditions and the following disclaimer.
        !            17: 
        !            18:     * Redistributions in binary form must reproduce the above copyright
        !            19:       notice, this list of conditions and the following disclaimer in the
        !            20:       documentation and/or other materials provided with the distribution.
        !            21: 
        !            22:     * Neither the name of the University of Cambridge nor the names of its
        !            23:       contributors may be used to endorse or promote products derived from
        !            24:       this software without specific prior written permission.
        !            25: 
        !            26: THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
        !            27: AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
        !            28: IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
        !            29: ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
        !            30: LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
        !            31: CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
        !            32: SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
        !            33: INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
        !            34: CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
        !            35: ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
        !            36: POSSIBILITY OF SUCH DAMAGE.
        !            37: -----------------------------------------------------------------------------
        !            38: */
        !            39: 
        !            40: 
        !            41: /* This module contains an internal function that is used to match an extended
        !            42: class. It is used by both pcre_exec() and pcre_def_exec(). */
        !            43: 
        !            44: 
        !            45: #include "config.h"
        !            46: 
        !            47: #include "pcre_internal.h"
        !            48: 
        !            49: 
        !            50: /*************************************************
        !            51: *       Match character against an XCLASS        *
        !            52: *************************************************/
        !            53: 
        !            54: /* This function is called to match a character against an extended class that
        !            55: might contain values > 255 and/or Unicode properties.
        !            56: 
        !            57: Arguments:
        !            58:   c           the character
        !            59:   data        points to the flag byte of the XCLASS data
        !            60: 
        !            61: Returns:      TRUE if character matches, else FALSE
        !            62: */
        !            63: 
        !            64: BOOL
        !            65: _pcre_xclass(int c, const uschar *data)
        !            66: {
        !            67: int t;
        !            68: BOOL negated = (*data & XCL_NOT) != 0;
        !            69: 
        !            70: /* Character values < 256 are matched against a bitmap, if one is present. If
        !            71: not, we still carry on, because there may be ranges that start below 256 in the
        !            72: additional data. */
        !            73: 
        !            74: if (c < 256)
        !            75:   {
        !            76:   if ((*data & XCL_MAP) != 0 && (data[1 + c/8] & (1 << (c&7))) != 0)
        !            77:     return !negated;   /* char found */
        !            78:   }
        !            79: 
        !            80: /* First skip the bit map if present. Then match against the list of Unicode
        !            81: properties or large chars or ranges that end with a large char. We won't ever
        !            82: encounter XCL_PROP or XCL_NOTPROP when UCP support is not compiled. */
        !            83: 
        !            84: if ((*data++ & XCL_MAP) != 0) data += 32;
        !            85: 
        !            86: while ((t = *data++) != XCL_END)
        !            87:   {
        !            88:   int x, y;
        !            89:   if (t == XCL_SINGLE)
        !            90:     {
        !            91:     GETCHARINC(x, data);
        !            92:     if (c == x) return !negated;
        !            93:     }
        !            94:   else if (t == XCL_RANGE)
        !            95:     {
        !            96:     GETCHARINC(x, data);
        !            97:     GETCHARINC(y, data);
        !            98:     if (c >= x && c <= y) return !negated;
        !            99:     }
        !           100: 
        !           101: #ifdef SUPPORT_UCP
        !           102:   else  /* XCL_PROP & XCL_NOTPROP */
        !           103:     {
        !           104:     const ucd_record *prop = GET_UCD(c);
        !           105: 
        !           106:     switch(*data)
        !           107:       {
        !           108:       case PT_ANY:
        !           109:       if (t == XCL_PROP) return !negated;
        !           110:       break;
        !           111: 
        !           112:       case PT_LAMP:
        !           113:       if ((prop->chartype == ucp_Lu || prop->chartype == ucp_Ll ||
        !           114:            prop->chartype == ucp_Lt) == (t == XCL_PROP)) return !negated;
        !           115:       break;
        !           116: 
        !           117:       case PT_GC:
        !           118:       if ((data[1] == _pcre_ucp_gentype[prop->chartype]) == (t == XCL_PROP))
        !           119:         return !negated;
        !           120:       break;
        !           121: 
        !           122:       case PT_PC:
        !           123:       if ((data[1] == prop->chartype) == (t == XCL_PROP)) return !negated;
        !           124:       break;
        !           125: 
        !           126:       case PT_SC:
        !           127:       if ((data[1] == prop->script) == (t == XCL_PROP)) return !negated;
        !           128:       break;
        !           129: 
        !           130:       case PT_ALNUM:
        !           131:       if ((_pcre_ucp_gentype[prop->chartype] == ucp_L ||
        !           132:            _pcre_ucp_gentype[prop->chartype] == ucp_N) == (t == XCL_PROP))
        !           133:         return !negated;
        !           134:       break;
        !           135: 
        !           136:       case PT_SPACE:    /* Perl space */
        !           137:       if ((_pcre_ucp_gentype[prop->chartype] == ucp_Z ||
        !           138:            c == CHAR_HT || c == CHAR_NL || c == CHAR_FF || c == CHAR_CR)
        !           139:              == (t == XCL_PROP))
        !           140:         return !negated;
        !           141:       break;
        !           142: 
        !           143:       case PT_PXSPACE:  /* POSIX space */
        !           144:       if ((_pcre_ucp_gentype[prop->chartype] == ucp_Z ||
        !           145:            c == CHAR_HT || c == CHAR_NL || c == CHAR_VT ||
        !           146:            c == CHAR_FF || c == CHAR_CR) == (t == XCL_PROP))
        !           147:         return !negated;
        !           148:       break;
        !           149: 
        !           150:       case PT_WORD:
        !           151:       if ((_pcre_ucp_gentype[prop->chartype] == ucp_L ||
        !           152:            _pcre_ucp_gentype[prop->chartype] == ucp_N || c == CHAR_UNDERSCORE)
        !           153:              == (t == XCL_PROP))
        !           154:         return !negated;
        !           155:       break;
        !           156: 
        !           157:       /* This should never occur, but compilers may mutter if there is no
        !           158:       default. */
        !           159: 
        !           160:       default:
        !           161:       return FALSE;
        !           162:       }
        !           163: 
        !           164:     data += 2;
        !           165:     }
        !           166: #endif  /* SUPPORT_UCP */
        !           167:   }
        !           168: 
        !           169: return negated;   /* char did not match */
        !           170: }
        !           171: 
        !           172: /* End of pcre_xclass.c */

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>