Annotation of embedaddon/pcre/pcre_newline.c, revision 1.1

1.1     ! misho       1: /*************************************************
        !             2: *      Perl-Compatible Regular Expressions       *
        !             3: *************************************************/
        !             4: 
        !             5: /* PCRE is a library of functions to support regular expressions whose syntax
        !             6: and semantics are as close as possible to those of the Perl 5 language.
        !             7: 
        !             8:                        Written by Philip Hazel
        !             9:            Copyright (c) 1997-2009 University of Cambridge
        !            10: 
        !            11: -----------------------------------------------------------------------------
        !            12: Redistribution and use in source and binary forms, with or without
        !            13: modification, are permitted provided that the following conditions are met:
        !            14: 
        !            15:     * Redistributions of source code must retain the above copyright notice,
        !            16:       this list of conditions and the following disclaimer.
        !            17: 
        !            18:     * Redistributions in binary form must reproduce the above copyright
        !            19:       notice, this list of conditions and the following disclaimer in the
        !            20:       documentation and/or other materials provided with the distribution.
        !            21: 
        !            22:     * Neither the name of the University of Cambridge nor the names of its
        !            23:       contributors may be used to endorse or promote products derived from
        !            24:       this software without specific prior written permission.
        !            25: 
        !            26: THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
        !            27: AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
        !            28: IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
        !            29: ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
        !            30: LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
        !            31: CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
        !            32: SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
        !            33: INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
        !            34: CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
        !            35: ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
        !            36: POSSIBILITY OF SUCH DAMAGE.
        !            37: -----------------------------------------------------------------------------
        !            38: */
        !            39: 
        !            40: 
        !            41: /* This module contains internal functions for testing newlines when more than
        !            42: one kind of newline is to be recognized. When a newline is found, its length is
        !            43: returned. In principle, we could implement several newline "types", each
        !            44: referring to a different set of newline characters. At present, PCRE supports
        !            45: only NLTYPE_FIXED, which gets handled without these functions, NLTYPE_ANYCRLF,
        !            46: and NLTYPE_ANY. The full list of Unicode newline characters is taken from
        !            47: http://unicode.org/unicode/reports/tr18/. */
        !            48: 
        !            49: 
        !            50: #ifdef HAVE_CONFIG_H
        !            51: #include "config.h"
        !            52: #endif
        !            53: 
        !            54: #include "pcre_internal.h"
        !            55: 
        !            56: 
        !            57: 
        !            58: /*************************************************
        !            59: *      Check for newline at given position       *
        !            60: *************************************************/
        !            61: 
        !            62: /* It is guaranteed that the initial value of ptr is less than the end of the
        !            63: string that is being processed.
        !            64: 
        !            65: Arguments:
        !            66:   ptr          pointer to possible newline
        !            67:   type         the newline type
        !            68:   endptr       pointer to the end of the string
        !            69:   lenptr       where to return the length
        !            70:   utf8         TRUE if in utf8 mode
        !            71: 
        !            72: Returns:       TRUE or FALSE
        !            73: */
        !            74: 
        !            75: BOOL
        !            76: _pcre_is_newline(USPTR ptr, int type, USPTR endptr, int *lenptr, BOOL utf8)
        !            77: {
        !            78: int c;
        !            79: if (utf8) { GETCHAR(c, ptr); } else c = *ptr;
        !            80: 
        !            81: if (type == NLTYPE_ANYCRLF) switch(c)
        !            82:   {
        !            83:   case 0x000a: *lenptr = 1; return TRUE;             /* LF */
        !            84:   case 0x000d: *lenptr = (ptr < endptr - 1 && ptr[1] == 0x0a)? 2 : 1;
        !            85:                return TRUE;                          /* CR */
        !            86:   default: return FALSE;
        !            87:   }
        !            88: 
        !            89: /* NLTYPE_ANY */
        !            90: 
        !            91: else switch(c)
        !            92:   {
        !            93:   case 0x000a:                                       /* LF */
        !            94:   case 0x000b:                                       /* VT */
        !            95:   case 0x000c: *lenptr = 1; return TRUE;             /* FF */
        !            96:   case 0x000d: *lenptr = (ptr < endptr - 1 && ptr[1] == 0x0a)? 2 : 1;
        !            97:                return TRUE;                          /* CR */
        !            98:   case 0x0085: *lenptr = utf8? 2 : 1; return TRUE;   /* NEL */
        !            99:   case 0x2028:                                       /* LS */
        !           100:   case 0x2029: *lenptr = 3; return TRUE;             /* PS */
        !           101:   default: return FALSE;
        !           102:   }
        !           103: }
        !           104: 
        !           105: 
        !           106: 
        !           107: /*************************************************
        !           108: *     Check for newline at previous position     *
        !           109: *************************************************/
        !           110: 
        !           111: /* It is guaranteed that the initial value of ptr is greater than the start of
        !           112: the string that is being processed.
        !           113: 
        !           114: Arguments:
        !           115:   ptr          pointer to possible newline
        !           116:   type         the newline type
        !           117:   startptr     pointer to the start of the string
        !           118:   lenptr       where to return the length
        !           119:   utf8         TRUE if in utf8 mode
        !           120: 
        !           121: Returns:       TRUE or FALSE
        !           122: */
        !           123: 
        !           124: BOOL
        !           125: _pcre_was_newline(USPTR ptr, int type, USPTR startptr, int *lenptr, BOOL utf8)
        !           126: {
        !           127: int c;
        !           128: ptr--;
        !           129: #ifdef SUPPORT_UTF8
        !           130: if (utf8)
        !           131:   {
        !           132:   BACKCHAR(ptr);
        !           133:   GETCHAR(c, ptr);
        !           134:   }
        !           135: else c = *ptr;
        !           136: #else   /* no UTF-8 support */
        !           137: c = *ptr;
        !           138: #endif  /* SUPPORT_UTF8 */
        !           139: 
        !           140: if (type == NLTYPE_ANYCRLF) switch(c)
        !           141:   {
        !           142:   case 0x000a: *lenptr = (ptr > startptr && ptr[-1] == 0x0d)? 2 : 1;
        !           143:                return TRUE;                         /* LF */
        !           144:   case 0x000d: *lenptr = 1; return TRUE;            /* CR */
        !           145:   default: return FALSE;
        !           146:   }
        !           147: 
        !           148: else switch(c)
        !           149:   {
        !           150:   case 0x000a: *lenptr = (ptr > startptr && ptr[-1] == 0x0d)? 2 : 1;
        !           151:                return TRUE;                         /* LF */
        !           152:   case 0x000b:                                      /* VT */
        !           153:   case 0x000c:                                      /* FF */
        !           154:   case 0x000d: *lenptr = 1; return TRUE;            /* CR */
        !           155:   case 0x0085: *lenptr = utf8? 2 : 1; return TRUE;  /* NEL */
        !           156:   case 0x2028:                                      /* LS */
        !           157:   case 0x2029: *lenptr = 3; return TRUE;            /* PS */
        !           158:   default: return FALSE;
        !           159:   }
        !           160: }
        !           161: 
        !           162: /* End of pcre_newline.c */

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>