Annotation of embedaddon/pcre/pcre_newline.c, revision 1.1.1.2
1.1 misho 1: /*************************************************
2: * Perl-Compatible Regular Expressions *
3: *************************************************/
4:
5: /* PCRE is a library of functions to support regular expressions whose syntax
6: and semantics are as close as possible to those of the Perl 5 language.
7:
8: Written by Philip Hazel
1.1.1.2 ! misho 9: Copyright (c) 1997-2012 University of Cambridge
1.1 misho 10:
11: -----------------------------------------------------------------------------
12: Redistribution and use in source and binary forms, with or without
13: modification, are permitted provided that the following conditions are met:
14:
15: * Redistributions of source code must retain the above copyright notice,
16: this list of conditions and the following disclaimer.
17:
18: * Redistributions in binary form must reproduce the above copyright
19: notice, this list of conditions and the following disclaimer in the
20: documentation and/or other materials provided with the distribution.
21:
22: * Neither the name of the University of Cambridge nor the names of its
23: contributors may be used to endorse or promote products derived from
24: this software without specific prior written permission.
25:
26: THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
27: AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28: IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
29: ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
30: LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
31: CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
32: SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
33: INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
34: CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
35: ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
36: POSSIBILITY OF SUCH DAMAGE.
37: -----------------------------------------------------------------------------
38: */
39:
40:
41: /* This module contains internal functions for testing newlines when more than
42: one kind of newline is to be recognized. When a newline is found, its length is
43: returned. In principle, we could implement several newline "types", each
44: referring to a different set of newline characters. At present, PCRE supports
45: only NLTYPE_FIXED, which gets handled without these functions, NLTYPE_ANYCRLF,
46: and NLTYPE_ANY. The full list of Unicode newline characters is taken from
47: http://unicode.org/unicode/reports/tr18/. */
48:
49:
50: #ifdef HAVE_CONFIG_H
51: #include "config.h"
52: #endif
53:
54: #include "pcre_internal.h"
55:
56:
57:
58: /*************************************************
59: * Check for newline at given position *
60: *************************************************/
61:
62: /* It is guaranteed that the initial value of ptr is less than the end of the
63: string that is being processed.
64:
65: Arguments:
66: ptr pointer to possible newline
67: type the newline type
68: endptr pointer to the end of the string
69: lenptr where to return the length
1.1.1.2 ! misho 70: utf TRUE if in utf mode
1.1 misho 71:
72: Returns: TRUE or FALSE
73: */
74:
75: BOOL
1.1.1.2 ! misho 76: PRIV(is_newline)(PCRE_PUCHAR ptr, int type, PCRE_PUCHAR endptr, int *lenptr,
! 77: BOOL utf)
1.1 misho 78: {
79: int c;
1.1.1.2 ! misho 80: (void)utf;
! 81: #ifdef SUPPORT_UTF
! 82: if (utf)
! 83: {
! 84: GETCHAR(c, ptr);
! 85: }
! 86: else
! 87: #endif /* SUPPORT_UTF */
! 88: c = *ptr;
1.1 misho 89:
90: if (type == NLTYPE_ANYCRLF) switch(c)
91: {
92: case 0x000a: *lenptr = 1; return TRUE; /* LF */
93: case 0x000d: *lenptr = (ptr < endptr - 1 && ptr[1] == 0x0a)? 2 : 1;
94: return TRUE; /* CR */
95: default: return FALSE;
96: }
97:
98: /* NLTYPE_ANY */
99:
100: else switch(c)
101: {
102: case 0x000a: /* LF */
103: case 0x000b: /* VT */
104: case 0x000c: *lenptr = 1; return TRUE; /* FF */
105: case 0x000d: *lenptr = (ptr < endptr - 1 && ptr[1] == 0x0a)? 2 : 1;
106: return TRUE; /* CR */
1.1.1.2 ! misho 107: #ifdef COMPILE_PCRE8
! 108: case 0x0085: *lenptr = utf? 2 : 1; return TRUE; /* NEL */
1.1 misho 109: case 0x2028: /* LS */
110: case 0x2029: *lenptr = 3; return TRUE; /* PS */
1.1.1.2 ! misho 111: #else
! 112: case 0x0085: /* NEL */
! 113: case 0x2028: /* LS */
! 114: case 0x2029: *lenptr = 1; return TRUE; /* PS */
! 115: #endif /* COMPILE_PCRE8 */
1.1 misho 116: default: return FALSE;
117: }
118: }
119:
120:
121:
122: /*************************************************
123: * Check for newline at previous position *
124: *************************************************/
125:
126: /* It is guaranteed that the initial value of ptr is greater than the start of
127: the string that is being processed.
128:
129: Arguments:
130: ptr pointer to possible newline
131: type the newline type
132: startptr pointer to the start of the string
133: lenptr where to return the length
1.1.1.2 ! misho 134: utf TRUE if in utf mode
1.1 misho 135:
136: Returns: TRUE or FALSE
137: */
138:
139: BOOL
1.1.1.2 ! misho 140: PRIV(was_newline)(PCRE_PUCHAR ptr, int type, PCRE_PUCHAR startptr, int *lenptr,
! 141: BOOL utf)
1.1 misho 142: {
143: int c;
1.1.1.2 ! misho 144: (void)utf;
1.1 misho 145: ptr--;
1.1.1.2 ! misho 146: #ifdef SUPPORT_UTF
! 147: if (utf)
1.1 misho 148: {
149: BACKCHAR(ptr);
150: GETCHAR(c, ptr);
151: }
1.1.1.2 ! misho 152: else
! 153: #endif /* SUPPORT_UTF */
! 154: c = *ptr;
1.1 misho 155:
156: if (type == NLTYPE_ANYCRLF) switch(c)
157: {
158: case 0x000a: *lenptr = (ptr > startptr && ptr[-1] == 0x0d)? 2 : 1;
159: return TRUE; /* LF */
160: case 0x000d: *lenptr = 1; return TRUE; /* CR */
161: default: return FALSE;
162: }
163:
164: else switch(c)
165: {
166: case 0x000a: *lenptr = (ptr > startptr && ptr[-1] == 0x0d)? 2 : 1;
167: return TRUE; /* LF */
168: case 0x000b: /* VT */
169: case 0x000c: /* FF */
170: case 0x000d: *lenptr = 1; return TRUE; /* CR */
1.1.1.2 ! misho 171: #ifdef COMPILE_PCRE8
! 172: case 0x0085: *lenptr = utf? 2 : 1; return TRUE; /* NEL */
1.1 misho 173: case 0x2028: /* LS */
174: case 0x2029: *lenptr = 3; return TRUE; /* PS */
1.1.1.2 ! misho 175: #else
! 176: case 0x0085: /* NEL */
! 177: case 0x2028: /* LS */
! 178: case 0x2029: *lenptr = 1; return TRUE; /* PS */
! 179: #endif /* COMPILE_PCRE8 */
1.1 misho 180: default: return FALSE;
181: }
182: }
183:
184: /* End of pcre_newline.c */
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>