Annotation of embedaddon/php/ext/mysqlnd/mysqlnd_charset.c, revision 1.1.1.3
1.1 misho 1: /*
2: +----------------------------------------------------------------------+
3: | PHP Version 5 |
4: +----------------------------------------------------------------------+
1.1.1.3 ! misho 5: | Copyright (c) 2006-2013 The PHP Group |
1.1 misho 6: +----------------------------------------------------------------------+
7: | This source file is subject to version 3.01 of the PHP license, |
8: | that is bundled with this package in the file LICENSE, and is |
9: | available through the world-wide-web at the following url: |
10: | http://www.php.net/license/3_01.txt |
11: | If you did not receive a copy of the PHP license and are unable to |
12: | obtain it through the world-wide-web, please send a note to |
13: | license@php.net so we can mail you a copy immediately. |
14: +----------------------------------------------------------------------+
15: | Authors: Georg Richter <georg@mysql.com> |
16: | Andrey Hristov <andrey@mysql.com> |
17: | Ulf Wendel <uwendel@mysql.com> |
18: +----------------------------------------------------------------------+
19: */
20: #include "php.h"
21: #include "php_globals.h"
22: #include "mysqlnd.h"
23: #include "mysqlnd_priv.h"
24: #include "mysqlnd_debug.h"
1.1.1.2 misho 25: #include "mysqlnd_charset.h"
1.1 misho 26:
27: /* {{{ utf8 functions */
28: static unsigned int check_mb_utf8mb3_sequence(const char *start, const char *end)
29: {
30: zend_uchar c;
31:
32: if (start >= end) {
33: return 0;
34: }
35:
36: c = (zend_uchar) start[0];
37:
38: if (c < 0x80) {
39: return 1; /* single byte character */
40: }
41: if (c < 0xC2) {
42: return 0; /* invalid mb character */
43: }
44: if (c < 0xE0) {
45: if (start + 2 > end) {
46: return 0; /* too small */
47: }
48: if (!(((zend_uchar)start[1] ^ 0x80) < 0x40)) {
49: return 0;
50: }
51: return 2;
52: }
53: if (c < 0xF0) {
54: if (start + 3 > end) {
55: return 0; /* too small */
56: }
57: if (!(((zend_uchar)start[1] ^ 0x80) < 0x40 && ((zend_uchar)start[2] ^ 0x80) < 0x40 &&
58: (c >= 0xE1 || (zend_uchar)start[1] >= 0xA0))) {
59: return 0; /* invalid utf8 character */
60: }
61: return 3;
62: }
63: return 0;
64: }
65:
66:
67: static unsigned int check_mb_utf8_sequence(const char *start, const char *end)
68: {
69: zend_uchar c;
70:
71: if (start >= end) {
72: return 0;
73: }
74:
75: c = (zend_uchar) start[0];
76:
77: if (c < 0x80) {
78: return 1; /* single byte character */
79: }
80: if (c < 0xC2) {
81: return 0; /* invalid mb character */
82: }
83: if (c < 0xE0) {
84: if (start + 2 > end) {
85: return 0; /* too small */
86: }
87: if (!(((zend_uchar)start[1] ^ 0x80) < 0x40)) {
88: return 0;
89: }
90: return 2;
91: }
92: if (c < 0xF0) {
93: if (start + 3 > end) {
94: return 0; /* too small */
95: }
96: if (!(((zend_uchar)start[1] ^ 0x80) < 0x40 && ((zend_uchar)start[2] ^ 0x80) < 0x40 &&
97: (c >= 0xE1 || (zend_uchar)start[1] >= 0xA0))) {
98: return 0; /* invalid utf8 character */
99: }
100: return 3;
101: }
102: if (c < 0xF5) {
103: if (start + 4 > end) { /* We need 4 characters */
104: return 0; /* too small */
105: }
106:
107: /*
108: UTF-8 quick four-byte mask:
109: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
110: Encoding allows to encode U+00010000..U+001FFFFF
111:
112: The maximum character defined in the Unicode standard is U+0010FFFF.
113: Higher characters U+00110000..U+001FFFFF are not used.
114:
115: 11110000.10010000.10xxxxxx.10xxxxxx == F0.90.80.80 == U+00010000 (min)
116: 11110100.10001111.10111111.10111111 == F4.8F.BF.BF == U+0010FFFF (max)
117:
118: Valid codes:
119: [F0][90..BF][80..BF][80..BF]
120: [F1][80..BF][80..BF][80..BF]
121: [F2][80..BF][80..BF][80..BF]
122: [F3][80..BF][80..BF][80..BF]
123: [F4][80..8F][80..BF][80..BF]
124: */
125:
126: if (!(((zend_uchar)start[1] ^ 0x80) < 0x40 &&
127: ((zend_uchar)start[2] ^ 0x80) < 0x40 &&
128: ((zend_uchar)start[3] ^ 0x80) < 0x40 &&
129: (c >= 0xf1 || (zend_uchar)start[1] >= 0x90) &&
130: (c <= 0xf3 || (zend_uchar)start[1] <= 0x8F)))
131: {
132: return 0; /* invalid utf8 character */
133: }
134: return 4;
135: }
136: return 0;
137: }
138:
139: static unsigned int check_mb_utf8mb3_valid(const char *start, const char *end)
140: {
141: unsigned int len = check_mb_utf8mb3_sequence(start, end);
142: return (len > 1)? len:0;
143: }
144:
145: static unsigned int check_mb_utf8_valid(const char *start, const char *end)
146: {
147: unsigned int len = check_mb_utf8_sequence(start, end);
148: return (len > 1)? len:0;
149: }
150:
151:
152: static unsigned int mysqlnd_mbcharlen_utf8mb3(unsigned int utf8)
153: {
154: if (utf8 < 0x80) {
155: return 1; /* single byte character */
156: }
157: if (utf8 < 0xC2) {
158: return 0; /* invalid multibyte header */
159: }
160: if (utf8 < 0xE0) {
161: return 2; /* double byte character */
162: }
163: if (utf8 < 0xF0) {
164: return 3; /* triple byte character */
165: }
166: return 0;
167: }
168:
169:
170: static unsigned int mysqlnd_mbcharlen_utf8(unsigned int utf8)
171: {
172: if (utf8 < 0x80) {
173: return 1; /* single byte character */
174: }
175: if (utf8 < 0xC2) {
176: return 0; /* invalid multibyte header */
177: }
178: if (utf8 < 0xE0) {
179: return 2; /* double byte character */
180: }
181: if (utf8 < 0xF0) {
182: return 3; /* triple byte character */
183: }
184: if (utf8 < 0xF8) {
185: return 4; /* four byte character */
186: }
187: return 0;
188: }
189: /* }}} */
190:
191:
192: /* {{{ big5 functions */
193: #define valid_big5head(c) (0xA1 <= (unsigned int)(c) && (unsigned int)(c) <= 0xF9)
194: #define valid_big5tail(c) ((0x40 <= (unsigned int)(c) && (unsigned int)(c) <= 0x7E) || \
195: (0xA1 <= (unsigned int)(c) && (unsigned int)(c) <= 0xFE))
196:
197: #define isbig5code(c,d) (isbig5head(c) && isbig5tail(d))
198:
199: static unsigned int check_mb_big5(const char *start, const char *end)
200: {
201: return (valid_big5head(*(start)) && (end - start) > 1 && valid_big5tail(*(start + 1)) ? 2 : 0);
202: }
203:
204:
205: static unsigned int mysqlnd_mbcharlen_big5(unsigned int big5)
206: {
207: return (valid_big5head(big5)) ? 2 : 1;
208: }
209: /* }}} */
210:
211:
212: /* {{{ cp932 functions */
213: #define valid_cp932head(c) ((0x81 <= (c) && (c) <= 0x9F) || (0xE0 <= (c) && c <= 0xFC))
214: #define valid_cp932tail(c) ((0x40 <= (c) && (c) <= 0x7E) || (0x80 <= (c) && c <= 0xFC))
215:
216:
217: static unsigned int check_mb_cp932(const char *start, const char *end)
218: {
219: return (valid_cp932head((zend_uchar)start[0]) && (end - start > 1) &&
220: valid_cp932tail((zend_uchar)start[1])) ? 2 : 0;
221: }
222:
223:
224: static unsigned int mysqlnd_mbcharlen_cp932(unsigned int cp932)
225: {
226: return (valid_cp932head((zend_uchar)cp932)) ? 2 : 1;
227: }
228: /* }}} */
229:
230:
231: /* {{{ euckr functions */
232: #define valid_euckr(c) ((0xA1 <= (zend_uchar)(c) && (zend_uchar)(c) <= 0xFE))
233:
234: static unsigned int check_mb_euckr(const char *start, const char *end)
235: {
236: if (end - start <= 1) {
237: return 0; /* invalid length */
238: }
239: if (*(zend_uchar *)start < 0x80) {
240: return 0; /* invalid euckr character */
241: }
242: if (valid_euckr(start[1])) {
243: return 2;
244: }
245: return 0;
246: }
247:
248:
249: static unsigned int mysqlnd_mbcharlen_euckr(unsigned int kr)
250: {
251: return (valid_euckr(kr)) ? 2 : 1;
252: }
253: /* }}} */
254:
255:
256: /* {{{ eucjpms functions */
257: #define valid_eucjpms(c) (((c) & 0xFF) >= 0xA1 && ((c) & 0xFF) <= 0xFE)
258: #define valid_eucjpms_kata(c) (((c) & 0xFF) >= 0xA1 && ((c) & 0xFF) <= 0xDF)
259: #define valid_eucjpms_ss2(c) (((c) & 0xFF) == 0x8E)
260: #define valid_eucjpms_ss3(c) (((c) & 0xFF) == 0x8F)
261:
262: static unsigned int check_mb_eucjpms(const char *start, const char *end)
263: {
264: if (*((zend_uchar *)start) < 0x80) {
265: return 0; /* invalid eucjpms character */
266: }
267: if (valid_eucjpms(start[0]) && (end - start) > 1 && valid_eucjpms(start[1])) {
268: return 2;
269: }
270: if (valid_eucjpms_ss2(start[0]) && (end - start) > 1 && valid_eucjpms_kata(start[1])) {
271: return 2;
272: }
273: if (valid_eucjpms_ss3(start[0]) && (end - start) > 2 && valid_eucjpms(start[1]) &&
274: valid_eucjpms(start[2])) {
275: return 2;
276: }
277: return 0;
278: }
279:
280:
281: static unsigned int mysqlnd_mbcharlen_eucjpms(unsigned int jpms)
282: {
283: if (valid_eucjpms(jpms) || valid_eucjpms_ss2(jpms)) {
284: return 2;
285: }
286: if (valid_eucjpms_ss3(jpms)) {
287: return 3;
288: }
289: return 1;
290: }
291: /* }}} */
292:
293:
294: /* {{{ gb2312 functions */
295: #define valid_gb2312_head(c) (0xA1 <= (zend_uchar)(c) && (zend_uchar)(c) <= 0xF7)
296: #define valid_gb2312_tail(c) (0xA1 <= (zend_uchar)(c) && (zend_uchar)(c) <= 0xFE)
297:
298:
299: static unsigned int check_mb_gb2312(const char *start, const char *end)
300: {
301: return (valid_gb2312_head((unsigned int)start[0]) && end - start > 1 &&
302: valid_gb2312_tail((unsigned int)start[1])) ? 2 : 0;
303: }
304:
305:
306: static unsigned int mysqlnd_mbcharlen_gb2312(unsigned int gb)
307: {
308: return (valid_gb2312_head(gb)) ? 2 : 1;
309: }
310: /* }}} */
311:
312:
313: /* {{{ gbk functions */
314: #define valid_gbk_head(c) (0x81<=(zend_uchar)(c) && (zend_uchar)(c)<=0xFE)
315: #define valid_gbk_tail(c) ((0x40<=(zend_uchar)(c) && (zend_uchar)(c)<=0x7E) || (0x80<=(zend_uchar)(c) && (zend_uchar)(c)<=0xFE))
316:
317: static unsigned int check_mb_gbk(const char *start, const char *end)
318: {
319: return (valid_gbk_head(start[0]) && (end) - (start) > 1 && valid_gbk_tail(start[1])) ? 2 : 0;
320: }
321:
322: static unsigned int mysqlnd_mbcharlen_gbk(unsigned int gbk)
323: {
324: return (valid_gbk_head(gbk) ? 2 : 1);
325: }
326: /* }}} */
327:
328:
1.1.1.2 misho 329: /* {{{ sjis functions */
1.1 misho 330: #define valid_sjis_head(c) ((0x81 <= (c) && (c) <= 0x9F) || (0xE0 <= (c) && (c) <= 0xFC))
331: #define valid_sjis_tail(c) ((0x40 <= (c) && (c) <= 0x7E) || (0x80 <= (c) && (c) <= 0xFC))
332:
333:
334: static unsigned int check_mb_sjis(const char *start, const char *end)
335: {
336: return (valid_sjis_head((zend_uchar)start[0]) && (end - start) > 1 && valid_sjis_tail((zend_uchar)start[1])) ? 2 : 0;
337: }
338:
339:
340: static unsigned int mysqlnd_mbcharlen_sjis(unsigned int sjis)
341: {
342: return (valid_sjis_head((zend_uchar)sjis)) ? 2 : 1;
343: }
344: /* }}} */
345:
346:
347: /* {{{ ucs2 functions */
348: static unsigned int check_mb_ucs2(const char *start __attribute((unused)), const char *end __attribute((unused)))
349: {
350: return 2; /* always 2 */
351: }
352:
353: static unsigned int mysqlnd_mbcharlen_ucs2(unsigned int ucs2 __attribute((unused)))
354: {
355: return 2; /* always 2 */
356: }
357: /* }}} */
358:
359:
360: /* {{{ ujis functions */
361: #define valid_ujis(c) ((0xA1 <= ((c)&0xFF) && ((c)&0xFF) <= 0xFE))
362: #define valid_ujis_kata(c) ((0xA1 <= ((c)&0xFF) && ((c)&0xFF) <= 0xDF))
363: #define valid_ujis_ss2(c) (((c)&0xFF) == 0x8E)
364: #define valid_ujis_ss3(c) (((c)&0xFF) == 0x8F)
365:
366: static unsigned int check_mb_ujis(const char *start, const char *end)
367: {
368: if (*(zend_uchar*)start < 0x80) {
369: return 0; /* invalid ujis character */
370: }
371: if (valid_ujis(*(start)) && valid_ujis(*((start)+1))) {
372: return 2;
373: }
374: if (valid_ujis_ss2(*(start)) && valid_ujis_kata(*((start)+1))) {
375: return 2;
376: }
377: if (valid_ujis_ss3(*(start)) && (end-start) > 2 && valid_ujis(*((start)+1)) && valid_ujis(*((start)+2))) {
378: return 3;
379: }
380: return 0;
381: }
382:
383:
384: static unsigned int mysqlnd_mbcharlen_ujis(unsigned int ujis)
385: {
386: return (valid_ujis(ujis)? 2: valid_ujis_ss2(ujis)? 2: valid_ujis_ss3(ujis)? 3: 1);
387: }
388: /* }}} */
389:
390:
391:
392: /* {{{ utf16 functions */
393: #define UTF16_HIGH_HEAD(x) ((((zend_uchar) (x)) & 0xFC) == 0xD8)
394: #define UTF16_LOW_HEAD(x) ((((zend_uchar) (x)) & 0xFC) == 0xDC)
395:
396: static unsigned int check_mb_utf16(const char *start, const char *end)
397: {
398: if (start + 2 > end) {
399: return 0;
400: }
401:
402: if (UTF16_HIGH_HEAD(*start)) {
403: return (start + 4 <= end) && UTF16_LOW_HEAD(start[2]) ? 4 : 0;
404: }
405:
406: if (UTF16_LOW_HEAD(*start)) {
407: return 0;
408: }
409: return 2;
410: }
411:
412:
413: static uint mysqlnd_mbcharlen_utf16(unsigned int utf16)
414: {
415: return UTF16_HIGH_HEAD(utf16) ? 4 : 2;
416: }
417: /* }}} */
418:
419:
420: /* {{{ utf32 functions */
421: static uint
422: check_mb_utf32(const char *start __attribute((unused)), const char *end __attribute((unused)))
423: {
424: return 4;
425: }
426:
427:
428: static uint
429: mysqlnd_mbcharlen_utf32(unsigned int utf32 __attribute((unused)))
430: {
431: return 4;
432: }
433: /* }}} */
434:
435: /*
436: The server compiles sometimes the full utf-8 (the mb4) as utf8m4, and the old as utf8,
437: for BC reasons. Sometimes, utf8mb4 is just utf8 but the old charsets are utf8mb3.
438: Change easily now, with a macro, could be made compilastion dependable.
439: */
440:
441: #define UTF8_MB4 "utf8mb4"
442: #define UTF8_MB3 "utf8"
443:
444: /* {{{ mysqlnd_charsets */
445: const MYSQLND_CHARSET mysqlnd_charsets[] =
446: {
447: { 1, "big5","big5_chinese_ci", 1, 2, "", mysqlnd_mbcharlen_big5, check_mb_big5},
448: { 3, "dec8", "dec8_swedisch_ci", 1, 1, "", NULL, NULL},
449: { 4, "cp850", "cp850_general_ci", 1, 1, "", NULL, NULL},
450: { 6, "hp8", "hp8_english_ci", 1, 1, "", NULL, NULL},
451: { 7, "koi8r", "koi8r_general_ci", 1, 1, "", NULL, NULL},
452: { 8, "latin1", "latin1_swedish_ci", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 453: { 5, "latin1", "latin1_german_ci", 1, 1, "", NULL, NULL}, /* should be after 0x9 because swedish_ci is the default collation */
1.1 misho 454: { 9, "latin2", "latin2_general_ci", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 455: { 2, "latin2", "latin2_czech_cs", 1, 1, "", NULL, NULL}, /* should be after 0x9 because general_ci is the default collation */
1.1 misho 456: { 10, "swe7", "swe7_swedish_ci", 1, 1, "", NULL, NULL},
457: { 11, "ascii", "ascii_general_ci", 1, 1, "", NULL, NULL},
458: { 12, "ujis", "ujis_japanese_ci", 1, 3, "", mysqlnd_mbcharlen_ujis, check_mb_ujis},
459: { 13, "sjis", "sjis_japanese_ci", 1, 2, "", mysqlnd_mbcharlen_sjis, check_mb_sjis},
460: { 16, "hebrew", "hebrew_general_ci", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 461: { 17, "filename", "filename", 1, 5, "", NULL, NULL},
1.1 misho 462: { 18, "tis620", "tis620_thai_ci", 1, 1, "", NULL, NULL},
463: { 19, "euckr", "euckr_korean_ci", 1, 2, "", mysqlnd_mbcharlen_euckr, check_mb_euckr},
1.1.1.3 ! misho 464: { 21, "latin2", "latin2_hungarian_ci", 1, 1, "", NULL, NULL},
! 465: { 27, "latin2", "latin2_croatian_ci", 1, 1, "", NULL, NULL},
1.1 misho 466: { 22, "koi8u", "koi8u_general_ci", 1, 1, "", NULL, NULL},
467: { 24, "gb2312", "gb2312_chinese_ci", 1, 2, "", mysqlnd_mbcharlen_gb2312, check_mb_gb2312},
468: { 25, "greek", "greek_general_ci", 1, 1, "", NULL, NULL},
469: { 26, "cp1250", "cp1250_general_ci", 1, 1, "", NULL, NULL},
470: { 28, "gbk", "gbk_chinese_ci", 1, 2, "", mysqlnd_mbcharlen_gbk, check_mb_gbk},
471: { 30, "latin5", "latin5_turkish_ci", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 472: { 31, "latin1", "latin1_german2_ci", 1, 1, "", NULL, NULL},
! 473: { 15, "latin1", "latin1_danish_ci", 1, 1, "", NULL, NULL},
1.1 misho 474: { 32, "armscii8", "armscii8_general_ci", 1, 1, "", NULL, NULL},
475: { 33, UTF8_MB3, UTF8_MB3"_general_ci", 1, 3, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
476: { 35, "ucs2", "ucs2_general_ci", 2, 2, "UCS-2 Unicode", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
477: { 36, "cp866", "cp866_general_ci", 1, 1, "", NULL, NULL},
478: { 37, "keybcs2", "keybcs2_general_ci", 1, 1, "", NULL, NULL},
479: { 38, "macce", "macce_general_ci", 1, 1, "", NULL, NULL},
480: { 39, "macroman", "macroman_general_ci", 1, 1, "", NULL, NULL},
481: { 40, "cp852", "cp852_general_ci", 1, 1, "", NULL, NULL},
482: { 41, "latin7", "latin7_general_ci", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 483: { 20, "latin7", "latin7_estonian_cs", 1, 1, "", NULL, NULL},
1.1 misho 484: { 57, "cp1256", "cp1256_general_ci", 1, 1, "", NULL, NULL},
485: { 59, "cp1257", "cp1257_general_ci", 1, 1, "", NULL, NULL},
486: { 63, "binary", "binary", 1, 1, "", NULL, NULL},
487: { 97, "eucjpms", "eucjpms_japanese_ci", 1, 3, "", mysqlnd_mbcharlen_eucjpms, check_mb_eucjpms},
488: { 29, "cp1257", "cp1257_lithunian_ci", 1, 1, "", NULL, NULL},
489: { 31, "latin1", "latin1_german2_ci", 1, 1, "", NULL, NULL},
490: { 34, "cp1250", "cp1250_czech_cs", 1, 1, "", NULL, NULL},
491: { 42, "latin7", "latin7_general_cs", 1, 1, "", NULL, NULL},
492: { 43, "macce", "macce_bin", 1, 1, "", NULL, NULL},
493: { 44, "cp1250", "cp1250_croatian_ci", 1, 1, "", NULL, NULL},
1.1.1.2 misho 494: { 45, UTF8_MB4, UTF8_MB4"_general_ci", 1, 4, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
495: { 46, UTF8_MB4, UTF8_MB4"_bin", 1, 4, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
1.1 misho 496: { 47, "latin1", "latin1_bin", 1, 1, "", NULL, NULL},
497: { 48, "latin1", "latin1_general_ci", 1, 1, "", NULL, NULL},
498: { 49, "latin1", "latin1_general_cs", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 499: { 51, "cp1251", "cp1251_general_ci", 1, 1, "", NULL, NULL},
! 500: { 14, "cp1251", "cp1251_bulgarian_ci", 1, 1, "", NULL, NULL},
! 501: { 23, "cp1251", "cp1251_ukrainian_ci", 1, 1, "", NULL, NULL},
1.1 misho 502: { 50, "cp1251", "cp1251_bin", 1, 1, "", NULL, NULL},
503: { 52, "cp1251", "cp1251_general_cs", 1, 1, "", NULL, NULL},
504: { 53, "macroman", "macroman_bin", 1, 1, "", NULL, NULL},
505: { 54, "utf16", "utf16_general_ci", 2, 4, "UTF-16 Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
506: { 55, "utf16", "utf16_bin", 2, 4, "UTF-16 Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
1.1.1.3 ! misho 507: { 56, "utf16le", "utf16le_general_ci", 2, 4, "UTF-16LE Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
1.1 misho 508: { 58, "cp1257", "cp1257_bin", 1, 1, "", NULL, NULL},
509: #ifdef USED_TO_BE_SO_BEFORE_MYSQL_5_5
510: { 60, "armascii8", "armascii8_bin", 1, 1, "", NULL, NULL},
511: #endif
1.1.1.3 ! misho 512: /*55*/{ 60, "utf32", "utf32_general_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 513: /*55*/{ 61, "utf32", "utf32_bin", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 514: { 62, "utf16le", "utf16le_bin", 2, 4, "UTF-16LE Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
1.1 misho 515: { 65, "ascii", "ascii_bin", 1, 1, "", NULL, NULL},
516: { 66, "cp1250", "cp1250_bin", 1, 1, "", NULL, NULL},
517: { 67, "cp1256", "cp1256_bin", 1, 1, "", NULL, NULL},
518: { 68, "cp866", "cp866_bin", 1, 1, "", NULL, NULL},
519: { 69, "dec8", "dec8_bin", 1, 1, "", NULL, NULL},
520: { 70, "greek", "greek_bin", 1, 1, "", NULL, NULL},
521: { 71, "hebew", "hebrew_bin", 1, 1, "", NULL, NULL},
522: { 72, "hp8", "hp8_bin", 1, 1, "", NULL, NULL},
523: { 73, "keybcs2", "keybcs2_bin", 1, 1, "", NULL, NULL},
524: { 74, "koi8r", "koi8r_bin", 1, 1, "", NULL, NULL},
525: { 75, "koi8u", "koi8u_bin", 1, 1, "", NULL, NULL},
526: { 77, "latin2", "latin2_bin", 1, 1, "", NULL, NULL},
527: { 78, "latin5", "latin5_bin", 1, 1, "", NULL, NULL},
528: { 79, "latin7", "latin7_bin", 1, 1, "", NULL, NULL},
529: { 80, "cp850", "cp850_bin", 1, 1, "", NULL, NULL},
530: { 81, "cp852", "cp852_bin", 1, 1, "", NULL, NULL},
531: { 82, "swe7", "swe7_bin", 1, 1, "", NULL, NULL},
532: { 83, UTF8_MB3, UTF8_MB3"_bin", 1, 3, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
533: { 84, "big5", "big5_bin", 1, 2, "", mysqlnd_mbcharlen_big5, check_mb_big5},
534: { 85, "euckr", "euckr_bin", 1, 2, "", mysqlnd_mbcharlen_euckr, check_mb_euckr},
535: { 86, "gb2312", "gb2312_bin", 1, 2, "", mysqlnd_mbcharlen_gb2312, check_mb_gb2312},
536: { 87, "gbk", "gbk_bin", 1, 2, "", mysqlnd_mbcharlen_gbk, check_mb_gbk},
537: { 88, "sjis", "sjis_bin", 1, 2, "", mysqlnd_mbcharlen_sjis, check_mb_sjis},
538: { 89, "tis620", "tis620_bin", 1, 1, "", NULL, NULL},
539: { 90, "ucs2", "ucs2_bin", 2, 2, "UCS-2 Unicode", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
540: { 91, "ujis", "ujis_bin", 1, 3, "", mysqlnd_mbcharlen_ujis, check_mb_ujis},
1.1.1.3 ! misho 541: { 92, "geostd8", "geostd8_general_ci", 1, 1, "", NULL, NULL},
! 542: { 93, "geostd8", "geostd8_bin", 1, 1, "", NULL, NULL},
1.1 misho 543: { 94, "latin1", "latin1_spanish_ci", 1, 1, "", NULL, NULL},
1.1.1.3 ! misho 544: { 95, "cp932", "cp932_japanese_ci", 1, 2, "", mysqlnd_mbcharlen_cp932, check_mb_cp932},
1.1 misho 545: { 96, "cp932", "cp932_bin", 1, 2, "", mysqlnd_mbcharlen_cp932, check_mb_cp932},
1.1.1.3 ! misho 546: { 97, "eucjpms", "eucjpms_japanese_ci", 1, 3, "", mysqlnd_mbcharlen_eucjpms, check_mb_eucjpms},
1.1 misho 547: { 98, "eucjpms", "eucjpms_bin", 1, 3, "", mysqlnd_mbcharlen_eucjpms, check_mb_eucjpms},
1.1.1.3 ! misho 548: { 99, "cp1250", "cp1250_polish_ci", 1, 1, "", NULL, NULL},
1.1 misho 549: { 128, "ucs2", "ucs2_unicode_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
550: { 129, "ucs2", "ucs2_icelandic_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
551: { 130, "ucs2", "ucs2_latvian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
552: { 131, "ucs2", "ucs2_romanian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
553: { 132, "ucs2", "ucs2_slovenian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
554: { 133, "ucs2", "ucs2_polish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
555: { 134, "ucs2", "ucs2_estonian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
556: { 135, "ucs2", "ucs2_spanish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
557: { 136, "ucs2", "ucs2_swedish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
558: { 137, "ucs2", "ucs2_turkish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
559: { 138, "ucs2", "ucs2_czech_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
560: { 139, "ucs2", "ucs2_danish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
561: { 140, "ucs2", "ucs2_lithunian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
562: { 141, "ucs2", "ucs2_slovak_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
563: { 142, "ucs2", "ucs2_spanish2_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
564: { 143, "ucs2", "ucs2_roman_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
565: { 144, "ucs2", "ucs2_persian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
566: { 145, "ucs2", "ucs2_esperanto_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
567: { 146, "ucs2", "ucs2_hungarian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
568: { 147, "ucs2", "ucs2_sinhala_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
1.1.1.3 ! misho 569: { 148, "ucs2", "ucs2_german2_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
! 570: { 149, "ucs2", "ucs2_croatian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
! 571: { 150, "ucs2", "ucs2_unicode_520_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
! 572: { 151, "ucs2", "ucs2_vietnamese_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
! 573:
! 574: /*56*/{160, "utf32", "utf32_unicode_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 575: /*56*/{161, "utf32", "utf32_icelandic_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 576: /*56*/{162, "utf32", "utf32_latvian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 577: /*56*/{163, "utf32", "utf32_romanian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 578: /*56*/{164, "utf32", "utf32_slovenian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 579: /*56*/{165, "utf32", "utf32_polish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 580: /*56*/{166, "utf32", "utf32_estonian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 581: /*56*/{167, "utf32", "utf32_spanish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 582: /*56*/{168, "utf32", "utf32_swedish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 583: /*56*/{169, "utf32", "utf32_turkish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 584: /*56*/{170, "utf32", "utf32_czech_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 585: /*56*/{171, "utf32", "utf32_danish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 586: /*56*/{172, "utf32", "utf32_lithuanian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 587: /*56*/{173, "utf32", "utf32_slovak_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 588: /*56*/{174, "utf32", "utf32_spanish2_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 589: /*56*/{175, "utf32", "utf32_roman_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 590: /*56*/{176, "utf32", "utf32_persian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 591: /*56*/{177, "utf32", "utf32_esperanto_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 592: /*56*/{178, "utf32", "utf32_hungarian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 593: /*56*/{179, "utf32", "utf32_sinhala_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 594: /*56*/{180, "utf32", "utf32_german2_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 595: /*56*/{181, "utf32", "utf32_croatian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 596: /*56*/{182, "utf32", "utf32_unicode_520_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
! 597: /*56*/{183, "utf32", "utf32_vietnamese_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
1.1 misho 598:
599: { 192, UTF8_MB3, UTF8_MB3"_general_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
600: { 193, UTF8_MB3, UTF8_MB3"_icelandic_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
601: { 194, UTF8_MB3, UTF8_MB3"_latvian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
602: { 195, UTF8_MB3, UTF8_MB3"_romanian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
603: { 196, UTF8_MB3, UTF8_MB3"_slovenian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
604: { 197, UTF8_MB3, UTF8_MB3"_polish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
605: { 198, UTF8_MB3, UTF8_MB3"_estonian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
1.1.1.3 ! misho 606: { 199, UTF8_MB3, UTF8_MB3"_spanish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
1.1 misho 607: { 200, UTF8_MB3, UTF8_MB3"_swedish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
608: { 201, UTF8_MB3, UTF8_MB3"_turkish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
609: { 202, UTF8_MB3, UTF8_MB3"_czech_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
610: { 203, UTF8_MB3, UTF8_MB3"_danish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid },
611: { 204, UTF8_MB3, UTF8_MB3"_lithunian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid },
612: { 205, UTF8_MB3, UTF8_MB3"_slovak_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
613: { 206, UTF8_MB3, UTF8_MB3"_spanish2_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
614: { 207, UTF8_MB3, UTF8_MB3"_roman_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
615: { 208, UTF8_MB3, UTF8_MB3"_persian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
616: { 209, UTF8_MB3, UTF8_MB3"_esperanto_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
617: { 210, UTF8_MB3, UTF8_MB3"_hungarian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
618: { 211, UTF8_MB3, UTF8_MB3"_sinhala_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
1.1.1.3 ! misho 619: { 211, UTF8_MB3, UTF8_MB3"_german2_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
! 620: { 213, UTF8_MB3, UTF8_MB3"_croatian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
! 621: { 214, UTF8_MB3, UTF8_MB3"_unicode_520_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
! 622: { 215, UTF8_MB3, UTF8_MB3"_vietnamese_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
1.1 misho 623:
624: { 224, UTF8_MB4, UTF8_MB4"_unicode_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
625: { 225, UTF8_MB4, UTF8_MB4"_icelandic_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
626: { 226, UTF8_MB4, UTF8_MB4"_latvian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
627: { 227, UTF8_MB4, UTF8_MB4"_romanian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
628: { 228, UTF8_MB4, UTF8_MB4"_slovenian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
629: { 229, UTF8_MB4, UTF8_MB4"_polish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
630: { 230, UTF8_MB4, UTF8_MB4"_estonian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
631: { 231, UTF8_MB4, UTF8_MB4"_spanish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
632: { 232, UTF8_MB4, UTF8_MB4"_swedish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
633: { 233, UTF8_MB4, UTF8_MB4"_turkish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
634: { 234, UTF8_MB4, UTF8_MB4"_czech_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
635: { 235, UTF8_MB4, UTF8_MB4"_danish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
636: { 236, UTF8_MB4, UTF8_MB4"_lithuanian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
637: { 237, UTF8_MB4, UTF8_MB4"_slovak_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
638: { 238, UTF8_MB4, UTF8_MB4"_spanish2_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
639: { 239, UTF8_MB4, UTF8_MB4"_roman_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
640: { 240, UTF8_MB4, UTF8_MB4"_persian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
641: { 241, UTF8_MB4, UTF8_MB4"_esperanto_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
642: { 242, UTF8_MB4, UTF8_MB4"_hungarian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
643: { 243, UTF8_MB4, UTF8_MB4"_sinhala_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
1.1.1.3 ! misho 644: { 244, UTF8_MB4, UTF8_MB4"_german2_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
! 645: { 245, UTF8_MB4, UTF8_MB4"_croatian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
! 646: { 246, UTF8_MB4, UTF8_MB4"_unicode_520_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
! 647: { 247, UTF8_MB4, UTF8_MB4"_vietnamese_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
1.1 misho 648:
649: { 254, UTF8_MB3, UTF8_MB3"_general_cs", 1, 3, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
650: { 0, NULL, NULL, 0, 0, NULL, NULL, NULL}
651: };
652: /* }}} */
653:
654:
655: /* {{{ mysqlnd_find_charset_nr */
656: PHPAPI const MYSQLND_CHARSET * mysqlnd_find_charset_nr(unsigned int charsetnr)
657: {
658: const MYSQLND_CHARSET * c = mysqlnd_charsets;
659:
660: do {
661: if (c->nr == charsetnr) {
662: return c;
663: }
664: ++c;
665: } while (c[0].nr != 0);
666: return NULL;
667: }
668: /* }}} */
669:
670:
671: /* {{{ mysqlnd_find_charset_name */
672: PHPAPI const MYSQLND_CHARSET * mysqlnd_find_charset_name(const char * const name)
673: {
1.1.1.3 ! misho 674: if (name) {
! 675: const MYSQLND_CHARSET * c = mysqlnd_charsets;
! 676: do {
! 677: if (!strcasecmp(c->name, name)) {
! 678: return c;
! 679: }
! 680: ++c;
! 681: } while (c[0].nr != 0);
! 682: }
1.1 misho 683: return NULL;
684: }
685: /* }}} */
686:
687:
688: /* {{{ mysqlnd_cset_escape_quotes */
689: PHPAPI ulong mysqlnd_cset_escape_quotes(const MYSQLND_CHARSET * const cset, char *newstr,
690: const char * escapestr, size_t escapestr_len TSRMLS_DC)
691: {
692: const char *newstr_s = newstr;
693: const char *newstr_e = newstr + 2 * escapestr_len;
694: const char *end = escapestr + escapestr_len;
695: zend_bool escape_overflow = FALSE;
696:
697: DBG_ENTER("mysqlnd_cset_escape_quotes");
698:
699: for (;escapestr < end; escapestr++) {
700: unsigned int len = 0;
701: /* check unicode characters */
702:
703: if (cset->char_maxlen > 1 && (len = cset->mb_valid(escapestr, end))) {
704:
705: /* check possible overflow */
706: if ((newstr + len) > newstr_e) {
707: escape_overflow = TRUE;
708: break;
709: }
710: /* copy mb char without escaping it */
711: while (len--) {
712: *newstr++ = *escapestr++;
713: }
714: escapestr--;
715: continue;
716: }
717: if (*escapestr == '\'') {
718: if (newstr + 2 > newstr_e) {
719: escape_overflow = TRUE;
720: break;
721: }
722: *newstr++ = '\'';
723: *newstr++ = '\'';
724: } else {
725: if (newstr + 1 > newstr_e) {
726: escape_overflow = TRUE;
727: break;
728: }
729: *newstr++ = *escapestr;
730: }
731: }
732: *newstr = '\0';
733:
734: if (escape_overflow) {
735: DBG_RETURN((ulong)~0);
736: }
737: DBG_RETURN((ulong)(newstr - newstr_s));
738: }
739: /* }}} */
740:
741:
742: /* {{{ mysqlnd_cset_escape_slashes */
743: PHPAPI ulong mysqlnd_cset_escape_slashes(const MYSQLND_CHARSET * const cset, char *newstr,
744: const char * escapestr, size_t escapestr_len TSRMLS_DC)
745: {
746: const char *newstr_s = newstr;
747: const char *newstr_e = newstr + 2 * escapestr_len;
748: const char *end = escapestr + escapestr_len;
749: zend_bool escape_overflow = FALSE;
750:
751: DBG_ENTER("mysqlnd_cset_escape_slashes");
752: DBG_INF_FMT("charset=%s", cset->name);
753:
754: for (;escapestr < end; escapestr++) {
755: char esc = '\0';
756: unsigned int len = 0;
757:
758: /* check unicode characters */
759: if (cset->char_maxlen > 1 && (len = cset->mb_valid(escapestr, end))) {
760: /* check possible overflow */
761: if ((newstr + len) > newstr_e) {
762: escape_overflow = TRUE;
763: break;
764: }
765: /* copy mb char without escaping it */
766: while (len--) {
767: *newstr++ = *escapestr++;
768: }
769: escapestr--;
770: continue;
771: }
772: if (cset->char_maxlen > 1 && cset->mb_charlen(*escapestr) > 1) {
773: esc = *escapestr;
774: } else {
775: switch (*escapestr) {
776: case 0:
777: esc = '0';
778: break;
779: case '\n':
780: esc = 'n';
781: break;
782: case '\r':
783: esc = 'r';
784: break;
785: case '\\':
786: case '\'':
787: case '"':
788: esc = *escapestr;
789: break;
790: case '\032':
791: esc = 'Z';
792: break;
793: }
794: }
795: if (esc) {
796: if (newstr + 2 > newstr_e) {
797: escape_overflow = TRUE;
798: break;
799: }
800: /* copy escaped character */
801: *newstr++ = '\\';
802: *newstr++ = esc;
803: } else {
804: if (newstr + 1 > newstr_e) {
805: escape_overflow = TRUE;
806: break;
807: }
808: /* copy non escaped character */
809: *newstr++ = *escapestr;
810: }
811: }
812: *newstr = '\0';
813:
814: if (escape_overflow) {
815: DBG_RETURN((ulong)~0);
816: }
817: DBG_RETURN((ulong)(newstr - newstr_s));
818: }
819: /* }}} */
820:
1.1.1.2 misho 821:
822: static struct st_mysqlnd_plugin_charsets mysqlnd_plugin_charsets_plugin =
823: {
824: {
825: MYSQLND_PLUGIN_API_VERSION,
826: "charsets",
827: MYSQLND_VERSION_ID,
828: MYSQLND_VERSION,
829: "PHP License 3.01",
830: "Andrey Hristov <andrey@mysql.com>, Ulf Wendel <uwendel@mysql.com>, Georg Richter <georg@mysql.com>",
831: {
832: NULL, /* no statistics , will be filled later if there are some */
833: NULL, /* no statistics */
834: },
835: {
836: NULL /* plugin shutdown */
837: }
838: },
839: {/* methods */
840: mysqlnd_find_charset_nr,
841: mysqlnd_find_charset_name,
842: mysqlnd_cset_escape_quotes,
843: mysqlnd_cset_escape_slashes
844: }
845: };
846:
847:
848: /* {{{ mysqlnd_charsets_plugin_register */
849: void
850: mysqlnd_charsets_plugin_register(TSRMLS_D)
851: {
852: mysqlnd_plugin_register_ex((struct st_mysqlnd_plugin_header *) &mysqlnd_plugin_charsets_plugin TSRMLS_CC);
853: }
854: /* }}} */
855:
856:
1.1 misho 857: /*
858: * Local variables:
859: * tab-width: 4
860: * c-basic-offset: 4
861: * End:
862: * vim600: noet sw=4 ts=4 fdm=marker
863: * vim<600: noet sw=4 ts=4
864: */
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>