Annotation of embedaddon/php/ext/mbstring/libmbfl/filters/mbfilter_cp1252.c, revision 1.1

1.1     ! misho       1: /*
        !             2:  * "streamable kanji code filter and converter"
        !             3:  * Copyright (c) 1998-2002 HappySize, Inc. All rights reserved.
        !             4:  *
        !             5:  * LICENSE NOTICES
        !             6:  *
        !             7:  * This file is part of "streamable kanji code filter and converter",
        !             8:  * which is distributed under the terms of GNU Lesser General Public 
        !             9:  * License (version 2) as published by the Free Software Foundation.
        !            10:  *
        !            11:  * This software is distributed in the hope that it will be useful,
        !            12:  * but WITHOUT ANY WARRANTY; without even the implied warranty of
        !            13:  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
        !            14:  * GNU Lesser General Public License for more details.
        !            15:  *
        !            16:  * You should have received a copy of the GNU Lesser General Public
        !            17:  * License along with "streamable kanji code filter and converter";
        !            18:  * if not, write to the Free Software Foundation, Inc., 59 Temple Place,
        !            19:  * Suite 330, Boston, MA  02111-1307  USA
        !            20:  *
        !            21:  * The author of this part: Wez Furlong <wez@thebrainroom.com>
        !            22:  *
        !            23:  */
        !            24: /*
        !            25:  * the source code included in this files was separated from mbfilter.c
        !            26:  * by moriyoshi koizumi <moriyoshi@php.net> on 4 dec 2002.
        !            27:  *
        !            28:  */
        !            29: 
        !            30: #ifdef HAVE_CONFIG_H
        !            31: #include "config.h"
        !            32: #endif
        !            33: 
        !            34: #include "mbfilter.h"
        !            35: #include "mbfilter_cp1252.h"
        !            36: #include "unicode_table_cp1252.h"
        !            37: 
        !            38: static int mbfl_filt_ident_cp1252(int c, mbfl_identify_filter *filter);
        !            39: 
        !            40: static const char *mbfl_encoding_cp1252_aliases[] = {"cp1252", NULL};
        !            41: 
        !            42: const mbfl_encoding mbfl_encoding_cp1252 = {
        !            43:        mbfl_no_encoding_cp1252,
        !            44:        "Windows-1252",
        !            45:        "Windows-1252",
        !            46:        (const char *(*)[])&mbfl_encoding_cp1252_aliases,
        !            47:        NULL,
        !            48:        MBFL_ENCTYPE_SBCS
        !            49: };
        !            50: 
        !            51: const struct mbfl_identify_vtbl vtbl_identify_cp1252 = {
        !            52:        mbfl_no_encoding_cp1252,
        !            53:        mbfl_filt_ident_common_ctor,
        !            54:        mbfl_filt_ident_common_dtor,
        !            55:        mbfl_filt_ident_cp1252
        !            56: };
        !            57: 
        !            58: const struct mbfl_convert_vtbl vtbl_cp1252_wchar = {
        !            59:        mbfl_no_encoding_cp1252,
        !            60:        mbfl_no_encoding_wchar,
        !            61:        mbfl_filt_conv_common_ctor,
        !            62:        mbfl_filt_conv_common_dtor,
        !            63:        mbfl_filt_conv_cp1252_wchar,
        !            64:        mbfl_filt_conv_common_flush
        !            65: };
        !            66: 
        !            67: const struct mbfl_convert_vtbl vtbl_wchar_cp1252 = {
        !            68:        mbfl_no_encoding_wchar,
        !            69:        mbfl_no_encoding_cp1252,
        !            70:        mbfl_filt_conv_common_ctor,
        !            71:        mbfl_filt_conv_common_dtor,
        !            72:        mbfl_filt_conv_wchar_cp1252,
        !            73:        mbfl_filt_conv_common_flush
        !            74: };
        !            75: 
        !            76: #define CK(statement)  do { if ((statement) < 0) return (-1); } while (0)
        !            77: 
        !            78: /*
        !            79:  * wchar => cp1252
        !            80:  */
        !            81: int mbfl_filt_conv_wchar_cp1252(int c, mbfl_convert_filter *filter)
        !            82: {
        !            83:        int s=-1, n;
        !            84: 
        !            85:        if (c >= 0x100) {
        !            86:                /* look it up from the cp1252 table */
        !            87:                s = -1;
        !            88:                n = 31;
        !            89:                while (n >= 0) {
        !            90:                        if (c == cp1252_ucs_table[n] && c != 0xfffe) {
        !            91:                                s = 0x80 + n;
        !            92:                                break;
        !            93:                        }
        !            94:                        n--;
        !            95:                }
        !            96:                if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_1)
        !            97:                {
        !            98:                        s = c & MBFL_WCSPLANE_MASK;
        !            99:                }
        !           100:        }
        !           101:        else if (c >= 0 && c < 0x100) {
        !           102:                s = c;
        !           103:        }
        !           104:        if (s >= 0) {
        !           105:                CK((*filter->output_function)(s, filter->data));
        !           106:        } else {
        !           107:                if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
        !           108:                        CK(mbfl_filt_conv_illegal_output(c, filter));
        !           109:                }
        !           110:        }
        !           111:        return c;
        !           112: }
        !           113: 
        !           114: /*
        !           115:  * cp1252 => wchar
        !           116:  */
        !           117: int mbfl_filt_conv_cp1252_wchar(int c, mbfl_convert_filter *filter)
        !           118: {
        !           119:        int s;
        !           120: 
        !           121:        if (c >= 0x80 && c < 0xa0) {
        !           122:                s = cp1252_ucs_table[c - 0x80];
        !           123:        } else {
        !           124:                s = c;
        !           125:        }
        !           126: 
        !           127:        CK((*filter->output_function)(s, filter->data));
        !           128: 
        !           129:        return c;
        !           130: }
        !           131: 
        !           132: /* We only distinguish the MS extensions to ISO-8859-1.
        !           133:  * Actually, this is pretty much a NO-OP, since the identification
        !           134:  * system doesn't allow us to discriminate between a positive match,
        !           135:  * a possible match and a definite non-match.
        !           136:  * The problem here is that cp1252 looks like SJIS for certain chars.
        !           137:  * */
        !           138: static int mbfl_filt_ident_cp1252(int c, mbfl_identify_filter *filter)
        !           139: {
        !           140:        if (c >= 0x80 && c < 0xa0)
        !           141:                filter->flag = 0;
        !           142:        else
        !           143:                filter->flag = 1; /* not it */
        !           144:        return c;       
        !           145: }
        !           146: 
        !           147: 

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>