File:  [ELWIX - Embedded LightWeight unIX -] / embedaddon / libiconv / tools / Makefile
Revision 1.1.1.3 (vendor branch): download - view: text, annotated - select for diffs - revision graph
Wed Mar 17 13:38:46 2021 UTC (3 years, 3 months ago) by misho
Branches: libiconv, MAIN
CVS tags: v1_16p0, HEAD
libiconv 1.16

    1: 
# Directory containing conversion tables.
# You have to unpack the conversion-tables.tar.gz package.
# Every $(TABLESDIR)/... prerequisite in this file is looked up below this
# directory.  The value is a developer-specific absolute path; override it
# on the command line when building elsewhere, e.g.
#   make TABLESDIR=/path/to/conversion-tables
TABLESDIR = /home/bruno/chs/conversion-tables
    5: 
    6: ALL = \
    7:  ascii.h \
    8:  iso8859_1.h \
    9:  iso8859_2.h \
   10:  iso8859_3.h \
   11:  iso8859_4.h \
   12:  iso8859_5.h \
   13:  iso8859_6.h \
   14:  iso8859_7.h \
   15:  iso8859_8.h \
   16:  iso8859_9.h \
   17:  iso8859_10.h \
   18:  iso8859_11.h \
   19:  iso8859_13.h \
   20:  iso8859_14.h \
   21:  iso8859_15.h \
   22:  iso8859_16.h \
   23:  koi8_r.h \
   24:  koi8_u.h \
   25:  koi8_ru.h \
   26:  cp1250.h \
   27:  cp1251.h \
   28:  cp1252.h \
   29:  cp1253.h \
   30:  cp1254.h \
   31:  cp1255.h \
   32:  cp1256.h \
   33:  cp1257.h \
   34:  cp1258.h \
   35:  cp850.h \
   36:  cp862.h \
   37:  cp866.h \
   38:  cp1131.h \
   39:  mac_roman.h \
   40:  mac_centraleurope.h \
   41:  mac_iceland.h \
   42:  mac_croatian.h \
   43:  mac_romania.h \
   44:  mac_cyrillic.h \
   45:  mac_ukraine.h \
   46:  mac_greek.h \
   47:  mac_turkish.h \
   48:  mac_hebrew.h \
   49:  mac_arabic.h \
   50:  mac_thai.h \
   51:  hp_roman8.h \
   52:  nextstep.h \
   53:  armscii_8.h \
   54:  georgian_academy.h \
   55:  georgian_ps.h \
   56:  koi8_t.h \
   57:  pt154.h \
   58:  rk1048.h \
   59:  mulelao.h \
   60:  cp1133.h \
   61:  tis620.h \
   62:  cp874.h \
   63:  viscii.h \
   64:  tcvn.h \
   65:  jisx0201.h \
   66:  jisx0208.h \
   67:  jisx0212.h \
   68:  cp932ext.h \
   69:  cp50221_0208_ext.h \
   70:  cp50221_0212_ext.h \
   71:  gb2312.h \
   72:  isoir165ext.h \
   73:  gb12345ext.h \
   74:  gbkext1.h \
   75:  gbkext2.h \
   76:  gbkext_inv.h \
   77:  cp936ext.h \
   78:  gb18030ext.h \
   79:  gb18030uni.h \
   80:  cns11643_1.h \
   81:  cns11643_2.h \
   82:  cns11643_3.h \
   83:  cns11643_4a.h \
   84:  cns11643_4b.h \
   85:  cns11643_5.h \
   86:  cns11643_6.h \
   87:  cns11643_7.h \
   88:  cns11643_15.h \
   89:  cns11643_inv.h \
   90:  big5.h \
   91:  cp950ext.h \
   92:  hkscs1999.h \
   93:  hkscs2001.h \
   94:  hkscs2004.h \
   95:  hkscs2008.h \
   96:  ksc5601.h \
   97:  uhc_1.h \
   98:  uhc_2.h \
   99:  johab_hangul.h \
  100:  cp856.h \
  101:  cp922.h \
  102:  cp1046.h \
  103:  cp1124.h \
  104:  cp1129.h \
  105:  cp1161.h \
  106:  cp1162.h \
  107:  cp1163.h \
  108:  cp437.h \
  109:  cp737.h \
  110:  cp775.h \
  111:  cp852.h \
  112:  cp853.h \
  113:  cp855.h \
  114:  cp857.h \
  115:  cp858.h \
  116:  cp860.h \
  117:  cp861.h \
  118:  cp863.h \
  119:  cp864.h \
  120:  cp865.h \
  121:  cp869.h \
  122:  cp1125.h \
  123:  jisx0213.h \
  124:  tds565.h \
  125:  atarist.h \
  126:  riscos1.h \
  127:  cjk_variants.h
  128: 
  129: all : $(ALL)
  130: 
  131: ascii.h : $(TABLESDIR)/glibc-2.1-iconv/ASCII.TXT 8bit_tab_to_h
  132: 	./8bit_tab_to_h ASCII ascii < $<
  133: 
  134: iso8859_1.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-1.TXT 8bit_tab_to_h
  135: 	./8bit_tab_to_h ISO-8859-1 iso8859_1 < $<
  136: 
  137: iso8859_2.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-2.TXT 8bit_tab_to_h
  138: 	./8bit_tab_to_h ISO-8859-2 iso8859_2 < $<
  139: 
  140: iso8859_3.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-3.TXT 8bit_tab_to_h
  141: 	./8bit_tab_to_h ISO-8859-3 iso8859_3 < $<
  142: 
  143: iso8859_4.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-4.TXT 8bit_tab_to_h
  144: 	./8bit_tab_to_h ISO-8859-4 iso8859_4 < $<
  145: 
  146: iso8859_5.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-5.TXT 8bit_tab_to_h
  147: 	./8bit_tab_to_h ISO-8859-5 iso8859_5 < $<
  148: 
  149: iso8859_6.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-6.TXT 8bit_tab_to_h
  150: 	./8bit_tab_to_h ISO-8859-6 iso8859_6 < $<
  151: 
  152: iso8859_7.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-7-2003.TXT 8bit_tab_to_h
  153: 	./8bit_tab_to_h ISO-8859-7 iso8859_7 < $<
  154: 
  155: iso8859_8.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-8.TXT 8bit_tab_to_h
  156: 	./8bit_tab_to_h ISO-8859-8 iso8859_8 < $<
  157: 
  158: iso8859_9.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-9.TXT 8bit_tab_to_h
  159: 	./8bit_tab_to_h ISO-8859-9 iso8859_9 < $<
  160: 
  161: iso8859_10.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-10.TXT 8bit_tab_to_h
  162: 	./8bit_tab_to_h ISO-8859-10 iso8859_10 < $<
  163: 
  164: iso8859_11.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-11.TXT 8bit_tab_to_h
  165: 	./8bit_tab_to_h ISO-8859-11 iso8859_11 < $<
  166: 
  167: iso8859_13.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-13.TXT 8bit_tab_to_h
  168: 	./8bit_tab_to_h ISO-8859-13 iso8859_13 < $<
  169: 
  170: iso8859_14.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-14.TXT 8bit_tab_to_h
  171: 	./8bit_tab_to_h ISO-8859-14 iso8859_14 < $<
  172: 
  173: iso8859_15.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-15.TXT 8bit_tab_to_h
  174: 	./8bit_tab_to_h ISO-8859-15 iso8859_15 < $<
  175: 
  176: iso8859_16.h : $(TABLESDIR)/unicode.org-mappings/ISO8859/8859-16.TXT 8bit_tab_to_h
  177: 	./8bit_tab_to_h ISO-8859-16 iso8859_16 < $<
  178: 
  179: koi8_r.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MISC/KOI8-R.TXT 8bit_tab_to_h
  180: 	./8bit_tab_to_h KOI8-R koi8_r < $<
  181: 
  182: koi8_u.h : $(TABLESDIR)/csets-new/KOI8-U.TXT 8bit_tab_to_h
  183: 	./8bit_tab_to_h KOI8-U koi8_u < $<
  184: 
  185: koi8_ru.h : $(TABLESDIR)/freebsd-iconv-0.4/KOI8-RU.TXT 8bit_tab_to_h
  186: 	./8bit_tab_to_h KOI8-RU koi8_ru < $<
  187: 
  188: cp1250.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1250.TXT 8bit_tab_to_h
  189: 	./8bit_tab_to_h CP1250 cp1250 < $<
  190: 
  191: cp1251.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1251.TXT 8bit_tab_to_h
  192: 	./8bit_tab_to_h CP1251 cp1251 < $<
  193: 
  194: cp1252.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1252.TXT 8bit_tab_to_h
  195: 	./8bit_tab_to_h CP1252 cp1252 < $<
  196: 
  197: cp1253.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1253.TXT 8bit_tab_to_h
  198: 	./8bit_tab_to_h CP1253 cp1253 < $<
  199: 
  200: cp1254.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1254.TXT 8bit_tab_to_h
  201: 	./8bit_tab_to_h CP1254 cp1254 < $<
  202: 
  203: cp1255.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1255.TXT 8bit_tab_to_h
  204: 	./8bit_tab_to_h CP1255 cp1255 < $<
  205: 
  206: cp1256.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1256.TXT 8bit_tab_to_h
  207: 	./8bit_tab_to_h CP1256 cp1256 < $<
  208: 
  209: cp1257.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1257.TXT 8bit_tab_to_h
  210: 	./8bit_tab_to_h CP1257 cp1257 < $<
  211: 
  212: cp1258.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP1258.TXT 8bit_tab_to_h
  213: 	./8bit_tab_to_h CP1258 cp1258 < $<
  214: 
  215: cp850.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP850.TXT 8bit_tab_to_h
  216: 	./8bit_tab_to_h CP850 cp850 < $<
  217: 
  218: cp862.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP862.TXT 8bit_tab_to_h
  219: 	./8bit_tab_to_h CP862 cp862 < $<
  220: 
  221: cp866.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP866.TXT 8bit_tab_to_h
  222: 	./8bit_tab_to_h CP866 cp866 < $<
  223: 
  224: cp1131.h : $(TABLESDIR)/other/CP1131.TXT 8bit_tab_to_h
  225: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1131 cp1131
  226: 
  227: mac_roman.h : $(TABLESDIR)/jdk-1.1.7b/MAC-ROMAN.TXT 8bit_tab_to_h
  228: 	./8bit_tab_to_h MacRoman mac_roman < $<
  229: 
  230: mac_centraleurope.h : $(TABLESDIR)/jdk-1.1.7b/MAC-CENTRAL-EUROPE.TXT 8bit_tab_to_h
  231: 	./8bit_tab_to_h MacCentralEurope mac_centraleurope < $<
  232: 
  233: mac_iceland.h : $(TABLESDIR)/jdk-1.1.7b/MAC-ICELAND.TXT 8bit_tab_to_h
  234: 	./8bit_tab_to_h MacIceland mac_iceland < $<
  235: 
  236: mac_croatian.h : $(TABLESDIR)/jdk-1.1.7b/MAC-CROATIAN.TXT 8bit_tab_to_h
  237: 	./8bit_tab_to_h MacCroatian mac_croatian < $<
  238: 
  239: mac_romania.h : $(TABLESDIR)/jdk-1.1.7b/MAC-ROMANIA.TXT 8bit_tab_to_h
  240: 	./8bit_tab_to_h MacRomania mac_romania < $<
  241: 
  242: mac_cyrillic.h : $(TABLESDIR)/jdk-1.1.7b/MAC-CYRILLIC.TXT 8bit_tab_to_h
  243: 	./8bit_tab_to_h MacCyrillic mac_cyrillic < $<
  244: 
  245: mac_ukraine.h : $(TABLESDIR)/jdk-1.1.7b/MAC-UKRAINE.TXT 8bit_tab_to_h
  246: 	./8bit_tab_to_h MacUkraine mac_ukraine < $<
  247: 
  248: mac_greek.h : $(TABLESDIR)/jdk-1.1.7b/MAC-GREEK.TXT 8bit_tab_to_h
  249: 	./8bit_tab_to_h MacGreek mac_greek < $<
  250: 
  251: mac_turkish.h : $(TABLESDIR)/jdk-1.1.7b/MAC-TURKISH.TXT 8bit_tab_to_h
  252: 	./8bit_tab_to_h MacTurkish mac_turkish < $<
  253: 
  254: mac_hebrew.h : $(TABLESDIR)/jdk-1.1.7b/MAC-HEBREW.TXT 8bit_tab_to_h
  255: 	./8bit_tab_to_h MacHebrew mac_hebrew < $<
  256: 
  257: mac_arabic.h : $(TABLESDIR)/jdk-1.1.7b/MAC-ARABIC.TXT 8bit_tab_to_h
  258: 	./8bit_tab_to_h MacArabic mac_arabic < $<
  259: 
  260: mac_thai.h : $(TABLESDIR)/jdk-1.1.7b/MAC-THAI.TXT 8bit_tab_to_h
  261: 	./8bit_tab_to_h MacThai mac_thai < $<
  262: 
  263: hp_roman8.h : $(TABLESDIR)/glibc-2.1-iconv/HP-ROMAN8.TXT 8bit_tab_to_h
  264: 	./8bit_tab_to_h HP-ROMAN8 hp_roman8 < $<
  265: 
  266: nextstep.h : $(TABLESDIR)/clisp/NEXTSTEP.TXT 8bit_tab_to_h
  267: 	./8bit_tab_to_h NEXTSTEP nextstep < $<
  268: 
  269: armscii_8.h : $(TABLESDIR)/glibc-2.2.90-iconv/ARMSCII-8.TXT 8bit_tab_to_h
  270: 	(echo '#' ; cat $<) | ./8bit_tab_to_h ARMSCII-8 armscii_8
  271: 
  272: georgian_academy.h : $(TABLESDIR)/csets-1.6/GEO-ITA.TXT 8bit_tab_to_h
  273: 	./8bit_tab_to_h GEORGIAN-ACADEMY georgian_academy < $<
  274: 
  275: georgian_ps.h : $(TABLESDIR)/csets-1.6/GEO-PS.TXT 8bit_tab_to_h
  276: 	./8bit_tab_to_h GEORGIAN-PS georgian_ps < $<
  277: 
  278: koi8_t.h : $(TABLESDIR)/glibc-2.2.90-iconv/KOI8-T.TXT
  279: 	(echo '#' ; cat $<) | ./8bit_tab_to_h KOI8-T koi8_t
  280: 
  281: pt154.h : $(TABLESDIR)/IANA/PTCP154.TXT
  282: 	./8bit_tab_to_h PT154 pt154 < $<
  283: 
  284: rk1048.h : $(TABLESDIR)/IANA/KZ-1048.TXT
  285: 	(echo '#' ; cat $<) | ./8bit_tab_to_h RK1048 rk1048
  286: 
  287: mulelao.h : $(TABLESDIR)/csets-new/MULELAO1.TXT 8bit_tab_to_h
  288: 	./8bit_tab_to_h MULELAO-1 mulelao < $<
  289: 
  290: cp1133.h : $(TABLESDIR)/csets-new/CP1133.TXT 8bit_tab_to_h
  291: 	./8bit_tab_to_h IBM-CP1133 cp1133 < $<
  292: 
  293: tis620.h : $(TABLESDIR)/glibc-2.1-iconv/TIS-620.TXT 8bit_tab_to_h
  294: 	./8bit_tab_to_h TIS620.2533-1 tis620 < $<
  295: 
  296: cp874.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP874.TXT 8bit_tab_to_h
  297: 	./8bit_tab_to_h CP874 cp874 < $<
  298: 
  299: viscii.h : $(TABLESDIR)/csets-1.6/VISCII.TXT 8bit_tab_to_h
  300: 	./8bit_tab_to_h VISCII1.1-1 viscii < $<
  301: 
  302: tcvn.h : $(TABLESDIR)/csets-1.6/VN5712-1.TXT 8bit_tab_to_h
  303: 	./8bit_tab_to_h TCVN-5712 tcvn < $<
  304: 
  305: jisx0201.h : $(TABLESDIR)/clisp/JIS_X0201.TXT 8bit_tab_to_h
  306: 	./8bit_tab_to_h JISX0201.1976-0 jisx0201 < $<
  307: 
  308: # We use modified JISX0208 and JISX0212 tables. Why?
  309: # Hironori Sakamoto and Tomohiro Kubota explain that
  310: # - EUC-JP and SHIFT_JIS contain JISX0208 exactly,
  311: # - Their round-trip conversion to Unicode and back must be the identity,
  312: # - Conversions between EUC-JP, SHIFT_JIS, CP932, ISO-2022-JP must behave
  313: #   as if no Unicode conversion was involved,
  314: # - When JISX0208 is used as a CES (i.e. combined with ASCII) its mapping of
  315: #   REVERSE SOLIDUS becomes a FULLWIDTH REVERSE SOLIDUS, apparently because
  316: #   round-trip conversion stability is more important than a particular glyph.
  317: #   Only with CCS the character is a REVERSE SOLIDUS.
  318: # As a consequence, we use FULLWIDTH REVERSE SOLIDUS in EUC-JP's JISX0208 part,
  319: # and for consistency also in SHIFT_JIS and ISO-2022-JP, i.e. everywhere.
  320: # JISX0208 never occurs as a CCS in practice. Similarly with JISX0212.
  321: 
  322: # Unicode.org maps 0x2140 to U+005C. We map it to U+FF3C.
  323: jisx0208.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/JIS/JIS0208.TXT cjk_tab_to_h
  324: 	sed -e 's,^0x....[ 	]*\(0x....[ 	]*0x.....*\)$$,\1,' < $< | sed -e 's,\([ 	]\)0x005C,\10xFF3C,' | ./cjk_tab_to_h JISX0208.1990-0 jisx0208 > $@
  325: 
  326: # Unicode.org maps 0x2237 to U+007E. We map it to U+FF5E.
  327: jisx0212.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/JIS/JIS0212.TXT cjk_tab_to_h
  328: 	sed -e 's,\([ 	]\)0x007E,\10xFF5E,' < $< | ./cjk_tab_to_h JISX0212.1990-0 jisx0212 > $@
  329: 
  330: cp932ext.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP932.TXT cjk_tab_to_h
  331: 	(echo '#' ; grep '^0x\(87\|E[D-F]\|F[0-9A-F]\)[0-9A-F][0-9A-F]' < $< ) | ./cjk_tab_to_h 'CP932 extensions' cp932ext > $@
  332: 
  333: cp50221_0208_ext.h : CP50221-0208-EXT.TXT 8bit_tab_to_h
  334: 	./8bit_tab_to_h 'CP50221 JISX0208 extensions' cp50221_0208_ext < $<
  335: 
  336: cp50221_0212_ext.h : CP50221-0212-EXT.TXT 8bit_tab_to_h
  337: 	./8bit_tab_to_h 'CP50221 JISX0212 extensions' cp50221_0212_ext < $<
  338: 
  339: gb2312.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT cjk_tab_to_h
  340: 	./cjk_tab_to_h GB2312.1980-0 gb2312 < $< > $@
  341: 
  342: isoir165ext.h : $(TABLESDIR)/csets-new/ISO-IR-165-additions.TXT cjk_tab_to_h
  343: 	(echo '#' ; grep -v '^0x2[8A]' < $<) | ./cjk_tab_to_h 'ISO-IR-165 extensions' isoir165ext > $@
  344: 
  345: gb12345ext.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB12345-FIXED.TXT $(TABLESDIR)/csets-new/GB12345-more.TXT cjk_tab_to_h
  346: 	(echo '#' ; sed -e '/^0x..[ 	]*#UNDEFINED/d' -e 's/#.*$$//' -e '/^[ 	]*$$/d' $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT > tmp1.TXT ; sed -e '/^0x..[ 	]*#UNDEFINED/d' -e 's/#.*$$//' -e '/^[ 	]*$$/d' $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB12345-FIXED.TXT > tmp2.TXT ; diff tmp1.TXT tmp2.TXT | grep '^> ' | sed -e 's,^> ,,' ; cat $(TABLESDIR)/csets-new/GB12345-more.TXT ) | ./cjk_tab_to_h 'GB/T 12345.1990-0 extensions' gb12345ext > $@ && rm -f tmp1.TXT tmp2.TXT
  347: 
  348: gbkext1.h : GBKext.TXT cjk_tab_to_h
  349: 	(echo '#' ; grep '^0x\([89].\|A0\)' < GBKext.TXT) | ./cjk_tab_to_h 'GBK/3 extensions' gbkext1 > $@
  350: 
  351: gbkext2.h : GBKext.TXT cjk_tab_to_h
  352: 	(echo '#' ; grep '^0x\(A[1-9A-F]\|[B-F][0-9A-F]\)\([4-9].\|A0\)' < GBKext.TXT) | ./cjk_tab_to_h 'GBK/4 and GBK/5 extensions' gbkext2 > $@
  353: 
  354: gbkext_inv.h : GBKext.TXT cjk_tab_to_h
  355: 	(echo '#' ; grep '^0x\([89].\|A0\)' < GBKext.TXT ; grep '^0x\(A[1-9A-F]\|[B-F][0-9A-F]\)\([4-9].\|A0\)' < GBKext.TXT) | ./cjk_tab_to_h 'GBK extensions' gbkext_inv > $@
  356: 
  357: cp936ext.h : GBKext.TXT cjk_tab_to_h
  358: 	(echo '#' ; grep '^0xA[1-9][B-F].' < GBKext.TXT) | ./cjk_tab_to_h 'CP936 extensions' cp936ext > $@
  359: 
  360: GBKext.TXT : $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP936.TXT
  361: 	sed -e 's,^0x2,0xA,' -e 's,^0x3,0xB,' -e 's,^0x4,0xC,' -e 's,^0x5,0xD,' -e 's,^0x6,0xE,' -e 's,^0x7,0xF,' -e 's,^0x\(..\)2,0x\1A,' -e 's,^0x\(..\)3,0x\1B,' -e 's,^0x\(..\)4,0x\1C,' -e 's,^0x\(..\)5,0x\1D,' -e 's,^0x\(..\)6,0x\1E,' -e 's,^0x\(..\)7,0x\1F,' $(TABLESDIR)/unicode.org-mappings/EASTASIA/GB/GB2312.TXT > tmpEUCCN.TXT ; sed -e '/^0x..[ 	]*#UNDEFINED/d' -e 's/#.*$$//' -e '/^[ 	]*$$/d' tmpEUCCN.TXT > tmp1.TXT ; sed -e '/^0x..[ 	]/d' -e 's/#.*$$//' -e '/^[ 	]*$$/d' $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP936.TXT > tmp2.TXT ; diff -c1 tmp1.TXT tmp2.TXT | grep '^+ ' | sed -e 's,^+ ,,' > $@ && rm -f tmpEUCCN.TXT tmp1.TXT tmp2.TXT
  362: 
  363: gb18030ext.h : GB18030ext.TXT cjk_tab_to_h
  364: 	(echo '#' ; cat GB18030ext.TXT) | ./cjk_tab_to_h 'GB18030 two-byte extension' gb18030ext > $@
  365: 
  366: GB18030ext.TXT : $(TABLESDIR)/glibc-2.2.2-iconv/GB18030.TXT $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP936.TXT
  367: 	cat $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP936.TXT | sed -e 's/[ 	]*#.*$$//' | grep '^0x[0-9A-F]*	0x....$$' > tmpGBK.TXT ; diff tmpGBK.TXT $(TABLESDIR)/glibc-2.2.2-iconv/GB18030.TXT | grep '^> 0x....	0x....$$' | sed -e 's/^> //' > $@ && rm -f tmpGBK.TXT
  368: 
  369: gb18030uni.h : GB18030uni.TXT cjk_tab_to_h
  370: 	./cjk_tab_to_h 'GB18030 four-byte extension' gb18030uni < GB18030uni.TXT > $@
  371: 
  372: GB18030uni.TXT : $(TABLESDIR)/gb18030/filled-GB18030.TXT
  373: 	grep '^0x........	0x....$$' < $(TABLESDIR)/gb18030/filled-GB18030.TXT > $@
  374: 
  375: cns11643_1.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  376: 	grep '^\(#\|0x1\)' < $< | sed -e 's,^0x1,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 1' cns11643_1 > $@
  377: 
  378: cns11643_2.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  379: 	grep '^\(#\|0x2\)' < $< | sed -e 's,^0x2,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 2' cns11643_2 > $@
  380: 
  381: cns11643_3.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  382: 	grep '^\(#\|0x3\)' < $< | sed -e 's,^0x3,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 3' cns11643_3 > $@
  383: 
  384: cns11643_4a.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  385: 	grep '^\(#\|0x4[0-3]\)' < $< | sed -e 's,^0x4,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 4 part a' cns11643_4a > $@
  386: 
  387: cns11643_4b.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  388: 	grep '^\(#\|0x4[4-7]\)' < $< | sed -e 's,^0x4,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 4 part b' cns11643_4b > $@
  389: 
  390: cns11643_5.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  391: 	grep '^\(#\|0x5\)' < $< | sed -e 's,^0x5,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 5' cns11643_5 > $@
  392: 
  393: cns11643_6.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  394: 	grep '^\(#\|0x6\)' < $< | sed -e 's,^0x6,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 6' cns11643_6 > $@
  395: 
  396: cns11643_7.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  397: 	grep '^\(#\|0x7\)' < $< | sed -e 's,^0x7,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 7' cns11643_7 > $@
  398: 
  399: cns11643_15.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  400: 	grep '^\(#\|0xF\)' < $< | sed -e 's,^0xF,0x,' | ./cjk_tab_to_h 'CNS 11643-1992 plane 15' cns11643_15 > $@
  401: 
  402: cns11643_inv.h : $(TABLESDIR)/csets-new/CNS11643-Unicode32.TXT cjk_tab_to_h
  403: 	./cjk_tab_to_h 'CNS 11643-1992 planes 1-7, CNS 11643-1986 plane 15' cns11643_inv < $< > $@
  404: 
  405: big5.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/OTHER/BIG5.TXT cjk_tab_to_h
  406: 	./cjk_tab_to_h BIG5 big5 < $< > $@
  407: 
  408: cp950ext.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/WINDOWS/CP950.TXT cjk_tab_to_h
  409: 	(echo '#' ; grep '^0xF9\(D[6-9A-F]\|[EF][0-9A-F]\)' < $< ) | ./cjk_tab_to_h 'CP950 extensions' cp950ext > $@
  410: 
  411: hkscs1999.h : $(TABLESDIR)/big5hkscs/HKSCS-1999_2006.TXT cjk_tab_to_h
  412: 	(echo '#' ; grep -v , $<) | ./cjk_tab_to_h HKSCS:1999 hkscs1999 > $@
  413: 
  414: hkscs2001.h : $(TABLESDIR)/big5hkscs/HKSCS-2001_2006-DELTA.TXT cjk_tab_to_h
  415: 	(echo '#' ; grep -v , $<) | ./cjk_tab_to_h HKSCS:2001 hkscs2001 > $@
  416: 
  417: hkscs2004.h : $(TABLESDIR)/big5hkscs/HKSCS-2004_2006-DELTA.TXT cjk_tab_to_h
  418: 	(echo '#' ; grep -v , $<) | ./cjk_tab_to_h HKSCS:2004 hkscs2004 > $@
  419: 
  420: hkscs2008.h : $(TABLESDIR)/big5hkscs/HKSCS-2008_2010-DELTA.TXT cjk_tab_to_h
  421: 	(echo '#' ; grep -v , $<) | ./cjk_tab_to_h HKSCS:2008 hkscs2008 > $@
  422: 
  423: # We use a modified KSC 5601 = KSX 1001 table. Jungshik Shin <jshin@mailaps.org>
  424: # reports that Prof. GIM Geongseog (KIM Keyongseok) <gimgs@asadal.cs.pusan.ac.kr>
  425: # (who represents South Korea in ISO/IEC JTC1 SC2/WG2 and SC22/WG20) says that
  426: # these two characters were added to KSX 1001 in December 1998. According to
  427: # http://std.dkuug.dk/jtc1/sc2/wg2/docs/N2815.doc, one more character
  428: # (Korean postal code sign) was added in 2002.
  429: ksc5601.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/KSC5601.TXT cjk_tab_to_h
  430: 	(cat $< ; echo '0xA2E6	0x20AC'; echo '0xA2E7	0x00AE'; echo '0xA2E8	0x327E') | ./cjk_tab_to_h 'KSC5601.1987-0, now KS X 1001:2002' ksc5601 > $@
  431: 
  432: uhc_1.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/KSC5601.TXT cjk_tab_to_h
  433: 	(echo '#' ; grep '^0x\([8-9]\|A0\)' < $< ) | ./cjk_tab_to_h 'Unified Hangul Code part 1' uhc_1 > $@
  434: 
  435: uhc_2.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/KSC5601.TXT cjk_tab_to_h
  436: 	(echo '#' ; grep '^0x\(A[1-9A-F]\|[B-F][0-9A-F]\)\([0-9]\|A0\)' < $< ) | ./cjk_tab_to_h 'Unified Hangul Code part 2' uhc_2 > $@
  437: 
  438: johab_hangul.h : $(TABLESDIR)/unicode.org-mappings/EASTASIA/KSC/JOHAB.TXT cjk_tab_to_h
  439: 	(echo '#' ; grep '^0x\([8-C]...\|D[0-7]..\)' < $< ) | ./cjk_tab_to_h 'JOHAB Hangul' johab_hangul > $@
  440: 
  441: 
  442: cp856.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MISC/CP856.TXT 8bit_tab_to_h
  443: 	./8bit_tab_to_h CP856 cp856 < $<
  444: 
  445: cp922.h : $(TABLESDIR)/aix-4.3.2/IBM-922.TXT 8bit_tab_to_h
  446: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP922 cp922
  447: 
  448: cp1046.h : $(TABLESDIR)/aix-4.3.2/IBM-1046.TXT 8bit_tab_to_h
  449: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1046 cp1046
  450: 
  451: cp1124.h : $(TABLESDIR)/aix-4.3.2/IBM-1124.TXT 8bit_tab_to_h
  452: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1124 cp1124
  453: 
  454: cp1129.h : $(TABLESDIR)/aix-4.3.2/IBM-1129.TXT 8bit_tab_to_h
  455: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1129 cp1129
  456: 
  457: cp1161.h : $(TABLESDIR)/glibc-2.2.90-iconv/IBM1161.TXT
  458: 	(echo '#' ; cat $(TABLESDIR)/glibc-2.2-iconv/ASCII.TXT ; grep -v '^0x[0-7]' $<) | ./8bit_tab_to_h CP1161 cp1161
  459: 
  460: cp1162.h : $(TABLESDIR)/glibc-2.2.90-iconv/IBM1162.TXT
  461: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1162 cp1162
  462: 
  463: cp1163.h : $(TABLESDIR)/glibc-2.2.90-iconv/IBM1163.TXT
  464: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP1163 cp1163
  465: 
  466: 
  467: cp437.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP437.TXT 8bit_tab_to_h
  468: 	./8bit_tab_to_h CP437 cp437 < $<
  469: 
  470: cp737.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP737.TXT 8bit_tab_to_h
  471: 	./8bit_tab_to_h CP737 cp737 < $<
  472: 
  473: cp775.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP775.TXT 8bit_tab_to_h
  474: 	./8bit_tab_to_h CP775 cp775 < $<
  475: 
  476: cp852.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP852.TXT 8bit_tab_to_h
  477: 	./8bit_tab_to_h CP852 cp852 < $<
  478: 
  479: cp853.h : $(TABLESDIR)/other/CP853.TXT 8bit_tab_to_h
  480: 	(echo '#'; cat $<) | ./8bit_tab_to_h CP853 cp853
  481: 
  482: cp855.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP855.TXT 8bit_tab_to_h
  483: 	./8bit_tab_to_h CP855 cp855 < $<
  484: 
  485: cp857.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP857.TXT 8bit_tab_to_h
  486: 	./8bit_tab_to_h CP857 cp857 < $<
  487: 
  488: cp858.h : $(TABLESDIR)/windows-2000/CP858.TXT 8bit_tab_to_h
  489: 	(echo '#' ; cat $<) | ./8bit_tab_to_h CP858 cp858
  490: 
  491: cp860.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP860.TXT 8bit_tab_to_h
  492: 	./8bit_tab_to_h CP860 cp860 < $<
  493: 
  494: cp861.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP861.TXT 8bit_tab_to_h
  495: 	./8bit_tab_to_h CP861 cp861 < $<
  496: 
  497: cp863.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP863.TXT 8bit_tab_to_h
  498: 	./8bit_tab_to_h CP863 cp863 < $<
  499: 
  500: cp864.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP864.TXT 8bit_tab_to_h
  501: 	./8bit_tab_to_h CP864 cp864 < $<
  502: 
  503: cp865.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP865.TXT 8bit_tab_to_h
  504: 	./8bit_tab_to_h CP865 cp865 < $<
  505: 
  506: cp869.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MICSFT/PC/CP869.TXT 8bit_tab_to_h
  507: 	./8bit_tab_to_h CP869 cp869 < $<
  508: 
  509: cp1125.h : $(TABLESDIR)/csets-new/CP1125.TXT 8bit_tab_to_h
  510: 	./8bit_tab_to_h CP1125 cp1125 < $<
  511: 
  512: 
  513: jisx0213.h : JISX0213.TXT cjk_tab_to_h
  514: 	./cjk_tab_to_h JISX0213:2004 jisx0213 < $< > $@
  515: 
  516: tds565.h : $(TABLESDIR)/recode-cvs/TDS565.TXT 8bit_tab_to_h
  517: 	(echo '#'; cat $<) | ./8bit_tab_to_h TDS565 tds565 > $@
  518: 
  519: atarist.h : $(TABLESDIR)/unicode.org-mappings/VENDORS/MISC/ATARIST.TXT
  520: 	./8bit_tab_to_h 'Atari ST' atarist < $< > $@
  521: 
  522: riscos1.h : $(TABLESDIR)/recode-cvs/RISCOS-LATIN1.TXT 8bit_tab_to_h
  523: 	(echo '#'; cat $<) | ./8bit_tab_to_h RISCOS-LATIN1 riscos1 > $@
  524: 
  525: 
  526: cjk_variants.h : $(TABLESDIR)/yasuoka/UniVariants cjk_variants
  527: 	./cjk_variants < $< > $@
  528: 
  529: 
  530: 8bit_tab_to_h : 8bit_tab_to_h.c
  531: 	gcc -O -Wall -g $< -o $@
  532: 
  533: cjk_tab_to_h : cjk_tab_to_h.c
  534: 	gcc -O -Wall -g $< -o $@
  535: 
  536: cjk_variants : cjk_variants.c
  537: 	gcc -O -Wall -g $< -o $@
  538: 
  539: 
  540: clean : force
  541: 	rm -f 8bit_tab_to_h cjk_tab_to_h cjk_variants $(ALL) GBKext.TXT
  542: 
  543: force :
  544: 

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>