OLD | NEW |
1 # Note: A number of encodings are handled with purely algorithmic converters, | 1 # Note: A number of encodings are handled with purely algorithmic converters, |
2 # without any mapping tables: | 2 # without any mapping tables: |
3 # US-ASCII, ISO 8859-1, UTF-7/8/16/32, SCSU | 3 # US-ASCII, ISO 8859-1, UTF-7/8/16/32, SCSU |
4 | 4 |
5 # Listed here: | 5 # Listed here: |
6 | 6 |
7 # * ISO 8859-2..8,10,13,14,15,16 | 7 # * ISO 8859-2..8,10,13,14,15,16 |
8 # - 8859-11 table is not included. It's rather treated as a synonym of | 8 # - 8859-11 table is not included. It's rather treated as a synonym of |
9 # Windows-874 | 9 # Windows-874 |
10 # * Windows-125[0-8] | 10 # * Windows-125[0-8] |
11 # * Simplified Chinese : GBK(Windows cp936), GB 18030 | 11 # * Simplified Chinese : GBK(Windows cp936), GB 18030 |
12 # - GB2312 table was removed and 4 aliases for GB2312 were added | 12 # - GB2312 table was removed and 4 aliases for GB2312 were added |
13 # to GBK in convrtrs.txt to treat GB2312 as a synonym of GBK. | 13 # to GBK in convrtrs.txt to treat GB2312 as a synonym of GBK. |
14 # - GB-HZ is supported now that it uses the GBK table. | 14 # - GB-HZ is supported now that it uses the GBK table. |
15 # * Traditional Chinese : Big5 (Windows cp950), Big5HKSCS (no PUA) | 15 # * Traditional Chinese : Big5 (Windows cp950), Big5HKSCS (no PUA) |
16 # * Japanese : SJIS (shift_jis-html5), EUC-JP (euc-jp_html5) | 16 # * Japanese : SJIS (shift_jis-html), EUC-JP (euc-jp-html) |
17 # * Korean : Windows-949 | 17 # * Korean : Windows-949 |
18 # - EUC-KR table was removed. It's different from Windows-949, but | 18 # - EUC-KR table was removed. It's different from Windows-949, but |
19 # in practice EUC-KR and Windows-949 are treated synonymously. | 19 # in practice EUC-KR and Windows-949 are treated synonymously. |
20 # - ISO-2022-KR is now supported with a one-line change | 20 # - ISO-2022-KR is now supported with a one-line change |
21 # in common/ucnv2022.c and other changes in convrtrs.txt to make it | 21 # in common/ucnv2022.c and other changes in convrtrs.txt to make it |
22 # use the windows-949 table. | 22 # use the windows-949 table. |
23 # * Thai : Windows-874 | 23 # * Thai : Windows-874 |
24 # - TIS-620 and ISO-8859-11 are treated as synonyms of Windows-874 | 24 # - TIS-620 and ISO-8859-11 are treated as synonyms of Windows-874 |
25 # although they're not the same. | 25 # although they're not the same. |
26 # * Mac encodings : MacRoman, MacCyrillic | 26 # * Mac encodings : MacRoman, MacCyrillic |
27 # * Cyrillic : KOI8-R, KOI8-U, IBM-866 | 27 # * Cyrillic : KOI8-R, KOI8-U, IBM-866 |
28 # | 28 # |
29 # * Missing | 29 # * Missing |
30 # - Armenian, Georgian : extremely rare | 30 # - Armenian, Georgian : extremely rare |
31 # - Mac encodings (other than Roman and Cyrillic) : extremely rare | 31 # - Mac encodings (other than Roman and Cyrillic) : extremely rare |
32 | 32 |
33 UCM_SOURCE_FILES= | 33 UCM_SOURCE_FILES= |
34 | 34 |
35 UCM_SOURCE_CORE=ibm-912_P100-1995.ucm ibm-913_P100-2000.ucm\ | 35 |
36 ibm-914_P100-1995.ucm ibm-915_P100-1995.ucm\ | 36 UCM_SOURCE_CORE=iso-8859-2-html.ucm iso-8859-3-html.ucm iso-8859-4-html.ucm\ |
37 ibm-1089_P100-1995.ucm ibm-9005_X110-2007.ucm\ | 37 iso-8859-5-html.ucm iso-8859-6-html.ucm iso-8859-7-html.ucm \ |
38 ibm-5012_P100-1999.ucm\ | 38 iso-8859-8-html.ucm iso-8859-10-html.ucm iso-8859-13-html.ucm \ |
39 iso-8859_10-1998.ucm\ | 39 iso-8859-14-html.ucm iso-8859-15-html.ucm iso-8859-16-html.ucm \ |
40 ibm-921_P100-1995.ucm iso-8859_14-1998.ucm ibm-923_P100-1998.ucm\ | 40 windows-1250-html.ucm windows-1251-html.ucm windows-1252-html.ucm\ |
41 iso-8859_16-2001.ucm\ | 41 windows-1253-html.ucm windows-1254-html.ucm windows-1255-html.ucm\ |
42 ibm-5346_P100-1998.ucm ibm-5347_P100-1998.ucm ibm-5348_P100-1997.ucm\ | 42 windows-1256-html.ucm windows-1257-html.ucm windows-1258-html.ucm\ |
43 ibm-5349_P100-1998.ucm ibm-5350_P100-1998.ucm ibm-9447_P100-2002.ucm\ | |
44 ibm-9448_X100-2005.ucm ibm-9449_P100-2002.ucm ibm-5354_P100-1998.ucm\ | |
45 windows-936-2000.ucm gb18030.ucm\ | 43 windows-936-2000.ucm gb18030.ucm\ |
46 windows-950-2000.ucm ibm-1375_P100-2007.ucm\ | 44 windows-950-2000.ucm ibm-1375_P100-2007.ucm\ |
47 shift_jis-html.ucm euc-jp-html.ucm\ | 45 shift_jis-html.ucm euc-jp-html.ucm\ |
48 windows-949-2000.ucm\ | 46 windows-949-2000.ucm\ |
49 windows-874-2000.ucm\ | 47 windows-874-html.ucm \ |
50 macos-0_2-10.2.ucm macos-7_3-10.2.ucm\ | 48 macintosh-html.ucm x-mac-cyrillic-html.ucm\ |
51 ibm-878_P100-1996.ucm ibm-1168_P100-2002.ucm ibm866-html.ucm | 49 ibm866-html.ucm koi8-r-html.ucm koi8-u-html.ucm |
| 50 |
52 | 51 |
53 | 52 |
54 # Do not build EBCDIC converters. | 53 # Do not build EBCDIC converters. |
55 # ibm-37 and ibm-1047 are hardcoded in Makefile.in and | 54 # ibm-37 and ibm-1047 are hardcoded in Makefile.in and |
56 # they're removed by modifying the file. It's also hard-coded in makedata.mak for | 55 # they're removed by modifying the file. It's also hard-coded in makedata.mak for |
57 # Windows, but we don't have to touch it because the data dll is generated out of | 56 # Windows, but we don't have to touch it because the data dll is generated out of |
58 # icu*.dat file generated on Linux. | 57 # icu*.dat file generated on Linux. |
59 UCM_SOURCE_EBCDIC = | 58 UCM_SOURCE_EBCDIC = |
OLD | NEW |