OLD | NEW |
1 # *************************************************************************** | 1 # *************************************************************************** |
2 # * | 2 # * |
3 # * Copyright (C) 1995-2014, International Business Machines | 3 # * Copyright (C) 1995-2014, International Business Machines |
4 # * Corporation and others. All Rights Reserved. | 4 # * Corporation and others. All Rights Reserved. |
5 # * | 5 # * |
6 # * Generated per the algorithm for Big5 | 6 # * Generated per the algorithm for Big5 |
7 # * described at http://encoding.spec.whatwg.org/#big5 | 7 # * described at http://encoding.spec.whatwg.org/#big5 |
8 # * | 8 # * |
9 # *************************************************************************** | 9 # *************************************************************************** |
10 <code_set_name> "big5-html" | 10 <code_set_name> "big5-html" |
11 <char_name_mask> "AXXXX" | 11 <char_name_mask> "AXXXX" |
12 <mb_cur_max> 2 | 12 <mb_cur_max> 2 |
13 <mb_cur_min> 1 | 13 <mb_cur_min> 1 |
14 <uconv_class> "MBCS" | 14 <uconv_class> "MBCS" |
15 <subchar> \x3F | 15 <subchar> \x3F |
16 <icu:charsetFamily> "ASCII" | 16 <icu:charsetFamily> "ASCII" |
17 | 17 |
18 # 'p' is for the range that may produce non-BMP code points. | 18 # 'p' is for the range that may produce non-BMP code points. |
| 19 # 'i' marks a byte or byte range as illegal. |
| 20 # Big5 has many small holes in its 2nd-byte range. If a hole's 2nd byte is in |
| 21 # the ASCII range, that byte has to be added back to the stream to comply with |
| 22 # the encoding spec. Each additional state adds 1 kB to the data size. |
19 # See http://userguide.icu-project.org/conversion/data. | 23 # See http://userguide.icu-project.org/conversion/data. |
20 <icu:state> 0-7f, 87-fe:1, 87-a0:2, c8:2, fa-fe:2 | 24 <icu:state> 0-7f, a1-fe:1, 87-a0:2, c8:2, fa-fe:2, 87:3, 89:4,
8a:5, 8b:6, 8d:7, 9b:8, 9f:9, a0:a |
21 <icu:state> 40-7e, a1-fe | 25 <icu:state> 40-7e, a1-fe |
22 <icu:state> 40-7e.p, a1-fe.p | 26 <icu:state> 40-7e.p, a1-fe.p |
| 27 <icu:state> 40-7e.p, a1-fe.p, 66.i |
| 28 <icu:state> 40-7e.p, a1-fe.p, 42.i, 44.i, 45.i, 4a-4b.i |
| 29 <icu:state> 40-7e.p, a1-fe.p, 42.i, 63.i, 75.i |
| 30 <icu:state> 40-7e.p, a1-fe.p, 54.i |
| 31 <icu:state> 40-7e.p, a1-fe.p, 41.i |
| 32 <icu:state> 40-7e.p, a1-fe.p, 61.i |
| 33 <icu:state> 40-7e.p, a1-fe.p, 4e.i |
| 34 <icu:state> 40-7e.p, a1-fe.p, 54.i, 57.i, 5a.i, 62.i, 72.i |
23 | 35 |
24 CHARMAP | 36 CHARMAP |
25 <U0000> \x00 |0 | 37 <U0000> \x00 |0 |
26 <U0001> \x01 |0 | 38 <U0001> \x01 |0 |
27 <U0002> \x02 |0 | 39 <U0002> \x02 |0 |
28 <U0003> \x03 |0 | 40 <U0003> \x03 |0 |
29 <U0004> \x04 |0 | 41 <U0004> \x04 |0 |
30 <U0005> \x05 |0 | 42 <U0005> \x05 |0 |
31 <U0006> \x06 |0 | 43 <U0006> \x06 |0 |
32 <U0007> \x07 |0 | 44 <U0007> \x07 |0 |
(...skipping 18705 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
18738 <U2F840> \xA0\x47 |3 | 18750 <U2F840> \xA0\x47 |3 |
18739 <U2F878> \x8B\xC3 |3 | 18751 <U2F878> \x8B\xC3 |3 |
18740 <U2F894> \xFC\x48 |0 | 18752 <U2F894> \xFC\x48 |0 |
18741 <U2F8A6> \xFC\x77 |0 | 18753 <U2F8A6> \xFC\x77 |0 |
18742 <U2F8CD> \x9C\x52 |3 | 18754 <U2F8CD> \x9C\x52 |3 |
18743 <U2F994> \x8E\xFD |3 | 18755 <U2F994> \x8E\xFD |3 |
18744 <U2F9B2> \x8F\xA8 |3 | 18756 <U2F9B2> \x8F\xA8 |3 |
18745 <U2F9BC> \x95\x7A |3 | 18757 <U2F9BC> \x95\x7A |3 |
18746 <U2F9D4> \x8F\xF0 |3 | 18758 <U2F9D4> \x8F\xF0 |3 |
18747 END CHARMAP | 18759 END CHARMAP |
OLD | NEW |