| Index: icu46/source/test/testdata/test4.ucm
|
| ===================================================================
|
| --- icu46/source/test/testdata/test4.ucm (revision 0)
|
| +++ icu46/source/test/testdata/test4.ucm (revision 0)
|
| @@ -0,0 +1,64 @@
|
| +# *******************************************************************************
|
| +# * Copyright (C) 2001-2003, International Business Machines
|
| +# * Corporation and others. All Rights Reserved.
|
| +# *******************************************************************************
|
| +#
|
| +# test4.ucm
|
| +#
|
| +# Test file for MBCS conversion with four-byte codepage data.
|
| +
|
| +<code_set_name> "test4"
|
| +<mb_cur_max> 4
|
| +<mb_cur_min> 1
|
| +<uconv_class> "MBCS"
|
| +
|
| +# Both substitution characters are single bytes, which does not make sense
|
| +# but works. <subchar1> was added for new tests; <subchar> is left as is
|
| +# so that the old tests do not have to change -- markus 20031028
|
| +<subchar> \xff
|
| +<subchar1> \xe1
|
| +<icu:state> 0, 1:1, 5-9, e1, ff
|
| +<icu:state> 2:2
|
| +<icu:state> 3:3
|
| +<icu:state> a-f.p, ff
|
| +
|
| +CHARMAP
|
| +
|
| +# fromUnicode result is a zero byte for a code point other than U+0000
|
| +<U20ac> \x00 |0
|
| +
|
| +# a fallback from a non-zero code point to a zero byte is possible with the extension table
|
| +<U20ad> \x00 |1
|
| +
|
| +# nothing special
|
| +<U0005> \x05 |0
|
| +
|
| +# toUnicode result is fallback direct
|
| +<U0006> \x06 |3
|
| +
|
| +# toUnicode result is direct non-BMP code point
|
| +<U101234> \x07 |0
|
| +<Ufebcd> \x08 |3
|
| +
|
| +#unassigned \x09
|
| +
|
| +# toUnicode result is surrogate pair: test real pair, single unit, unassigned
|
| +<U23456> \x01\x02\x03\x0a |0
|
| +<U000b> \x01\x02\x03\x0b |0
|
| +#unassigned \x01\x02\x03\x0c
|
| +<U34567> \x01\x02\x03\x0d |3
|
| +<U000e> \x01\x02\x03\x0e |3
|
| +#unassigned \x01\x02\x03\x0f
|
| +
|
| +# <subchar1> non-mapping
|
| +<U50005> \xe1 |2
|
| +# add a mapping that turns the above's Unicode side into a prefix
|
| +<U50005><U60006> \x06 |1
|
| +
|
| +# many bytes, and bytes per UChar
|
| +<U30ab><U309a> \x01\x02\x03\x0a\x01\x02\x03\x0b\x01\x02\x03\x0c\x01\x02\x03\x0d\x01\x02\x03\x0e\x01\x02\x03\x0f\x01\x02\x03\x0a\x05\x06\x07 |0
|
| +
|
| +# many UChars, and UChars per byte
|
| +<U304b><U309a><U304d><U309a><U304f><U309a><U3051><U309a><U3053><U309a><U30ab><U309a><U30ad><U309a><U30af><U309a><U30b1><U309a><U0300> \x08\x09 |0
|
| +
|
| +END CHARMAP
|
|
|