Index: icu46/source/data/brkitr/char_th.txt |
=================================================================== |
--- icu46/source/data/brkitr/char_th.txt (revision 0) |
+++ icu46/source/data/brkitr/char_th.txt (revision 0) |
@@ -0,0 +1,63 @@ |
+# |
+# Copyright (C) 2002-2010, International Business Machines Corporation and others. |
+# All Rights Reserved. |
+# |
+# file: char_th.txt |
+# |
+# ICU Character Break Rules, also known as Grapheme Cluster Boundaries |
+# See Unicode Standard Annex #29. |
+# These rules are based on TR29 Revision 16, for Unicode Version 6.0 |
+# |
+ |
+# |
+# Character Class Definitions. |
+# |
+$CR = [\p{Grapheme_Cluster_Break = CR}]; |
+$LF = [\p{Grapheme_Cluster_Break = LF}]; |
+$Control = [\p{Grapheme_Cluster_Break = Control}]; |
+$Extend = [\p{Grapheme_Cluster_Break = Extend} + [\u0E33 \u0EB3]]; |
+ |
+# |
+# Korean Syllable Definitions |
+# |
+$L = [\p{Grapheme_Cluster_Break = L}]; |
+$V = [\p{Grapheme_Cluster_Break = V}]; |
+$T = [\p{Grapheme_Cluster_Break = T}]; |
+ |
+$LV = [\p{Grapheme_Cluster_Break = LV}]; |
+$LVT = [\p{Grapheme_Cluster_Break = LVT}]; |
+ |
+ |
+## ------------------------------------------------- |
+!!chain; |
+ |
+!!forward; |
+ |
+$CR $LF; |
+ |
+$L ($L | $V | $LV | $LVT); |
+($LV | $V) ($V | $T); |
+($LVT | $T) $T; |
+ |
+[^$Control $CR $LF] $Extend; |
+ |
+## ------------------------------------------------- |
+ |
+!!reverse; |
+$LF $CR; |
+($L | $V | $LV | $LVT) $L; |
+($V | $T) ($LV | $V); |
+$T ($LVT | $T); |
+ |
+$Extend [^$Control $CR $LF]; |
+ |
+ |
+## ------------------------------------------------- |
+ |
+!!safe_reverse; |
+ |
+ |
+## ------------------------------------------------- |
+ |
+!!safe_forward; |
+ |
Property changes on: icu46/source/data/brkitr/char_th.txt |
___________________________________________________________________ |
Added: svn:eol-style |
+ LF |