Index: source/data/brkitr/line.txt |
=================================================================== |
--- source/data/brkitr/line.txt (revision 90787) |
+++ source/data/brkitr/line.txt (working copy) |
@@ -58,7 +58,12 @@ |
# |
# See rule LB 19 for an example. |
# |
+$SmallHira = [\u3041 \u3043 \u3045 \u3047 \u3049 \u3063 \u3083 \u3085 \u3087 \u308E \u3095 \u3096]; # small hiragana letters |
+$SmallKata = [\u30A1 \u30A3 \u30A5 \u30A7 \u30A9 \u30C3 \u30E3 \u30E5 \u30E7 \u30EE \u30F5 \u30F6]; # small katakana letters |
+$SmallKataExt = [\u31F0-\u31FF]; # Katakana Phonetic Extensions block (16 small katakana) |
+$SmallKanaAndProlongedMark = [$SmallHira $SmallKata $SmallKataExt \u30FC]; # \u30FC = prolonged sound mark; used by $ID and $NS below |
+ |
$AI = [:LineBreak = Ambiguous:]; |
$AL = [[:LineBreak = Alphabetic:] - [[:Hebrew:] & [:Letter:]] - [\u23B4\u23B5]]; |
$HL = [[:Hebrew:] & [:Letter:]]; |
@@ -77,7 +82,7 @@ |
$HY = [:LineBreak = Hyphen:]; |
$H2 = [:LineBreak = H2:]; |
$H3 = [:LineBreak = H3:]; |
-$ID = [[:LineBreak = Ideographic:] - [\uFE51]]; |
+$ID = [[[:LineBreak = Ideographic:] - [\uFE51]] [$SmallKanaAndProlongedMark]]; # ID additionally covers the small kana / prolonged mark set (removed from $NS) |
$IN = [:LineBreak = Inseperable:]; |
$IS = [[:LineBreak = Infix_Numeric:] - [\uFE10]]; |
$JL = [:LineBreak = JL:]; |
@@ -85,7 +90,7 @@ |
$JT = [:LineBreak = JT:]; |
$LF = [:LineBreak = Line_Feed:]; |
$NL = [:LineBreak = Next_Line:]; |
-$NS = [:LineBreak = Nonstarter:]; |
+$NS = [[:LineBreak = Nonstarter:] - [$SmallKanaAndProlongedMark]]; # small kana / prolonged mark are taken out of NS and handled as $ID; presumably to permit a break before them - confirm against UAX #14 |
$NU = [:LineBreak = Numeric:]; |
$OP = [[:LineBreak = Open_Punctuation:] \u23B4]; |
$PO = [:LineBreak = Postfix_Numeric:]; |