Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(1)

Unified Diff: icu52.android/android/brkitr.patch

Issue 248043003: Check in the pre-built ICU data for Android (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/deps/third_party/
Patch Set: Created 6 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « icu52.android/README.chromium ('k') | icu52.android/android/icudtl.dat » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: icu52.android/android/brkitr.patch
===================================================================
--- icu52.android/android/brkitr.patch (revision 0)
+++ icu52.android/android/brkitr.patch (working copy)
@@ -1,93 +1,42 @@
-diff --git a/source/data/brkitr/brklocal.mk b/source/data/brkitr/brklocal.mk
-index 91754f1..ccac4d1 100644
---- a/source/data/brkitr/brklocal.mk
-+++ b/source/data/brkitr/brklocal.mk
-@@ -34,15 +34,15 @@ BRK_RES_ALIAS_SOURCE = $(BRK_RES_SYNTHETIC_ALIAS)
+Index: source/data/brkitr/word.txt
+===================================================================
+--- source/data/brkitr/word.txt (revision 264859)
++++ source/data/brkitr/word.txt (working copy)
+@@ -56,15 +56,13 @@
+ # 5.0 or later as the definition of Complex_Context was corrected to include all
+ # characters requiring dictionary break.
-
- # List of compact trie dictionary files (ctd).
--BRK_CTD_SOURCE = thaidict.txt cjdict.txt
-+BRK_CTD_SOURCE = thaidict.txt
-
-
- # List of break iterator files (brk).
--# Chrome change: remove word_ja.txt and line_he.txt
--BRK_SOURCE = sent_el.txt word_POSIX.txt line_fi.txt char.txt word.txt line.txt sent.txt title.txt char_th.txt
-+# Chrome change: remove line_he.txt
-+BRK_SOURCE = sent_el.txt word_POSIX.txt line_fi.txt word_ja.txt char.txt word.txt line.txt sent.txt title.txt char_th.txt
-
-
- # Ordinary resources
--# Chrome change: remove ja.txt and he.txt
-+# Chrome change: remove he.txt
- BRK_RES_SOURCE = el.txt en.txt en_US.txt en_US_POSIX.txt\
-- fi.txt th.txt
-+ fi.txt ja.txt th.txt
-diff --git a/source/data/brkitr/root.txt b/source/data/brkitr/root.txt
-index fb83ac3..5d839bd 100644
---- a/source/data/brkitr/root.txt
-+++ b/source/data/brkitr/root.txt
-@@ -17,8 +17,5 @@ root{
- }
- dictionaries{
- Thai:process(dependency){"thaidict.ctd"}
-- Hani:process(dependency){"cjdict.ctd"}
-- Hira:process(dependency){"cjdict.ctd"}
-- Kata:process(dependency){"cjdict.ctd"}
- }
- }
-diff --git a/source/data/brkitr/word.txt b/source/data/brkitr/word.txt
-index 0b49377..a0e1ceb 100644
---- a/source/data/brkitr/word.txt
-+++ b/source/data/brkitr/word.txt
-@@ -60,11 +60,10 @@ $Control = [\p{Grapheme_Cluster_Break = Control}];
+-$Control = [\p{Grapheme_Cluster_Break = Control}];
++$Control = [\p{Grapheme_Cluster_Break = Control}];
$HangulSyllable = [\uac00-\ud7a3];
$ComplexContext = [:LineBreak = Complex_Context:];
$KanaKanji = [$Han $Hiragana $Katakana];
-$dictionaryCJK = [$KanaKanji $HangulSyllable];
-$dictionary = [$ComplexContext $dictionaryCJK];
-+$dictionary = [:LineBreak = Complex_Context:];
++$dictionary = [$ComplexContext];
-# leave CJK scripts out of ALetterPlus
-$ALetterPlus = [$ALetter-$dictionaryCJK [$ComplexContext-$Extend-$Control]];
-+$ALetterPlus = [$ALetter [$dictionary-$Extend-$Control]]; # Note: default ALetter does not
-+ # include the dictionary characters.
++$ALetterPlus = [$ALetter [$ComplexContext-$Extend-$Control]];
#
-@@ -99,8 +98,7 @@ $CR $LF;
- # begins with a group of Format chars, or with a "word" consisting of a single
- # char that is not in any of the listed word break categories followed by
- # format char(s).
-- # format char(s), or is not a CJK dictionary character.
--[^$CR $LF $Newline $dictionaryCJK]? ($Extend | $Format)+;
-+[^$CR $LF $Newline]? ($Extend | $Format)+;
+@@ -166,11 +164,6 @@
- $NumericEx {100};
- $ALetterEx {200};
-@@ -155,9 +153,6 @@ $ExtendNumLetEx $ALetterEx {200}; # (13b)
- $ExtendNumLetEx $NumericEx {100}; # (13b)
- $ExtendNumLetEx $KatakanaEx {400}; # (13b)
+ $Regional_IndicatorEx $Regional_IndicatorEx;
-# special handling for CJK characters: chain for later dictionary segmentation
-$HangulSyllable $HangulSyllable {200};
--$KanaKanji $KanaKanji {400}; #different rule status if both kanji and kana found
-
-
+-$KanaKanji $KanaKanji {400}; # different rule status if both kana and kanji found
+-
+-
## -------------------------------------------------
-@@ -179,7 +174,7 @@ $BackHebrewLetEx = ($Format | $Extend)* $HebrewLet;
- $LF $CR;
- # rule 4
--($Format | $Extend)* [^$CR $LF $Newline $dictionaryCJK]?;
-+($Format | $Extend)* [^$CR $LF $Newline]?;
+ !!reverse;
+@@ -237,10 +230,6 @@
- # rule 5
+ $BackRegional_IndicatorEx $BackRegional_IndicatorEx;
-@@ -217,10 +212,6 @@ $BackKatakanaEx $BackKatakanaEx;
- $BackExtendNumLetEx ($BackALetterEx | $BackNumericEx | $BackKatakanaEx | $BackExtendNumLetEx);
- ($BackALetterEx | $BackNumericEx | $BackKatakanaEx) $BackExtendNumLetEx;
-
-# special handling for CJK characters: chain for later dictionary segmentation
-$HangulSyllable $HangulSyllable;
-$KanaKanji $KanaKanji; #different rule status if both kanji and kana found
@@ -95,3 +44,50 @@
## -------------------------------------------------
!!safe_reverse;
+Index: source/data/brkitr/brklocal.mk
+===================================================================
+--- source/data/brkitr/brklocal.mk (revision 264859)
++++ source/data/brkitr/brklocal.mk (working copy)
+@@ -34,13 +34,13 @@
+
+
+ # List of dictionary files (dict).
+-BRK_DICT_SOURCE = cjdict.txt khmerdict.txt laodict.txt thaidict.txt
++BRK_DICT_SOURCE = khmerdict.txt laodict.txt thaidict.txt
+
+
+ # List of break iterator files (brk).
+-BRK_SOURCE = char.txt line.txt line_fi.txt sent.txt sent_el.txt title.txt word.txt
++BRK_SOURCE = char.txt line.txt line_fi.txt sent.txt sent_el.txt title.txt word.txt word_ja.txt
+
+
+ # Ordinary resources
+-BRK_RES_SOURCE = el.txt en.txt en_US.txt fi.txt
++BRK_RES_SOURCE = el.txt en.txt en_US.txt fi.txt ja.txt
+
+Index: source/data/brkitr/root.txt
+===================================================================
+--- source/data/brkitr/root.txt (revision 264859)
++++ source/data/brkitr/root.txt (working copy)
+@@ -16,9 +16,6 @@
+ word:process(dependency){"word.brk"}
+ }
+ dictionaries{
+- Hani:process(dependency){"cjdict.dict"}
+- Hira:process(dependency){"cjdict.dict"}
+- Kata:process(dependency){"cjdict.dict"}
+ Khmr:process(dependency){"khmerdict.dict"}
+ Laoo:process(dependency){"laodict.dict"}
+ Thai:process(dependency){"thaidict.dict"}
+Index: source/data/brkitr/ja.txt
+===================================================================
+--- source/data/brkitr/ja.txt (revision 264859)
++++ source/data/brkitr/ja.txt (working copy)
+@@ -9,6 +9,6 @@
+ ja{
+ Version{"1.1"}
+ boundaries{
+- line:process(dependency){"line_ja.brk"}
++ word:process(dependency){"word_ja.brk"}
+ }
+ }
Property changes on: icu52.android/android/brkitr.patch
___________________________________________________________________
Added: svn:eol-style
+ LF
« no previous file with comments | « icu52.android/README.chromium ('k') | icu52.android/android/icudtl.dat » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698