OLD | NEW |
1 # | 1 # |
2 # Copyright (C) 2002-2013, International Business Machines Corporation | 2 # Copyright (C) 2002-2014, International Business Machines Corporation |
3 # and others. All Rights Reserved. | 3 # and others. All Rights Reserved. |
4 # | 4 # |
5 # file: word_POSIX.txt | 5 # file: word_POSIX.txt |
6 # | 6 # |
7 # ICU Word Break Rules, POSIX locale. | 7 # ICU Word Break Rules, POSIX locale. |
8 # See Unicode Standard Annex #29. | 8 # See Unicode Standard Annex #29. |
9 # These rules are based on UAX #29 Revision 22 for Unicode Version 6.3 | 9 # These rules are based on UAX #29 Revision 22 for Unicode Version 6.3 |
10 # | 10 # |
11 # Note: Updates to word.txt will usually need to be merged into | 11 # Note: Updates to word.txt will usually need to be merged into |
12 # word_POSIX.txt also. | 12 # word_POSIX.txt also. |
(...skipping 16 matching lines...) Expand all Loading... |
29 $Newline = [\p{Word_Break = Newline}]; | 29 $Newline = [\p{Word_Break = Newline}]; |
30 $Extend = [\p{Word_Break = Extend}]; | 30 $Extend = [\p{Word_Break = Extend}]; |
31 $Regional_Indicator = [\p{Word_Break = Regional_Indicator}]; | 31 $Regional_Indicator = [\p{Word_Break = Regional_Indicator}]; |
32 $Format = [\p{Word_Break = Format}]; | 32 $Format = [\p{Word_Break = Format}]; |
33 $Katakana = [\p{Word_Break = Katakana}]; | 33 $Katakana = [\p{Word_Break = Katakana}]; |
34 $Hebrew_Letter = [\p{Word_Break = Hebrew_Letter}]; | 34 $Hebrew_Letter = [\p{Word_Break = Hebrew_Letter}]; |
35 $ALetter = [\p{Word_Break = ALetter}]; | 35 $ALetter = [\p{Word_Break = ALetter}]; |
36 $Single_Quote = [\p{Word_Break = Single_Quote}]; | 36 $Single_Quote = [\p{Word_Break = Single_Quote}]; |
37 $Double_Quote = [\p{Word_Break = Double_Quote}]; | 37 $Double_Quote = [\p{Word_Break = Double_Quote}]; |
38 $MidNumLet = [\p{Word_Break = MidNumLet} - [.]]; | 38 $MidNumLet = [\p{Word_Break = MidNumLet} - [.]]; |
39 $MidLetter = [\p{Word_Break = MidLetter}]; | 39 $MidLetter = [\p{Word_Break = MidLetter} - [\:]]; |
40 $MidNum = [\p{Word_Break = MidNum} [.]]; | 40 $MidNum = [\p{Word_Break = MidNum} [.]]; |
41 $Numeric = [\p{Word_Break = Numeric}]; | 41 $Numeric = [\p{Word_Break = Numeric}]; |
42 $ExtendNumLet = [\p{Word_Break = ExtendNumLet}]; | 42 $ExtendNumLet = [\p{Word_Break = ExtendNumLet}]; |
43 | 43 |
44 $Han = [:Han:]; | 44 $Han = [:Han:]; |
45 $Hiragana = [:Hiragana:]; | 45 $Hiragana = [:Hiragana:]; |
46 | 46 |
47 | 47 |
48 # Dictionary character set, for triggering language-based break engines. Currently | 48 # Dictionary character set, for triggering language-based break engines. Currently |
49 # limited to LineBreak=Complex_Context. Note that this set only works in Unicode | 49 # limited to LineBreak=Complex_Context. Note that this set only works in Unicode |
(...skipping 216 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
266 ($MidLetterEx | $MidNumLetEx | $Single_QuoteEx) ($ALetterEx | $Hebrew_LetterEx); | 266 ($MidLetterEx | $MidNumLetEx | $Single_QuoteEx) ($ALetterEx | $Hebrew_LetterEx); |
267 | 267 |
268 # rule 7b | 268 # rule 7b |
269 $Double_QuoteEx $Hebrew_LetterEx; | 269 $Double_QuoteEx $Hebrew_LetterEx; |
270 | 270 |
271 # rule 11 | 271 # rule 11 |
272 ($MidNumEx | $MidNumLetEx | $Single_QuoteEx) $NumericEx; | 272 ($MidNumEx | $MidNumLetEx | $Single_QuoteEx) $NumericEx; |
273 | 273 |
274 # For dictionary-based break | 274 # For dictionary-based break |
275 $dictionary $dictionary; | 275 $dictionary $dictionary; |
OLD | NEW |