Index: icu46/source/i18n/regexcst.h |
=================================================================== |
--- icu46/source/i18n/regexcst.h (revision 0) |
+++ icu46/source/i18n/regexcst.h (revision 0) |
@@ -0,0 +1,504 @@ |
+//--------------------------------------------------------------------------------- |
+// |
+// Generated Header File. Do not edit by hand. |
+// This file contains the state table for the ICU Regular Expression Pattern Parser |
+// It is generated by the Perl script "regexcst.pl" from |
+// the rule parser state definitions file "regexcst.txt". |
+// |
+// Copyright (C) 2002-2007 International Business Machines Corporation |
+// and others. All rights reserved. |
+// |
+//--------------------------------------------------------------------------------- |
+#ifndef RBBIRPT_H |
+#define RBBIRPT_H |
+ |
+U_NAMESPACE_BEGIN |
+// |
+// Character classes for regex pattern scanning. |
+// |
+ static const uint8_t kRuleSet_digit_char = 128; |
+ static const uint8_t kRuleSet_rule_char = 129; |
+ |
+ |
+enum Regex_PatternParseAction { |
+ doLiteralChar, |
+ doSetEnd, |
+ doBackslashA, |
+ doSetBeginUnion, |
+ doNOP, |
+ doSetBackslash_w, |
+ doSetRange, |
+ doBackslashG, |
+ doPerlInline, |
+ doSetAddDash, |
+ doIntevalLowerDigit, |
+ doProperty, |
+ doBackslashX, |
+ doOpenAtomicParen, |
+ doSetLiteralEscaped, |
+ doPatFinish, |
+ doSetBackslash_D, |
+ doSetDifference2, |
+ doNamedChar, |
+ doNGPlus, |
+ doOpenLookBehindNeg, |
+ doIntervalError, |
+ doIntervalSame, |
+ doBackRef, |
+ doPlus, |
+ doOpenCaptureParen, |
+ doMismatchedParenErr, |
+ doBeginMatchMode, |
+ doEscapeError, |
+ doOpenNonCaptureParen, |
+ doDollar, |
+ doSetProp, |
+ doIntervalUpperDigit, |
+ doSetBegin, |
+ doBackslashs, |
+ doOpenLookBehind, |
+ doSetMatchMode, |
+ doOrOperator, |
+ doCaret, |
+ doMatchModeParen, |
+ doStar, |
+ doOpt, |
+ doMatchMode, |
+ doSuppressComments, |
+ doPossessiveInterval, |
+ doOpenLookAheadNeg, |
+ doBackslashW, |
+ doCloseParen, |
+ doSetOpError, |
+ doIntervalInit, |
+ doSetFinish, |
+ doSetIntersection2, |
+ doNGStar, |
+ doEnterQuoteMode, |
+ doSetAddAmp, |
+ doBackslashB, |
+ doBackslashw, |
+ doPossessiveOpt, |
+ doSetNegate, |
+ doRuleError, |
+ doBackslashb, |
+ doConditionalExpr, |
+ doPossessivePlus, |
+ doBadOpenParenType, |
+ doNGInterval, |
+ doSetLiteral, |
+ doSetNamedChar, |
+ doBackslashd, |
+ doSetBeginDifference1, |
+ doBackslashD, |
+ doExit, |
+ doSetBackslash_S, |
+ doInterval, |
+ doSetNoCloseError, |
+ doNGOpt, |
+ doSetPosixProp, |
+ doBackslashS, |
+ doBackslashZ, |
+ doSetBeginIntersection1, |
+ doSetBackslash_W, |
+ doSetBackslash_d, |
+ doOpenLookAhead, |
+ doBadModeFlag, |
+ doPatStart, |
+ doSetNamedRange, |
+ doPossessiveStar, |
+ doEscapedLiteralChar, |
+ doSetBackslash_s, |
+ doBackslashz, |
+ doDotAny, |
+ rbbiLastAction}; |
+ |
+//------------------------------------------------------------------------------- |
+// |
+// RegexTableEl represents the structure of a row in the transition table |
+// for the pattern parser state machine. |
+//------------------------------------------------------------------------------- |
+struct RegexTableEl { |
+ Regex_PatternParseAction fAction; |
+ uint8_t fCharClass; // 0-127: an individual ASCII character |
+ // 128-255: character class index |
+ uint8_t fNextState; // 0-250: normal next-state numbers |
+ // 255: pop next-state from stack. |
+ uint8_t fPushState; |
+ UBool fNextChar; |
+}; |
+ |
+static const struct RegexTableEl gRuleParseStateTable[] = { |
+ {doNOP, 0, 0, 0, TRUE} |
+ , {doPatStart, 255, 2,0, FALSE} // 1 start |
+ , {doLiteralChar, 254, 14,0, TRUE} // 2 term |
+ , {doLiteralChar, 129, 14,0, TRUE} // 3 |
+ , {doSetBegin, 91 /* [ */, 104, 182, TRUE} // 4 |
+ , {doNOP, 40 /* ( */, 27,0, TRUE} // 5 |
+ , {doDotAny, 46 /* . */, 14,0, TRUE} // 6 |
+ , {doCaret, 94 /* ^ */, 14,0, TRUE} // 7 |
+ , {doDollar, 36 /* $ */, 14,0, TRUE} // 8 |
+ , {doNOP, 92 /* \ */, 84,0, TRUE} // 9 |
+ , {doOrOperator, 124 /* | */, 2,0, TRUE} // 10 |
+ , {doCloseParen, 41 /* ) */, 255,0, TRUE} // 11 |
+ , {doPatFinish, 253, 2,0, FALSE} // 12 |
+ , {doRuleError, 255, 183,0, FALSE} // 13 |
+ , {doNOP, 42 /* * */, 63,0, TRUE} // 14 expr-quant |
+ , {doNOP, 43 /* + */, 66,0, TRUE} // 15 |
+ , {doNOP, 63 /* ? */, 69,0, TRUE} // 16 |
+ , {doIntervalInit, 123 /* { */, 72,0, TRUE} // 17 |
+ , {doNOP, 40 /* ( */, 23,0, TRUE} // 18 |
+ , {doNOP, 255, 20,0, FALSE} // 19 |
+ , {doOrOperator, 124 /* | */, 2,0, TRUE} // 20 expr-cont |
+ , {doCloseParen, 41 /* ) */, 255,0, TRUE} // 21 |
+ , {doNOP, 255, 2,0, FALSE} // 22 |
+ , {doSuppressComments, 63 /* ? */, 25,0, TRUE} // 23 open-paren-quant |
+ , {doNOP, 255, 27,0, FALSE} // 24 |
+ , {doNOP, 35 /* # */, 49, 14, TRUE} // 25 open-paren-quant2 |
+ , {doNOP, 255, 29,0, FALSE} // 26 |
+ , {doSuppressComments, 63 /* ? */, 29,0, TRUE} // 27 open-paren |
+ , {doOpenCaptureParen, 255, 2, 14, FALSE} // 28 |
+ , {doOpenNonCaptureParen, 58 /* : */, 2, 14, TRUE} // 29 open-paren-extended |
+ , {doOpenAtomicParen, 62 /* > */, 2, 14, TRUE} // 30 |
+ , {doOpenLookAhead, 61 /* = */, 2, 20, TRUE} // 31 |
+ , {doOpenLookAheadNeg, 33 /* ! */, 2, 20, TRUE} // 32 |
+ , {doNOP, 60 /* < */, 46,0, TRUE} // 33 |
+ , {doNOP, 35 /* # */, 49, 2, TRUE} // 34 |
+ , {doBeginMatchMode, 105 /* i */, 52,0, FALSE} // 35 |
+ , {doBeginMatchMode, 100 /* d */, 52,0, FALSE} // 36 |
+ , {doBeginMatchMode, 109 /* m */, 52,0, FALSE} // 37 |
+ , {doBeginMatchMode, 115 /* s */, 52,0, FALSE} // 38 |
+ , {doBeginMatchMode, 117 /* u */, 52,0, FALSE} // 39 |
+ , {doBeginMatchMode, 119 /* w */, 52,0, FALSE} // 40 |
+ , {doBeginMatchMode, 120 /* x */, 52,0, FALSE} // 41 |
+ , {doBeginMatchMode, 45 /* - */, 52,0, FALSE} // 42 |
+ , {doConditionalExpr, 40 /* ( */, 183,0, TRUE} // 43 |
+ , {doPerlInline, 123 /* { */, 183,0, TRUE} // 44 |
+ , {doBadOpenParenType, 255, 183,0, FALSE} // 45 |
+ , {doOpenLookBehind, 61 /* = */, 2, 20, TRUE} // 46 open-paren-lookbehind |
+ , {doOpenLookBehindNeg, 33 /* ! */, 2, 20, TRUE} // 47 |
+ , {doBadOpenParenType, 255, 183,0, FALSE} // 48 |
+ , {doNOP, 41 /* ) */, 255,0, TRUE} // 49 paren-comment |
+ , {doMismatchedParenErr, 253, 183,0, FALSE} // 50 |
+ , {doNOP, 255, 49,0, TRUE} // 51 |
+ , {doMatchMode, 105 /* i */, 52,0, TRUE} // 52 paren-flag |
+ , {doMatchMode, 100 /* d */, 52,0, TRUE} // 53 |
+ , {doMatchMode, 109 /* m */, 52,0, TRUE} // 54 |
+ , {doMatchMode, 115 /* s */, 52,0, TRUE} // 55 |
+ , {doMatchMode, 117 /* u */, 52,0, TRUE} // 56 |
+ , {doMatchMode, 119 /* w */, 52,0, TRUE} // 57 |
+ , {doMatchMode, 120 /* x */, 52,0, TRUE} // 58 |
+ , {doMatchMode, 45 /* - */, 52,0, TRUE} // 59 |
+ , {doSetMatchMode, 41 /* ) */, 2,0, TRUE} // 60 |
+ , {doMatchModeParen, 58 /* : */, 2, 14, TRUE} // 61 |
+ , {doBadModeFlag, 255, 183,0, FALSE} // 62 |
+ , {doNGStar, 63 /* ? */, 20,0, TRUE} // 63 quant-star |
+ , {doPossessiveStar, 43 /* + */, 20,0, TRUE} // 64 |
+ , {doStar, 255, 20,0, FALSE} // 65 |
+ , {doNGPlus, 63 /* ? */, 20,0, TRUE} // 66 quant-plus |
+ , {doPossessivePlus, 43 /* + */, 20,0, TRUE} // 67 |
+ , {doPlus, 255, 20,0, FALSE} // 68 |
+ , {doNGOpt, 63 /* ? */, 20,0, TRUE} // 69 quant-opt |
+ , {doPossessiveOpt, 43 /* + */, 20,0, TRUE} // 70 |
+ , {doOpt, 255, 20,0, FALSE} // 71 |
+ , {doNOP, 128, 74,0, FALSE} // 72 interval-open |
+ , {doIntervalError, 255, 183,0, FALSE} // 73 |
+ , {doIntevalLowerDigit, 128, 74,0, TRUE} // 74 interval-lower |
+ , {doNOP, 44 /* , */, 78,0, TRUE} // 75 |
+ , {doIntervalSame, 125 /* } */, 81,0, TRUE} // 76 |
+ , {doIntervalError, 255, 183,0, FALSE} // 77 |
+ , {doIntervalUpperDigit, 128, 78,0, TRUE} // 78 interval-upper |
+ , {doNOP, 125 /* } */, 81,0, TRUE} // 79 |
+ , {doIntervalError, 255, 183,0, FALSE} // 80 |
+ , {doNGInterval, 63 /* ? */, 20,0, TRUE} // 81 interval-type |
+ , {doPossessiveInterval, 43 /* + */, 20,0, TRUE} // 82 |
+ , {doInterval, 255, 20,0, FALSE} // 83 |
+ , {doBackslashA, 65 /* A */, 2,0, TRUE} // 84 backslash |
+ , {doBackslashB, 66 /* B */, 2,0, TRUE} // 85 |
+ , {doBackslashb, 98 /* b */, 2,0, TRUE} // 86 |
+ , {doBackslashd, 100 /* d */, 14,0, TRUE} // 87 |
+ , {doBackslashD, 68 /* D */, 14,0, TRUE} // 88 |
+ , {doBackslashG, 71 /* G */, 2,0, TRUE} // 89 |
+ , {doNamedChar, 78 /* N */, 14,0, FALSE} // 90 |
+ , {doProperty, 112 /* p */, 14,0, FALSE} // 91 |
+ , {doProperty, 80 /* P */, 14,0, FALSE} // 92 |
+ , {doEnterQuoteMode, 81 /* Q */, 2,0, TRUE} // 93 |
+ , {doBackslashS, 83 /* S */, 14,0, TRUE} // 94 |
+ , {doBackslashs, 115 /* s */, 14,0, TRUE} // 95 |
+ , {doBackslashW, 87 /* W */, 14,0, TRUE} // 96 |
+ , {doBackslashw, 119 /* w */, 14,0, TRUE} // 97 |
+ , {doBackslashX, 88 /* X */, 14,0, TRUE} // 98 |
+ , {doBackslashZ, 90 /* Z */, 2,0, TRUE} // 99 |
+ , {doBackslashz, 122 /* z */, 2,0, TRUE} // 100 |
+ , {doBackRef, 128, 14,0, TRUE} // 101 |
+ , {doEscapeError, 253, 183,0, FALSE} // 102 |
+ , {doEscapedLiteralChar, 255, 14,0, TRUE} // 103 |
+ , {doSetNegate, 94 /* ^ */, 107,0, TRUE} // 104 set-open |
+ , {doSetPosixProp, 58 /* : */, 109,0, FALSE} // 105 |
+ , {doNOP, 255, 107,0, FALSE} // 106 |
+ , {doSetLiteral, 93 /* ] */, 122,0, TRUE} // 107 set-open2 |
+ , {doNOP, 255, 112,0, FALSE} // 108 |
+ , {doSetEnd, 93 /* ] */, 255,0, TRUE} // 109 set-posix |
+ , {doNOP, 58 /* : */, 112,0, FALSE} // 110 |
+ , {doRuleError, 255, 183,0, FALSE} // 111 |
+ , {doSetEnd, 93 /* ] */, 255,0, TRUE} // 112 set-start |
+ , {doSetBeginUnion, 91 /* [ */, 104, 129, TRUE} // 113 |
+ , {doNOP, 92 /* \ */, 172,0, TRUE} // 114 |
+ , {doNOP, 45 /* - */, 118,0, TRUE} // 115 |
+ , {doNOP, 38 /* & */, 120,0, TRUE} // 116 |
+ , {doSetLiteral, 255, 122,0, TRUE} // 117 |
+ , {doRuleError, 45 /* - */, 183,0, FALSE} // 118 set-start-dash |
+ , {doSetAddDash, 255, 122,0, FALSE} // 119 |
+ , {doRuleError, 38 /* & */, 183,0, FALSE} // 120 set-start-amp |
+ , {doSetAddAmp, 255, 122,0, FALSE} // 121 |
+ , {doSetEnd, 93 /* ] */, 255,0, TRUE} // 122 set-after-lit |
+ , {doSetBeginUnion, 91 /* [ */, 104, 129, TRUE} // 123 |
+ , {doNOP, 45 /* - */, 159,0, TRUE} // 124 |
+ , {doNOP, 38 /* & */, 150,0, TRUE} // 125 |
+ , {doNOP, 92 /* \ */, 172,0, TRUE} // 126 |
+ , {doSetNoCloseError, 253, 183,0, FALSE} // 127 |
+ , {doSetLiteral, 255, 122,0, TRUE} // 128 |
+ , {doSetEnd, 93 /* ] */, 255,0, TRUE} // 129 set-after-set |
+ , {doSetBeginUnion, 91 /* [ */, 104, 129, TRUE} // 130 |
+ , {doNOP, 45 /* - */, 152,0, TRUE} // 131 |
+ , {doNOP, 38 /* & */, 147,0, TRUE} // 132 |
+ , {doNOP, 92 /* \ */, 172,0, TRUE} // 133 |
+ , {doSetNoCloseError, 253, 183,0, FALSE} // 134 |
+ , {doSetLiteral, 255, 122,0, TRUE} // 135 |
+ , {doSetEnd, 93 /* ] */, 255,0, TRUE} // 136 set-after-range |
+ , {doSetBeginUnion, 91 /* [ */, 104, 129, TRUE} // 137 |
+ , {doNOP, 45 /* - */, 155,0, TRUE} // 138 |
+ , {doNOP, 38 /* & */, 157,0, TRUE} // 139 |
+ , {doNOP, 92 /* \ */, 172,0, TRUE} // 140 |
+ , {doSetNoCloseError, 253, 183,0, FALSE} // 141 |
+ , {doSetLiteral, 255, 122,0, TRUE} // 142 |
+ , {doSetBeginUnion, 91 /* [ */, 104, 129, TRUE} // 143 set-after-op |
+ , {doSetOpError, 93 /* ] */, 183,0, FALSE} // 144 |
+ , {doNOP, 92 /* \ */, 172,0, TRUE} // 145 |
+ , {doSetLiteral, 255, 122,0, TRUE} // 146 |
+ , {doSetBeginIntersection1, 91 /* [ */, 104, 129, TRUE} // 147 set-set-amp |
+ , {doSetIntersection2, 38 /* & */, 143,0, TRUE} // 148 |
+ , {doSetAddAmp, 255, 122,0, FALSE} // 149 |
+ , {doSetIntersection2, 38 /* & */, 143,0, TRUE} // 150 set-lit-amp |
+ , {doSetAddAmp, 255, 122,0, FALSE} // 151 |
+ , {doSetBeginDifference1, 91 /* [ */, 104, 129, TRUE} // 152 set-set-dash |
+ , {doSetDifference2, 45 /* - */, 143,0, TRUE} // 153 |
+ , {doSetAddDash, 255, 122,0, FALSE} // 154 |
+ , {doSetDifference2, 45 /* - */, 143,0, TRUE} // 155 set-range-dash |
+ , {doSetAddDash, 255, 122,0, FALSE} // 156 |
+ , {doSetIntersection2, 38 /* & */, 143,0, TRUE} // 157 set-range-amp |
+ , {doSetAddAmp, 255, 122,0, FALSE} // 158 |
+ , {doSetDifference2, 45 /* - */, 143,0, TRUE} // 159 set-lit-dash |
+ , {doSetAddDash, 91 /* [ */, 122,0, FALSE} // 160 |
+ , {doSetAddDash, 93 /* ] */, 122,0, FALSE} // 161 |
+ , {doNOP, 92 /* \ */, 164,0, TRUE} // 162 |
+ , {doSetRange, 255, 136,0, TRUE} // 163 |
+ , {doSetOpError, 115 /* s */, 183,0, FALSE} // 164 set-lit-dash-escape |
+ , {doSetOpError, 83 /* S */, 183,0, FALSE} // 165 |
+ , {doSetOpError, 119 /* w */, 183,0, FALSE} // 166 |
+ , {doSetOpError, 87 /* W */, 183,0, FALSE} // 167 |
+ , {doSetOpError, 100 /* d */, 183,0, FALSE} // 168 |
+ , {doSetOpError, 68 /* D */, 183,0, FALSE} // 169 |
+ , {doSetNamedRange, 78 /* N */, 136,0, FALSE} // 170 |
+ , {doSetRange, 255, 136,0, TRUE} // 171 |
+ , {doSetProp, 112 /* p */, 129,0, FALSE} // 172 set-escape |
+ , {doSetProp, 80 /* P */, 129,0, FALSE} // 173 |
+ , {doSetNamedChar, 78 /* N */, 122,0, FALSE} // 174 |
+ , {doSetBackslash_s, 115 /* s */, 136,0, TRUE} // 175 |
+ , {doSetBackslash_S, 83 /* S */, 136,0, TRUE} // 176 |
+ , {doSetBackslash_w, 119 /* w */, 136,0, TRUE} // 177 |
+ , {doSetBackslash_W, 87 /* W */, 136,0, TRUE} // 178 |
+ , {doSetBackslash_d, 100 /* d */, 136,0, TRUE} // 179 |
+ , {doSetBackslash_D, 68 /* D */, 136,0, TRUE} // 180 |
+ , {doSetLiteralEscaped, 255, 122,0, TRUE} // 181 |
+ , {doSetFinish, 255, 14,0, FALSE} // 182 set-finish |
+ , {doExit, 255, 183,0, TRUE} // 183 errorDeath |
+ }; |
+static const char * const RegexStateNames[] = { 0, |
+ "start", |
+ "term", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "expr-quant", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "expr-cont", |
+ 0, |
+ 0, |
+ "open-paren-quant", |
+ 0, |
+ "open-paren-quant2", |
+ 0, |
+ "open-paren", |
+ 0, |
+ "open-paren-extended", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "open-paren-lookbehind", |
+ 0, |
+ 0, |
+ "paren-comment", |
+ 0, |
+ 0, |
+ "paren-flag", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "quant-star", |
+ 0, |
+ 0, |
+ "quant-plus", |
+ 0, |
+ 0, |
+ "quant-opt", |
+ 0, |
+ 0, |
+ "interval-open", |
+ 0, |
+ "interval-lower", |
+ 0, |
+ 0, |
+ 0, |
+ "interval-upper", |
+ 0, |
+ 0, |
+ "interval-type", |
+ 0, |
+ 0, |
+ "backslash", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-open", |
+ 0, |
+ 0, |
+ "set-open2", |
+ 0, |
+ "set-posix", |
+ 0, |
+ 0, |
+ "set-start", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-start-dash", |
+ 0, |
+ "set-start-amp", |
+ 0, |
+ "set-after-lit", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-after-set", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-after-range", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-after-op", |
+ 0, |
+ 0, |
+ 0, |
+ "set-set-amp", |
+ 0, |
+ 0, |
+ "set-lit-amp", |
+ 0, |
+ "set-set-dash", |
+ 0, |
+ 0, |
+ "set-range-dash", |
+ 0, |
+ "set-range-amp", |
+ 0, |
+ "set-lit-dash", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-lit-dash-escape", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-escape", |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ 0, |
+ "set-finish", |
+ "errorDeath", |
+ 0}; |
+ |
+U_NAMESPACE_END |
+#endif |
Property changes on: icu46/source/i18n/regexcst.h |
___________________________________________________________________ |
Added: svn:eol-style |
+ LF |