| 1 | // © 2016 and later: Unicode, Inc. and others. |
| 2 | // License & terms of use: http://www.unicode.org/copyright.html |
| 3 | //--------------------------------------------------------------------------------- |
| 4 | // |
| 5 | // Generated Header File. Do not edit by hand. |
| 6 | // This file contains the state table for the ICU Rule Based Break Iterator |
| 7 | // rule parser. |
| 8 | // It is generated by the Perl script "rbbicst.pl" from |
| 9 | // the rule parser state definitions file "rbbirpt.txt". |
| 10 | // |
| 11 | // Copyright (C) 2002-2016 International Business Machines Corporation |
| 12 | // and others. All rights reserved. |
| 13 | // |
| 14 | //--------------------------------------------------------------------------------- |
| 15 | #ifndef RBBIRPT_H |
| 16 | #define RBBIRPT_H |
| 17 | |
| 18 | #include "unicode/utypes.h" |
| 19 | |
| 20 | U_NAMESPACE_BEGIN |
| 21 | // |
| 22 | // Character classes for RBBI rule scanning. |
| 23 | // |
| 24 | static const uint8_t kRuleSet_digit_char = 128; |
| 25 | static const uint8_t kRuleSet_name_char = 129; |
| 26 | static const uint8_t kRuleSet_name_start_char = 130; |
| 27 | static const uint8_t kRuleSet_rule_char = 131; |
| 28 | static const uint8_t kRuleSet_white_space = 132; |
| 29 | |
| 30 | |
| 31 | enum RBBI_RuleParseAction { |
| 32 | doCheckVarDef, |
| 33 | doDotAny, |
| 34 | doEndAssign, |
| 35 | doEndOfRule, |
| 36 | doEndVariableName, |
| 37 | doExit, |
| 38 | doExprCatOperator, |
| 39 | doExprFinished, |
| 40 | doExprOrOperator, |
| 41 | doExprRParen, |
| 42 | doExprStart, |
| 43 | doLParen, |
| 44 | doNOP, |
| 45 | doNoChain, |
| 46 | doOptionEnd, |
| 47 | doOptionStart, |
| 48 | doReverseDir, |
| 49 | doRuleChar, |
| 50 | doRuleError, |
| 51 | doRuleErrorAssignExpr, |
| 52 | doScanUnicodeSet, |
| 53 | doSlash, |
| 54 | doStartAssign, |
| 55 | doStartTagValue, |
| 56 | doStartVariableName, |
| 57 | doTagDigit, |
| 58 | doTagExpectedError, |
| 59 | doTagValue, |
| 60 | doUnaryOpPlus, |
| 61 | doUnaryOpQuestion, |
| 62 | doUnaryOpStar, |
| 63 | doVariableNameExpectedErr, |
| 64 | rbbiLastAction}; |
| 65 | |
| 66 | //------------------------------------------------------------------------------- |
| 67 | // |
| 68 | // RBBIRuleTableEl represents the structure of a row in the transition table |
| 69 | // for the rule parser state machine. |
| 70 | //------------------------------------------------------------------------------- |
| 71 | struct RBBIRuleTableEl { |
| 72 | RBBI_RuleParseAction fAction; |
| 73 | uint8_t fCharClass; // 0-127: an individual ASCII character |
| 74 | // 128-255: character class index |
| 75 | uint8_t fNextState; // 0-250: normal next-stat numbers |
| 76 | // 255: pop next-state from stack. |
| 77 | uint8_t fPushState; |
| 78 | UBool fNextChar; |
| 79 | }; |
| 80 | |
| 81 | static const struct RBBIRuleTableEl gRuleParseStateTable[] = { |
| 82 | {doNOP, 0, 0, 0, TRUE} |
| 83 | , {doExprStart, 254, 29, 9, FALSE} // 1 start |
| 84 | , {doNOP, 132, 1,0, TRUE} // 2 |
| 85 | , {doNoChain, 94 /* ^ */, 12, 9, TRUE} // 3 |
| 86 | , {doExprStart, 36 /* $ */, 88, 98, FALSE} // 4 |
| 87 | , {doNOP, 33 /* ! */, 19,0, TRUE} // 5 |
| 88 | , {doNOP, 59 /* ; */, 1,0, TRUE} // 6 |
| 89 | , {doNOP, 252, 0,0, FALSE} // 7 |
| 90 | , {doExprStart, 255, 29, 9, FALSE} // 8 |
| 91 | , {doEndOfRule, 59 /* ; */, 1,0, TRUE} // 9 break-rule-end |
| 92 | , {doNOP, 132, 9,0, TRUE} // 10 |
| 93 | , {doRuleError, 255, 103,0, FALSE} // 11 |
| 94 | , {doExprStart, 254, 29,0, FALSE} // 12 start-after-caret |
| 95 | , {doNOP, 132, 12,0, TRUE} // 13 |
| 96 | , {doRuleError, 94 /* ^ */, 103,0, FALSE} // 14 |
| 97 | , {doExprStart, 36 /* $ */, 88, 37, FALSE} // 15 |
| 98 | , {doRuleError, 59 /* ; */, 103,0, FALSE} // 16 |
| 99 | , {doRuleError, 252, 103,0, FALSE} // 17 |
| 100 | , {doExprStart, 255, 29,0, FALSE} // 18 |
| 101 | , {doNOP, 33 /* ! */, 21,0, TRUE} // 19 rev-option |
| 102 | , {doReverseDir, 255, 28, 9, FALSE} // 20 |
| 103 | , {doOptionStart, 130, 23,0, TRUE} // 21 option-scan1 |
| 104 | , {doRuleError, 255, 103,0, FALSE} // 22 |
| 105 | , {doNOP, 129, 23,0, TRUE} // 23 option-scan2 |
| 106 | , {doOptionEnd, 255, 25,0, FALSE} // 24 |
| 107 | , {doNOP, 59 /* ; */, 1,0, TRUE} // 25 option-scan3 |
| 108 | , {doNOP, 132, 25,0, TRUE} // 26 |
| 109 | , {doRuleError, 255, 103,0, FALSE} // 27 |
| 110 | , {doExprStart, 255, 29, 9, FALSE} // 28 reverse-rule |
| 111 | , {doRuleChar, 254, 38,0, TRUE} // 29 term |
| 112 | , {doNOP, 132, 29,0, TRUE} // 30 |
| 113 | , {doRuleChar, 131, 38,0, TRUE} // 31 |
| 114 | , {doNOP, 91 /* [ */, 94, 38, FALSE} // 32 |
| 115 | , {doLParen, 40 /* ( */, 29, 38, TRUE} // 33 |
| 116 | , {doNOP, 36 /* $ */, 88, 37, FALSE} // 34 |
| 117 | , {doDotAny, 46 /* . */, 38,0, TRUE} // 35 |
| 118 | , {doRuleError, 255, 103,0, FALSE} // 36 |
| 119 | , {doCheckVarDef, 255, 38,0, FALSE} // 37 term-var-ref |
| 120 | , {doNOP, 132, 38,0, TRUE} // 38 expr-mod |
| 121 | , {doUnaryOpStar, 42 /* * */, 43,0, TRUE} // 39 |
| 122 | , {doUnaryOpPlus, 43 /* + */, 43,0, TRUE} // 40 |
| 123 | , {doUnaryOpQuestion, 63 /* ? */, 43,0, TRUE} // 41 |
| 124 | , {doNOP, 255, 43,0, FALSE} // 42 |
| 125 | , {doExprCatOperator, 254, 29,0, FALSE} // 43 expr-cont |
| 126 | , {doNOP, 132, 43,0, TRUE} // 44 |
| 127 | , {doExprCatOperator, 131, 29,0, FALSE} // 45 |
| 128 | , {doExprCatOperator, 91 /* [ */, 29,0, FALSE} // 46 |
| 129 | , {doExprCatOperator, 40 /* ( */, 29,0, FALSE} // 47 |
| 130 | , {doExprCatOperator, 36 /* $ */, 29,0, FALSE} // 48 |
| 131 | , {doExprCatOperator, 46 /* . */, 29,0, FALSE} // 49 |
| 132 | , {doExprCatOperator, 47 /* / */, 55,0, FALSE} // 50 |
| 133 | , {doExprCatOperator, 123 /* { */, 67,0, TRUE} // 51 |
| 134 | , {doExprOrOperator, 124 /* | */, 29,0, TRUE} // 52 |
| 135 | , {doExprRParen, 41 /* ) */, 255,0, TRUE} // 53 |
| 136 | , {doExprFinished, 255, 255,0, FALSE} // 54 |
| 137 | , {doSlash, 47 /* / */, 57,0, TRUE} // 55 look-ahead |
| 138 | , {doNOP, 255, 103,0, FALSE} // 56 |
| 139 | , {doExprCatOperator, 254, 29,0, FALSE} // 57 expr-cont-no-slash |
| 140 | , {doNOP, 132, 43,0, TRUE} // 58 |
| 141 | , {doExprCatOperator, 131, 29,0, FALSE} // 59 |
| 142 | , {doExprCatOperator, 91 /* [ */, 29,0, FALSE} // 60 |
| 143 | , {doExprCatOperator, 40 /* ( */, 29,0, FALSE} // 61 |
| 144 | , {doExprCatOperator, 36 /* $ */, 29,0, FALSE} // 62 |
| 145 | , {doExprCatOperator, 46 /* . */, 29,0, FALSE} // 63 |
| 146 | , {doExprOrOperator, 124 /* | */, 29,0, TRUE} // 64 |
| 147 | , {doExprRParen, 41 /* ) */, 255,0, TRUE} // 65 |
| 148 | , {doExprFinished, 255, 255,0, FALSE} // 66 |
| 149 | , {doNOP, 132, 67,0, TRUE} // 67 tag-open |
| 150 | , {doStartTagValue, 128, 70,0, FALSE} // 68 |
| 151 | , {doTagExpectedError, 255, 103,0, FALSE} // 69 |
| 152 | , {doNOP, 132, 74,0, TRUE} // 70 tag-value |
| 153 | , {doNOP, 125 /* } */, 74,0, FALSE} // 71 |
| 154 | , {doTagDigit, 128, 70,0, TRUE} // 72 |
| 155 | , {doTagExpectedError, 255, 103,0, FALSE} // 73 |
| 156 | , {doNOP, 132, 74,0, TRUE} // 74 tag-close |
| 157 | , {doTagValue, 125 /* } */, 77,0, TRUE} // 75 |
| 158 | , {doTagExpectedError, 255, 103,0, FALSE} // 76 |
| 159 | , {doExprCatOperator, 254, 29,0, FALSE} // 77 expr-cont-no-tag |
| 160 | , {doNOP, 132, 77,0, TRUE} // 78 |
| 161 | , {doExprCatOperator, 131, 29,0, FALSE} // 79 |
| 162 | , {doExprCatOperator, 91 /* [ */, 29,0, FALSE} // 80 |
| 163 | , {doExprCatOperator, 40 /* ( */, 29,0, FALSE} // 81 |
| 164 | , {doExprCatOperator, 36 /* $ */, 29,0, FALSE} // 82 |
| 165 | , {doExprCatOperator, 46 /* . */, 29,0, FALSE} // 83 |
| 166 | , {doExprCatOperator, 47 /* / */, 55,0, FALSE} // 84 |
| 167 | , {doExprOrOperator, 124 /* | */, 29,0, TRUE} // 85 |
| 168 | , {doExprRParen, 41 /* ) */, 255,0, TRUE} // 86 |
| 169 | , {doExprFinished, 255, 255,0, FALSE} // 87 |
| 170 | , {doStartVariableName, 36 /* $ */, 90,0, TRUE} // 88 scan-var-name |
| 171 | , {doNOP, 255, 103,0, FALSE} // 89 |
| 172 | , {doNOP, 130, 92,0, TRUE} // 90 scan-var-start |
| 173 | , {doVariableNameExpectedErr, 255, 103,0, FALSE} // 91 |
| 174 | , {doNOP, 129, 92,0, TRUE} // 92 scan-var-body |
| 175 | , {doEndVariableName, 255, 255,0, FALSE} // 93 |
| 176 | , {doScanUnicodeSet, 91 /* [ */, 255,0, TRUE} // 94 scan-unicode-set |
| 177 | , {doScanUnicodeSet, 112 /* p */, 255,0, TRUE} // 95 |
| 178 | , {doScanUnicodeSet, 80 /* P */, 255,0, TRUE} // 96 |
| 179 | , {doNOP, 255, 103,0, FALSE} // 97 |
| 180 | , {doNOP, 132, 98,0, TRUE} // 98 assign-or-rule |
| 181 | , {doStartAssign, 61 /* = */, 29, 101, TRUE} // 99 |
| 182 | , {doNOP, 255, 37, 9, FALSE} // 100 |
| 183 | , {doEndAssign, 59 /* ; */, 1,0, TRUE} // 101 assign-end |
| 184 | , {doRuleErrorAssignExpr, 255, 103,0, FALSE} // 102 |
| 185 | , {doExit, 255, 103,0, TRUE} // 103 errorDeath |
| 186 | }; |
| 187 | #ifdef RBBI_DEBUG |
| 188 | static const char * const RBBIRuleStateNames[] = { 0, |
| 189 | "start" , |
| 190 | 0, |
| 191 | 0, |
| 192 | 0, |
| 193 | 0, |
| 194 | 0, |
| 195 | 0, |
| 196 | 0, |
| 197 | "break-rule-end" , |
| 198 | 0, |
| 199 | 0, |
| 200 | "start-after-caret" , |
| 201 | 0, |
| 202 | 0, |
| 203 | 0, |
| 204 | 0, |
| 205 | 0, |
| 206 | 0, |
| 207 | "rev-option" , |
| 208 | 0, |
| 209 | "option-scan1" , |
| 210 | 0, |
| 211 | "option-scan2" , |
| 212 | 0, |
| 213 | "option-scan3" , |
| 214 | 0, |
| 215 | 0, |
| 216 | "reverse-rule" , |
| 217 | "term" , |
| 218 | 0, |
| 219 | 0, |
| 220 | 0, |
| 221 | 0, |
| 222 | 0, |
| 223 | 0, |
| 224 | 0, |
| 225 | "term-var-ref" , |
| 226 | "expr-mod" , |
| 227 | 0, |
| 228 | 0, |
| 229 | 0, |
| 230 | 0, |
| 231 | "expr-cont" , |
| 232 | 0, |
| 233 | 0, |
| 234 | 0, |
| 235 | 0, |
| 236 | 0, |
| 237 | 0, |
| 238 | 0, |
| 239 | 0, |
| 240 | 0, |
| 241 | 0, |
| 242 | 0, |
| 243 | "look-ahead" , |
| 244 | 0, |
| 245 | "expr-cont-no-slash" , |
| 246 | 0, |
| 247 | 0, |
| 248 | 0, |
| 249 | 0, |
| 250 | 0, |
| 251 | 0, |
| 252 | 0, |
| 253 | 0, |
| 254 | 0, |
| 255 | "tag-open" , |
| 256 | 0, |
| 257 | 0, |
| 258 | "tag-value" , |
| 259 | 0, |
| 260 | 0, |
| 261 | 0, |
| 262 | "tag-close" , |
| 263 | 0, |
| 264 | 0, |
| 265 | "expr-cont-no-tag" , |
| 266 | 0, |
| 267 | 0, |
| 268 | 0, |
| 269 | 0, |
| 270 | 0, |
| 271 | 0, |
| 272 | 0, |
| 273 | 0, |
| 274 | 0, |
| 275 | 0, |
| 276 | "scan-var-name" , |
| 277 | 0, |
| 278 | "scan-var-start" , |
| 279 | 0, |
| 280 | "scan-var-body" , |
| 281 | 0, |
| 282 | "scan-unicode-set" , |
| 283 | 0, |
| 284 | 0, |
| 285 | 0, |
| 286 | "assign-or-rule" , |
| 287 | 0, |
| 288 | 0, |
| 289 | "assign-end" , |
| 290 | 0, |
| 291 | "errorDeath" , |
| 292 | 0}; |
| 293 | #endif |
| 294 | |
| 295 | U_NAMESPACE_END |
| 296 | #endif |
| 297 | |