icu46/source/i18n/plurrule.cpp - Issue 5516007: Check in the pristine copy of ICU 4.6...

Side by Side Diff: icu46/source/i18n/plurrule.cpp

Issue 5516007: Check in the pristine copy of ICU 4.6... (Closed) Base URL: svn://chrome-svn/chrome/trunk/deps/third_party/

Patch Set: Created 10 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

Property Changes:

Added: svn:eol-style
+ LF

OLD	NEW
(Empty)
	1 /*

	2 *******************************************************************************

	3 * Copyright (C) 2007-2010, International Business Machines Corporation and

	4 * others. All Rights Reserved.

	5 *******************************************************************************

	6 *

	7 * File PLURRULE.CPP

	8 *

	9 * Modification History:

	10 *

	11 * Date Name Description

	12 *******************************************************************************

	13 */

	14

	15

	16 #include "unicode/uniset.h"

	17 #include "unicode/utypes.h"

	18 #include "unicode/ures.h"

	19 #include "unicode/plurrule.h"

	20 #include "cmemory.h"

	21 #include "cstring.h"

	22 #include "hash.h"

	23 #include "mutex.h"

	24 #include "plurrule_impl.h"

	25 #include "putilimp.h"

	26 #include "ucln_in.h"

	27 #include "ustrfmt.h"

	28 #include "locutil.h"

	29

	30 /*

	31 // TODO(claireho): remove stdio

	32 #include "stdio.h"

	33 */

	34

	35 #if !UCONFIG_NO_FORMATTING

	36

	37 U_NAMESPACE_BEGIN

	38

	39

	40 #define ARRAY_SIZE(array) (int32_t)(sizeof array / sizeof array[0])

	41

	42 static const UChar PLURAL_KEYWORD_ZERO[] = {LOW_Z,LOW_E,LOW_R,LOW_O, 0};

	43 static const UChar PLURAL_KEYWORD_ONE[]={LOW_O,LOW_N,LOW_E,0};

	44 static const UChar PLURAL_KEYWORD_TWO[]={LOW_T,LOW_W,LOW_O,0};

	45 static const UChar PLURAL_KEYWORD_FEW[]={LOW_F,LOW_E,LOW_W,0};

	46 static const UChar PLURAL_KEYWORD_MANY[]={LOW_M,LOW_A,LOW_N,LOW_Y,0};

	47 static const UChar PLURAL_KEYWORD_OTHER[]={LOW_O,LOW_T,LOW_H,LOW_E,LOW_R,0};

	48 static const UChar PLURAL_DEFAULT_RULE[]={LOW_O,LOW_T,LOW_H,LOW_E,LOW_R,COLON,SP ACE,LOW_N,0};

	49 static const UChar PK_IN[]={LOW_I,LOW_N,0};

	50 static const UChar PK_NOT[]={LOW_N,LOW_O,LOW_T,0};

	51 static const UChar PK_IS[]={LOW_I,LOW_S,0};

	52 static const UChar PK_MOD[]={LOW_M,LOW_O,LOW_D,0};

	53 static const UChar PK_AND[]={LOW_A,LOW_N,LOW_D,0};

	54 static const UChar PK_OR[]={LOW_O,LOW_R,0};

	55 static const UChar PK_VAR_N[]={LOW_N,0};

	56 static const UChar PK_WITHIN[]={LOW_W,LOW_I,LOW_T,LOW_H,LOW_I,LOW_N,0};

	57

	58 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(PluralRules)

	59 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(PluralKeywordEnumeration)

	60

	61 PluralRules::PluralRules(UErrorCode& status)

	62 : UObject(),

	63 mRules(NULL)

	64 {

	65 if (U_FAILURE(status)) {

	66 return;

	67 }

	68 mParser = new RuleParser();

	69 if (mParser==NULL) {

	70 status = U_MEMORY_ALLOCATION_ERROR;

	71 }

	72 }

	73

	74 PluralRules::PluralRules(const PluralRules& other)

	75 : UObject(other),

	76 mRules(NULL),

	77 mParser(new RuleParser())

	78 {

	79 *this=other;

	80 }

	81

	82 PluralRules::~PluralRules() {

	83 delete mRules;

	84 delete mParser;

	85 }

	86

	87 PluralRules*

	88 PluralRules::clone() const {

	89 return new PluralRules(*this);

	90 }

	91

	92 PluralRules&

	93 PluralRules::operator=(const PluralRules& other) {

	94 if (this != &other) {

	95 delete mRules;

	96 if (other.mRules==NULL) {

	97 mRules = NULL;

	98 }

	99 else {

	100 mRules = new RuleChain(*other.mRules);

	101 }

	102 delete mParser;

	103 mParser = new RuleParser();

	104 }

	105

	106 return *this;

	107 }

	108

	109 PluralRules* U_EXPORT2

	110 PluralRules::createRules(const UnicodeString& description, UErrorCode& status) {

	111 RuleChain rules;

	112

	113 if (U_FAILURE(status)) {

	114 return NULL;

	115 }

	116 PluralRules *newRules = new PluralRules(status);

	117 if ( (newRules != NULL)&& U_SUCCESS(status) ) {

	118 newRules->parseDescription((UnicodeString &)description, rules, status);

	119 if (U_SUCCESS(status)) {

	120 newRules->addRules(rules);

	121 }

	122 }

	123 if (U_FAILURE(status)) {

	124 delete newRules;

	125 return NULL;

	126 }

	127 else {

	128 return newRules;

	129 }

	130 }

	131

	132 PluralRules* U_EXPORT2

	133 PluralRules::createDefaultRules(UErrorCode& status) {

	134 return createRules(PLURAL_DEFAULT_RULE, status);

	135 }

	136

	137 PluralRules* U_EXPORT2

	138 PluralRules::forLocale(const Locale& locale, UErrorCode& status) {

	139 RuleChain rChain;

	140 if (U_FAILURE(status)) {

	141 return NULL;

	142 }

	143 PluralRules *newObj = new PluralRules(status);

	144 if (newObj==NULL \|\| U_FAILURE(status)) {

	145 return NULL;

	146 }

	147 UnicodeString locRule = newObj->getRuleFromResource(locale, status);

	148 if ((locRule.length() != 0) && U_SUCCESS(status)) {

	149 newObj->parseDescription(locRule, rChain, status);

	150 if (U_SUCCESS(status)) {

	151 newObj->addRules(rChain);

	152 }

	153 }

	154 if (U_FAILURE(status)\|\|(locRule.length() == 0)) {

	155 // use default plural rule

	156 status = U_ZERO_ERROR;

	157 UnicodeString defRule = UnicodeString(PLURAL_DEFAULT_RULE);

	158 newObj->parseDescription(defRule, rChain, status);

	159 newObj->addRules(rChain);

	160 }

	161

	162 return newObj;

	163 }

	164

	165 UnicodeString

	166 PluralRules::select(int32_t number) const {

	167 if (mRules == NULL) {

	168 return PLURAL_DEFAULT_RULE;

	169 }

	170 else {

	171 return mRules->select(number);

	172 }

	173 }

	174

	175 UnicodeString

	176 PluralRules::select(double number) const {

	177 if (mRules == NULL) {

	178 return PLURAL_DEFAULT_RULE;

	179 }

	180 else {

	181 return mRules->select(number);

	182 }

	183 }

	184

	185 StringEnumeration*

	186 PluralRules::getKeywords(UErrorCode& status) const {

	187 if (U_FAILURE(status)) return NULL;

	188 StringEnumeration* nameEnumerator = new PluralKeywordEnumeration(mRules, sta tus);

	189 if (U_FAILURE(status)) return NULL;

	190

	191 return nameEnumerator;

	192 }

	193

	194

	195 UBool

	196 PluralRules::isKeyword(const UnicodeString& keyword) const {

	197 if ( keyword == PLURAL_KEYWORD_OTHER ) {

	198 return true;

	199 }

	200 else {

	201 if (mRules==NULL) {

	202 return false;

	203 }

	204 else {

	205 return mRules->isKeyword(keyword);

	206 }

	207 }

	208 }

	209

	210 UnicodeString

	211 PluralRules::getKeywordOther() const {

	212 return PLURAL_KEYWORD_OTHER;

	213 }

	214

	215 UBool

	216 PluralRules::operator==(const PluralRules& other) const {

	217 int32_t limit;

	218 UBool sameList = TRUE;

	219 const UnicodeString *ptrKeyword;

	220 UErrorCode status= U_ZERO_ERROR;

	221

	222 if ( this == &other ) {

	223 return TRUE;

	224 }

	225 StringEnumeration* myKeywordList = getKeywords(status);

	226 if (U_FAILURE(status)) {

	227 return FALSE;

	228 }

	229 StringEnumeration* otherKeywordList =other.getKeywords(status);

	230 if (U_FAILURE(status)) {

	231 return FALSE;

	232 }

	233

	234 if (myKeywordList->count(status)!=otherKeywordList->count(status) \|\|

	235 U_FAILURE(status)) {

	236 sameList = FALSE;

	237 }

	238 else {

	239 myKeywordList->reset(status);

	240 if (U_FAILURE(status)) {

	241 return FALSE;

	242 }

	243 while (sameList && (ptrKeyword=myKeywordList->snext(status))!=NULL) {

	244 if (U_FAILURE(status) \|\| !other.isKeyword(*ptrKeyword)) {

	245 sameList = FALSE;

	246 }

	247 }

	248 otherKeywordList->reset(status);

	249 if (U_FAILURE(status)) {

	250 return FALSE;

	251 }

	252 while (sameList && (ptrKeyword=otherKeywordList->snext(status))!=NULL) {

	253 if (U_FAILURE(status)) {

	254 return FALSE;

	255 }

	256 if (!this->isKeyword(*ptrKeyword)) {

	257 sameList = FALSE;

	258 }

	259 }

	260 delete myKeywordList;

	261 delete otherKeywordList;

	262 if (!sameList) {

	263 return FALSE;

	264 }

	265 }

	266

	267 if ((limit=this->getRepeatLimit()) != other.getRepeatLimit()) {

	268 return FALSE;

	269 }

	270 UnicodeString myKeyword, otherKeyword;

	271 for (int32_t i=0; i<limit; ++i) {

	272 myKeyword = this->select(i);

	273 otherKeyword = other.select(i);

	274 if (myKeyword!=otherKeyword) {

	275 return FALSE;

	276 }

	277 }

	278 return TRUE;

	279 }

	280

	281 void

	282 PluralRules::parseDescription(UnicodeString& data, RuleChain& rules, UErrorCode &status)

	283 {

	284 int32_t ruleIndex=0;

	285 UnicodeString token;

	286 tokenType type;

	287 tokenType prevType=none;

	288 RuleChain *ruleChain=NULL;

	289 AndConstraint *curAndConstraint=NULL;

	290 OrConstraint *orNode=NULL;

	291 RuleChain *lastChain=NULL;

	292

	293 if (U_FAILURE(status)) {

	294 return;

	295 }

	296 UnicodeString ruleData = data.toLower();

	297 while (ruleIndex< ruleData.length()) {

	298 mParser->getNextToken(ruleData, &ruleIndex, token, type, status);

	299 if (U_FAILURE(status)) {

	300 return;

	301 }

	302 mParser->checkSyntax(prevType, type, status);

	303 if (U_FAILURE(status)) {

	304 return;

	305 }

	306 switch (type) {

	307 case tAnd:

	308 curAndConstraint = curAndConstraint->add();

	309 break;

	310 case tOr:

	311 lastChain = &rules;

	312 while (lastChain->next !=NULL) {

	313 lastChain = lastChain->next;

	314 }

	315 orNode=lastChain->ruleHeader;

	316 while (orNode->next != NULL) {

	317 orNode = orNode->next;

	318 }

	319 orNode->next= new OrConstraint();

	320 orNode=orNode->next;

	321 orNode->next=NULL;

	322 curAndConstraint = orNode->add();

	323 break;

	324 case tIs:

	325 curAndConstraint->rangeHigh=-1;

	326 break;

	327 case tNot:

	328 curAndConstraint->notIn=TRUE;

	329 break;

	330 case tIn:

	331 curAndConstraint->rangeHigh=PLURAL_RANGE_HIGH;

	332 curAndConstraint->integerOnly = TRUE;

	333 break;

	334 case tWithin:

	335 curAndConstraint->rangeHigh=PLURAL_RANGE_HIGH;

	336 break;

	337 case tNumber:

	338 if ( (curAndConstraint->op==AndConstraint::MOD)&&

	339 (curAndConstraint->opNum == -1 ) ) {

	340 curAndConstraint->opNum=getNumberValue(token);

	341 }

	342 else {

	343 if (curAndConstraint->rangeLow == -1) {

	344 curAndConstraint->rangeLow=getNumberValue(token);

	345 }

	346 else {

	347 curAndConstraint->rangeHigh=getNumberValue(token);

	348 }

	349 }

	350 break;

	351 case tMod:

	352 curAndConstraint->op=AndConstraint::MOD;

	353 break;

	354 case tKeyword:

	355 if (ruleChain==NULL) {

	356 ruleChain = &rules;

	357 }

	358 else {

	359 while (ruleChain->next!=NULL){

	360 ruleChain=ruleChain->next;

	361 }

	362 ruleChain=ruleChain->next=new RuleChain();

	363 }

	364 orNode = ruleChain->ruleHeader = new OrConstraint();

	365 curAndConstraint = orNode->add();

	366 ruleChain->keyword = token;

	367 break;

	368 default:

	369 break;

	370 }

	371 prevType=type;

	372 }

	373 }

	374

	375 int32_t

	376 PluralRules::getNumberValue(const UnicodeString& token) const {

	377 int32_t i;

	378 char digits[128];

	379

	380 i = token.extract(0, token.length(), digits, ARRAY_SIZE(digits), US_INV);

	381 digits[i]='\0';

	382

	383 return((int32_t)atoi(digits));

	384 }

	385

	386

	387 void

	388 PluralRules::getNextLocale(const UnicodeString& localeData, int32_t* curIndex, U nicodeString& localeName) {

	389 int32_t i=*curIndex;

	390

	391 localeName.remove();

	392 while (i< localeData.length()) {

	393 if ( (localeData.charAt(i)!= SPACE) && (localeData.charAt(i)!= COMMA) ) {

	394 break;

	395 }

	396 i++;

	397 }

	398

	399 while (i< localeData.length()) {

	400 if ( (localeData.charAt(i)== SPACE) \|\| (localeData.charAt(i)== COMMA) ) {

	401 break;

	402 }

	403 localeName+=localeData.charAt(i++);

	404 }

	405 *curIndex=i;

	406 }

	407

	408

	409 int32_t

	410 PluralRules::getRepeatLimit() const {

	411 if (mRules!=NULL) {

	412 return mRules->getRepeatLimit();

	413 }

	414 else {

	415 return 0;

	416 }

	417 }

	418

	419

	420 void

	421 PluralRules::addRules(RuleChain& rules) {

	422 RuleChain *newRule = new RuleChain(rules);

	423 this->mRules=newRule;

	424 newRule->setRepeatLimit();

	425 }

	426

	427 UnicodeString

	428 PluralRules::getRuleFromResource(const Locale& locale, UErrorCode& errCode) {

	429 UnicodeString emptyStr;

	430

	431 if (U_FAILURE(errCode)) {

	432 return emptyStr;

	433 }

	434 UResourceBundle *rb=ures_openDirect(NULL, "plurals", &errCode);

	435 if(U_FAILURE(errCode)) {

	436 /* total failure, not even root could be opened */

	437 return emptyStr;

	438 }

	439 UResourceBundle *locRes=ures_getByKey(rb, "locales", NULL, &errCode);

	440 if(U_FAILURE(errCode)) {

	441 ures_close(rb);

	442 return emptyStr;

	443 }

	444 int32_t resLen=0;

	445 const char *curLocaleName=locale.getName();

	446 const UChar* s = ures_getStringByKey(locRes, curLocaleName, &resLen, &errCod e);

	447

	448 if (s == NULL) {

	449 // Check parent locales.

	450 UErrorCode status = U_ZERO_ERROR;

	451 char parentLocaleName[ULOC_FULLNAME_CAPACITY];

	452 const char *curLocaleName=locale.getName();

	453 int32_t localeNameLen=0;

	454 uprv_strcpy(parentLocaleName, curLocaleName);

	455

	456 while ((localeNameLen=uloc_getParent(parentLocaleName, parentLocaleName,

	457 ULOC_FULLNAME_CAPACITY, &status)) > 0) {

	458 resLen=0;

	459 s = ures_getStringByKey(locRes, parentLocaleName, &resLen, &status);

	460 if (s != NULL) {

	461 errCode = U_ZERO_ERROR;

	462 break;

	463 }

	464 status = U_ZERO_ERROR;

	465 }

	466 }

	467 if (s==NULL) {

	468 ures_close(locRes);

	469 ures_close(rb);

	470 return emptyStr;

	471 }

	472

	473 char setKey[256];

	474 UChar result[256];

	475 u_UCharsToChars(s, setKey, resLen + 1);

	476 // printf("\n PluralRule: %s\n", setKey);

	477

	478

	479 UResourceBundle *ruleRes=ures_getByKey(rb, "rules", NULL, &errCode);

	480 if(U_FAILURE(errCode)) {

	481 ures_close(locRes);

	482 ures_close(rb);

	483 return emptyStr;

	484 }

	485 resLen=0;

	486 UResourceBundle *setRes = ures_getByKey(ruleRes, setKey, NULL, &errCode);

	487 if (U_FAILURE(errCode)) {

	488 ures_close(ruleRes);

	489 ures_close(locRes);

	490 ures_close(rb);

	491 return emptyStr;

	492 }

	493

	494 int32_t numberKeys = ures_getSize(setRes);

	495 char *key=NULL;

	496 int32_t len=0;

	497 for(int32_t i=0; i<numberKeys; ++i) {

	498 int32_t keyLen;

	499 resLen=0;

	500 s=ures_getNextString(setRes, &resLen, (const char**)&key, &errCode);

	501 keyLen = (int32_t)uprv_strlen(key);

	502 u_charsToUChars(key, result+len, keyLen);

	503 len += keyLen;

	504 result[len++]=COLON;

	505 uprv_memcpy(result+len, s, resLen*sizeof(UChar));

	506 len += resLen;

	507 result[len++]=SEMI_COLON;

	508 }

	509 result[len++]=0;

	510 u_UCharsToChars(result, setKey, len);

	511 // printf(" Rule: %s\n", setKey);

	512

	513 ures_close(setRes);

	514 ures_close(ruleRes);

	515 ures_close(locRes);

	516 ures_close(rb);

	517 return UnicodeString(result);

	518

	519 }

	520

	521 AndConstraint::AndConstraint() {

	522 op = AndConstraint::NONE;

	523 opNum=-1;

	524 rangeLow=-1;

	525 rangeHigh=-1;

	526 notIn=FALSE;

	527 integerOnly=FALSE;

	528 next=NULL;

	529 }

	530

	531

	532 AndConstraint::AndConstraint(const AndConstraint& other) {

	533 this->op = other.op;

	534 this->opNum=other.opNum;

	535 this->rangeLow=other.rangeLow;

	536 this->rangeHigh=other.rangeHigh;

	537 this->integerOnly=other.integerOnly;

	538 this->notIn=other.notIn;

	539 if (other.next==NULL) {

	540 this->next=NULL;

	541 }

	542 else {

	543 this->next = new AndConstraint(*other.next);

	544 }

	545 }

	546

	547 AndConstraint::~AndConstraint() {

	548 if (next!=NULL) {

	549 delete next;

	550 }

	551 }

	552

	553

	554 UBool

	555 AndConstraint::isFulfilled(double number) {

	556 UBool result=TRUE;

	557 double value=number;

	558

	559 if ( op == MOD ) {

	560 value = (int32_t)value % opNum;

	561 }

	562 if ( rangeHigh == -1 ) {

	563 if ( rangeLow == -1 ) {

	564 result = TRUE; // empty rule

	565 }

	566 else {

	567 if ( value == rangeLow ) {

	568 result = TRUE;

	569 }

	570 else {

	571 result = FALSE;

	572 }

	573 }

	574 }

	575 else {

	576 if ((rangeLow <= value) && (value <= rangeHigh)) {

	577 if (integerOnly) {

	578 if ( value != (int32_t)value) {

	579 result = FALSE;

	580 }

	581 else {

	582 result = TRUE;

	583 }

	584 }

	585 else {

	586 result = TRUE;

	587 }

	588 }

	589 else {

	590 result = FALSE;

	591 }

	592 }

	593 if (notIn) {

	594 return !result;

	595 }

	596 else {

	597 return result;

	598 }

	599 }

	600

	601 int32_t

	602 AndConstraint::updateRepeatLimit(int32_t maxLimit) {

	603

	604 if ( op == MOD ) {

	605 return uprv_max(opNum, maxLimit);

	606 }

	607 else {

	608 if ( rangeHigh == -1 ) {

	609 return uprv_max(rangeLow, maxLimit);

	610 }

	611 else{

	612 return uprv_max(rangeHigh, maxLimit);

	613 }

	614 }

	615 }

	616

	617

	618 AndConstraint*

	619 AndConstraint::add()

	620 {

	621 this->next = new AndConstraint();

	622 return this->next;

	623 }

	624

	625 OrConstraint::OrConstraint() {

	626 childNode=NULL;

	627 next=NULL;

	628 }

	629

	630 OrConstraint::OrConstraint(const OrConstraint& other) {

	631 if ( other.childNode == NULL ) {

	632 this->childNode = NULL;

	633 }

	634 else {

	635 this->childNode = new AndConstraint(*(other.childNode));

	636 }

	637 if (other.next == NULL ) {

	638 this->next = NULL;

	639 }

	640 else {

	641 this->next = new OrConstraint(*(other.next));

	642 }

	643 }

	644

	645 OrConstraint::~OrConstraint() {

	646 if (childNode!=NULL) {

	647 delete childNode;

	648 }

	649 if (next!=NULL) {

	650 delete next;

	651 }

	652 }

	653

	654 AndConstraint*

	655 OrConstraint::add()

	656 {

	657 OrConstraint *curOrConstraint=this;

	658 {

	659 while (curOrConstraint->next!=NULL) {

	660 curOrConstraint = curOrConstraint->next;

	661 }

	662 curOrConstraint->next = NULL;

	663 curOrConstraint->childNode = new AndConstraint();

	664 }

	665 return curOrConstraint->childNode;

	666 }

	667

	668 UBool

	669 OrConstraint::isFulfilled(double number) {

	670 OrConstraint* orRule=this;

	671 UBool result=FALSE;

	672

	673 while (orRule!=NULL && !result) {

	674 result=TRUE;

	675 AndConstraint* andRule = orRule->childNode;

	676 while (andRule!=NULL && result) {

	677 result = andRule->isFulfilled(number);

	678 andRule=andRule->next;

	679 }

	680 orRule = orRule->next;

	681 }

	682

	683 return result;

	684 }

	685

	686

	687 RuleChain::RuleChain() {

	688 ruleHeader=NULL;

	689 next = NULL;

	690 repeatLimit=0;

	691 }

	692

	693 RuleChain::RuleChain(const RuleChain& other) {

	694 this->repeatLimit = other.repeatLimit;

	695 this->keyword=other.keyword;

	696 if (other.ruleHeader != NULL) {

	697 this->ruleHeader = new OrConstraint(*(other.ruleHeader));

	698 }

	699 else {

	700 this->ruleHeader = NULL;

	701 }

	702 if (other.next != NULL ) {

	703 this->next = new RuleChain(*other.next);

	704 }

	705 else

	706 {

	707 this->next = NULL;

	708 }

	709 }

	710

	711 RuleChain::~RuleChain() {

	712 if (next != NULL) {

	713 delete next;

	714 }

	715 if ( ruleHeader != NULL ) {

	716 delete ruleHeader;

	717 }

	718 }

	719

	720 UnicodeString

	721 RuleChain::select(double number) const {

	722

	723 if ( ruleHeader != NULL ) {

	724 if (ruleHeader->isFulfilled(number)) {

	725 return keyword;

	726 }

	727 }

	728 if ( next != NULL ) {

	729 return next->select(number);

	730 }

	731 else {

	732 return PLURAL_KEYWORD_OTHER;

	733 }

	734

	735 }

	736

	737 void

	738 RuleChain::dumpRules(UnicodeString& result) {

	739 UChar digitString[16];

	740

	741 if ( ruleHeader != NULL ) {

	742 result += keyword;

	743 OrConstraint* orRule=ruleHeader;

	744 while ( orRule != NULL ) {

	745 AndConstraint* andRule=orRule->childNode;

	746 while ( andRule != NULL ) {

	747 if ( (andRule->op==AndConstraint::NONE) && (andRule->rangeHigh== -1) ) {

	748 result += UNICODE_STRING_SIMPLE(" n is ");

	749 if (andRule->notIn) {

	750 result += UNICODE_STRING_SIMPLE("not ");

	751 }

	752 uprv_itou(digitString,16, andRule->rangeLow,10,0);

	753 result += UnicodeString(digitString);

	754 }

	755 else {

	756 if (andRule->op==AndConstraint::MOD) {

	757 result += UNICODE_STRING_SIMPLE(" n mod ");

	758 uprv_itou(digitString,16, andRule->opNum,10,0);

	759 result += UnicodeString(digitString);

	760 }

	761 else {

	762 result += UNICODE_STRING_SIMPLE(" n ");

	763 }

	764 if (andRule->rangeHigh==-1) {

	765 if (andRule->notIn) {

	766 result += UNICODE_STRING_SIMPLE(" is not ");

	767 uprv_itou(digitString,16, andRule->rangeLow,10,0);

	768 result += UnicodeString(digitString);

	769 }

	770 else {

	771 result += UNICODE_STRING_SIMPLE(" is ");

	772 uprv_itou(digitString,16, andRule->rangeLow,10,0);

	773 result += UnicodeString(digitString);

	774 }

	775 }

	776 else {

	777 if (andRule->notIn) {

	778 if ( andRule->integerOnly ) {

	779 result += UNICODE_STRING_SIMPLE(" not in ");

	780 }

	781 else {

	782 result += UNICODE_STRING_SIMPLE(" not within ") ;

	783 }

	784 uprv_itou(digitString,16, andRule->rangeLow,10,0);

	785 result += UnicodeString(digitString);

	786 result += UNICODE_STRING_SIMPLE(" .. ");

	787 uprv_itou(digitString,16, andRule->rangeHigh,10,0);

	788 result += UnicodeString(digitString);

	789 }

	790 else {

	791 if ( andRule->integerOnly ) {

	792 result += UNICODE_STRING_SIMPLE(" in ");

	793 }

	794 else {

	795 result += UNICODE_STRING_SIMPLE(" within ");

	796 }

	797 uprv_itou(digitString,16, andRule->rangeLow,10,0);

	798 result += UnicodeString(digitString);

	799 result += UNICODE_STRING_SIMPLE(" .. ");

	800 uprv_itou(digitString,16, andRule->rangeHigh,10,0);

	801 }

	802 }

	803 }

	804 if ( (andRule=andRule->next) != NULL) {

	805 result += PK_AND;

	806 }

	807 }

	808 if ( (orRule = orRule->next) != NULL ) {

	809 result += PK_OR;

	810 }

	811 }

	812 }

	813 if ( next != NULL ) {

	814 next->dumpRules(result);

	815 }

	816 }

	817

	818 int32_t

	819 RuleChain::getRepeatLimit () {

	820 return repeatLimit;

	821 }

	822

	823 void

	824 RuleChain::setRepeatLimit () {

	825 int32_t limit=0;

	826

	827 if ( next != NULL ) {

	828 next->setRepeatLimit();

	829 limit = next->repeatLimit;

	830 }

	831

	832 if ( ruleHeader != NULL ) {

	833 OrConstraint* orRule=ruleHeader;

	834 while ( orRule != NULL ) {

	835 AndConstraint* andRule=orRule->childNode;

	836 while ( andRule != NULL ) {

	837 limit = andRule->updateRepeatLimit(limit);

	838 andRule = andRule->next;

	839 }

	840 orRule = orRule->next;

	841 }

	842 }

	843 repeatLimit = limit;

	844 }

	845

	846 UErrorCode

	847 RuleChain::getKeywords(int32_t capacityOfKeywords, UnicodeString* keywords, int3 2_t& arraySize) const {

	848 if ( arraySize < capacityOfKeywords-1 ) {

	849 keywords[arraySize++]=keyword;

	850 }

	851 else {

	852 return U_BUFFER_OVERFLOW_ERROR;

	853 }

	854

	855 if ( next != NULL ) {

	856 return next->getKeywords(capacityOfKeywords, keywords, arraySize);

	857 }

	858 else {

	859 return U_ZERO_ERROR;

	860 }

	861 }

	862

	863 UBool

	864 RuleChain::isKeyword(const UnicodeString& keywordParam) const {

	865 if ( keyword == keywordParam ) {

	866 return TRUE;

	867 }

	868

	869 if ( next != NULL ) {

	870 return next->isKeyword(keywordParam);

	871 }

	872 else {

	873 return FALSE;

	874 }

	875 }

	876

	877

	878 RuleParser::RuleParser() {

	879 UErrorCode err=U_ZERO_ERROR;

	880 const UnicodeString idStart=UNICODE_STRING_SIMPLE("[[a-z]]");

	881 const UnicodeString idContinue=UNICODE_STRING_SIMPLE("[[a-z][A-Z][_][0-9]]") ;

	882 idStartFilter = new UnicodeSet(idStart, err);

	883 idContinueFilter = new UnicodeSet(idContinue, err);

	884 }

	885

	886 RuleParser::~RuleParser() {

	887 delete idStartFilter;

	888 delete idContinueFilter;

	889 }

	890

	891 void

	892 RuleParser::checkSyntax(tokenType prevType, tokenType curType, UErrorCode &statu s)

	893 {

	894 if (U_FAILURE(status)) {

	895 return;

	896 }

	897 switch(prevType) {

	898 case none:

	899 case tSemiColon:

	900 if (curType!=tKeyword) {

	901 status = U_UNEXPECTED_TOKEN;

	902 }

	903 break;

	904 case tVariableN :

	905 if (curType != tIs && curType != tMod && curType != tIn &&

	906 curType != tNot && curType != tWithin) {

	907 status = U_UNEXPECTED_TOKEN;

	908 }

	909 break;

	910 case tZero:

	911 case tOne:

	912 case tTwo:

	913 case tFew:

	914 case tMany:

	915 case tOther:

	916 case tKeyword:

	917 if (curType != tColon) {

	918 status = U_UNEXPECTED_TOKEN;

	919 }

	920 break;

	921 case tColon :

	922 if (curType != tVariableN) {

	923 status = U_UNEXPECTED_TOKEN;

	924 }

	925 break;

	926 case tIs:

	927 if ( curType != tNumber && curType != tNot) {

	928 status = U_UNEXPECTED_TOKEN;

	929 }

	930 break;

	931 case tNot:

	932 if (curType != tNumber && curType != tIn && curType != tWithin) {

	933 status = U_UNEXPECTED_TOKEN;

	934 }

	935 break;

	936 case tMod:

	937 case tDot:

	938 case tIn:

	939 case tWithin:

	940 case tAnd:

	941 case tOr:

	942 if (curType != tNumber && curType != tVariableN) {

	943 status = U_UNEXPECTED_TOKEN;

	944 }

	945 break;

	946 case tNumber:

	947 if (curType != tDot && curType != tSemiColon && curType != tIs && curTyp e != tNot &&

	948 curType != tIn && curType != tWithin && curType != tAnd && curType ! = tOr)

	949 {

	950 status = U_UNEXPECTED_TOKEN;

	951 }

	952 break;

	953 default:

	954 status = U_UNEXPECTED_TOKEN;

	955 break;

	956 }

	957 }

	958

	959 void

	960 RuleParser::getNextToken(const UnicodeString& ruleData,

	961 int32_t *ruleIndex,

	962 UnicodeString& token,

	963 tokenType& type,

	964 UErrorCode &status)

	965 {

	966 int32_t curIndex= *ruleIndex;

	967 UChar ch;

	968 tokenType prevType=none;

	969

	970 if (U_FAILURE(status)) {

	971 return;

	972 }

	973 while (curIndex<ruleData.length()) {

	974 ch = ruleData.charAt(curIndex);

	975 if ( !inRange(ch, type) ) {

	976 status = U_ILLEGAL_CHARACTER;

	977 return;

	978 }

	979 switch (type) {

	980 case tSpace:

	981 if ( *ruleIndex != curIndex ) { // letter

	982 token=UnicodeString(ruleData, ruleIndex, curIndex-ruleIndex);

	983 *ruleIndex=curIndex;

	984 type=prevType;

	985 getKeyType(token, type, status);

	986 return;

	987 }

	988 else {

	989 ruleIndex=ruleIndex+1;

	990 }

	991 break; // consective space

	992 case tColon:

	993 case tSemiColon:

	994 if ( *ruleIndex != curIndex ) {

	995 token=UnicodeString(ruleData, ruleIndex, curIndex-ruleIndex);

	996 *ruleIndex=curIndex;

	997 type=prevType;

	998 getKeyType(token, type, status);

	999 return;

	1000 }

	1001 else {

	1002 *ruleIndex=curIndex+1;

	1003 return;

	1004 }

	1005 case tLetter:

	1006 if ((type==prevType)\|\|(prevType==none)) {

	1007 prevType=type;

	1008 break;

	1009 }

	1010 break;

	1011 case tNumber:

	1012 if ((type==prevType)\|\|(prevType==none)) {

	1013 prevType=type;

	1014 break;

	1015 }

	1016 else {

	1017 *ruleIndex=curIndex+1;

	1018 return;

	1019 }

	1020 case tDot:

	1021 if (prevType==none) { // first dot

	1022 prevType=type;

	1023 continue;

	1024 }

	1025 else {

	1026 if ( *ruleIndex != curIndex ) {

	1027 token=UnicodeString(ruleData, ruleIndex, curIndex-ruleInde x);

	1028 *ruleIndex=curIndex; // letter

	1029 type=prevType;

	1030 getKeyType(token, type, status);

	1031 return;

	1032 }

	1033 else { // two consective dots

	1034 *ruleIndex=curIndex+2;

	1035 return;

	1036 }

	1037 }

	1038 break;

	1039 default:

	1040 status = U_UNEXPECTED_TOKEN;

	1041 return;

	1042 }

	1043 curIndex++;

	1044 }

	1045 if ( curIndex>=ruleData.length() ) {

	1046 if ( (type == tLetter)\|\|(type == tNumber) ) {

	1047 token=UnicodeString(ruleData, ruleIndex, curIndex-ruleIndex);

	1048 getKeyType(token, type, status);

	1049 if (U_FAILURE(status)) {

	1050 return;

	1051 }

	1052 }

	1053 *ruleIndex = ruleData.length();

	1054 }

	1055 }

	1056

	1057 UBool

	1058 RuleParser::inRange(UChar ch, tokenType& type) {

	1059 if ((ch>=CAP_A) && (ch<=CAP_Z)) {

	1060 // we assume all characters are in lower case already.

	1061 return FALSE;

	1062 }

	1063 if ((ch>=LOW_A) && (ch<=LOW_Z)) {

	1064 type = tLetter;

	1065 return TRUE;

	1066 }

	1067 if ((ch>=U_ZERO) && (ch<=U_NINE)) {

	1068 type = tNumber;

	1069 return TRUE;

	1070 }

	1071 switch (ch) {

	1072 case COLON:

	1073 type = tColon;

	1074 return TRUE;

	1075 case SPACE:

	1076 type = tSpace;

	1077 return TRUE;

	1078 case SEMI_COLON:

	1079 type = tSemiColon;

	1080 return TRUE;

	1081 case DOT:

	1082 type = tDot;

	1083 return TRUE;

	1084 default :

	1085 type = none;

	1086 return FALSE;

	1087 }

	1088 }

	1089

	1090

	1091 void

	1092 RuleParser::getKeyType(const UnicodeString& token, tokenType& keyType, UErrorCod e &status)

	1093 {

	1094 if (U_FAILURE(status)) {

	1095 return;

	1096 }

	1097 if ( keyType==tNumber) {

	1098 }

	1099 else if (token==PK_VAR_N) {

	1100 keyType = tVariableN;

	1101 }

	1102 else if (token==PK_IS) {

	1103 keyType = tIs;

	1104 }

	1105 else if (token==PK_AND) {

	1106 keyType = tAnd;

	1107 }

	1108 else if (token==PK_IN) {

	1109 keyType = tIn;

	1110 }

	1111 else if (token==PK_WITHIN) {

	1112 keyType = tWithin;

	1113 }

	1114 else if (token==PK_NOT) {

	1115 keyType = tNot;

	1116 }

	1117 else if (token==PK_MOD) {

	1118 keyType = tMod;

	1119 }

	1120 else if (token==PK_OR) {

	1121 keyType = tOr;

	1122 }

	1123 else if ( isValidKeyword(token) ) {

	1124 keyType = tKeyword;

	1125 }

	1126 else {

	1127 status = U_UNEXPECTED_TOKEN;

	1128 }

	1129 }

	1130

	1131 UBool

	1132 RuleParser::isValidKeyword(const UnicodeString& token) {

	1133 if ( token.length()==0 ) {

	1134 return FALSE;

	1135 }

	1136 if ( idStartFilter->contains(token.charAt(0) )==TRUE ) {

	1137 int32_t i;

	1138 for (i=1; i< token.length(); i++) {

	1139 if (idContinueFilter->contains(token.charAt(i))== FALSE) {

	1140 return FALSE;

	1141 }

	1142 }

	1143 return TRUE;

	1144 }

	1145 else {

	1146 return FALSE;

	1147 }

	1148 }

	1149

	1150 PluralKeywordEnumeration::PluralKeywordEnumeration(RuleChain *header, UErrorCode & status) :

	1151 fKeywordNames(status)

	1152 {

	1153 RuleChain *node=header;

	1154 UBool addKeywordOther=true;

	1155

	1156 if (U_FAILURE(status)) {

	1157 return;

	1158 }

	1159 pos=0;

	1160 fKeywordNames.removeAllElements();

	1161 while(node!=NULL) {

	1162 fKeywordNames.addElement(new UnicodeString(node->keyword), status);

	1163 if (U_FAILURE(status)) {

	1164 return;

	1165 }

	1166 if (node->keyword == PLURAL_KEYWORD_OTHER) {

	1167 addKeywordOther= false;

	1168 }

	1169 node=node->next;

	1170 }

	1171

	1172 if (addKeywordOther) {

	1173 fKeywordNames.addElement(new UnicodeString(PLURAL_KEYWORD_OTHER), status );

	1174 if (U_FAILURE(status)) {

	1175 return;

	1176 }

	1177 }

	1178 }

	1179

	1180 const UnicodeString*

	1181 PluralKeywordEnumeration::snext(UErrorCode& status) {

	1182 if (U_SUCCESS(status) && pos < fKeywordNames.size()) {

	1183 return (const UnicodeString*)fKeywordNames.elementAt(pos++);

	1184 }

	1185 return NULL;

	1186 }

	1187

	1188 void

	1189 PluralKeywordEnumeration::reset(UErrorCode& /status/) {

	1190 pos=0;

	1191 }

	1192

	1193 int32_t

	1194 PluralKeywordEnumeration::count(UErrorCode& /status/) const {

	1195 return fKeywordNames.size();

	1196 }

	1197

	1198 PluralKeywordEnumeration::~PluralKeywordEnumeration() {

	1199 UnicodeString *s;

	1200 for (int32_t i=0; i<fKeywordNames.size(); ++i) {

	1201 if ((s=(UnicodeString *)fKeywordNames.elementAt(i))!=NULL) {

	1202 delete s;

	1203 }

	1204 }

	1205 }

	1206

	1207 U_NAMESPACE_END

	1208

	1209

	1210 #endif /* #if !UCONFIG_NO_FORMATTING */

	1211

	1212 //eof

OLD	NEW

« no previous file with comments | « icu46/source/i18n/plurfmt.cpp ('k') | icu46/source/i18n/plurrule_impl.h » ('j') | no next file with comments »