icu46/source/i18n/transreg.cpp - Issue 5516007: Check in the pristine copy of ICU 4.6...

Side by Side Diff: icu46/source/i18n/transreg.cpp

Issue 5516007: Check in the pristine copy of ICU 4.6... (Closed) Base URL: svn://chrome-svn/chrome/trunk/deps/third_party/

Patch Set: Created 10 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

Property Changes:

Added: svn:eol-style
+ LF

OLD	NEW
(Empty)
	1 /*

	2 **********************************************************************

	3 * Copyright (c) 2001-2010, International Business Machines

	4 * Corporation and others. All Rights Reserved.

	5 **********************************************************************

	6 * Date Name Description

	7 * 08/10/2001 aliu Creation.

	8 **********************************************************************

	9 */

	10

	11 #include "unicode/utypes.h"

	12

	13 #if !UCONFIG_NO_TRANSLITERATION

	14

	15 #include "unicode/translit.h"

	16 #include "unicode/resbund.h"

	17 #include "unicode/uniset.h"

	18 #include "unicode/uscript.h"

	19 #include "rbt.h"

	20 #include "cpdtrans.h"

	21 #include "nultrans.h"

	22 #include "transreg.h"

	23 #include "rbt_data.h"

	24 #include "rbt_pars.h"

	25 #include "tridpars.h"

	26 #include "charstr.h"

	27 #include "uassert.h"

	28 #include "locutil.h"

	29

	30 // Enable the following symbol to add debugging code that tracks the

	31 // allocation, deletion, and use of Entry objects. BoundsChecker has

	32 // reported dangling pointer errors with these objects, but I have

	33 // been unable to confirm them. I suspect BoundsChecker is getting

	34 // confused with pointers going into and coming out of a UHashtable,

	35 // despite the hinting code that is designed to help it.

	36 // #define DEBUG_MEM

	37 #ifdef DEBUG_MEM

	38 #include <stdio.h>

	39 #endif

	40

	41 // UChar constants

	42 static const UChar LOCALE_SEP = 95; // '_'

	43 //static const UChar ID_SEP = 0x002D; /-/

	44 //static const UChar VARIANT_SEP = 0x002F; // '/'

	45

	46 // String constants

	47 static const UChar NO_VARIANT[] = { 0 }; // empty string

	48 static const UChar ANY[] = { 65, 110, 121, 0 }; // Any

	49

	50 /**

	51 * Resource bundle key for the RuleBasedTransliterator rule.

	52 */

	53 //static const char RB_RULE[] = "Rule";

	54

	55 U_NAMESPACE_BEGIN

	56

	57 //------------------------------------------------------------------

	58 // Alias

	59 //------------------------------------------------------------------

	60

	61 TransliteratorAlias::TransliteratorAlias(const UnicodeString& theAliasID,

	62 const UnicodeSet* cpdFilter) :

	63 ID(),

	64 aliasesOrRules(theAliasID),

	65 transes(0),

	66 compoundFilter(cpdFilter),

	67 direction(UTRANS_FORWARD),

	68 type(TransliteratorAlias::SIMPLE) {

	69 }

	70

	71 TransliteratorAlias::TransliteratorAlias(const UnicodeString& theID,

	72 const UnicodeString& idBlocks,

	73 UVector* adoptedTransliterators,

	74 const UnicodeSet* cpdFilter) :

	75 ID(theID),

	76 aliasesOrRules(idBlocks),

	77 transes(adoptedTransliterators),

	78 compoundFilter(cpdFilter),

	79 direction(UTRANS_FORWARD),

	80 type(TransliteratorAlias::COMPOUND) {

	81 }

	82

	83 TransliteratorAlias::TransliteratorAlias(const UnicodeString& theID,

	84 const UnicodeString& rules,

	85 UTransDirection dir) :

	86 ID(theID),

	87 aliasesOrRules(rules),

	88 transes(0),

	89 compoundFilter(0),

	90 direction(dir),

	91 type(TransliteratorAlias::RULES) {

	92 }

	93

	94 TransliteratorAlias::~TransliteratorAlias() {

	95 delete transes;

	96 }

	97

	98

	99 Transliterator* TransliteratorAlias::create(UParseError& pe,

	100 UErrorCode& ec) {

	101 if (U_FAILURE(ec)) {

	102 return 0;

	103 }

	104 Transliterator *t = NULL;

	105 switch (type) {

	106 case SIMPLE:

	107 t = Transliterator::createInstance(aliasesOrRules, UTRANS_FORWARD, pe, e c);

	108 if(U_FAILURE(ec)){

	109 return 0;

	110 }

	111 if (compoundFilter != 0)

	112 t->adoptFilter((UnicodeSet*)compoundFilter->clone());

	113 break;

	114 case COMPOUND:

	115 {

	116 // the total number of transliterators in the compound is the total number of anonymous transliterators

	117 // plus the total number of ID blocks-- we start by assuming the lis t begins and ends with an ID

	118 // block and that each pair anonymous transliterators has an ID bloc k between them. Then we go back

	119 // to see whether there really are ID blocks at the beginning and en d (by looking for U+FFFF, which

	120 // marks the position where an anonymous transliterator goes) and ad just accordingly

	121 int32_t anonymousRBTs = transes->size();

	122 int32_t transCount = anonymousRBTs * 2 + 1;

	123 if (!aliasesOrRules.isEmpty() && aliasesOrRules[0] == (UChar)(0xffff ))

	124 --transCount;

	125 if (aliasesOrRules.length() >= 2 && aliasesOrRules[aliasesOrRules.le ngth() - 1] == (UChar)(0xffff))

	126 --transCount;

	127 UnicodeString noIDBlock((UChar)(0xffff));

	128 noIDBlock += ((UChar)(0xffff));

	129 int32_t pos = aliasesOrRules.indexOf(noIDBlock);

	130 while (pos >= 0) {

	131 --transCount;

	132 pos = aliasesOrRules.indexOf(noIDBlock, pos + 1);

	133 }

	134

	135 UVector transliterators(ec);

	136 UnicodeString idBlock;

	137 int32_t blockSeparatorPos = aliasesOrRules.indexOf((UChar)(0xffff));

	138 while (blockSeparatorPos >= 0) {

	139 aliasesOrRules.extract(0, blockSeparatorPos, idBlock);

	140 aliasesOrRules.remove(0, blockSeparatorPos + 1);

	141 if (!idBlock.isEmpty())

	142 transliterators.addElement(Transliterator::createInstance(id Block, UTRANS_FORWARD, pe, ec), ec);

	143 if (!transes->isEmpty())

	144 transliterators.addElement(transes->orphanElementAt(0), ec);

	145 blockSeparatorPos = aliasesOrRules.indexOf((UChar)(0xffff));

	146 }

	147 if (!aliasesOrRules.isEmpty())

	148 transliterators.addElement(Transliterator::createInstance(aliase sOrRules, UTRANS_FORWARD, pe, ec), ec);

	149 while (!transes->isEmpty())

	150 transliterators.addElement(transes->orphanElementAt(0), ec);

	151

	152 if (U_SUCCESS(ec)) {

	153 t = new CompoundTransliterator(ID, transliterators,

	154 (compoundFilter ? (UnicodeSet*)(compoundFilter->clone()) : 0 ),

	155 anonymousRBTs, pe, ec);

	156 if (t == 0) {

	157 ec = U_MEMORY_ALLOCATION_ERROR;

	158 return 0;

	159 }

	160 } else {

	161 for (int32_t i = 0; i < transliterators.size(); i++)

	162 delete (Transliterator*)(transliterators.elementAt(i));

	163 }

	164 }

	165 break;

	166 case RULES:

	167 U_ASSERT(FALSE); // don't call create() if isRuleBased() returns TRUE!

	168 break;

	169 }

	170 return t;

	171 }

	172

	173 UBool TransliteratorAlias::isRuleBased() const {

	174 return type == RULES;

	175 }

	176

	177 void TransliteratorAlias::parse(TransliteratorParser& parser,

	178 UParseError& pe, UErrorCode& ec) const {

	179 U_ASSERT(type == RULES);

	180 if (U_FAILURE(ec)) {

	181 return;

	182 }

	183

	184 parser.parse(aliasesOrRules, direction, pe, ec);

	185 }

	186

	187 //----------------------------------------------------------------------

	188 // class TransliteratorSpec

	189 //----------------------------------------------------------------------

	190

	191 /**

	192 * A TransliteratorSpec is a string specifying either a source or a target. In more

	193 * general terms, it may also specify a variant, but we only use the

	194 * Spec class for sources and targets.

	195 *

	196 * A Spec may be a locale or a script. If it is a locale, it has a

	197 * fallback chain that goes xx_YY_ZZZ -> xx_YY -> xx -> ssss, where

	198 * ssss is the script mapping of xx_YY_ZZZ. The Spec API methods

	199 * hasFallback(), next(), and reset() iterate over this fallback

	200 * sequence.

	201 *

	202 * The Spec class canonicalizes itself, so the locale is put into

	203 * canonical form, or the script is transformed from an abbreviation

	204 * to a full name.

	205 */

	206 class TransliteratorSpec : public UMemory {

	207 public:

	208 TransliteratorSpec(const UnicodeString& spec);

	209 ~TransliteratorSpec();

	210

	211 const UnicodeString& get() const;

	212 UBool hasFallback() const;

	213 const UnicodeString& next();

	214 void reset();

	215

	216 UBool isLocale() const;

	217 ResourceBundle& getBundle() const;

	218

	219 operator const UnicodeString&() const { return get(); }

	220 const UnicodeString& getTop() const { return top; }

	221

	222 private:

	223 void setupNext();

	224

	225 UnicodeString top;

	226 UnicodeString spec;

	227 UnicodeString nextSpec;

	228 UnicodeString scriptName;

	229 UBool isSpecLocale; // TRUE if spec is a locale

	230 UBool isNextLocale; // TRUE if nextSpec is a locale

	231 ResourceBundle* res;

	232

	233 TransliteratorSpec(const TransliteratorSpec &other); // forbid copying of th is class

	234 TransliteratorSpec &operator=(const TransliteratorSpec &other); // forbid co pying of this class

	235 };

	236

	237 TransliteratorSpec::TransliteratorSpec(const UnicodeString& theSpec)

	238 : top(theSpec),

	239 res(0)

	240 {

	241 UErrorCode status = U_ZERO_ERROR;

	242 Locale topLoc("");

	243 LocaleUtility::initLocaleFromName(theSpec, topLoc);

	244 if (!topLoc.isBogus()) {

	245 res = new ResourceBundle(U_ICUDATA_TRANSLIT, topLoc, status);

	246 /* test for NULL */

	247 if (res == 0) {

	248 return;

	249 }

	250 if (U_FAILURE(status) \|\| status == U_USING_DEFAULT_WARNING) {

	251 delete res;

	252 res = 0;

	253 }

	254 }

	255

	256 // Canonicalize script name -or- do locale->script mapping

	257 status = U_ZERO_ERROR;

	258 static const int32_t capacity = 10;

	259 UScriptCode script[capacity]={USCRIPT_INVALID_CODE};

	260 int32_t num = uscript_getCode(CharString().appendInvariantChars(theSpec, sta tus).data(),

	261 script, capacity, &status);

	262 if (num > 0 && script[0] != USCRIPT_INVALID_CODE) {

	263 scriptName = UnicodeString(uscript_getName(script[0]), -1, US_INV);

	264 }

	265

	266 // Canonicalize top

	267 if (res != 0) {

	268 // Canonicalize locale name

	269 UnicodeString locStr;

	270 LocaleUtility::initNameFromLocale(topLoc, locStr);

	271 if (!locStr.isBogus()) {

	272 top = locStr;

	273 }

	274 } else if (scriptName.length() != 0) {

	275 // We are a script; use canonical name

	276 top = scriptName;

	277 }

	278

	279 // assert(spec != top);

	280 reset();

	281 }

	282

	283 TransliteratorSpec::~TransliteratorSpec() {

	284 delete res;

	285 }

	286

	287 UBool TransliteratorSpec::hasFallback() const {

	288 return nextSpec.length() != 0;

	289 }

	290

	291 void TransliteratorSpec::reset() {

	292 if (spec != top) {

	293 spec = top;

	294 isSpecLocale = (res != 0);

	295 setupNext();

	296 }

	297 }

	298

	299 void TransliteratorSpec::setupNext() {

	300 isNextLocale = FALSE;

	301 if (isSpecLocale) {

	302 nextSpec = spec;

	303 int32_t i = nextSpec.lastIndexOf(LOCALE_SEP);

	304 // If i == 0 then we have _FOO, so we fall through

	305 // to the scriptName.

	306 if (i > 0) {

	307 nextSpec.truncate(i);

	308 isNextLocale = TRUE;

	309 } else {

	310 nextSpec = scriptName; // scriptName may be empty

	311 }

	312 } else {

	313 // spec is a script, so we are at the end

	314 nextSpec.truncate(0);

	315 }

	316 }

	317

	318 // Protocol:

	319 // for(const UnicodeString& s(spec.get());

	320 // spec.hasFallback(); s(spec.next())) { ...

	321

	322 const UnicodeString& TransliteratorSpec::next() {

	323 spec = nextSpec;

	324 isSpecLocale = isNextLocale;

	325 setupNext();

	326 return spec;

	327 }

	328

	329 const UnicodeString& TransliteratorSpec::get() const {

	330 return spec;

	331 }

	332

	333 UBool TransliteratorSpec::isLocale() const {

	334 return isSpecLocale;

	335 }

	336

	337 ResourceBundle& TransliteratorSpec::getBundle() const {

	338 return *res;

	339 }

	340

	341 //----------------------------------------------------------------------

	342

	343 #ifdef DEBUG_MEM

	344

	345 // Vector of Entry pointers currently in use

	346 static UVector* DEBUG_entries = NULL;

	347

	348 static void DEBUG_setup() {

	349 if (DEBUG_entries == NULL) {

	350 UErrorCode ec = U_ZERO_ERROR;

	351 DEBUG_entries = new UVector(ec);

	352 }

	353 }

	354

	355 // Caller must call DEBUG_setup first. Return index of given Entry,

	356 // if it is in use (not deleted yet), or -1 if not found.

	357 static int DEBUG_findEntry(TransliteratorEntry* e) {

	358 for (int i=0; i<DEBUG_entries->size(); ++i) {

	359 if (e == (TransliteratorEntry*) DEBUG_entries->elementAt(i)) {

	360 return i;

	361 }

	362 }

	363 return -1;

	364 }

	365

	366 // Track object creation

	367 static void DEBUG_newEntry(TransliteratorEntry* e) {

	368 DEBUG_setup();

	369 if (DEBUG_findEntry(e) >= 0) {

	370 // This should really never happen unless the heap is broken

	371 printf("ERROR DEBUG_newEntry duplicate new pointer %08X\n", e);

	372 return;

	373 }

	374 UErrorCode ec = U_ZERO_ERROR;

	375 DEBUG_entries->addElement(e, ec);

	376 }

	377

	378 // Track object deletion

	379 static void DEBUG_delEntry(TransliteratorEntry* e) {

	380 DEBUG_setup();

	381 int i = DEBUG_findEntry(e);

	382 if (i < 0) {

	383 printf("ERROR DEBUG_delEntry possible double deletion %08X\n", e);

	384 return;

	385 }

	386 DEBUG_entries->removeElementAt(i);

	387 }

	388

	389 // Track object usage

	390 static void DEBUG_useEntry(TransliteratorEntry* e) {

	391 if (e == NULL) return;

	392 DEBUG_setup();

	393 int i = DEBUG_findEntry(e);

	394 if (i < 0) {

	395 printf("ERROR DEBUG_useEntry possible dangling pointer %08X\n", e);

	396 }

	397 }

	398

	399 #else

	400 // If we're not debugging then make these macros into NOPs

	401 #define DEBUG_newEntry(x)

	402 #define DEBUG_delEntry(x)

	403 #define DEBUG_useEntry(x)

	404 #endif

	405

	406 //----------------------------------------------------------------------

	407 // class Entry

	408 //----------------------------------------------------------------------

	409

	410 /**

	411 * The Entry object stores objects of different types and

	412 * singleton objects as placeholders for rule-based transliterators to

	413 * be built as needed. Instances of this struct can be placeholders,

	414 * can represent prototype transliterators to be cloned, or can

	415 * represent TransliteratorData objects. We don't support storing

	416 * classes in the registry because we don't have the rtti infrastructure

	417 * for it. We could easily add this if there is a need for it in the

	418 * future.

	419 */

	420 class TransliteratorEntry : public UMemory {

	421 public:

	422 enum Type {

	423 RULES_FORWARD,

	424 RULES_REVERSE,

	425 LOCALE_RULES,

	426 PROTOTYPE,

	427 RBT_DATA,

	428 COMPOUND_RBT,

	429 ALIAS,

	430 FACTORY,

	431 NONE // Only used for uninitialized entries

	432 } entryType;

	433 // NOTE: stringArg cannot go inside the union because

	434 // it has a copy constructor

	435 UnicodeString stringArg; // For RULES_*, ALIAS, COMPOUND_RBT

	436 int32_t intArg; // For COMPOUND_RBT, LOCALE_RULES

	437 UnicodeSet* compoundFilter; // For COMPOUND_RBT

	438 union {

	439 Transliterator* prototype; // For PROTOTYPE

	440 TransliterationRuleData* data; // For RBT_DATA

	441 UVector* dataVector; // For COMPOUND_RBT

	442 struct {

	443 Transliterator::Factory function;

	444 Transliterator::Token context;

	445 } factory; // For FACTORY

	446 } u;

	447 TransliteratorEntry();

	448 ~TransliteratorEntry();

	449 void adoptPrototype(Transliterator* adopted);

	450 void setFactory(Transliterator::Factory factory,

	451 Transliterator::Token context);

	452

	453 private:

	454

	455 TransliteratorEntry(const TransliteratorEntry &other); // forbid copying of this class

	456 TransliteratorEntry &operator=(const TransliteratorEntry &other); // forbid copying of this class

	457 };

	458

	459 TransliteratorEntry::TransliteratorEntry() {

	460 u.prototype = 0;

	461 compoundFilter = NULL;

	462 entryType = NONE;

	463 DEBUG_newEntry(this);

	464 }

	465

	466 TransliteratorEntry::~TransliteratorEntry() {

	467 DEBUG_delEntry(this);

	468 if (entryType == PROTOTYPE) {

	469 delete u.prototype;

	470 } else if (entryType == RBT_DATA) {

	471 // The data object is shared between instances of RBT. The

	472 // entry object owns it. It should only be deleted when the

	473 // transliterator component is being cleaned up. Doing so

	474 // invalidates any RBTs that the user has instantiated.

	475 delete u.data;

	476 } else if (entryType == COMPOUND_RBT) {

	477 while (u.dataVector != NULL && !u.dataVector->isEmpty())

	478 delete (TransliterationRuleData*)u.dataVector->orphanElementAt(0);

	479 delete u.dataVector;

	480 }

	481 delete compoundFilter;

	482 }

	483

	484 void TransliteratorEntry::adoptPrototype(Transliterator* adopted) {

	485 if (entryType == PROTOTYPE) {

	486 delete u.prototype;

	487 }

	488 entryType = PROTOTYPE;

	489 u.prototype = adopted;

	490 }

	491

	492 void TransliteratorEntry::setFactory(Transliterator::Factory factory,

	493 Transliterator::Token context) {

	494 if (entryType == PROTOTYPE) {

	495 delete u.prototype;

	496 }

	497 entryType = FACTORY;

	498 u.factory.function = factory;

	499 u.factory.context = context;

	500 }

	501

	502 // UObjectDeleter for Hashtable::setValueDeleter

	503 U_CDECL_BEGIN

	504 static void U_CALLCONV

	505 deleteEntry(void* obj) {

	506 delete (TransliteratorEntry*) obj;

	507 }

	508 U_CDECL_END

	509

	510 //----------------------------------------------------------------------

	511 // class TransliteratorRegistry: Basic public API

	512 //----------------------------------------------------------------------

	513

	514 TransliteratorRegistry::TransliteratorRegistry(UErrorCode& status) :

	515 registry(TRUE, status),

	516 specDAG(TRUE, status),

	517 availableIDs(status)

	518 {

	519 registry.setValueDeleter(deleteEntry);

	520 availableIDs.setDeleter(uhash_deleteUnicodeString);

	521 availableIDs.setComparer(uhash_compareCaselessUnicodeString);

	522 specDAG.setValueDeleter(uhash_deleteHashtable);

	523 }

	524

	525 TransliteratorRegistry::~TransliteratorRegistry() {

	526 // Through the magic of C++, everything cleans itself up

	527 }

	528

	529 Transliterator* TransliteratorRegistry::get(const UnicodeString& ID,

	530 TransliteratorAlias*& aliasReturn,

	531 UErrorCode& status) {

	532 U_ASSERT(aliasReturn == NULL);

	533 TransliteratorEntry *entry = find(ID);

	534 return (entry == 0) ? 0

	535 : instantiateEntry(ID, entry, aliasReturn, status);

	536 }

	537

	538 Transliterator* TransliteratorRegistry::reget(const UnicodeString& ID,

	539 TransliteratorParser& parser,

	540 TransliteratorAlias*& aliasReturn,

	541 UErrorCode& status) {

	542 U_ASSERT(aliasReturn == NULL);

	543 TransliteratorEntry *entry = find(ID);

	544

	545 if (entry == 0) {

	546 // We get to this point if there are two threads, one of which

	547 // is instantiating an ID, and another of which is removing

	548 // the same ID from the registry, and the timing is just right.

	549 return 0;

	550 }

	551

	552 // The usage model for the caller is that they will first call

	553 // reg->get() inside the mutex, they'll get back an alias, they call

	554 // alias->isRuleBased(), and if they get TRUE, they call alias->parse()

	555 // outside the mutex, then reg->reget() inside the mutex again. A real

	556 // mess, but it gets things working for ICU 3.0. [alan].

	557

	558 // Note: It's possible that in between the caller calling

	559 // alias->parse() and reg->reget(), that another thread will have

	560 // called reg->reget(), and the entry will already have been fixed up.

	561 // We have to detect this so we don't stomp over existing entry

	562 // data members and potentially leak memory (u.data and compoundFilter).

	563

	564 if (entry->entryType == TransliteratorEntry::RULES_FORWARD \|\|

	565 entry->entryType == TransliteratorEntry::RULES_REVERSE \|\|

	566 entry->entryType == TransliteratorEntry::LOCALE_RULES) {

	567

	568 if (parser.idBlockVector.isEmpty() && parser.dataVector.isEmpty()) {

	569 entry->u.data = 0;

	570 entry->entryType = TransliteratorEntry::ALIAS;

	571 entry->stringArg = UNICODE_STRING_SIMPLE("Any-NULL");

	572 }

	573 else if (parser.idBlockVector.isEmpty() && parser.dataVector.size() == 1 ) {

	574 entry->u.data = (TransliterationRuleData*)parser.dataVector.orphanEl ementAt(0);

	575 entry->entryType = TransliteratorEntry::RBT_DATA;

	576 }

	577 else if (parser.idBlockVector.size() == 1 && parser.dataVector.isEmpty() ) {

	578 entry->stringArg = (UnicodeString)(parser.idBlockVector.elementAt( 0));

	579 entry->compoundFilter = parser.orphanCompoundFilter();

	580 entry->entryType = TransliteratorEntry::ALIAS;

	581 }

	582 else {

	583 entry->entryType = TransliteratorEntry::COMPOUND_RBT;

	584 entry->compoundFilter = parser.orphanCompoundFilter();

	585 entry->u.dataVector = new UVector(status);

	586 entry->stringArg.remove();

	587

	588 int32_t limit = parser.idBlockVector.size();

	589 if (parser.dataVector.size() > limit)

	590 limit = parser.dataVector.size();

	591

	592 for (int32_t i = 0; i < limit; i++) {

	593 if (i < parser.idBlockVector.size()) {

	594 UnicodeString* idBlock = (UnicodeString*)parser.idBlockVecto r.elementAt(i);

	595 if (!idBlock->isEmpty())

	596 entry->stringArg += *idBlock;

	597 }

	598 if (!parser.dataVector.isEmpty()) {

	599 TransliterationRuleData* data = (TransliterationRuleData*)pa rser.dataVector.orphanElementAt(0);

	600 entry->u.dataVector->addElement(data, status);

	601 entry->stringArg += (UChar)0xffff; // use U+FFFF to mark po sition of RBTs in ID block

	602 }

	603 }

	604 }

	605 }

	606

	607 Transliterator *t =

	608 instantiateEntry(ID, entry, aliasReturn, status);

	609 return t;

	610 }

	611

	612 void TransliteratorRegistry::put(Transliterator* adoptedProto,

	613 UBool visible,

	614 UErrorCode& ec)

	615 {

	616 TransliteratorEntry *entry = new TransliteratorEntry();

	617 if (entry == NULL) {

	618 ec = U_MEMORY_ALLOCATION_ERROR;

	619 return;

	620 }

	621 entry->adoptPrototype(adoptedProto);

	622 registerEntry(adoptedProto->getID(), entry, visible);

	623 }

	624

	625 void TransliteratorRegistry::put(const UnicodeString& ID,

	626 Transliterator::Factory factory,

	627 Transliterator::Token context,

	628 UBool visible,

	629 UErrorCode& ec) {

	630 TransliteratorEntry *entry = new TransliteratorEntry();

	631 if (entry == NULL) {

	632 ec = U_MEMORY_ALLOCATION_ERROR;

	633 return;

	634 }

	635 entry->setFactory(factory, context);

	636 registerEntry(ID, entry, visible);

	637 }

	638

	639 void TransliteratorRegistry::put(const UnicodeString& ID,

	640 const UnicodeString& resourceName,

	641 UTransDirection dir,

	642 UBool readonlyResourceAlias,

	643 UBool visible,

	644 UErrorCode& ec) {

	645 TransliteratorEntry *entry = new TransliteratorEntry();

	646 if (entry == NULL) {

	647 ec = U_MEMORY_ALLOCATION_ERROR;

	648 return;

	649 }

	650 entry->entryType = (dir == UTRANS_FORWARD) ? TransliteratorEntry::RULES_FORW ARD

	651 : TransliteratorEntry::RULES_REVERSE;

	652 if (readonlyResourceAlias) {

	653 entry->stringArg.setTo(TRUE, resourceName.getBuffer(), -1);

	654 }

	655 else {

	656 entry->stringArg = resourceName;

	657 }

	658 registerEntry(ID, entry, visible);

	659 }

	660

	661 void TransliteratorRegistry::put(const UnicodeString& ID,

	662 const UnicodeString& alias,

	663 UBool readonlyAliasAlias,

	664 UBool visible,

	665 UErrorCode& /ec/) {

	666 TransliteratorEntry *entry = new TransliteratorEntry();

	667 // Null pointer check

	668 if (entry != NULL) {

	669 entry->entryType = TransliteratorEntry::ALIAS;

	670 if (readonlyAliasAlias) {

	671 entry->stringArg.setTo(TRUE, alias.getBuffer(), -1);

	672 }

	673 else {

	674 entry->stringArg = alias;

	675 }

	676 registerEntry(ID, entry, visible);

	677 }

	678 }

	679

	680 void TransliteratorRegistry::remove(const UnicodeString& ID) {

	681 UnicodeString source, target, variant;

	682 UBool sawSource;

	683 TransliteratorIDParser::IDtoSTV(ID, source, target, variant, sawSource);

	684 // Only need to do this if ID.indexOf('-') < 0

	685 UnicodeString id;

	686 TransliteratorIDParser::STVtoID(source, target, variant, id);

	687 registry.remove(id);

	688 removeSTV(source, target, variant);

	689 availableIDs.removeElement((void*) &id);

	690 }

	691

	692 //----------------------------------------------------------------------

	693 // class TransliteratorRegistry: Public ID and spec management

	694 //----------------------------------------------------------------------

	695

	696 /**

	697 * == OBSOLETE - remove in ICU 3.4 ==

	698 * Return the number of IDs currently registered with the system.

	699 * To retrieve the actual IDs, call getAvailableID(i) with

	700 * i from 0 to countAvailableIDs() - 1.

	701 */

	702 int32_t TransliteratorRegistry::countAvailableIDs(void) const {

	703 return availableIDs.size();

	704 }

	705

	706 /**

	707 * == OBSOLETE - remove in ICU 3.4 ==

	708 * Return the index-th available ID. index must be between 0

	709 * and countAvailableIDs() - 1, inclusive. If index is out of

	710 * range, the result of getAvailableID(0) is returned.

	711 */

	712 const UnicodeString& TransliteratorRegistry::getAvailableID(int32_t index) const {

	713 if (index < 0 \|\| index >= availableIDs.size()) {

	714 index = 0;

	715 }

	716 return (const UnicodeString) availableIDs[index];

	717 }

	718

	719 StringEnumeration* TransliteratorRegistry::getAvailableIDs() const {

	720 return new Enumeration(*this);

	721 }

	722

	723 int32_t TransliteratorRegistry::countAvailableSources(void) const {

	724 return specDAG.count();

	725 }

	726

	727 UnicodeString& TransliteratorRegistry::getAvailableSource(int32_t index,

	728 UnicodeString& result) const {

	729 int32_t pos = -1;

	730 const UHashElement *e = 0;

	731 while (index-- >= 0) {

	732 e = specDAG.nextElement(pos);

	733 if (e == 0) {

	734 break;

	735 }

	736 }

	737 if (e == 0) {

	738 result.truncate(0);

	739 } else {

	740 result = (UnicodeString) e->key.pointer;

	741 }

	742 return result;

	743 }

	744

	745 int32_t TransliteratorRegistry::countAvailableTargets(const UnicodeString& sourc e) const {

	746 Hashtable targets = (Hashtable) specDAG.get(source);

	747 return (targets == 0) ? 0 : targets->count();

	748 }

	749

	750 UnicodeString& TransliteratorRegistry::getAvailableTarget(int32_t index,

	751 const UnicodeString& s ource,

	752 UnicodeString& result) const {

	753 Hashtable targets = (Hashtable) specDAG.get(source);

	754 if (targets == 0) {

	755 result.truncate(0); // invalid source

	756 return result;

	757 }

	758 int32_t pos = -1;

	759 const UHashElement *e = 0;

	760 while (index-- >= 0) {

	761 e = targets->nextElement(pos);

	762 if (e == 0) {

	763 break;

	764 }

	765 }

	766 if (e == 0) {

	767 result.truncate(0); // invalid index

	768 } else {

	769 result = (UnicodeString) e->key.pointer;

	770 }

	771 return result;

	772 }

	773

	774 int32_t TransliteratorRegistry::countAvailableVariants(const UnicodeString& sour ce,

	775 const UnicodeString& targ et) const {

	776 Hashtable targets = (Hashtable) specDAG.get(source);

	777 if (targets == 0) {

	778 return 0;

	779 }

	780 UVector variants = (UVector) targets->get(target);

	781 // variants may be 0 if the source/target are invalid

	782 return (variants == 0) ? 0 : variants->size();

	783 }

	784

	785 UnicodeString& TransliteratorRegistry::getAvailableVariant(int32_t index,

	786 const UnicodeString& source,

	787 const UnicodeString& target,

	788 UnicodeString& result ) const {

	789 Hashtable targets = (Hashtable) specDAG.get(source);

	790 if (targets == 0) {

	791 result.truncate(0); // invalid source

	792 return result;

	793 }

	794 UVector variants = (UVector) targets->get(target);

	795 if (variants == 0) {

	796 result.truncate(0); // invalid target

	797 return result;

	798 }

	799 UnicodeString v = (UnicodeString) variants->elementAt(index);

	800 if (v == 0) {

	801 result.truncate(0); // invalid index

	802 } else {

	803 result = *v;

	804 }

	805 return result;

	806 }

	807

	808 //----------------------------------------------------------------------

	809 // class TransliteratorRegistry::Enumeration

	810 //----------------------------------------------------------------------

	811

	812 TransliteratorRegistry::Enumeration::Enumeration(const TransliteratorRegistry& _ reg) :

	813 index(0), reg(_reg) {

	814 }

	815

	816 TransliteratorRegistry::Enumeration::~Enumeration() {

	817 }

	818

	819 int32_t TransliteratorRegistry::Enumeration::count(UErrorCode& /status/) const {

	820 return reg.availableIDs.size();

	821 }

	822

	823 const UnicodeString* TransliteratorRegistry::Enumeration::snext(UErrorCode& stat us) {

	824 // This is sloppy but safe -- if we get out of sync with the underlying

	825 // registry, we will still return legal strings, but they might not

	826 // correspond to the snapshot at construction time. So there could be

	827 // duplicate IDs or omitted IDs if insertions or deletions occur in one

	828 // thread while another is iterating. To be more rigorous, add a timestamp,

	829 // which is incremented with any modification, and validate this iterator

	830 // against the timestamp at construction time. This probably isn't worth

	831 // doing as long as there is some possibility of removing this code in favor

	832 // of some new code based on Doug's service framework.

	833 if (U_FAILURE(status)) {

	834 return NULL;

	835 }

	836 int32_t n = reg.availableIDs.size();

	837 if (index > n) {

	838 status = U_ENUM_OUT_OF_SYNC_ERROR;

	839 }

	840 // index == n is okay -- this means we've reached the end

	841 if (index < n) {

	842 // Copy the string! This avoids lifetime problems.

	843 unistr = (const UnicodeString)reg.availableIDs[index++];

	844 return &unistr;

	845 } else {

	846 return NULL;

	847 }

	848 }

	849

	850 void TransliteratorRegistry::Enumeration::reset(UErrorCode& /status/) {

	851 index = 0;

	852 }

	853

	854 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(TransliteratorRegistry::Enumeration)

	855

	856 //----------------------------------------------------------------------

	857 // class TransliteratorRegistry: internal

	858 //----------------------------------------------------------------------

	859

	860 /**

	861 * Convenience method. Calls 6-arg registerEntry().

	862 */

	863 void TransliteratorRegistry::registerEntry(const UnicodeString& source,

	864 const UnicodeString& target,

	865 const UnicodeString& variant,

	866 TransliteratorEntry* adopted,

	867 UBool visible) {

	868 UnicodeString ID;

	869 UnicodeString s(source);

	870 if (s.length() == 0) {

	871 s = ANY;

	872 }

	873 TransliteratorIDParser::STVtoID(source, target, variant, ID);

	874 registerEntry(ID, s, target, variant, adopted, visible);

	875 }

	876

	877 /**

	878 * Convenience method. Calls 6-arg registerEntry().

	879 */

	880 void TransliteratorRegistry::registerEntry(const UnicodeString& ID,

	881 TransliteratorEntry* adopted,

	882 UBool visible) {

	883 UnicodeString source, target, variant;

	884 UBool sawSource;

	885 TransliteratorIDParser::IDtoSTV(ID, source, target, variant, sawSource);

	886 // Only need to do this if ID.indexOf('-') < 0

	887 UnicodeString id;

	888 TransliteratorIDParser::STVtoID(source, target, variant, id);

	889 registerEntry(id, source, target, variant, adopted, visible);

	890 }

	891

	892 /**

	893 * Register an entry object (adopted) with the given ID, source,

	894 * target, and variant strings.

	895 */

	896 void TransliteratorRegistry::registerEntry(const UnicodeString& ID,

	897 const UnicodeString& source,

	898 const UnicodeString& target,

	899 const UnicodeString& variant,

	900 TransliteratorEntry* adopted,

	901 UBool visible) {

	902 UErrorCode status = U_ZERO_ERROR;

	903 registry.put(ID, adopted, status);

	904 if (visible) {

	905 registerSTV(source, target, variant);

	906 if (!availableIDs.contains((void*) &ID)) {

	907 UnicodeString newID = (UnicodeString )ID.clone();

	908 // Check to make sure newID was created.

	909 if (newID != NULL) {

	910 // NUL-terminate the ID string

	911 newID->getTerminatedBuffer();

	912 availableIDs.addElement(newID, status);

	913 }

	914 }

	915 } else {

	916 removeSTV(source, target, variant);

	917 availableIDs.removeElement((void*) &ID);

	918 }

	919 }

	920

	921 /**

	922 * Register a source-target/variant in the specDAG. Variant may be

	923 * empty, but source and target must not be. If variant is empty then

	924 * the special variant NO_VARIANT is stored in slot zero of the

	925 * UVector of variants.

	926 */

	927 void TransliteratorRegistry::registerSTV(const UnicodeString& source,

	928 const UnicodeString& target,

	929 const UnicodeString& variant) {

	930 // assert(source.length() > 0);

	931 // assert(target.length() > 0);

	932 UErrorCode status = U_ZERO_ERROR;

	933 Hashtable targets = (Hashtable) specDAG.get(source);

	934 if (targets == 0) {

	935 targets = new Hashtable(TRUE, status);

	936 if (U_FAILURE(status) \|\| targets == 0) {

	937 return;

	938 }

	939 targets->setValueDeleter(uhash_deleteUObject);

	940 specDAG.put(source, targets, status);

	941 }

	942 UVector variants = (UVector) targets->get(target);

	943 if (variants == 0) {

	944 variants = new UVector(uhash_deleteUnicodeString,

	945 uhash_compareCaselessUnicodeString, status);

	946 if (variants == 0) {

	947 return;

	948 }

	949 targets->put(target, variants, status);

	950 }

	951 // assert(NO_VARIANT == "");

	952 // We add the variant string. If it is the special "no variant"

	953 // string, that is, the empty string, we add it at position zero.

	954 if (!variants->contains((void*) &variant)) {

	955 UnicodeString *tempus; // Used for null pointer check.

	956 if (variant.length() > 0) {

	957 tempus = new UnicodeString(variant);

	958 if (tempus != NULL) {

	959 variants->addElement(tempus, status);

	960 }

	961 } else {

	962 tempus = new UnicodeString(NO_VARIANT) ;

	963 if (tempus != NULL) {

	964 variants->insertElementAt(tempus, 0, status);

	965 }

	966 }

	967 }

	968 }

	969

	970 /**

	971 * Remove a source-target/variant from the specDAG.

	972 */

	973 void TransliteratorRegistry::removeSTV(const UnicodeString& source,

	974 const UnicodeString& target,

	975 const UnicodeString& variant) {

	976 // assert(source.length() > 0);

	977 // assert(target.length() > 0);

	978 // UErrorCode status = U_ZERO_ERROR;

	979 Hashtable targets = (Hashtable) specDAG.get(source);

	980 if (targets == 0) {

	981 return; // should never happen for valid s-t/v

	982 }

	983 UVector variants = (UVector) targets->get(target);

	984 if (variants == 0) {

	985 return; // should never happen for valid s-t/v

	986 }

	987 variants->removeElement((void*) &variant);

	988 if (variants->size() == 0) {

	989 targets->remove(target); // should delete variants

	990 if (targets->count() == 0) {

	991 specDAG.remove(source); // should delete targets

	992 }

	993 }

	994 }

	995

	996 /**

	997 * Attempt to find a source-target/variant in the dynamic registry

	998 * store. Return 0 on failure.

	999 *

	1000 * Caller does NOT own returned object.

	1001 */

	1002 TransliteratorEntry* TransliteratorRegistry::findInDynamicStore(const Transliter atorSpec& src,

	1003 const TransliteratorSpec& trg,

	1004 const UnicodeString& variant) const {

	1005 UnicodeString ID;

	1006 TransliteratorIDParser::STVtoID(src, trg, variant, ID);

	1007 TransliteratorEntry e = (TransliteratorEntry) registry.get(ID);

	1008 DEBUG_useEntry(e);

	1009 return e;

	1010 }

	1011

	1012 /**

	1013 * Attempt to find a source-target/variant in the static locale

	1014 * resource store. Do not perform fallback. Return 0 on failure.

	1015 *

	1016 * On success, create a new entry object, register it in the dynamic

	1017 * store, and return a pointer to it, but do not make it public --

	1018 * just because someone requested something, we do not expand the

	1019 * available ID list (or spec DAG).

	1020 *

	1021 * Caller does NOT own returned object.

	1022 */

	1023 TransliteratorEntry* TransliteratorRegistry::findInStaticStore(const Translitera torSpec& src,

	1024 const TransliteratorSpec& trg,

	1025 const UnicodeString& variant) {

	1026 TransliteratorEntry* entry = 0;

	1027 if (src.isLocale()) {

	1028 entry = findInBundle(src, trg, variant, UTRANS_FORWARD);

	1029 } else if (trg.isLocale()) {

	1030 entry = findInBundle(trg, src, variant, UTRANS_REVERSE);

	1031 }

	1032

	1033 // If we found an entry, store it in the Hashtable for next

	1034 // time.

	1035 if (entry != 0) {

	1036 registerEntry(src.getTop(), trg.getTop(), variant, entry, FALSE);

	1037 }

	1038

	1039 return entry;

	1040 }

	1041

	1042 // As of 2.0, resource bundle keys cannot contain '_'

	1043 static const UChar TRANSLITERATE_TO[] = {84,114,97,110,115,108,105,116,101,114,9 7,116,101,84,111,0}; // "TransliterateTo"

	1044

	1045 static const UChar TRANSLITERATE_FROM[] = {84,114,97,110,115,108,105,116,101,114 ,97,116,101,70,114,111,109,0}; // "TransliterateFrom"

	1046

	1047 static const UChar TRANSLITERATE[] = {84,114,97,110,115,108,105,116,101,114,97,1 16,101,0}; // "Transliterate"

	1048

	1049 /**

	1050 * Attempt to find an entry in a single resource bundle. This is

	1051 * a one-sided lookup. findInStaticStore() performs up to two such

	1052 * lookups, one for the source, and one for the target.

	1053 *

	1054 * Do not perform fallback. Return 0 on failure.

	1055 *

	1056 * On success, create a new Entry object, populate it, and return it.

	1057 * The caller owns the returned object.

	1058 */

	1059 TransliteratorEntry* TransliteratorRegistry::findInBundle(const TransliteratorSp ec& specToOpen,

	1060 const TransliteratorSpec& specToFind ,

	1061 const UnicodeString& variant,

	1062 UTransDirection direction)

	1063 {

	1064 UnicodeString utag;

	1065 UnicodeString resStr;

	1066 int32_t pass;

	1067

	1068 for (pass=0; pass<2; ++pass) {

	1069 utag.truncate(0);

	1070 // First try either TransliteratorTo_xxx or

	1071 // TransliterateFrom_xxx, then try the bidirectional

	1072 // Transliterate_xxx. This precedence order is arbitrary

	1073 // but must be consistent and documented.

	1074 if (pass == 0) {

	1075 utag.append(direction == UTRANS_FORWARD ?

	1076 TRANSLITERATE_TO : TRANSLITERATE_FROM);

	1077 } else {

	1078 utag.append(TRANSLITERATE);

	1079 }

	1080 UnicodeString s(specToFind.get());

	1081 utag.append(s.toUpper(""));

	1082 UErrorCode status = U_ZERO_ERROR;

	1083 ResourceBundle subres(specToOpen.getBundle().get(

	1084 CharString().appendInvariantChars(utag, status).data(), status));

	1085 if (U_FAILURE(status) \|\| status == U_USING_DEFAULT_WARNING) {

	1086 continue;

	1087 }

	1088

	1089 s.truncate(0);

	1090 if (specToOpen.get() != LocaleUtility::initNameFromLocale(subres.getLoca le(), s)) {

	1091 continue;

	1092 }

	1093

	1094 if (variant.length() != 0) {

	1095 status = U_ZERO_ERROR;

	1096 resStr = subres.getStringEx(

	1097 CharString().appendInvariantChars(variant, status).data(), statu s);

	1098 if (U_SUCCESS(status)) {

	1099 // Exit loop successfully

	1100 break;

	1101 }

	1102 } else {

	1103 // Variant is empty, which means match the first variant listed.

	1104 status = U_ZERO_ERROR;

	1105 resStr = subres.getStringEx(1, status);

	1106 if (U_SUCCESS(status)) {

	1107 // Exit loop successfully

	1108 break;

	1109 }

	1110 }

	1111 }

	1112

	1113 if (pass==2) {

	1114 // Failed

	1115 return NULL;

	1116 }

	1117

	1118 // We have succeeded in loading a string from the locale

	1119 // resources. Create a new registry entry to hold it and return it.

	1120 TransliteratorEntry *entry = new TransliteratorEntry();

	1121 if (entry != 0) {

	1122 // The direction is always forward for the

	1123 // TransliterateTo_xxx and TransliterateFrom_xxx

	1124 // items; those are unidirectional forward rules.

	1125 // For the bidirectional Transliterate_xxx items,

	1126 // the direction is the value passed in to this

	1127 // function.

	1128 int32_t dir = (pass == 0) ? UTRANS_FORWARD : direction;

	1129 entry->entryType = TransliteratorEntry::LOCALE_RULES;

	1130 entry->stringArg = resStr;

	1131 entry->intArg = dir;

	1132 }

	1133

	1134 return entry;

	1135 }

	1136

	1137 /**

	1138 * Convenience method. Calls 3-arg find().

	1139 */

	1140 TransliteratorEntry* TransliteratorRegistry::find(const UnicodeString& ID) {

	1141 UnicodeString source, target, variant;

	1142 UBool sawSource;

	1143 TransliteratorIDParser::IDtoSTV(ID, source, target, variant, sawSource);

	1144 return find(source, target, variant);

	1145 }

	1146

	1147 /**

	1148 * Top-level find method. Attempt to find a source-target/variant in

	1149 * either the dynamic or the static (locale resource) store. Perform

	1150 * fallback.

	1151 *

	1152 * Lookup sequence for ss_SS_SSS-tt_TT_TTT/v:

	1153 *

	1154 * ss_SS_SSS-tt_TT_TTT/v -- in hashtable

	1155 * ss_SS_SSS-tt_TT_TTT/v -- in ss_SS_SSS (no fallback)

	1156 *

	1157 * repeat with t = tt_TT_TTT, tt_TT, tt, and tscript

	1158 *

	1159 * ss_SS_SSS-t/ *

	1160 * ss_SS-t/ *

	1161 * ss-t/ *

	1162 * sscript-t/ *

	1163 *

	1164 * Here * matches the first variant listed.

	1165 *

	1166 * Caller does NOT own returned object. Return 0 on failure.

	1167 */

	1168 TransliteratorEntry* TransliteratorRegistry::find(UnicodeString& source,

	1169 UnicodeString& target,

	1170 UnicodeString& variant) {

	1171

	1172 TransliteratorSpec src(source);

	1173 TransliteratorSpec trg(target);

	1174 TransliteratorEntry* entry;

	1175

	1176 // Seek exact match in hashtable. Temporary fix for ICU 4.6.

	1177 // TODO: The general logic for finding a matching transliterator needs to be reviewed.

	1178 // ICU ticket #8089

	1179 UnicodeString ID;

	1180 TransliteratorIDParser::STVtoID(source, target, variant, ID);

	1181 entry = (TransliteratorEntry*) registry.get(ID);

	1182 if (entry != 0) {

	1183 // std::string ss;

	1184 // std::cout << ID.toUTF8String(ss) << std::endl;

	1185 return entry;

	1186 }

	1187

	1188 if (variant.length() != 0) {

	1189

	1190 // Seek exact match in hashtable

	1191 entry = findInDynamicStore(src, trg, variant);

	1192 if (entry != 0) {

	1193 return entry;

	1194 }

	1195

	1196 // Seek exact match in locale resources

	1197 entry = findInStaticStore(src, trg, variant);

	1198 if (entry != 0) {

	1199 return entry;

	1200 }

	1201 }

	1202

	1203 for (;;) {

	1204 src.reset();

	1205 for (;;) {

	1206 // Seek match in hashtable

	1207 entry = findInDynamicStore(src, trg, NO_VARIANT);

	1208 if (entry != 0) {

	1209 return entry;

	1210 }

	1211

	1212 // Seek match in locale resources

	1213 entry = findInStaticStore(src, trg, NO_VARIANT);

	1214 if (entry != 0) {

	1215 return entry;

	1216 }

	1217 if (!src.hasFallback()) {

	1218 break;

	1219 }

	1220 src.next();

	1221 }

	1222 if (!trg.hasFallback()) {

	1223 break;

	1224 }

	1225 trg.next();

	1226 }

	1227

	1228 return 0;

	1229 }

	1230

	1231 /**

	1232 * Given an Entry object, instantiate it. Caller owns result. Return

	1233 * 0 on failure.

	1234 *

	1235 * Return a non-empty aliasReturn value if the ID points to an alias.

	1236 * We cannot instantiate it ourselves because the alias may contain

	1237 * filters or compounds, which we do not understand. Caller should

	1238 * make aliasReturn empty before calling.

	1239 *

	1240 * The entry object is assumed to reside in the dynamic store. It may be

	1241 * modified.

	1242 */

	1243 Transliterator* TransliteratorRegistry::instantiateEntry(const UnicodeString& ID ,

	1244 TransliteratorEntry *en try,

	1245 TransliteratorAlias* &a liasReturn,

	1246 UErrorCode& status) {

	1247 Transliterator *t = 0;

	1248 U_ASSERT(aliasReturn == 0);

	1249

	1250 switch (entry->entryType) {

	1251 case TransliteratorEntry::RBT_DATA:

	1252 t = new RuleBasedTransliterator(ID, entry->u.data);

	1253 if (t == 0) {

	1254 status = U_MEMORY_ALLOCATION_ERROR;

	1255 }

	1256 return t;

	1257 case TransliteratorEntry::PROTOTYPE:

	1258 t = entry->u.prototype->clone();

	1259 if (t == 0) {

	1260 status = U_MEMORY_ALLOCATION_ERROR;

	1261 }

	1262 return t;

	1263 case TransliteratorEntry::ALIAS:

	1264 aliasReturn = new TransliteratorAlias(entry->stringArg, entry->compoundF ilter);

	1265 if (aliasReturn == 0) {

	1266 status = U_MEMORY_ALLOCATION_ERROR;

	1267 }

	1268 return 0;

	1269 case TransliteratorEntry::FACTORY:

	1270 t = entry->u.factory.function(ID, entry->u.factory.context);

	1271 if (t == 0) {

	1272 status = U_MEMORY_ALLOCATION_ERROR;

	1273 }

	1274 return t;

	1275 case TransliteratorEntry::COMPOUND_RBT:

	1276 {

	1277 UVector* rbts = new UVector(entry->u.dataVector->size(), status);

	1278 // Check for null pointer

	1279 if (rbts == NULL) {

	1280 status = U_MEMORY_ALLOCATION_ERROR;

	1281 return NULL;

	1282 }

	1283 int32_t passNumber = 1;

	1284 for (int32_t i = 0; U_SUCCESS(status) && i < entry->u.dataVector->si ze(); i++) {

	1285 Transliterator* t = new RuleBasedTransliterator(UnicodeString(Co mpoundTransliterator::PASS_STRING) + (passNumber++),

	1286 (TransliterationRuleData*)(entry->u.dataVector->elementAt(i) ), FALSE);

	1287 if (t == 0)

	1288 status = U_MEMORY_ALLOCATION_ERROR;

	1289 else

	1290 rbts->addElement(t, status);

	1291 }

	1292 if (U_FAILURE(status)) {

	1293 delete rbts;

	1294 return 0;

	1295 }

	1296 aliasReturn = new TransliteratorAlias(ID, entry->stringArg, rbts, en try->compoundFilter);

	1297 }

	1298 if (aliasReturn == 0) {

	1299 status = U_MEMORY_ALLOCATION_ERROR;

	1300 }

	1301 return 0;

	1302 case TransliteratorEntry::LOCALE_RULES:

	1303 aliasReturn = new TransliteratorAlias(ID, entry->stringArg,

	1304 (UTransDirection) entry->intArg);

	1305 if (aliasReturn == 0) {

	1306 status = U_MEMORY_ALLOCATION_ERROR;

	1307 }

	1308 return 0;

	1309 case TransliteratorEntry::RULES_FORWARD:

	1310 case TransliteratorEntry::RULES_REVERSE:

	1311 // Process the rule data into a TransliteratorRuleData object,

	1312 // and possibly also into an ::id header and/or footer. Then

	1313 // we modify the registry with the parsed data and retry.

	1314 {

	1315 TransliteratorParser parser(status);

	1316

	1317 // We use the file name, taken from another resource bundle

	1318 // 2-d array at static init time, as a locale language. We're

	1319 // just using the locale mechanism to map through to a file

	1320 // name; this in no way represents an actual locale.

	1321 //CharString ch(entry->stringArg);

	1322 //UResourceBundle *bundle = ures_openDirect(0, ch, &status);

	1323 UnicodeString rules = entry->stringArg;

	1324 //ures_close(bundle);

	1325

	1326 //if (U_FAILURE(status)) {

	1327 // We have a failure of some kind. Remove the ID from the

	1328 // registry so we don't keep trying. NOTE: This will throw off

	1329 // anyone who is, at the moment, trying to iterate over the

	1330 // available IDs. That's acceptable since we should never

	1331 // really get here except under installation, configuration,

	1332 // or unrecoverable run time memory failures.

	1333 // remove(ID);

	1334 //} else {

	1335

	1336 // If the status indicates a failure, then we don't have any

	1337 // rules -- there is probably an installation error. The list

	1338 // in the root locale should correspond to all the installed

	1339 // transliterators; if it lists something that's not

	1340 // installed, we'll get an error from ResourceBundle.

	1341 aliasReturn = new TransliteratorAlias(ID, rules,

	1342 ((entry->entryType == TransliteratorEntry::RULES_REVERSE) ?

	1343 UTRANS_REVERSE : UTRANS_FORWARD));

	1344 if (aliasReturn == 0) {

	1345 status = U_MEMORY_ALLOCATION_ERROR;

	1346 }

	1347 //}

	1348 }

	1349 return 0;

	1350 default:

	1351 U_ASSERT(FALSE); // can't get here

	1352 return 0;

	1353 }

	1354 }

	1355 U_NAMESPACE_END

	1356

	1357 #endif /* #if !UCONFIG_NO_TRANSLITERATION */

	1358

	1359 //eof

OLD	NEW

« no previous file with comments | « icu46/source/i18n/transreg.h ('k') | icu46/source/i18n/tridpars.h » ('j') | no next file with comments »