OLD | NEW |
(Empty) | |
| 1 /* |
| 2 * Copyright (C) 2007-2010, International Business Machines Corporation and |
| 3 * others. All Rights Reserved. |
| 4 ******************************************************************************** |
| 5 * |
| 6 * File MSGFMT.H |
| 7 * |
| 8 * Modification History: |
| 9 * |
| 10 * Date Name Description |
| 11 * 02/19/97 aliu Converted from java. |
| 12 * 03/20/97 helena Finished first cut of implementation. |
| 13 * 07/22/98 stephen Removed operator!= (defined in Format) |
| 14 * 08/19/2002 srl Removing Javaisms |
| 15 *******************************************************************************/ |
| 16 |
| 17 #ifndef MSGFMT_H |
| 18 #define MSGFMT_H |
| 19 |
| 20 #include "unicode/utypes.h" |
| 21 |
| 22 /** |
| 23 * \file |
| 24 * \brief C++ API: Formats messages in a language-neutral way. |
| 25 */ |
| 26 |
| 27 #if !UCONFIG_NO_FORMATTING |
| 28 |
| 29 #include "unicode/format.h" |
| 30 #include "unicode/locid.h" |
| 31 #include "unicode/parseerr.h" |
| 32 #include "unicode/uchar.h" |
| 33 |
| 34 U_NAMESPACE_BEGIN |
| 35 |
| 36 class NumberFormat; |
| 37 class DateFormat; |
| 38 |
| 39 /** |
| 40 * |
| 41 * MessageFormat produces concatenated messages in a language-neutral |
| 42 * way. Use this whenever concatenating strings that are displayed to |
| 43 * end users. |
| 44 * |
| 45 * <P>A MessageFormat contains an array of <EM>subformats</EM> arranged |
| 46 * within a <EM>template string</EM>. Together, the subformats and |
| 47 * template string determine how the MessageFormat will operate during |
| 48 * formatting and parsing. |
| 49 * |
| 50 * <P>Typically, both the subformats and the template string are |
| 51 * specified at once in a <EM>pattern</EM>. By using different |
| 52 * patterns for different locales, messages may be localized. |
| 53 * |
| 54 * <P>When formatting, MessageFormat takes an array of arguments |
| 55 * and produces a user-readable string. Each argument is a |
| 56 * Formattable object; they may be passed in in an array, or as a |
| 57 * single Formattable object which itself contains an array. Each |
| 58 * argument is matched up with its corresponding subformat, which then |
| 59 * formats it into a string. The resulting strings are then assembled |
| 60 * within the string template of the MessageFormat to produce the |
| 61 * final output string. |
| 62 * |
| 63 * <p><strong>Note:</strong> |
| 64 * In ICU 4.0 MessageFormat supports named arguments. If a named argument |
| 65 * is used, all arguments must be named. Names start with a character in |
| 66 * <code>UCHAR_ID_START</code> and continue with characters in |
| 67 * <code>UCHAR_ID_CONTINUE</code>, in particular they do not start with a digit. |
| 68 * If named arguments are used, {@link #usesNamedArguments()} will return true. |
| 69 * |
| 70 * <p>The other new methods supporting named arguments are |
| 71 * {@link #getFormatNames(UErrorCode& status)}, |
| 72 * {@link #getFormat(const UnicodeString& formatName, UErrorCode& status)}, |
| 73 * {@link #setFormat(const UnicodeString& formatName, const Format& format, UErr
orCode& status)}, |
| 74 * {@link #adoptFormat(const UnicodeString& formatName, Format* formatToAdopt, U
ErrorCode& status)}, |
| 75 * {@link #format(const UnicodeString* argumentNames, const Formattable* argumen
ts, |
| 76 * int32_t count, UnicodeString& appendTo,UErrorCode& status)}. |
| 77 * These methods are all compatible with patterns that do not use named argumen
ts-- |
| 78 * in these cases the keys in the input or output use <code>UnicodeString</code>
s |
| 79 * that name the argument indices, e.g. "0", "1", "2"... etc. |
| 80 * |
| 81 * <p>If this format uses named arguments, certain methods that take or |
| 82 * return arrays do not perform any action, since it is not possible to |
| 83 * identify positions in an array using a name. Of these methods, |
| 84 * UErrorCode is set to U_ILLEGAL_ARGUMENT_ERROR by format, and to |
| 85 * U_ARGUMENT_TYPE_MISMATCH by parse. |
| 86 * These methods are |
| 87 * {@link #adoptFormats(Format** formatsToAdopt, int32_t count)}, |
| 88 * {@link #setFormats(const Format** newFormats,int32_t count)}, |
| 89 * {@link #adoptFormat(int32_t n, Format *newFormat)}, |
| 90 * {@link #setFormat(int32_t n, Format& newFormat)}, |
| 91 * {@link #format(const Formattable* source, int32_t count, UnicodeString& appen
dTo, FieldPosition& ignore, UErrorCode& success)}, |
| 92 * {@link #format(const UnicodeString& pattern,const Formattable* arguments,int3
2_t cnt,UnicodeString& appendTo,UErrorCode& success)}, |
| 93 * {@link #format(const Formattable& source, UnicodeString& appendTo, FieldPosit
ion& ignore, UErrorCode& success)}, |
| 94 * {@link #format(const Formattable* arguments, int32_t cnt, UnicodeString& appe
ndTo, FieldPosition& status, int32_t recursionProtection,UErrorCode& success)}, |
| 95 * {@link #parse(const UnicodeString& source, ParsePosition& pos, int32_t& count
)}, |
| 96 * {@link #parse(const UnicodeString& source, int32_t& cnt, UErrorCode& status)} |
| 97 * |
| 98 * <P> |
| 99 * During parsing, an input string is matched against the string |
| 100 * template of the MessageFormat to produce an array of Formattable |
| 101 * objects. Plain text of the template string is matched directly |
| 102 * against input text. At each position in the template string where |
| 103 * a subformat is located, the subformat is called to parse the |
| 104 * corresponding segment of input text to produce an output argument. |
| 105 * In this way, an array of arguments is created which together |
| 106 * constitute the parse result. |
| 107 * <P> |
| 108 * Parsing may fail or produce unexpected results in a number of |
| 109 * circumstances. |
| 110 * <UL> |
| 111 * <LI>If one of the arguments does not occur in the pattern, it |
| 112 * will be returned as a default Formattable. |
| 113 * <LI>If the format of an argument loses information, such as with |
| 114 * a choice format where a large number formats to "many", then the |
| 115 * parse may not correspond to the originally formatted argument. |
| 116 * <LI>MessageFormat does not handle ChoiceFormat recursion during |
| 117 * parsing; such parses will fail. |
| 118 * <LI>Parsing will not always find a match (or the correct match) if |
| 119 * some part of the parse is ambiguous. For example, if the pattern |
| 120 * "{1},{2}" is used with the string arguments {"a,b", "c"}, it will |
| 121 * format as "a,b,c". When the result is parsed, it will return {"a", |
| 122 * "b,c"}. |
| 123 * <LI>If a single argument is formatted more than once in the string, |
| 124 * then the rightmost subformat in the pattern string will produce the |
| 125 * parse result; prior subformats with the same argument index will |
| 126 * have no effect. |
| 127 * </UL> |
| 128 * Here are some examples of usage: |
| 129 * <P> |
| 130 * Example 1: |
| 131 * <pre> |
| 132 * \code |
| 133 * UErrorCode success = U_ZERO_ERROR; |
| 134 * GregorianCalendar cal(success); |
| 135 * Formattable arguments[] = { |
| 136 * 7L, |
| 137 * Formattable( (Date) cal.getTime(success), Formattable::kIsDate), |
| 138 * "a disturbance in the Force" |
| 139 * }; |
| 140 * |
| 141 * UnicodeString result; |
| 142 * MessageFormat::format( |
| 143 * "At {1,time} on {1,date}, there was {2} on planet {0,number}.", |
| 144 * arguments, 3, result, success ); |
| 145 * |
| 146 * cout << "result: " << result << endl; |
| 147 * //<output>: At 4:34:20 PM on 23-Mar-98, there was a disturbance |
| 148 * // in the Force on planet 7. |
| 149 * \endcode |
| 150 * </pre> |
| 151 * Typically, the message format will come from resources, and the |
| 152 * arguments will be dynamically set at runtime. |
| 153 * <P> |
| 154 * Example 2: |
| 155 * <pre> |
| 156 * \code |
| 157 * success = U_ZERO_ERROR; |
| 158 * Formattable testArgs[] = {3L, "MyDisk"}; |
| 159 * |
| 160 * MessageFormat form( |
| 161 * "The disk \"{1}\" contains {0} file(s).", success ); |
| 162 * |
| 163 * UnicodeString string; |
| 164 * FieldPosition fpos = 0; |
| 165 * cout << "format: " << form.format(testArgs, 2, string, fpos, success ) <<
endl; |
| 166 * |
| 167 * // output, with different testArgs: |
| 168 * // output: The disk "MyDisk" contains 0 file(s). |
| 169 * // output: The disk "MyDisk" contains 1 file(s). |
| 170 * // output: The disk "MyDisk" contains 1,273 file(s). |
| 171 * \endcode |
| 172 * </pre> |
| 173 * |
| 174 * The pattern is of the following form. Legend: |
| 175 * <pre> |
| 176 * \code |
| 177 * {optional item} |
| 178 * (group that may be repeated)* |
| 179 * \endcode |
| 180 * </pre> |
| 181 * Do not confuse optional items with items inside quoted braces, such |
| 182 * as this: "{". Quoted braces are literals. |
| 183 * <pre> |
| 184 * \code |
| 185 * messageFormatPattern := string ( "{" messageFormatElement "}" string )* |
| 186 * |
| 187 * messageFormatElement := argumentIndex | argumentName { "," elementForma
t } |
| 188 * |
| 189 * elementFormat := "time" { "," datetimeStyle } |
| 190 * | "date" { "," datetimeStyle } |
| 191 * | "number" { "," numberStyle } |
| 192 * | "choice" "," choiceStyle |
| 193 * | "spellout" { "," spelloutStyle } |
| 194 * | "ordinal" { "," spelloutStyle } |
| 195 * | "duration" { "," spelloutStyle } |
| 196 * | "plural" "," pluralStyle |
| 197 * | "select" "," selectStyle |
| 198 * |
| 199 * datetimeStyle := "short" |
| 200 * | "medium" |
| 201 * | "long" |
| 202 * | "full" |
| 203 * | dateFormatPattern |
| 204 * |
| 205 * numberStyle := "currency" |
| 206 * | "percent" |
| 207 * | "integer" |
| 208 * | numberFormatPattern |
| 209 * |
| 210 * choiceStyle := choiceFormatPattern |
| 211 * |
| 212 * pluralStyle := pluralFormatPattern |
| 213 * |
| 214 * selectStyle := selectFormatPattern |
| 215 * |
| 216 * spelloutStyle := ruleSetName |
| 217 * \endcode |
| 218 * </pre> |
| 219 * If there is no elementFormat, then the argument must be a string, |
| 220 * which is substituted. If there is no datetimeStyle or numberStyle, |
| 221 * then the default format is used (e.g. NumberFormat::createInstance(), |
| 222 * DateFormat::createTimeInstance(DateFormat::kDefault, ...) or |
| 223 * DateFormat::createDateInstance(DateFormat::kDefault, ...)). For |
| 224 * a RuleBasedNumberFormat, if there is no ruleSetName, the default |
| 225 * rule set is used. For a ChoiceFormat or PluralFormat or SelectFormat, the pat
tern |
| 226 * must always be specified, since there is no default. |
| 227 * <P> |
| 228 * In strings, single quotes can be used to quote syntax characters. |
| 229 * A literal single quote is represented by '', both within and outside |
| 230 * of single-quoted segments. Inside a |
| 231 * messageFormatElement, quotes are <EM>not</EM> removed. For example, |
| 232 * {1,number,$'#',##} will produce a number format with the pound-sign |
| 233 * quoted, with a result such as: "$#31,45". |
| 234 * <P> |
| 235 * If a pattern is used, then unquoted braces in the pattern, if any, |
| 236 * must match: that is, "ab {0} de" and "ab '}' de" are ok, but "ab |
| 237 * {0'}' de" and "ab } de" are not. |
| 238 * <p> |
| 239 * <dl><dt><b>Warning:</b><dd>The rules for using quotes within message |
| 240 * format patterns unfortunately have shown to be somewhat confusing. |
| 241 * In particular, it isn't always obvious to localizers whether single |
| 242 * quotes need to be doubled or not. Make sure to inform localizers about |
| 243 * the rules, and tell them (for example, by using comments in resource |
| 244 * bundle source files) which strings will be processed by MessageFormat. |
| 245 * Note that localizers may need to use single quotes in translated |
| 246 * strings where the original version doesn't have them. |
| 247 * <br>Note also that the simplest way to avoid the problem is to |
| 248 * use the real apostrophe (single quote) character U+2019 (') for |
| 249 * human-readable text, and to use the ASCII apostrophe (U+0027 ' ) |
| 250 * only in program syntax, like quoting in MessageFormat. |
| 251 * See the annotations for U+0027 Apostrophe in The Unicode Standard.</p> |
| 252 * </dl> |
| 253 * <P> |
| 254 * The argumentIndex is a non-negative integer, which corresponds to the |
| 255 * index of the arguments presented in an array to be formatted. The |
| 256 * first argument has argumentIndex 0. |
| 257 * <P> |
| 258 * It is acceptable to have unused arguments in the array. With missing |
| 259 * arguments, or arguments that are not of the right class for the |
| 260 * specified format, a failing UErrorCode result is set. |
| 261 * <P> |
| 262 * <strong>When creating internationalized messages that include plural forms, you |
| 263 * can use a PluralFormat:</strong> |
| 264 * <pre> |
| 265 * \code |
| 266 * UErrorCode err = U_ZERO_ERROR; |
| 267 * UnicodeString t1("{0, plural, one{C''est # fichier} other{Ce sont # fichiers
}} dans la liste."); |
| 268 * MessageFormat* msgFmt = new MessageFormat(t1, Locale("fr"), err); |
| 269 * if (U_FAILURE(err)) { |
| 270 * return err; |
| 271 * } |
| 272 * |
| 273 * Formattable args1[] = {(int32_t)0}; |
| 274 * Formattable args2[] = {(int32_t)3}; |
| 275 * FieldPosition ignore(FieldPosition::DONT_CARE); |
| 276 * UnicodeString result; |
| 277 * msgFmt->format(args1, 1, result, ignore, err); |
| 278 * cout << result << endl; |
| 279 * result.remove(); |
| 280 * msgFmt->format(args2, 1, result, ignore, err); |
| 281 * cout << result << endl; |
| 282 * |
| 283 * // output, with different args |
| 284 * // output: C'est 0,0 fichier dans la liste. |
| 285 * // output: Ce sont 3 fichiers dans la liste. |
| 286 * \endcode |
| 287 * </pre> |
| 288 * Please check PluralFormat and PluralRules for details. |
| 289 * </P> |
| 290 */ |
| 291 class U_I18N_API MessageFormat : public Format { |
| 292 public: |
| 293 /** |
| 294 * Enum type for kMaxFormat. |
| 295 * @obsolete ICU 3.0. The 10-argument limit was removed as of ICU 2.6, |
| 296 * rendering this enum type obsolete. |
| 297 */ |
| 298 enum EFormatNumber { |
| 299 /** |
| 300 * The maximum number of arguments. |
| 301 * @obsolete ICU 3.0. The 10-argument limit was removed as of ICU 2.6, |
| 302 * rendering this constant obsolete. |
| 303 */ |
| 304 kMaxFormat = 10 |
| 305 }; |
| 306 |
| 307 /** |
| 308 * Constructs a new MessageFormat using the given pattern and the |
| 309 * default locale. |
| 310 * |
| 311 * @param pattern Pattern used to construct object. |
| 312 * @param status Input/output error code. If the |
| 313 * pattern cannot be parsed, set to failure code. |
| 314 * @stable ICU 2.0 |
| 315 */ |
| 316 MessageFormat(const UnicodeString& pattern, |
| 317 UErrorCode &status); |
| 318 |
| 319 /** |
| 320 * Constructs a new MessageFormat using the given pattern and locale. |
| 321 * @param pattern Pattern used to construct object. |
| 322 * @param newLocale The locale to use for formatting dates and numbers. |
| 323 * @param status Input/output error code. If the |
| 324 * pattern cannot be parsed, set to failure code. |
| 325 * @stable ICU 2.0 |
| 326 */ |
| 327 MessageFormat(const UnicodeString& pattern, |
| 328 const Locale& newLocale, |
| 329 UErrorCode& status); |
| 330 /** |
| 331 * Constructs a new MessageFormat using the given pattern and locale. |
| 332 * @param pattern Pattern used to construct object. |
| 333 * @param newLocale The locale to use for formatting dates and numbers. |
| 334 * @param parseError Struct to receive information on position |
| 335 * of error within the pattern. |
| 336 * @param status Input/output error code. If the |
| 337 * pattern cannot be parsed, set to failure code. |
| 338 * @stable ICU 2.0 |
| 339 */ |
| 340 MessageFormat(const UnicodeString& pattern, |
| 341 const Locale& newLocale, |
| 342 UParseError& parseError, |
| 343 UErrorCode& status); |
| 344 /** |
| 345 * Constructs a new MessageFormat from an existing one. |
| 346 * @stable ICU 2.0 |
| 347 */ |
| 348 MessageFormat(const MessageFormat&); |
| 349 |
| 350 /** |
| 351 * Assignment operator. |
| 352 * @stable ICU 2.0 |
| 353 */ |
| 354 const MessageFormat& operator=(const MessageFormat&); |
| 355 |
| 356 /** |
| 357 * Destructor. |
| 358 * @stable ICU 2.0 |
| 359 */ |
| 360 virtual ~MessageFormat(); |
| 361 |
| 362 /** |
| 363 * Clones this Format object polymorphically. The caller owns the |
| 364 * result and should delete it when done. |
| 365 * @stable ICU 2.0 |
| 366 */ |
| 367 virtual Format* clone(void) const; |
| 368 |
| 369 /** |
| 370 * Returns true if the given Format objects are semantically equal. |
| 371 * Objects of different subclasses are considered unequal. |
| 372 * @param other the object to be compared with. |
| 373 * @return true if the given Format objects are semantically equal. |
| 374 * @stable ICU 2.0 |
| 375 */ |
| 376 virtual UBool operator==(const Format& other) const; |
| 377 |
| 378 /** |
| 379 * Sets the locale. This locale is used for fetching default number or date |
| 380 * format information. |
| 381 * @param theLocale the new locale value to be set. |
| 382 * @stable ICU 2.0 |
| 383 */ |
| 384 virtual void setLocale(const Locale& theLocale); |
| 385 |
| 386 /** |
| 387 * Gets the locale. This locale is used for fetching default number or date |
| 388 * format information. |
| 389 * @return the locale of the object. |
| 390 * @stable ICU 2.0 |
| 391 */ |
| 392 virtual const Locale& getLocale(void) const; |
| 393 |
| 394 /** |
| 395 * Applies the given pattern string to this message format. |
| 396 * |
| 397 * @param pattern The pattern to be applied. |
| 398 * @param status Input/output error code. If the |
| 399 * pattern cannot be parsed, set to failure code. |
| 400 * @stable ICU 2.0 |
| 401 */ |
| 402 virtual void applyPattern(const UnicodeString& pattern, |
| 403 UErrorCode& status); |
| 404 /** |
| 405 * Applies the given pattern string to this message format. |
| 406 * |
| 407 * @param pattern The pattern to be applied. |
| 408 * @param parseError Struct to receive information on position |
| 409 * of error within pattern. |
| 410 * @param status Input/output error code. If the |
| 411 * pattern cannot be parsed, set to failure code. |
| 412 * @stable ICU 2.0 |
| 413 */ |
| 414 virtual void applyPattern(const UnicodeString& pattern, |
| 415 UParseError& parseError, |
| 416 UErrorCode& status); |
| 417 |
| 418 /** |
| 419 * Returns a pattern that can be used to recreate this object. |
| 420 * |
| 421 * @param appendTo Output parameter to receive the pattern. |
| 422 * Result is appended to existing contents. |
| 423 * @return Reference to 'appendTo' parameter. |
| 424 * @stable ICU 2.0 |
| 425 */ |
| 426 virtual UnicodeString& toPattern(UnicodeString& appendTo) const; |
| 427 |
| 428 /** |
| 429 * Sets subformats. |
| 430 * See the class description about format numbering. |
| 431 * The caller should not delete the Format objects after this call. |
| 432 * <EM>The array formatsToAdopt is not itself adopted.</EM> Its |
| 433 * ownership is retained by the caller. If the call fails because |
| 434 * memory cannot be allocated, then the formats will be deleted |
| 435 * by this method, and this object will remain unchanged. |
| 436 * |
| 437 * <p>If this format uses named arguments, the new formats are discarded |
| 438 * and this format remains unchanged. |
| 439 * |
| 440 * @stable ICU 2.0 |
| 441 * @param formatsToAdopt the format to be adopted. |
| 442 * @param count the size of the array. |
| 443 */ |
| 444 virtual void adoptFormats(Format** formatsToAdopt, int32_t count); |
| 445 |
| 446 /** |
| 447 * Sets subformats. |
| 448 * See the class description about format numbering. |
| 449 * Each item in the array is cloned into the internal array. |
| 450 * If the call fails because memory cannot be allocated, then this |
| 451 * object will remain unchanged. |
| 452 * |
| 453 * <p>If this format uses named arguments, the new formats are discarded |
| 454 * and this format remains unchanged. |
| 455 * |
| 456 * @stable ICU 2.0 |
| 457 * @param newFormats the new format to be set. |
| 458 * @param cnt the size of the array. |
| 459 */ |
| 460 virtual void setFormats(const Format** newFormats, int32_t cnt); |
| 461 |
| 462 |
| 463 /** |
| 464 * Sets one subformat. |
| 465 * See the class description about format numbering. |
| 466 * The caller should not delete the Format object after this call. |
| 467 * If the number is over the number of formats already set, |
| 468 * the item will be deleted and ignored. |
| 469 * |
| 470 * <p>If this format uses named arguments, the new format is discarded |
| 471 * and this format remains unchanged. |
| 472 * |
| 473 * @stable ICU 2.0 |
| 474 * @param formatNumber index of the subformat. |
| 475 * @param formatToAdopt the format to be adopted. |
| 476 */ |
| 477 virtual void adoptFormat(int32_t formatNumber, Format* formatToAdopt); |
| 478 |
| 479 /** |
| 480 * Sets one subformat. |
| 481 * See the class description about format numbering. |
| 482 * If the number is over the number of formats already set, |
| 483 * the item will be ignored. |
| 484 * @param formatNumber index of the subformat. |
| 485 * @param format the format to be set. |
| 486 * @stable ICU 2.0 |
| 487 */ |
| 488 virtual void setFormat(int32_t formatNumber, const Format& format); |
| 489 |
| 490 /** |
| 491 * Gets format names. This function returns formatNames in StringEnumeration
s |
| 492 * which can be used with getFormat() and setFormat() to export formattable |
| 493 * array from current MessageFormat to another. It is the caller's responsibilit
y |
| 494 * to delete the returned formatNames. |
| 495 * @param status output param set to success/failure code. |
| 496 * @stable ICU 4.0 |
| 497 */ |
| 498 virtual StringEnumeration* getFormatNames(UErrorCode& status); |
| 499 |
| 500 /** |
| 501 * Gets subformat pointer for given format name. |
| 502 * This function supports both named and numbered |
| 503 * arguments-- if numbered, the formatName is the |
| 504 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). |
| 505 * The returned Format object should not be deleted by the caller, |
| 506 * nor should the pointer of other object. The pointer and its |
| 507 * contents remain valid only until the next call to any method |
| 508 * of this class is made with this object. |
| 509 * @param formatName the name or number specifying a format |
| 510 * @param status output param set to success/failure code. |
| 511 * @stable ICU 4.0 |
| 512 */ |
| 513 virtual Format* getFormat(const UnicodeString& formatName, UErrorCode& statu
s); |
| 514 |
| 515 /** |
| 516 * Sets one subformat for given format name. |
| 517 * See the class description about format name. |
| 518 * This function supports both named and numbered |
| 519 * arguments-- if numbered, the formatName is the |
| 520 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). |
| 521 * If there is no matched formatName or wrong type, |
| 522 * the item will be ignored. |
| 523 * @param formatName Name of the subformat. |
| 524 * @param format the format to be set. |
| 525 * @param status output param set to success/failure code. |
| 526 * @stable ICU 4.0 |
| 527 */ |
| 528 virtual void setFormat(const UnicodeString& formatName, const Format& format
, UErrorCode& status); |
| 529 |
| 530 /** |
| 531 * Sets one subformat for given format name. |
| 532 * See the class description about format name. |
| 533 * This function supports both named and numbered |
| 534 * arguments-- if numbered, the formatName is the |
| 535 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). |
| 536 * If there is no matched formatName or wrong type, |
| 537 * the item will be ignored. |
| 538 * The caller should not delete the Format object after this call. |
| 539 * @param formatName Name of the subformat. |
| 540 * @param formatToAdopt Format to be adopted. |
| 541 * @param status output param set to success/failure code. |
| 542 * @stable ICU 4.0 |
| 543 */ |
| 544 virtual void adoptFormat(const UnicodeString& formatName, Format* formatToAd
opt, UErrorCode& status); |
| 545 |
| 546 /** |
| 547 * Gets an array of subformats of this object. The returned array |
| 548 * should not be deleted by the caller, nor should the pointers |
| 549 * within the array. The array and its contents remain valid only |
| 550 * until the next call to this format. See the class description |
| 551 * about format numbering. |
| 552 * |
| 553 * @param count output parameter to receive the size of the array |
| 554 * @return an array of count Format* objects, or NULL if out of |
| 555 * memory. Any or all of the array elements may be NULL. |
| 556 * @stable ICU 2.0 |
| 557 */ |
| 558 virtual const Format** getFormats(int32_t& count) const; |
| 559 |
| 560 |
| 561 using Format::format; |
| 562 |
| 563 /** |
| 564 * Formats the given array of arguments into a user-readable string. |
| 565 * Does not take ownership of the Formattable* array or its contents. |
| 566 * |
| 567 * <p>If this format uses named arguments, appendTo is unchanged and |
| 568 * status is set to U_ILLEGAL_ARGUMENT_ERROR. |
| 569 * |
| 570 * @param source An array of objects to be formatted. |
| 571 * @param count The number of elements of 'source'. |
| 572 * @param appendTo Output parameter to receive result. |
| 573 * Result is appended to existing contents. |
| 574 * @param ignore Not used; inherited from base class API. |
| 575 * @param status Input/output error code. If the |
| 576 * pattern cannot be parsed, set to failure code. |
| 577 * @return Reference to 'appendTo' parameter. |
| 578 * @stable ICU 2.0 |
| 579 */ |
| 580 UnicodeString& format(const Formattable* source, |
| 581 int32_t count, |
| 582 UnicodeString& appendTo, |
| 583 FieldPosition& ignore, |
| 584 UErrorCode& status) const; |
| 585 |
| 586 /** |
| 587 * Formats the given array of arguments into a user-readable string |
| 588 * using the given pattern. |
| 589 * |
| 590 * <p>If this format uses named arguments, appendTo is unchanged and |
| 591 * status is set to U_ILLEGAL_ARGUMENT_ERROR. |
| 592 * |
| 593 * @param pattern The pattern. |
| 594 * @param arguments An array of objects to be formatted. |
| 595 * @param count The number of elements of 'arguments'. |
| 596 * @param appendTo Output parameter to receive result. |
| 597 * Result is appended to existing contents. |
| 598 * @param status Input/output error code. If the |
| 599 * pattern cannot be parsed, set to failure code. |
| 600 * @return Reference to 'appendTo' parameter. |
| 601 * @stable ICU 2.0 |
| 602 */ |
| 603 static UnicodeString& format(const UnicodeString& pattern, |
| 604 const Formattable* arguments, |
| 605 int32_t count, |
| 606 UnicodeString& appendTo, |
| 607 UErrorCode& status); |
| 608 |
| 609 /** |
| 610 * Formats the given array of arguments into a user-readable |
| 611 * string. The array must be stored within a single Formattable |
| 612 * object of type kArray. If the Formattable object type is not of |
| 613 * type kArray, then returns a failing UErrorCode. |
| 614 * |
| 615 * <p>If this format uses named arguments, appendTo is unchanged and |
| 616 * status is set to U_ILLEGAL_ARGUMENT_ERROR. |
| 617 * |
| 618 * @param obj A Formattable of type kArray containing |
| 619 * arguments to be formatted. |
| 620 * @param appendTo Output parameter to receive result. |
| 621 * Result is appended to existing contents. |
| 622 * @param pos On input: an alignment field, if desired. |
| 623 * On output: the offsets of the alignment field. |
| 624 * @param status Input/output error code. If the |
| 625 * pattern cannot be parsed, set to failure code. |
| 626 * @return Reference to 'appendTo' parameter. |
| 627 * @stable ICU 2.0 |
| 628 */ |
| 629 virtual UnicodeString& format(const Formattable& obj, |
| 630 UnicodeString& appendTo, |
| 631 FieldPosition& pos, |
| 632 UErrorCode& status) const; |
| 633 |
| 634 /** |
| 635 * Formats the given array of arguments into a user-readable |
| 636 * string. The array must be stored within a single Formattable |
| 637 * object of type kArray. If the Formattable object type is not of |
| 638 * type kArray, then returns a failing UErrorCode. |
| 639 * |
| 640 * @param obj The object to format |
| 641 * @param appendTo Output parameter to receive result. |
| 642 * Result is appended to existing contents. |
| 643 * @param status Input/output error code. If the |
| 644 * pattern cannot be parsed, set to failure code. |
| 645 * @return Reference to 'appendTo' parameter. |
| 646 * @stable ICU 2.0 |
| 647 */ |
| 648 UnicodeString& format(const Formattable& obj, |
| 649 UnicodeString& appendTo, |
| 650 UErrorCode& status) const; |
| 651 |
| 652 |
| 653 /** |
| 654 * Formats the given array of arguments into a user-defined argument name |
| 655 * array. This function supports both named and numbered |
| 656 * arguments-- if numbered, the formatName is the |
| 657 * corresponding UnicodeStrings (e.g. "0", "1", "2"...). |
| 658 * |
| 659 * @param argumentNames argument name array |
| 660 * @param arguments An array of objects to be formatted. |
| 661 * @param count The number of elements of 'argumentNames' and |
| 662 * arguments. The number of argumentNames and arguments |
| 663 * must be the same. |
| 664 * @param appendTo Output parameter to receive result. |
| 665 * Result is appended to existing contents. |
| 666 * @param status Input/output error code. If the |
| 667 * pattern cannot be parsed, set to failure code. |
| 668 * @return Reference to 'appendTo' parameter. |
| 669 * @stable ICU 4.0 |
| 670 */ |
| 671 UnicodeString& format(const UnicodeString* argumentNames, |
| 672 const Formattable* arguments, |
| 673 int32_t count, |
| 674 UnicodeString& appendTo, |
| 675 UErrorCode& status) const; |
| 676 /** |
| 677 * Parses the given string into an array of output arguments. |
| 678 * |
| 679 * @param source String to be parsed. |
| 680 * @param pos On input, starting position for parse. On output, |
| 681 * final position after parse. Unchanged if parse |
| 682 * fails. |
| 683 * @param count Output parameter to receive the number of arguments |
| 684 * parsed. |
| 685 * @return an array of parsed arguments. The caller owns both |
| 686 * the array and its contents. |
| 687 * @stable ICU 2.0 |
| 688 */ |
| 689 virtual Formattable* parse(const UnicodeString& source, |
| 690 ParsePosition& pos, |
| 691 int32_t& count) const; |
| 692 |
| 693 /** |
| 694 * Parses the given string into an array of output arguments. |
| 695 * |
| 696 * <p>If this format uses named arguments, status is set to |
| 697 * U_ARGUMENT_TYPE_MISMATCH. |
| 698 * |
| 699 * @param source String to be parsed. |
| 700 * @param count Output param to receive size of returned array. |
| 701 * @param status Input/output error code. If the |
| 702 * pattern cannot be parsed, set to failure code. |
| 703 * @return an array of parsed arguments. The caller owns both |
| 704 * the array and its contents. Returns NULL if status is not U_ZERO_ERROR. |
| 705 * |
| 706 * @stable ICU 2.0 |
| 707 */ |
| 708 virtual Formattable* parse(const UnicodeString& source, |
| 709 int32_t& count, |
| 710 UErrorCode& status) const; |
| 711 |
| 712 /** |
| 713 * Parses the given string into an array of output arguments |
| 714 * stored within a single Formattable of type kArray. |
| 715 * |
| 716 * @param source The string to be parsed into an object. |
| 717 * @param result Formattable to be set to the parse result. |
| 718 * If parse fails, return contents are undefined. |
| 719 * @param pos On input, starting position for parse. On output, |
| 720 * final position after parse. Unchanged if parse |
| 721 * fails. |
| 722 * @stable ICU 2.0 |
| 723 */ |
| 724 virtual void parseObject(const UnicodeString& source, |
| 725 Formattable& result, |
| 726 ParsePosition& pos) const; |
| 727 |
| 728 /** |
| 729 * Converts an 'apostrophe-friendly' pattern into a standard |
| 730 * pattern. Standard patterns treat all apostrophes as |
| 731 * quotes, which is problematic in some languages, e.g. |
| 732 * French, where the apostrophe is commonly used. This utility |
| 733 * assumes that only an unpaired apostrophe immediately before |
| 734 * a brace is a true quote. Other unpaired apostrophes are paired, |
| 735 * and the resulting standard pattern string is returned. |
| 736 * |
| 737 * <p><b>Note</b>: it is not guaranteed that the returned pattern |
| 738 * is indeed a valid pattern. The only effect is to convert |
| 739 * between patterns having different quoting semantics. |
| 740 * |
| 741 * @param pattern the 'apostrophe-friendly' pattern to convert |
| 742 * @param status Input/output error code. If the pattern |
| 743 * cannot be parsed, the failure code is set. |
| 744 * @return the standard equivalent of the original pattern |
| 745 * @stable ICU 3.4 |
| 746 */ |
| 747 static UnicodeString autoQuoteApostrophe(const UnicodeString& pattern, |
| 748 UErrorCode& status); |
| 749 |
| 750 /** |
| 751 * Returns true if this MessageFormat uses named arguments, |
| 752 * and false otherwise. See class description. |
| 753 * |
| 754 * @return true if named arguments are used. |
| 755 * @stable ICU 4.0 |
| 756 */ |
| 757 UBool usesNamedArguments() const; |
| 758 |
| 759 |
| 760 /** |
| 761 * This API is for ICU internal use only. |
| 762 * Please do not use it. |
| 763 * |
| 764 * Returns the number of argument types in the parsed pattern. |
| 765 * Used to distinguish a pattern such as "{0} d" from "d". |
| 766 * |
| 767 * @return The number of formattable types in the pattern |
| 768 * @internal |
| 769 */ |
| 770 int32_t getArgTypeCount() const; |
| 771 |
| 772 /** |
| 773 * Returns a unique class ID POLYMORPHICALLY. Pure virtual override. |
| 774 * This method is to implement a simple version of RTTI, since not all |
| 775 * C++ compilers support genuine RTTI. Polymorphic operator==() and |
| 776 * clone() methods call this method. |
| 777 * |
| 778 * @return The class ID for this object. All objects of a |
| 779 * given class have the same class ID. Objects of |
| 780 * other classes have different class IDs. |
| 781 * @stable ICU 2.0 |
| 782 */ |
| 783 virtual UClassID getDynamicClassID(void) const; |
| 784 |
| 785 /** |
| 786 * Return the class ID for this class. This is useful only for |
| 787 * comparing to a return value from getDynamicClassID(). For example: |
| 788 * <pre> |
| 789 * . Base* polymorphic_pointer = createPolymorphicObject(); |
| 790 * . if (polymorphic_pointer->getDynamicClassID() == |
| 791 * . Derived::getStaticClassID()) ... |
| 792 * </pre> |
| 793 * @return The class ID for all objects of this class. |
| 794 * @stable ICU 2.0 |
| 795 */ |
| 796 static UClassID U_EXPORT2 getStaticClassID(void); |
| 797 |
| 798 private: |
| 799 |
| 800 Locale fLocale; |
| 801 UnicodeString fPattern; |
| 802 Format** formatAliases; // see getFormats |
| 803 int32_t formatAliasesCapacity; |
| 804 UProperty idStart; |
| 805 UProperty idContinue; |
| 806 |
| 807 MessageFormat(); // default constructor not implemented |
| 808 |
| 809 /* |
| 810 * A structure representing one subformat of this MessageFormat. |
| 811 * Each subformat has a Format object, an offset into the plain |
| 812 * pattern text fPattern, and an argument number. The argument |
| 813 * number corresponds to the array of arguments to be formatted. |
| 814 * @internal |
| 815 */ |
| 816 class Subformat; |
| 817 |
| 818 /** |
| 819 * A MessageFormat contains an array of subformats. This array |
| 820 * needs to grow dynamically if the MessageFormat is modified. |
| 821 */ |
| 822 Subformat* subformats; |
| 823 int32_t subformatCount; |
| 824 int32_t subformatCapacity; |
| 825 |
| 826 /** |
| 827 * A MessageFormat formats an array of arguments. Each argument |
| 828 * has an expected type, based on the pattern. For example, if |
| 829 * the pattern contains the subformat "{3,number,integer}", then |
| 830 * we expect argument 3 to have type Formattable::kLong. This |
| 831 * array needs to grow dynamically if the MessageFormat is |
| 832 * modified. |
| 833 */ |
| 834 Formattable::Type* argTypes; |
| 835 int32_t argTypeCount; |
| 836 int32_t argTypeCapacity; |
| 837 |
| 838 /** |
| 839 * Is true iff all argument names are non-negative numbers. |
| 840 * |
| 841 */ |
| 842 UBool isArgNumeric; |
| 843 |
| 844 // Variable-size array management |
| 845 UBool allocateSubformats(int32_t capacity); |
| 846 UBool allocateArgTypes(int32_t capacity); |
| 847 |
| 848 /** |
| 849 * Default Format objects used when no format is specified and a |
| 850 * numeric or date argument is formatted. These are volatile |
| 851 * cache objects maintained only for performance. They do not |
| 852 * participate in operator=(), copy constructor(), nor |
| 853 * operator==(). |
| 854 */ |
| 855 NumberFormat* defaultNumberFormat; |
| 856 DateFormat* defaultDateFormat; |
| 857 |
| 858 /** |
| 859 * Method to retrieve default formats (or NULL on failure). |
| 860 * These are semantically const, but may modify *this. |
| 861 */ |
| 862 const NumberFormat* getDefaultNumberFormat(UErrorCode&) const; |
| 863 const DateFormat* getDefaultDateFormat(UErrorCode&) const; |
| 864 |
| 865 /** |
| 866 * Finds the word s in the keyword list and returns the index at which it was located. |
| 867 * @param s the keyword to be searched for. |
| 868 * @param list the list of keywords to be searched. |
| 869 * @return the index of the entry in list that matches the keyword s. |
| 870 */ |
| 871 static int32_t findKeyword( const UnicodeString& s, |
| 872 const UChar * const *list); |
| 873 |
| 874 /** |
| 875 * Formats the array of arguments, appends the result to the |
| 876 * result buffer, and updates the field position. |
| 877 * |
| 878 * @param arguments The array of Formattable objects to format. |
| 879 * @param cnt The number of elements in the arguments array. |
| 880 * @param appendTo Output parameter to receive result. |
| 881 * Result is appended to existing contents. |
| 882 * @param status Field position status (a FieldPosition, not an error code). |
| 883 * @param recursionProtection |
| 884 * Initially zero. Bits 0..9 are used to indicate |
| 885 * that a parameter has already been seen, to |
| 886 * avoid recursion. Currently unused. |
| 887 * @param success The error code status (a UErrorCode). |
| 888 * @return Reference to 'appendTo' parameter. |
| 889 */ |
| 890 UnicodeString& format( const Formattable* arguments, |
| 891 int32_t cnt, |
| 892 UnicodeString& appendTo, |
| 893 FieldPosition& status, |
| 894 int32_t recursionProtection, |
| 895 UErrorCode& success) const; |
| 896 |
| 897 UnicodeString& format( const Formattable* arguments, |
| 898 const UnicodeString *argumentNames, |
| 899 int32_t cnt, |
| 900 UnicodeString& appendTo, |
| 901 FieldPosition& status, |
| 902 int32_t recursionProtection, |
| 903 UErrorCode& success) const; |
| 904 |
| 905 void makeFormat(int32_t offsetNumber, |
| 906 UnicodeString* segments, |
| 907 UParseError& parseError, |
| 908 UErrorCode& success); |
| 909 |
| 910 /** |
| 911 * Convenience method that ought to be in NumberFormat. Takes a locale and an input/output error code and returns a NumberFormat pointer. NOTE(review): ownership of the returned object is not stated here - confirm in the implementation. |
| 912 */ |
| 913 NumberFormat* createIntegerFormat(const Locale& locale, UErrorCode& status) const; |
| 914 |
| 915 /** |
| 916 * Checks the range of the source text to quote the special |
| 917 * characters, { and ', and copies it to the target buffer. |
| 918 * @param appendTo the source text to read from; it is a const reference and is not modified. NOTE(review): the name looks swapped with the output parameter - confirm against the implementation. |
| 919 * @param start the text offset at which to start processing in the source string |
| 920 * @param end the text offset at which to end processing in the source string |
| 921 * @param target Output parameter to receive result. |
| 922 * Result is appended to existing contents. |
| 923 */ |
| 924 static void copyAndFixQuotes(const UnicodeString& appendTo, int32_t start, int32_t end, UnicodeString& target); |
| 925 |
| 926 /** |
| 927 * Exposes the array of argument types of the parsed pattern |
| 928 * to the C API. Intended only for umsg_vformat(); not |
| 929 * for public consumption. |
| 930 * @param listCount Output parameter; set to argTypeCount, the size of the returned array |
| 931 * @return The internal argTypes array of formattable types (the member pointer itself, not a copy) |
| 932 * @internal |
| 933 */ |
| 934 const Formattable::Type* getArgTypeList(int32_t& listCount) const { |
| 935 const Formattable::Type* const typeList = argTypes; |
| 936 listCount = argTypeCount; |
| 937 return typeList; } |
| 938 |
| 939 /** |
| 940 * Returns FALSE if the argument name is not legal. |
| 941 * @param argName argument name. |
| 942 * @return TRUE if the argument name is legal, otherwise return FALSE. |
| 943 */ |
| 944 UBool isLegalArgName(const UnicodeString& argName) const; |
| 945 |
| 946 friend class MessageFormatAdapter; // getArgTypeList() access |
| 947 }; |
| 948 |
| 949 // Single-Formattable overload: delegates directly to Format::format() with the same arguments. |
| 950 inline UnicodeString& MessageFormat::format(const Formattable& obj, UnicodeString& appendTo, UErrorCode& status) const |
| 951 { |
| 952 UnicodeString& formatted = Format::format(obj, appendTo, status); |
| 953 return formatted; |
| 954 } |
| 955 |
| 956 U_NAMESPACE_END |
| 957 |
| 958 #endif /* #if !UCONFIG_NO_FORMATTING */ |
| 959 |
| 960 #endif // MSGFMT_H |
| 961 //eof |
OLD | NEW |