| Index: third_party/libaddressinput/chromium/cpp/src/language.cc
|
| diff --git a/third_party/libaddressinput/chromium/cpp/src/language.cc b/third_party/libaddressinput/chromium/cpp/src/language.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..f025e620da15e3d4b9fd01d69047bc7e5f6e8f39
|
| --- /dev/null
|
| +++ b/third_party/libaddressinput/chromium/cpp/src/language.cc
|
| @@ -0,0 +1,102 @@
|
| +// Copyright (C) 2014 Google Inc.
|
| +//
|
| +// Licensed under the Apache License, Version 2.0 (the "License");
|
| +// you may not use this file except in compliance with the License.
|
| +// You may obtain a copy of the License at
|
| +//
|
| +// http://www.apache.org/licenses/LICENSE-2.0
|
| +//
|
| +// Unless required by applicable law or agreed to in writing, software
|
| +// distributed under the License is distributed on an "AS IS" BASIS,
|
| +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
| +// See the License for the specific language governing permissions and
|
| +// limitations under the License.
|
| +
|
| +#include "language.h"
|
| +
|
| +#include <algorithm>
|
| +#include <cctype>
|
| +#include <string>
|
| +#include <vector>
|
| +
|
| +#include "rule.h"
|
| +#include "util/string_util.h"
|
| +
|
| +namespace i18n {
|
| +namespace addressinput {
|
| +
|
| +Language::Language(const std::string& language_tag) : tag(language_tag),
|
| + base(),
|
| + has_latin_script(false) {
|
| + // Character '-' is the separator for subtags in the BCP 47. However, some
|
| + // legacy code generates tags with '_' instead of '-'.
|
| + static const char kSubtagsSeparator = '-';
|
| + static const char kAlternativeSubtagsSeparator = '_';
|
| + std::replace(tag.begin(), tag.end(), kAlternativeSubtagsSeparator,
|
| + kSubtagsSeparator);
|
| +
|
| + // OK to use 'tolower' because BCP 47 tags are always in ASCII.
|
| + std::string lowercase = tag;
|
| + std::transform(lowercase.begin(), lowercase.end(), lowercase.begin(),
|
| + tolower);
|
| +
|
| + base = lowercase.substr(0, lowercase.find(kSubtagsSeparator));
|
| +
|
| + // The lowercase BCP 47 subtag for Latin script.
|
| + static const char kLowercaseLatinScript[] = "latn";
|
| + std::vector<std::string> subtags;
|
| + SplitString(lowercase, kSubtagsSeparator, &subtags);
|
| +
|
| + // Support only the second and third position for the script.
|
| + has_latin_script =
|
| + (subtags.size() > 1 && subtags[1] == kLowercaseLatinScript) ||
|
| + (subtags.size() > 2 && subtags[2] == kLowercaseLatinScript);
|
| +}
|
| +
|
| +Language::~Language() {}
|
| +
|
| +Language ChooseBestAddressLanguage(const Rule& address_region_rule,
|
| + const Language& ui_language) {
|
| + if (address_region_rule.GetLanguages().empty()) {
|
| + return ui_language;
|
| + }
|
| +
|
| + std::vector<Language> available_languages;
|
| + for (std::vector<std::string>::const_iterator
|
| + language_tag_it = address_region_rule.GetLanguages().begin();
|
| + language_tag_it != address_region_rule.GetLanguages().end();
|
| + ++language_tag_it) {
|
| + available_languages.push_back(Language(*language_tag_it));
|
| + }
|
| +
|
| + if (ui_language.tag.empty()) {
|
| + return available_languages.front();
|
| + }
|
| +
|
| + bool has_latin_format = !address_region_rule.GetLatinFormat().empty();
|
| +
|
| + // The conventionally formatted BCP 47 Latin script with a preceding subtag
|
| + // separator.
|
| + static const char kLatinScriptSuffix[] = "-Latn";
|
| + Language latin_script_language(
|
| + available_languages.front().base + kLatinScriptSuffix);
|
| + if (has_latin_format && ui_language.has_latin_script) {
|
| + return latin_script_language;
|
| + }
|
| +
|
| + for (std::vector<Language>::const_iterator
|
| + available_lang_it = available_languages.begin();
|
| + available_lang_it != available_languages.end(); ++available_lang_it) {
|
| + // Base language comparison works because no region supports the same base
|
| + // language with different scripts, for now. For example, no region supports
|
| + // "zh-Hant" and "zh-Hans" at the same time.
|
| + if (ui_language.base == available_lang_it->base) {
|
| + return *available_lang_it;
|
| + }
|
| + }
|
| +
|
| + return has_latin_format ? latin_script_language : available_languages.front();
|
| +}
|
| +
|
| +} // namespace addressinput
|
| +} // namespace i18n
|
|
|