OLD | NEW |
---|---|
(Empty) | |
1 // Copyright 2014 The Chromium Authors. All rights reserved. | |
please use gerrit instead
2014/06/05 22:22:47
To reduce reviewer burden: Don't delete all unused
| |
2 // Use of this source code is governed by a BSD-style license that can be | |
3 // found in the LICENSE file. | |
4 | |
5 #include "cpp/src/util/canonicalize_string.h" | |
6 | |
7 #include "base/logging.h" | |
8 #include "cpp/include/libaddressinput/util/scoped_ptr.h" | |
9 #include "third_party/icu/source/common/unicode/errorcode.h" | |
10 #include "third_party/icu/source/common/unicode/locid.h" | |
11 #include "third_party/icu/source/common/unicode/unistr.h" | |
12 #include "third_party/icu/source/common/unicode/utypes.h" | |
13 #include "third_party/icu/source/i18n/unicode/coll.h" | |
14 | |
15 namespace i18n { | |
16 namespace addressinput { | |
17 | |
18 namespace { | |
19 | |
20 class ChromeStringCanonicalizer : public StringCanonicalizer { | |
21 public: | |
22 ChromeStringCanonicalizer() | |
23 : error_code_(U_ZERO_ERROR), | |
24 collator_( | |
25 icu::Collator::createInstance( | |
26 icu::Locale::getRoot(), error_code_)) { | |
27 collator_->setStrength(icu::Collator::PRIMARY); | |
28 DCHECK(U_SUCCESS(error_code_)); | |
29 } | |
30 | |
31 virtual ~ChromeStringCanonicalizer() {} | |
32 | |
33 // StringCanonicalizer implementation. | |
34 virtual std::string CanonicalizeString(const std::string& original) { | |
35 // Returns a canonical version of the string that can be used for comparing | |
36 // strings regardless of diacritics and capitalization. | |
37 // CanonicalizeString("Texas") == CanonicalizeString("T\u00E9xas"); | |
38 // CanonicalizeString("Texas") == CanonicalizeString("teXas"); | |
39 // CanonicalizeString("Texas") != CanonicalizeString("California"); | |
40 // | |
41 // The output is not human-readable. | |
42 // CanonicalizeString("Texas") != "Texas"; | |
43 icu::UnicodeString icu_str( | |
44 original.c_str(), static_cast<int32_t>(original.length())); | |
45 int32_t buffer_size = collator_->getSortKey(icu_str, NULL, 0); | |
46 scoped_ptr<uint8_t[]> buffer(new uint8_t[buffer_size]); | |
47 DCHECK(buffer.get()); | |
48 int32_t filled_size = | |
49 collator_->getSortKey(icu_str, buffer.get(), buffer_size); | |
50 DCHECK_EQ(buffer_size, filled_size); | |
51 return std::string(reinterpret_cast<const char*>(buffer.get())); | |
52 } | |
53 | |
54 private: | |
55 UErrorCode error_code_; | |
56 scoped_ptr<icu::Collator> collator_; | |
57 | |
58 DISALLOW_COPY_AND_ASSIGN(ChromeStringCanonicalizer); | |
59 }; | |
60 | |
61 } // namespace | |
62 | |
63 // static | |
64 scoped_ptr<StringCanonicalizer> StringCanonicalizer::Build() { | |
65 return scoped_ptr<StringCanonicalizer>(new ChromeStringCanonicalizer); | |
66 } | |
67 | |
68 } // namespace addressinput | |
69 } // namespace i18n | |
OLD | NEW |