OLD | NEW |
---|---|
1 // Copyright 2013 The Chromium Authors. All rights reserved. | 1 // Copyright 2013 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "components/autofill/core/browser/autofill_profile.h" | 5 #include "components/autofill/core/browser/autofill_profile.h" |
6 | 6 |
7 #include <algorithm> | 7 #include <algorithm> |
8 #include <functional> | 8 #include <functional> |
9 #include <map> | 9 #include <map> |
10 #include <memory> | 10 #include <memory> |
11 #include <ostream> | 11 #include <ostream> |
12 #include <set> | 12 #include <set> |
13 | 13 |
14 #include "base/guid.h" | 14 #include "base/guid.h" |
15 #include "base/i18n/case_conversion.h" | 15 #include "base/i18n/case_conversion.h" |
16 #include "base/i18n/char_iterator.h" | 16 #include "base/i18n/char_iterator.h" |
17 #include "base/logging.h" | 17 #include "base/logging.h" |
18 #include "base/macros.h" | 18 #include "base/macros.h" |
19 #include "base/metrics/histogram_macros.h" | 19 #include "base/metrics/histogram_macros.h" |
20 #include "base/sha1.h" | 20 #include "base/sha1.h" |
21 #include "base/strings/string_util.h" | 21 #include "base/strings/string_util.h" |
22 #include "base/strings/utf_string_conversion_utils.h" | 22 #include "base/strings/utf_string_conversion_utils.h" |
23 #include "base/strings/utf_string_conversions.h" | 23 #include "base/strings/utf_string_conversions.h" |
24 #include "components/autofill/core/browser/address.h" | 24 #include "components/autofill/core/browser/address.h" |
25 #include "components/autofill/core/browser/address_i18n.h" | 25 #include "components/autofill/core/browser/address_i18n.h" |
26 #include "components/autofill/core/browser/autofill_country.h" | 26 #include "components/autofill/core/browser/autofill_country.h" |
27 #include "components/autofill/core/browser/autofill_field.h" | 27 #include "components/autofill/core/browser/autofill_field.h" |
28 #include "components/autofill/core/browser/autofill_metrics.h" | 28 #include "components/autofill/core/browser/autofill_metrics.h" |
29 #include "components/autofill/core/browser/autofill_profile_comparator.h" | |
29 #include "components/autofill/core/browser/autofill_type.h" | 30 #include "components/autofill/core/browser/autofill_type.h" |
30 #include "components/autofill/core/browser/contact_info.h" | 31 #include "components/autofill/core/browser/contact_info.h" |
31 #include "components/autofill/core/browser/phone_number.h" | 32 #include "components/autofill/core/browser/phone_number.h" |
32 #include "components/autofill/core/browser/phone_number_i18n.h" | 33 #include "components/autofill/core/browser/phone_number_i18n.h" |
33 #include "components/autofill/core/browser/state_names.h" | 34 #include "components/autofill/core/browser/state_names.h" |
34 #include "components/autofill/core/browser/validation.h" | 35 #include "components/autofill/core/browser/validation.h" |
35 #include "components/autofill/core/common/autofill_l10n_util.h" | 36 #include "components/autofill/core/common/autofill_l10n_util.h" |
36 #include "components/autofill/core/common/form_field_data.h" | 37 #include "components/autofill/core/common/form_field_data.h" |
37 #include "grit/components_strings.h" | 38 #include "grit/components_strings.h" |
38 #include "third_party/icu/source/common/unicode/uchar.h" | 39 #include "third_party/icu/source/common/unicode/uchar.h" |
(...skipping 172 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
211 collapsed_set.insert(PHONE_HOME_WHOLE_NUMBER); | 212 collapsed_set.insert(PHONE_HOME_WHOLE_NUMBER); |
212 break; | 213 break; |
213 | 214 |
214 default: | 215 default: |
215 collapsed_set.insert(it); | 216 collapsed_set.insert(it); |
216 } | 217 } |
217 } | 218 } |
218 std::swap(*type_set, collapsed_set); | 219 std::swap(*type_set, collapsed_set); |
219 } | 220 } |
220 | 221 |
221 base::string16 NormalizeForComparison(const base::string16& text) { | |
222 using icu::UnicodeString; | |
223 using icu::Transliterator; | |
224 | |
225 // Use ICU transliteration to remove diacritics and fold case. | |
226 // See http://userguide.icu-project.org/transforms/general | |
227 UErrorCode status = U_ZERO_ERROR; | |
228 std::unique_ptr<Transliterator> transliterator(Transliterator::createInstance( | |
229 "NFD; [:Nonspacing Mark:] Remove; Lower; NFC", UTRANS_FORWARD, status)); | |
230 if (U_FAILURE(status) || transliterator == nullptr) { | |
231 LOG(ERROR) << "Failed to create ICU Transliterator: " | |
232 << u_errorName(status); | |
233 return text; | |
234 } | |
235 | |
236 UnicodeString value = UnicodeString(text.data(), text.length()); | |
237 transliterator->transliterate(value); | |
238 | |
239 return base::string16(value.getBuffer(), value.length()); | |
240 } | |
241 | |
242 } // namespace | 222 } // namespace |
243 | 223 |
244 AutofillProfile::AutofillProfile(const std::string& guid, | 224 AutofillProfile::AutofillProfile(const std::string& guid, |
245 const std::string& origin) | 225 const std::string& origin) |
246 : AutofillDataModel(guid, origin), | 226 : AutofillDataModel(guid, origin), |
247 record_type_(LOCAL_PROFILE), | 227 record_type_(LOCAL_PROFILE), |
248 phone_number_(this) { | 228 phone_number_(this) { |
249 } | 229 } |
250 | 230 |
251 AutofillProfile::AutofillProfile(RecordType type, const std::string& server_id) | 231 AutofillProfile::AutofillProfile(RecordType type, const std::string& server_id) |
(...skipping 534 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
786 server_id_ = base::SHA1HashString(contents_utf8); | 766 server_id_ = base::SHA1HashString(contents_utf8); |
787 } | 767 } |
788 | 768 |
789 void AutofillProfile::RecordAndLogUse() { | 769 void AutofillProfile::RecordAndLogUse() { |
790 UMA_HISTOGRAM_COUNTS_1000("Autofill.DaysSinceLastUse.Profile", | 770 UMA_HISTOGRAM_COUNTS_1000("Autofill.DaysSinceLastUse.Profile", |
791 (base::Time::Now() - use_date()).InDays()); | 771 (base::Time::Now() - use_date()).InDays()); |
792 RecordUse(); | 772 RecordUse(); |
793 } | 773 } |
794 | 774 |
795 // static | 775 // static |
796 base::string16 AutofillProfile::CanonicalizeProfileString( | 776 base::string16 AutofillProfile::CanonicalizeProfileString( |
Mathieu
2016/06/08 17:56:06
I think it makes sense to replace uses of Canonica
Roger McFarlane (Chromium)
2016/06/09 20:19:11
I'd prefer to do this in a follow-on CL, it touche
| |
797 const base::string16& str) { | 777 const base::string16& str) { |
798 base::string16 ret; | 778 AutofillProfileComparator comparator; |
799 ret.reserve(str.size()); | 779 return comparator.NormalizeForComparison(str); |
800 | |
801 // This algorithm is not designed to be perfect, we could get arbitrarily | |
802 // fancy here trying to canonicalize address lines. Instead, this is designed | |
803 // to handle common cases for all types of data (addresses and names) without | |
804 // the need of domain-specific logic. | |
805 // | |
806 // 1. Convert punctuation to spaces and normalize all whitespace to spaces. | |
807 // This will convert "Mid-Island Plz." -> "Mid Island Plz " (the trailing | |
808 // space will be trimmed off outside of the end of the loop). | |
809 // | |
810 // 2. Collapse consecutive punctuation/whitespace characters to a single | |
811 // space. We pretend the string has already started with whitespace in | |
812 // order to trim leading spaces. | |
813 // | |
814 // 3. Remove diacritics (accents and other non-spacing marks) and perform | |
815 // case folding to lower-case. | |
816 | |
817 bool previous_was_whitespace = true; | |
818 for (base::i18n::UTF16CharIterator iter(&str); !iter.end(); iter.Advance()) { | |
819 switch (u_charType(iter.get())) { | |
820 // Punctuation | |
821 case U_DASH_PUNCTUATION: | |
822 case U_START_PUNCTUATION: | |
823 case U_END_PUNCTUATION: | |
824 case U_CONNECTOR_PUNCTUATION: | |
825 case U_OTHER_PUNCTUATION: | |
826 // Whitespace | |
827 case U_CONTROL_CHAR: // To escape the '\n' character. | |
828 case U_SPACE_SEPARATOR: | |
829 case U_LINE_SEPARATOR: | |
830 case U_PARAGRAPH_SEPARATOR: | |
831 if (!previous_was_whitespace) { | |
832 ret.push_back(' '); | |
833 previous_was_whitespace = true; | |
834 } | |
835 break; | |
836 | |
837 default: | |
838 previous_was_whitespace = false; | |
839 base::WriteUnicodeCharacter(iter.get(), &ret); | |
840 break; | |
841 } | |
842 } | |
843 | |
844 // Trim off trailing whitespace if we left one. | |
845 if (previous_was_whitespace && !ret.empty()) | |
846 ret.resize(ret.size() - 1); | |
847 | |
848 // Remove diacritics and perform case folding. | |
849 return NormalizeForComparison(ret); | |
850 } | 780 } |
851 | 781 |
852 // static | 782 // static |
853 bool AutofillProfile::AreProfileStringsSimilar(const base::string16& a, | 783 bool AutofillProfile::AreProfileStringsSimilar(const base::string16& a, |
Mathieu
2016/06/08 17:56:06
Seems to be unused, remove
Roger McFarlane (Chromium)
2016/06/09 20:19:11
Done.
| |
854 const base::string16& b) { | 784 const base::string16& b) { |
855 return CanonicalizeProfileString(a) == CanonicalizeProfileString(b); | 785 AutofillProfileComparator compare; |
786 return compare.NormalizeForComparison(a) == compare.NormalizeForComparison(b); | |
856 } | 787 } |
857 | 788 |
858 void AutofillProfile::GetSupportedTypes( | 789 void AutofillProfile::GetSupportedTypes( |
859 ServerFieldTypeSet* supported_types) const { | 790 ServerFieldTypeSet* supported_types) const { |
860 FormGroupList info = FormGroups(); | 791 FormGroupList info = FormGroups(); |
861 for (const auto& it : info) { | 792 for (const auto& it : info) { |
862 it->GetSupportedTypes(supported_types); | 793 it->GetSupportedTypes(supported_types); |
863 } | 794 } |
864 } | 795 } |
865 | 796 |
(...skipping 218 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
1084 << " " << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_CITY)) << " " | 1015 << " " << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_CITY)) << " " |
1085 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_STATE)) << " " | 1016 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_STATE)) << " " |
1086 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_ZIP)) << " " | 1017 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_ZIP)) << " " |
1087 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_SORTING_CODE)) << " " | 1018 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_SORTING_CODE)) << " " |
1088 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_COUNTRY)) << " " | 1019 << UTF16ToUTF8(profile.GetRawInfo(ADDRESS_HOME_COUNTRY)) << " " |
1089 << profile.language_code() << " " | 1020 << profile.language_code() << " " |
1090 << UTF16ToUTF8(profile.GetRawInfo(PHONE_HOME_WHOLE_NUMBER)); | 1021 << UTF16ToUTF8(profile.GetRawInfo(PHONE_HOME_WHOLE_NUMBER)); |
1091 } | 1022 } |
1092 | 1023 |
1093 } // namespace autofill | 1024 } // namespace autofill |
OLD | NEW |