Chromium Code Reviews

| OLD | NEW |
|---|---|
| 1 // Copyright 2013 The Chromium Authors. All rights reserved. | 1 // Copyright 2013 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #include "components/autofill/core/common/autofill_regexes.h" | 5 #include "components/autofill/core/common/autofill_regexes.h" |
| 6 | 6 |
| 7 #include "base/containers/scoped_ptr_hash_map.h" | 7 #include "base/containers/scoped_ptr_hash_map.h" |
| 8 #include "base/logging.h" | 8 #include "base/logging.h" |
| 9 #include "base/memory/scoped_ptr.h" | 9 #include "base/memory/scoped_ptr.h" |
| 10 #include "base/memory/singleton.h" | 10 #include "base/memory/singleton.h" |
| 11 #include "base/strings/string16.h" | 11 #include "base/strings/string16.h" |
| 12 #include "third_party/icu/source/i18n/unicode/regex.h" | 12 #include "base/strings/utf_string_conversions.h" |
| 13 #include "third_party/re2/re2/re2.h" | |
| 13 | 14 |
| 14 namespace { | 15 namespace { |
| 15 | 16 |
| 16 // A singleton class that serves as a cache of compiled regex patterns. | 17 // A singleton class that serves as a cache of compiled regex patterns. |
| 17 class AutofillRegexes { | 18 class AutofillRegexes { |
| 18 public: | 19 public: |
| 19 static AutofillRegexes* GetInstance(); | 20 static AutofillRegexes* GetInstance(); |
| 20 | 21 |
| 21 // Returns the compiled regex matcher corresponding to |pattern|. | 22 // Returns the compiled regex matcher corresponding to |pattern|. |
| 22 icu::RegexMatcher* GetMatcher(const base::string16& pattern); | 23 re2::RE2* GetMatcher(const base::string16& pattern); |
|
Evan Stade
2015/11/23 16:38:39
can you make this return a const ref?
| |
| 23 | 24 |
| 24 private: | 25 private: |
| 25 AutofillRegexes(); | 26 AutofillRegexes(); |
| 26 ~AutofillRegexes(); | 27 ~AutofillRegexes(); |
| 27 friend struct base::DefaultSingletonTraits<AutofillRegexes>; | 28 friend struct base::DefaultSingletonTraits<AutofillRegexes>; |
| 28 | 29 |
| 29 // Maps patterns to their corresponding regex matchers. | 30 // Maps patterns to their corresponding regex matchers. |
| 30 base::ScopedPtrHashMap<base::string16, scoped_ptr<icu::RegexMatcher>> | 31 base::ScopedPtrHashMap<base::string16, scoped_ptr<re2::RE2>> matchers_; |
| 31 matchers_; | |
| 32 | 32 |
| 33 DISALLOW_COPY_AND_ASSIGN(AutofillRegexes); | 33 DISALLOW_COPY_AND_ASSIGN(AutofillRegexes); |
| 34 }; | 34 }; |
| 35 | 35 |
| 36 // static | 36 // static |
| 37 AutofillRegexes* AutofillRegexes::GetInstance() { | 37 AutofillRegexes* AutofillRegexes::GetInstance() { |
| 38 return base::Singleton<AutofillRegexes>::get(); | 38 return base::Singleton<AutofillRegexes>::get(); |
| 39 } | 39 } |
| 40 | 40 |
| 41 AutofillRegexes::AutofillRegexes() { | 41 AutofillRegexes::AutofillRegexes() { |
| 42 } | 42 } |
| 43 | 43 |
| 44 AutofillRegexes::~AutofillRegexes() { | 44 AutofillRegexes::~AutofillRegexes() { |
| 45 } | 45 } |
| 46 | 46 |
| 47 icu::RegexMatcher* AutofillRegexes::GetMatcher(const base::string16& pattern) { | 47 re2::RE2* AutofillRegexes::GetMatcher(const base::string16& pattern) { |
|
Ilya Sherman
2015/11/20 22:27:59
Please either change this API to use std::string, […]
| |
| 48 auto it = matchers_.find(pattern); | 48 auto it = matchers_.find(pattern); |
| 49 if (it == matchers_.end()) { | 49 if (it == matchers_.end()) { |
| 50 const icu::UnicodeString icu_pattern(pattern.data(), pattern.length()); | 50 re2::RE2::Options options; |
| 51 | 51 options.set_case_sensitive(false); |
| 52 UErrorCode status = U_ZERO_ERROR; | 52 scoped_ptr<re2::RE2> matcher( |
| 53 scoped_ptr<icu::RegexMatcher> matcher( | 53 new re2::RE2(base::UTF16ToUTF8(pattern), options)); |
| 54 new icu::RegexMatcher(icu_pattern, UREGEX_CASE_INSENSITIVE, status)); | 54 DCHECK(matcher->ok()); |
| 55 DCHECK(U_SUCCESS(status)); | |
| 56 | |
| 57 auto result = matchers_.add(pattern, matcher.Pass()); | 55 auto result = matchers_.add(pattern, matcher.Pass()); |
| 58 DCHECK(result.second); | 56 DCHECK(result.second); |
| 59 it = result.first; | 57 it = result.first; |
| 60 } | 58 } |
| 61 return it->second; | 59 return it->second; |
| 62 } | 60 } |
| 63 | 61 |
| 64 } // namespace | 62 } // namespace |
| 65 | 63 |
| 66 namespace autofill { | 64 namespace autofill { |
| 67 | 65 |
| 68 bool MatchesPattern(const base::string16& input, | 66 bool MatchesPattern(const base::string16& input, |
| 69 const base::string16& pattern) { | 67 const base::string16& pattern) { |
|
Ilya Sherman
2015/11/20 22:27:59
Please either change this API to use std::string f[…]
tfarina
2015/11/25 17:20:23
Done. But if I'm not wrong from looking at the log[…]
| |
| 70 icu::RegexMatcher* matcher = | 68 // TODO(isherman): Run performance tests to determine whether caching regex |
| 71 AutofillRegexes::GetInstance()->GetMatcher(pattern); | 69 // matchers is still useful now that we've switched from ICU to RE2. |
| 72 icu::UnicodeString icu_input(input.data(), input.length()); | 70 // http://crbug.com/470065 |
| 73 matcher->reset(icu_input); | 71 re2::RE2* matcher = AutofillRegexes::GetInstance()->GetMatcher(pattern); |
| 74 | 72 return re2::RE2::PartialMatch(base::UTF16ToUTF8(input), *matcher); |
| 75 UErrorCode status = U_ZERO_ERROR; | |
| 76 UBool match = matcher->find(0, status); | |
| 77 DCHECK(U_SUCCESS(status)); | |
| 78 return match == TRUE; | |
| 79 } | 73 } |
| 80 | 74 |
| 81 } // namespace autofill | 75 } // namespace autofill |
| OLD | NEW |