OLD | NEW |
---|---|
1 // Copyright 2013 The Chromium Authors. All rights reserved. | 1 // Copyright 2013 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "components/autofill/core/common/autofill_regexes.h" | 5 #include "components/autofill/core/common/autofill_regexes.h" |
6 | 6 |
7 #include "base/containers/scoped_ptr_hash_map.h" | 7 #include "base/containers/scoped_ptr_hash_map.h" |
8 #include "base/logging.h" | 8 #include "base/logging.h" |
9 #include "base/memory/scoped_ptr.h" | 9 #include "base/memory/scoped_ptr.h" |
10 #include "base/memory/singleton.h" | 10 #include "base/memory/singleton.h" |
11 #include "base/strings/string16.h" | 11 #include "base/strings/string16.h" |
12 #include "third_party/icu/source/i18n/unicode/regex.h" | 12 #include "base/strings/utf_string_conversions.h" |
13 #include "third_party/re2/re2/re2.h" | |
13 | 14 |
14 namespace { | 15 namespace { |
15 | 16 |
16 // A singleton class that serves as a cache of compiled regex patterns. | 17 // A singleton class that serves as a cache of compiled regex patterns. |
17 class AutofillRegexes { | 18 class AutofillRegexes { |
18 public: | 19 public: |
19 static AutofillRegexes* GetInstance(); | 20 static AutofillRegexes* GetInstance(); |
20 | 21 |
21 // Returns the compiled regex matcher corresponding to |pattern|. | 22 // Returns the compiled regex matcher corresponding to |pattern|. |
22 icu::RegexMatcher* GetMatcher(const base::string16& pattern); | 23 re2::RE2* GetMatcher(const base::string16& pattern); |
Evan Stade
2015/11/23 16:38:39
can you make this return a const ref?
| |
23 | 24 |
24 private: | 25 private: |
25 AutofillRegexes(); | 26 AutofillRegexes(); |
26 ~AutofillRegexes(); | 27 ~AutofillRegexes(); |
27 friend struct base::DefaultSingletonTraits<AutofillRegexes>; | 28 friend struct base::DefaultSingletonTraits<AutofillRegexes>; |
28 | 29 |
29 // Maps patterns to their corresponding regex matchers. | 30 // Maps patterns to their corresponding regex matchers. |
30 base::ScopedPtrHashMap<base::string16, scoped_ptr<icu::RegexMatcher>> | 31 base::ScopedPtrHashMap<base::string16, scoped_ptr<re2::RE2>> matchers_; |
31 matchers_; | |
32 | 32 |
33 DISALLOW_COPY_AND_ASSIGN(AutofillRegexes); | 33 DISALLOW_COPY_AND_ASSIGN(AutofillRegexes); |
34 }; | 34 }; |
35 | 35 |
36 // static | 36 // static |
37 AutofillRegexes* AutofillRegexes::GetInstance() { | 37 AutofillRegexes* AutofillRegexes::GetInstance() { |
38 return base::Singleton<AutofillRegexes>::get(); | 38 return base::Singleton<AutofillRegexes>::get(); |
39 } | 39 } |
40 | 40 |
41 AutofillRegexes::AutofillRegexes() { | 41 AutofillRegexes::AutofillRegexes() { |
42 } | 42 } |
43 | 43 |
44 AutofillRegexes::~AutofillRegexes() { | 44 AutofillRegexes::~AutofillRegexes() { |
45 } | 45 } |
46 | 46 |
47 icu::RegexMatcher* AutofillRegexes::GetMatcher(const base::string16& pattern) { | 47 re2::RE2* AutofillRegexes::GetMatcher(const base::string16& pattern) { |
Ilya Sherman
2015/11/20 22:27:59
Please either change this API to use std::string,
| |
48 auto it = matchers_.find(pattern); | 48 auto it = matchers_.find(pattern); |
49 if (it == matchers_.end()) { | 49 if (it == matchers_.end()) { |
50 const icu::UnicodeString icu_pattern(pattern.data(), pattern.length()); | 50 re2::RE2::Options options; |
51 | 51 options.set_case_sensitive(false); |
52 UErrorCode status = U_ZERO_ERROR; | 52 scoped_ptr<re2::RE2> matcher( |
53 scoped_ptr<icu::RegexMatcher> matcher( | 53 new re2::RE2(base::UTF16ToUTF8(pattern), options)); |
54 new icu::RegexMatcher(icu_pattern, UREGEX_CASE_INSENSITIVE, status)); | 54 DCHECK(matcher->ok()); |
55 DCHECK(U_SUCCESS(status)); | |
56 | |
57 auto result = matchers_.add(pattern, matcher.Pass()); | 55 auto result = matchers_.add(pattern, matcher.Pass()); |
58 DCHECK(result.second); | 56 DCHECK(result.second); |
59 it = result.first; | 57 it = result.first; |
60 } | 58 } |
61 return it->second; | 59 return it->second; |
62 } | 60 } |
63 | 61 |
64 } // namespace | 62 } // namespace |
65 | 63 |
66 namespace autofill { | 64 namespace autofill { |
67 | 65 |
68 bool MatchesPattern(const base::string16& input, | 66 bool MatchesPattern(const base::string16& input, |
69 const base::string16& pattern) { | 67 const base::string16& pattern) { |
Ilya Sherman
2015/11/20 22:27:59
Please either change this API to use std::string f
tfarina
2015/11/25 17:20:23
Done. But if I'm not wrong from looking at the log
| |
70 icu::RegexMatcher* matcher = | 68 // TODO(isherman): Run performance tests to determine whether caching regex |
71 AutofillRegexes::GetInstance()->GetMatcher(pattern); | 69 // matchers is still useful now that we've switched from ICU to RE2. |
72 icu::UnicodeString icu_input(input.data(), input.length()); | 70 // http://crbug.com/470065 |
73 matcher->reset(icu_input); | 71 re2::RE2* matcher = AutofillRegexes::GetInstance()->GetMatcher(pattern); |
74 | 72 return re2::RE2::PartialMatch(base::UTF16ToUTF8(input), *matcher); |
75 UErrorCode status = U_ZERO_ERROR; | |
76 UBool match = matcher->find(0, status); | |
77 DCHECK(U_SUCCESS(status)); | |
78 return match == TRUE; | |
79 } | 73 } |
80 | 74 |
81 } // namespace autofill | 75 } // namespace autofill |
OLD | NEW |