Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(681)

Side by Side Diff: components/autofill/core/common/autofill_regexes.cc

Issue 1453193002: autofill: switch autofill_regexes to RE2 library (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: input is UTF8 Created 5 years, 1 month ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « components/autofill/core/common/DEPS ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 // Copyright 2013 The Chromium Authors. All rights reserved. 1 // Copyright 2013 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #include "components/autofill/core/common/autofill_regexes.h" 5 #include "components/autofill/core/common/autofill_regexes.h"
6 6
7 #include "base/containers/scoped_ptr_hash_map.h" 7 #include "base/containers/scoped_ptr_hash_map.h"
8 #include "base/logging.h" 8 #include "base/logging.h"
9 #include "base/memory/scoped_ptr.h" 9 #include "base/memory/scoped_ptr.h"
10 #include "base/memory/singleton.h" 10 #include "base/memory/singleton.h"
11 #include "base/strings/string16.h" 11 #include "base/strings/string16.h"
12 #include "third_party/icu/source/i18n/unicode/regex.h" 12 #include "base/strings/utf_string_conversions.h"
13 #include "third_party/re2/re2/re2.h"
13 14
14 namespace { 15 namespace {
15 16
16 // A singleton class that serves as a cache of compiled regex patterns. 17 // A singleton class that serves as a cache of compiled regex patterns.
17 class AutofillRegexes { 18 class AutofillRegexes {
18 public: 19 public:
19 static AutofillRegexes* GetInstance(); 20 static AutofillRegexes* GetInstance();
20 21
21 // Returns the compiled regex matcher corresponding to |pattern|. 22 // Returns the compiled regex matcher corresponding to |pattern|.
22 icu::RegexMatcher* GetMatcher(const base::string16& pattern); 23 re2::RE2* GetMatcher(const base::string16& pattern);
Evan Stade 2015/11/23 16:38:39 can you make this return a const ref?
23 24
24 private: 25 private:
25 AutofillRegexes(); 26 AutofillRegexes();
26 ~AutofillRegexes(); 27 ~AutofillRegexes();
27 friend struct base::DefaultSingletonTraits<AutofillRegexes>; 28 friend struct base::DefaultSingletonTraits<AutofillRegexes>;
28 29
29 // Maps patterns to their corresponding regex matchers. 30 // Maps patterns to their corresponding regex matchers.
30 base::ScopedPtrHashMap<base::string16, scoped_ptr<icu::RegexMatcher>> 31 base::ScopedPtrHashMap<base::string16, scoped_ptr<re2::RE2>> matchers_;
31 matchers_;
32 32
33 DISALLOW_COPY_AND_ASSIGN(AutofillRegexes); 33 DISALLOW_COPY_AND_ASSIGN(AutofillRegexes);
34 }; 34 };
35 35
36 // static 36 // static
37 AutofillRegexes* AutofillRegexes::GetInstance() { 37 AutofillRegexes* AutofillRegexes::GetInstance() {
38 return base::Singleton<AutofillRegexes>::get(); 38 return base::Singleton<AutofillRegexes>::get();
39 } 39 }
40 40
41 AutofillRegexes::AutofillRegexes() { 41 AutofillRegexes::AutofillRegexes() {
42 } 42 }
43 43
44 AutofillRegexes::~AutofillRegexes() { 44 AutofillRegexes::~AutofillRegexes() {
45 } 45 }
46 46
47 icu::RegexMatcher* AutofillRegexes::GetMatcher(const base::string16& pattern) { 47 re2::RE2* AutofillRegexes::GetMatcher(const base::string16& pattern) {
Ilya Sherman 2015/11/20 22:27:59 Please either change this API to use std::string,
48 auto it = matchers_.find(pattern); 48 auto it = matchers_.find(pattern);
49 if (it == matchers_.end()) { 49 if (it == matchers_.end()) {
50 const icu::UnicodeString icu_pattern(pattern.data(), pattern.length()); 50 re2::RE2::Options options;
51 51 options.set_case_sensitive(false);
52 UErrorCode status = U_ZERO_ERROR; 52 scoped_ptr<re2::RE2> matcher(
53 scoped_ptr<icu::RegexMatcher> matcher( 53 new re2::RE2(base::UTF16ToUTF8(pattern), options));
54 new icu::RegexMatcher(icu_pattern, UREGEX_CASE_INSENSITIVE, status)); 54 DCHECK(matcher->ok());
55 DCHECK(U_SUCCESS(status));
56
57 auto result = matchers_.add(pattern, matcher.Pass()); 55 auto result = matchers_.add(pattern, matcher.Pass());
58 DCHECK(result.second); 56 DCHECK(result.second);
59 it = result.first; 57 it = result.first;
60 } 58 }
61 return it->second; 59 return it->second;
62 } 60 }
63 61
64 } // namespace 62 } // namespace
65 63
66 namespace autofill { 64 namespace autofill {
67 65
68 bool MatchesPattern(const base::string16& input, 66 bool MatchesPattern(const base::string16& input,
69 const base::string16& pattern) { 67 const base::string16& pattern) {
Ilya Sherman 2015/11/20 22:27:59 Please either change this API to use std::string f
tfarina 2015/11/25 17:20:23 Done. But if I'm not wrong from looking at the log
70 icu::RegexMatcher* matcher = 68 // TODO(isherman): Run performance tests to determine whether caching regex
71 AutofillRegexes::GetInstance()->GetMatcher(pattern); 69 // matchers is still useful now that we've switched from ICU to RE2.
72 icu::UnicodeString icu_input(input.data(), input.length()); 70 // http://crbug.com/470065
73 matcher->reset(icu_input); 71 re2::RE2* matcher = AutofillRegexes::GetInstance()->GetMatcher(pattern);
74 72 return re2::RE2::PartialMatch(base::UTF16ToUTF8(input), *matcher);
75 UErrorCode status = U_ZERO_ERROR;
76 UBool match = matcher->find(0, status);
77 DCHECK(U_SUCCESS(status));
78 return match == TRUE;
79 } 73 }
80 74
81 } // namespace autofill 75 } // namespace autofill
OLDNEW
« no previous file with comments | « components/autofill/core/common/DEPS ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698