OLD | NEW |
1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2011 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 // | 4 // |
5 // PhishingTermFeatureExtractor handles computing term features from the text | 5 // PhishingTermFeatureExtractor handles computing term features from the text |
6 // of a web page for the client-side phishing detection model. To do this, it | 6 // of a web page for the client-side phishing detection model. To do this, it |
7 // takes a list of terms that appear in the model, and scans through the page | 7 // takes a list of terms that appear in the model, and scans through the page |
8 // text looking for them. Any terms that appear will cause a corresponding | 8 // text looking for them. Any terms that appear will cause a corresponding |
9 // features::kPageTerm feature to be added to the FeatureMap. | 9 // features::kPageTerm feature to be added to the FeatureMap. |
10 // | 10 // |
11 // To make it harder for a phisher to enumerate all of the relevant terms in | 11 // To make it harder for a phisher to enumerate all of the relevant terms in |
12 // the model, the terms are provided as SHA-256 hashes, rather than plain text. | 12 // the model, the terms are provided as SHA-256 hashes, rather than plain text. |
13 // | 13 // |
14 // There is one PhishingTermFeatureExtractor per RenderView. | 14 // There is one PhishingTermFeatureExtractor per RenderView. |
15 | 15 |
16 #ifndef CHROME_RENDERER_SAFE_BROWSING_PHISHING_TERM_FEATURE_EXTRACTOR_H_ | 16 #ifndef CHROME_RENDERER_SAFE_BROWSING_PHISHING_TERM_FEATURE_EXTRACTOR_H_ |
17 #define CHROME_RENDERER_SAFE_BROWSING_PHISHING_TERM_FEATURE_EXTRACTOR_H_ | 17 #define CHROME_RENDERER_SAFE_BROWSING_PHISHING_TERM_FEATURE_EXTRACTOR_H_ |
18 | 18 |
19 #include <string> | 19 #include <string> |
20 | 20 |
21 #include "base/basictypes.h" | 21 #include "base/basictypes.h" |
22 #include "base/callback.h" | 22 #include "base/callback.h" |
| 23 #include "base/containers/hash_tables.h" |
23 #include "base/containers/mru_cache.h" | 24 #include "base/containers/mru_cache.h" |
24 #include "base/hash_tables.h" | |
25 #include "base/memory/scoped_ptr.h" | 25 #include "base/memory/scoped_ptr.h" |
26 #include "base/memory/weak_ptr.h" | 26 #include "base/memory/weak_ptr.h" |
27 #include "base/string16.h" | 27 #include "base/string16.h" |
28 #include "base/strings/string_piece.h" | 28 #include "base/strings/string_piece.h" |
29 | 29 |
30 namespace safe_browsing { | 30 namespace safe_browsing { |
31 class FeatureExtractorClock; | 31 class FeatureExtractorClock; |
32 class FeatureMap; | 32 class FeatureMap; |
33 | 33 |
34 class PhishingTermFeatureExtractor { | 34 class PhishingTermFeatureExtractor { |
(...skipping 121 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
156 // Used in scheduling ExtractFeaturesWithTimeout tasks. | 156 // Used in scheduling ExtractFeaturesWithTimeout tasks. |
157 // These pointers are invalidated if extraction is cancelled. | 157 // These pointers are invalidated if extraction is cancelled. |
158 base::WeakPtrFactory<PhishingTermFeatureExtractor> weak_factory_; | 158 base::WeakPtrFactory<PhishingTermFeatureExtractor> weak_factory_; |
159 | 159 |
160 DISALLOW_COPY_AND_ASSIGN(PhishingTermFeatureExtractor); | 160 DISALLOW_COPY_AND_ASSIGN(PhishingTermFeatureExtractor); |
161 }; | 161 }; |
162 | 162 |
163 } // namespace safe_browsing | 163 } // namespace safe_browsing |
164 | 164 |
165 #endif // CHROME_RENDERER_SAFE_BROWSING_PHISHING_TERM_FEATURE_EXTRACTOR_H_ | 165 #endif // CHROME_RENDERER_SAFE_BROWSING_PHISHING_TERM_FEATURE_EXTRACTOR_H_ |
OLD | NEW |