Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(87)

Side by Side Diff: components/dom_distiller/core/distillable_page_detector.h

Issue 1405233009: Add a new distillability model for the new set of page features (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: merge depend | Created 5 years, 1 month ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLD | NEW
1 // Copyright 2015 The Chromium Authors. All rights reserved. 1 // Copyright 2015 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #ifndef COMPONENTS_DOM_DISTILLER_CORE_DISTILLABLE_PAGE_DETECTOR_H_ 5 #ifndef COMPONENTS_DOM_DISTILLER_CORE_DISTILLABLE_PAGE_DETECTOR_H_
6 #define COMPONENTS_DOM_DISTILLER_CORE_DISTILLABLE_PAGE_DETECTOR_H_ 6 #define COMPONENTS_DOM_DISTILLER_CORE_DISTILLABLE_PAGE_DETECTOR_H_
7 7
8 #include <vector> 8 #include <vector>
9 9
10 #include "base/memory/scoped_ptr.h" 10 #include "base/memory/scoped_ptr.h"
11 #include "components/dom_distiller/core/proto/adaboost.pb.h" 11 #include "components/dom_distiller/core/proto/adaboost.pb.h"
12 12
13 namespace dom_distiller { 13 namespace dom_distiller {
14 14
15 // DistillablePageDetector provides methods to identify whether or not a page is 15 // DistillablePageDetector provides methods to identify whether or not a page is
16 // likely to be distillable based on a vector of derived features (see 16 // likely to be distillable based on a vector of derived features (see
17 // dom_distiller::CalculateDerivedFeatures). It uses a simple AdaBoost-trained 17 // dom_distiller::CalculateDerivedFeatures). It uses a simple AdaBoost-trained
18 // model. 18 // model.
19 class DistillablePageDetector { 19 class DistillablePageDetector {
20 public: 20 public:
21 static const DistillablePageDetector* GetDefault(); 21 static const DistillablePageDetector* GetDefault();
22 static const DistillablePageDetector* GetNewDefault();
mdjones 2015/11/05 00:53:57 Nit: For now, use GetNewModel and later change it
wychen 2015/11/05 02:00:39 Done.
22 explicit DistillablePageDetector(scoped_ptr<AdaBoostProto> proto); 23 explicit DistillablePageDetector(scoped_ptr<AdaBoostProto> proto);
23 ~DistillablePageDetector(); 24 ~DistillablePageDetector();
24 25
25 // Returns true if the model classifies the vector of features as a 26 // Returns true if the model classifies the vector of features as a
26 // distillable page. 27 // distillable page.
27 bool Classify(const std::vector<double>& features) const; 28 bool Classify(const std::vector<double>& features) const;
28 29
29 double Score(const std::vector<double>& features) const; 30 double Score(const std::vector<double>& features) const;
30 double GetThreshold() const; 31 double GetThreshold() const;
31 private: 32 private:
32 scoped_ptr<AdaBoostProto> proto_; 33 scoped_ptr<AdaBoostProto> proto_;
33 double threshold_; 34 double threshold_;
34 DISALLOW_COPY_AND_ASSIGN(DistillablePageDetector); 35 DISALLOW_COPY_AND_ASSIGN(DistillablePageDetector);
35 }; 36 };
36 37
37 38
38 } // namespace dom_distiller 39 } // namespace dom_distiller
39 40
40 #endif // COMPONENTS_DOM_DISTILLER_CORE_DISTILLABLE_PAGE_DETECTOR_H_ 41 #endif // COMPONENTS_DOM_DISTILLER_CORE_DISTILLABLE_PAGE_DETECTOR_H_
OLD | NEW

Powered by Google App Engine
This is Rietveld 408576698