third_party/document_image_extractor/third_party/src/document_feature_extractor.js - Issue 1138123002: Update third_party/document_image_extractor

Unified Diff: third_party/document_image_extractor/third_party/src/document_feature_extractor.js

Issue 1138123002: Update third_party/document_image_extractor (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Created 5 years, 7 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « third_party/document_image_extractor/third_party/src/document_feature.js ('k') | third_party/document_image_extractor/third_party/src/document_image.js » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: third_party/document_image_extractor/third_party/src/document_feature_extractor.js

diff --git a/third_party/document_image_extractor/third_party/src/document_feature_extractor.js b/third_party/document_image_extractor/third_party/src/document_feature_extractor.js

deleted file mode 100644

index 200c93728f4008a98e5bf28c17f12a32d96368c1..0000000000000000000000000000000000000000

--- a/third_party/document_image_extractor/third_party/src/document_feature_extractor.js

+++ /dev/null

@@ -1,117 +0,0 @@

-goog.provide('image.collections.extension.DocumentFeatureExtractor');

-goog.require('goog.asserts');

-goog.require('image.collections.extension.DocumentFeature');

-goog.require('image.collections.extension.ElementFilter');

-goog.scope(function() {

-var DocumentFeature = image.collections.extension.DocumentFeature;

-var ElementFilter = image.collections.extension.ElementFilter;

-/**

- * A base class for document feature (title, snippet, image) extractors.

- * Each instance starts out with an empty list of element filters.

- * @constructor

- */

-image.collections.extension.DocumentFeatureExtractor = function() {

- /** @protected {!Array.<!ElementFilter>} */

- this.filters_ = [];

-};

-var DocumentFeatureExtractor =

- image.collections.extension.DocumentFeatureExtractor;

-/**

- * Installs an element filter by appending it to the end of this extractor's

- * filter list.

- * @param {!ElementFilter} filter Filter to add.

- * @protected

- */

-DocumentFeatureExtractor.prototype.addFilter = function(filter) {

- this.filters_.push(filter);

-};

-/**

- * Returns true iff an element passes all the filters.

- * @param {!Element} element

- * @return {boolean}

- */

-DocumentFeatureExtractor.prototype.filter = function(element) {

- for (var i = 0; i < this.filters_.length; ++i) {

- if (!this.filters_[i].filter(element)) {

- return false;

- }

- return true;

-};

-/**

- * Given an HTML document, returns a feature with a highest relevance value.

- * TODO(busaryev): look at the mean, median relevance etc.

- * @param {!Document} doc HTML document.

- * @return {DocumentFeature}

- */

-DocumentFeatureExtractor.prototype.extractBestFromDocument = function(doc) {

- var features = this.extractAllFromDocument(doc);

- if (features.length == 0) return null;

- var best = features[0];

- for (var i = 1; i < features.length; ++i) {

- var feature = features[i];

- if (feature.getRelevance() > best.getRelevance()) {

- best = feature;

- }

- return best;

-};

-/**

- * Given an HTML document, returns an array of features extracted from it.

- * By default, this function tries to extract a feature from every DOM element.

- * Derived classes may override this function to look at a subset of DOM (e.g.

- * only <meta> and <link> elements).

- * This base implementation does not sort: it returns the result of

- * extractFromNodeList() over all elements of the document unchanged.

- * NOTE(review): confirm whether overriding classes are expected to return

- * the features sorted by relevance.

- * @param {!Document} doc HTML document.

- * @return {!Array.<!DocumentFeature>}

- */

-DocumentFeatureExtractor.prototype.extractAllFromDocument = function(doc) {

- return this.extractFromNodeList(doc.getElementsByTagName('*'));

-};

-/**

- * This function tries to extract a feature from every node in a nodelist

- * and returns an array of features.

- * @param {!NodeList} nodeList DOM node list.

- * @param {!Object=} opt_context Optional context.

- * @return {!Array.<!DocumentFeature>}

- */

-DocumentFeatureExtractor.prototype.extractFromNodeList = function(

- nodeList, opt_context) {

- goog.asserts.assert(goog.isArrayLike(nodeList));

- var result = [];

- var nodeListLength = nodeList.length;

- for (var j = 0; j < nodeListLength; ++j) {

- var feature = this.extractFromElement(nodeList[j], opt_context);

- if (feature) {

- result.push(feature);

- }

- return result;

-};

-/**

- * This function extracts a feature from an HTML element. It should be

- * overridden in derived classes, unless the feature can be extracted without

- * looking at DOM.

- * The base implementation ignores both arguments and always returns null.

- * @param {!Element} element HTML element.

- * @param {!Object=} opt_context Optional context.

- * @return {DocumentFeature} The extracted feature; always null in this base

- *     class.

- */

-DocumentFeatureExtractor.prototype.extractFromElement = function(

- element, opt_context) {

- return null;

-};

-}); // goog.scope