chrome/browser/safe_browsing/safe_browsing_store.cc - Issue 263833005: Knock out injected safe-browsing prefixes.

Unified Diff: chrome/browser/safe_browsing/safe_browsing_store.cc

Issue 263833005: Knock out injected safe-browsing prefixes. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: add ContainsBrowseUrl test. Created 6 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « chrome/browser/safe_browsing/safe_browsing_database_unittest.cc ('k') | chrome/browser/safe_browsing/safe_browsing_store_unittest.cc » ('j') | chrome/browser/safe_browsing/safe_browsing_store_unittest.cc » ('J')
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: chrome/browser/safe_browsing/safe_browsing_store.cc

diff --git a/chrome/browser/safe_browsing/safe_browsing_store.cc b/chrome/browser/safe_browsing/safe_browsing_store.cc

index e4c15e74b5da2bd9d9d38a2fed561f335f9b3303..b0f6a2a20d0f6134ba5bc834086afbdf5b80b490 100644

--- a/chrome/browser/safe_browsing/safe_browsing_store.cc

+++ b/chrome/browser/safe_browsing/safe_browsing_store.cc

@@ -7,6 +7,7 @@

#include <algorithm>

#include "base/logging.h"

+#include "base/metrics/histogram.h"

namespace {

@@ -88,6 +89,48 @@ void RemoveDeleted(ItemsT* items, const base::hash_set<int32>& del_set) {

items->erase(end_iter, items->end());

}

+// Remove prefixes which are in the same chunk as their fullhash. Adding such

+// prefixes was a mistake in earlier implementations.

+template <typename HashesT, typename PrefixesT>

+size_t KnockoutPrefixVolunteers(const HashesT& full_hashes,

+ PrefixesT* prefixes) {

+ typename PrefixesT::iterator prefixes_process = prefixes->begin();

+ typename PrefixesT::iterator prefixes_out = prefixes->begin();

+ typename HashesT::const_iterator hashes_process = full_hashes.begin();

+ size_t skipped_count = 0;

+ while (hashes_process != full_hashes.end()) {

+ // Scan prefixes forward until an item is not less than the current hash.

+ while (prefixes_process != prefixes->end() &&

+ SBAddPrefixLess(*prefixes_process, *hashes_process)) {

+ if (prefixes_process != prefixes_out) {

+ *prefixes_out = *prefixes_process;

+ }

+ prefixes_out++;

+ prefixes_process++;

+ }

+ // If the current hash is also not less than the prefix, that implies they

+ // are equal. Skip the prefix.

+ if (prefixes_process != prefixes->end() &&

+ !SBAddPrefixLess(*hashes_process, *prefixes_process)) {

+ skipped_count++;

+ prefixes_process++;

+ }

+ hashes_process++;

+ }

+ // If any prefixes were skipped, copy over the tail and erase the excess.

+ if (prefixes_process != prefixes_out) {

+ prefixes_out = std::copy(prefixes_process, prefixes->end(), prefixes_out);

+ prefixes->erase(prefixes_out, prefixes->end());

+ }

+ return skipped_count;

+}

} // namespace

void SBProcessSubs(SBAddPrefixes* add_prefixes,

@@ -111,6 +154,17 @@ void SBProcessSubs(SBAddPrefixes* add_prefixes,

DCHECK(sorted(sub_full_hashes->begin(), sub_full_hashes->end(),

SBAddPrefixHashLess<SBSubFullHash,SBSubFullHash>));

+ // Earlier database code added prefixes when it saw fullhashes. The protocol

+ // should never send a chunk of mixed prefixes and fullhashes; the following

+ // removes any such cases that are seen.

+ // TODO(shess): Remove this code once most databases have been processed.

+ // Chunk churn should clean up anyone left over. This only takes a few ms to

+ // run through my current database, so it doesn't seem worthwhile to do much

+ // more than that.

+ size_t skipped = KnockoutPrefixVolunteers(*add_full_hashes, add_prefixes);

+ skipped += KnockoutPrefixVolunteers(*sub_full_hashes, sub_prefixes);

+ UMA_HISTOGRAM_COUNTS("SB2.VolunteerPrefixesRemoved", skipped);

// Factor out the prefix subs.

KnockoutSubs(sub_prefixes, add_prefixes,

SBAddPrefixLess<SBAddPrefix,SBSubPrefix>,