Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(377)

Unified Diff: components/rappor/bloom_filter.cc

Issue 1090683003: Alternative Multi-dimensional Rappor (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: Use 64-bit shift Created 5 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « components/rappor/bloom_filter.h ('k') | components/rappor/bloom_filter_unittest.cc » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: components/rappor/bloom_filter.cc
diff --git a/components/rappor/bloom_filter.cc b/components/rappor/bloom_filter.cc
index 9ad8f3ca0ce9d68191e8896229dbf3d44c2e1fcc..6c6f65409151fa37f089a9bf86c4ea756c418756 100644
--- a/components/rappor/bloom_filter.cc
+++ b/components/rappor/bloom_filter.cc
@@ -9,6 +9,16 @@
namespace rappor {
+namespace {
+
+// Hashes |str| with CityHash64WithSeed under |seed| and returns the result
+// narrowed to uint32_t.
+uint32_t ComputeHash(const std::string& str, uint32_t seed) {
+  // CityHash is used because it is supported in Dremel. Many other hash
+  // functions, such as MD5, SHA1, or Murmur, would probably also work.
+  const auto full_hash = CityHash64WithSeed(str.data(), str.size(), seed);
+  // Explicit form of the conversion to the function's 32-bit return type.
+  return static_cast<uint32_t>(full_hash);
+}
+
+} // namespace
+
BloomFilter::BloomFilter(uint32_t bytes_size,
uint32_t hash_function_count,
uint32_t hash_seed_offset)
@@ -25,10 +35,7 @@ void BloomFilter::SetString(const std::string& str) {
bytes_[i] = 0;
}
for (size_t i = 0; i < hash_function_count_; ++i) {
- // Using CityHash here because we have support for it in Dremel. Many hash
- // functions, such as MD5, SHA1, or Murmur, would probably also work.
- uint32_t index =
- CityHash64WithSeed(str.data(), str.size(), hash_seed_offset_ + i);
+ uint32_t index = ComputeHash(str, hash_seed_offset_ + i);
// Note that the "bytes" are uint8_t, so they are always 8-bits.
uint32_t byte_index = (index / 8) % bytes_.size();
uint32_t bit_index = index % 8;
@@ -43,4 +50,23 @@ void BloomFilter::SetBytesForTesting(const ByteVector& bytes) {
}
}
+namespace internal {
+
+// Computes the Bloom filter bits for |str|, packed into a single uint64_t.
+//
+// |bytes_size| is the filter size in bytes; it must be at most 8 so that every
+// bit position fits in the result. One bit is set for each of the
+// |hash_function_count| hash functions, which are seeded consecutively
+// starting at |hash_seed_offset|. Returns 0 when the filter has no bits.
+uint64_t GetBloomBits(uint32_t bytes_size,
+                      uint32_t hash_function_count,
+                      uint32_t hash_seed_offset,
+                      const std::string& str) {
+  // Make sure result fits in uint64.
+  DCHECK_LE(bytes_size, 8u);
+  const uint32_t bits_size = bytes_size * 8;
+  // A zero-bit filter would make the modulo below divide by zero, which is
+  // undefined behavior; such a filter has no bits to set.
+  if (bits_size == 0)
+    return 0;
+  uint64_t output = 0;
+  for (uint32_t i = 0; i < hash_function_count; ++i) {
+    const uint32_t index = ComputeHash(str, hash_seed_offset + i);
+    // Shift a 64-bit one so that bit positions 32..63 are reachable.
+    output |= 1ULL << (index % bits_size);
+  }
+  return output;
+}
+
+} // namespace internal
+
} // namespace rappor
« no previous file with comments | « components/rappor/bloom_filter.h ('k') | components/rappor/bloom_filter_unittest.cc » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698