Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(36)

Side by Side Diff: net/disk_cache/simple/simple_index.cc

Issue 2918893002: evict larger entries first (Closed)
Patch Set: faster, cleaner, stronger, better Created 3 years, 6 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « net/disk_cache/simple/simple_experiment.cc ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLD NEW
1 // Copyright (c) 2013 The Chromium Authors. All rights reserved. 1 // Copyright (c) 2013 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #include "net/disk_cache/simple/simple_index.h" 5 #include "net/disk_cache/simple/simple_index.h"
6 6
7 #include <algorithm> 7 #include <algorithm>
8 #include <limits> 8 #include <limits>
9 #include <string> 9 #include <string>
10 #include <utility> 10 #include <utility>
11 11
12 #include "base/bind.h" 12 #include "base/bind.h"
13 #include "base/bind_helpers.h" 13 #include "base/bind_helpers.h"
14 #include "base/bits.h"
14 #include "base/files/file_enumerator.h" 15 #include "base/files/file_enumerator.h"
15 #include "base/files/file_util.h" 16 #include "base/files/file_util.h"
16 #include "base/logging.h" 17 #include "base/logging.h"
17 #include "base/message_loop/message_loop.h" 18 #include "base/message_loop/message_loop.h"
18 #include "base/metrics/field_trial.h" 19 #include "base/metrics/field_trial.h"
19 #include "base/numerics/safe_conversions.h" 20 #include "base/numerics/safe_conversions.h"
20 #include "base/pickle.h" 21 #include "base/pickle.h"
21 #include "base/strings/string_number_conversions.h" 22 #include "base/strings/string_number_conversions.h"
22 #include "base/strings/string_tokenizer.h" 23 #include "base/strings/string_tokenizer.h"
23 #include "base/task_runner.h" 24 #include "base/task_runner.h"
24 #include "base/time/time.h" 25 #include "base/time/time.h"
25 #include "base/trace_event/memory_usage_estimator.h" 26 #include "base/trace_event/memory_usage_estimator.h"
26 #include "net/base/net_errors.h" 27 #include "net/base/net_errors.h"
27 #include "net/disk_cache/simple/simple_entry_format.h" 28 #include "net/disk_cache/simple/simple_entry_format.h"
29 #include "net/disk_cache/simple/simple_experiment.h"
28 #include "net/disk_cache/simple/simple_histogram_macros.h" 30 #include "net/disk_cache/simple/simple_histogram_macros.h"
29 #include "net/disk_cache/simple/simple_index_delegate.h" 31 #include "net/disk_cache/simple/simple_index_delegate.h"
30 #include "net/disk_cache/simple/simple_index_file.h" 32 #include "net/disk_cache/simple/simple_index_file.h"
31 #include "net/disk_cache/simple/simple_synchronous_entry.h" 33 #include "net/disk_cache/simple/simple_synchronous_entry.h"
32 #include "net/disk_cache/simple/simple_util.h" 34 #include "net/disk_cache/simple/simple_util.h"
33 35
34 #if defined(OS_POSIX) 36 #if defined(OS_POSIX)
35 #include <sys/stat.h> 37 #include <sys/stat.h>
36 #include <sys/time.h> 38 #include <sys/time.h>
37 #endif 39 #endif
38 40
39 namespace { 41 namespace {
40 42
41 // How many milliseconds we delay writing the index to disk since the last cache 43 // How many milliseconds we delay writing the index to disk since the last cache
42 // operation has happened. 44 // operation has happened.
43 const int kWriteToDiskDelayMSecs = 20000; 45 const int kWriteToDiskDelayMSecs = 20000;
44 const int kWriteToDiskOnBackgroundDelayMSecs = 100; 46 const int kWriteToDiskOnBackgroundDelayMSecs = 100;
45 47
46 // Divides the cache space into this amount of parts to evict when only one part 48 // Divides the cache space into this amount of parts to evict when only one part
47 // is left. 49 // is left.
48 const uint32_t kEvictionMarginDivisor = 20; 50 const uint32_t kEvictionMarginDivisor = 20;
49 51
50 const uint32_t kBytesInKb = 1024; 52 const uint32_t kBytesInKb = 1024;
51 53
54 // Estimated bytes used above the size of the data itself.
55 static const int kEstimatedEntryOverhead = 512;
Maks Orlovich 2017/06/22 16:30:51 FWIW, GetEntrySize is the size of the file, not of
hubbe 2017/06/22 17:36:10 Updated comment.
56
52 } // namespace 57 } // namespace
53 58
54 namespace disk_cache { 59 namespace disk_cache {
55 60
56 EntryMetadata::EntryMetadata() 61 EntryMetadata::EntryMetadata()
57 : last_used_time_seconds_since_epoch_(0), 62 : last_used_time_seconds_since_epoch_(0),
58 entry_size_(0) { 63 entry_size_(0) {
59 } 64 }
60 65
61 EntryMetadata::EntryMetadata(base::Time last_used_time, 66 EntryMetadata::EntryMetadata(base::Time last_used_time,
(...skipping 240 matching lines...) Expand 10 before | Expand all | Expand 10 after
302 eviction_in_progress_ = true; 307 eviction_in_progress_ = true;
303 eviction_start_time_ = base::TimeTicks::Now(); 308 eviction_start_time_ = base::TimeTicks::Now();
304 SIMPLE_CACHE_UMA( 309 SIMPLE_CACHE_UMA(
305 MEMORY_KB, "Eviction.CacheSizeOnStart2", cache_type_, 310 MEMORY_KB, "Eviction.CacheSizeOnStart2", cache_type_,
306 static_cast<base::HistogramBase::Sample>(cache_size_ / kBytesInKb)); 311 static_cast<base::HistogramBase::Sample>(cache_size_ / kBytesInKb));
307 SIMPLE_CACHE_UMA( 312 SIMPLE_CACHE_UMA(
308 MEMORY_KB, "Eviction.MaxCacheSizeOnStart2", cache_type_, 313 MEMORY_KB, "Eviction.MaxCacheSizeOnStart2", cache_type_,
309 static_cast<base::HistogramBase::Sample>(max_size_ / kBytesInKb)); 314 static_cast<base::HistogramBase::Sample>(max_size_ / kBytesInKb));
310 315
311 // Flatten for sorting. 316 // Flatten for sorting.
312 std::vector<const std::pair<const uint64_t, EntryMetadata>*> entries; 317 typedef std::pair<const uint64_t, EntryMetadata> Entry;
318 typedef std::pair<uint64_t, const Entry*> SortHelper;
319 std::vector<SortHelper> entries;
313 entries.reserve(entries_set_.size()); 320 entries.reserve(entries_set_.size());
321 uint32_t now = (base::Time::Now() - base::Time::UnixEpoch()).InSeconds();
322 bool use_size = base::FeatureList::IsEnabled(kSimpleCacheEvictionWithSize);
314 for (EntrySet::const_iterator i = entries_set_.begin(); 323 for (EntrySet::const_iterator i = entries_set_.begin();
315 i != entries_set_.end(); ++i) { 324 i != entries_set_.end(); ++i) {
316 entries.push_back(&*i); 325 uint64_t sort_value = now - i->second.RawTimeForSorting();
326 if (use_size)
327 sort_value *= i->second.GetEntrySize() + kEstimatedEntryOverhead;
328 // Subtract so we don't need a custom comparator.
Maks Orlovich 2017/06/22 16:30:51 typo, s/comparitor/comparator/
hubbe 2017/06/22 17:36:10 Done.
329 entries.emplace_back(std::numeric_limits<uint64_t>::max() - sort_value,
330 &*i);
317 } 331 }
318 332
319 std::sort(entries.begin(), entries.end(), 333 // introselect algorithm:
320 [](const std::pair<const uint64_t, EntryMetadata>* a, 334 // Pick a pivot element, partition elements into elements
321 const std::pair<const uint64_t, EntryMetadata>* b) -> bool { 335 // smaller than the pivot and not smaller than pivot.
322 return a->second.RawTimeForSorting() < 336 // Then sum all the sizes from the "smaller" bucket. If it
323 b->second.RawTimeForSorting(); 337 // is still too large, then iterate again, but only consider
324 }); 338 // elements from the "smaller" bucket. If not, add all elements
339 // in the "smaller" bucket to the evict list.
340 // Then iterate again, to partition the "not smaller" bucket.
341 // If we go over 2 * log2(|entries|) iterations, resort to calling
342 // std::sort() to avoid N-squared worst case scenario.
343 uint64_t evicted_so_far_size = 0;
344 const uint64_t amount_to_evict = cache_size_ - low_watermark_;
345 std::vector<uint64_t> entry_hashes;
346 int loops = 2 * base::bits::Log2Ceiling(entries.size());
347 auto begin = entries.begin();
348 auto end = entries.end();
349 while (loops > 0 && evicted_so_far_size < amount_to_evict &&
350 end - begin >= 3) {
351 loops--;
325 352
326 // Remove as many entries from the index to get below |low_watermark_|, 353 // Select a pivot.
327 // collecting least recently used hashes into |entry_hashes|. 354 uint64_t tmp[3];
328 std::vector<uint64_t> entry_hashes; 355 tmp[0] = begin->first;
329 std::vector<const std::pair<const uint64_t, EntryMetadata>*>::iterator it = 356 tmp[1] = (end - 1)->first;
330 entries.begin(); 357 tmp[2] = (begin + (end - begin) / 2)->first;
331 uint64_t evicted_so_far_size = 0; 358 std::sort(tmp, tmp + 3);
332 while (evicted_so_far_size < cache_size_ - low_watermark_) { 359 uint64_t pivot = tmp[1];
333 DCHECK(it != entries.end()); 360
334 entry_hashes.push_back((*it)->first); 361 // Partition
335 evicted_so_far_size += (*it)->second.GetEntrySize(); 362 auto middle = std::partition(begin, end, [pivot](const SortHelper& entry) {
336 ++it; 363 return entry.first < pivot;
364 });
365 if (middle == end || middle == begin) {
366 // No progress will be made.
367 break;
368 }
369 uint64_t lt_sum = 0;
370 for (auto i = begin; i != middle; ++i)
371 lt_sum += i->second->second.GetEntrySize();
372
373 if (evicted_so_far_size + lt_sum > amount_to_evict) {
374 end = middle;
375 } else {
376 evicted_so_far_size += lt_sum;
377 for (auto i = begin; i != middle; ++i)
378 entry_hashes.push_back(i->second->first);
379
380 begin = middle;
381 }
382 }
383
384 if (end > begin && evicted_so_far_size < amount_to_evict) {
385 std::sort(begin, end);
386 for (auto i = begin; i < end; ++i) {
387 if (evicted_so_far_size > amount_to_evict)
Maks Orlovich 2017/06/22 16:30:51 >=, I think?
hubbe 2017/06/22 17:36:10 Done.
388 break;
389 evicted_so_far_size += i->second->second.GetEntrySize();
390 entry_hashes.push_back(i->second->first);
391 }
337 } 392 }
338 393
339 SIMPLE_CACHE_UMA(COUNTS, 394 SIMPLE_CACHE_UMA(COUNTS,
340 "Eviction.EntryCount", cache_type_, entry_hashes.size()); 395 "Eviction.EntryCount", cache_type_, entry_hashes.size());
341 SIMPLE_CACHE_UMA(TIMES, 396 SIMPLE_CACHE_UMA(TIMES,
342 "Eviction.TimeToSelectEntries", cache_type_, 397 "Eviction.TimeToSelectEntries", cache_type_,
343 base::TimeTicks::Now() - eviction_start_time_); 398 base::TimeTicks::Now() - eviction_start_time_);
344 SIMPLE_CACHE_UMA( 399 SIMPLE_CACHE_UMA(
345 MEMORY_KB, "Eviction.SizeOfEvicted2", cache_type_, 400 MEMORY_KB, "Eviction.SizeOfEvicted2", cache_type_,
346 static_cast<base::HistogramBase::Sample>( 401 static_cast<base::HistogramBase::Sample>(
(...skipping 167 matching lines...) Expand 10 before | Expand all | Expand 10 after
514 start - last_write_to_disk_); 569 start - last_write_to_disk_);
515 } 570 }
516 } 571 }
517 last_write_to_disk_ = start; 572 last_write_to_disk_ = start;
518 573
519 index_file_->WriteToDisk(reason, entries_set_, cache_size_, start, 574 index_file_->WriteToDisk(reason, entries_set_, cache_size_, start,
520 app_on_background_, base::Closure()); 575 app_on_background_, base::Closure());
521 } 576 }
522 577
523 } // namespace disk_cache 578 } // namespace disk_cache
OLD NEW
« no previous file with comments | « net/disk_cache/simple/simple_experiment.cc ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698