Index: chrome/browser/ui/title_prefix_matcher.cc |
=================================================================== |
--- chrome/browser/ui/title_prefix_matcher.cc (revision 86295) |
+++ chrome/browser/ui/title_prefix_matcher.cc (working copy) |
@@ -1,117 +0,0 @@ |
-// Copyright (c) 2011 The Chromium Authors. All rights reserved. |
-// Use of this source code is governed by a BSD-style license that can be |
-// found in the LICENSE file. |
- |
-#include "chrome/browser/ui/title_prefix_matcher.h" |
- |
-#include "base/hash_tables.h" |
-#include "base/i18n/break_iterator.h" |
-#include "base/logging.h" |
-#include "base/utf_string_conversions.h" |
- |
-namespace { |
-// We use this value to identify that we have already seen the title associated |
-// to this value in the duplicate_titles hash_set, ans marked it as a duplicate. |
-const size_t kPreviouslySeenIndex = 0xFFFFFFFF; |
-} |
- |
-// static |
-const int TitlePrefixMatcher::kCommonCharsToShow = 2; |
-const size_t TitlePrefixMatcher::kMinElidingLength = |
- TitlePrefixMatcher::kCommonCharsToShow + 3; |
- |
-TitlePrefixMatcher::TitleInfo::TitleInfo( |
- const string16* title, const GURL& url, int caller_value) |
- : title(title), |
- url(url), |
- prefix_length(0), |
- caller_value(caller_value) { |
- DCHECK(title != NULL); |
-} |
- |
-TitlePrefixMatcher::TitleInfo::~TitleInfo() { |
-} |
- |
-// static |
-void TitlePrefixMatcher::CalculatePrefixLengths( |
- std::vector<TitleInfo>* title_infos) { |
- DCHECK(title_infos != NULL); |
- // This set will contain the indexes of the TitleInfo objects in the vector |
- // that have a duplicate. |
- base::hash_set<size_t> duplicate_titles; |
- // This map is used to identify duplicates by remembering the vector indexes |
- // we have seen with a given title string. The vector index is set to |
- // kPreviouslySeenIndex once we identified duplicates and placed their |
- // indices in duplicate_titles. |
- base::hash_map<string16, size_t> existing_title; |
- // We identify if there are identical titles upfront, |
- // because we don't want to remove prefixes for those at all. |
- // We do it as a separate pass so that we don't need to remove |
- // previously parsed titles when we find a duplicate title later on. |
- for (size_t i = 0; i < title_infos->size(); ++i) { |
- // We use pairs to test existence and insert in one shot. |
- std::pair<base::hash_map<string16, size_t>::iterator, bool> insert_result = |
- existing_title.insert(std::make_pair(*(*title_infos)[i].title, i)); |
- if (!insert_result.second) { |
- // insert_result.second is false when we insert a duplicate in the set. |
- // insert_result.first is a map iterator and thus |
- // insert_result.first->first is the string title key of the map. |
- DCHECK_EQ(*(*title_infos)[i].title, insert_result.first->first); |
- duplicate_titles.insert(i); |
- // insert_result.first->second is the value of the title index and if it's |
- // not kPreviouslySeenIndex yet, we must remember it as a duplicate too. |
- if (insert_result.first->second != kPreviouslySeenIndex) { |
- duplicate_titles.insert(insert_result.first->second); |
- insert_result.first->second = kPreviouslySeenIndex; |
- } |
- } |
- } |
- |
- // This next loop accumulates all the potential prefixes, |
- // and remember on which titles we saw them. |
- base::hash_map<string16, std::vector<size_t> > prefixes; |
- for (size_t i = 0; i < title_infos->size(); ++i) { |
- // Duplicate titles are not to be included in this process. |
- if (duplicate_titles.find(i) != duplicate_titles.end()) |
- continue; |
- const TitleInfo& title_info = (*title_infos)[i]; |
- const string16* title = title_info.title; |
- // We prefix the hostname at the beginning, so that we only group |
- // titles that are from the same hostname. |
- string16 hostname = ASCIIToUTF16(title_info.url.host()); |
- // We only create prefixes at word boundaries. |
- base::i18n::BreakIterator iter(title, |
- base::i18n::BreakIterator::BREAK_WORD); |
- // We ignore this title if we can't break it into words, or if it only |
- // contains a single word. |
- if (!iter.Init() || !iter.Advance()) |
- continue; |
- // We continue advancing even though we already advanced to the first |
- // word above, so that we can use iter.prev() to identify the end of the |
- // previous word and more easily ignore the last word while iterating. |
- while (iter.Advance()) { |
- if (iter.IsWord()) |
- prefixes[hostname + title->substr(0, iter.prev())].push_back(i); |
- } |
- } |
- |
- // Now we parse the map to find common prefixes |
- // and keep the largest per title. |
- for (base::hash_map<string16, std::vector<size_t> >::iterator iter = |
- prefixes.begin(); iter != prefixes.end(); ++iter) { |
- // iter->first is the prefix string, iter->second is a vector of indices. |
- if (iter->second.size() > 1) { |
- // We need to subtract the hostname size since we added it to the prefix. |
- const TitleInfo& first_title_info = (*title_infos)[iter->second[0]]; |
- DCHECK_GE(iter->first.size(), first_title_info.url.host().size()); |
- size_t prefix_length = iter->first.size() - |
- first_title_info.url.host().size(); |
- for (size_t i = 0; i < iter->second.size(); ++i){ |
- TitleInfo& title_info = (*title_infos)[iter->second[i]]; |
- DCHECK_EQ(first_title_info.url.host(), title_info.url.host()); |
- if (title_info.prefix_length < prefix_length) |
- title_info.prefix_length = prefix_length; |
- } |
- } |
- } |
-} |