| OLD | NEW |
| (Empty) | |
| 1 // Copyright 2016 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. |
| 4 |
| 5 #include "components/translate/core/browser/translate_ranker.h" |
| 6 |
| 7 #include <cmath> |
| 8 |
| 9 #include "base/bind.h" |
| 10 #include "base/bind_helpers.h" |
| 11 #include "base/command_line.h" |
| 12 #include "base/metrics/histogram_macros.h" |
| 13 #include "base/profiler/scoped_tracker.h" |
| 14 #include "base/strings/string_util.h" |
| 15 #include "components/metrics/proto/translate_event.pb.h" |
| 16 #include "components/translate/core/browser/proto/translate_ranker_model.pb.h" |
| 17 #include "components/translate/core/browser/translate_download_manager.h" |
| 18 #include "components/translate/core/browser/translate_prefs.h" |
| 19 #include "components/translate/core/browser/translate_url_fetcher.h" |
| 20 #include "components/translate/core/common/translate_switches.h" |
| 21 |
| 22 namespace translate { |
| 23 |
| 24 namespace { |
| 25 |
| 26 typedef google::protobuf::Map<std::string, float> WeightMap; |
| 27 |
// Minimum model score at which a translation is offered.
constexpr double kTranslationOfferThreshold = 0.5;

// Parameters for model fetching.
constexpr char kTranslateRankerModelURL[] =
    "https://chromium-i18n.appspot.com/ssl-translate-ranker-model";
// Passed to TranslateURLFetcher::set_max_retry_on_5xx().
constexpr int kMaxRetryOn5xx = 3;
// Minutes to wait before a new download is attempted after a request was
// refused by the fetcher.
constexpr int kDownloadRefractoryPeriodMin = 15;

// Fallback key looked up in a weight map when the requested key is absent.
constexpr char kUnknown[] = "UNKNOWN";
| 36 |
// Outcome of an attempt to download and load the translate ranker model.
// These values are reported to UMA, so they must be kept in sync with the
// TranslateRankerModelStatus enum in histograms.xml.
enum ModelStatus {
  MODEL_STATUS_OK = 0,
  MODEL_STATUS_DOWNLOAD_THROTTLED = 1,
  MODEL_STATUS_DOWNLOAD_FAILED = 2,
  MODEL_STATUS_PARSE_FAILED = 3,
  MODEL_STATUS_VALIDATION_FAILED = 4,

  // Insert new values above this line.
  MODEL_STATUS_MAX
};
| 49 |
// Logistic function: maps any real |x| into the range [0, 1], with
// Sigmoid(0) == 0.5.
double Sigmoid(double x) {
  // Use the std-qualified overload; <cmath> is only guaranteed to declare
  // exp() inside namespace std.
  return 1.0 / (1.0 + std::exp(-x));
}
| 53 |
| 54 double ScoreComponent(const WeightMap& weights, const std::string& key) { |
| 55 WeightMap::const_iterator i = weights.find(base::ToLowerASCII(key)); |
| 56 if (i == weights.end()) |
| 57 i = weights.find(kUnknown); |
| 58 return i == weights.end() ? 0.0 : i->second; |
| 59 } |
| 60 |
| 61 GURL GetTranslateRankerURL() { |
| 62 base::CommandLine* command_line = base::CommandLine::ForCurrentProcess(); |
| 63 return GURL(command_line->HasSwitch(switches::kTranslateRankerModelURL) |
| 64 ? command_line->GetSwitchValueASCII( |
| 65 switches::kTranslateRankerModelURL) |
| 66 : kTranslateRankerModelURL); |
| 67 } |
| 68 |
| 69 void ReportModelStatus(ModelStatus model_status) { |
| 70 UMA_HISTOGRAM_ENUMERATION("Translate.Ranker.Model.Status", model_status, |
| 71 MODEL_STATUS_MAX); |
| 72 } |
| 73 |
| 74 } // namespace |
| 75 |
| 76 const base::Feature kTranslateRankerQuery{"TranslateRankerQuery", |
| 77 base::FEATURE_DISABLED_BY_DEFAULT}; |
| 78 |
| 79 const base::Feature kTranslateRankerEnforcement{ |
| 80 "TranslateRankerEnforcement", base::FEATURE_DISABLED_BY_DEFAULT}; |
| 81 |
| 82 const base::Feature kTranslateRankerLogging{"TranslateRankerLogging", |
| 83 base::FEATURE_DISABLED_BY_DEFAULT}; |
| 84 |
| 85 TranslateRanker::~TranslateRanker() {} |
| 86 |
| 87 // static |
| 88 bool TranslateRanker::IsEnabled() { |
| 89 return IsQueryEnabled() || IsEnforcementEnabled(); |
| 90 } |
| 91 |
| 92 // static |
| 93 bool TranslateRanker::IsLoggingEnabled() { |
| 94 return base::FeatureList::IsEnabled(kTranslateRankerLogging); |
| 95 } |
| 96 |
| 97 // static |
| 98 bool TranslateRanker::IsQueryEnabled() { |
| 99 return base::FeatureList::IsEnabled(kTranslateRankerQuery); |
| 100 } |
| 101 |
| 102 // static |
| 103 bool TranslateRanker::IsEnforcementEnabled() { |
| 104 return base::FeatureList::IsEnabled(kTranslateRankerEnforcement); |
| 105 } |
| 106 |
| 107 // static |
| 108 TranslateRanker* TranslateRanker::GetInstance() { |
| 109 return base::Singleton<TranslateRanker>::get(); |
| 110 } |
| 111 |
| 112 std::unique_ptr<TranslateRanker> TranslateRanker::CreateForTesting( |
| 113 const std::string& model_data) { |
| 114 std::unique_ptr<TranslateRanker> ranker(new TranslateRanker()); |
| 115 CHECK(ranker != nullptr); |
| 116 ranker->ParseModel(0, true, model_data); |
| 117 CHECK(ranker->model_ != nullptr); |
| 118 return ranker; |
| 119 } |
| 120 |
| 121 bool TranslateRanker::ShouldOfferTranslation( |
| 122 const TranslatePrefs& translate_prefs, |
| 123 const std::string& src_lang, |
| 124 const std::string& dst_lang) { |
| 125 // The ranker is a gate in the "show a translation prompt" flow. To retain |
| 126 // the pre-existing functionality, it defaults to returning true in the |
| 127 // absence of a model or if enforcement is disabled. As this is ranker is |
| 128 // subsumed into a more general assist ranker, this default will go away |
| 129 // (or become False). |
| 130 const bool kDefaultResponse = true; |
| 131 |
| 132 // If we don't have a model, request one and return the default. |
| 133 if (model_ == nullptr) { |
| 134 FetchModelData(); |
| 135 return kDefaultResponse; |
| 136 } |
| 137 |
| 138 DCHECK(model_->has_logistic_regression_model()); |
| 139 SCOPED_UMA_HISTOGRAM_TIMER("Translate.Ranker.Timer.ShouldOfferTranslation"); |
| 140 |
| 141 // TODO(rogerm): Remove ScopedTracker below once crbug.com/646711 is closed. |
| 142 tracked_objects::ScopedTracker tracking_profile( |
| 143 FROM_HERE_WITH_EXPLICIT_FUNCTION( |
| 144 "646711 translate::TranslateRanker::ShouldOfferTranslation")); |
| 145 |
| 146 const std::string& app_locale = |
| 147 TranslateDownloadManager::GetInstance()->application_locale(); |
| 148 const std::string& country = translate_prefs.GetCountry(); |
| 149 int accept_count = translate_prefs.GetTranslationAcceptedCount(src_lang); |
| 150 int decline_count = translate_prefs.GetTranslationDeniedCount(src_lang); |
| 151 int ignore_count = translate_prefs.GetTranslationIgnoredCount(src_lang); |
| 152 DVLOG(3) << "TranslateRanker: features=[" |
| 153 << "src_lang='" << src_lang << "', dst_lang='" << dst_lang |
| 154 << "', country='" << country << "', locale='" << app_locale |
| 155 << ", accept_count=" << accept_count |
| 156 << ", decline_count=" << decline_count |
| 157 << ", ignore_count=" << ignore_count << "]"; |
| 158 |
| 159 double score = CalculateScore(accept_count, decline_count, ignore_count, |
| 160 src_lang, dst_lang, app_locale, country); |
| 161 |
| 162 DVLOG(2) << "TranslateRanker Score: " << score; |
| 163 |
| 164 bool result = (score >= kTranslationOfferThreshold); |
| 165 |
| 166 UMA_HISTOGRAM_BOOLEAN("Translate.Ranker.QueryResult", result); |
| 167 |
| 168 return result; |
| 169 } |
| 170 |
| 171 TranslateRanker::TranslateRanker() {} |
| 172 |
| 173 double TranslateRanker::CalculateScore(int accept_count, |
| 174 int decline_count, |
| 175 int ignore_count, |
| 176 const std::string& src_lang, |
| 177 const std::string& dst_lang, |
| 178 const std::string& locale, |
| 179 const std::string& country) { |
| 180 SCOPED_UMA_HISTOGRAM_TIMER("Translate.Ranker.Timer.CalculateScore"); |
| 181 DCHECK(model_ != nullptr); |
| 182 DCHECK(model_->has_logistic_regression_model()); |
| 183 |
| 184 int total_count = accept_count + decline_count + ignore_count; |
| 185 double accept_ratio = |
| 186 (total_count == 0) ? 0.0 : (double(accept_count) / total_count); |
| 187 double decline_ratio = |
| 188 (total_count == 0) ? 0.0 : (double(decline_count) / total_count); |
| 189 double ignore_ratio = |
| 190 (total_count == 0) ? 0.0 : (double(ignore_count) / total_count); |
| 191 DVLOG(3) << "TranslateRanker: ratios=[" |
| 192 << ", accept_ratio=" << accept_ratio |
| 193 << ", decline_ratio=" << decline_ratio |
| 194 << ", ignore_ratio=" << ignore_ratio << "]"; |
| 195 |
| 196 const chrome_intelligence::TranslateRankerModel::LogisticRegressionModel& |
| 197 logit = model_->logistic_regression_model(); |
| 198 double dot_product = |
| 199 (accept_ratio * logit.accept_ratio_weight()) + |
| 200 (decline_ratio * logit.decline_ratio_weight()) + |
| 201 (ignore_ratio * logit.ignore_ratio_weight()) + |
| 202 (accept_count * logit.accept_count_weight()) + |
| 203 (decline_count * logit.decline_count_weight()) + |
| 204 (ignore_count * logit.ignore_count_weight()) + |
| 205 ScoreComponent(logit.source_language_weight(), src_lang) + |
| 206 ScoreComponent(logit.dest_language_weight(), dst_lang) + |
| 207 ScoreComponent(logit.country_weight(), country) + |
| 208 ScoreComponent(logit.locale_weight(), locale); |
| 209 return Sigmoid(dot_product + logit.bias()); |
| 210 } |
| 211 |
| 212 int TranslateRanker::GetModelVersion() const { |
| 213 return (model_ == nullptr) ? 0 : model_->version(); |
| 214 } |
| 215 |
| 216 void TranslateRanker::FetchModelData() { |
| 217 // Exit if the model has already been successfully loaded. |
| 218 if (model_ != nullptr) { |
| 219 return; |
| 220 } |
| 221 |
| 222 // Exit if the download has been throttled. |
| 223 if (base::Time::NowFromSystemTime() < next_earliest_download_time_) { |
| 224 return; |
| 225 } |
| 226 |
| 227 // Create the model fetcher if it does not exist. |
| 228 if (model_fetcher_ == nullptr) { |
| 229 model_fetcher_.reset(new TranslateURLFetcher(kFetcherId)); |
| 230 model_fetcher_->set_max_retry_on_5xx(kMaxRetryOn5xx); |
| 231 } |
| 232 |
| 233 // If a request is already in flight, do not issue a new one. |
| 234 if (model_fetcher_->state() == TranslateURLFetcher::REQUESTING) { |
| 235 DVLOG(2) << "TranslateRanker: Download complete or in progress."; |
| 236 return; |
| 237 } |
| 238 |
| 239 DVLOG(2) << "TranslateRanker: Downloading model..."; |
| 240 |
| 241 download_start_time_ = base::Time::Now(); |
| 242 bool result = model_fetcher_->Request( |
| 243 GetTranslateRankerURL(), |
| 244 base::Bind(&TranslateRanker::ParseModel, base::Unretained(this))); |
| 245 |
| 246 if (!result) { |
| 247 ReportModelStatus(MODEL_STATUS_DOWNLOAD_THROTTLED); |
| 248 next_earliest_download_time_ = |
| 249 base::Time::NowFromSystemTime() + |
| 250 base::TimeDelta::FromMinutes(kDownloadRefractoryPeriodMin); |
| 251 } |
| 252 } |
| 253 |
| 254 void TranslateRanker::ParseModel(int /* id */, |
| 255 bool success, |
| 256 const std::string& data) { |
| 257 UMA_HISTOGRAM_MEDIUM_TIMES("Translate.Ranker.Timer.DownloadModel", |
| 258 base::Time::Now() - download_start_time_); |
| 259 |
| 260 SCOPED_UMA_HISTOGRAM_TIMER("Translate.Ranker.Timer.ParseModel"); |
| 261 |
| 262 // We should not be here if the model has already been downloaded and parsed. |
| 263 DCHECK(model_ == nullptr); |
| 264 |
| 265 // On failure, we just abort. The TranslateRanker will retry on a subsequent |
| 266 // translation opportunity. The TranslateURLFetcher enforces a limit for |
| 267 // retried requests. |
| 268 if (!success) { |
| 269 ReportModelStatus(MODEL_STATUS_DOWNLOAD_FAILED); |
| 270 return; |
| 271 } |
| 272 |
| 273 // Create a new model instance, parse and validate the data, and move it over |
| 274 // to be used by the ranker. |
| 275 std::unique_ptr<chrome_intelligence::TranslateRankerModel> new_model( |
| 276 new chrome_intelligence::TranslateRankerModel()); |
| 277 |
| 278 bool is_parseable = new_model->ParseFromString(data); |
| 279 if (!is_parseable) { |
| 280 ReportModelStatus(MODEL_STATUS_PARSE_FAILED); |
| 281 return; |
| 282 } |
| 283 |
| 284 bool is_valid = new_model->has_logistic_regression_model(); |
| 285 if (!is_valid) { |
| 286 ReportModelStatus(MODEL_STATUS_VALIDATION_FAILED); |
| 287 return; |
| 288 } |
| 289 |
| 290 ReportModelStatus(MODEL_STATUS_OK); |
| 291 model_ = std::move(new_model); |
| 292 model_fetcher_.reset(); |
| 293 |
| 294 DVLOG(3) << "Successfully loaded model version " << GetModelVersion() << "."; |
| 295 } |
| 296 |
| 297 void TranslateRanker::FlushTranslateEvents( |
| 298 std::vector<metrics::TranslateEventProto>* translate_events) { |
| 299 if (IsLoggingEnabled()) { |
| 300 translate_events->swap(translate_events_cache_); |
| 301 translate_events_cache_.clear(); |
| 302 } |
| 303 } |
| 304 |
| 305 void TranslateRanker::RecordTranslateEvent( |
| 306 const metrics::TranslateEventProto& translate_event) { |
| 307 if (IsLoggingEnabled()) |
| 308 translate_events_cache_.push_back(translate_event); |
| 309 } |
| 310 |
| 311 } // namespace translate |
| OLD | NEW |