Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(494)

Side by Side Diff: components/translate/core/browser/translate_ranker_impl.cc

Issue 2785493004: Integrate RankerModelLoader with TranslateRanker. (Closed)
Patch Set: fix bogus compile error Created 3 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
(Empty)
1 // Copyright 2016 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "components/translate/core/browser/translate_ranker_impl.h"
6
7 #include <cmath>
8
9 #include "base/bind.h"
10 #include "base/bind_helpers.h"
11 #include "base/command_line.h"
12 #include "base/files/file_path.h"
13 #include "base/files/file_util.h"
14 #include "base/memory/ptr_util.h"
15 #include "base/metrics/histogram_macros.h"
16 #include "base/profiler/scoped_tracker.h"
17 #include "base/strings/string_number_conversions.h"
18 #include "base/strings/string_util.h"
19 #include "base/task_runner.h"
20 #include "base/threading/thread_task_runner_handle.h"
21 #include "components/metrics/proto/translate_event.pb.h"
22 #include "components/translate/core/browser/proto/ranker_model.pb.h"
23 #include "components/translate/core/browser/proto/translate_ranker_model.pb.h"
24 #include "components/translate/core/browser/ranker_model.h"
25 #include "components/translate/core/browser/translate_download_manager.h"
26 #include "components/translate/core/browser/translate_prefs.h"
27 #include "components/translate/core/browser/translate_url_fetcher.h"
28 #include "components/translate/core/common/translate_switches.h"
29 #include "components/variations/variations_associated_data.h"
30 #include "url/gurl.h"
31
32 namespace translate {
33
34 namespace {
35
36 using chrome_intelligence::RankerModel;
37 using chrome_intelligence::RankerModelProto;
38 using chrome_intelligence::TranslateRankerModel;
39
// Minimum score (inclusive) at which ShouldOfferTranslation() reports that a
// translation should be offered.
constexpr double kTranslationOfferThreshold = 0.5;

// File name appended to the data directory by GetModelPath().
constexpr char kTranslateRankerModelFileName[] = "Translate Ranker Model";
// Prefix handed to the RankerModelLoader when it is constructed.
constexpr char kUmaPrefix[] = "Translate.Ranker";
// Fallback key looked up by ScoreComponent() when a feature value has no
// dedicated weight.
constexpr char kUnknown[] = "UNKNOWN";
45
// Logistic function: maps any real |x| into the range [0, 1].
// Uses std::exp explicitly; <cmath> only guarantees the std:: overloads.
double Sigmoid(double x) {
  return 1.0 / (1.0 + std::exp(-x));
}
49
// Returns |numerator| / |denominator| as a double, or 0.0 when |denominator|
// is zero so that callers never divide by zero.
double SafeRatio(int numerator, int denominator) {
  if (denominator == 0)
    return 0.0;
  return static_cast<double>(numerator) / denominator;
}
53
54 double ScoreComponent(const google::protobuf::Map<std::string, float>& weights,
55 const std::string& key) {
56 auto i = weights.find(base::ToLowerASCII(key));
57 if (i == weights.end())
58 i = weights.find(kUnknown);
59 return i == weights.end() ? 0.0 : i->second;
60 }
61
62 RankerModelStatus ValidateModel(const RankerModel& model) {
63 if (model.proto().model_case() != RankerModelProto::kTranslate)
64 return RankerModelStatus::VALIDATION_FAILED;
65
66 if (model.proto().translate().model_revision_case() !=
67 TranslateRankerModel::kLogisticRegressionModel) {
68 return RankerModelStatus::INCOMPATIBLE;
69 }
70
71 return RankerModelStatus::OK;
72 }
73
74 } // namespace
75
76 const base::Feature kTranslateRankerQuery{"TranslateRankerQuery",
77 base::FEATURE_DISABLED_BY_DEFAULT};
78
79 const base::Feature kTranslateRankerEnforcement{
80 "TranslateRankerEnforcement", base::FEATURE_DISABLED_BY_DEFAULT};
81
82 const base::Feature kTranslateRankerLogging{"TranslateRankerLogging",
83 base::FEATURE_ENABLED_BY_DEFAULT};
84
85 TranslateRankerFeatures::TranslateRankerFeatures() {}
86
87 TranslateRankerFeatures::TranslateRankerFeatures(int accepted,
88 int denied,
89 int ignored,
90 const std::string& src,
91 const std::string& dst,
92 const std::string& cntry,
93 const std::string& locale)
94 : accepted_count(accepted),
95 denied_count(denied),
96 ignored_count(ignored),
97 total_count(accepted_count + denied_count + ignored_count),
98 src_lang(src),
99 dst_lang(dst),
100 country(cntry),
101 app_locale(locale),
102 accepted_ratio(SafeRatio(accepted_count, total_count)),
103 denied_ratio(SafeRatio(denied_count, total_count)),
104 ignored_ratio(SafeRatio(ignored_count, total_count)) {}
105
106 TranslateRankerFeatures::TranslateRankerFeatures(const TranslatePrefs& prefs,
107 const std::string& src,
108 const std::string& dst,
109 const std::string& locale)
110 : TranslateRankerFeatures(prefs.GetTranslationAcceptedCount(src),
111 prefs.GetTranslationDeniedCount(src),
112 prefs.GetTranslationIgnoredCount(src),
113 src,
114 dst,
115 prefs.GetCountry(),
116 locale) {}
117
118 TranslateRankerFeatures::~TranslateRankerFeatures() {}
119
120 void TranslateRankerFeatures::WriteTo(std::ostream& stream) const {
121 stream << "src_lang='" << src_lang << "', "
122 << "dst_lang='" << dst_lang << "', "
123 << "country='" << country << "', "
124 << "app_locale='" << app_locale << "', "
125 << "accept_count=" << accepted_count << ", "
126 << "denied_count=" << denied_count << ", "
127 << "ignored_count=" << ignored_count << ", "
128 << "total_count=" << total_count << ", "
129 << "accept_ratio=" << accepted_ratio << ", "
130 << "decline_ratio=" << denied_ratio << ", "
131 << "ignore_ratio=" << ignored_ratio;
132 }
133
134 TranslateRankerImpl::TranslateRankerImpl(const base::FilePath& model_path,
135 const GURL& model_url)
136 : is_logging_enabled_(
137 base::FeatureList::IsEnabled(kTranslateRankerLogging)),
138 is_query_enabled_(base::FeatureList::IsEnabled(kTranslateRankerQuery)),
139 is_enforcement_enabled_(
140 base::FeatureList::IsEnabled(kTranslateRankerEnforcement)),
141 weak_ptr_factory_(this) {
142 if (IsQueryEnabled() || IsEnforcementEnabled()) {
143 model_loader_ = base::MakeUnique<RankerModelLoader>(
144 base::Bind(&ValidateModel),
145 base::Bind(&TranslateRankerImpl::OnModelAvailable,
146 weak_ptr_factory_.GetWeakPtr()),
147 model_path, model_url, kUmaPrefix);
148 model_loader_->Start();
149 }
150 }
151
152 TranslateRankerImpl::~TranslateRankerImpl() {}
153
154 // static
155 base::FilePath TranslateRankerImpl::GetModelPath(
156 const base::FilePath& data_dir) {
157 if (data_dir.empty())
158 return base::FilePath();
159
160 // Otherwise, look for the file in data dir.
161 return data_dir.AppendASCII(kTranslateRankerModelFileName);
162 }
163
164 // static
165 GURL TranslateRankerImpl::GetModelURL() {
166 // Allow override of the ranker model URL from the command line.
167 std::string raw_url;
168 base::CommandLine* command_line = base::CommandLine::ForCurrentProcess();
169 if (command_line->HasSwitch(switches::kTranslateRankerModelURL)) {
170 raw_url =
171 command_line->GetSwitchValueASCII(switches::kTranslateRankerModelURL);
172 } else {
173 // Otherwise take the ranker model URL from the ranker query variation.
174 raw_url = variations::GetVariationParamValueByFeature(
175 kTranslateRankerQuery, switches::kTranslateRankerModelURL);
176 }
177
178 DVLOG(3) << switches::kTranslateRankerModelURL << " = " << raw_url;
179
180 return GURL(raw_url);
181 }
182
183 void TranslateRankerImpl::EnableLogging(bool value) {
184 is_logging_enabled_ = value;
185 }
186
187 bool TranslateRankerImpl::IsLoggingEnabled() {
188 return is_logging_enabled_;
189 }
190
191 bool TranslateRankerImpl::IsQueryEnabled() {
192 return is_query_enabled_;
193 }
194
195 bool TranslateRankerImpl::IsEnforcementEnabled() {
196 return is_enforcement_enabled_;
197 }
198
199 int TranslateRankerImpl::GetModelVersion() const {
200 return model_ ? model_->proto().translate().version() : 0;
201 }
202
203 bool TranslateRankerImpl::ShouldOfferTranslation(
204 const TranslatePrefs& translate_prefs,
205 const std::string& src_lang,
206 const std::string& dst_lang) {
207 DCHECK(sequence_checker_.CalledOnValidSequence());
208 // The ranker is a gate in the "show a translation prompt" flow. To retain
209 // the pre-existing functionality, it defaults to returning true in the
210 // absence of a model or if enforcement is disabled. As this is ranker is
211 // subsumed into a more general assist ranker, this default will go away
212 // (or become False).
213 const bool kDefaultResponse = true;
214
215 if (model_loader_)
216 model_loader_->NotifyOfRankerActivity();
217
218 // If we don't have a model, request one and return the default.
219 if (model_ == nullptr) {
220 return kDefaultResponse;
221 }
222
223 SCOPED_UMA_HISTOGRAM_TIMER("Translate.Ranker.Timer.ShouldOfferTranslation");
224
225 // TODO(rogerm): Remove ScopedTracker below once crbug.com/646711 is closed.
226 tracked_objects::ScopedTracker tracking_profile(
227 FROM_HERE_WITH_EXPLICIT_FUNCTION(
228 "646711 translate::TranslateRankerImpl::ShouldOfferTranslation"));
229
230 TranslateRankerFeatures features(
231 translate_prefs, src_lang, dst_lang,
232 TranslateDownloadManager::GetInstance()->application_locale());
233
234 double score = CalculateScore(features);
235
236 DVLOG(2) << "TranslateRankerImpl::ShouldOfferTranslation: "
237 << "Score = " << score << ", Features=[" << features << "]";
238
239 bool result = (score >= kTranslationOfferThreshold);
240
241 UMA_HISTOGRAM_BOOLEAN("Translate.Ranker.QueryResult", result);
242
243 return result;
244 }
245
246 double TranslateRankerImpl::CalculateScore(
247 const TranslateRankerFeatures& features) {
248 DCHECK(sequence_checker_.CalledOnValidSequence());
249 SCOPED_UMA_HISTOGRAM_TIMER("Translate.Ranker.Timer.CalculateScore");
250 DCHECK(model_ != nullptr);
251 const TranslateRankerModel::LogisticRegressionModel& logit =
252 model_->proto().translate().logistic_regression_model();
253
254 double dot_product =
255 (features.accepted_count * logit.accept_count_weight()) +
256 (features.denied_count * logit.decline_count_weight()) +
257 (features.ignored_count * logit.ignore_count_weight()) +
258 (features.accepted_ratio * logit.accept_ratio_weight()) +
259 (features.denied_ratio * logit.decline_ratio_weight()) +
260 (features.ignored_ratio * logit.ignore_ratio_weight()) +
261 ScoreComponent(logit.source_language_weight(), features.src_lang) +
262 ScoreComponent(logit.dest_language_weight(), features.dst_lang) +
263 ScoreComponent(logit.country_weight(), features.country) +
264 ScoreComponent(logit.locale_weight(), features.app_locale);
265
266 return Sigmoid(dot_product + logit.bias());
267 }
268
269 void TranslateRankerImpl::FlushTranslateEvents(
270 std::vector<metrics::TranslateEventProto>* events) {
271 DCHECK(sequence_checker_.CalledOnValidSequence());
272 DVLOG(3) << "Flushing translate ranker events.";
273 events->swap(event_cache_);
274 event_cache_.clear();
275 }
276
277 void TranslateRankerImpl::AddTranslateEvent(
278 const metrics::TranslateEventProto& event) {
279 DCHECK(sequence_checker_.CalledOnValidSequence());
280 if (IsLoggingEnabled()) {
281 DVLOG(3) << "Adding translate ranker event.";
282 event_cache_.push_back(event);
283 }
284 }
285
286 void TranslateRankerImpl::OnModelAvailable(std::unique_ptr<RankerModel> model) {
287 DCHECK(sequence_checker_.CalledOnValidSequence());
288 model_ = std::move(model);
289 }
290
291 bool TranslateRankerImpl::CheckModelLoaderForTesting() {
292 return model_loader_ != nullptr;
293 }
294
295 } // namespace translate
296
297 std::ostream& operator<<(std::ostream& stream,
298 const translate::TranslateRankerFeatures& features) {
299 features.WriteTo(stream);
300 return stream;
301 }
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698