Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(76)

Side by Side Diff: chrome/browser/speech/tts_controller.cc

Issue 412783002: Separate out the TtsController interface from it's impl (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: Created 6 years, 5 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
(Empty)
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "chrome/browser/speech/tts_controller.h"
6
7 #include <string>
8 #include <vector>
9
10 #include "base/float_util.h"
11 #include "base/values.h"
12 #include "chrome/browser/browser_process.h"
13 #include "chrome/browser/speech/tts_platform.h"
14
15 namespace {
16 // A value to be used to indicate that there is no char index available.
17 const int kInvalidCharIndex = -1;
18
19 // Given a language/region code of the form 'fr-FR', returns just the basic
20 // language portion, e.g. 'fr'.
21 std::string TrimLanguageCode(std::string lang) {
22 if (lang.size() >= 5 && lang[2] == '-')
23 return lang.substr(0, 2);
24 else
25 return lang;
26 }
27
28 } // namespace
29
30 bool IsFinalTtsEventType(TtsEventType event_type) {
31 return (event_type == TTS_EVENT_END ||
32 event_type == TTS_EVENT_INTERRUPTED ||
33 event_type == TTS_EVENT_CANCELLED ||
34 event_type == TTS_EVENT_ERROR);
35 }
36
37 //
38 // UtteranceContinuousParameters
39 //
40
41
42 UtteranceContinuousParameters::UtteranceContinuousParameters()
43 : rate(-1),
44 pitch(-1),
45 volume(-1) {}
46
47
48 //
49 // VoiceData
50 //
51
52
53 VoiceData::VoiceData()
54 : gender(TTS_GENDER_NONE),
55 remote(false),
56 native(false) {}
57
58 VoiceData::~VoiceData() {}
59
60
61 //
62 // Utterance
63 //
64
65 // static
66 int Utterance::next_utterance_id_ = 0;
67
68 Utterance::Utterance(Profile* profile)
69 : profile_(profile),
70 id_(next_utterance_id_++),
71 src_id_(-1),
72 gender_(TTS_GENDER_NONE),
73 can_enqueue_(false),
74 char_index_(0),
75 finished_(false) {
76 options_.reset(new base::DictionaryValue());
77 }
78
79 Utterance::~Utterance() {
80 DCHECK(finished_);
81 }
82
83 void Utterance::OnTtsEvent(TtsEventType event_type,
84 int char_index,
85 const std::string& error_message) {
86 if (char_index >= 0)
87 char_index_ = char_index;
88 if (IsFinalTtsEventType(event_type))
89 finished_ = true;
90
91 if (event_delegate_)
92 event_delegate_->OnTtsEvent(this, event_type, char_index, error_message);
93 if (finished_)
94 event_delegate_.reset();
95 }
96
97 void Utterance::Finish() {
98 finished_ = true;
99 }
100
101 void Utterance::set_options(const base::Value* options) {
102 options_.reset(options->DeepCopy());
103 }
104
105 //
106 // TtsController
107 //
108
109 // static
110 TtsController* TtsController::GetInstance() {
111 return Singleton<TtsController>::get();
112 }
113
114 TtsController::TtsController()
115 : current_utterance_(NULL),
116 paused_(false),
117 platform_impl_(NULL),
118 tts_engine_delegate_(NULL) {
119 }
120
121 TtsController::~TtsController() {
122 if (current_utterance_) {
123 current_utterance_->Finish();
124 delete current_utterance_;
125 }
126
127 // Clear any queued utterances too.
128 ClearUtteranceQueue(false); // Don't sent events.
129 }
130
131 void TtsController::SpeakOrEnqueue(Utterance* utterance) {
132 // If we're paused and we get an utterance that can't be queued,
133 // flush the queue but stay in the paused state.
134 if (paused_ && !utterance->can_enqueue()) {
135 Stop();
136 paused_ = true;
137 return;
138 }
139
140 if (paused_ || (IsSpeaking() && utterance->can_enqueue())) {
141 utterance_queue_.push(utterance);
142 } else {
143 Stop();
144 SpeakNow(utterance);
145 }
146 }
147
148 void TtsController::SpeakNow(Utterance* utterance) {
149 // Ensure we have all built-in voices loaded. This is a no-op if already
150 // loaded.
151 bool loaded_built_in =
152 GetPlatformImpl()->LoadBuiltInTtsExtension(utterance->profile());
153
154 // Get all available voices and try to find a matching voice.
155 std::vector<VoiceData> voices;
156 GetVoices(utterance->profile(), &voices);
157 int index = GetMatchingVoice(utterance, voices);
158
159 VoiceData voice;
160 if (index != -1) {
161 // Select the matching voice.
162 voice = voices[index];
163 } else {
164 // However, if no match was found on a platform without native tts voices,
165 // attempt to get a voice based only on the current locale without respect
166 // to any supplied voice names.
167 std::vector<VoiceData> native_voices;
168
169 if (GetPlatformImpl()->PlatformImplAvailable())
170 GetPlatformImpl()->GetVoices(&native_voices);
171
172 if (native_voices.empty() && !voices.empty()) {
173 // TODO(dtseng): Notify extension caller of an error.
174 utterance->set_voice_name("");
175 // TODO(gaochun): Replace the global variable g_browser_process with
176 // GetContentClient()->browser() to eliminate the dependency of browser
177 // once TTS implementation was moved to content.
178 utterance->set_lang(g_browser_process->GetApplicationLocale());
179 index = GetMatchingVoice(utterance, voices);
180
181 // If even that fails, just take the first available voice.
182 if (index == -1)
183 index = 0;
184 voice = voices[index];
185 } else {
186 // Otherwise, simply give native voices a chance to handle this utterance.
187 voice.native = true;
188 }
189 }
190
191 GetPlatformImpl()->WillSpeakUtteranceWithVoice(utterance, voice);
192
193 if (!voice.native) {
194 #if !defined(OS_ANDROID)
195 DCHECK(!voice.extension_id.empty());
196 current_utterance_ = utterance;
197 utterance->set_extension_id(voice.extension_id);
198 if (tts_engine_delegate_)
199 tts_engine_delegate_->Speak(utterance, voice);
200 bool sends_end_event =
201 voice.events.find(TTS_EVENT_END) != voice.events.end();
202 if (!sends_end_event) {
203 utterance->Finish();
204 delete utterance;
205 current_utterance_ = NULL;
206 SpeakNextUtterance();
207 }
208 #endif
209 } else {
210 // It's possible for certain platforms to send start events immediately
211 // during |speak|.
212 current_utterance_ = utterance;
213 GetPlatformImpl()->clear_error();
214 bool success = GetPlatformImpl()->Speak(
215 utterance->id(),
216 utterance->text(),
217 utterance->lang(),
218 voice,
219 utterance->continuous_parameters());
220 if (!success)
221 current_utterance_ = NULL;
222
223 // If the native voice wasn't able to process this speech, see if
224 // the browser has built-in TTS that isn't loaded yet.
225 if (!success && loaded_built_in) {
226 utterance_queue_.push(utterance);
227 return;
228 }
229
230 if (!success) {
231 utterance->OnTtsEvent(TTS_EVENT_ERROR, kInvalidCharIndex,
232 GetPlatformImpl()->error());
233 delete utterance;
234 return;
235 }
236 }
237 }
238
239 void TtsController::Stop() {
240 paused_ = false;
241 if (current_utterance_ && !current_utterance_->extension_id().empty()) {
242 #if !defined(OS_ANDROID)
243 if (tts_engine_delegate_)
244 tts_engine_delegate_->Stop(current_utterance_);
245 #endif
246 } else {
247 GetPlatformImpl()->clear_error();
248 GetPlatformImpl()->StopSpeaking();
249 }
250
251 if (current_utterance_)
252 current_utterance_->OnTtsEvent(TTS_EVENT_INTERRUPTED, kInvalidCharIndex,
253 std::string());
254 FinishCurrentUtterance();
255 ClearUtteranceQueue(true); // Send events.
256 }
257
258 void TtsController::Pause() {
259 paused_ = true;
260 if (current_utterance_ && !current_utterance_->extension_id().empty()) {
261 #if !defined(OS_ANDROID)
262 if (tts_engine_delegate_)
263 tts_engine_delegate_->Pause(current_utterance_);
264 #endif
265 } else if (current_utterance_) {
266 GetPlatformImpl()->clear_error();
267 GetPlatformImpl()->Pause();
268 }
269 }
270
271 void TtsController::Resume() {
272 paused_ = false;
273 if (current_utterance_ && !current_utterance_->extension_id().empty()) {
274 #if !defined(OS_ANDROID)
275 if (tts_engine_delegate_)
276 tts_engine_delegate_->Resume(current_utterance_);
277 #endif
278 } else if (current_utterance_) {
279 GetPlatformImpl()->clear_error();
280 GetPlatformImpl()->Resume();
281 } else {
282 SpeakNextUtterance();
283 }
284 }
285
286 void TtsController::OnTtsEvent(int utterance_id,
287 TtsEventType event_type,
288 int char_index,
289 const std::string& error_message) {
290 // We may sometimes receive completion callbacks "late", after we've
291 // already finished the utterance (for example because another utterance
292 // interrupted or we got a call to Stop). This is normal and we can
293 // safely just ignore these events.
294 if (!current_utterance_ || utterance_id != current_utterance_->id()) {
295 return;
296 }
297 current_utterance_->OnTtsEvent(event_type, char_index, error_message);
298 if (current_utterance_->finished()) {
299 FinishCurrentUtterance();
300 SpeakNextUtterance();
301 }
302 }
303
304 void TtsController::GetVoices(Profile* profile,
305 std::vector<VoiceData>* out_voices) {
306 #if !defined(OS_ANDROID)
307 if (profile && tts_engine_delegate_)
308 tts_engine_delegate_->GetVoices(profile, out_voices);
309 #endif
310
311 TtsPlatformImpl* platform_impl = GetPlatformImpl();
312 if (platform_impl) {
313 // Ensure we have all built-in voices loaded. This is a no-op if already
314 // loaded.
315 platform_impl->LoadBuiltInTtsExtension(profile);
316 if (platform_impl->PlatformImplAvailable())
317 platform_impl->GetVoices(out_voices);
318 }
319 }
320
321 bool TtsController::IsSpeaking() {
322 return current_utterance_ != NULL || GetPlatformImpl()->IsSpeaking();
323 }
324
325 void TtsController::FinishCurrentUtterance() {
326 if (current_utterance_) {
327 if (!current_utterance_->finished())
328 current_utterance_->OnTtsEvent(TTS_EVENT_INTERRUPTED, kInvalidCharIndex,
329 std::string());
330 delete current_utterance_;
331 current_utterance_ = NULL;
332 }
333 }
334
335 void TtsController::SpeakNextUtterance() {
336 if (paused_)
337 return;
338
339 // Start speaking the next utterance in the queue. Keep trying in case
340 // one fails but there are still more in the queue to try.
341 while (!utterance_queue_.empty() && !current_utterance_) {
342 Utterance* utterance = utterance_queue_.front();
343 utterance_queue_.pop();
344 SpeakNow(utterance);
345 }
346 }
347
348 void TtsController::RetrySpeakingQueuedUtterances() {
349 if (current_utterance_ == NULL && !utterance_queue_.empty())
350 SpeakNextUtterance();
351 }
352
353 void TtsController::ClearUtteranceQueue(bool send_events) {
354 while (!utterance_queue_.empty()) {
355 Utterance* utterance = utterance_queue_.front();
356 utterance_queue_.pop();
357 if (send_events)
358 utterance->OnTtsEvent(TTS_EVENT_CANCELLED, kInvalidCharIndex,
359 std::string());
360 else
361 utterance->Finish();
362 delete utterance;
363 }
364 }
365
366 void TtsController::SetPlatformImpl(
367 TtsPlatformImpl* platform_impl) {
368 platform_impl_ = platform_impl;
369 }
370
371 int TtsController::QueueSize() {
372 return static_cast<int>(utterance_queue_.size());
373 }
374
375 TtsPlatformImpl* TtsController::GetPlatformImpl() {
376 if (!platform_impl_)
377 platform_impl_ = TtsPlatformImpl::GetInstance();
378 return platform_impl_;
379 }
380
381 int TtsController::GetMatchingVoice(
382 const Utterance* utterance, std::vector<VoiceData>& voices) {
383 // Make two passes: the first time, do strict language matching
384 // ('fr-FR' does not match 'fr-CA'). The second time, do prefix
385 // language matching ('fr-FR' matches 'fr' and 'fr-CA')
386 for (int pass = 0; pass < 2; ++pass) {
387 for (size_t i = 0; i < voices.size(); ++i) {
388 const VoiceData& voice = voices[i];
389
390 if (!utterance->extension_id().empty() &&
391 utterance->extension_id() != voice.extension_id) {
392 continue;
393 }
394
395 if (!voice.name.empty() &&
396 !utterance->voice_name().empty() &&
397 voice.name != utterance->voice_name()) {
398 continue;
399 }
400 if (!voice.lang.empty() && !utterance->lang().empty()) {
401 std::string voice_lang = voice.lang;
402 std::string utterance_lang = utterance->lang();
403 if (pass == 1) {
404 voice_lang = TrimLanguageCode(voice_lang);
405 utterance_lang = TrimLanguageCode(utterance_lang);
406 }
407 if (voice_lang != utterance_lang) {
408 continue;
409 }
410 }
411 if (voice.gender != TTS_GENDER_NONE &&
412 utterance->gender() != TTS_GENDER_NONE &&
413 voice.gender != utterance->gender()) {
414 continue;
415 }
416
417 if (utterance->required_event_types().size() > 0) {
418 bool has_all_required_event_types = true;
419 for (std::set<TtsEventType>::const_iterator iter =
420 utterance->required_event_types().begin();
421 iter != utterance->required_event_types().end();
422 ++iter) {
423 if (voice.events.find(*iter) == voice.events.end()) {
424 has_all_required_event_types = false;
425 break;
426 }
427 }
428 if (!has_all_required_event_types)
429 continue;
430 }
431
432 return static_cast<int>(i);
433 }
434 }
435
436 return -1;
437 }
438
439 void TtsController::VoicesChanged() {
440 for (std::set<VoicesChangedDelegate*>::iterator iter =
441 voices_changed_delegates_.begin();
442 iter != voices_changed_delegates_.end(); ++iter) {
443 (*iter)->OnVoicesChanged();
444 }
445 }
446
447 void TtsController::AddVoicesChangedDelegate(VoicesChangedDelegate* delegate) {
448 voices_changed_delegates_.insert(delegate);
449 }
450
451 void TtsController::RemoveVoicesChangedDelegate(
452 VoicesChangedDelegate* delegate) {
453 voices_changed_delegates_.erase(delegate);
454 }
455
456 void TtsController::SetTtsEngineDelegate(
457 TtsEngineDelegate* delegate) {
458 tts_engine_delegate_ = delegate;
459 }
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698