chrome/browser/speech/tts_controller.cc - Issue 412783002: Separate out the TtsController interface from it's impl

Side by Side Diff: chrome/browser/speech/tts_controller.cc

Issue 412783002: Separate out the TtsController interface from it's impl (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Created 6 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
	(Empty)
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.

2 // Use of this source code is governed by a BSD-style license that can be

3 // found in the LICENSE file.

4

5 #include "chrome/browser/speech/tts_controller.h"

6

7 #include <string>

8 #include <vector>

9

10 #include "base/float_util.h"

11 #include "base/values.h"

12 #include "chrome/browser/browser_process.h"

13 #include "chrome/browser/speech/tts_platform.h"

14

15 namespace {

16 // A value to be used to indicate that there is no char index available.

17 const int kInvalidCharIndex = -1;

18

19 // Given a language/region code of the form 'fr-FR', returns just the basic

20 // language portion, e.g. 'fr'.

21 std::string TrimLanguageCode(std::string lang) {

22 if (lang.size() >= 5 && lang[2] == '-')

23 return lang.substr(0, 2);

24 else

25 return lang;

26 }

27

28 } // namespace

29

30 bool IsFinalTtsEventType(TtsEventType event_type) {

31 return (event_type == TTS_EVENT_END \|\|

32 event_type == TTS_EVENT_INTERRUPTED \|\|

33 event_type == TTS_EVENT_CANCELLED \|\|

34 event_type == TTS_EVENT_ERROR);

35 }

36

37 //

38 // UtteranceContinuousParameters

39 //

40

41

42 UtteranceContinuousParameters::UtteranceContinuousParameters()

43 : rate(-1),

44 pitch(-1),

45 volume(-1) {}

46

47

48 //

49 // VoiceData

50 //

51

52

53 VoiceData::VoiceData()

54 : gender(TTS_GENDER_NONE),

55 remote(false),

56 native(false) {}

57

58 VoiceData::~VoiceData() {}

59

60

61 //

62 // Utterance

63 //

64

65 // static

66 int Utterance::next_utterance_id_ = 0;

67

68 Utterance::Utterance(Profile* profile)

69 : profile_(profile),

70 id_(next_utterance_id_++),

71 src_id_(-1),

72 gender_(TTS_GENDER_NONE),

73 can_enqueue_(false),

74 char_index_(0),

75 finished_(false) {

76 options_.reset(new base::DictionaryValue());

77 }

78

79 Utterance::~Utterance() {

80 DCHECK(finished_);

81 }

82

83 void Utterance::OnTtsEvent(TtsEventType event_type,

84 int char_index,

85 const std::string& error_message) {

86 if (char_index >= 0)

87 char_index_ = char_index;

88 if (IsFinalTtsEventType(event_type))

89 finished_ = true;

90

91 if (event_delegate_)

92 event_delegate_->OnTtsEvent(this, event_type, char_index, error_message);

93 if (finished_)

94 event_delegate_.reset();

95 }

96

97 void Utterance::Finish() {

98 finished_ = true;

99 }

100

101 void Utterance::set_options(const base::Value* options) {

102 options_.reset(options->DeepCopy());

103 }

104

105 //

106 // TtsController

107 //

108

109 // static

110 TtsController* TtsController::GetInstance() {

111 return Singleton<TtsController>::get();

112 }

113

114 TtsController::TtsController()

115 : current_utterance_(NULL),

116 paused_(false),

117 platform_impl_(NULL),

118 tts_engine_delegate_(NULL) {

119 }

120

121 TtsController::~TtsController() {

122 if (current_utterance_) {

123 current_utterance_->Finish();

124 delete current_utterance_;

125 }

126

127 // Clear any queued utterances too.

128 ClearUtteranceQueue(false); // Don't sent events.

129 }

130

131 void TtsController::SpeakOrEnqueue(Utterance* utterance) {

132 // If we're paused and we get an utterance that can't be queued,

133 // flush the queue but stay in the paused state.

134 if (paused_ && !utterance->can_enqueue()) {

135 Stop();

136 paused_ = true;

137 return;

138 }

139

140 if (paused_ \|\| (IsSpeaking() && utterance->can_enqueue())) {

141 utterance_queue_.push(utterance);

142 } else {

143 Stop();

144 SpeakNow(utterance);

145 }

146 }

147

148 void TtsController::SpeakNow(Utterance* utterance) {

149 // Ensure we have all built-in voices loaded. This is a no-op if already

150 // loaded.

151 bool loaded_built_in =

152 GetPlatformImpl()->LoadBuiltInTtsExtension(utterance->profile());

153

154 // Get all available voices and try to find a matching voice.

155 std::vector<VoiceData> voices;

156 GetVoices(utterance->profile(), &voices);

157 int index = GetMatchingVoice(utterance, voices);

158

159 VoiceData voice;

160 if (index != -1) {

161 // Select the matching voice.

162 voice = voices[index];

163 } else {

164 // However, if no match was found on a platform without native tts voices,

165 // attempt to get a voice based only on the current locale without respect

166 // to any supplied voice names.

167 std::vector<VoiceData> native_voices;

168

169 if (GetPlatformImpl()->PlatformImplAvailable())

170 GetPlatformImpl()->GetVoices(&native_voices);

171

172 if (native_voices.empty() && !voices.empty()) {

173 // TODO(dtseng): Notify extension caller of an error.

174 utterance->set_voice_name("");

175 // TODO(gaochun): Replace the global variable g_browser_process with

176 // GetContentClient()->browser() to eliminate the dependency of browser

177 // once TTS implementation was moved to content.

178 utterance->set_lang(g_browser_process->GetApplicationLocale());

179 index = GetMatchingVoice(utterance, voices);

180

181 // If even that fails, just take the first available voice.

182 if (index == -1)

183 index = 0;

184 voice = voices[index];

185 } else {

186 // Otherwise, simply give native voices a chance to handle this utterance.

187 voice.native = true;

188 }

189 }

190

191 GetPlatformImpl()->WillSpeakUtteranceWithVoice(utterance, voice);

192

193 if (!voice.native) {

194 #if !defined(OS_ANDROID)

195 DCHECK(!voice.extension_id.empty());

196 current_utterance_ = utterance;

197 utterance->set_extension_id(voice.extension_id);

198 if (tts_engine_delegate_)

199 tts_engine_delegate_->Speak(utterance, voice);

200 bool sends_end_event =

201 voice.events.find(TTS_EVENT_END) != voice.events.end();

202 if (!sends_end_event) {

203 utterance->Finish();

204 delete utterance;

205 current_utterance_ = NULL;

206 SpeakNextUtterance();

207 }

208 #endif

209 } else {

210 // It's possible for certain platforms to send start events immediately

211 // during \|speak\|.

212 current_utterance_ = utterance;

213 GetPlatformImpl()->clear_error();

214 bool success = GetPlatformImpl()->Speak(

215 utterance->id(),

216 utterance->text(),

217 utterance->lang(),

218 voice,

219 utterance->continuous_parameters());

220 if (!success)

221 current_utterance_ = NULL;

222

223 // If the native voice wasn't able to process this speech, see if

224 // the browser has built-in TTS that isn't loaded yet.

225 if (!success && loaded_built_in) {

226 utterance_queue_.push(utterance);

227 return;

228 }

229

230 if (!success) {

231 utterance->OnTtsEvent(TTS_EVENT_ERROR, kInvalidCharIndex,

232 GetPlatformImpl()->error());

233 delete utterance;

234 return;

235 }

236 }

237 }

238

239 void TtsController::Stop() {

240 paused_ = false;

241 if (current_utterance_ && !current_utterance_->extension_id().empty()) {

242 #if !defined(OS_ANDROID)

243 if (tts_engine_delegate_)

244 tts_engine_delegate_->Stop(current_utterance_);

245 #endif

246 } else {

247 GetPlatformImpl()->clear_error();

248 GetPlatformImpl()->StopSpeaking();

249 }

250

251 if (current_utterance_)

252 current_utterance_->OnTtsEvent(TTS_EVENT_INTERRUPTED, kInvalidCharIndex,

253 std::string());

254 FinishCurrentUtterance();

255 ClearUtteranceQueue(true); // Send events.

256 }

257

258 void TtsController::Pause() {

259 paused_ = true;

260 if (current_utterance_ && !current_utterance_->extension_id().empty()) {

261 #if !defined(OS_ANDROID)

262 if (tts_engine_delegate_)

263 tts_engine_delegate_->Pause(current_utterance_);

264 #endif

265 } else if (current_utterance_) {

266 GetPlatformImpl()->clear_error();

267 GetPlatformImpl()->Pause();

268 }

269 }

270

271 void TtsController::Resume() {

272 paused_ = false;

273 if (current_utterance_ && !current_utterance_->extension_id().empty()) {

274 #if !defined(OS_ANDROID)

275 if (tts_engine_delegate_)

276 tts_engine_delegate_->Resume(current_utterance_);

277 #endif

278 } else if (current_utterance_) {

279 GetPlatformImpl()->clear_error();

280 GetPlatformImpl()->Resume();

281 } else {

282 SpeakNextUtterance();

283 }

284 }

285

286 void TtsController::OnTtsEvent(int utterance_id,

287 TtsEventType event_type,

288 int char_index,

289 const std::string& error_message) {

290 // We may sometimes receive completion callbacks "late", after we've

291 // already finished the utterance (for example because another utterance

292 // interrupted or we got a call to Stop). This is normal and we can

293 // safely just ignore these events.

294 if (!current_utterance_ \|\| utterance_id != current_utterance_->id()) {

295 return;

296 }

297 current_utterance_->OnTtsEvent(event_type, char_index, error_message);

298 if (current_utterance_->finished()) {

299 FinishCurrentUtterance();

300 SpeakNextUtterance();

301 }

302 }

303

304 void TtsController::GetVoices(Profile* profile,

305 std::vector<VoiceData>* out_voices) {

306 #if !defined(OS_ANDROID)

307 if (profile && tts_engine_delegate_)

308 tts_engine_delegate_->GetVoices(profile, out_voices);

309 #endif

310

311 TtsPlatformImpl* platform_impl = GetPlatformImpl();

312 if (platform_impl) {

313 // Ensure we have all built-in voices loaded. This is a no-op if already

314 // loaded.

315 platform_impl->LoadBuiltInTtsExtension(profile);

316 if (platform_impl->PlatformImplAvailable())

317 platform_impl->GetVoices(out_voices);

318 }

319 }

320

321 bool TtsController::IsSpeaking() {

322 return current_utterance_ != NULL \|\| GetPlatformImpl()->IsSpeaking();

323 }

324

325 void TtsController::FinishCurrentUtterance() {

326 if (current_utterance_) {

327 if (!current_utterance_->finished())

328 current_utterance_->OnTtsEvent(TTS_EVENT_INTERRUPTED, kInvalidCharIndex,

329 std::string());

330 delete current_utterance_;

331 current_utterance_ = NULL;

332 }

333 }

334

335 void TtsController::SpeakNextUtterance() {

336 if (paused_)

337 return;

338

339 // Start speaking the next utterance in the queue. Keep trying in case

340 // one fails but there are still more in the queue to try.

341 while (!utterance_queue_.empty() && !current_utterance_) {

342 Utterance* utterance = utterance_queue_.front();

343 utterance_queue_.pop();

344 SpeakNow(utterance);

345 }

346 }

347

348 void TtsController::RetrySpeakingQueuedUtterances() {

349 if (current_utterance_ == NULL && !utterance_queue_.empty())

350 SpeakNextUtterance();

351 }

352

353 void TtsController::ClearUtteranceQueue(bool send_events) {

354 while (!utterance_queue_.empty()) {

355 Utterance* utterance = utterance_queue_.front();

356 utterance_queue_.pop();

357 if (send_events)

358 utterance->OnTtsEvent(TTS_EVENT_CANCELLED, kInvalidCharIndex,

359 std::string());

360 else

361 utterance->Finish();

362 delete utterance;

363 }

364 }

365

366 void TtsController::SetPlatformImpl(

367 TtsPlatformImpl* platform_impl) {

368 platform_impl_ = platform_impl;

369 }

370

371 int TtsController::QueueSize() {

372 return static_cast<int>(utterance_queue_.size());

373 }

374

375 TtsPlatformImpl* TtsController::GetPlatformImpl() {

376 if (!platform_impl_)

377 platform_impl_ = TtsPlatformImpl::GetInstance();

378 return platform_impl_;

379 }

380

381 int TtsController::GetMatchingVoice(

382 const Utterance* utterance, std::vector<VoiceData>& voices) {

383 // Make two passes: the first time, do strict language matching

384 // ('fr-FR' does not match 'fr-CA'). The second time, do prefix

385 // language matching ('fr-FR' matches 'fr' and 'fr-CA')

386 for (int pass = 0; pass < 2; ++pass) {

387 for (size_t i = 0; i < voices.size(); ++i) {

388 const VoiceData& voice = voices[i];

389

390 if (!utterance->extension_id().empty() &&

391 utterance->extension_id() != voice.extension_id) {

392 continue;

393 }

394

395 if (!voice.name.empty() &&

396 !utterance->voice_name().empty() &&

397 voice.name != utterance->voice_name()) {

398 continue;

399 }

400 if (!voice.lang.empty() && !utterance->lang().empty()) {

401 std::string voice_lang = voice.lang;

402 std::string utterance_lang = utterance->lang();

403 if (pass == 1) {

404 voice_lang = TrimLanguageCode(voice_lang);

405 utterance_lang = TrimLanguageCode(utterance_lang);

406 }

407 if (voice_lang != utterance_lang) {

408 continue;

409 }

410 }

411 if (voice.gender != TTS_GENDER_NONE &&

412 utterance->gender() != TTS_GENDER_NONE &&

413 voice.gender != utterance->gender()) {

414 continue;

415 }

416

417 if (utterance->required_event_types().size() > 0) {

418 bool has_all_required_event_types = true;

419 for (std::set<TtsEventType>::const_iterator iter =

420 utterance->required_event_types().begin();

421 iter != utterance->required_event_types().end();

422 ++iter) {

423 if (voice.events.find(*iter) == voice.events.end()) {

424 has_all_required_event_types = false;

425 break;

426 }

427 }

428 if (!has_all_required_event_types)

429 continue;

430 }

431

432 return static_cast<int>(i);

433 }

434 }

435

436 return -1;

437 }

438

439 void TtsController::VoicesChanged() {

440 for (std::set<VoicesChangedDelegate*>::iterator iter =

441 voices_changed_delegates_.begin();

442 iter != voices_changed_delegates_.end(); ++iter) {

443 (*iter)->OnVoicesChanged();

444 }

445 }

446

447 void TtsController::AddVoicesChangedDelegate(VoicesChangedDelegate* delegate) {

448 voices_changed_delegates_.insert(delegate);

449 }

450

451 void TtsController::RemoveVoicesChangedDelegate(

452 VoicesChangedDelegate* delegate) {

453 voices_changed_delegates_.erase(delegate);

454 }

455

456 void TtsController::SetTtsEngineDelegate(

457 TtsEngineDelegate* delegate) {

458 tts_engine_delegate_ = delegate;

459 }

OLD	NEW

« no previous file with comments | « chrome/browser/speech/tts_controller.h ('k') | chrome/browser/speech/tts_controller_impl.h » ('j') | chrome/browser/speech/tts_controller_impl.h » ('J')