Chromium Code Reviews| OLD | NEW |
|---|---|
| (Empty) | |
| 1 // Copyright 2014 The Chromium Authors. All rights reserved. | |
| 2 // Use of this source code is governed by a BSD-style license that can be | |
| 3 // found in the LICENSE file. | |
| 4 | |
| 5 #include "chrome/browser/ui/app_list/speech_recognizer.h" | |
| 6 | |
| 7 #include <algorithm> | |
| 8 | |
| 9 #include "base/bind.h" | |
| 10 #include "base/strings/string16.h" | |
| 11 #include "chrome/browser/ui/app_list/speech_recognizer_delegate.h" | |
| 12 #include "content/public/browser/browser_thread.h" | |
| 13 #include "content/public/browser/render_process_host.h" | |
| 14 #include "content/public/browser/speech_recognition_manager.h" | |
| 15 #include "content/public/browser/speech_recognition_session_config.h" | |
| 16 #include "content/public/browser/web_contents.h" | |
| 17 #include "content/public/common/speech_recognition_error.h" | |
| 18 | |
| 19 namespace app_list { | |
| 20 | |
| 21 // Length of timeout to cancel recognition if there's no speech heard. | |
| 22 static const int kNoSpeechTimeoutInSeconds = 5; | |
| 23 | |
| 24 // Speech recognizer listener. This is separate from SpeechRecognizer because | |
| 25 // the speech recognition engine must function from the IO thread. Because of | |
| 26 // this, the lifecycle of this class must be decoupled from the lifecycle of | |
| 27 // SpeechRecognizer. To avoid circular references, this class has no reference | |
| 28 // to SpeechRecognizer. Instead, it has a reference to the | |
| 29 // SpeechRecognizerDelegate via a weak pointer that is only ever referenced from | |
| 30 // the UI thread. | |
| 31 class SpeechRecognizer::EventListener | |
| 32 : public base::RefCountedThreadSafe<SpeechRecognizer::EventListener>, | |
| 33 public content::SpeechRecognitionEventListener, | |
| 34 public SpeechRecognizerDelegate { | |
| 35 public: | |
| 36 EventListener(base::WeakPtr<SpeechRecognizerDelegate> delegate, | |
| 37 net::URLRequestContextGetter* url_request_context_getter, | |
| 38 const std::string& locale); | |
| 39 | |
| 40 void StartOnIOThread(int render_process_id); | |
| 41 void StopOnIOThread(); | |
| 42 | |
| 43 private: | |
| 44 friend class base::RefCountedThreadSafe<SpeechRecognizer::EventListener>; | |
| 45 ~EventListener(); | |
| 46 | |
| 47 void NotifyRecognitionStateChanged(SpeechRecognitionState new_state); | |
| 48 | |
| 49 void StartSpeechTimeout(); | |
| 50 void StopSpeechTimeout(); | |
| 51 void SpeechTimeout(); | |
| 52 | |
| 53 // Overridden from app_list::SpeechRecognizerDelegate: | |
| 54 // Always called on the UI thread and used to dispatch to delegate_. | |
| 55 void OnSpeechResult(const base::string16& query, bool is_final) override; | |
| 56 void OnSpeechSoundLevelChanged(int16_t level) override; | |
| 57 void OnSpeechRecognitionStateChanged( | |
| 58 SpeechRecognitionState new_state) override; | |
| 59 content::WebContents* GetSpeechContents() override; | |
| 60 | |
| 61 // Overidden from content::SpeechRecognitionEventListener: | |
| 62 // These are always called on the IO thread. | |
| 63 void OnRecognitionStart(int session_id) override; | |
| 64 void OnRecognitionEnd(int session_id) override; | |
| 65 void OnRecognitionResults( | |
| 66 int session_id, | |
| 67 const content::SpeechRecognitionResults& results) override; | |
| 68 void OnRecognitionError( | |
| 69 int session_id, const content::SpeechRecognitionError& error) override; | |
| 70 void OnSoundStart(int session_id) override; | |
| 71 void OnSoundEnd(int session_id) override; | |
| 72 void OnAudioLevelsChange( | |
| 73 int session_id, float volume, float noise_volume) override; | |
| 74 void OnEnvironmentEstimationComplete(int session_id) override; | |
| 75 void OnAudioStart(int session_id) override; | |
| 76 void OnAudioEnd(int session_id) override; | |
| 77 | |
| 78 // Only access from the UI thread. | |
| 79 base::WeakPtr<SpeechRecognizerDelegate> delegate_; | |
| 80 | |
| 81 scoped_refptr<net::URLRequestContextGetter> url_request_context_getter_; | |
| 82 std::string locale_; | |
| 83 base::Timer speech_timeout_; | |
| 84 int session_; | |
| 85 | |
| 86 base::WeakPtrFactory<EventListener> weak_factory_; | |
| 87 | |
| 88 DISALLOW_COPY_AND_ASSIGN(EventListener); | |
| 89 }; | |
| 90 | |
| 91 SpeechRecognizer::EventListener::EventListener( | |
| 92 base::WeakPtr<SpeechRecognizerDelegate> delegate, | |
| 93 net::URLRequestContextGetter* url_request_context_getter, | |
| 94 const std::string& locale) | |
| 95 : delegate_(delegate), | |
| 96 url_request_context_getter_(url_request_context_getter), | |
| 97 locale_(locale), | |
| 98 speech_timeout_(false, false), | |
| 99 session_(-1), | |
| 100 weak_factory_(this) { | |
| 101 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 102 } | |
| 103 | |
| 104 SpeechRecognizer::EventListener::~EventListener() { | |
| 105 DCHECK(!speech_timeout_.IsRunning()); | |
| 106 } | |
| 107 | |
| 108 void SpeechRecognizer::EventListener::StartOnIOThread(int render_process_id) { | |
| 109 DCHECK_CURRENTLY_ON(content::BrowserThread::IO); | |
| 110 if (session_ != -1) | |
| 111 StopOnIOThread(); | |
| 112 | |
| 113 content::SpeechRecognitionSessionConfig config; | |
| 114 config.language = locale_; | |
| 115 config.is_legacy_api = false; | |
| 116 config.continuous = true; | |
| 117 config.interim_results = true; | |
| 118 config.max_hypotheses = 1; | |
| 119 config.filter_profanities = true; | |
| 120 config.url_request_context_getter = url_request_context_getter_; | |
| 121 config.event_listener = weak_factory_.GetWeakPtr(); | |
| 122 config.initial_context.render_process_id = render_process_id; | |
| 123 | |
| 124 auto speech_instance = content::SpeechRecognitionManager::GetInstance(); | |
| 125 session_ = speech_instance->CreateSession(config); | |
| 126 speech_instance->StartSession(session_); | |
| 127 } | |
| 128 | |
| 129 void SpeechRecognizer::EventListener::StopOnIOThread() { | |
| 130 DCHECK_CURRENTLY_ON(content::BrowserThread::IO); | |
| 131 if (session_ == -1) | |
| 132 return; | |
| 133 | |
| 134 // Prevent recursion. | |
| 135 int session = session_; | |
| 136 session_ = -1; | |
| 137 StopSpeechTimeout(); | |
| 138 content::SpeechRecognitionManager::GetInstance()->StopAudioCaptureForSession( | |
| 139 session); | |
| 140 } | |
| 141 | |
| 142 void SpeechRecognizer::EventListener::NotifyRecognitionStateChanged( | |
| 143 SpeechRecognitionState new_state) { | |
| 144 content::BrowserThread::PostTask( | |
| 145 content::BrowserThread::UI, | |
| 146 FROM_HERE, | |
| 147 base::Bind(&SpeechRecognizerDelegate::OnSpeechRecognitionStateChanged, | |
| 148 this, | |
| 149 new_state)); | |
| 150 } | |
| 151 | |
| 152 void SpeechRecognizer::EventListener::StartSpeechTimeout() { | |
| 153 DCHECK_CURRENTLY_ON(content::BrowserThread::IO); | |
| 154 speech_timeout_.Start( | |
| 155 FROM_HERE, | |
| 156 base::TimeDelta::FromSeconds(kNoSpeechTimeoutInSeconds), | |
| 157 base::Bind(&SpeechRecognizer::EventListener::SpeechTimeout, this)); | |
| 158 } | |
| 159 | |
| 160 void SpeechRecognizer::EventListener::StopSpeechTimeout() { | |
| 161 DCHECK_CURRENTLY_ON(content::BrowserThread::IO); | |
| 162 speech_timeout_.Stop(); | |
| 163 } | |
| 164 | |
| 165 void SpeechRecognizer::EventListener::SpeechTimeout() { | |
| 166 DCHECK_CURRENTLY_ON(content::BrowserThread::IO); | |
| 167 StopOnIOThread(); | |
| 168 } | |
| 169 | |
| 170 void SpeechRecognizer::EventListener::OnRecognitionStart(int session_id) { | |
| 171 NotifyRecognitionStateChanged(SPEECH_RECOGNITION_RECOGNIZING); | |
| 172 } | |
| 173 | |
| 174 void SpeechRecognizer::EventListener::OnRecognitionEnd(int session_id) { | |
| 175 StopOnIOThread(); | |
| 176 NotifyRecognitionStateChanged(SPEECH_RECOGNITION_READY); | |
| 177 } | |
| 178 | |
| 179 void SpeechRecognizer::EventListener::OnRecognitionResults( | |
| 180 int session_id, const content::SpeechRecognitionResults& results) { | |
| 181 base::string16 result_str; | |
| 182 size_t final_count = 0; | |
| 183 for (const auto& result : results) { | |
| 184 if (!result.is_provisional) | |
| 185 final_count++; | |
| 186 result_str += result.hypotheses[0].utterance; | |
| 187 } | |
| 188 StopSpeechTimeout(); | |
| 189 content::BrowserThread::PostTask( | |
| 190 content::BrowserThread::UI, | |
| 191 FROM_HERE, | |
| 192 base::Bind(&SpeechRecognizerDelegate::OnSpeechResult, | |
| 193 this, | |
| 194 result_str, | |
| 195 final_count == results.size())); | |
| 196 | |
| 197 // Stop the moment we have a final result. | |
| 198 if (final_count == results.size()) | |
| 199 StopOnIOThread(); | |
| 200 } | |
| 201 | |
| 202 void SpeechRecognizer::EventListener::OnRecognitionError( | |
| 203 int session_id, const content::SpeechRecognitionError& error) { | |
| 204 StopOnIOThread(); | |
| 205 if (error.code == content::SPEECH_RECOGNITION_ERROR_NETWORK) { | |
| 206 NotifyRecognitionStateChanged(SPEECH_RECOGNITION_NETWORK_ERROR); | |
| 207 } | |
| 208 NotifyRecognitionStateChanged(SPEECH_RECOGNITION_READY); | |
| 209 } | |
| 210 | |
| 211 void SpeechRecognizer::EventListener::OnSoundStart(int session_id) { | |
| 212 StartSpeechTimeout(); | |
| 213 NotifyRecognitionStateChanged(SPEECH_RECOGNITION_IN_SPEECH); | |
| 214 } | |
| 215 | |
| 216 void SpeechRecognizer::EventListener::OnSoundEnd(int session_id) { | |
| 217 StopOnIOThread(); | |
| 218 NotifyRecognitionStateChanged(SPEECH_RECOGNITION_RECOGNIZING); | |
| 219 } | |
| 220 | |
| 221 void SpeechRecognizer::EventListener::OnAudioLevelsChange( | |
| 222 int session_id, float volume, float noise_volume) { | |
| 223 DCHECK_LE(0.0, volume); | |
| 224 DCHECK_GE(1.0, volume); | |
| 225 DCHECK_LE(0.0, noise_volume); | |
| 226 DCHECK_GE(1.0, noise_volume); | |
| 227 volume = std::max(0.0f, volume - noise_volume); | |
| 228 // Both |volume| and |noise_volume| are defined to be in the range [0.0, 1.0]. | |
| 229 // See: content/public/browser/speech_recognition_event_listener.h | |
| 230 int16_t sound_level = static_cast<int16_t>(INT16_MAX * volume); | |
| 231 content::BrowserThread::PostTask( | |
| 232 content::BrowserThread::UI, | |
| 233 FROM_HERE, | |
| 234 base::Bind(&SpeechRecognizerDelegate::OnSpeechSoundLevelChanged, | |
| 235 this, | |
| 236 sound_level)); | |
| 237 } | |
| 238 | |
| 239 void SpeechRecognizer::EventListener::OnEnvironmentEstimationComplete( | |
| 240 int session_id) { | |
| 241 } | |
| 242 | |
| 243 void SpeechRecognizer::EventListener::OnAudioStart(int session_id) { | |
| 244 } | |
| 245 | |
| 246 void SpeechRecognizer::EventListener::OnAudioEnd(int session_id) { | |
| 247 } | |
| 248 | |
| 249 void SpeechRecognizer::EventListener::OnSpeechResult( | |
|
Lei Zhang
2014/11/05 00:54:15
Why not put this in SpeechRecognizer?
Anand Mistry (off Chromium)
2014/11/05 02:58:33
I've learned that using WeakPtr<> with callbacks "
| |
| 250 const base::string16& query, bool is_final) { | |
| 251 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 252 if (delegate_) | |
| 253 delegate_->OnSpeechResult(query, is_final); | |
| 254 } | |
| 255 | |
| 256 void SpeechRecognizer::EventListener::OnSpeechSoundLevelChanged(int16_t level) { | |
| 257 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 258 if (delegate_) | |
| 259 delegate_->OnSpeechSoundLevelChanged(level); | |
| 260 } | |
| 261 | |
| 262 void SpeechRecognizer::EventListener::OnSpeechRecognitionStateChanged( | |
| 263 SpeechRecognitionState new_state) { | |
| 264 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 265 if (delegate_) | |
| 266 delegate_->OnSpeechRecognitionStateChanged(new_state); | |
| 267 } | |
| 268 | |
| 269 content::WebContents* SpeechRecognizer::EventListener::GetSpeechContents() { | |
| 270 NOTREACHED(); | |
| 271 return nullptr; | |
| 272 } | |
| 273 | |
| 274 SpeechRecognizer::SpeechRecognizer( | |
| 275 SpeechRecognizerDelegate* delegate, | |
| 276 net::URLRequestContextGetter* url_request_context_getter, | |
| 277 const std::string& locale) | |
| 278 : delegate_(delegate), | |
| 279 delegate_weak_factory_(delegate) { | |
| 280 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 281 | |
| 282 // Must be done after delegate_weak_factory_ has been constructed. | |
| 283 speech_event_listener_ = new EventListener( | |
| 284 delegate_weak_factory_.GetWeakPtr(), url_request_context_getter, locale); | |
| 285 } | |
| 286 | |
| 287 SpeechRecognizer::~SpeechRecognizer() { | |
| 288 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 289 Stop(); | |
| 290 } | |
| 291 | |
| 292 void SpeechRecognizer::Start() { | |
| 293 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 294 // The speech recognizer checks to see if the request is allowed by looking | |
| 295 // up the renderer process. A renderer containing the app-list is hard-coded | |
| 296 // to be allowed. | |
| 297 content::WebContents* contents = delegate_->GetSpeechContents(); | |
| 298 if (!contents) | |
| 299 return; | |
| 300 | |
| 301 content::BrowserThread::PostTask( | |
| 302 content::BrowserThread::IO, | |
| 303 FROM_HERE, | |
| 304 base::Bind(&SpeechRecognizer::EventListener::StartOnIOThread, | |
| 305 speech_event_listener_, | |
| 306 contents->GetRenderProcessHost()->GetID())); | |
| 307 } | |
| 308 | |
| 309 void SpeechRecognizer::Stop() { | |
| 310 DCHECK_CURRENTLY_ON(content::BrowserThread::UI); | |
| 311 content::BrowserThread::PostTask( | |
| 312 content::BrowserThread::IO, | |
| 313 FROM_HERE, | |
| 314 base::Bind(&SpeechRecognizer::EventListener::StopOnIOThread, | |
| 315 speech_event_listener_)); | |
| 316 } | |
| 317 | |
| 318 } // namespace app_list | |
| OLD | NEW |