chrome/browser/ui/app_list/speech_recognizer.cc - Issue 676593003: Implement native speech recognition for the launcher.

Unified Diff: chrome/browser/ui/app_list/speech_recognizer.cc

Issue 676593003: Implement native speech recognition for the launcher. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Rebase. Created 6 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« chrome/browser/ui/app_list/speech_recognizer.h ('K') | « chrome/browser/ui/app_list/speech_recognizer.h ('k') | chrome/browser/ui/app_list/speech_recognizer_browsertest.cc » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: chrome/browser/ui/app_list/speech_recognizer.cc

diff --git a/chrome/browser/ui/app_list/speech_recognizer.cc b/chrome/browser/ui/app_list/speech_recognizer.cc

new file mode 100644

index 0000000000000000000000000000000000000000..383b858118484ff47225a18fb1c2436328880b04

--- /dev/null

+++ b/chrome/browser/ui/app_list/speech_recognizer.cc

@@ -0,0 +1,318 @@

+// Use of this source code is governed by a BSD-style license that can be

+// found in the LICENSE file.

+#include "chrome/browser/ui/app_list/speech_recognizer.h"

+#include <algorithm>

+#include "base/bind.h"

+#include "base/strings/string16.h"

+#include "chrome/browser/ui/app_list/speech_recognizer_delegate.h"

+#include "content/public/browser/browser_thread.h"

+#include "content/public/browser/render_process_host.h"

+#include "content/public/browser/speech_recognition_manager.h"

+#include "content/public/browser/speech_recognition_session_config.h"

+#include "content/public/browser/web_contents.h"

+#include "content/public/common/speech_recognition_error.h"

+namespace app_list {

+// Length of timeout to cancel recognition if there's no speech heard.

+static const int kNoSpeechTimeoutInSeconds = 5;

+// Speech recognizer listener. This is separate from SpeechRecognizer because

+// the speech recognition engine must function from the IO thread. Because of

+// this, the lifecycle of this class must be decoupled from the lifecycle of

+// SpeechRecognizer. To avoid circular references, this class has no reference

+// to SpeechRecognizer. Instead, it has a reference to the

+// SpeechRecognizerDelegate via a weak pointer that is only ever referenced from

+// the UI thread.

+class SpeechRecognizer::EventListener

+ : public base::RefCountedThreadSafe<SpeechRecognizer::EventListener>,

+ public content::SpeechRecognitionEventListener,

+ public SpeechRecognizerDelegate {

+ public:

+ EventListener(base::WeakPtr<SpeechRecognizerDelegate> delegate,

+ net::URLRequestContextGetter* url_request_context_getter,

+ const std::string& locale);  // Must be constructed on the UI thread.

+ void StartOnIOThread(int render_process_id);  // IO thread only. Stops any active session, then creates and starts a new one.

+ void StopOnIOThread();  // IO thread only. No-op when no session is active.

+ private:

+ friend class base::RefCountedThreadSafe<SpeechRecognizer::EventListener>;

+ ~EventListener();  // DCHECKs that speech_timeout_ is no longer running.

+ void NotifyRecognitionStateChanged(SpeechRecognitionState new_state);  // Posts OnSpeechRecognitionStateChanged(new_state) to the UI thread.

+ void StartSpeechTimeout();  // IO thread only. Arms speech_timeout_ for kNoSpeechTimeoutInSeconds.

+ void StopSpeechTimeout();  // IO thread only. Cancels speech_timeout_.

+ void SpeechTimeout();  // Timer callback on the IO thread; stops the session.

+ // Overridden from app_list::SpeechRecognizerDelegate:

+ // Always called on the UI thread and used to dispatch to delegate_.

+ void OnSpeechResult(const base::string16& query, bool is_final) override;

+ void OnSpeechSoundLevelChanged(int16_t level) override;

+ void OnSpeechRecognitionStateChanged(

+ SpeechRecognitionState new_state) override;

+ content::WebContents* GetSpeechContents() override;  // Not expected to be called on this class (NOTREACHED); returns nullptr.

+ // Overridden from content::SpeechRecognitionEventListener:

+ // These are always called on the IO thread.

+ void OnRecognitionStart(int session_id) override;

+ void OnRecognitionEnd(int session_id) override;

+ void OnRecognitionResults(

+ int session_id,

+ const content::SpeechRecognitionResults& results) override;

+ void OnRecognitionError(

+ int session_id, const content::SpeechRecognitionError& error) override;

+ void OnSoundStart(int session_id) override;

+ void OnSoundEnd(int session_id) override;

+ void OnAudioLevelsChange(

+ int session_id, float volume, float noise_volume) override;

+ void OnEnvironmentEstimationComplete(int session_id) override;

+ void OnAudioStart(int session_id) override;

+ void OnAudioEnd(int session_id) override;

+ // Only access from the UI thread.

+ base::WeakPtr<SpeechRecognizerDelegate> delegate_;

+ scoped_refptr<net::URLRequestContextGetter> url_request_context_getter_;  // Passed through to the session config.

+ std::string locale_;  // Passed to the session config as the recognition language.

+ base::Timer speech_timeout_;  // Armed in OnSoundStart(); stops the session if it fires.

+ int session_;  // Id of the active recognition session, or -1 when there is none.

+ base::WeakPtrFactory<EventListener> weak_factory_;  // Source of the weak pointer set as the session config's event_listener.

+ DISALLOW_COPY_AND_ASSIGN(EventListener);

+};

+SpeechRecognizer::EventListener::EventListener(

+ base::WeakPtr<SpeechRecognizerDelegate> delegate,

+ net::URLRequestContextGetter* url_request_context_getter,

+ const std::string& locale)

+ : delegate_(delegate),

+ url_request_context_getter_(url_request_context_getter),

+ locale_(locale),

+ speech_timeout_(false, false),

+ session_(-1),

+ weak_factory_(this) {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+SpeechRecognizer::EventListener::~EventListener() {

+ DCHECK(!speech_timeout_.IsRunning());

+void SpeechRecognizer::EventListener::StartOnIOThread(int render_process_id) {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::IO);

+ if (session_ != -1)

+ StopOnIOThread();

+ content::SpeechRecognitionSessionConfig config;

+ config.language = locale_;

+ config.is_legacy_api = false;

+ config.continuous = true;

+ config.interim_results = true;

+ config.max_hypotheses = 1;

+ config.filter_profanities = true;

+ config.url_request_context_getter = url_request_context_getter_;

+ config.event_listener = weak_factory_.GetWeakPtr();

+ config.initial_context.render_process_id = render_process_id;

+ auto speech_instance = content::SpeechRecognitionManager::GetInstance();

+ session_ = speech_instance->CreateSession(config);

+ speech_instance->StartSession(session_);

+void SpeechRecognizer::EventListener::StopOnIOThread() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::IO);

+ if (session_ == -1)

+ return;

+ // Prevent recursion.

+ int session = session_;

+ session_ = -1;

+ StopSpeechTimeout();

+ content::SpeechRecognitionManager::GetInstance()->StopAudioCaptureForSession(

+ session);

+void SpeechRecognizer::EventListener::NotifyRecognitionStateChanged(

+ SpeechRecognitionState new_state) {

+ content::BrowserThread::PostTask(

+ content::BrowserThread::UI,

+ FROM_HERE,

+ base::Bind(&SpeechRecognizerDelegate::OnSpeechRecognitionStateChanged,

+ this,

+ new_state));

+void SpeechRecognizer::EventListener::StartSpeechTimeout() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::IO);

+ speech_timeout_.Start(

+ FROM_HERE,

+ base::TimeDelta::FromSeconds(kNoSpeechTimeoutInSeconds),

+ base::Bind(&SpeechRecognizer::EventListener::SpeechTimeout, this));

+void SpeechRecognizer::EventListener::StopSpeechTimeout() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::IO);

+ speech_timeout_.Stop();

+void SpeechRecognizer::EventListener::SpeechTimeout() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::IO);

+ StopOnIOThread();

+void SpeechRecognizer::EventListener::OnRecognitionStart(int session_id) {

+ NotifyRecognitionStateChanged(SPEECH_RECOGNITION_RECOGNIZING);

+void SpeechRecognizer::EventListener::OnRecognitionEnd(int session_id) {

+ StopOnIOThread();

+ NotifyRecognitionStateChanged(SPEECH_RECOGNITION_READY);

+void SpeechRecognizer::EventListener::OnRecognitionResults(

+ int session_id, const content::SpeechRecognitionResults& results) {

+ base::string16 result_str;

+ size_t final_count = 0;

+ for (const auto& result : results) {

+ if (!result.is_provisional)

+ final_count++;

+ result_str += result.hypotheses[0].utterance;

+ }

+ StopSpeechTimeout();

+ content::BrowserThread::PostTask(

+ content::BrowserThread::UI,

+ FROM_HERE,

+ base::Bind(&SpeechRecognizerDelegate::OnSpeechResult,

+ this,

+ result_str,

+ final_count == results.size()));

+ // Stop the moment we have a final result.

+ if (final_count == results.size())

+ StopOnIOThread();

+void SpeechRecognizer::EventListener::OnRecognitionError(

+ int session_id, const content::SpeechRecognitionError& error) {

+ StopOnIOThread();

+ if (error.code == content::SPEECH_RECOGNITION_ERROR_NETWORK) {

+ NotifyRecognitionStateChanged(SPEECH_RECOGNITION_NETWORK_ERROR);

+ }

+ NotifyRecognitionStateChanged(SPEECH_RECOGNITION_READY);

+void SpeechRecognizer::EventListener::OnSoundStart(int session_id) {

+ StartSpeechTimeout();

+ NotifyRecognitionStateChanged(SPEECH_RECOGNITION_IN_SPEECH);

+void SpeechRecognizer::EventListener::OnSoundEnd(int session_id) {

+ StopOnIOThread();

+ NotifyRecognitionStateChanged(SPEECH_RECOGNITION_RECOGNIZING);

+void SpeechRecognizer::EventListener::OnAudioLevelsChange(

+ int session_id, float volume, float noise_volume) {

+ DCHECK_LE(0.0, volume);

+ DCHECK_GE(1.0, volume);

+ DCHECK_LE(0.0, noise_volume);

+ DCHECK_GE(1.0, noise_volume);

+ volume = std::max(0.0f, volume - noise_volume);

+ // Both |volume| and |noise_volume| are defined to be in the range [0.0, 1.0].

+ // See: content/public/browser/speech_recognition_event_listener.h

+ int16_t sound_level = static_cast<int16_t>(INT16_MAX * volume);

+ content::BrowserThread::PostTask(

+ content::BrowserThread::UI,

+ FROM_HERE,

+ base::Bind(&SpeechRecognizerDelegate::OnSpeechSoundLevelChanged,

+ this,

+ sound_level));

+void SpeechRecognizer::EventListener::OnEnvironmentEstimationComplete(

+ int session_id) {

+void SpeechRecognizer::EventListener::OnAudioStart(int session_id) {

+void SpeechRecognizer::EventListener::OnAudioEnd(int session_id) {

+void SpeechRecognizer::EventListener::OnSpeechResult(

Lei Zhang 2014/11/05 00:54:15 Why not put this in SpeechRecognizer?

Anand Mistry (off Chromium) 2014/11/05 02:58:33 I've learned that using WeakPtr<> with callbacks "

+ const base::string16& query, bool is_final) {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ if (delegate_)

+ delegate_->OnSpeechResult(query, is_final);

+void SpeechRecognizer::EventListener::OnSpeechSoundLevelChanged(int16_t level) {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ if (delegate_)

+ delegate_->OnSpeechSoundLevelChanged(level);

+void SpeechRecognizer::EventListener::OnSpeechRecognitionStateChanged(

+ SpeechRecognitionState new_state) {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ if (delegate_)

+ delegate_->OnSpeechRecognitionStateChanged(new_state);

+content::WebContents* SpeechRecognizer::EventListener::GetSpeechContents() {

+ NOTREACHED();

+ return nullptr;

+SpeechRecognizer::SpeechRecognizer(

+ SpeechRecognizerDelegate* delegate,

+ net::URLRequestContextGetter* url_request_context_getter,

+ const std::string& locale)

+ : delegate_(delegate),

+ delegate_weak_factory_(delegate) {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ // Must be done after delegate_weak_factory_ has been constructed.

+ speech_event_listener_ = new EventListener(

+ delegate_weak_factory_.GetWeakPtr(), url_request_context_getter, locale);

+SpeechRecognizer::~SpeechRecognizer() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ Stop();

+void SpeechRecognizer::Start() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ // The speech recognizer checks to see if the request is allowed by looking

+ // up the renderer process. A renderer containing the app-list is hard-coded

+ // to be allowed.

+ content::WebContents* contents = delegate_->GetSpeechContents();

+ if (!contents)

+ return;

+ content::BrowserThread::PostTask(

+ content::BrowserThread::IO,

+ FROM_HERE,

+ base::Bind(&SpeechRecognizer::EventListener::StartOnIOThread,

+ speech_event_listener_,

+ contents->GetRenderProcessHost()->GetID()));

+void SpeechRecognizer::Stop() {

+ DCHECK_CURRENTLY_ON(content::BrowserThread::UI);

+ content::BrowserThread::PostTask(

+ content::BrowserThread::IO,

+ FROM_HERE,

+ base::Bind(&SpeechRecognizer::EventListener::StopOnIOThread,

+ speech_event_listener_));

+} // namespace app_list