Chromium Code Reviews

| OLD | NEW |
|---|---|
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #ifndef CONTENT_PUBLIC_BROWSER_SPEECH_RECOGNITION_MANAGER_H_ | 5 #ifndef CONTENT_PUBLIC_BROWSER_SPEECH_RECOGNITION_MANAGER_H_ |
| 6 #define CONTENT_PUBLIC_BROWSER_SPEECH_RECOGNITION_MANAGER_H_ | 6 #define CONTENT_PUBLIC_BROWSER_SPEECH_RECOGNITION_MANAGER_H_ |
| 7 | 7 |
| 8 #include "base/string16.h" | 8 #include "base/string16.h" |
| 9 #include "base/callback.h" | |
| 9 #include "content/common/content_export.h" | 10 #include "content/common/content_export.h" |
| 11 #include "content/public/common/speech_recognition_result.h" | |
| 10 | 12 |
| 11 namespace content { | 13 namespace content { |
| 12 | 14 |
| 13 // This is the gatekeeper for speech recognition in the browser process. It | 15 class SpeechRecognitionEventListener; |
| 14 // handles requests received from various render views and makes sure only one | 16 struct SpeechRecognitionSessionConfig; |
| 15 // of them can use speech recognition at a time. It also sends recognition | 17 struct SpeechRecognitionSessionContext; |
| 16 // results and status events to the render views when required. | 18 |
| 17 class SpeechRecognitionManager { | 19 // The SpeechRecognitionManager (SRM) is a singleton class that handles SR |
|
Satish
2012/04/19 13:03:19
I like this comment block :) but feels verbose. Ca
Primiano Tucci (use gerrit)
2012/04/20 16:06:43
Done.
| |
| 20 // functionalities within Chrome. Everyone that needs to perform SR should | |
| 21 // interface exclusively with the SRM. Usually SR requires the operation and | |
| 22 // coordination of several objects (an audio controller, a SR engine...). The | |
| 23 // aim of the SRM is to make all these activities transparent to end users, | |
| 24 // which will perceive only the SRM methods and the callback interface | |
| 25 // SpeechRecognitionEventListener. | |
| 26 // Since many different sources can use SR at different times (some overlapping | |
| 27 // is allowed while waiting for results), the SRM has the further responsibility | |
| 28 // of handling separately and reliably these different sessions, distinguishing | |
| 29 // them by means of a session_id. | |
| 30 // The rationale behind the word "reliably" is that while most of the classes | |
| 31 // that are (should be) NOT directly accessible to the end-user are designed to | |
| 32 // work in an ideal flow (the SpeechRecognizer will get extremely offended if | |
| 33 // asked to start recognition while it is already in progress), the SRM is | |
| 34 // designed to interface with an evil world (the user interface / JS APIs) in | |
| 35 // which very bad people will try any possible sequence of commands, often | |
| 36 // without a particular logic. | |
| 37 // In this sense a session, within the SRM, models the ongoing evolution of a | |
| 38 // SR request from the viewpoint of the end-user (abstracting all the concrete | |
| 39 // operations that must be carried out, that will be handled by inner classes). | |
| 40 // An SR session requires, for most of the time (i.e. during audio capture), exclusive | |
| 41 // interaction with the user (popup/notifications/consensus). For this reason, | |
| 42 // while many SR sessions can be alive during the lifetime of the browser, | |
| 43 // only one, the interactive session, is allowed to capture audio and interact | |
| 44 // with the user. After the audio capture is terminated the session may | |
| 45 // eventually be detached (will continue processing recorded audio and gathering | |
| 46 // the results without interacting with the user). A SR session finally dies | |
| 47 // either when it retrieves a valid result or when, after reporting a visible | |
| 48 class CONTENT_EXPORT SpeechRecognitionManager { | |
| 18 public: | 49 public: |
| 50 static const int kSessionIDInvalid; | |
| 51 | |
| 19 // Returns the singleton instance. | 52 // Returns the singleton instance. |
| 20 CONTENT_EXPORT static SpeechRecognitionManager* GetInstance(); | 53 static SpeechRecognitionManager* GetInstance(); |
| 21 | 54 |
| 22 // Starts/restarts recognition for an existing request. | 55 // Creates a new recognition session. |
| 23 virtual void StartRecognitionForRequest(int session_id) = 0; | 56 virtual int CreateSession(SpeechRecognitionSessionConfig& config, |
| 57 SpeechRecognitionEventListener* listener) = 0; | |
| 24 | 58 |
| 25 // Cancels recognition for an existing request. | 59 // Starts/restarts recognition for an existing session. |
| 26 virtual void CancelRecognitionForRequest(int session_id) = 0; | 60 virtual void StartSession(int session_id) = 0; |
| 27 | 61 |
| 28 // Called when the user clicks outside the speech input UI causing it to close | 62 // Aborts recognition for an existing session, without providing any result. |
| 29 // and possibly have speech input go to another element. | 63 virtual void AbortSession(int session_id) = 0; |
| 30 virtual void FocusLostForRequest(int session_id) = 0; | 64 |
| 65 // Aborts all sessions for a given listener, without providing any result. | |
| 66 virtual void AbortAllSessionsForListener( | |
| 67 SpeechRecognitionEventListener* listener) = 0; | |
| 68 | |
| 69 // Stops audio capture for an existing session. The audio captured before the | |
| 70 // call will be processed, possibly ending up with a result. | |
| 71 virtual void StopAudioCaptureForSession(int session_id) = 0; | |
| 72 | |
| 73 // Detaches the session preventing it from interacting further with the | |
| 74 // browser (typically invoked when the user clicks outside the speech UI). | |
| 75 // The session will be silently continued in the background if possible (in the | |
| 76 // case it already finished capturing audio and was just waiting for the | |
| 77 // result) or will be aborted if user interaction (e.g., audio recording) was | |
| 78 // involved at the time DetachSession was called. | |
| 79 virtual void DetachSession(int session_id) = 0; | |
| 80 | |
| 81 // Retrieves the context associated with a session. | |
| 82 virtual SpeechRecognitionSessionContext& GetSessionContext( | |
| 83 int session_id) const = 0; | |
| 84 | |
| 85 // Looks up an existing session using a caller-provided matcher function. | |
| 86 virtual int LookupSessionByContext( | |
| 87 base::Callback<bool( | |
| 88 const content::SpeechRecognitionSessionContext&)> matcher) | |
| 89 const = 0; | |
| 31 | 90 |
| 32 // Returns true if the OS reports existence of audio recording devices. | 91 // Returns true if the OS reports existence of audio recording devices. |
| 33 virtual bool HasAudioInputDevices() = 0; | 92 virtual bool HasAudioInputDevices() = 0; |
| 34 | 93 |
| 35 // Used to determine if something else is currently making use of audio input. | 94 // Used to determine if something else is currently making use of audio input. |
| 36 virtual bool IsCapturingAudio() = 0; | 95 virtual bool IsCapturingAudio() = 0; |
| 37 | 96 |
| 38 // Returns a human readable string for the model/make of the active audio | 97 // Returns a human readable string for the model/make of the active audio |
| 39 // input device for this computer. | 98 // input device for this computer. |
| 40 virtual string16 GetAudioInputDeviceModel() = 0; | 99 virtual string16 GetAudioInputDeviceModel() = 0; |
| 41 | 100 |
| 42 // Invokes the platform provided microphone settings UI in a non-blocking way, | 101 // Invokes the platform provided microphone settings UI in a non-blocking way, |
| 43 // via the BrowserThread::FILE thread. | 102 // via the BrowserThread::FILE thread. |
| 44 virtual void ShowAudioInputSettings() = 0; | 103 virtual void ShowAudioInputSettings() = 0; |
| 45 | 104 |
| 46 protected: | 105 protected: |
| 47 virtual ~SpeechRecognitionManager() {} | 106 virtual ~SpeechRecognitionManager() {} |
| 48 }; | 107 }; |
| 49 | 108 |
| 50 } // namespace content | 109 } // namespace content |
| 51 | 110 |
| 52 #endif // CONTENT_PUBLIC_BROWSER_SPEECH_RECOGNITION_MANAGER_H_ | 111 #endif // CONTENT_PUBLIC_BROWSER_SPEECH_RECOGNITION_MANAGER_H_ |
| OLD | NEW |