Chromium Code Reviews

Unified Diff: media/audio/win/audio_low_latency_output_win.cc

Issue 12049070: Avoids irregular OnMoreData callbacks on Windows using Core Audio (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src
Patch Set: Non-trivial rebase, created 7 years, 11 months ago
Index: media/audio/win/audio_low_latency_output_win.cc
diff --git a/media/audio/win/audio_low_latency_output_win.cc b/media/audio/win/audio_low_latency_output_win.cc
index 30375894a02b1b576c108f7757edf548d6671c47..e0376b301163023833389405ad0a6b05c205d2a4 100644
--- a/media/audio/win/audio_low_latency_output_win.cc
+++ b/media/audio/win/audio_low_latency_output_win.cc
@@ -7,6 +7,7 @@
#include <Functiondiscoverykeys_devpkey.h>
#include "base/command_line.h"
+#include "base/debug/trace_event.h"
#include "base/logging.h"
#include "base/memory/scoped_ptr.h"
#include "base/metrics/histogram.h"
@@ -14,6 +15,7 @@
#include "media/audio/audio_util.h"
#include "media/audio/win/audio_manager_win.h"
#include "media/audio/win/avrt_wrapper_win.h"
+#include "media/audio/win/core_audio_util_win.h"
#include "media/base/limits.h"
#include "media/base/media_switches.h"
@@ -25,53 +27,6 @@ namespace media {
typedef uint32 ChannelConfig;
-// Retrieves the stream format that the audio engine uses for its internal
-// processing/mixing of shared-mode streams.
-static HRESULT GetMixFormat(ERole device_role, WAVEFORMATEX** device_format) {
- // Note that we are using the IAudioClient::GetMixFormat() API to get the
- // device format in this function. It is in fact possible to be "more native",
- // and ask the endpoint device directly for its properties. Given a reference
- // to the IMMDevice interface of an endpoint object, a client can obtain a
- // reference to the endpoint object's property store by calling the
- // IMMDevice::OpenPropertyStore() method. However, I have not been able to
- // access any valuable information using this method on my HP Z600 desktop,
- // hence it feels more appropriate to use the IAudioClient::GetMixFormat()
- // approach instead.
-
- // Calling this function only makes sense for shared mode streams, since
- // if the device will be opened in exclusive mode, then the application
- // specified format is used instead. However, the result of this method can
- // be useful for testing purposes so we don't DCHECK here.
- DLOG_IF(WARNING, WASAPIAudioOutputStream::GetShareMode() ==
- AUDCLNT_SHAREMODE_EXCLUSIVE) <<
- "The mixing sample rate will be ignored for exclusive-mode streams.";
-
- // It is assumed that this static method is called from a COM thread, i.e.,
- // CoInitializeEx() is not called here again to avoid STA/MTA conflicts.
- ScopedComPtr<IMMDeviceEnumerator> enumerator;
- HRESULT hr = CoCreateInstance(__uuidof(MMDeviceEnumerator),
- NULL,
- CLSCTX_INPROC_SERVER,
- __uuidof(IMMDeviceEnumerator),
- enumerator.ReceiveVoid());
- if (FAILED(hr))
- return hr;
-
- ScopedComPtr<IMMDevice> endpoint_device;
- hr = enumerator->GetDefaultAudioEndpoint(eRender,
- device_role,
- endpoint_device.Receive());
- if (FAILED(hr))
- return hr;
-
- ScopedComPtr<IAudioClient> audio_client;
- hr = endpoint_device->Activate(__uuidof(IAudioClient),
- CLSCTX_INPROC_SERVER,
- NULL,
- audio_client.ReceiveVoid());
- return SUCCEEDED(hr) ? audio_client->GetMixFormat(device_format) : hr;
-}
-
// Retrieves an integer mask which corresponds to the channel layout the
// audio engine uses for its internal processing/mixing of shared-mode
// streams. This mask indicates which channels are present in the multi-
@@ -81,53 +36,23 @@ static HRESULT GetMixFormat(ERole device_role, WAVEFORMATEX** device_format) {
// See http://msdn.microsoft.com/en-us/library/windows/hardware/ff537083(v=vs.85).aspx
// for more details.
static ChannelConfig GetChannelConfig() {
- // Use a WAVEFORMATEXTENSIBLE structure since it can specify both the
- // number of channels and the mapping of channels to speakers for
- // multichannel devices.
- base::win::ScopedCoMem<WAVEFORMATPCMEX> format_ex;
- HRESULT hr = S_FALSE;
- hr = GetMixFormat(eConsole, reinterpret_cast<WAVEFORMATEX**>(&format_ex));
- if (FAILED(hr))
- return 0;
-
- // The dwChannelMask member specifies which channels are present in the
- // multichannel stream. The least significant bit corresponds to the
- // front left speaker, the next least significant bit corresponds to the
- // front right speaker, and so on.
- // See http://msdn.microsoft.com/en-us/library/windows/desktop/dd757714(v=vs.85).aspx
- // for more details on the channel mapping.
- DVLOG(2) << "dwChannelMask: 0x" << std::hex << format_ex->dwChannelMask;
-
-#if !defined(NDEBUG)
- // See http://en.wikipedia.org/wiki/Surround_sound for more details on
- // how to name various speaker configurations. The list below is not complete.
- const char* speaker_config = "Undefined";
- switch (format_ex->dwChannelMask) {
- case KSAUDIO_SPEAKER_MONO:
- speaker_config = "Mono";
- break;
- case KSAUDIO_SPEAKER_STEREO:
- speaker_config = "Stereo";
- break;
- case KSAUDIO_SPEAKER_5POINT1_SURROUND:
- speaker_config = "5.1 surround";
- break;
- case KSAUDIO_SPEAKER_5POINT1:
- speaker_config = "5.1";
- break;
- case KSAUDIO_SPEAKER_7POINT1_SURROUND:
- speaker_config = "7.1 surround";
- break;
- case KSAUDIO_SPEAKER_7POINT1:
- speaker_config = "7.1";
- break;
- default:
- break;
- }
- DVLOG(2) << "speaker configuration: " << speaker_config;
-#endif
+ WAVEFORMATPCMEX format;
+ return SUCCEEDED(CoreAudioUtil::GetDefaultSharedModeMixFormat(
+ eRender, eConsole, &format)) ?
+ static_cast<ChannelConfig>(format.dwChannelMask) : 0;
+}
- return static_cast<ChannelConfig>(format_ex->dwChannelMask);
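For reference, the mask returned by GetChannelConfig() assigns one bit per speaker position; the least significant bit corresponds to the front left speaker, the next one to the front right speaker, and so on. The debug logging removed by this patch mapped the mask to a readable name. A minimal sketch of that mapping, using the KSAUDIO_SPEAKER_* constants from ksmedia.h (SpeakerConfigName is a hypothetical helper and the list, as before, is not complete):

#include <ksmedia.h>

// Maps a shared-mode channel mask to a human-readable speaker configuration.
static const char* SpeakerConfigName(DWORD channel_mask) {
  switch (channel_mask) {
    case KSAUDIO_SPEAKER_MONO:             return "Mono";
    case KSAUDIO_SPEAKER_STEREO:           return "Stereo";
    case KSAUDIO_SPEAKER_5POINT1:          return "5.1";
    case KSAUDIO_SPEAKER_5POINT1_SURROUND: return "5.1 surround";
    case KSAUDIO_SPEAKER_7POINT1:          return "7.1";
    case KSAUDIO_SPEAKER_7POINT1_SURROUND: return "7.1 surround";
    default:                               return "Undefined";
  }
}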
+// Compare two sets of audio parameters and return true if they are equal.
+// Note that bits_per_sample() is excluded from this comparison since Core
+// Audio can deal with most bit depths. As an example, if the native/mixing
+// bit depth is 32 bits (default), opening at 16 or 24 still works fine and
+// the audio engine will do the required conversion for us.
+static bool CompareAudioParametersNoBitDepth(const media::AudioParameters& a,
+ const media::AudioParameters& b) {
+ return (a.format() == b.format() &&
+ a.channels() == b.channels() &&
+ a.sample_rate() == b.sample_rate() &&
+ a.frames_per_buffer() == b.frames_per_buffer());
}
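To illustrate the bit-depth exemption: two parameter sets that differ only in bit depth compare equal here. A sketch, assuming the AudioParameters constructor that takes a format, channel layout, sample rate, bit depth and buffer size:

media::AudioParameters params_16(
    media::AudioParameters::AUDIO_PCM_LOW_LATENCY,
    media::CHANNEL_LAYOUT_STEREO, 48000, 16, 480);
media::AudioParameters params_32(
    media::AudioParameters::AUDIO_PCM_LOW_LATENCY,
    media::CHANNEL_LAYOUT_STEREO, 48000, 32, 480);
// All compared fields match; only bits_per_sample() differs.
DCHECK(CompareAudioParametersNoBitDepth(params_16, params_32));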
// Converts Microsoft's channel configuration to ChannelLayout.
@@ -172,31 +97,63 @@ AUDCLNT_SHAREMODE WASAPIAudioOutputStream::GetShareMode() {
return AUDCLNT_SHAREMODE_SHARED;
}
+// static
+int WASAPIAudioOutputStream::HardwareChannelCount() {
+ WAVEFORMATPCMEX format;
+ return SUCCEEDED(CoreAudioUtil::GetDefaultSharedModeMixFormat(
+ eRender, eConsole, &format)) ?
+ static_cast<int>(format.Format.nChannels) : 0;
+}
+
+// static
+ChannelLayout WASAPIAudioOutputStream::HardwareChannelLayout() {
+ return ChannelConfigToChannelLayout(GetChannelConfig());
+}
+
+// static
+int WASAPIAudioOutputStream::HardwareSampleRate() {
+ WAVEFORMATPCMEX format;
+ return SUCCEEDED(CoreAudioUtil::GetDefaultSharedModeMixFormat(
+ eRender, eConsole, &format)) ?
+ static_cast<int>(format.Format.nSamplesPerSec) : 0;
+}
+
WASAPIAudioOutputStream::WASAPIAudioOutputStream(AudioManagerWin* manager,
const AudioParameters& params,
ERole device_role)
: creating_thread_id_(base::PlatformThread::CurrentId()),
manager_(manager),
opened_(false),
- restart_rendering_mode_(false),
+ audio_parameters_are_valid_(false),
volume_(1.0),
endpoint_buffer_size_frames_(0),
device_role_(device_role),
share_mode_(GetShareMode()),
- client_channel_count_(params.channels()),
num_written_frames_(0),
source_(NULL),
audio_bus_(AudioBus::Create(params)) {
DCHECK(manager_);
+ DVLOG(1) << "WASAPIAudioOutputStream::WASAPIAudioOutputStream()";
+ DVLOG_IF(1, share_mode_ == AUDCLNT_SHAREMODE_EXCLUSIVE)
+ << "Core Audio (WASAPI) EXCLUSIVE MODE is enabled.";
+
+ if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
+ // Verify that the input audio parameters are identical (bit depth is
+ // excluded) to the preferred (native) audio parameters. Open() will fail
+ // if this is not the case.
+ AudioParameters preferred_params;
+ HRESULT hr = CoreAudioUtil::GetPreferredAudioParameters(
+ eRender, device_role, &preferred_params);
+ audio_parameters_are_valid_ = SUCCEEDED(hr) &&
+ CompareAudioParametersNoBitDepth(params, preferred_params);
+ DLOG_IF(WARNING, !audio_parameters_are_valid_)
+ << "Input and preferred parameters are not identical.";
+ }
// Load the Avrt DLL if not already loaded. Required to support MMCSS.
bool avrt_init = avrt::Initialize();
DCHECK(avrt_init) << "Failed to load the avrt.dll";
- if (share_mode_ == AUDCLNT_SHAREMODE_EXCLUSIVE) {
- VLOG(1) << ">> Note that EXCLUSIVE MODE is enabled <<";
- }
-
// Set up the desired render format specified by the client. We use the
// WAVE_FORMAT_EXTENSIBLE structure to ensure that multiple channel ordering
// and high precision data can be supported.
@@ -204,7 +161,7 @@ WASAPIAudioOutputStream::WASAPIAudioOutputStream(AudioManagerWin* manager,
// Begin with the WAVEFORMATEX structure that specifies the basic format.
WAVEFORMATEX* format = &format_.Format;
format->wFormatTag = WAVE_FORMAT_EXTENSIBLE;
- format->nChannels = client_channel_count_;
+ format->nChannels = params.channels();
format->nSamplesPerSec = params.sample_rate();
format->wBitsPerSample = params.bits_per_sample();
format->nBlockAlign = (format->wBitsPerSample / 8) * format->nChannels;
@@ -216,15 +173,12 @@ WASAPIAudioOutputStream::WASAPIAudioOutputStream(AudioManagerWin* manager,
format_.dwChannelMask = GetChannelConfig();
format_.SubFormat = KSDATAFORMAT_SUBTYPE_PCM;
- // Size in bytes of each audio frame.
- frame_size_ = format->nBlockAlign;
-
// Store size (in different units) of audio packets which we expect to
// get from the audio endpoint device in each render event.
- packet_size_frames_ = params.GetBytesPerBuffer() / format->nBlockAlign;
+ packet_size_frames_ = params.frames_per_buffer();
packet_size_bytes_ = params.GetBytesPerBuffer();
packet_size_ms_ = (1000.0 * packet_size_frames_) / params.sample_rate();
- DVLOG(1) << "Number of bytes per audio frame : " << frame_size_;
+ DVLOG(1) << "Number of bytes per audio frame : " << format->nBlockAlign;
DVLOG(1) << "Number of audio frames per packet: " << packet_size_frames_;
DVLOG(1) << "Number of bytes per packet : " << packet_size_bytes_;
DVLOG(1) << "Number of milliseconds per packet: " << packet_size_ms_;
@@ -244,55 +198,88 @@ WASAPIAudioOutputStream::WASAPIAudioOutputStream(AudioManagerWin* manager,
WASAPIAudioOutputStream::~WASAPIAudioOutputStream() {}
bool WASAPIAudioOutputStream::Open() {
+ DVLOG(1) << "WASAPIAudioOutputStream::Open()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
if (opened_)
return true;
- // Channel mixing is not supported, it must be handled by ChannelMixer.
- if (format_.Format.nChannels != client_channel_count_) {
- LOG(ERROR) << "Channel down-mixing is not supported.";
- return false;
+
+ // Audio parameters must be identical to the preferred set of parameters
+ // if shared mode (default) is utilized.
+ if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
+ if (!audio_parameters_are_valid_) {
+ LOG(ERROR) << "Audio parameters are not valid.";
+ return false;
+ }
}
- // Create an IMMDeviceEnumerator interface and obtain a reference to
- // the IMMDevice interface of the default rendering device with the
- // specified role.
- HRESULT hr = SetRenderDevice();
- if (FAILED(hr)) {
+ // Create an IAudioClient interface for the default rendering IMMDevice.
+ ScopedComPtr<IAudioClient> audio_client =
+ CoreAudioUtil::CreateDefaultClient(eRender, device_role_);
+ if (!audio_client)
return false;
- }
- // Obtain an IAudioClient interface which enables us to create and initialize
- // an audio stream between an audio application and the audio engine.
- hr = ActivateRenderDevice();
- if (FAILED(hr)) {
+ // Extra sanity check to ensure that the provided device format is still valid.
+ if (!CoreAudioUtil::IsFormatSupported(audio_client,
+ share_mode_,
+ &format_)) {
return false;
}
- // Verify that the selected audio endpoint supports the specified format
- // set during construction.
- // In exclusive mode, the client can choose to open the stream in any audio
- // format that the endpoint device supports. In shared mode, the client must
- // open the stream in the mix format that is currently in use by the audio
- // engine (or a format that is similar to the mix format). The audio engine's
- // input streams and the output mix from the engine are all in this format.
- if (!DesiredFormatIsSupported()) {
- return false;
+ HRESULT hr = S_FALSE;
+ if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
+ // Initialize the audio stream between the client and the device in shared
+ // mode and using event-driven buffer handling.
+ hr = CoreAudioUtil::SharedModeInitialize(
+ audio_client, &format_, audio_samples_render_event_.Get(),
+ &endpoint_buffer_size_frames_);
+ if (FAILED(hr))
+ return false;
+
+ // We know from experience that the best possible callback sequence is
+ // achieved when the endpoint buffer size is an even multiple of the
+ // packet size (which is given by the native device period).
+ // Examples: 48kHz => 960 % 480, 44.1kHz => 896 % 448 or 882 % 441.
+ if (endpoint_buffer_size_frames_ % packet_size_frames_ != 0) {
DaleCurtis 2013/02/02 00:19:51 Might be better to CHECK() this since we know all
henrika (OOO until Aug 14) 2013/02/04 08:25:38 I did consider doing just that but now actually fe
+ DLOG(ERROR) << "Bailing out due to non-perfect timing.";
+ return false;
+ }
+ } else {
+ // TODO(henrika): break out to CoreAudioUtil::ExclusiveModeInitialize()
+ // when removing the enable-exclusive-audio flag.
+ hr = ExclusiveModeInitialization(audio_client,
+ audio_samples_render_event_.Get(),
+ &endpoint_buffer_size_frames_);
+ if (FAILED(hr))
+ return false;
+
+ // The buffer scheme for exclusive mode streams is not designed for max
+ // flexibility. We only allow a "perfect match" between the packet size set
+ // by the user and the actual endpoint buffer size.
+ if (endpoint_buffer_size_frames_ != packet_size_frames_) {
+ DLOG(ERROR) << "Bailing out due to non-perfect timing.";
+ return false;
+ }
}
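Worked numbers for the two timing checks above (illustrative only): in shared mode, the cited configurations pass since 960 % 480, 896 % 448 and 882 % 441 all equal 0, whereas e.g. a 1056-frame endpoint buffer against a 441-frame packet fails (1056 % 441 = 174). In exclusive mode the match must be exact, so a 441-frame packet against a 441-frame endpoint buffer passes and anything else bails out.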
- // Initialize the audio stream between the client and the device using
- // shared or exclusive mode and a lowest possible glitch-free latency.
- // We will enter different code paths depending on the specified share mode.
- hr = InitializeAudioEngine();
- if (FAILED(hr)) {
+ // Create an IAudioRenderClient client for an initialized IAudioClient.
+ // The IAudioRenderClient interface enables us to write output data to
+ // a rendering endpoint buffer.
+ ScopedComPtr<IAudioRenderClient> audio_render_client =
+ CoreAudioUtil::CreateRenderClient(audio_client);
+ if (!audio_render_client)
return false;
- }
+
+ // Store valid COM interfaces.
+ audio_client_ = audio_client;
+ audio_render_client_ = audio_render_client;
opened_ = true;
return true;
}
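For orientation, the typical call sequence against this stream looks as sketched below. All calls must come from the creating thread, |source| is any AudioSourceCallback implementation providing OnMoreData() and OnError(), and error handling is elided:

WASAPIAudioOutputStream* stream =
    new WASAPIAudioOutputStream(manager, params, eConsole);
if (stream->Open()) {
  stream->SetVolume(1.0);
  stream->Start(source);  // OnMoreData() now fires once per render event.
  // ... audio is rendered ...
  stream->Stop();
}
stream->Close();  // Valid even if Open() or Start() was never called.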
void WASAPIAudioOutputStream::Start(AudioSourceCallback* callback) {
+ DVLOG(1) << "WASAPIAudioOutputStream::Start()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
CHECK(callback);
CHECK(opened_);
@@ -302,49 +289,30 @@ void WASAPIAudioOutputStream::Start(AudioSourceCallback* callback) {
return;
}
- if (restart_rendering_mode_) {
- // The selected audio device has been removed or disabled and a new
- // default device has been enabled instead. The current implementation
- // does not support this sequence of events. Given that Open()
- // and Start() are usually called in one sequence, it should be a very
- // rare event.
- // TODO(henrika): it is possible to extend the functionality here.
- LOG(ERROR) << "Unable to start since the selected default device has "
- "changed since Open() was called.";
- return;
- }
-
source_ = callback;
- // Avoid start-up glitches by filling up the endpoint buffer with "silence"
- // before starting the stream.
- BYTE* data_ptr = NULL;
- HRESULT hr = audio_render_client_->GetBuffer(endpoint_buffer_size_frames_,
- &data_ptr);
- if (FAILED(hr)) {
- DLOG(ERROR) << "Failed to use rendering audio buffer: " << std::hex << hr;
- return;
- }
-
- // Using the AUDCLNT_BUFFERFLAGS_SILENT flag eliminates the need to
- // explicitly write silence data to the rendering buffer.
- audio_render_client_->ReleaseBuffer(endpoint_buffer_size_frames_,
- AUDCLNT_BUFFERFLAGS_SILENT);
- num_written_frames_ = endpoint_buffer_size_frames_;
-
- // Sanity check: verify that the endpoint buffer is filled with silence.
- UINT32 num_queued_frames = 0;
- audio_client_->GetCurrentPadding(&num_queued_frames);
- DCHECK(num_queued_frames == num_written_frames_);
-
// Create and start the thread that will drive the rendering by waiting for
// render events.
render_thread_.reset(
new base::DelegateSimpleThread(this, "wasapi_render_thread"));
render_thread_->Start();
+ if (!render_thread_->HasBeenStarted()) {
+ DLOG(ERROR) << "Failed to start WASAPI render thread.";
+ return;
+ }
+
+ // Ensure that the endpoint buffer is prepared with silence.
+ if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
+ if (!CoreAudioUtil::FillRenderEndpointBufferWithSilence(
+ audio_client_, audio_render_client_)) {
+ DLOG(WARNING) << "Failed to prepare endpoint buffers with silence.";
+ return;
+ }
+ }
+ num_written_frames_ = endpoint_buffer_size_frames_;
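CoreAudioUtil::FillRenderEndpointBufferWithSilence() replaces the inlined priming code that this patch removes. Conceptually it performs the equivalent of the sketch below, where audio_client and audio_render_client stand for the two interfaces passed in (based on the removed block; padding handling and error checks elided):

BYTE* data = NULL;
UINT32 size = 0;
audio_client->GetBufferSize(&size);
audio_render_client->GetBuffer(size, &data);
// AUDCLNT_BUFFERFLAGS_SILENT tells the audio engine to treat the buffer as
// silence, so no explicit zero-fill of |data| is required.
audio_render_client->ReleaseBuffer(size, AUDCLNT_BUFFERFLAGS_SILENT);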
// Start streaming data between the endpoint buffer and the audio engine.
- hr = audio_client_->Start();
+ HRESULT hr = audio_client_->Start();
if (FAILED(hr)) {
SetEvent(stop_render_event_.Get());
render_thread_->Join();
@@ -354,6 +322,7 @@ void WASAPIAudioOutputStream::Start(AudioSourceCallback* callback) {
}
void WASAPIAudioOutputStream::Stop() {
+ DVLOG(1) << "WASAPIAudioOutputStream::Stop()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
if (!render_thread_.get())
return;
@@ -396,6 +365,7 @@ void WASAPIAudioOutputStream::Stop() {
}
void WASAPIAudioOutputStream::Close() {
+ DVLOG(1) << "WASAPIAudioOutputStream::Close()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
// It is valid to call Close() before calling Open() or Start().
@@ -421,40 +391,6 @@ void WASAPIAudioOutputStream::GetVolume(double* volume) {
*volume = static_cast<double>(volume_);
}
-// static
-int WASAPIAudioOutputStream::HardwareChannelCount() {
- // Use a WAVEFORMATEXTENSIBLE structure since it can specify both the
- // number of channels and the mapping of channels to speakers for
- // multichannel devices.
- base::win::ScopedCoMem<WAVEFORMATPCMEX> format_ex;
- HRESULT hr = GetMixFormat(
- eConsole, reinterpret_cast<WAVEFORMATEX**>(&format_ex));
- if (FAILED(hr))
- return 0;
-
- // Number of channels in the stream. Corresponds to the number of bits
- // set in the dwChannelMask.
- DVLOG(1) << "endpoint channels (out): " << format_ex->Format.nChannels;
-
- return static_cast<int>(format_ex->Format.nChannels);
-}
-
-// static
-ChannelLayout WASAPIAudioOutputStream::HardwareChannelLayout() {
- return ChannelConfigToChannelLayout(GetChannelConfig());
-}
-
-// static
-int WASAPIAudioOutputStream::HardwareSampleRate(ERole device_role) {
- base::win::ScopedCoMem<WAVEFORMATEX> format;
- HRESULT hr = GetMixFormat(device_role, &format);
- if (FAILED(hr))
- return 0;
-
- DVLOG(2) << "nSamplesPerSec: " << format->nSamplesPerSec;
- return static_cast<int>(format->nSamplesPerSec);
-}
-
void WASAPIAudioOutputStream::Run() {
ScopedCOMInitializer com_init(ScopedCOMInitializer::kMTA);
@@ -514,6 +450,8 @@ void WASAPIAudioOutputStream::Run() {
break;
case WAIT_OBJECT_0 + 1:
{
+ TRACE_EVENT0("audio", "WASAPIAudioOutputStream::Run");
+
// |audio_samples_render_event_| has been set.
UINT32 num_queued_frames = 0;
uint8* audio_data = NULL;
@@ -541,97 +479,100 @@ void WASAPIAudioOutputStream::Run() {
// directly on the buffer size.
num_available_frames = endpoint_buffer_size_frames_;
}
+ if (FAILED(hr)) {
+ DLOG(ERROR) << "Failed to retrieve amount of available space: "
+ << std::hex << hr;
+ continue;
+ }
- // Check if there is enough available space to fit the packet size
- // specified by the client.
- if (FAILED(hr) || (num_available_frames < packet_size_frames_))
+ // It is my current assumption that we will always end up with a
+ // perfect match here where the packet size is identical to what
+ // the audio engine needs (num_available_frames). A DLOG(WARNING)
+ // is emitted, and the render pass is skipped, to be able to track
+ // down any deviations from this theory.
+ if ((num_available_frames > 0) &&
+ (num_available_frames != packet_size_frames_)) {
+ DLOG(WARNING) << "Non-perfect timing case detected.";
continue;
+ }
- // Derive the number of packets we need get from the client to
- // fill up the available area in the endpoint buffer.
- // |num_packets| will always be one for exclusive-mode streams.
- size_t num_packets = (num_available_frames / packet_size_frames_);
-
- // Get data from the client/source.
- for (size_t n = 0; n < num_packets; ++n) {
- // Grab all available space in the rendering endpoint buffer
- // into which the client can write a data packet.
- hr = audio_render_client_->GetBuffer(packet_size_frames_,
- &audio_data);
- if (FAILED(hr)) {
- DLOG(ERROR) << "Failed to use rendering audio buffer: "
- << std::hex << hr;
- continue;
- }
-
- // Derive the audio delay which corresponds to the delay between
- // a render event and the time when the first audio sample in a
- // packet is played out through the speaker. This delay value
- // can typically be utilized by an acoustic echo-control (AEC)
- // unit at the render side.
- UINT64 position = 0;
- int audio_delay_bytes = 0;
- hr = audio_clock->GetPosition(&position, NULL);
- if (SUCCEEDED(hr)) {
- // Stream position of the sample that is currently playing
- // through the speaker.
- double pos_sample_playing_frames = format_.Format.nSamplesPerSec *
- (static_cast<double>(position) / device_frequency);
-
- // Stream position of the last sample written to the endpoint
- // buffer. Note that, the packet we are about to receive in
- // the upcoming callback is also included.
- size_t pos_last_sample_written_frames =
- num_written_frames_ + packet_size_frames_;
-
- // Derive the actual delay value which will be fed to the
- // render client using the OnMoreData() callback.
- audio_delay_bytes = (pos_last_sample_written_frames -
- pos_sample_playing_frames) * frame_size_;
- }
-
- // Read a data packet from the registered client source and
- // deliver a delay estimate in the same callback to the client.
- // A time stamp is also stored in the AudioBuffersState. This
- // time stamp can be used at the client side to compensate for
- // the delay between the usage of the delay value and the time
- // of generation.
-
- uint32 num_filled_bytes = 0;
- const int bytes_per_sample = format_.Format.wBitsPerSample >> 3;
-
- int frames_filled = source_->OnMoreData(
- audio_bus_.get(), AudioBuffersState(0, audio_delay_bytes));
- num_filled_bytes = frames_filled * frame_size_;
- DCHECK_LE(num_filled_bytes, packet_size_bytes_);
- // Note: If this ever changes to output raw float the data must be
- // clipped and sanitized since it may come from an untrusted
- // source such as NaCl.
- audio_bus_->ToInterleaved(
- frames_filled, bytes_per_sample, audio_data);
-
- // Perform in-place, software-volume adjustments.
- media::AdjustVolume(audio_data,
- num_filled_bytes,
- audio_bus_->channels(),
- bytes_per_sample,
- volume_);
-
- // Zero out the part of the packet which has not been filled by
- // the client. Using silence is the least bad option in this
- // situation.
- if (num_filled_bytes < packet_size_bytes_) {
- memset(&audio_data[num_filled_bytes], 0,
- (packet_size_bytes_ - num_filled_bytes));
- }
-
- // Release the buffer space acquired in the GetBuffer() call.
- DWORD flags = 0;
- audio_render_client_->ReleaseBuffer(packet_size_frames_,
- flags);
-
- num_written_frames_ += packet_size_frames_;
+ // Grab all available space in the rendering endpoint buffer
+ // into which the client can write a data packet.
+ hr = audio_render_client_->GetBuffer(packet_size_frames_,
+ &audio_data);
+ if (FAILED(hr)) {
+ DLOG(ERROR) << "Failed to use rendering audio buffer: "
+ << std::hex << hr;
+ continue;
}
DaleCurtis 2013/02/02 00:19:51 CHECK? I doubt you'll ever see this DLOG if it's n
henrika (OOO until Aug 14) 2013/02/04 08:25:38 See comment above.
+
+ // Derive the audio delay which corresponds to the delay between
+ // a render event and the time when the first audio sample in a
+ // packet is played out through the speaker. This delay value
+ // can typically be utilized by an acoustic echo-control (AEC)
+ // unit at the render side.
+ UINT64 position = 0;
+ int audio_delay_bytes = 0;
+ hr = audio_clock->GetPosition(&position, NULL);
+ if (SUCCEEDED(hr)) {
+ // Stream position of the sample that is currently playing
+ // through the speaker.
+ double pos_sample_playing_frames = format_.Format.nSamplesPerSec *
+ (static_cast<double>(position) / device_frequency);
+
+ // Stream position of the last sample written to the endpoint
+ // buffer. Note that, the packet we are about to receive in
+ // the upcoming callback is also included.
+ size_t pos_last_sample_written_frames =
+ num_written_frames_ + packet_size_frames_;
+
+ // Derive the actual delay value which will be fed to the
+ // render client using the OnMoreData() callback.
+ audio_delay_bytes = (pos_last_sample_written_frames -
+ pos_sample_playing_frames) * format_.Format.nBlockAlign;
+ }
+
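A worked example of the delay derivation above (illustrative numbers only): at 48 kHz with 480-frame packets and a 4-byte block alignment, if the device clock reports that frame 9600 is currently playing while 10560 frames have been written so far, the packet produced in this callback begins (10560 + 480) - 9600 = 1440 frames behind the speaker position, i.e. 1440 * 4 = 5760 bytes or 30 ms.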
+ // Read a data packet from the registered client source and
+ // deliver a delay estimate in the same callback to the client.
+ // A time stamp is also stored in the AudioBuffersState. This
+ // time stamp can be used at the client side to compensate for
+ // the delay between the usage of the delay value and the time
+ // of generation.
+
+ uint32 num_filled_bytes = 0;
+ const int bytes_per_sample = format_.Format.wBitsPerSample >> 3;
+
+ int frames_filled = source_->OnMoreData(
+ audio_bus_.get(), AudioBuffersState(0, audio_delay_bytes));
+ num_filled_bytes = frames_filled * format_.Format.nBlockAlign;
+ DCHECK_LE(num_filled_bytes, packet_size_bytes_);
+
+ // Note: If this ever changes to output raw float the data must be
+ // clipped and sanitized since it may come from an untrusted
+ // source such as NaCl.
+ audio_bus_->ToInterleaved(
+ frames_filled, bytes_per_sample, audio_data);
+
+ // Perform in-place, software-volume adjustments.
+ media::AdjustVolume(audio_data,
+ num_filled_bytes,
+ audio_bus_->channels(),
+ bytes_per_sample,
+ volume_);
+
+ // Zero out the part of the packet which has not been filled by
+ // the client. Using silence is the least bad option in this
+ // situation.
+ if (num_filled_bytes < packet_size_bytes_) {
+ memset(&audio_data[num_filled_bytes], 0,
+ (packet_size_bytes_ - num_filled_bytes));
+ }
+
+ // Release the buffer space acquired in the GetBuffer() call.
+ DWORD flags = 0;
+ audio_render_client_->ReleaseBuffer(packet_size_frames_,
+ flags);
+
+ num_written_frames_ += packet_size_frames_;
}
break;
default:
@@ -662,224 +603,21 @@ void WASAPIAudioOutputStream::HandleError(HRESULT err) {
source_->OnError(this, static_cast<int>(err));
}
-HRESULT WASAPIAudioOutputStream::SetRenderDevice() {
- ScopedComPtr<IMMDeviceEnumerator> device_enumerator;
- ScopedComPtr<IMMDevice> endpoint_device;
-
- // Create the IMMDeviceEnumerator interface.
- HRESULT hr = CoCreateInstance(__uuidof(MMDeviceEnumerator),
- NULL,
- CLSCTX_INPROC_SERVER,
- __uuidof(IMMDeviceEnumerator),
- device_enumerator.ReceiveVoid());
- if (SUCCEEDED(hr)) {
- // Retrieve the default render audio endpoint for the specified role.
- // Note that, in Windows Vista, the MMDevice API supports device roles
- // but the system-supplied user interface programs do not.
- hr = device_enumerator->GetDefaultAudioEndpoint(
- eRender, device_role_, endpoint_device.Receive());
- if (FAILED(hr))
- return hr;
-
- // Verify that the audio endpoint device is active. That is, the audio
- // adapter that connects to the endpoint device is present and enabled.
- DWORD state = DEVICE_STATE_DISABLED;
- hr = endpoint_device->GetState(&state);
- if (SUCCEEDED(hr)) {
- if (!(state & DEVICE_STATE_ACTIVE)) {
- DLOG(ERROR) << "Selected render device is not active.";
- hr = E_ACCESSDENIED;
- }
- }
- }
-
- if (SUCCEEDED(hr)) {
- device_enumerator_ = device_enumerator;
- endpoint_device_ = endpoint_device;
- }
-
- return hr;
-}
-
-HRESULT WASAPIAudioOutputStream::ActivateRenderDevice() {
- ScopedComPtr<IAudioClient> audio_client;
-
- // Creates and activates an IAudioClient COM object given the selected
- // render endpoint device.
- HRESULT hr = endpoint_device_->Activate(__uuidof(IAudioClient),
- CLSCTX_INPROC_SERVER,
- NULL,
- audio_client.ReceiveVoid());
- if (SUCCEEDED(hr)) {
- // Retrieve the stream format that the audio engine uses for its internal
- // processing/mixing of shared-mode streams.
- audio_engine_mix_format_.Reset(NULL);
- hr = audio_client->GetMixFormat(
- reinterpret_cast<WAVEFORMATEX**>(&audio_engine_mix_format_));
-
- if (SUCCEEDED(hr)) {
- audio_client_ = audio_client;
- }
- }
-
- return hr;
-}
-
-bool WASAPIAudioOutputStream::DesiredFormatIsSupported() {
- // Determine, before calling IAudioClient::Initialize(), whether the audio
- // engine supports a particular stream format.
- // In shared mode, the audio engine always supports the mix format,
- // which is stored in the |audio_engine_mix_format_| member and it is also
- // possible to receive a proposed (closest) format if the current format is
- // not supported.
- base::win::ScopedCoMem<WAVEFORMATEXTENSIBLE> closest_match;
- HRESULT hr = audio_client_->IsFormatSupported(
- share_mode_, reinterpret_cast<WAVEFORMATEX*>(&format_),
- reinterpret_cast<WAVEFORMATEX**>(&closest_match));
-
- // This log can only be triggered for shared mode.
- DLOG_IF(ERROR, hr == S_FALSE) << "Format is not supported "
- << "but a closest match exists.";
- // This log can be triggered both for shared and exclusive modes.
- DLOG_IF(ERROR, hr == AUDCLNT_E_UNSUPPORTED_FORMAT) << "Unsupported format.";
- if (hr == S_FALSE) {
- DVLOG(1) << "wFormatTag : " << closest_match->Format.wFormatTag;
- DVLOG(1) << "nChannels : " << closest_match->Format.nChannels;
- DVLOG(1) << "nSamplesPerSec: " << closest_match->Format.nSamplesPerSec;
- DVLOG(1) << "wBitsPerSample: " << closest_match->Format.wBitsPerSample;
- }
-
- return (hr == S_OK);
-}
-
-HRESULT WASAPIAudioOutputStream::InitializeAudioEngine() {
-#if !defined(NDEBUG)
- // The period between processing passes by the audio engine is fixed for a
- // particular audio endpoint device and represents the smallest processing
- // quantum for the audio engine. This period plus the stream latency between
- // the buffer and endpoint device represents the minimum possible latency
- // that an audio application can achieve in shared mode.
- {
- REFERENCE_TIME default_device_period = 0;
- REFERENCE_TIME minimum_device_period = 0;
- HRESULT hr_dbg = audio_client_->GetDevicePeriod(&default_device_period,
- &minimum_device_period);
- if (SUCCEEDED(hr_dbg)) {
- // Shared mode device period.
- DVLOG(1) << "shared mode (default) device period: "
- << static_cast<double>(default_device_period / 10000.0)
- << " [ms]";
- // Exclusive mode device period.
- DVLOG(1) << "exclusive mode (minimum) device period: "
- << static_cast<double>(minimum_device_period / 10000.0)
- << " [ms]";
- }
-
- REFERENCE_TIME latency = 0;
- hr_dbg = audio_client_->GetStreamLatency(&latency);
- if (SUCCEEDED(hr_dbg)) {
- DVLOG(1) << "stream latency: " << static_cast<double>(latency / 10000.0)
- << " [ms]";
- }
- }
-#endif
-
- HRESULT hr = S_FALSE;
-
- // Perform different initialization depending on if the device shall be
- // opened in shared mode or in exclusive mode.
- hr = (share_mode_ == AUDCLNT_SHAREMODE_SHARED) ?
- SharedModeInitialization() : ExclusiveModeInitialization();
- if (FAILED(hr)) {
- LOG(WARNING) << "IAudioClient::Initialize() failed: " << std::hex << hr;
- return hr;
- }
-
- // Retrieve the length of the endpoint buffer. The buffer length represents
- // the maximum amount of rendering data that the client can write to
- // the endpoint buffer during a single processing pass.
- // A typical value is 960 audio frames <=> 20ms @ 48kHz sample rate.
- hr = audio_client_->GetBufferSize(&endpoint_buffer_size_frames_);
- if (FAILED(hr))
- return hr;
- DVLOG(1) << "endpoint buffer size: " << endpoint_buffer_size_frames_
- << " [frames]";
-
- // The buffer scheme for exclusive mode streams is not designed for max
- // flexibility. We only allow a "perfect match" between the packet size set
- // by the user and the actual endpoint buffer size.
- if (share_mode_ == AUDCLNT_SHAREMODE_EXCLUSIVE &&
- endpoint_buffer_size_frames_ != packet_size_frames_) {
- hr = AUDCLNT_E_INVALID_SIZE;
- DLOG(ERROR) << "AUDCLNT_E_INVALID_SIZE";
- return hr;
- }
-
- // Set the event handle that the audio engine will signal each time
- // a buffer becomes ready to be processed by the client.
- hr = audio_client_->SetEventHandle(audio_samples_render_event_.Get());
- if (FAILED(hr))
- return hr;
-
- // Get access to the IAudioRenderClient interface. This interface
- // enables us to write output data to a rendering endpoint buffer.
- // The methods in this interface manage the movement of data packets
- // that contain audio-rendering data.
- hr = audio_client_->GetService(__uuidof(IAudioRenderClient),
- audio_render_client_.ReceiveVoid());
- return hr;
-}
-
-HRESULT WASAPIAudioOutputStream::SharedModeInitialization() {
- DCHECK_EQ(share_mode_, AUDCLNT_SHAREMODE_SHARED);
-
- // TODO(henrika): this buffer scheme is still under development.
- // The exact details are yet to be determined based on tests with different
- // audio clients.
- int glitch_free_buffer_size_ms = static_cast<int>(packet_size_ms_ + 0.5);
- if (audio_engine_mix_format_->Format.nSamplesPerSec % 8000 == 0) {
- // Initial tests have shown that we have to add 10 ms extra to
- // ensure that we don't run empty for any packet size.
- glitch_free_buffer_size_ms += 10;
- } else if (audio_engine_mix_format_->Format.nSamplesPerSec % 11025 == 0) {
- // Initial tests have shown that we have to add 20 ms extra to
- // ensure that we don't run empty for any packet size.
- glitch_free_buffer_size_ms += 20;
- } else {
- DLOG(WARNING) << "Unsupported sample rate "
- << audio_engine_mix_format_->Format.nSamplesPerSec << " detected";
- glitch_free_buffer_size_ms += 20;
- }
- DVLOG(1) << "glitch_free_buffer_size_ms: " << glitch_free_buffer_size_ms;
- REFERENCE_TIME requested_buffer_duration =
- static_cast<REFERENCE_TIME>(glitch_free_buffer_size_ms * 10000);
-
- // Initialize the audio stream between the client and the device.
- // We connect indirectly through the audio engine by using shared mode
- // and WASAPI is initialized in an event driven mode.
- // Note that this API ensures that the buffer is never smaller than the
- // minimum buffer size needed to ensure glitch-free rendering.
- // If we request a buffer size that is smaller than the audio engine's
- // minimum required buffer size, the method sets the buffer size to this
- // minimum buffer size rather than to the buffer size requested.
- HRESULT hr = S_FALSE;
- hr = audio_client_->Initialize(AUDCLNT_SHAREMODE_SHARED,
- AUDCLNT_STREAMFLAGS_EVENTCALLBACK |
- AUDCLNT_STREAMFLAGS_NOPERSIST,
- requested_buffer_duration,
- 0,
- reinterpret_cast<WAVEFORMATEX*>(&format_),
- NULL);
- return hr;
-}
-
-HRESULT WASAPIAudioOutputStream::ExclusiveModeInitialization() {
+HRESULT WASAPIAudioOutputStream::ExclusiveModeInitialization(
+ IAudioClient* client, HANDLE event_handle, size_t* endpoint_buffer_size) {
DCHECK_EQ(share_mode_, AUDCLNT_SHAREMODE_EXCLUSIVE);
float f = (1000.0 * packet_size_frames_) / format_.Format.nSamplesPerSec;
REFERENCE_TIME requested_buffer_duration =
static_cast<REFERENCE_TIME>(f * 10000.0 + 0.5);
+ DWORD stream_flags = AUDCLNT_STREAMFLAGS_NOPERSIST;
+ bool use_event = (event_handle != NULL &&
+ event_handle != INVALID_HANDLE_VALUE);
+ if (use_event)
+ stream_flags |= AUDCLNT_STREAMFLAGS_EVENTCALLBACK;
+ DVLOG(2) << "stream_flags: 0x" << std::hex << stream_flags;
+
// Initialize the audio stream between the client and the device.
// For an exclusive-mode stream that uses event-driven buffering, the
// caller must specify nonzero values for hnsPeriodicity and
@@ -889,21 +627,19 @@ HRESULT WASAPIAudioOutputStream::ExclusiveModeInitialization() {
// Following the Initialize call for a rendering stream, the caller should
// fill the first of the two buffers before starting the stream.
HRESULT hr = S_FALSE;
- hr = audio_client_->Initialize(AUDCLNT_SHAREMODE_EXCLUSIVE,
- AUDCLNT_STREAMFLAGS_EVENTCALLBACK |
- AUDCLNT_STREAMFLAGS_NOPERSIST,
- requested_buffer_duration,
- requested_buffer_duration,
- reinterpret_cast<WAVEFORMATEX*>(&format_),
- NULL);
+ hr = client->Initialize(AUDCLNT_SHAREMODE_EXCLUSIVE,
+ stream_flags,
+ requested_buffer_duration,
+ requested_buffer_duration,
+ reinterpret_cast<WAVEFORMATEX*>(&format_),
+ NULL);
if (FAILED(hr)) {
if (hr == AUDCLNT_E_BUFFER_SIZE_NOT_ALIGNED) {
LOG(ERROR) << "AUDCLNT_E_BUFFER_SIZE_NOT_ALIGNED";
UINT32 aligned_buffer_size = 0;
- audio_client_->GetBufferSize(&aligned_buffer_size);
+ client->GetBufferSize(&aligned_buffer_size);
DVLOG(1) << "Use aligned buffer size instead: " << aligned_buffer_size;
- audio_client_.Release();
// Calculate new aligned periodicity. Each unit of reference time
// is 100 nanoseconds.
@@ -923,34 +659,27 @@ HRESULT WASAPIAudioOutputStream::ExclusiveModeInitialization() {
// the minimum supported size (usually ~3ms on Windows 7).
LOG(ERROR) << "AUDCLNT_E_INVALID_DEVICE_PERIOD";
}
+ return hr;
}
- return hr;
-}
-
-std::string WASAPIAudioOutputStream::GetDeviceName(LPCWSTR device_id) const {
- std::string name;
- ScopedComPtr<IMMDevice> audio_device;
-
- // Get the IMMDevice interface corresponding to the given endpoint ID string.
- HRESULT hr = device_enumerator_->GetDevice(device_id, audio_device.Receive());
- if (SUCCEEDED(hr)) {
- // Retrieve user-friendly name of endpoint device.
- // Example: "Speakers (Realtek High Definition Audio)".
- ScopedComPtr<IPropertyStore> properties;
- hr = audio_device->OpenPropertyStore(STGM_READ, properties.Receive());
- if (SUCCEEDED(hr)) {
- PROPVARIANT friendly_name;
- PropVariantInit(&friendly_name);
- hr = properties->GetValue(PKEY_Device_FriendlyName, &friendly_name);
- if (SUCCEEDED(hr) && friendly_name.vt == VT_LPWSTR) {
- if (friendly_name.pwszVal)
- name = WideToUTF8(friendly_name.pwszVal);
- }
- PropVariantClear(&friendly_name);
+ if (use_event) {
+ hr = client->SetEventHandle(event_handle);
+ if (FAILED(hr)) {
+ DVLOG(1) << "IAudioClient::SetEventHandle: " << std::hex << hr;
+ return hr;
}
}
- return name;
+
+ UINT32 buffer_size_in_frames = 0;
+ hr = client->GetBufferSize(&buffer_size_in_frames);
+ if (FAILED(hr)) {
+ DVLOG(1) << "IAudioClient::GetBufferSize: " << std::hex << hr;
+ return hr;
+ }
+
+ *endpoint_buffer_size = static_cast<size_t>(buffer_size_in_frames);
+ DVLOG(2) << "endpoint buffer size: " << buffer_size_in_frames;
+ return hr;
}
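Since one REFERENCE_TIME unit equals 100 nanoseconds, the duration requested at the top of this function works out as follows for a typical exclusive-mode setup (illustrative numbers only): 441 frames at 44.1 kHz gives f = (1000.0 * 441) / 44100 = 10.0 ms, and the requested buffer duration becomes 10.0 * 10000 + 0.5, truncated to 100000 units of 100 ns, i.e. exactly 10 ms.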
} // namespace media
