// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "media/audio/win/audio_low_latency_output_win.h"

#include <Functiondiscoverykeys_devpkey.h>

#include "base/command_line.h"
#include "base/logging.h"
#include "base/memory/scoped_ptr.h"
#include "base/metrics/histogram.h"
#include "base/utf_string_conversions.h"
#include "media/audio/audio_util.h"
#include "media/audio/win/audio_manager_win.h"
#include "media/audio/win/avrt_wrapper_win.h"
#include "media/base/limits.h"
#include "media/base/media_switches.h"
using base::win::ScopedComPtr;
using base::win::ScopedCOMInitializer;
using base::win::ScopedCoMem;
namespace media {
typedef uint32 ChannelConfig;
// Retrieves the stream format that the audio engine uses for its internal
// processing/mixing of shared-mode streams.
static HRESULT GetMixFormat(ERole device_role, WAVEFORMATEX** device_format) {
// Note that we are using the IAudioClient::GetMixFormat() API to get the
// device format in this function. It is in fact possible to be "more native",
// and ask the endpoint device directly for its properties. Given a reference
// to the IMMDevice interface of an endpoint object, a client can obtain a
// reference to the endpoint object's property store by calling the
// IMMDevice::OpenPropertyStore() method. However, I have not been able to
// access any valuable information using this method on my HP Z600 desktop,
// hence it feels more appropriate to use the IAudioClient::GetMixFormat()
// approach instead.
  // Calling this function only makes sense for shared-mode streams, since
  // if the device is opened in exclusive mode, the application-specified
  // format is used instead. However, the result of this method can be
  // useful for testing purposes so we don't DCHECK here.
DLOG_IF(WARNING, WASAPIAudioOutputStream::GetShareMode() ==
AUDCLNT_SHAREMODE_EXCLUSIVE) <<
"The mixing sample rate will be ignored for exclusive-mode streams.";
// It is assumed that this static method is called from a COM thread, i.e.,
// CoInitializeEx() is not called here again to avoid STA/MTA conflicts.
ScopedComPtr<IMMDeviceEnumerator> enumerator;
HRESULT hr = CoCreateInstance(__uuidof(MMDeviceEnumerator),
NULL,
CLSCTX_INPROC_SERVER,
__uuidof(IMMDeviceEnumerator),
enumerator.ReceiveVoid());
if (FAILED(hr))
return hr;
ScopedComPtr<IMMDevice> endpoint_device;
hr = enumerator->GetDefaultAudioEndpoint(eRender,
device_role,
endpoint_device.Receive());
if (FAILED(hr))
return hr;
ScopedComPtr<IAudioClient> audio_client;
hr = endpoint_device->Activate(__uuidof(IAudioClient),
CLSCTX_INPROC_SERVER,
NULL,
audio_client.ReceiveVoid());
return SUCCEEDED(hr) ? audio_client->GetMixFormat(device_format) : hr;
}
// Retrieves an integer mask which corresponds to the channel layout the
// audio engine uses for its internal processing/mixing of shared-mode
// streams. This mask indicates which channels are present in the multi-
// channel stream. The least significant bit corresponds to the front left
// speaker, the next least significant bit corresponds to the front right
// speaker, and so on, continuing in the order defined in ksmedia.h.
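// For example, KSAUDIO_SPEAKER_STEREO equals
// SPEAKER_FRONT_LEFT | SPEAKER_FRONT_RIGHT, i.e. 0x1 | 0x2 = 0x3.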
// See http://msdn.microsoft.com/en-us/library/windows/hardware/ff537083(v=vs.85).aspx
// for more details.
static ChannelConfig GetChannelConfig() {
// Use a WAVEFORMATEXTENSIBLE structure since it can specify both the
// number of channels and the mapping of channels to speakers for
// multichannel devices.
base::win::ScopedCoMem<WAVEFORMATPCMEX> format_ex;
HRESULT hr = S_FALSE;
hr = GetMixFormat(eConsole, reinterpret_cast<WAVEFORMATEX**>(&format_ex));
if (FAILED(hr))
return 0;
// The dwChannelMask member specifies which channels are present in the
// multichannel stream. The least significant bit corresponds to the
// front left speaker, the next least significant bit corresponds to the
// front right speaker, and so on.
// See http://msdn.microsoft.com/en-us/library/windows/desktop/dd757714(v=vs.85).aspx
// for more details on the channel mapping.
DVLOG(2) << "dwChannelMask: 0x" << std::hex << format_ex->dwChannelMask;
#if !defined(NDEBUG)
// See http://en.wikipedia.org/wiki/Surround_sound for more details on
// how to name various speaker configurations. The list below is not complete.
const char* speaker_config = "Undefined";
switch (format_ex->dwChannelMask) {
case KSAUDIO_SPEAKER_MONO:
speaker_config = "Mono";
break;
case KSAUDIO_SPEAKER_STEREO:
speaker_config = "Stereo";
break;
case KSAUDIO_SPEAKER_5POINT1_SURROUND:
speaker_config = "5.1 surround";
break;
case KSAUDIO_SPEAKER_5POINT1:
speaker_config = "5.1";
break;
case KSAUDIO_SPEAKER_7POINT1_SURROUND:
speaker_config = "7.1 surround";
break;
case KSAUDIO_SPEAKER_7POINT1:
speaker_config = "7.1";
break;
default:
break;
}
DVLOG(2) << "speaker configuration: " << speaker_config;
#endif
return static_cast<ChannelConfig>(format_ex->dwChannelMask);
}
// Converts Microsoft's channel configuration to ChannelLayout.
// This mapping is not perfect but the best we can do given the current
// ChannelLayout enumerator and the Windows-specific speaker configurations
// defined in ksmedia.h. Don't assume that the channel ordering in
// ChannelLayout is exactly the same as the Windows-specific configuration.
// As an example: KSAUDIO_SPEAKER_7POINT1_SURROUND is mapped to
// CHANNEL_LAYOUT_7_1 but the positions of Back L, Back R and Side L, Side R
// speakers are different in these two definitions.
static ChannelLayout ChannelConfigToChannelLayout(ChannelConfig config) {
switch (config) {
case KSAUDIO_SPEAKER_DIRECTOUT:
return CHANNEL_LAYOUT_NONE;
case KSAUDIO_SPEAKER_MONO:
return CHANNEL_LAYOUT_MONO;
case KSAUDIO_SPEAKER_STEREO:
return CHANNEL_LAYOUT_STEREO;
case KSAUDIO_SPEAKER_QUAD:
return CHANNEL_LAYOUT_QUAD;
case KSAUDIO_SPEAKER_SURROUND:
return CHANNEL_LAYOUT_4_0;
case KSAUDIO_SPEAKER_5POINT1:
return CHANNEL_LAYOUT_5_1_BACK;
case KSAUDIO_SPEAKER_5POINT1_SURROUND:
return CHANNEL_LAYOUT_5_1;
case KSAUDIO_SPEAKER_7POINT1:
return CHANNEL_LAYOUT_7_1_WIDE;
case KSAUDIO_SPEAKER_7POINT1_SURROUND:
return CHANNEL_LAYOUT_7_1;
default:
DVLOG(1) << "Unsupported channel layout: " << config;
return CHANNEL_LAYOUT_UNSUPPORTED;
}
}
// static
AUDCLNT_SHAREMODE WASAPIAudioOutputStream::GetShareMode() {
const CommandLine* cmd_line = CommandLine::ForCurrentProcess();
if (cmd_line->HasSwitch(switches::kEnableExclusiveAudio))
return AUDCLNT_SHAREMODE_EXCLUSIVE;
return AUDCLNT_SHAREMODE_SHARED;
}
WASAPIAudioOutputStream::WASAPIAudioOutputStream(AudioManagerWin* manager,
const AudioParameters& params,
ERole device_role)
: creating_thread_id_(base::PlatformThread::CurrentId()),
manager_(manager),
opened_(false),
restart_rendering_mode_(false),
volume_(1.0),
endpoint_buffer_size_frames_(0),
device_role_(device_role),
share_mode_(GetShareMode()),
client_channel_count_(params.channels()),
num_written_frames_(0),
source_(NULL),
audio_bus_(AudioBus::Create(params)) {
DCHECK(manager_);
// Load the Avrt DLL if not already loaded. Required to support MMCSS.
bool avrt_init = avrt::Initialize();
DCHECK(avrt_init) << "Failed to load the avrt.dll";
if (share_mode_ == AUDCLNT_SHAREMODE_EXCLUSIVE) {
VLOG(1) << ">> Note that EXCLUSIVE MODE is enabled <<";
}
// Set up the desired render format specified by the client. We use the
// WAVE_FORMAT_EXTENSIBLE structure to ensure that multiple channel ordering
// and high precision data can be supported.
// Begin with the WAVEFORMATEX structure that specifies the basic format.
WAVEFORMATEX* format = &format_.Format;
format->wFormatTag = WAVE_FORMAT_EXTENSIBLE;
format->nChannels = client_channel_count_;
format->nSamplesPerSec = params.sample_rate();
format->wBitsPerSample = params.bits_per_sample();
format->nBlockAlign = (format->wBitsPerSample / 8) * format->nChannels;
format->nAvgBytesPerSec = format->nSamplesPerSec * format->nBlockAlign;
format->cbSize = sizeof(WAVEFORMATEXTENSIBLE) - sizeof(WAVEFORMATEX);
// Add the parts which are unique to WAVE_FORMAT_EXTENSIBLE.
format_.Samples.wValidBitsPerSample = params.bits_per_sample();
format_.dwChannelMask = GetChannelConfig();
format_.SubFormat = KSDATAFORMAT_SUBTYPE_PCM;
// Size in bytes of each audio frame.
frame_size_ = format->nBlockAlign;
  // Store size (in different units) of the audio packets which we expect to
  // deliver to the audio endpoint device in each render event.
packet_size_frames_ = params.GetBytesPerBuffer() / format->nBlockAlign;
packet_size_bytes_ = params.GetBytesPerBuffer();
packet_size_ms_ = (1000.0 * packet_size_frames_) / params.sample_rate();
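  // Example, assuming a 48 kHz, 16-bit stereo stream with 480-frame buffers:
  // frame_size_ = 4 bytes, packet_size_frames_ = 480,
  // packet_size_bytes_ = 1920 and packet_size_ms_ = 10.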
DVLOG(1) << "Number of bytes per audio frame : " << frame_size_;
DVLOG(1) << "Number of audio frames per packet: " << packet_size_frames_;
DVLOG(1) << "Number of bytes per packet : " << packet_size_bytes_;
DVLOG(1) << "Number of milliseconds per packet: " << packet_size_ms_;
// All events are auto-reset events and non-signaled initially.
// Create the event which the audio engine will signal each time
// a buffer becomes ready to be processed by the client.
audio_samples_render_event_.Set(CreateEvent(NULL, FALSE, FALSE, NULL));
DCHECK(audio_samples_render_event_.IsValid());
  // Create the event which will be set in Stop() when rendering shall stop.
stop_render_event_.Set(CreateEvent(NULL, FALSE, FALSE, NULL));
DCHECK(stop_render_event_.IsValid());
}
WASAPIAudioOutputStream::~WASAPIAudioOutputStream() {}
bool WASAPIAudioOutputStream::Open() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
if (opened_)
return true;
  // Channel mixing is not supported; it must be handled by ChannelMixer.
if (format_.Format.nChannels != client_channel_count_) {
LOG(ERROR) << "Channel down-mixing is not supported.";
return false;
}
// Create an IMMDeviceEnumerator interface and obtain a reference to
// the IMMDevice interface of the default rendering device with the
// specified role.
HRESULT hr = SetRenderDevice();
if (FAILED(hr)) {
return false;
}
// Obtain an IAudioClient interface which enables us to create and initialize
// an audio stream between an audio application and the audio engine.
hr = ActivateRenderDevice();
if (FAILED(hr)) {
return false;
}
// Verify that the selected audio endpoint supports the specified format
// set during construction.
// In exclusive mode, the client can choose to open the stream in any audio
// format that the endpoint device supports. In shared mode, the client must
// open the stream in the mix format that is currently in use by the audio
// engine (or a format that is similar to the mix format). The audio engine's
// input streams and the output mix from the engine are all in this format.
if (!DesiredFormatIsSupported()) {
return false;
}
// Initialize the audio stream between the client and the device using
  // shared or exclusive mode and the lowest possible glitch-free latency.
// We will enter different code paths depending on the specified share mode.
hr = InitializeAudioEngine();
if (FAILED(hr)) {
return false;
}
opened_ = true;
return true;
}
void WASAPIAudioOutputStream::Start(AudioSourceCallback* callback) {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
CHECK(callback);
CHECK(opened_);
if (render_thread_.get()) {
CHECK_EQ(callback, source_);
return;
}
if (restart_rendering_mode_) {
    // The selected audio device has been removed or disabled and a new
    // default device has been enabled instead. The current implementation
    // does not support this sequence of events. Given that Open() and
    // Start() are usually called in one sequence, it should be a very
    // rare event.
// TODO(henrika): it is possible to extend the functionality here.
LOG(ERROR) << "Unable to start since the selected default device has "
"changed since Open() was called.";
return;
}
source_ = callback;
// Avoid start-up glitches by filling up the endpoint buffer with "silence"
// before starting the stream.
BYTE* data_ptr = NULL;
HRESULT hr = audio_render_client_->GetBuffer(endpoint_buffer_size_frames_,
&data_ptr);
if (FAILED(hr)) {
DLOG(ERROR) << "Failed to use rendering audio buffer: " << std::hex << hr;
return;
}
// Using the AUDCLNT_BUFFERFLAGS_SILENT flag eliminates the need to
// explicitly write silence data to the rendering buffer.
audio_render_client_->ReleaseBuffer(endpoint_buffer_size_frames_,
AUDCLNT_BUFFERFLAGS_SILENT);
num_written_frames_ = endpoint_buffer_size_frames_;
// Sanity check: verify that the endpoint buffer is filled with silence.
UINT32 num_queued_frames = 0;
audio_client_->GetCurrentPadding(&num_queued_frames);
DCHECK(num_queued_frames == num_written_frames_);
// Create and start the thread that will drive the rendering by waiting for
// render events.
render_thread_.reset(
new base::DelegateSimpleThread(this, "wasapi_render_thread"));
render_thread_->Start();
// Start streaming data between the endpoint buffer and the audio engine.
hr = audio_client_->Start();
if (FAILED(hr)) {
SetEvent(stop_render_event_.Get());
render_thread_->Join();
render_thread_.reset();
HandleError(hr);
}
}
void WASAPIAudioOutputStream::Stop() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
if (!render_thread_.get())
return;
// Stop output audio streaming.
HRESULT hr = audio_client_->Stop();
if (FAILED(hr)) {
DLOG_IF(ERROR, hr != AUDCLNT_E_NOT_INITIALIZED)
<< "Failed to stop output streaming: " << std::hex << hr;
}
// Wait until the thread completes and perform cleanup.
SetEvent(stop_render_event_.Get());
render_thread_->Join();
render_thread_.reset();
// Ensure that we don't quit the main thread loop immediately next
// time Start() is called.
ResetEvent(stop_render_event_.Get());
// Clear source callback, it'll be set again on the next Start() call.
source_ = NULL;
// Flush all pending data and reset the audio clock stream position to 0.
hr = audio_client_->Reset();
if (FAILED(hr)) {
DLOG_IF(ERROR, hr != AUDCLNT_E_NOT_INITIALIZED)
<< "Failed to reset streaming: " << std::hex << hr;
}
// Extra safety check to ensure that the buffers are cleared.
// If the buffers are not cleared correctly, the next call to Start()
// would fail with AUDCLNT_E_BUFFER_ERROR at IAudioRenderClient::GetBuffer().
  // This check is only needed for shared-mode streams.
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
UINT32 num_queued_frames = 0;
audio_client_->GetCurrentPadding(&num_queued_frames);
DCHECK_EQ(0u, num_queued_frames);
}
}
void WASAPIAudioOutputStream::Close() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
  // It is valid to call Close() before calling Open() or Start().
// It is also valid to call Close() after Start() has been called.
Stop();
// Inform the audio manager that we have been closed. This will cause our
// destruction.
manager_->ReleaseOutputStream(this);
}
void WASAPIAudioOutputStream::SetVolume(double volume) {
DVLOG(1) << "SetVolume(volume=" << volume << ")";
float volume_float = static_cast<float>(volume);
if (volume_float < 0.0f || volume_float > 1.0f) {
return;
}
volume_ = volume_float;
}
void WASAPIAudioOutputStream::GetVolume(double* volume) {
DVLOG(1) << "GetVolume()";
*volume = static_cast<double>(volume_);
}
// static
int WASAPIAudioOutputStream::HardwareChannelCount() {
// Use a WAVEFORMATEXTENSIBLE structure since it can specify both the
// number of channels and the mapping of channels to speakers for
// multichannel devices.
base::win::ScopedCoMem<WAVEFORMATPCMEX> format_ex;
HRESULT hr = GetMixFormat(
eConsole, reinterpret_cast<WAVEFORMATEX**>(&format_ex));
if (FAILED(hr))
return 0;
// Number of channels in the stream. Corresponds to the number of bits
// set in the dwChannelMask.
DVLOG(1) << "endpoint channels (out): " << format_ex->Format.nChannels;
return static_cast<int>(format_ex->Format.nChannels);
}
// static
ChannelLayout WASAPIAudioOutputStream::HardwareChannelLayout() {
return ChannelConfigToChannelLayout(GetChannelConfig());
}
// static
int WASAPIAudioOutputStream::HardwareSampleRate(ERole device_role) {
base::win::ScopedCoMem<WAVEFORMATEX> format;
HRESULT hr = GetMixFormat(device_role, &format);
if (FAILED(hr))
return 0;
DVLOG(2) << "nSamplesPerSec: " << format->nSamplesPerSec;
return static_cast<int>(format->nSamplesPerSec);
}
void WASAPIAudioOutputStream::Run() {
ScopedCOMInitializer com_init(ScopedCOMInitializer::kMTA);
// Increase the thread priority.
render_thread_->SetThreadPriority(base::kThreadPriority_RealtimeAudio);
// Enable MMCSS to ensure that this thread receives prioritized access to
// CPU resources.
DWORD task_index = 0;
HANDLE mm_task = avrt::AvSetMmThreadCharacteristics(L"Pro Audio",
&task_index);
bool mmcss_is_ok =
(mm_task && avrt::AvSetMmThreadPriority(mm_task, AVRT_PRIORITY_CRITICAL));
if (!mmcss_is_ok) {
// Failed to enable MMCSS on this thread. It is not fatal but can lead
// to reduced QoS at high load.
DWORD err = GetLastError();
LOG(WARNING) << "Failed to enable MMCSS (error code=" << err << ").";
}
HRESULT hr = S_FALSE;
bool playing = true;
bool error = false;
HANDLE wait_array[] = { stop_render_event_,
audio_samples_render_event_ };
UINT64 device_frequency = 0;
// The IAudioClock interface enables us to monitor a stream's data
// rate and the current position in the stream. Allocate it before we
// start spinning.
ScopedComPtr<IAudioClock> audio_clock;
hr = audio_client_->GetService(__uuidof(IAudioClock),
audio_clock.ReceiveVoid());
if (SUCCEEDED(hr)) {
// The device frequency is the frequency generated by the hardware clock in
// the audio device. The GetFrequency() method reports a constant frequency.
hr = audio_clock->GetFrequency(&device_frequency);
}
error = FAILED(hr);
PLOG_IF(ERROR, error) << "Failed to acquire IAudioClock interface: "
<< std::hex << hr;
// Keep rendering audio until the stop event or the stream-switch event
// is signaled. An error event can also break the main thread loop.
while (playing && !error) {
// Wait for a close-down event, stream-switch event or a new render event.
DWORD wait_result = WaitForMultipleObjects(arraysize(wait_array),
wait_array,
FALSE,
INFINITE);
switch (wait_result) {
case WAIT_OBJECT_0 + 0:
// |stop_render_event_| has been set.
playing = false;
break;
case WAIT_OBJECT_0 + 1:
{
// |audio_samples_render_event_| has been set.
UINT32 num_queued_frames = 0;
uint8* audio_data = NULL;
// Contains how much new data we can write to the buffer without
// the risk of overwriting previously written data that the audio
// engine has not yet read from the buffer.
size_t num_available_frames = 0;
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
// Get the padding value which represents the amount of rendering
// data that is queued up to play in the endpoint buffer.
hr = audio_client_->GetCurrentPadding(&num_queued_frames);
num_available_frames =
endpoint_buffer_size_frames_ - num_queued_frames;
} else {
// While the stream is running, the system alternately sends one
// buffer or the other to the client. This form of double buffering
// is referred to as "ping-ponging". Each time the client receives
// a buffer from the system (triggers this event) the client must
// process the entire buffer. Calls to the GetCurrentPadding method
// are unnecessary because the packet size must always equal the
// buffer size. In contrast to the shared mode buffering scheme,
// the latency for an event-driven, exclusive-mode stream depends
// directly on the buffer size.
num_available_frames = endpoint_buffer_size_frames_;
}
// Check if there is enough available space to fit the packet size
// specified by the client.
if (FAILED(hr) || (num_available_frames < packet_size_frames_))
continue;
          // Derive the number of packets we need to get from the client to
// fill up the available area in the endpoint buffer.
// |num_packets| will always be one for exclusive-mode streams.
size_t num_packets = (num_available_frames / packet_size_frames_);
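          // Example (illustrative numbers): with a 960-frame endpoint
          // buffer, 240 queued frames and 480-frame packets, 720 frames
          // are available and |num_packets| is 720 / 480 = 1.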
// Get data from the client/source.
for (size_t n = 0; n < num_packets; ++n) {
            // Grab the next packet-sized chunk of the rendering endpoint
            // buffer into which the client can write a data packet.
hr = audio_render_client_->GetBuffer(packet_size_frames_,
&audio_data);
if (FAILED(hr)) {
DLOG(ERROR) << "Failed to use rendering audio buffer: "
<< std::hex << hr;
continue;
}
// Derive the audio delay which corresponds to the delay between
// a render event and the time when the first audio sample in a
// packet is played out through the speaker. This delay value
// can typically be utilized by an acoustic echo-control (AEC)
// unit at the render side.
UINT64 position = 0;
int audio_delay_bytes = 0;
hr = audio_clock->GetPosition(&position, NULL);
if (SUCCEEDED(hr)) {
// Stream position of the sample that is currently playing
// through the speaker.
double pos_sample_playing_frames = format_.Format.nSamplesPerSec *
(static_cast<double>(position) / device_frequency);
              // Stream position of the last sample written to the endpoint
              // buffer. Note that the packet we are about to receive in
              // the upcoming callback is also included.
size_t pos_last_sample_written_frames =
num_written_frames_ + packet_size_frames_;
// Derive the actual delay value which will be fed to the
// render client using the OnMoreData() callback.
audio_delay_bytes = (pos_last_sample_written_frames -
pos_sample_playing_frames) * frame_size_;
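              // Example, assuming 48 kHz and 4-byte frames: if 1440 frames
              // have been written (960 plus the upcoming 480-frame packet)
              // and playback has reached frame 960, the delay is 480
              // frames, i.e. 1920 bytes or 10 ms.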
}
// Read a data packet from the registered client source and
// deliver a delay estimate in the same callback to the client.
// A time stamp is also stored in the AudioBuffersState. This
// time stamp can be used at the client side to compensate for
// the delay between the usage of the delay value and the time
// of generation.
uint32 num_filled_bytes = 0;
const int bytes_per_sample = format_.Format.wBitsPerSample >> 3;
int frames_filled = source_->OnMoreData(
audio_bus_.get(), AudioBuffersState(0, audio_delay_bytes));
num_filled_bytes = frames_filled * frame_size_;
DCHECK_LE(num_filled_bytes, packet_size_bytes_);
// Note: If this ever changes to output raw float the data must be
// clipped and sanitized since it may come from an untrusted
// source such as NaCl.
audio_bus_->ToInterleaved(
frames_filled, bytes_per_sample, audio_data);
// Perform in-place, software-volume adjustments.
media::AdjustVolume(audio_data,
num_filled_bytes,
audio_bus_->channels(),
bytes_per_sample,
volume_);
// Zero out the part of the packet which has not been filled by
// the client. Using silence is the least bad option in this
// situation.
if (num_filled_bytes < packet_size_bytes_) {
memset(&audio_data[num_filled_bytes], 0,
(packet_size_bytes_ - num_filled_bytes));
}
// Release the buffer space acquired in the GetBuffer() call.
DWORD flags = 0;
audio_render_client_->ReleaseBuffer(packet_size_frames_,
flags);
num_written_frames_ += packet_size_frames_;
}
}
break;
default:
error = true;
break;
}
}
if (playing && error) {
// Stop audio rendering since something has gone wrong in our main thread
    // loop. Note that we are still in a "started" state, hence a Stop() call
// is required to join the thread properly.
audio_client_->Stop();
PLOG(ERROR) << "WASAPI rendering failed.";
}
// Disable MMCSS.
if (mm_task && !avrt::AvRevertMmThreadCharacteristics(mm_task)) {
PLOG(WARNING) << "Failed to disable MMCSS";
}
}
void WASAPIAudioOutputStream::HandleError(HRESULT err) {
CHECK((started() && GetCurrentThreadId() == render_thread_->tid()) ||
(!started() && GetCurrentThreadId() == creating_thread_id_));
NOTREACHED() << "Error code: " << std::hex << err;
if (source_)
source_->OnError(this, static_cast<int>(err));
}
HRESULT WASAPIAudioOutputStream::SetRenderDevice() {
ScopedComPtr<IMMDeviceEnumerator> device_enumerator;
ScopedComPtr<IMMDevice> endpoint_device;
// Create the IMMDeviceEnumerator interface.
HRESULT hr = CoCreateInstance(__uuidof(MMDeviceEnumerator),
NULL,
CLSCTX_INPROC_SERVER,
__uuidof(IMMDeviceEnumerator),
device_enumerator.ReceiveVoid());
if (SUCCEEDED(hr)) {
// Retrieve the default render audio endpoint for the specified role.
// Note that, in Windows Vista, the MMDevice API supports device roles
// but the system-supplied user interface programs do not.
hr = device_enumerator->GetDefaultAudioEndpoint(
eRender, device_role_, endpoint_device.Receive());
if (FAILED(hr))
return hr;
// Verify that the audio endpoint device is active. That is, the audio
// adapter that connects to the endpoint device is present and enabled.
DWORD state = DEVICE_STATE_DISABLED;
hr = endpoint_device->GetState(&state);
if (SUCCEEDED(hr)) {
if (!(state & DEVICE_STATE_ACTIVE)) {
DLOG(ERROR) << "Selected render device is not active.";
hr = E_ACCESSDENIED;
}
}
}
if (SUCCEEDED(hr)) {
device_enumerator_ = device_enumerator;
endpoint_device_ = endpoint_device;
}
return hr;
}
HRESULT WASAPIAudioOutputStream::ActivateRenderDevice() {
ScopedComPtr<IAudioClient> audio_client;
// Creates and activates an IAudioClient COM object given the selected
// render endpoint device.
HRESULT hr = endpoint_device_->Activate(__uuidof(IAudioClient),
CLSCTX_INPROC_SERVER,
NULL,
audio_client.ReceiveVoid());
if (SUCCEEDED(hr)) {
// Retrieve the stream format that the audio engine uses for its internal
// processing/mixing of shared-mode streams.
audio_engine_mix_format_.Reset(NULL);
hr = audio_client->GetMixFormat(
reinterpret_cast<WAVEFORMATEX**>(&audio_engine_mix_format_));
if (SUCCEEDED(hr)) {
audio_client_ = audio_client;
}
}
return hr;
}
bool WASAPIAudioOutputStream::DesiredFormatIsSupported() {
// Determine, before calling IAudioClient::Initialize(), whether the audio
// engine supports a particular stream format.
// In shared mode, the audio engine always supports the mix format,
// which is stored in the |audio_engine_mix_format_| member and it is also
// possible to receive a proposed (closest) format if the current format is
// not supported.
base::win::ScopedCoMem<WAVEFORMATEXTENSIBLE> closest_match;
HRESULT hr = audio_client_->IsFormatSupported(
share_mode_, reinterpret_cast<WAVEFORMATEX*>(&format_),
reinterpret_cast<WAVEFORMATEX**>(&closest_match));
// This log can only be triggered for shared mode.
DLOG_IF(ERROR, hr == S_FALSE) << "Format is not supported "
<< "but a closest match exists.";
// This log can be triggered both for shared and exclusive modes.
DLOG_IF(ERROR, hr == AUDCLNT_E_UNSUPPORTED_FORMAT) << "Unsupported format.";
if (hr == S_FALSE) {
DVLOG(1) << "wFormatTag : " << closest_match->Format.wFormatTag;
DVLOG(1) << "nChannels : " << closest_match->Format.nChannels;
DVLOG(1) << "nSamplesPerSec: " << closest_match->Format.nSamplesPerSec;
DVLOG(1) << "wBitsPerSample: " << closest_match->Format.wBitsPerSample;
}
return (hr == S_OK);
}
HRESULT WASAPIAudioOutputStream::InitializeAudioEngine() {
#if !defined(NDEBUG)
// The period between processing passes by the audio engine is fixed for a
// particular audio endpoint device and represents the smallest processing
// quantum for the audio engine. This period plus the stream latency between
// the buffer and endpoint device represents the minimum possible latency
// that an audio application can achieve in shared mode.
{
REFERENCE_TIME default_device_period = 0;
REFERENCE_TIME minimum_device_period = 0;
HRESULT hr_dbg = audio_client_->GetDevicePeriod(&default_device_period,
&minimum_device_period);
if (SUCCEEDED(hr_dbg)) {
// Shared mode device period.
DVLOG(1) << "shared mode (default) device period: "
<< static_cast<double>(default_device_period / 10000.0)
<< " [ms]";
// Exclusive mode device period.
DVLOG(1) << "exclusive mode (minimum) device period: "
<< static_cast<double>(minimum_device_period / 10000.0)
<< " [ms]";
}
REFERENCE_TIME latency = 0;
hr_dbg = audio_client_->GetStreamLatency(&latency);
if (SUCCEEDED(hr_dbg)) {
DVLOG(1) << "stream latency: " << static_cast<double>(latency / 10000.0)
<< " [ms]";
}
}
#endif
HRESULT hr = S_FALSE;
  // Perform different initialization depending on whether the device shall be
  // opened in shared mode or in exclusive mode.
hr = (share_mode_ == AUDCLNT_SHAREMODE_SHARED) ?
SharedModeInitialization() : ExclusiveModeInitialization();
if (FAILED(hr)) {
LOG(WARNING) << "IAudioClient::Initialize() failed: " << std::hex << hr;
return hr;
}
// Retrieve the length of the endpoint buffer. The buffer length represents
// the maximum amount of rendering data that the client can write to
// the endpoint buffer during a single processing pass.
// A typical value is 960 audio frames <=> 20ms @ 48kHz sample rate.
hr = audio_client_->GetBufferSize(&endpoint_buffer_size_frames_);
if (FAILED(hr))
return hr;
DVLOG(1) << "endpoint buffer size: " << endpoint_buffer_size_frames_
<< " [frames]";
// The buffer scheme for exclusive mode streams is not designed for max
// flexibility. We only allow a "perfect match" between the packet size set
// by the user and the actual endpoint buffer size.
if (share_mode_ == AUDCLNT_SHAREMODE_EXCLUSIVE &&
endpoint_buffer_size_frames_ != packet_size_frames_) {
hr = AUDCLNT_E_INVALID_SIZE;
DLOG(ERROR) << "AUDCLNT_E_INVALID_SIZE";
return hr;
}
// Set the event handle that the audio engine will signal each time
// a buffer becomes ready to be processed by the client.
hr = audio_client_->SetEventHandle(audio_samples_render_event_.Get());
if (FAILED(hr))
return hr;
// Get access to the IAudioRenderClient interface. This interface
// enables us to write output data to a rendering endpoint buffer.
// The methods in this interface manage the movement of data packets
// that contain audio-rendering data.
hr = audio_client_->GetService(__uuidof(IAudioRenderClient),
audio_render_client_.ReceiveVoid());
return hr;
}
HRESULT WASAPIAudioOutputStream::SharedModeInitialization() {
DCHECK_EQ(share_mode_, AUDCLNT_SHAREMODE_SHARED);
// TODO(henrika): this buffer scheme is still under development.
// The exact details are yet to be determined based on tests with different
// audio clients.
int glitch_free_buffer_size_ms = static_cast<int>(packet_size_ms_ + 0.5);
if (audio_engine_mix_format_->Format.nSamplesPerSec % 8000 == 0) {
// Initial tests have shown that we have to add 10 ms extra to
// ensure that we don't run empty for any packet size.
glitch_free_buffer_size_ms += 10;
} else if (audio_engine_mix_format_->Format.nSamplesPerSec % 11025 == 0) {
// Initial tests have shown that we have to add 20 ms extra to
// ensure that we don't run empty for any packet size.
glitch_free_buffer_size_ms += 20;
} else {
DLOG(WARNING) << "Unsupported sample rate "
<< audio_engine_mix_format_->Format.nSamplesPerSec << " detected";
glitch_free_buffer_size_ms += 20;
}
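  // Example: a 10 ms packet at 48 kHz (a multiple of 8000 Hz) results in a
  // 20 ms buffer request.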
DVLOG(1) << "glitch_free_buffer_size_ms: " << glitch_free_buffer_size_ms;
REFERENCE_TIME requested_buffer_duration =
static_cast<REFERENCE_TIME>(glitch_free_buffer_size_ms * 10000);
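  // One unit of REFERENCE_TIME is 100 ns, hence the factor of 10000 above
  // (e.g. 20 ms <=> 200000 units).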
  // Initialize the audio stream between the client and the device.
  // We connect indirectly through the audio engine by using shared mode
  // and WASAPI is initialized in an event-driven mode.
  // Note that this API ensures that the buffer is never smaller than the
  // minimum buffer size needed to ensure glitch-free rendering.
  // If we request a buffer size that is smaller than the audio engine's
  // minimum required buffer size, the method sets the buffer size to this
  // minimum buffer size rather than to the buffer size requested.
HRESULT hr = S_FALSE;
hr = audio_client_->Initialize(AUDCLNT_SHAREMODE_SHARED,
AUDCLNT_STREAMFLAGS_EVENTCALLBACK |
AUDCLNT_STREAMFLAGS_NOPERSIST,
requested_buffer_duration,
0,
reinterpret_cast<WAVEFORMATEX*>(&format_),
NULL);
return hr;
}
HRESULT WASAPIAudioOutputStream::ExclusiveModeInitialization() {
DCHECK_EQ(share_mode_, AUDCLNT_SHAREMODE_EXCLUSIVE);
float f = (1000.0 * packet_size_frames_) / format_.Format.nSamplesPerSec;
REFERENCE_TIME requested_buffer_duration =
static_cast<REFERENCE_TIME>(f * 10000.0 + 0.5);
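  // Example: 480 frames at 48 kHz correspond to 10 ms, i.e. a requested
  // buffer duration of 100000 units of 100 ns.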
// Initialize the audio stream between the client and the device.
// For an exclusive-mode stream that uses event-driven buffering, the
// caller must specify nonzero values for hnsPeriodicity and
// hnsBufferDuration, and the values of these two parameters must be equal.
// The Initialize method allocates two buffers for the stream. Each buffer
// is equal in duration to the value of the hnsBufferDuration parameter.
// Following the Initialize call for a rendering stream, the caller should
// fill the first of the two buffers before starting the stream.
HRESULT hr = S_FALSE;
hr = audio_client_->Initialize(AUDCLNT_SHAREMODE_EXCLUSIVE,
AUDCLNT_STREAMFLAGS_EVENTCALLBACK |
AUDCLNT_STREAMFLAGS_NOPERSIST,
requested_buffer_duration,
requested_buffer_duration,
reinterpret_cast<WAVEFORMATEX*>(&format_),
NULL);
if (FAILED(hr)) {
if (hr == AUDCLNT_E_BUFFER_SIZE_NOT_ALIGNED) {
LOG(ERROR) << "AUDCLNT_E_BUFFER_SIZE_NOT_ALIGNED";
UINT32 aligned_buffer_size = 0;
audio_client_->GetBufferSize(&aligned_buffer_size);
DVLOG(1) << "Use aligned buffer size instead: " << aligned_buffer_size;
audio_client_.Release();
// Calculate new aligned periodicity. Each unit of reference time
// is 100 nanoseconds.
REFERENCE_TIME aligned_buffer_duration = static_cast<REFERENCE_TIME>(
(10000000.0 * aligned_buffer_size / format_.Format.nSamplesPerSec)
+ 0.5);
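      // Example: an aligned buffer size of 448 frames at 44.1 kHz
      // corresponds to roughly 10.2 ms.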
      // It is possible to re-activate and re-initialize the audio client
      // at this stage, but we bail out with an error code instead and
      // log the aligned buffer size that should have been used.
DVLOG(1) << "aligned_buffer_duration: "
<< static_cast<double>(aligned_buffer_duration / 10000.0)
<< " [ms]";
} else if (hr == AUDCLNT_E_INVALID_DEVICE_PERIOD) {
// We will get this error if we try to use a smaller buffer size than
// the minimum supported size (usually ~3ms on Windows 7).
LOG(ERROR) << "AUDCLNT_E_INVALID_DEVICE_PERIOD";
}
}
return hr;
}
std::string WASAPIAudioOutputStream::GetDeviceName(LPCWSTR device_id) const {
std::string name;
ScopedComPtr<IMMDevice> audio_device;
// Get the IMMDevice interface corresponding to the given endpoint ID string.
HRESULT hr = device_enumerator_->GetDevice(device_id, audio_device.Receive());
if (SUCCEEDED(hr)) {
// Retrieve user-friendly name of endpoint device.
// Example: "Speakers (Realtek High Definition Audio)".
ScopedComPtr<IPropertyStore> properties;
hr = audio_device->OpenPropertyStore(STGM_READ, properties.Receive());
if (SUCCEEDED(hr)) {
PROPVARIANT friendly_name;
PropVariantInit(&friendly_name);
hr = properties->GetValue(PKEY_Device_FriendlyName, &friendly_name);
if (SUCCEEDED(hr) && friendly_name.vt == VT_LPWSTR) {
if (friendly_name.pwszVal)
name = WideToUTF8(friendly_name.pwszVal);
}
PropVariantClear(&friendly_name);
}
}
return name;
}
} // namespace media