audio_low_latency_input_win.cc revision 116680a4aac90f2aa7413d9095a592090648e557
// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
45821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
55821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#include "media/audio/win/audio_low_latency_input_win.h"
65821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
72a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)#include "base/logging.h"
8bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch#include "base/memory/scoped_ptr.h"
92a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)#include "base/strings/utf_string_conversions.h"
10868fa2fe829687343ffae624259930155e16dbd8Torne (Richard Coles)#include "media/audio/win/audio_manager_win.h"
111e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)#include "media/audio/win/avrt_wrapper_win.h"
121e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)#include "media/audio/win/core_audio_util_win.h"
135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#include "media/base/audio_bus.h"
142a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)using base::win::ScopedComPtr;
162a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)using base::win::ScopedCOMInitializer;
172a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
182a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)namespace media {
19c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)namespace {
20c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
21eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch// Returns true if |device| represents the default communication capture device.
22c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool IsDefaultCommunicationDevice(IMMDeviceEnumerator* enumerator,
235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                  IMMDevice* device) {
245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  ScopedComPtr<IMMDevice> communications;
255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (FAILED(enumerator->GetDefaultAudioEndpoint(eCapture, eCommunications,
265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                                 communications.Receive()))) {
275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    return false;
282a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  }
295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  base::win::ScopedCoMem<WCHAR> communications_id, device_id;
315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  device->GetId(&device_id);
325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  communications->GetId(&communications_id);
332a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  return lstrcmpW(communications_id, device_id) == 0;
345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
36bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch}  // namespace
37eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
3858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)WASAPIAudioInputStream::WASAPIAudioInputStream(AudioManagerWin* manager,
397d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)                                               const AudioParameters& params,
405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                               const std::string& device_id)
415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    : manager_(manager),
425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      capture_thread_(NULL),
431e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)      opened_(false),
444e180b6a0b4720a9b8e9e959a882386f690f08ffTorne (Richard Coles)      started_(false),
455821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      frame_size_(0),
462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      packet_size_frames_(0),
475821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      packet_size_bytes_(0),
482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      endpoint_buffer_size_frames_(0),
4990dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles)      effects_(params.effects()),
505821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      device_id_(device_id),
515821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      perf_count_to_100ns_units_(0.0),
522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      ms_to_frame_count_(0.0),
5368043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles)      sink_(NULL),
545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      audio_bus_(media::AudioBus::Create(params)) {
555821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DCHECK(manager_);
565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Load the Avrt DLL if not already loaded. Required to support MMCSS.
58d0247b1b59f9c528cb6df88b4f2b9afaf80d181eTorne (Richard Coles)  bool avrt_init = avrt::Initialize();
59d0247b1b59f9c528cb6df88b4f2b9afaf80d181eTorne (Richard Coles)  DCHECK(avrt_init) << "Failed to load the Avrt.dll";
602a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
612a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Set up the desired capture format specified by the client.
622a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  format_.nSamplesPerSec = params.sample_rate();
632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  format_.wFormatTag = WAVE_FORMAT_PCM;
645821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  format_.wBitsPerSample = params.bits_per_sample();
655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  format_.nChannels = params.channels();
665821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  format_.nBlockAlign = (format_.wBitsPerSample / 8) * format_.nChannels;
672a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  format_.nAvgBytesPerSec = format_.nSamplesPerSec * format_.nBlockAlign;
685821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  format_.cbSize = 0;
695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
705821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Size in bytes of each audio frame.
715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  frame_size_ = format_.nBlockAlign;
725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Store size of audio packets which we expect to get from the audio
735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // endpoint device in each capture event.
745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  packet_size_frames_ = params.GetBytesPerBuffer() / format_.nBlockAlign;
755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  packet_size_bytes_ = params.GetBytesPerBuffer();
765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DVLOG(1) << "Number of bytes per audio frame  : " << frame_size_;
775821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DVLOG(1) << "Number of audio frames per packet: " << packet_size_frames_;
78bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch
79bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch  // All events are auto-reset events and non-signaled initially.
80bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch
81bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch  // Create the event which the audio engine will signal each time
82bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch  // a buffer becomes ready to be processed by the client.
832a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  audio_samples_ready_event_.Set(CreateEvent(NULL, FALSE, FALSE, NULL));
842a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(audio_samples_ready_event_.IsValid());
852a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
862a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Create the event which will be set in Stop() when capturing shall stop.
872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  stop_capture_event_.Set(CreateEvent(NULL, FALSE, FALSE, NULL));
882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(stop_capture_event_.IsValid());
892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
902a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  ms_to_frame_count_ = static_cast<double>(params.sample_rate()) / 1000.0;
912a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
922a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  LARGE_INTEGER performance_frequency;
932a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (QueryPerformanceFrequency(&performance_frequency)) {
942a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    perf_count_to_100ns_units_ =
95c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        (10000000.0 / static_cast<double>(performance_frequency.QuadPart));
96c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  } else {
97c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    DLOG(ERROR) << "High-resolution performance counters are not supported.";
98c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  }
99c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
100c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
101c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)WASAPIAudioInputStream::~WASAPIAudioInputStream() {
102c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  DCHECK(CalledOnValidThread());
103c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
104c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
105c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool WASAPIAudioInputStream::Open() {
1062a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(CalledOnValidThread());
1072a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Verify that we are not already opened.
1082a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (opened_)
109c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    return false;
1102a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1112a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Obtain a reference to the IMMDevice interface of the capturing
1122a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // device with the specified unique identifier or role which was
1132a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // set at construction.
1142a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  HRESULT hr = SetCaptureDevice();
1152a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (FAILED(hr))
1162a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    return false;
1172a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1182a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Obtain an IAudioClient interface which enables us to create and initialize
1192a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // an audio stream between an audio application and the audio engine.
1202a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  hr = ActivateCaptureDevice();
1212a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (FAILED(hr))
1222a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    return false;
1232a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1242a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Retrieve the stream format which the audio engine uses for its internal
125c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  // processing/mixing of shared-mode streams. This function call is for
1267dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch  // diagnostic purposes only and only in debug mode.
127c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)#ifndef NDEBUG
128c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  hr = GetAudioEngineStreamFormat();
12968043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles)#endif
13068043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles)
131c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  // Verify that the selected audio endpoint supports the specified format
132c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  // set during construction.
133c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  if (!DesiredFormatIsSupported())
1342a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    return false;
1352a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1362a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Initialize the audio stream between the client and the device using
1372a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // shared mode and a lowest possible glitch-free latency.
1382a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  hr = InitializeAudioEngine();
1392a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1402a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  opened_ = SUCCEEDED(hr);
1412a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  return opened_;
1422a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)}
1432a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1442a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)void WASAPIAudioInputStream::Start(AudioInputCallback* callback) {
1452a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(CalledOnValidThread());
1462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(callback);
1472a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully";
1482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (!opened_)
1492a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    return;
1502a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1512a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (started_)
1522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    return;
1532a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1542a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(!sink_);
1552a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  sink_ = callback;
1562a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Starts periodic AGC microphone measurements if the AGC has been enabled
1582a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // using SetAutomaticGainControl().
1592a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  StartAgc();
1602a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1612a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Create and start the thread that will drive the capturing by waiting for
1622a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // capture events.
1632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  capture_thread_ =
1642a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      new base::DelegateSimpleThread(this, "wasapi_capture_thread");
1652a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  capture_thread_->Start();
1662a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
1672a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Start streaming data between the endpoint buffer and the audio engine.
1682a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  HRESULT hr = audio_client_->Start();
1695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DLOG_IF(ERROR, FAILED(hr)) << "Failed to start input streaming.";
1705821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
171c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  if (SUCCEEDED(hr) && audio_render_client_for_loopback_)
1725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    hr = audio_render_client_for_loopback_->Start();
1735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  started_ = SUCCEEDED(hr);
1755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
1765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
177c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)void WASAPIAudioInputStream::Stop() {
178c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  DCHECK(CalledOnValidThread());
179c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  DVLOG(1) << "WASAPIAudioInputStream::Stop()";
1805821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (!started_)
1815821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    return;
1825821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1835821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Stops periodic AGC microphone measurements.
184c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  StopAgc();
1855821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1865821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Shut down the capture thread.
1875821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (stop_capture_event_.IsValid()) {
1885821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    SetEvent(stop_capture_event_.Get());
1895821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  }
1905821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1915821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Stop the input audio streaming.
1925821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  HRESULT hr = audio_client_->Stop();
1935821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (FAILED(hr)) {
1945821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    LOG(ERROR) << "Failed to stop input streaming.";
1955821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  }
1965821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1975821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Wait until the thread completes and perform cleanup.
1985821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (capture_thread_) {
1995821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    SetEvent(stop_capture_event_.Get());
2005821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    capture_thread_->Join();
2015821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    capture_thread_ = NULL;
20290dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles)  }
2035821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2045821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  started_ = false;
2055821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  sink_ = NULL;
2065821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
2075821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
208c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)void WASAPIAudioInputStream::Close() {
2095821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DVLOG(1) << "WASAPIAudioInputStream::Close()";
2105821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // It is valid to call Close() before calling open or Start().
2115821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // It is also valid to call Close() after Start() has been called.
2125821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  Stop();
2135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2145821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Inform the audio manager that we have been closed. This will cause our
2155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // destruction.
2165821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  manager_->ReleaseInputStream(this);
2175821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
2185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)double WASAPIAudioInputStream::GetMaxVolume() {
2205821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Verify that Open() has been called succesfully, to ensure that an audio
2215821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // session exists and that an ISimpleAudioVolume interface has been created.
2225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully";
2235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (!opened_)
2245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    return 0.0;
2255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // The effective volume value is always in the range 0.0 to 1.0, hence
2275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // we can return a fixed value (=1.0) here.
2285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  return 1.0;
2295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
2305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)void WASAPIAudioInputStream::SetVolume(double volume) {
2325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DVLOG(1) << "SetVolume(volume=" << volume << ")";
2335821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DCHECK(CalledOnValidThread());
2345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DCHECK_GE(volume, 0.0);
2355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DCHECK_LE(volume, 1.0);
2365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2375821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully";
2385821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (!opened_)
2395821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    return;
2405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Set a new master volume level. Valid volume levels are in the range
2425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // 0.0 to 1.0. Ignore volume-change events.
24358537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  HRESULT hr = simple_audio_volume_->SetMasterVolume(static_cast<float>(volume),
24458537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)      NULL);
24558537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  DLOG_IF(WARNING, FAILED(hr)) << "Failed to set new input master volume.";
24658537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)
24758537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  // Update the AGC volume level based on the last setting above. Note that,
24858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  // the volume-level resolution is not infinite and it is therefore not
24958537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  // possible to assume that the volume provided as input parameter can be
25058537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  // used directly. Instead, a new query to the audio hardware is required.
25158537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  // This method does nothing if AGC is disabled.
25258537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  UpdateAgcVolume();
25358537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)}
25458537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)
25558537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)double WASAPIAudioInputStream::GetVolume() {
25658537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully";
25758537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  if (!opened_)
25858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)    return 0.0;
25958537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)
26058537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  // Retrieve the current volume level. The value is in the range 0.0 to 1.0.
261eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  float level = 0.0f;
262eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  HRESULT hr = simple_audio_volume_->GetMasterVolume(&level);
2632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DLOG_IF(WARNING, FAILED(hr)) << "Failed to get input master volume.";
26458537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)
26558537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)  return static_cast<double>(level);
26658537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)}
26758537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)
26858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)// static
26958537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)AudioParameters WASAPIAudioInputStream::GetInputStreamParameters(
27058537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)    const std::string& device_id) {
2715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  int sample_rate = 48000;
2725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  ChannelLayout channel_layout = CHANNEL_LAYOUT_STEREO;
2735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  base::win::ScopedCoMem<WAVEFORMATEX> audio_engine_mix_format;
2755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  int effects = AudioParameters::NO_EFFECTS;
2765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (SUCCEEDED(GetMixFormat(device_id, &audio_engine_mix_format, &effects))) {
2775821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    sample_rate = static_cast<int>(audio_engine_mix_format->nSamplesPerSec);
2785821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    channel_layout = audio_engine_mix_format->nChannels == 1 ?
279eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        CHANNEL_LAYOUT_MONO : CHANNEL_LAYOUT_STEREO;
2805821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  }
2815821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2825821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Use 10ms frame size as default.
2835821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  int frames_per_buffer = sample_rate / 100;
2842a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  return AudioParameters(
2852a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      AudioParameters::AUDIO_PCM_LOW_LATENCY, channel_layout, 0, sample_rate,
2865821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      16, frames_per_buffer, effects);
2875821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
2885821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2895821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// static
2905821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)HRESULT WASAPIAudioInputStream::GetMixFormat(const std::string& device_id,
2915821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                             WAVEFORMATEX** device_format,
2925821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                             int* effects) {
2935821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DCHECK(effects);
2945821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
2955821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // It is assumed that this static method is called from a COM thread, i.e.,
2965821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // CoInitializeEx() is not called here to avoid STA/MTA conflicts.
297eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  ScopedComPtr<IMMDeviceEnumerator> enumerator;
298eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  HRESULT hr = enumerator.CreateInstance(__uuidof(MMDeviceEnumerator), NULL,
2995821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                         CLSCTX_INPROC_SERVER);
3005821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (FAILED(hr))
3015821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    return hr;
3027d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)
3035821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  ScopedComPtr<IMMDevice> endpoint_device;
3045821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (device_id == AudioManagerBase::kDefaultDeviceId) {
3055821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Retrieve the default capture audio endpoint.
3065821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    hr = enumerator->GetDefaultAudioEndpoint(eCapture, eConsole,
3075821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                             endpoint_device.Receive());
3085821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  } else if (device_id == AudioManagerBase::kLoopbackInputDeviceId) {
3095821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Get the mix format of the default playback stream.
3105821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    hr = enumerator->GetDefaultAudioEndpoint(eRender, eConsole,
3115821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                             endpoint_device.Receive());
3125821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  } else {
3135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Retrieve a capture endpoint device that is specified by an endpoint
3145821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // device-identification string.
3155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    hr = enumerator->GetDevice(base::UTF8ToUTF16(device_id).c_str(),
3167d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)                               endpoint_device.Receive());
3175821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  }
3185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
3195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (FAILED(hr))
3205821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    return hr;
3215821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
3225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  *effects = IsDefaultCommunicationDevice(enumerator, endpoint_device) ?
3235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      AudioParameters::DUCKING : AudioParameters::NO_EFFECTS;
3245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
325eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  ScopedComPtr<IAudioClient> audio_client;
3265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  hr = endpoint_device->Activate(__uuidof(IAudioClient),
3275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                 CLSCTX_INPROC_SERVER,
3285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                 NULL,
3295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                 audio_client.ReceiveVoid());
3305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  return SUCCEEDED(hr) ? audio_client->GetMixFormat(device_format) : hr;
3315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
33290dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles)
33390dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles)void WASAPIAudioInputStream::Run() {
33490dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles)  ScopedCOMInitializer com_init(ScopedCOMInitializer::kMTA);
3355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
3365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Increase the thread priority.
337f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  capture_thread_->SetThreadPriority(base::kThreadPriority_RealtimeAudio);
3385821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
339f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Enable MMCSS to ensure that this thread receives prioritized access to
3405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // CPU resources.
341f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  DWORD task_index = 0;
3425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  HANDLE mm_task = avrt::AvSetMmThreadCharacteristics(L"Pro Audio",
343f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)                                                      &task_index);
3445821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  bool mmcss_is_ok =
345f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)      (mm_task && avrt::AvSetMmThreadPriority(mm_task, AVRT_PRIORITY_CRITICAL));
3465821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  if (!mmcss_is_ok) {
3475821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Failed to enable MMCSS on this thread. It is not fatal but can lead
3485821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // to reduced QoS at high load.
3495821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    DWORD err = GetLastError();
350f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    LOG(WARNING) << "Failed to enable MMCSS (error code=" << err << ").";
351f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  }
3525821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
353f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Allocate a buffer with a size that enables us to take care of cases like:
3545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // 1) The recorded buffer size is smaller, or does not match exactly with,
355f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //    the selected packet size used in each callback.
3565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // 2) The selected buffer size is larger than the recorded buffer size in
357f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //    each event.
358f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  size_t buffer_frame_index = 0;
3595821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  size_t capture_buffer_size = std::max(
3605821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      2 * endpoint_buffer_size_frames_ * frame_size_,
3615821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      2 * packet_size_frames_ * frame_size_);
3625821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  scoped_ptr<uint8[]> capture_buffer(new uint8[capture_buffer_size]);
3635821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
364f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  LARGE_INTEGER now_count;
3655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  bool recording = true;
366f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  bool error = false;
3675821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  double volume = GetVolume();
368f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  HANDLE wait_array[2] = {stop_capture_event_, audio_samples_ready_event_};
3695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
370f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  while (recording && !error) {
3715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    HRESULT hr = S_FALSE;
3725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
3735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Wait for a close-down event or a new capture event.
374eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    DWORD wait_result = WaitForMultipleObjects(2, wait_array, FALSE, INFINITE);
375eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    switch (wait_result) {
376eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      case WAIT_FAILED:
377eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        error = true;
378eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        break;
379eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      case WAIT_OBJECT_0 + 0:
380eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        // |stop_capture_event_| has been set.
381eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        recording = false;
382eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        break;
383eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      case WAIT_OBJECT_0 + 1:
384eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        {
385eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // |audio_samples_ready_event_| has been set.
386eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          BYTE* data_ptr = NULL;
387eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          UINT32 num_frames_to_read = 0;
388eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          DWORD flags = 0;
389eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          UINT64 device_position = 0;
390eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          UINT64 first_audio_frame_timestamp = 0;
391eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
392eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // Retrieve the amount of data in the capture endpoint buffer,
393eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // replace it with silence if required, create callbacks for each
394eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // packet and store non-delivered data for the next event.
395eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          hr = audio_capture_client_->GetBuffer(&data_ptr,
396eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                                &num_frames_to_read,
397eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                                &flags,
398eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                                &device_position,
399eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                                &first_audio_frame_timestamp);
400eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          if (FAILED(hr)) {
401eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            DLOG(ERROR) << "Failed to get data from the capture buffer";
402eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            continue;
403eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          }
404eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
405eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          if (num_frames_to_read != 0) {
406eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            size_t pos = buffer_frame_index * frame_size_;
407eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            size_t num_bytes = num_frames_to_read * frame_size_;
408eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            DCHECK_GE(capture_buffer_size, pos + num_bytes);
409eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
410eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            if (flags & AUDCLNT_BUFFERFLAGS_SILENT) {
411eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch              // Clear out the local buffer since silence is reported.
412eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch              memset(&capture_buffer[pos], 0, num_bytes);
413eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            } else {
414eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch              // Copy captured data from audio engine buffer to local buffer.
415eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch              memcpy(&capture_buffer[pos], data_ptr, num_bytes);
416eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch            }
417eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
4185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)            buffer_frame_index += num_frames_to_read;
4195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)          }
4202a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4212a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          hr = audio_capture_client_->ReleaseBuffer(num_frames_to_read);
4222a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          DLOG_IF(ERROR, FAILED(hr)) << "Failed to release capture buffer";
4232a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4242a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          // Derive a delay estimate for the captured audio packet.
4252a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          // The value contains two parts (A+B), where A is the delay of the
426eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // first audio frame in the packet and B is the extra delay
427eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // contained in any stored data. Unit is in audio frames.
4282a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          QueryPerformanceCounter(&now_count);
429eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          double audio_delay_frames =
430eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch              ((perf_count_to_100ns_units_ * now_count.QuadPart -
431eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                first_audio_frame_timestamp) / 10000.0) * ms_to_frame_count_ +
432eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                buffer_frame_index - num_frames_to_read;
4332a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4342a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          // Get a cached AGC volume level which is updated once every second
4352a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          // on the audio manager thread. Note that, |volume| is also updated
436eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          // each time SetVolume() is called through IPC by the render-side AGC.
4372a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          GetAgcVolume(&volume);
4382a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4392a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          // Deliver captured data to the registered consumer using a packet
4402a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          // size which was specified at construction.
4412a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          uint32 delay_frames = static_cast<uint32>(audio_delay_frames + 0.5);
4422a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)          while (buffer_frame_index >= packet_size_frames_) {
4432a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            // Copy data to audio bus to match the OnData interface.
4442a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            uint8* audio_data = reinterpret_cast<uint8*>(capture_buffer.get());
4452a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            audio_bus_->FromInterleaved(
4462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                audio_data, audio_bus_->frames(), format_.wBitsPerSample / 8);
4472a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            // Deliver data packet, delay estimation and volume level to
4492a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            // the user.
4502a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            sink_->OnData(
4512a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                this, audio_bus_.get(), delay_frames * frame_size_, volume);
4522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4532a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            // Store parts of the recorded data which can't be delivered
4542a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            // using the current packet size. The stored section will be used
455c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // either in the next while-loop iteration or in the next
456c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // capture event.
4572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            memmove(&capture_buffer[0],
4582a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                    &capture_buffer[packet_size_bytes_],
4592a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                    (buffer_frame_index - packet_size_frames_) * frame_size_);
4602a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4612a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            buffer_frame_index -= packet_size_frames_;
4622a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)            delay_frames -= packet_size_frames_;
463eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          }
464eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        }
4652a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)        break;
4662a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      default:
4672a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)        error = true;
468eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        break;
469eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    }
470eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  }
471eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
472eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  if (recording && error) {
473eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    // TODO(henrika): perhaps it worth improving the cleanup here by e.g.
474eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    // stopping the audio client, joining the thread etc.?
475eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    NOTREACHED() << "WASAPI capturing failed with error code "
476eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                 << GetLastError();
477eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  }
4782a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4792a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Disable MMCSS.
4802a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (mm_task && !avrt::AvRevertMmThreadCharacteristics(mm_task)) {
4812a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    PLOG(WARNING) << "Failed to disable MMCSS";
4822a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  }
4832a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)}
4842a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4852a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)void WASAPIAudioInputStream::HandleError(HRESULT err) {
486eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  NOTREACHED() << "Error code: " << err;
4872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (sink_)
4882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    sink_->OnError(this);
4892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)}
4902a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
4912a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)HRESULT WASAPIAudioInputStream::SetCaptureDevice() {
4922a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DCHECK(!endpoint_device_);
4932a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
494eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  ScopedComPtr<IMMDeviceEnumerator> enumerator;
4952a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  HRESULT hr = enumerator.CreateInstance(__uuidof(MMDeviceEnumerator),
4962a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                                         NULL, CLSCTX_INPROC_SERVER);
4972a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (FAILED(hr))
498eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    return hr;
499eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
500eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // Retrieve the IMMDevice by using the specified role or the specified
501eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // unique endpoint device-identification string.
502eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
5032a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (effects_ & AudioParameters::DUCKING) {
504eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    // Ducking has been requested and it is only supported for the default
5052a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    // communication device.  So, let's open up the communication device and
5062a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    // see if the ID of that device matches the requested ID.
5072a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    // We consider a kDefaultDeviceId as well as an explicit device id match,
5082a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    // to be valid matches.
5092a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    hr = enumerator->GetDefaultAudioEndpoint(eCapture, eCommunications,
5102a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                                             endpoint_device_.Receive());
511eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    if (endpoint_device_ && device_id_ != AudioManagerBase::kDefaultDeviceId) {
512eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      base::win::ScopedCoMem<WCHAR> communications_id;
513eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      endpoint_device_->GetId(&communications_id);
514eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      if (device_id_ !=
515eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch          base::WideToUTF8(static_cast<WCHAR*>(communications_id))) {
516eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        DLOG(WARNING) << "Ducking has been requested for a non-default device."
517eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                         "Not supported.";
518eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        // We can't honor the requested effect flag, so turn it off and
5197dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch        // continue.  We'll check this flag later to see if we've actually
520eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        // opened up the communications device, so it's important that it
521eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch        // reflects the active state.
52268043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles)        effects_ &= ~AudioParameters::DUCKING;
52368043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles)        endpoint_device_.Release();  // Fall back on code below.
524eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      }
525eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    }
526eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  }
527eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
528eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  if (!endpoint_device_) {
529eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    if (device_id_ == AudioManagerBase::kDefaultDeviceId) {
530eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      // Retrieve the default capture audio endpoint for the specified role.
531eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      // Note that, in Windows Vista, the MMDevice API supports device roles
532eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      // but the system-supplied user interface programs do not.
533eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      hr = enumerator->GetDefaultAudioEndpoint(eCapture, eConsole,
534eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                               endpoint_device_.Receive());
535eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    } else if (device_id_ == AudioManagerBase::kLoopbackInputDeviceId) {
536eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      // Capture the default playback stream.
537eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      hr = enumerator->GetDefaultAudioEndpoint(eRender, eConsole,
538eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                               endpoint_device_.Receive());
539eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    } else {
540eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      hr = enumerator->GetDevice(base::UTF8ToUTF16(device_id_).c_str(),
541eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                 endpoint_device_.Receive());
542eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    }
543eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  }
544eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
545eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  if (FAILED(hr))
546eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    return hr;
547eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
548eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // Verify that the audio endpoint device is active, i.e., the audio
549eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // adapter that connects to the endpoint device is present and enabled.
550eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  DWORD state = DEVICE_STATE_DISABLED;
551eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  hr = endpoint_device_->GetState(&state);
552eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  if (FAILED(hr))
553eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    return hr;
554eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
555eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  if (!(state & DEVICE_STATE_ACTIVE)) {
556eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    DLOG(ERROR) << "Selected capture device is not active.";
557eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    hr = E_ACCESSDENIED;
558eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  }
559eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
560eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  return hr;
561eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch}
562eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
563eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen MurdochHRESULT WASAPIAudioInputStream::ActivateCaptureDevice() {
564eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // Creates and activates an IAudioClient COM object given the selected
565eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // capture endpoint device.
566eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  HRESULT hr = endpoint_device_->Activate(__uuidof(IAudioClient),
567eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                          CLSCTX_INPROC_SERVER,
568eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                          NULL,
569eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                          audio_client_.ReceiveVoid());
570eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  return hr;
571eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch}
572eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
573eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen MurdochHRESULT WASAPIAudioInputStream::GetAudioEngineStreamFormat() {
574eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  HRESULT hr = S_OK;
575eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch#ifndef NDEBUG
576eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // The GetMixFormat() method retrieves the stream format that the
577eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // audio engine uses for its internal processing of shared-mode streams.
578eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // The method always uses a WAVEFORMATEXTENSIBLE structure, instead
579eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // of a stand-alone WAVEFORMATEX structure, to specify the format.
580eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // An WAVEFORMATEXTENSIBLE structure can specify both the mapping of
581eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // channels to speakers and the number of bits of precision in each sample.
582eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  base::win::ScopedCoMem<WAVEFORMATEXTENSIBLE> format_ex;
583eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  hr = audio_client_->GetMixFormat(
584eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      reinterpret_cast<WAVEFORMATEX**>(&format_ex));
585eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
586eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // See http://msdn.microsoft.com/en-us/windows/hardware/gg463006#EFH
5872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // for details on the WAVE file format.
5882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  WAVEFORMATEX format = format_ex->Format;
5892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "WAVEFORMATEX:";
5902a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  wFormatTags    : 0x" << std::hex << format.wFormatTag;
5912a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  nChannels      : " << format.nChannels;
5922a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  nSamplesPerSec : " << format.nSamplesPerSec;
5932a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  nAvgBytesPerSec: " << format.nAvgBytesPerSec;
5942a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  nBlockAlign    : " << format.nBlockAlign;
5952a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  wBitsPerSample : " << format.wBitsPerSample;
5962a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "  cbSize         : " << format.cbSize;
5972a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
5982a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << "WAVEFORMATEXTENSIBLE:";
5992a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << " wValidBitsPerSample: " <<
6002a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      format_ex->Samples.wValidBitsPerSample;
6012a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(2) << " dwChannelMask      : 0x" << std::hex <<
6022a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      format_ex->dwChannelMask;
6032a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (format_ex->SubFormat == KSDATAFORMAT_SUBTYPE_PCM)
6042a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    DVLOG(2) << " SubFormat          : KSDATAFORMAT_SUBTYPE_PCM";
6052a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  else if (format_ex->SubFormat == KSDATAFORMAT_SUBTYPE_IEEE_FLOAT)
6062a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    DVLOG(2) << " SubFormat          : KSDATAFORMAT_SUBTYPE_IEEE_FLOAT";
6072a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  else if (format_ex->SubFormat == KSDATAFORMAT_SUBTYPE_WAVEFORMATEX)
6082a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    DVLOG(2) << " SubFormat          : KSDATAFORMAT_SUBTYPE_WAVEFORMATEX";
6092a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)#endif
6102a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  return hr;
6112a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)}
6122a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
613eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdochbool WASAPIAudioInputStream::DesiredFormatIsSupported() {
614eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // An application that uses WASAPI to manage shared-mode streams can rely
615eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // on the audio engine to perform only limited format conversions. The audio
6162a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // engine can convert between a standard PCM sample size used by the
617eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // application and the floating-point samples that the engine uses for its
618eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // internal processing. However, the format for an application stream
619eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // typically must have the same number of channels and the same sample
620eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // rate as the stream format used by the device.
621eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // Many audio devices support both PCM and non-PCM stream formats. However,
6222a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // the audio engine can mix only PCM streams.
6232a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  base::win::ScopedCoMem<WAVEFORMATEX> closest_match;
6242a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  HRESULT hr = audio_client_->IsFormatSupported(AUDCLNT_SHAREMODE_SHARED,
6252a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)                                                &format_,
626eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                                &closest_match);
627eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  DLOG_IF(ERROR, hr == S_FALSE) << "Format is not supported "
628eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch                                << "but a closest match exists.";
629eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  return (hr == S_OK);
630eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch}
631eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch
632eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen MurdochHRESULT WASAPIAudioInputStream::InitializeAudioEngine() {
633eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  DWORD flags;
634eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // Use event-driven mode only fo regular input devices. For loopback the
635eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // EVENTCALLBACK flag is specified when intializing
636eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  // |audio_render_client_for_loopback_|.
637eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  if (device_id_ == AudioManagerBase::kLoopbackInputDeviceId) {
638eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    flags = AUDCLNT_STREAMFLAGS_LOOPBACK | AUDCLNT_STREAMFLAGS_NOPERSIST;
639eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch  } else {
640eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch    flags =
641eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch      AUDCLNT_STREAMFLAGS_EVENTCALLBACK | AUDCLNT_STREAMFLAGS_NOPERSIST;
6422a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  }
6432a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
6442a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Initialize the audio stream between the client and the device.
6452a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // We connect indirectly through the audio engine by using shared mode.
6462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Note that, |hnsBufferDuration| is set of 0, which ensures that the
6472a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // buffer is never smaller than the minimum buffer size needed to ensure
6482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // that glitches do not occur between the periodic processing passes.
6492a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // This setting should lead to lowest possible latency.
6502a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  HRESULT hr = audio_client_->Initialize(
6512a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      AUDCLNT_SHAREMODE_SHARED,
6522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      flags,
6532a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      0,  // hnsBufferDuration
6542a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      0,
6552a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      &format_,
6562a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)      (effects_ & AudioParameters::DUCKING) ? &kCommunicationsSessionId : NULL);
6572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
658f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  if (FAILED(hr))
659f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    return hr;
660f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
661f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Retrieve the length of the endpoint buffer shared between the client
662f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // and the audio engine. The buffer length determines the maximum amount
6632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // of capture data that the audio engine can read from the endpoint buffer
6642a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // during a single processing pass.
6652a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // A typical value is 960 audio frames <=> 20ms @ 48kHz sample rate.
6662a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  hr = audio_client_->GetBufferSize(&endpoint_buffer_size_frames_);
6671e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)  if (FAILED(hr))
6681e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)    return hr;
6692a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
6702a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  DVLOG(1) << "endpoint buffer size: " << endpoint_buffer_size_frames_
671f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)           << " [frames]";
672f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
673f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#ifndef NDEBUG
674f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // The period between processing passes by the audio engine is fixed for a
675f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // particular audio endpoint device and represents the smallest processing
676f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // quantum for the audio engine. This period plus the stream latency between
677f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // the buffer and endpoint device represents the minimum possible latency
678f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // that an audio application can achieve.
679f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // TODO(henrika): possibly remove this section when all parts are ready.
680f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  REFERENCE_TIME device_period_shared_mode = 0;
681f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  REFERENCE_TIME device_period_exclusive_mode = 0;
682f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  HRESULT hr_dbg = audio_client_->GetDevicePeriod(
683f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)      &device_period_shared_mode, &device_period_exclusive_mode);
684f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  if (SUCCEEDED(hr_dbg)) {
685f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    DVLOG(1) << "device period: "
686f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)             << static_cast<double>(device_period_shared_mode / 10000.0)
6872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)             << " [ms]";
6882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  }
6892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)
690f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  REFERENCE_TIME latency = 0;
691f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  hr_dbg = audio_client_->GetStreamLatency(&latency);
692f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  if (SUCCEEDED(hr_dbg)) {
693f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    DVLOG(1) << "stream latency: " << static_cast<double>(latency / 10000.0)
694f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)             << " [ms]";
695f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  }
696f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#endif
697f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
698f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Set the event handle that the audio engine will signal each time a buffer
699f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // becomes ready to be processed by the client.
700f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //
701f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // In loopback case the capture device doesn't receive any events, so we
702f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // need to create a separate playback client to get notifications. According
703f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // to MSDN:
704f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //
705f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //   A pull-mode capture client does not receive any events when a stream is
706f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //   initialized with event-driven buffering and is loopback-enabled. To
707f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //   work around this, initialize a render stream in event-driven mode. Each
708f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //   time the client receives an event for the render stream, it must signal
709f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //   the capture client to run the capture thread that reads the next set of
710f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //   samples from the capture endpoint buffer.
711f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  //
712f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // http://msdn.microsoft.com/en-us/library/windows/desktop/dd316551(v=vs.85).aspx
713f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  if (device_id_ == AudioManagerBase::kLoopbackInputDeviceId) {
714f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    hr = endpoint_device_->Activate(
715f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)        __uuidof(IAudioClient), CLSCTX_INPROC_SERVER, NULL,
716f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)        audio_render_client_for_loopback_.ReceiveVoid());
717f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    if (FAILED(hr))
718f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)      return hr;
719f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
720f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    hr = audio_render_client_for_loopback_->Initialize(
721f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)        AUDCLNT_SHAREMODE_SHARED,
722f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)        AUDCLNT_STREAMFLAGS_EVENTCALLBACK | AUDCLNT_STREAMFLAGS_NOPERSIST,
723f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)        0, 0, &format_, NULL);
724f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    if (FAILED(hr))
725f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)      return hr;
726f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
727f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    hr = audio_render_client_for_loopback_->SetEventHandle(
728f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)        audio_samples_ready_event_.Get());
729f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  } else {
730f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    hr = audio_client_->SetEventHandle(audio_samples_ready_event_.Get());
731f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  }
732f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
7332a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  if (FAILED(hr))
7342a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)    return hr;
735f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
7362a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // Get access to the IAudioCaptureClient interface. This interface
7372a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  // enables us to read input data from the capture endpoint buffer.
7382a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)  hr = audio_client_->GetService(__uuidof(IAudioCaptureClient),
739f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)                                 audio_capture_client_.ReceiveVoid());
740f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  if (FAILED(hr))
741f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    return hr;
742f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
743f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Obtain a reference to the ISimpleAudioVolume interface which enables
744f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // us to control the master volume level of an audio session.
745f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  hr = audio_client_->GetService(__uuidof(ISimpleAudioVolume),
746f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)                                 simple_audio_volume_.ReceiveVoid());
747f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  return hr;
748f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)}
749f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
750f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)}  // namespace media
751f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)