audio_low_latency_input_win.cc revision 116680a4aac90f2aa7413d9095a592090648e557
15821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// Copyright (c) 2012 The Chromium Authors. All rights reserved. 25821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// Use of this source code is governed by a BSD-style license that can be 35821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// found in the LICENSE file. 45821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 55821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#include "media/audio/win/audio_low_latency_input_win.h" 65821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 72a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)#include "base/logging.h" 8bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch#include "base/memory/scoped_ptr.h" 92a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)#include "base/strings/utf_string_conversions.h" 10868fa2fe829687343ffae624259930155e16dbd8Torne (Richard Coles)#include "media/audio/win/audio_manager_win.h" 111e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)#include "media/audio/win/avrt_wrapper_win.h" 121e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles)#include "media/audio/win/core_audio_util_win.h" 135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#include "media/base/audio_bus.h" 142a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)using base::win::ScopedComPtr; 162a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)using base::win::ScopedCOMInitializer; 172a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 182a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)namespace media { 19c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)namespace { 20c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) 21eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch// Returns true if |device| represents the default communication capture device. 22c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool IsDefaultCommunicationDevice(IMMDeviceEnumerator* enumerator, 235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) IMMDevice* device) { 245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) ScopedComPtr<IMMDevice> communications; 255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (FAILED(enumerator->GetDefaultAudioEndpoint(eCapture, eCommunications, 265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) communications.Receive()))) { 275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return false; 282a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) } 295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) base::win::ScopedCoMem<WCHAR> communications_id, device_id; 315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) device->GetId(&device_id); 325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) communications->GetId(&communications_id); 332a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return lstrcmpW(communications_id, device_id) == 0; 345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 36bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch} // namespace 37eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 3858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)WASAPIAudioInputStream::WASAPIAudioInputStream(AudioManagerWin* manager, 397d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const AudioParameters& params, 405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) const std::string& device_id) 415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) : manager_(manager), 425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) capture_thread_(NULL), 431e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles) opened_(false), 444e180b6a0b4720a9b8e9e959a882386f690f08ffTorne (Richard Coles) started_(false), 455821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) frame_size_(0), 462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) packet_size_frames_(0), 475821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) packet_size_bytes_(0), 482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) endpoint_buffer_size_frames_(0), 4990dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles) effects_(params.effects()), 505821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) device_id_(device_id), 515821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) perf_count_to_100ns_units_(0.0), 522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) ms_to_frame_count_(0.0), 5368043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles) sink_(NULL), 545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) audio_bus_(media::AudioBus::Create(params)) { 555821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DCHECK(manager_); 565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Load the Avrt DLL if not already loaded. Required to support MMCSS. 58d0247b1b59f9c528cb6df88b4f2b9afaf80d181eTorne (Richard Coles) bool avrt_init = avrt::Initialize(); 59d0247b1b59f9c528cb6df88b4f2b9afaf80d181eTorne (Richard Coles) DCHECK(avrt_init) << "Failed to load the Avrt.dll"; 602a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 612a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Set up the desired capture format specified by the client. 622a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) format_.nSamplesPerSec = params.sample_rate(); 632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) format_.wFormatTag = WAVE_FORMAT_PCM; 645821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) format_.wBitsPerSample = params.bits_per_sample(); 655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) format_.nChannels = params.channels(); 665821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) format_.nBlockAlign = (format_.wBitsPerSample / 8) * format_.nChannels; 672a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) format_.nAvgBytesPerSec = format_.nSamplesPerSec * format_.nBlockAlign; 685821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) format_.cbSize = 0; 695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 705821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Size in bytes of each audio frame. 715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) frame_size_ = format_.nBlockAlign; 725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Store size of audio packets which we expect to get from the audio 735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // endpoint device in each capture event. 745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) packet_size_frames_ = params.GetBytesPerBuffer() / format_.nBlockAlign; 755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) packet_size_bytes_ = params.GetBytesPerBuffer(); 765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DVLOG(1) << "Number of bytes per audio frame : " << frame_size_; 775821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DVLOG(1) << "Number of audio frames per packet: " << packet_size_frames_; 78bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch 79bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch // All events are auto-reset events and non-signaled initially. 80bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch 81bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch // Create the event which the audio engine will signal each time 82bbcdd45c55eb7c4641ab97aef9889b0fc828e7d3Ben Murdoch // a buffer becomes ready to be processed by the client. 832a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) audio_samples_ready_event_.Set(CreateEvent(NULL, FALSE, FALSE, NULL)); 842a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(audio_samples_ready_event_.IsValid()); 852a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 862a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Create the event which will be set in Stop() when capturing shall stop. 872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) stop_capture_event_.Set(CreateEvent(NULL, FALSE, FALSE, NULL)); 882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(stop_capture_event_.IsValid()); 892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 902a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) ms_to_frame_count_ = static_cast<double>(params.sample_rate()) / 1000.0; 912a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 922a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) LARGE_INTEGER performance_frequency; 932a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (QueryPerformanceFrequency(&performance_frequency)) { 942a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) perf_count_to_100ns_units_ = 95c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) (10000000.0 / static_cast<double>(performance_frequency.QuadPart)); 96c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) } else { 97c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) DLOG(ERROR) << "High-resolution performance counters are not supported."; 98c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) } 99c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)} 100c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) 101c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)WASAPIAudioInputStream::~WASAPIAudioInputStream() { 102c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) DCHECK(CalledOnValidThread()); 103c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)} 104c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) 105c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool WASAPIAudioInputStream::Open() { 1062a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(CalledOnValidThread()); 1072a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Verify that we are not already opened. 1082a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (opened_) 109c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) return false; 1102a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1112a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Obtain a reference to the IMMDevice interface of the capturing 1122a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // device with the specified unique identifier or role which was 1132a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // set at construction. 1142a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) HRESULT hr = SetCaptureDevice(); 1152a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (FAILED(hr)) 1162a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return false; 1172a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1182a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Obtain an IAudioClient interface which enables us to create and initialize 1192a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // an audio stream between an audio application and the audio engine. 1202a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) hr = ActivateCaptureDevice(); 1212a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (FAILED(hr)) 1222a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return false; 1232a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1242a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Retrieve the stream format which the audio engine uses for its internal 125c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) // processing/mixing of shared-mode streams. This function call is for 1267dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // diagnostic purposes only and only in debug mode. 127c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)#ifndef NDEBUG 128c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) hr = GetAudioEngineStreamFormat(); 12968043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles)#endif 13068043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles) 131c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) // Verify that the selected audio endpoint supports the specified format 132c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) // set during construction. 133c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) if (!DesiredFormatIsSupported()) 1342a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return false; 1352a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1362a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Initialize the audio stream between the client and the device using 1372a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // shared mode and a lowest possible glitch-free latency. 1382a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) hr = InitializeAudioEngine(); 1392a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1402a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) opened_ = SUCCEEDED(hr); 1412a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return opened_; 1422a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)} 1432a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1442a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)void WASAPIAudioInputStream::Start(AudioInputCallback* callback) { 1452a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(CalledOnValidThread()); 1462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(callback); 1472a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully"; 1482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (!opened_) 1492a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return; 1502a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1512a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (started_) 1522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return; 1532a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1542a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(!sink_); 1552a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) sink_ = callback; 1562a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Starts periodic AGC microphone measurements if the AGC has been enabled 1582a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // using SetAutomaticGainControl(). 1592a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) StartAgc(); 1602a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1612a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Create and start the thread that will drive the capturing by waiting for 1622a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // capture events. 1632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) capture_thread_ = 1642a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) new base::DelegateSimpleThread(this, "wasapi_capture_thread"); 1652a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) capture_thread_->Start(); 1662a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 1672a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Start streaming data between the endpoint buffer and the audio engine. 1682a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) HRESULT hr = audio_client_->Start(); 1695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DLOG_IF(ERROR, FAILED(hr)) << "Failed to start input streaming."; 1705821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 171c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) if (SUCCEEDED(hr) && audio_render_client_for_loopback_) 1725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) hr = audio_render_client_for_loopback_->Start(); 1735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 1745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) started_ = SUCCEEDED(hr); 1755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 1765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 177c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)void WASAPIAudioInputStream::Stop() { 178c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) DCHECK(CalledOnValidThread()); 179c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) DVLOG(1) << "WASAPIAudioInputStream::Stop()"; 1805821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (!started_) 1815821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return; 1825821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 1835821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Stops periodic AGC microphone measurements. 184c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) StopAgc(); 1855821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 1865821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Shut down the capture thread. 1875821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (stop_capture_event_.IsValid()) { 1885821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) SetEvent(stop_capture_event_.Get()); 1895821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } 1905821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 1915821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Stop the input audio streaming. 1925821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) HRESULT hr = audio_client_->Stop(); 1935821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (FAILED(hr)) { 1945821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) LOG(ERROR) << "Failed to stop input streaming."; 1955821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } 1965821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 1975821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Wait until the thread completes and perform cleanup. 1985821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (capture_thread_) { 1995821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) SetEvent(stop_capture_event_.Get()); 2005821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) capture_thread_->Join(); 2015821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) capture_thread_ = NULL; 20290dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles) } 2035821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2045821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) started_ = false; 2055821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) sink_ = NULL; 2065821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 2075821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 208c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)void WASAPIAudioInputStream::Close() { 2095821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DVLOG(1) << "WASAPIAudioInputStream::Close()"; 2105821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // It is valid to call Close() before calling open or Start(). 2115821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // It is also valid to call Close() after Start() has been called. 2125821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) Stop(); 2135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2145821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Inform the audio manager that we have been closed. This will cause our 2155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // destruction. 2165821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) manager_->ReleaseInputStream(this); 2175821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 2185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)double WASAPIAudioInputStream::GetMaxVolume() { 2205821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Verify that Open() has been called succesfully, to ensure that an audio 2215821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // session exists and that an ISimpleAudioVolume interface has been created. 2225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully"; 2235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (!opened_) 2245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return 0.0; 2255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // The effective volume value is always in the range 0.0 to 1.0, hence 2275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // we can return a fixed value (=1.0) here. 2285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return 1.0; 2295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 2305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)void WASAPIAudioInputStream::SetVolume(double volume) { 2325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DVLOG(1) << "SetVolume(volume=" << volume << ")"; 2335821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DCHECK(CalledOnValidThread()); 2345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DCHECK_GE(volume, 0.0); 2355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DCHECK_LE(volume, 1.0); 2365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2375821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully"; 2385821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (!opened_) 2395821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return; 2405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Set a new master volume level. Valid volume levels are in the range 2425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // 0.0 to 1.0. Ignore volume-change events. 24358537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) HRESULT hr = simple_audio_volume_->SetMasterVolume(static_cast<float>(volume), 24458537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) NULL); 24558537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) DLOG_IF(WARNING, FAILED(hr)) << "Failed to set new input master volume."; 24658537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) 24758537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) // Update the AGC volume level based on the last setting above. Note that, 24858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) // the volume-level resolution is not infinite and it is therefore not 24958537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) // possible to assume that the volume provided as input parameter can be 25058537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) // used directly. Instead, a new query to the audio hardware is required. 25158537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) // This method does nothing if AGC is disabled. 25258537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) UpdateAgcVolume(); 25358537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)} 25458537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) 25558537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)double WASAPIAudioInputStream::GetVolume() { 25658537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) DLOG_IF(ERROR, !opened_) << "Open() has not been called successfully"; 25758537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) if (!opened_) 25858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) return 0.0; 25958537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) 26058537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) // Retrieve the current volume level. The value is in the range 0.0 to 1.0. 261eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch float level = 0.0f; 262eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch HRESULT hr = simple_audio_volume_->GetMasterVolume(&level); 2632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DLOG_IF(WARNING, FAILED(hr)) << "Failed to get input master volume."; 26458537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) 26558537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) return static_cast<double>(level); 26658537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)} 26758537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) 26858537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)// static 26958537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles)AudioParameters WASAPIAudioInputStream::GetInputStreamParameters( 27058537e28ecd584eab876aee8be7156509866d23aTorne (Richard Coles) const std::string& device_id) { 2715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) int sample_rate = 48000; 2725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) ChannelLayout channel_layout = CHANNEL_LAYOUT_STEREO; 2735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) base::win::ScopedCoMem<WAVEFORMATEX> audio_engine_mix_format; 2755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) int effects = AudioParameters::NO_EFFECTS; 2765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (SUCCEEDED(GetMixFormat(device_id, &audio_engine_mix_format, &effects))) { 2775821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) sample_rate = static_cast<int>(audio_engine_mix_format->nSamplesPerSec); 2785821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) channel_layout = audio_engine_mix_format->nChannels == 1 ? 279eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch CHANNEL_LAYOUT_MONO : CHANNEL_LAYOUT_STEREO; 2805821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } 2815821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2825821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Use 10ms frame size as default. 2835821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) int frames_per_buffer = sample_rate / 100; 2842a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return AudioParameters( 2852a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) AudioParameters::AUDIO_PCM_LOW_LATENCY, channel_layout, 0, sample_rate, 2865821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 16, frames_per_buffer, effects); 2875821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 2885821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2895821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// static 2905821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)HRESULT WASAPIAudioInputStream::GetMixFormat(const std::string& device_id, 2915821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) WAVEFORMATEX** device_format, 2925821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) int* effects) { 2935821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DCHECK(effects); 2945821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2955821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // It is assumed that this static method is called from a COM thread, i.e., 2965821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // CoInitializeEx() is not called here to avoid STA/MTA conflicts. 297eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch ScopedComPtr<IMMDeviceEnumerator> enumerator; 298eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch HRESULT hr = enumerator.CreateInstance(__uuidof(MMDeviceEnumerator), NULL, 2995821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) CLSCTX_INPROC_SERVER); 3005821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (FAILED(hr)) 3015821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return hr; 3027d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 3035821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) ScopedComPtr<IMMDevice> endpoint_device; 3045821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (device_id == AudioManagerBase::kDefaultDeviceId) { 3055821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Retrieve the default capture audio endpoint. 3065821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) hr = enumerator->GetDefaultAudioEndpoint(eCapture, eConsole, 3075821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) endpoint_device.Receive()); 3085821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } else if (device_id == AudioManagerBase::kLoopbackInputDeviceId) { 3095821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Get the mix format of the default playback stream. 3105821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) hr = enumerator->GetDefaultAudioEndpoint(eRender, eConsole, 3115821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) endpoint_device.Receive()); 3125821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } else { 3135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Retrieve a capture endpoint device that is specified by an endpoint 3145821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // device-identification string. 3155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) hr = enumerator->GetDevice(base::UTF8ToUTF16(device_id).c_str(), 3167d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) endpoint_device.Receive()); 3175821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } 3185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 3195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (FAILED(hr)) 3205821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return hr; 3215821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 3225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) *effects = IsDefaultCommunicationDevice(enumerator, endpoint_device) ? 3235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) AudioParameters::DUCKING : AudioParameters::NO_EFFECTS; 3245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 325eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch ScopedComPtr<IAudioClient> audio_client; 3265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) hr = endpoint_device->Activate(__uuidof(IAudioClient), 3275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) CLSCTX_INPROC_SERVER, 3285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) NULL, 3295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) audio_client.ReceiveVoid()); 3305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) return SUCCEEDED(hr) ? audio_client->GetMixFormat(device_format) : hr; 3315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)} 33290dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles) 33390dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles)void WASAPIAudioInputStream::Run() { 33490dce4d38c5ff5333bea97d859d4e484e27edf0cTorne (Richard Coles) ScopedCOMInitializer com_init(ScopedCOMInitializer::kMTA); 3355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 3365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Increase the thread priority. 337f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) capture_thread_->SetThreadPriority(base::kThreadPriority_RealtimeAudio); 3385821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 339f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Enable MMCSS to ensure that this thread receives prioritized access to 3405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // CPU resources. 341f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) DWORD task_index = 0; 3425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) HANDLE mm_task = avrt::AvSetMmThreadCharacteristics(L"Pro Audio", 343f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) &task_index); 3445821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) bool mmcss_is_ok = 345f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) (mm_task && avrt::AvSetMmThreadPriority(mm_task, AVRT_PRIORITY_CRITICAL)); 3465821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) if (!mmcss_is_ok) { 3475821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Failed to enable MMCSS on this thread. It is not fatal but can lead 3485821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // to reduced QoS at high load. 3495821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) DWORD err = GetLastError(); 350f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) LOG(WARNING) << "Failed to enable MMCSS (error code=" << err << ")."; 351f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) } 3525821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 353f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Allocate a buffer with a size that enables us to take care of cases like: 3545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // 1) The recorded buffer size is smaller, or does not match exactly with, 355f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // the selected packet size used in each callback. 3565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // 2) The selected buffer size is larger than the recorded buffer size in 357f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // each event. 358f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) size_t buffer_frame_index = 0; 3595821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) size_t capture_buffer_size = std::max( 3605821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2 * endpoint_buffer_size_frames_ * frame_size_, 3615821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 2 * packet_size_frames_ * frame_size_); 3625821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) scoped_ptr<uint8[]> capture_buffer(new uint8[capture_buffer_size]); 3635821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 364f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) LARGE_INTEGER now_count; 3655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) bool recording = true; 366f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) bool error = false; 3675821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) double volume = GetVolume(); 368f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) HANDLE wait_array[2] = {stop_capture_event_, audio_samples_ready_event_}; 3695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 370f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) while (recording && !error) { 3715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) HRESULT hr = S_FALSE; 3725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) 3735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) // Wait for a close-down event or a new capture event. 374eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DWORD wait_result = WaitForMultipleObjects(2, wait_array, FALSE, INFINITE); 375eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch switch (wait_result) { 376eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch case WAIT_FAILED: 377eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch error = true; 378eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch break; 379eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch case WAIT_OBJECT_0 + 0: 380eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // |stop_capture_event_| has been set. 381eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch recording = false; 382eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch break; 383eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch case WAIT_OBJECT_0 + 1: 384eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch { 385eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // |audio_samples_ready_event_| has been set. 386eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch BYTE* data_ptr = NULL; 387eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch UINT32 num_frames_to_read = 0; 388eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DWORD flags = 0; 389eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch UINT64 device_position = 0; 390eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch UINT64 first_audio_frame_timestamp = 0; 391eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 392eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Retrieve the amount of data in the capture endpoint buffer, 393eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // replace it with silence if required, create callbacks for each 394eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // packet and store non-delivered data for the next event. 395eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = audio_capture_client_->GetBuffer(&data_ptr, 396eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch &num_frames_to_read, 397eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch &flags, 398eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch &device_position, 399eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch &first_audio_frame_timestamp); 400eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (FAILED(hr)) { 401eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DLOG(ERROR) << "Failed to get data from the capture buffer"; 402eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch continue; 403eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 404eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 405eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (num_frames_to_read != 0) { 406eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch size_t pos = buffer_frame_index * frame_size_; 407eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch size_t num_bytes = num_frames_to_read * frame_size_; 408eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DCHECK_GE(capture_buffer_size, pos + num_bytes); 409eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 410eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (flags & AUDCLNT_BUFFERFLAGS_SILENT) { 411eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Clear out the local buffer since silence is reported. 412eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch memset(&capture_buffer[pos], 0, num_bytes); 413eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } else { 414eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Copy captured data from audio engine buffer to local buffer. 415eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch memcpy(&capture_buffer[pos], data_ptr, num_bytes); 416eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 417eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 4185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) buffer_frame_index += num_frames_to_read; 4195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) } 4202a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4212a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) hr = audio_capture_client_->ReleaseBuffer(num_frames_to_read); 4222a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DLOG_IF(ERROR, FAILED(hr)) << "Failed to release capture buffer"; 4232a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4242a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Derive a delay estimate for the captured audio packet. 4252a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // The value contains two parts (A+B), where A is the delay of the 426eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // first audio frame in the packet and B is the extra delay 427eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // contained in any stored data. Unit is in audio frames. 4282a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) QueryPerformanceCounter(&now_count); 429eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch double audio_delay_frames = 430eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch ((perf_count_to_100ns_units_ * now_count.QuadPart - 431eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch first_audio_frame_timestamp) / 10000.0) * ms_to_frame_count_ + 432eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch buffer_frame_index - num_frames_to_read; 4332a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4342a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Get a cached AGC volume level which is updated once every second 4352a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // on the audio manager thread. Note that, |volume| is also updated 436eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // each time SetVolume() is called through IPC by the render-side AGC. 4372a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) GetAgcVolume(&volume); 4382a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4392a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Deliver captured data to the registered consumer using a packet 4402a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // size which was specified at construction. 4412a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) uint32 delay_frames = static_cast<uint32>(audio_delay_frames + 0.5); 4422a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) while (buffer_frame_index >= packet_size_frames_) { 4432a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Copy data to audio bus to match the OnData interface. 4442a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) uint8* audio_data = reinterpret_cast<uint8*>(capture_buffer.get()); 4452a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) audio_bus_->FromInterleaved( 4462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) audio_data, audio_bus_->frames(), format_.wBitsPerSample / 8); 4472a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Deliver data packet, delay estimation and volume level to 4492a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // the user. 4502a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) sink_->OnData( 4512a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) this, audio_bus_.get(), delay_frames * frame_size_, volume); 4522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4532a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Store parts of the recorded data which can't be delivered 4542a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // using the current packet size. The stored section will be used 455c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) // either in the next while-loop iteration or in the next 456c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles) // capture event. 4572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) memmove(&capture_buffer[0], 4582a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) &capture_buffer[packet_size_bytes_], 4592a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) (buffer_frame_index - packet_size_frames_) * frame_size_); 4602a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4612a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) buffer_frame_index -= packet_size_frames_; 4622a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) delay_frames -= packet_size_frames_; 463eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 464eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 4652a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) break; 4662a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) default: 4672a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) error = true; 468eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch break; 469eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 470eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 471eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 472eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (recording && error) { 473eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // TODO(henrika): perhaps it worth improving the cleanup here by e.g. 474eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // stopping the audio client, joining the thread etc.? 475eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch NOTREACHED() << "WASAPI capturing failed with error code " 476eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch << GetLastError(); 477eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 4782a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4792a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Disable MMCSS. 4802a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (mm_task && !avrt::AvRevertMmThreadCharacteristics(mm_task)) { 4812a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) PLOG(WARNING) << "Failed to disable MMCSS"; 4822a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) } 4832a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)} 4842a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4852a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)void WASAPIAudioInputStream::HandleError(HRESULT err) { 486eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch NOTREACHED() << "Error code: " << err; 4872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (sink_) 4882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) sink_->OnError(this); 4892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)} 4902a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 4912a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)HRESULT WASAPIAudioInputStream::SetCaptureDevice() { 4922a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DCHECK(!endpoint_device_); 4932a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 494eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch ScopedComPtr<IMMDeviceEnumerator> enumerator; 4952a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) HRESULT hr = enumerator.CreateInstance(__uuidof(MMDeviceEnumerator), 4962a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) NULL, CLSCTX_INPROC_SERVER); 4972a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (FAILED(hr)) 498eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch return hr; 499eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 500eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Retrieve the IMMDevice by using the specified role or the specified 501eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // unique endpoint device-identification string. 502eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 5032a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (effects_ & AudioParameters::DUCKING) { 504eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Ducking has been requested and it is only supported for the default 5052a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // communication device. So, let's open up the communication device and 5062a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // see if the ID of that device matches the requested ID. 5072a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // We consider a kDefaultDeviceId as well as an explicit device id match, 5082a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // to be valid matches. 5092a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) hr = enumerator->GetDefaultAudioEndpoint(eCapture, eCommunications, 5102a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) endpoint_device_.Receive()); 511eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (endpoint_device_ && device_id_ != AudioManagerBase::kDefaultDeviceId) { 512eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch base::win::ScopedCoMem<WCHAR> communications_id; 513eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch endpoint_device_->GetId(&communications_id); 514eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (device_id_ != 515eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch base::WideToUTF8(static_cast<WCHAR*>(communications_id))) { 516eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DLOG(WARNING) << "Ducking has been requested for a non-default device." 517eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch "Not supported."; 518eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // We can't honor the requested effect flag, so turn it off and 5197dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // continue. We'll check this flag later to see if we've actually 520eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // opened up the communications device, so it's important that it 521eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // reflects the active state. 52268043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles) effects_ &= ~AudioParameters::DUCKING; 52368043e1e95eeb07d5cae7aca370b26518b0867d6Torne (Richard Coles) endpoint_device_.Release(); // Fall back on code below. 524eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 525eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 526eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 527eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 528eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (!endpoint_device_) { 529eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (device_id_ == AudioManagerBase::kDefaultDeviceId) { 530eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Retrieve the default capture audio endpoint for the specified role. 531eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Note that, in Windows Vista, the MMDevice API supports device roles 532eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // but the system-supplied user interface programs do not. 533eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = enumerator->GetDefaultAudioEndpoint(eCapture, eConsole, 534eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch endpoint_device_.Receive()); 535eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } else if (device_id_ == AudioManagerBase::kLoopbackInputDeviceId) { 536eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Capture the default playback stream. 537eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = enumerator->GetDefaultAudioEndpoint(eRender, eConsole, 538eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch endpoint_device_.Receive()); 539eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } else { 540eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = enumerator->GetDevice(base::UTF8ToUTF16(device_id_).c_str(), 541eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch endpoint_device_.Receive()); 542eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 543eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 544eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 545eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (FAILED(hr)) 546eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch return hr; 547eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 548eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Verify that the audio endpoint device is active, i.e., the audio 549eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // adapter that connects to the endpoint device is present and enabled. 550eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DWORD state = DEVICE_STATE_DISABLED; 551eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = endpoint_device_->GetState(&state); 552eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (FAILED(hr)) 553eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch return hr; 554eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 555eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (!(state & DEVICE_STATE_ACTIVE)) { 556eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DLOG(ERROR) << "Selected capture device is not active."; 557eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = E_ACCESSDENIED; 558eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } 559eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 560eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch return hr; 561eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch} 562eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 563eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen MurdochHRESULT WASAPIAudioInputStream::ActivateCaptureDevice() { 564eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Creates and activates an IAudioClient COM object given the selected 565eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // capture endpoint device. 566eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch HRESULT hr = endpoint_device_->Activate(__uuidof(IAudioClient), 567eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch CLSCTX_INPROC_SERVER, 568eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch NULL, 569eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch audio_client_.ReceiveVoid()); 570eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch return hr; 571eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch} 572eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 573eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen MurdochHRESULT WASAPIAudioInputStream::GetAudioEngineStreamFormat() { 574eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch HRESULT hr = S_OK; 575eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch#ifndef NDEBUG 576eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // The GetMixFormat() method retrieves the stream format that the 577eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // audio engine uses for its internal processing of shared-mode streams. 578eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // The method always uses a WAVEFORMATEXTENSIBLE structure, instead 579eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // of a stand-alone WAVEFORMATEX structure, to specify the format. 580eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // An WAVEFORMATEXTENSIBLE structure can specify both the mapping of 581eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // channels to speakers and the number of bits of precision in each sample. 582eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch base::win::ScopedCoMem<WAVEFORMATEXTENSIBLE> format_ex; 583eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch hr = audio_client_->GetMixFormat( 584eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch reinterpret_cast<WAVEFORMATEX**>(&format_ex)); 585eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 586eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // See http://msdn.microsoft.com/en-us/windows/hardware/gg463006#EFH 5872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // for details on the WAVE file format. 5882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) WAVEFORMATEX format = format_ex->Format; 5892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << "WAVEFORMATEX:"; 5902a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " wFormatTags : 0x" << std::hex << format.wFormatTag; 5912a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " nChannels : " << format.nChannels; 5922a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " nSamplesPerSec : " << format.nSamplesPerSec; 5932a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " nAvgBytesPerSec: " << format.nAvgBytesPerSec; 5942a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " nBlockAlign : " << format.nBlockAlign; 5952a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " wBitsPerSample : " << format.wBitsPerSample; 5962a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " cbSize : " << format.cbSize; 5972a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 5982a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << "WAVEFORMATEXTENSIBLE:"; 5992a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " wValidBitsPerSample: " << 6002a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) format_ex->Samples.wValidBitsPerSample; 6012a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " dwChannelMask : 0x" << std::hex << 6022a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) format_ex->dwChannelMask; 6032a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (format_ex->SubFormat == KSDATAFORMAT_SUBTYPE_PCM) 6042a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " SubFormat : KSDATAFORMAT_SUBTYPE_PCM"; 6052a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) else if (format_ex->SubFormat == KSDATAFORMAT_SUBTYPE_IEEE_FLOAT) 6062a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " SubFormat : KSDATAFORMAT_SUBTYPE_IEEE_FLOAT"; 6072a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) else if (format_ex->SubFormat == KSDATAFORMAT_SUBTYPE_WAVEFORMATEX) 6082a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(2) << " SubFormat : KSDATAFORMAT_SUBTYPE_WAVEFORMATEX"; 6092a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)#endif 6102a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return hr; 6112a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles)} 6122a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 613eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdochbool WASAPIAudioInputStream::DesiredFormatIsSupported() { 614eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // An application that uses WASAPI to manage shared-mode streams can rely 615eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // on the audio engine to perform only limited format conversions. The audio 6162a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // engine can convert between a standard PCM sample size used by the 617eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // application and the floating-point samples that the engine uses for its 618eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // internal processing. However, the format for an application stream 619eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // typically must have the same number of channels and the same sample 620eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // rate as the stream format used by the device. 621eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Many audio devices support both PCM and non-PCM stream formats. However, 6222a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // the audio engine can mix only PCM streams. 6232a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) base::win::ScopedCoMem<WAVEFORMATEX> closest_match; 6242a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) HRESULT hr = audio_client_->IsFormatSupported(AUDCLNT_SHAREMODE_SHARED, 6252a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) &format_, 626eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch &closest_match); 627eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DLOG_IF(ERROR, hr == S_FALSE) << "Format is not supported " 628eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch << "but a closest match exists."; 629eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch return (hr == S_OK); 630eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch} 631eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch 632eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen MurdochHRESULT WASAPIAudioInputStream::InitializeAudioEngine() { 633eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch DWORD flags; 634eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // Use event-driven mode only fo regular input devices. For loopback the 635eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // EVENTCALLBACK flag is specified when intializing 636eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch // |audio_render_client_for_loopback_|. 637eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch if (device_id_ == AudioManagerBase::kLoopbackInputDeviceId) { 638eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch flags = AUDCLNT_STREAMFLAGS_LOOPBACK | AUDCLNT_STREAMFLAGS_NOPERSIST; 639eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch } else { 640eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch flags = 641eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch AUDCLNT_STREAMFLAGS_EVENTCALLBACK | AUDCLNT_STREAMFLAGS_NOPERSIST; 6422a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) } 6432a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 6442a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Initialize the audio stream between the client and the device. 6452a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // We connect indirectly through the audio engine by using shared mode. 6462a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Note that, |hnsBufferDuration| is set of 0, which ensures that the 6472a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // buffer is never smaller than the minimum buffer size needed to ensure 6482a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // that glitches do not occur between the periodic processing passes. 6492a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // This setting should lead to lowest possible latency. 6502a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) HRESULT hr = audio_client_->Initialize( 6512a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) AUDCLNT_SHAREMODE_SHARED, 6522a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) flags, 6532a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 0, // hnsBufferDuration 6542a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 0, 6552a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) &format_, 6562a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) (effects_ & AudioParameters::DUCKING) ? &kCommunicationsSessionId : NULL); 6572a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 658f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (FAILED(hr)) 659f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) return hr; 660f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 661f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Retrieve the length of the endpoint buffer shared between the client 662f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // and the audio engine. The buffer length determines the maximum amount 6632a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // of capture data that the audio engine can read from the endpoint buffer 6642a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // during a single processing pass. 6652a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // A typical value is 960 audio frames <=> 20ms @ 48kHz sample rate. 6662a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) hr = audio_client_->GetBufferSize(&endpoint_buffer_size_frames_); 6671e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles) if (FAILED(hr)) 6681e9bf3e0803691d0a228da41fc608347b6db4340Torne (Richard Coles) return hr; 6692a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 6702a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) DVLOG(1) << "endpoint buffer size: " << endpoint_buffer_size_frames_ 671f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) << " [frames]"; 672f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 673f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#ifndef NDEBUG 674f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // The period between processing passes by the audio engine is fixed for a 675f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // particular audio endpoint device and represents the smallest processing 676f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // quantum for the audio engine. This period plus the stream latency between 677f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // the buffer and endpoint device represents the minimum possible latency 678f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // that an audio application can achieve. 679f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // TODO(henrika): possibly remove this section when all parts are ready. 680f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) REFERENCE_TIME device_period_shared_mode = 0; 681f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) REFERENCE_TIME device_period_exclusive_mode = 0; 682f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) HRESULT hr_dbg = audio_client_->GetDevicePeriod( 683f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) &device_period_shared_mode, &device_period_exclusive_mode); 684f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (SUCCEEDED(hr_dbg)) { 685f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) DVLOG(1) << "device period: " 686f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) << static_cast<double>(device_period_shared_mode / 10000.0) 6872a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) << " [ms]"; 6882a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) } 6892a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) 690f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) REFERENCE_TIME latency = 0; 691f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) hr_dbg = audio_client_->GetStreamLatency(&latency); 692f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (SUCCEEDED(hr_dbg)) { 693f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) DVLOG(1) << "stream latency: " << static_cast<double>(latency / 10000.0) 694f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) << " [ms]"; 695f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) } 696f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#endif 697f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 698f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Set the event handle that the audio engine will signal each time a buffer 699f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // becomes ready to be processed by the client. 700f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // 701f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // In loopback case the capture device doesn't receive any events, so we 702f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // need to create a separate playback client to get notifications. According 703f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // to MSDN: 704f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // 705f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // A pull-mode capture client does not receive any events when a stream is 706f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // initialized with event-driven buffering and is loopback-enabled. To 707f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // work around this, initialize a render stream in event-driven mode. Each 708f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // time the client receives an event for the render stream, it must signal 709f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // the capture client to run the capture thread that reads the next set of 710f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // samples from the capture endpoint buffer. 711f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // 712f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // http://msdn.microsoft.com/en-us/library/windows/desktop/dd316551(v=vs.85).aspx 713f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (device_id_ == AudioManagerBase::kLoopbackInputDeviceId) { 714f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) hr = endpoint_device_->Activate( 715f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) __uuidof(IAudioClient), CLSCTX_INPROC_SERVER, NULL, 716f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) audio_render_client_for_loopback_.ReceiveVoid()); 717f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (FAILED(hr)) 718f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) return hr; 719f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 720f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) hr = audio_render_client_for_loopback_->Initialize( 721f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) AUDCLNT_SHAREMODE_SHARED, 722f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) AUDCLNT_STREAMFLAGS_EVENTCALLBACK | AUDCLNT_STREAMFLAGS_NOPERSIST, 723f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 0, 0, &format_, NULL); 724f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (FAILED(hr)) 725f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) return hr; 726f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 727f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) hr = audio_render_client_for_loopback_->SetEventHandle( 728f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) audio_samples_ready_event_.Get()); 729f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) } else { 730f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) hr = audio_client_->SetEventHandle(audio_samples_ready_event_.Get()); 731f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) } 732f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 7332a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) if (FAILED(hr)) 7342a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) return hr; 735f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 7362a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // Get access to the IAudioCaptureClient interface. This interface 7372a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) // enables us to read input data from the capture endpoint buffer. 7382a99a7e74a7f215066514fe81d2bfa6639d9edddTorne (Richard Coles) hr = audio_client_->GetService(__uuidof(IAudioCaptureClient), 739f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) audio_capture_client_.ReceiveVoid()); 740f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (FAILED(hr)) 741f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) return hr; 742f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 743f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Obtain a reference to the ISimpleAudioVolume interface which enables 744f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // us to control the master volume level of an audio session. 745f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) hr = audio_client_->GetService(__uuidof(ISimpleAudioVolume), 746f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) simple_audio_volume_.ReceiveVoid()); 747f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) return hr; 748f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)} 749f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 750f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)} // namespace media 751f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)