1 /*
2  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #include "modules/audio_device/win/core_audio_output_win.h"
12 
13 #include <memory>
14 
15 #include "modules/audio_device/audio_device_buffer.h"
16 #include "modules/audio_device/fine_audio_buffer.h"
17 #include "rtc_base/bind.h"
18 #include "rtc_base/checks.h"
19 #include "rtc_base/logging.h"
20 #include "rtc_base/time_utils.h"
21 
22 using Microsoft::WRL::ComPtr;
23 
24 namespace webrtc {
25 namespace webrtc_win {
26 
CoreAudioOutput(bool automatic_restart)27 CoreAudioOutput::CoreAudioOutput(bool automatic_restart)
28     : CoreAudioBase(
29           CoreAudioBase::Direction::kOutput,
30           automatic_restart,
31           [this](uint64_t freq) { return OnDataCallback(freq); },
__anonc8aa5fe70202(ErrorType err) 32           [this](ErrorType err) { return OnErrorCallback(err); }) {
33   RTC_DLOG(INFO) << __FUNCTION__;
34   RTC_DCHECK_RUN_ON(&thread_checker_);
35   thread_checker_audio_.Detach();
36 }
37 
~CoreAudioOutput()38 CoreAudioOutput::~CoreAudioOutput() {
39   RTC_DLOG(INFO) << __FUNCTION__;
40   RTC_DCHECK_RUN_ON(&thread_checker_);
41   Terminate();
42 }
43 
Init()44 int CoreAudioOutput::Init() {
45   RTC_DLOG(INFO) << __FUNCTION__;
46   RTC_DCHECK_RUN_ON(&thread_checker_);
47   return 0;
48 }
49 
Terminate()50 int CoreAudioOutput::Terminate() {
51   RTC_DLOG(INFO) << __FUNCTION__;
52   RTC_DCHECK_RUN_ON(&thread_checker_);
53   StopPlayout();
54   return 0;
55 }
56 
NumDevices() const57 int CoreAudioOutput::NumDevices() const {
58   RTC_DCHECK_RUN_ON(&thread_checker_);
59   return core_audio_utility::NumberOfActiveDevices(eRender);
60 }
61 
SetDevice(int index)62 int CoreAudioOutput::SetDevice(int index) {
63   RTC_DLOG(INFO) << __FUNCTION__ << ": " << index;
64   RTC_DCHECK_GE(index, 0);
65   RTC_DCHECK_RUN_ON(&thread_checker_);
66   return CoreAudioBase::SetDevice(index);
67 }
68 
SetDevice(AudioDeviceModule::WindowsDeviceType device)69 int CoreAudioOutput::SetDevice(AudioDeviceModule::WindowsDeviceType device) {
70   RTC_DLOG(INFO) << __FUNCTION__ << ": "
71                  << ((device == AudioDeviceModule::kDefaultDevice)
72                          ? "Default"
73                          : "DefaultCommunication");
74   RTC_DCHECK_RUN_ON(&thread_checker_);
75   return SetDevice((device == AudioDeviceModule::kDefaultDevice) ? 0 : 1);
76 }
77 
DeviceName(int index,std::string * name,std::string * guid)78 int CoreAudioOutput::DeviceName(int index,
79                                 std::string* name,
80                                 std::string* guid) {
81   RTC_DLOG(INFO) << __FUNCTION__ << ": " << index;
82   RTC_DCHECK_RUN_ON(&thread_checker_);
83   RTC_DCHECK(name);
84   return CoreAudioBase::DeviceName(index, name, guid);
85 }
86 
AttachAudioBuffer(AudioDeviceBuffer * audio_buffer)87 void CoreAudioOutput::AttachAudioBuffer(AudioDeviceBuffer* audio_buffer) {
88   RTC_DLOG(INFO) << __FUNCTION__;
89   RTC_DCHECK_RUN_ON(&thread_checker_);
90   audio_device_buffer_ = audio_buffer;
91 }
92 
PlayoutIsInitialized() const93 bool CoreAudioOutput::PlayoutIsInitialized() const {
94   RTC_DLOG(INFO) << __FUNCTION__;
95   RTC_DCHECK_RUN_ON(&thread_checker_);
96   return initialized_;
97 }
98 
InitPlayout()99 int CoreAudioOutput::InitPlayout() {
100   RTC_DLOG(INFO) << __FUNCTION__ << ": " << IsRestarting();
101   RTC_DCHECK(!initialized_);
102   RTC_DCHECK(!Playing());
103   RTC_DCHECK(!audio_render_client_);
104 
105   // Creates an IAudioClient instance and stores the valid interface pointer in
106   // |audio_client3_|, |audio_client2_|, or |audio_client_| depending on
107   // platform support. The base class will use optimal output parameters and do
108   // an event driven shared mode initialization. The utilized format will be
109   // stored in |format_| and can be used for configuration and allocation of
110   // audio buffers.
111   if (!CoreAudioBase::Init()) {
112     return -1;
113   }
114   RTC_DCHECK(audio_client_);
115 
116   // Configure the playout side of the audio device buffer using |format_|
117   // after a trivial sanity check of the format structure.
118   RTC_DCHECK(audio_device_buffer_);
119   WAVEFORMATEX* format = &format_.Format;
120   RTC_DCHECK_EQ(format->wFormatTag, WAVE_FORMAT_EXTENSIBLE);
121   audio_device_buffer_->SetPlayoutSampleRate(format->nSamplesPerSec);
122   audio_device_buffer_->SetPlayoutChannels(format->nChannels);
123 
124   // Create a modified audio buffer class which allows us to ask for any number
125   // of samples (and not only multiple of 10ms) to match the optimal
126   // buffer size per callback used by Core Audio.
127   // TODO(henrika): can we share one FineAudioBuffer with the input side?
128   fine_audio_buffer_ = std::make_unique<FineAudioBuffer>(audio_device_buffer_);
129 
130   // Create an IAudioRenderClient for an initialized IAudioClient.
131   // The IAudioRenderClient interface enables us to write output data to
132   // a rendering endpoint buffer.
133   ComPtr<IAudioRenderClient> audio_render_client =
134       core_audio_utility::CreateRenderClient(audio_client_.Get());
135   if (!audio_render_client.Get()) {
136     return -1;
137   }
138 
139   ComPtr<IAudioClock> audio_clock =
140       core_audio_utility::CreateAudioClock(audio_client_.Get());
141   if (!audio_clock.Get()) {
142     return -1;
143   }
144 
145   // Store valid COM interfaces.
146   audio_render_client_ = audio_render_client;
147   audio_clock_ = audio_clock;
148 
149   initialized_ = true;
150   return 0;
151 }
152 
StartPlayout()153 int CoreAudioOutput::StartPlayout() {
154   RTC_DLOG(INFO) << __FUNCTION__ << ": " << IsRestarting();
155   RTC_DCHECK(!Playing());
156   RTC_DCHECK(fine_audio_buffer_);
157   RTC_DCHECK(audio_device_buffer_);
158   if (!initialized_) {
159     RTC_DLOG(LS_WARNING)
160         << "Playout can not start since InitPlayout must succeed first";
161   }
162 
163   fine_audio_buffer_->ResetPlayout();
164   if (!IsRestarting()) {
165     audio_device_buffer_->StartPlayout();
166   }
167 
168   if (!core_audio_utility::FillRenderEndpointBufferWithSilence(
169           audio_client_.Get(), audio_render_client_.Get())) {
170     RTC_LOG(LS_WARNING) << "Failed to prepare output endpoint with silence";
171   }
172 
173   num_frames_written_ = endpoint_buffer_size_frames_;
174 
175   if (!Start()) {
176     return -1;
177   }
178 
179   is_active_ = true;
180   return 0;
181 }
182 
StopPlayout()183 int CoreAudioOutput::StopPlayout() {
184   RTC_DLOG(INFO) << __FUNCTION__ << ": " << IsRestarting();
185   if (!initialized_) {
186     return 0;
187   }
188 
189   // Release resources allocated in InitPlayout() and then return if this
190   // method is called without any active output audio.
191   if (!Playing()) {
192     RTC_DLOG(WARNING) << "No output stream is active";
193     ReleaseCOMObjects();
194     initialized_ = false;
195     return 0;
196   }
197 
198   if (!Stop()) {
199     RTC_LOG(LS_ERROR) << "StopPlayout failed";
200     return -1;
201   }
202 
203   if (!IsRestarting()) {
204     RTC_DCHECK(audio_device_buffer_);
205     audio_device_buffer_->StopPlayout();
206   }
207 
208   // Release all allocated resources to allow for a restart without
209   // intermediate destruction.
210   ReleaseCOMObjects();
211 
212   initialized_ = false;
213   is_active_ = false;
214   return 0;
215 }
216 
Playing()217 bool CoreAudioOutput::Playing() {
218   RTC_DLOG(INFO) << __FUNCTION__ << ": " << is_active_;
219   return is_active_;
220 }
221 
222 // TODO(henrika): finalize support of audio session volume control. As is, we
223 // are not compatible with the old ADM implementation since it allows accessing
224 // the volume control with any active audio output stream.
VolumeIsAvailable(bool * available)225 int CoreAudioOutput::VolumeIsAvailable(bool* available) {
226   RTC_DLOG(INFO) << __FUNCTION__;
227   RTC_DCHECK_RUN_ON(&thread_checker_);
228   return IsVolumeControlAvailable(available) ? 0 : -1;
229 }
230 
231 // Triggers the restart sequence. Only used for testing purposes to emulate
232 // a real event where e.g. an active output device is removed.
RestartPlayout()233 int CoreAudioOutput::RestartPlayout() {
234   RTC_DLOG(INFO) << __FUNCTION__;
235   RTC_DCHECK_RUN_ON(&thread_checker_);
236   if (!Playing()) {
237     return 0;
238   }
239   if (!Restart()) {
240     RTC_LOG(LS_ERROR) << "RestartPlayout failed";
241     return -1;
242   }
243   return 0;
244 }
245 
Restarting() const246 bool CoreAudioOutput::Restarting() const {
247   RTC_DLOG(INFO) << __FUNCTION__;
248   RTC_DCHECK_RUN_ON(&thread_checker_);
249   return IsRestarting();
250 }
251 
SetSampleRate(uint32_t sample_rate)252 int CoreAudioOutput::SetSampleRate(uint32_t sample_rate) {
253   RTC_DLOG(INFO) << __FUNCTION__;
254   RTC_DCHECK_RUN_ON(&thread_checker_);
255   sample_rate_ = sample_rate;
256   return 0;
257 }
258 
ReleaseCOMObjects()259 void CoreAudioOutput::ReleaseCOMObjects() {
260   RTC_DLOG(INFO) << __FUNCTION__;
261   CoreAudioBase::ReleaseCOMObjects();
262   if (audio_render_client_.Get()) {
263     audio_render_client_.Reset();
264   }
265 }
266 
OnErrorCallback(ErrorType error)267 bool CoreAudioOutput::OnErrorCallback(ErrorType error) {
268   RTC_DLOG(INFO) << __FUNCTION__ << ": " << as_integer(error);
269   RTC_DCHECK_RUN_ON(&thread_checker_audio_);
270   if (!initialized_ || !Playing()) {
271     return true;
272   }
273 
274   if (error == CoreAudioBase::ErrorType::kStreamDisconnected) {
275     HandleStreamDisconnected();
276   } else {
277     RTC_DLOG(WARNING) << "Unsupported error type";
278   }
279   return true;
280 }
281 
OnDataCallback(uint64_t device_frequency)282 bool CoreAudioOutput::OnDataCallback(uint64_t device_frequency) {
283   RTC_DCHECK_RUN_ON(&thread_checker_audio_);
284   if (num_data_callbacks_ == 0) {
285     RTC_LOG(INFO) << "--- Output audio stream is alive ---";
286   }
287   // Get the padding value which indicates the amount of valid unread data that
288   // the endpoint buffer currently contains.
289   UINT32 num_unread_frames = 0;
290   _com_error error = audio_client_->GetCurrentPadding(&num_unread_frames);
291   if (error.Error() == AUDCLNT_E_DEVICE_INVALIDATED) {
292     // Avoid breaking the thread loop implicitly by returning false and return
293     // true instead for AUDCLNT_E_DEVICE_INVALIDATED even it is a valid error
294     // message. We will use notifications about device changes instead to stop
295     // data callbacks and attempt to restart streaming .
296     RTC_DLOG(LS_ERROR) << "AUDCLNT_E_DEVICE_INVALIDATED";
297     return true;
298   }
299   if (FAILED(error.Error())) {
300     RTC_LOG(LS_ERROR) << "IAudioClient::GetCurrentPadding failed: "
301                       << core_audio_utility::ErrorToString(error);
302     return false;
303   }
304 
305   // Contains how much new data we can write to the buffer without the risk of
306   // overwriting previously written data that the audio engine has not yet read
307   // from the buffer. I.e., it is the maximum buffer size we can request when
308   // calling IAudioRenderClient::GetBuffer().
309   UINT32 num_requested_frames =
310       endpoint_buffer_size_frames_ - num_unread_frames;
311   if (num_requested_frames == 0) {
312     RTC_DLOG(LS_WARNING)
313         << "Audio thread is signaled but no new audio samples are needed";
314     return true;
315   }
316 
317   // Request all available space in the rendering endpoint buffer into which the
318   // client can later write an audio packet.
319   uint8_t* audio_data;
320   error = audio_render_client_->GetBuffer(num_requested_frames, &audio_data);
321   if (FAILED(error.Error())) {
322     RTC_LOG(LS_ERROR) << "IAudioRenderClient::GetBuffer failed: "
323                       << core_audio_utility::ErrorToString(error);
324     return false;
325   }
326 
327   // Update output delay estimate but only about once per second to save
328   // resources. The estimate is usually stable.
329   if (num_data_callbacks_ % 100 == 0) {
330     // TODO(henrika): note that FineAudioBuffer adds latency as well.
331     latency_ms_ = EstimateOutputLatencyMillis(device_frequency);
332     if (num_data_callbacks_ % 500 == 0) {
333       RTC_DLOG(INFO) << "latency: " << latency_ms_;
334     }
335   }
336 
337   // Get audio data from WebRTC and write it to the allocated buffer in
338   // |audio_data|. The playout latency is not updated for each callback.
339   fine_audio_buffer_->GetPlayoutData(
340       rtc::MakeArrayView(reinterpret_cast<int16_t*>(audio_data),
341                          num_requested_frames * format_.Format.nChannels),
342       latency_ms_);
343 
344   // Release the buffer space acquired in IAudioRenderClient::GetBuffer.
345   error = audio_render_client_->ReleaseBuffer(num_requested_frames, 0);
346   if (FAILED(error.Error())) {
347     RTC_LOG(LS_ERROR) << "IAudioRenderClient::ReleaseBuffer failed: "
348                       << core_audio_utility::ErrorToString(error);
349     return false;
350   }
351 
352   num_frames_written_ += num_requested_frames;
353   ++num_data_callbacks_;
354 
355   return true;
356 }
357 
358 // TODO(henrika): IAudioClock2::GetDevicePosition could perhaps be used here
359 // instead. Tried it once, but it crashed for capture devices.
EstimateOutputLatencyMillis(uint64_t device_frequency)360 int CoreAudioOutput::EstimateOutputLatencyMillis(uint64_t device_frequency) {
361   UINT64 position = 0;
362   UINT64 qpc_position = 0;
363   int delay_ms = 0;
364   // Get the device position through output parameter |position|. This is the
365   // stream position of the sample that is currently playing through the
366   // speakers.
367   _com_error error = audio_clock_->GetPosition(&position, &qpc_position);
368   if (error.Error() == S_OK) {
369     // Number of frames already played out through the speaker.
370     const uint64_t num_played_out_frames =
371         format_.Format.nSamplesPerSec * position / device_frequency;
372 
373     // Number of frames that have been written to the buffer but not yet
374     // played out corresponding to the estimated latency measured in number
375     // of audio frames.
376     const uint64_t delay_frames = num_frames_written_ - num_played_out_frames;
377 
378     // Convert latency in number of frames into milliseconds.
379     webrtc::TimeDelta delay =
380         webrtc::TimeDelta::Micros(delay_frames * rtc::kNumMicrosecsPerSec /
381                                   format_.Format.nSamplesPerSec);
382     delay_ms = delay.ms();
383   }
384   return delay_ms;
385 }
386 
387 // Called from OnErrorCallback() when error type is kStreamDisconnected.
388 // Note that this method is called on the audio thread and the internal restart
389 // sequence is also executed on that same thread. The audio thread is therefore
390 // not stopped during restart. Such a scheme also makes the restart process less
391 // complex.
392 // Note that, none of the called methods are thread checked since they can also
393 // be called on the main thread. Thread checkers are instead added on one layer
394 // above (in audio_device_module.cc) which ensures that the public API is thread
395 // safe.
396 // TODO(henrika): add more details.
HandleStreamDisconnected()397 bool CoreAudioOutput::HandleStreamDisconnected() {
398   RTC_DLOG(INFO) << "<<<--- " << __FUNCTION__;
399   RTC_DCHECK_RUN_ON(&thread_checker_audio_);
400   RTC_DCHECK(automatic_restart());
401 
402   if (StopPlayout() != 0) {
403     return false;
404   }
405 
406   if (!SwitchDeviceIfNeeded()) {
407     return false;
408   }
409 
410   if (InitPlayout() != 0) {
411     return false;
412   }
413   if (StartPlayout() != 0) {
414     return false;
415   }
416 
417   RTC_DLOG(INFO) << __FUNCTION__ << " --->>>";
418   return true;
419 }
420 
421 }  // namespace webrtc_win
422 
423 }  // namespace webrtc
424