// Copyright 2012 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "media/audio/win/audio_low_latency_output_win.h"
#include <objbase.h>
#include <Functiondiscoverykeys_devpkey.h>
#include <audiopolicy.h>
#include <inttypes.h>
#include <climits>
#include <memory>
#include "base/command_line.h"
#include "base/functional/callback.h"
#include "base/logging.h"
#include "base/metrics/histogram.h"
#include "base/metrics/histogram_functions.h"
#include "base/metrics/histogram_macros.h"
#include "base/strings/stringprintf.h"
#include "base/strings/utf_string_conversions.h"
#include "base/task/bind_post_task.h"
#include "base/time/time.h"
#include "base/trace_event/base_tracing.h"
#include "base/win/scoped_propvariant.h"
#include "media/audio/audio_device_description.h"
#include "media/audio/win/audio_manager_win.h"
#include "media/audio/win/audio_session_event_listener_win.h"
#include "media/audio/win/avrt_wrapper_win.h"
#include "media/audio/win/core_audio_util_win.h"
#include "media/base/amplitude_peak_detector.h"
#include "media/base/audio_glitch_info.h"
#include "media/base/audio_sample_types.h"
#include "media/base/audio_timestamp_helper.h"
#include "media/base/limits.h"
#include "media/base/media_switches.h"
using base::win::ScopedCoMem;
using base::win::ScopedCOMInitializer;
namespace media {
namespace {
constexpr char kOpenFailureHistogram[] = "Media.Audio.Output.Win.OpenError";
constexpr char kStartFailureHistogram[] = "Media.Audio.Output.Win.StartError";
constexpr char kStopFailureHistogram[] = "Media.Audio.Output.Win.StopError";
constexpr char kRunFailureHistogram[] = "Media.Audio.Output.Win.RunError";
constexpr char kRenderFailureHistogram[] = "Media.Audio.Output.Win.RenderError";
void RecordAudioFailure(const char* histogram, HRESULT hr) {
base::UmaHistogramSparse(histogram, hr);
}
// Converts a COM error into a human-readable string.
std::string ErrorToString(HRESULT hresult) {
return CoreAudioUtil::ErrorToString(hresult);
}
const char* RoleToString(const ERole role) {
switch (role) {
case eConsole:
return "Console";
case eMultimedia:
return "Multimedia";
case eCommunications:
return "Communications";
default:
return "Unsupported";
}
}
} // namespace
// static
AUDCLNT_SHAREMODE
WASAPIAudioOutputStream::GetShareMode() {
const base::CommandLine* cmd_line = base::CommandLine::ForCurrentProcess();
if (cmd_line->HasSwitch(switches::kEnableExclusiveAudio))
return AUDCLNT_SHAREMODE_EXCLUSIVE;
return AUDCLNT_SHAREMODE_SHARED;
}
WASAPIAudioOutputStream::WASAPIAudioOutputStream(
AudioManagerWin* manager,
const std::string& device_id,
const AudioParameters& params,
ERole device_role,
AudioManager::LogCallback log_callback)
: creating_thread_id_(base::PlatformThread::CurrentId()),
manager_(manager),
glitch_reporter_(SystemGlitchReporter::StreamType::kRender),
format_(),
params_(params),
opened_(false),
volume_(1.0),
packet_size_frames_(0),
requested_iaudioclient3_buffer_size_(0),
packet_size_bytes_(0),
endpoint_buffer_size_frames_(0),
device_id_(device_id),
device_role_(device_role),
share_mode_(GetShareMode()),
num_written_frames_(0),
source_(nullptr),
log_callback_(std::move(log_callback)) {
DCHECK(manager_);
#if BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
if (params.format() == AudioParameters::AUDIO_BITSTREAM_DTS)
DCHECK_EQ(GetShareMode(), AUDCLNT_SHAREMODE_EXCLUSIVE);
#endif // BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
// The empty string is used to indicate a default device and the
// |device_role_| member controls whether that's the default or default
// communications device.
DCHECK_NE(device_id_, AudioDeviceDescription::kDefaultDeviceId);
DCHECK_NE(device_id_, AudioDeviceDescription::kCommunicationsDeviceId);
SendLogMessage("%s({device_id=%s}, {params=[%s]}, {role=%s})", __func__,
device_id.c_str(), params.AsHumanReadableString().c_str(),
RoleToString(device_role));
// Load the Avrt DLL if not already loaded. Required to support MMCSS.
bool avrt_init = avrt::Initialize();
if (!avrt_init)
SendLogMessage("%s => (WARNING: failed to load Avrt.dll)", __func__);
// The params passed in may not be meant for audio offload; audio offload
// must be force-disabled later if the params are not suited for it.
audio_bus_ = AudioBus::Create(params);
AudioParameters::HardwareCapabilities hardware_capabilities =
params.hardware_capabilities().value_or(
AudioParameters::HardwareCapabilities());
  // Only request an explicit buffer size if we are requesting something
  // other than the default and exactly the minimum supported by the
  // hardware; everything else uses the older IAudioClient API.
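  // As an illustration (hypothetical values): with hardware capabilities of
  // {min_frames_per_buffer=128, default_frames_per_buffer=480}, a request
  // for 128 frames is routed through IAudioClient3 below, while a request
  // for 480 (or any other value) leaves
  // |requested_iaudioclient3_buffer_size_| at 0 and uses IAudioClient.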
if (params.frames_per_buffer() !=
hardware_capabilities.default_frames_per_buffer &&
params.frames_per_buffer() ==
hardware_capabilities.min_frames_per_buffer) {
requested_iaudioclient3_buffer_size_ =
hardware_capabilities.min_frames_per_buffer;
}
// All events are auto-reset events and non-signaled initially.
// Create the event which the audio engine will signal each time
// a buffer becomes ready to be processed by the client.
audio_samples_render_event_.Set(CreateEvent(nullptr, FALSE, FALSE, nullptr));
DCHECK(audio_samples_render_event_.IsValid());
  // Create the event which will be set in Stop() when rendering shall stop.
stop_render_event_.Set(CreateEvent(nullptr, FALSE, FALSE, nullptr));
DCHECK(stop_render_event_.IsValid());
}
WASAPIAudioOutputStream::~WASAPIAudioOutputStream() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
StopAudioSessionEventListener();
}
bool WASAPIAudioOutputStream::Open() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
SendLogMessage("%s([opened=%s])", __func__, opened_ ? "true" : "false");
if (opened_)
return true;
DCHECK(!audio_client_.Get());
DCHECK(!audio_render_client_.Get());
const bool communications_device =
device_id_.empty() ? (device_role_ == eCommunications) : false;
Microsoft::WRL::ComPtr<IAudioClient> audio_client(
CoreAudioUtil::CreateClient(device_id_, eRender, device_role_));
if (!audio_client.Get()) {
RecordAudioFailure(kOpenFailureHistogram, GetLastError());
SendLogMessage("%s => (ERROR: CAU::CreateClient failed)", __func__);
return false;
}
HRESULT hr = S_FALSE;
enable_audio_offload_ = params_.RequireOffload();
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED && enable_audio_offload_) {
enable_audio_offload_ =
CoreAudioUtil::EnableOffloadForClient(audio_client.Get());
if (!enable_audio_offload_) {
SendLogMessage("%s => (INFO: Not enrolling into audio offload.",
__func__);
// Return here to allow falling back to non-offload mode.
return false;
}
}
  // Set up the wave format after audio offload has possibly been enabled.
SetupWaveFormat();
  // Extra sanity check to ensure that the provided device format is still
  // valid.
if (!CoreAudioUtil::IsFormatSupported(audio_client.Get(), share_mode_,
&format_)) {
RecordAudioFailure(kOpenFailureHistogram, GetLastError());
SendLogMessage("%s => (ERROR: CAU::IsFormatSupported failed)", __func__);
return false;
}
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
// Initialize the audio stream between the client and the device in shared
// mode and using event-driven buffer handling.
hr = CoreAudioUtil::SharedModeInitialize(
audio_client.Get(), &format_, audio_samples_render_event_.Get(),
requested_iaudioclient3_buffer_size_, &endpoint_buffer_size_frames_,
communications_device ? &kCommunicationsSessionId : nullptr,
enable_audio_offload_);
if (FAILED(hr)) {
RecordAudioFailure(kOpenFailureHistogram, hr);
SendLogMessage("%s => (ERROR: IAudioClient::SharedModeInitialize=[%s])",
__func__, ErrorToString(hr).c_str());
      // With audio offload requested, initialization may fail if resources
      // for audio offload are limited. For low-latency output, the audio
      // output resampler will fall back to non-offload mode first; if
      // initialization still fails, it will then fall back to linear PCM.
return false;
}
REFERENCE_TIME device_period = 0;
if (FAILED(CoreAudioUtil::GetDevicePeriod(
audio_client.Get(), AUDCLNT_SHAREMODE_SHARED, &device_period))) {
RecordAudioFailure(kOpenFailureHistogram, GetLastError());
return false;
}
UINT32 preferred_frames_per_buffer = 0;
if (enable_audio_offload_) {
audio_client->GetBufferSize(&preferred_frames_per_buffer);
      // If the granted buffer size differs from the requested buffer size,
      // re-initialize the audio bus.
if (packet_size_frames_ != preferred_frames_per_buffer) {
AudioParameters params = AudioParameters(params_);
params.set_frames_per_buffer(preferred_frames_per_buffer);
audio_bus_ = AudioBus::Create(params);
        // In the offload case, the GetBuffer() API requires the preferred
        // buffer size to be used or it will fail.
packet_size_frames_ = preferred_frames_per_buffer;
packet_size_bytes_ = params.GetBytesPerBuffer(kSampleFormatS16);
}
} else {
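      // Derive the preferred buffer size from the device period. E.g., with
      // the common (but not guaranteed) 10 ms shared-mode period at 48 kHz,
      // this evaluates to 480 audio frames.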
preferred_frames_per_buffer = AudioTimestampHelper::TimeToFrames(
CoreAudioUtil::ReferenceTimeToTimeDelta(device_period),
format_.Format.nSamplesPerSec);
}
SendLogMessage("%s => (preferred_frames_per_buffer=[%d audio frames])",
__func__, preferred_frames_per_buffer);
// Packet size should always be an even divisor of the device period for
// best performance; things will still work otherwise, but may glitch for a
// couple of reasons.
//
    // The first reason is if/when repeated RenderAudioFromSource() calls
    // hit the shared memory boundary between the renderer and the browser.
    // The next audio buffer is always requested after the current request
    // is consumed.
// With back-to-back calls the round-trip may not be fast enough and thus
// audio will glitch as we fail to deliver audio in a timely manner.
//
// The second reason is event wakeup efficiency. We may have too few or too
// many frames to fill the output buffer requested by WASAPI. If too few,
// we'll refuse the render event and wait until more output space is
// available. If we have too many frames, we'll only partially fill and
// wait for the next render event. In either case certain remainders may
// leave us unable to fulfill the request in a timely manner, thus glitches.
//
// Log a warning in these cases so we can help users in the field.
// Examples: 48kHz => 960 % 480, 44.1kHz => 896 % 448 or 882 % 441.
if (preferred_frames_per_buffer % packet_size_frames_) {
SendLogMessage(
"%s => (WARNING: Using output audio with a non-optimal buffer size)",
__func__);
}
} else {
SendLogMessage(
"%s => (WARNING: Using exclusive mode can lead to bad performance)",
__func__);
// TODO(henrika): break out to CoreAudioUtil::ExclusiveModeInitialize()
// when removing the enable-exclusive-audio flag.
hr = ExclusiveModeInitialization(audio_client.Get(),
audio_samples_render_event_.Get(),
&endpoint_buffer_size_frames_);
if (FAILED(hr))
return false;
// The buffer scheme for exclusive mode streams is not designed for max
// flexibility. We only allow a "perfect match" between the packet size set
// by the user and the actual endpoint buffer size.
if (endpoint_buffer_size_frames_ != packet_size_frames_) {
LOG(ERROR) << "Bailing out due to non-perfect timing.";
return false;
}
}
// Create an IAudioRenderClient client for an initialized IAudioClient.
// The IAudioRenderClient interface enables us to write output data to
// a rendering endpoint buffer.
Microsoft::WRL::ComPtr<IAudioRenderClient> audio_render_client =
CoreAudioUtil::CreateRenderClient(audio_client.Get());
if (!audio_render_client.Get()) {
RecordAudioFailure(kOpenFailureHistogram, GetLastError());
SendLogMessage("%s => (ERROR: CAU::CreateRenderClient failed)", __func__);
return false;
}
// Store valid COM interfaces.
audio_client_ = audio_client;
audio_render_client_ = audio_render_client;
hr = audio_client_->GetService(IID_PPV_ARGS(&audio_clock_));
if (FAILED(hr)) {
RecordAudioFailure(kOpenFailureHistogram, hr);
SendLogMessage("%s => (ERROR: IAudioClient::GetService(IAudioClock)=[%s])",
__func__, ErrorToString(hr).c_str());
return false;
}
StartAudioSessionEventListener();
opened_ = true;
return true;
}
void WASAPIAudioOutputStream::Start(AudioSourceCallback* callback) {
DVLOG(1) << "WASAPIAudioOutputStream::Start()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
CHECK(callback);
CHECK(opened_);
SendLogMessage("%s([opened=%s, started=%s])", __func__,
opened_ ? "true" : "false", render_thread_ ? "true" : "false");
if (render_thread_) {
CHECK_EQ(callback, source_);
return;
}
// Since a device change may occur between Open() and Start() we need to
// signal the change once we have a |callback|. It's okay if this ends up
// being delivered multiple times.
if (device_changed_) {
callback->OnError(AudioSourceCallback::ErrorType::kDeviceChange);
return;
}
// Ensure that the endpoint buffer is prepared with silence. Also serves as
// a sanity check for the IAudioClient and IAudioRenderClient which may have
// been invalidated by Windows since the last Stop() call.
//
// While technically we only need to retry when WASAPI tells us the device has
// been invalidated (AUDCLNT_E_DEVICE_INVALIDATED), we retry for all errors
// for simplicity and due to large sites like YouTube reporting high success
// rates with a simple retry upon detection of an audio output error.
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
if (!CoreAudioUtil::FillRenderEndpointBufferWithSilence(
audio_client_.Get(), audio_render_client_.Get())) {
      // Failed to prepare the endpoint buffers with silence. Attempt
      // recovery with a new IAudioClient and IAudioRenderClient.
SendLogMessage(
"%s => (WARNING: CAU::FillRenderEndpointBufferWithSilence failed)",
__func__);
opened_ = false;
audio_client_.Reset();
audio_render_client_.Reset();
if (!Open() || !CoreAudioUtil::FillRenderEndpointBufferWithSilence(
audio_client_.Get(), audio_render_client_.Get())) {
RecordAudioFailure(kStartFailureHistogram, GetLastError());
SendLogMessage("%s => (ERROR: Recovery attempt failed)", __func__);
callback->OnError(AudioSourceCallback::ErrorType::kUnknown);
return;
}
}
}
source_ = callback;
num_written_frames_ = endpoint_buffer_size_frames_;
last_position_ = 0;
last_qpc_position_ = 0;
  // Recreate `peak_detector_` every time we create a new `render_thread_`,
  // to avoid ThreadChecker DCHECKs.
peak_detector_ = std::make_unique<AmplitudePeakDetector>(base::BindRepeating(
&AudioManager::TraceAmplitudePeak, base::Unretained(manager_),
/*trace_start=*/false));
// Create and start the thread that will drive the rendering by waiting for
// render events.
render_thread_ = std::make_unique<base::DelegateSimpleThread>(
this, "wasapi_render_thread",
base::SimpleThread::Options(base::ThreadType::kRealtimeAudio));
render_thread_->Start();
if (!render_thread_->HasBeenStarted()) {
RecordAudioFailure(kStartFailureHistogram, GetLastError());
SendLogMessage("%s => (ERROR: Failed to start \"wasapi_render_thread\")",
__func__);
StopThread();
callback->OnError(AudioSourceCallback::ErrorType::kUnknown);
return;
}
// Start streaming data between the endpoint buffer and the audio engine.
HRESULT hr = audio_client_->Start();
if (FAILED(hr)) {
RecordAudioFailure(kStartFailureHistogram, hr);
SendLogMessage("%s => (ERROR: IAudioClient::Start=[%s])", __func__,
ErrorToString(hr).c_str());
StopThread();
callback->OnError(AudioSourceCallback::ErrorType::kUnknown);
}
}
void WASAPIAudioOutputStream::Stop() {
DVLOG(1) << "WASAPIAudioOutputStream::Stop()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
SendLogMessage("%s([started=%s])", __func__,
render_thread_ ? "true" : "false");
if (!render_thread_)
return;
// Stop output audio streaming.
HRESULT hr = audio_client_->Stop();
if (FAILED(hr)) {
RecordAudioFailure(kStopFailureHistogram, hr);
SendLogMessage("%s => (ERROR: IAudioClient::Stop=[%s])", __func__,
ErrorToString(hr).c_str());
source_->OnError(AudioSourceCallback::ErrorType::kUnknown);
}
// Make a local copy of |source_| since StopThread() will clear it.
AudioSourceCallback* callback = source_;
StopThread();
// Flush all pending data and reset the audio clock stream position to 0.
hr = audio_client_->Reset();
if (FAILED(hr)) {
RecordAudioFailure(kStopFailureHistogram, hr);
SendLogMessage("%s => (ERROR: IAudioClient::Reset=[%s])", __func__,
ErrorToString(hr).c_str());
callback->OnError(AudioSourceCallback::ErrorType::kUnknown);
}
ReportAndResetStats();
// Extra safety check to ensure that the buffers are cleared.
// If the buffers are not cleared correctly, the next call to Start()
// would fail with AUDCLNT_E_BUFFER_ERROR at IAudioRenderClient::GetBuffer().
  // This check is only needed for shared-mode streams.
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
UINT32 num_queued_frames = 0;
audio_client_->GetCurrentPadding(&num_queued_frames);
DCHECK_EQ(0u, num_queued_frames);
if (num_queued_frames > 0) {
SendLogMessage("%s => (WARNING: Buffers are not cleared correctly)",
__func__);
}
}
}
void WASAPIAudioOutputStream::Close() {
DVLOG(1) << "WASAPIAudioOutputStream::Close()";
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
SendLogMessage("%s()", __func__);
StopAudioSessionEventListener();
  // It is valid to call Close() before calling Open() or Start().
// It is also valid to call Close() after Start() has been called.
Stop();
// Inform the audio manager that we have been closed. This will cause our
// destruction.
manager_->ReleaseOutputStream(this);
}
// This stream is always used with sub second buffer sizes, where it's
// sufficient to simply always flush upon Start().
void WASAPIAudioOutputStream::Flush() {}
void WASAPIAudioOutputStream::SetVolume(double volume) {
#if BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
if (params_.format() == AudioParameters::AUDIO_BITSTREAM_DTS)
return;
#endif // BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
SendLogMessage("%s({volume=%.2f})", __func__, volume);
float volume_float = static_cast<float>(volume);
if (volume_float < 0.0f || volume_float > 1.0f) {
return;
}
volume_ = volume_float;
}
void WASAPIAudioOutputStream::GetVolume(double* volume) {
*volume = static_cast<double>(volume_);
}
void WASAPIAudioOutputStream::SendLogMessage(const char* format, ...) {
if (log_callback_.is_null())
return;
va_list args;
va_start(args, format);
log_callback_.Run("WAOS::" + base::StringPrintV(format, args) +
base::StringPrintf(" [this=0x%" PRIXPTR "]",
reinterpret_cast<uintptr_t>(this)));
va_end(args);
}
void WASAPIAudioOutputStream::Run() {
ScopedCOMInitializer com_init(ScopedCOMInitializer::kMTA);
// Enable MMCSS to ensure that this thread receives prioritized access to
// CPU resources.
DWORD task_index = 0;
HANDLE mm_task =
avrt::AvSetMmThreadCharacteristics(L"Pro Audio", &task_index);
bool mmcss_is_ok =
(mm_task && avrt::AvSetMmThreadPriority(mm_task, AVRT_PRIORITY_CRITICAL));
if (!mmcss_is_ok) {
// Failed to enable MMCSS on this thread. It is not fatal but can lead
// to reduced QoS at high load.
DWORD err = GetLastError();
LOG(ERROR) << "WAOS::" << __func__
<< " => (ERROR: Failed to enable MMCSS (error code=" << err
<< "))";
}
HRESULT hr = S_FALSE;
bool playing = true;
bool error = false;
HANDLE wait_array[] = {stop_render_event_.Get(),
audio_samples_render_event_.Get()};
UINT64 device_frequency = 0;
// The device frequency is the frequency generated by the hardware clock in
// the audio device. The GetFrequency() method reports a constant frequency.
hr = audio_clock_->GetFrequency(&device_frequency);
error = FAILED(hr);
if (error) {
RecordAudioFailure(kRunFailureHistogram, hr);
LOG(ERROR) << "WAOS::" << __func__
<< " => (ERROR: IAudioClock::GetFrequency=["
<< ErrorToString(hr).c_str() << "])";
}
// Keep rendering audio until the stop event or the stream-switch event
// is signaled. An error event can also break the main thread loop.
while (playing && !error) {
// Wait for a close-down event, stream-switch event or a new render event.
DWORD wait_result = WaitForMultipleObjects(std::size(wait_array),
wait_array, FALSE, INFINITE);
switch (wait_result) {
case WAIT_OBJECT_0 + 0:
// |stop_render_event_| has been set.
playing = false;
break;
case WAIT_OBJECT_0 + 1:
// |audio_samples_render_event_| has been set.
error = !RenderAudioFromSource(device_frequency);
break;
default:
error = true;
break;
}
}
if (playing && error) {
RecordAudioFailure(kRunFailureHistogram, GetLastError());
LOG(ERROR) << "WAOS::" << __func__
<< " => (ERROR: WASAPI rendering failed)";
    // Stop audio rendering since something has gone wrong in our main thread
    // loop. Note that we are still in a "started" state, hence a Stop() call
    // is required to join the thread properly.
audio_client_->Stop();
// Notify clients that something has gone wrong and that this stream should
// be destroyed instead of reused in the future.
source_->OnError(AudioSourceCallback::ErrorType::kUnknown);
}
// Disable MMCSS.
if (mm_task && !avrt::AvRevertMmThreadCharacteristics(mm_task)) {
LOG(WARNING) << "WAOS::" << __func__
<< " => (WARNING: Failed to disable MMCSS)";
}
}
bool WASAPIAudioOutputStream::RenderAudioFromSource(UINT64 device_frequency) {
TRACE_EVENT(
"audio", "RenderAudioFromSource", [&](perfetto::EventContext ctx) {
auto* event = ctx.event<perfetto::protos::pbzero::ChromeTrackEvent>();
auto* data = event->set_win_render_audio_from_source();
data->set_iaudioclock_device_frequency(device_frequency);
data->set_iaudioclient_buffer_size_frames(endpoint_buffer_size_frames_);
});
const base::TimeDelta buffer_duration =
media::AudioTimestampHelper::FramesToTime(packet_size_frames_,
format_.Format.nSamplesPerSec);
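  // Example: 480-frame packets at 48000 Hz give a 10 ms |buffer_duration|;
  // half of it (5 ms) is the glitch threshold used in the gap estimation
  // below.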
HRESULT hr = S_FALSE;
UINT32 num_queued_frames = 0;
uint8_t* audio_data = nullptr;
// Contains how much new data we can write to the buffer without
// the risk of overwriting previously written data that the audio
// engine has not yet read from the buffer.
UINT32 num_available_frames = 0;
if (share_mode_ == AUDCLNT_SHAREMODE_SHARED) {
// Get the padding value which represents the amount of rendering
// data that is queued up to play in the endpoint buffer.
hr = audio_client_->GetCurrentPadding(&num_queued_frames);
if (FAILED(hr)) {
RecordAudioFailure(kRenderFailureHistogram, hr);
LOG(ERROR) << "WAOS::" << __func__
<< " => (ERROR: IAudioClient::GetCurrentPadding=["
<< ErrorToString(hr).c_str() << "])";
return false;
}
TRACE_COUNTER_ID1(TRACE_DISABLED_BY_DEFAULT("audio"),
"IAudioClient_queued_frames", this, num_queued_frames);
if (!num_queued_frames) {
TRACE_EVENT_INSTANT0(TRACE_DISABLED_BY_DEFAULT("audio"), "buffer empty",
TRACE_EVENT_SCOPE_THREAD);
}
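    // E.g., with a 960-frame endpoint buffer and 240 frames still queued,
    // 960 - 240 = 720 new frames can be written without overwriting data
    // the audio engine has not yet read.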
num_available_frames = endpoint_buffer_size_frames_ - num_queued_frames;
} else {
// While the stream is running, the system alternately sends one
// buffer or the other to the client. This form of double buffering
// is referred to as "ping-ponging". Each time the client receives
// a buffer from the system (triggers this event) the client must
// process the entire buffer. Calls to the GetCurrentPadding method
// are unnecessary because the packet size must always equal the
// buffer size. In contrast to the shared mode buffering scheme,
// the latency for an event-driven, exclusive-mode stream depends
// directly on the buffer size.
num_available_frames = endpoint_buffer_size_frames_;
}
TRACE_EVENT(
TRACE_DISABLED_BY_DEFAULT("audio"), "IAudioClient frames",
[&](perfetto::EventContext ctx) {
auto* event = ctx.event<perfetto::protos::pbzero::ChromeTrackEvent>();
auto* data = event->set_win_render_audio_from_source();
data->set_iaudioclient_buffer_unfilled_frames(num_available_frames);
});
// Check if there is enough available space to fit the packet size
// specified by the client. If not, wait until a future callback.
if (num_available_frames < packet_size_frames_)
return true;
// Derive the number of packets we need to get from the client to fill up the
// available area in the endpoint buffer. Well-behaved (> Vista) clients and
// exclusive mode streams should generally have a |num_packets| value of 1.
//
// Vista clients are not able to maintain reliable callbacks, so the endpoint
// buffer may exhaust itself such that back-to-back callbacks are occasionally
// necessary to avoid glitches. In such cases we have no choice but to issue
  // back-to-back reads and pray that the browser side has enough data cached
  // or that the renderer can fulfill the read before we glitch anyway.
//
// API documentation does not guarantee that even on Win7+ clients we won't
// need to fill more than a period size worth of buffers; but in practice this
// appears to be infrequent.
//
// See http://crbug.com/524947.
const size_t num_packets = num_available_frames / packet_size_frames_;
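  // Example: with an empty 960-frame endpoint buffer and 480-frame packets,
  // num_packets = 960 / 480 = 2, i.e. the loop below issues two
  // back-to-back reads.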
for (size_t n = 0; n < num_packets; ++n) {
TRACE_EVENT(TRACE_DISABLED_BY_DEFAULT("audio"), "Write packet",
[&](perfetto::EventContext ctx) {
auto* event =
ctx.event<perfetto::protos::pbzero::ChromeTrackEvent>();
auto* data = event->set_win_render_audio_from_source();
data->set_packet_size_frames(packet_size_frames_);
});
// Grab all available space in the rendering endpoint buffer
// into which the client can write a data packet.
hr = audio_render_client_->GetBuffer(packet_size_frames_, &audio_data);
if (FAILED(hr)) {
RecordAudioFailure(kRenderFailureHistogram, hr);
LOG(ERROR) << "WAOS::" << __func__
<< " => (ERROR: IAudioRenderClient::GetBuffer=["
<< ErrorToString(hr).c_str() << "])";
return false;
}
// Stores glitch info to be passed on to OnMoreData().
AudioGlitchInfo::Accumulator glitch_info_accumulator;
base::TimeDelta delay;
base::TimeTicks delay_timestamp;
UINT64 position = 0;
UINT64 qpc_position = 0;
// TODO(http://crbug.com/1453566): avoid using IAudioClock::GetPosition() on
// a RT thread.
hr = audio_clock_->GetPosition(&position, &qpc_position);
if (SUCCEEDED(hr)) {
TRACE_EVENT_BEGIN(
TRACE_DISABLED_BY_DEFAULT("audio"), "IAudioClock position",
[&](perfetto::EventContext ctx) {
auto* event =
ctx.event<perfetto::protos::pbzero::ChromeTrackEvent>();
auto* data = event->set_win_render_audio_from_source();
data->set_iaudioclock_stream_position(position);
data->set_iaudioclock_qpc_position(qpc_position);
data->set_num_written_frames(num_written_frames_);
});
      // Check for glitches. A glitch is recorded whenever the stream's
      // position has moved forward significantly less than the performance
      // counter has. The threshold is set to half the buffer size, to limit
      // false positives.
// When a stream begins running, its device position might remain 0
// until the audio data has propagated from the endpoint buffer to the
// rendering device. The device position changes to a nonzero value when
// the data begins playing through the device.
if (last_position_ != 0) {
CHECK(last_qpc_position_);
// The device position is the offset from the start of the stream to the
// current position in the stream. The units in which this offset is
// expressed are undefined, the value has meaning only in relation to
// the frequency reported by the IAudioClock::GetFrequency() method,
        // passed as |device_frequency| here. It's expected to be
        // monotonically non-decreasing. It won't advance if we starve the
        // render client by not providing frames to render. Note:
        // WASAPIAudioOutputStream::Run()
// assumes that the frequency is constant throughout the stream
// lifetime. CoreAudio documentation is not exactly clear on that: it
// only says that the device frequency reported by successive calls to
// GetFrequency never changes during the lifetime of a stream "in
// Windows Vista".
if (position < last_position_) {
// http://crbug.com/1473580: according to MS documentation |position|
// is monotonic, but in practice it's not always so.
TRACE_EVENT_INSTANT0(TRACE_DISABLED_BY_DEFAULT("audio"),
"position decrease", TRACE_EVENT_SCOPE_THREAD);
}
        // If |position_time_increase| is negative, we are likely to get a
        // larger |gap_duration| and to register a glitch. In reality, it's
        // unclear whether such an "it should never happen" case is a glitch
        // or not.
base::TimeDelta position_time_increase =
media::AudioTimestampHelper::FramesToTime(position - last_position_,
device_frequency);
// The QPC values are in 100 ns units, according to
// IAudioClock::GetPosition() documentation. Presumably monotonically
// increasing, but there are known cases when it can jump backward due
// to driver bugs, etc.
base::TimeDelta qpc_position_time_increase =
qpc_position < last_qpc_position_
? base::TimeDelta()
: base::Microseconds((qpc_position - last_qpc_position_) / 10);
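        // E.g., a QPC delta of 100000 units is 100000 / 10 = 10000 us,
        // i.e. 10 ms.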
TRACE_EVENT(
TRACE_DISABLED_BY_DEFAULT("audio"), "gap estimation",
[&](perfetto::EventContext ctx) {
auto* event =
ctx.event<perfetto::protos::pbzero::ChromeTrackEvent>();
auto* data = event->set_win_render_audio_from_source();
data->set_iaudioclock_stream_position_increase_ms(
position_time_increase.InMilliseconds());
data->set_iaudioclock_qpc_position_increase_ms(
qpc_position_time_increase.InMilliseconds());
});
        // We probably should not trust |qpc_position| being reported in
        // 100 ns intervals in some cases, for example in a remote desktop
        // situation. Let's see how the QPC-based time compares to
        // base::TimeTicks. Even if we are using a low-resolution timer
        // (~15 ms precision), the difference between the two should be well
        // under 40 ms. But let's be conservative.
// |gap_duration| can be positive or negative. Negative means a bigger
// chunk of the buffer was consumed. Too big (how big?) positive means
// no audio was played for a while, which potentially resulted in a
// glitch.
base::TimeDelta gap_duration =
qpc_position_time_increase - position_time_increase;
// TODO(crbug.com/40257462): Investigate precisely what gap duration
// should be counted as a glitch.
bool is_glitch = gap_duration > buffer_duration / 2;
glitch_reporter_.UpdateStats(is_glitch ? gap_duration
: base::TimeDelta());
if (is_glitch) {
TRACE_EVENT_INSTANT0(TRACE_DISABLED_BY_DEFAULT("audio"), "glitch",
TRACE_EVENT_SCOPE_THREAD);
glitch_info_accumulator.Add(
AudioGlitchInfo::SingleBoundedSystemGlitch(
gap_duration, AudioGlitchInfo::Direction::kRender));
}
}
last_position_ = position;
last_qpc_position_ = qpc_position;
// Number of frames already played out through the speaker (estimation).
const uint64_t played_out_frames =
format_.Format.nSamplesPerSec * position / device_frequency;
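      // When the device clock runs at the sample rate (device_frequency ==
      // nSamplesPerSec), this reduces to |position| itself; in general the
      // ratio rescales the device clock units into audio frames.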
// Number of frames that have been written to the buffer but not yet
// played out. Should theoretically be non-negative, but since
// |played_out_frames| is an approximation, we don't trust this fact
// entirely.
const uint64_t delay_frames =
num_written_frames_ > played_out_frames
? num_written_frames_ - played_out_frames
: 0;
// Convert the delay from frames to time.
delay = media::AudioTimestampHelper::FramesToTime(
delay_frames, format_.Format.nSamplesPerSec);
      // Note: the obtained |qpc_position| value is in 100 ns intervals and
      // shares the same time origin as QPC. We can convert it to
      // microseconds simply by dividing by 10.0, since 10 x 100 ns = 1 us.
delay_timestamp += base::Microseconds(qpc_position * 0.1);
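      // For instance, qpc_position = 50000000 corresponds to
      // 50000000 * 0.1 us = 5 s after the QPC origin.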
TRACE_EVENT_END(
TRACE_DISABLED_BY_DEFAULT("audio"),
// "IAudioClock position",
[&](perfetto::EventContext ctx) {
auto* event =
ctx.event<perfetto::protos::pbzero::ChromeTrackEvent>();
auto* data = event->set_win_render_audio_from_source();
data->set_num_played_out_frames(played_out_frames);
data->set_playout_delay_ms(delay.InMilliseconds());
});
} else {
RecordAudioFailure(kRenderFailureHistogram, hr);
LOG(ERROR) << "WAOS::" << __func__
<< " => (ERROR: IAudioClock::GetPosition=["
<< ErrorToString(hr).c_str() << "])";
// Use a delay of zero.
delay_timestamp = base::TimeTicks::Now();
}
UMA_HISTOGRAM_COUNTS_1000("Media.Audio.Render.SystemDelay",
delay.InMilliseconds());
// Read a data packet from the registered client source and
// deliver a delay estimate in the same callback to the client.
#if BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
if (params_.format() == AudioParameters::AUDIO_BITSTREAM_DTS) {
std::unique_ptr<AudioBus> audio_bus(
AudioBus::WrapMemory(params_, audio_data));
    audio_bus->set_is_bitstream_format(true);
int frames_filled = source_->OnMoreData(
BoundedDelay(delay), delay_timestamp,
glitch_info_accumulator.GetAndReset(), audio_bus.get());
// During pause/seek, keep the pipeline filled with zero'ed frames.
if (!frames_filled) {
      memset(audio_data, 0, packet_size_bytes_);
}
    peak_detector_->FindPeak(audio_bus.get());
// Release the buffer space acquired in the GetBuffer() call.
// Render silence if we were not able to fill up the buffer totally.
audio_render_client_->ReleaseBuffer(packet_size_frames_, 0);
num_written_frames_ += packet_size_frames_;
return true;
}
#endif // BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
int frames_filled = source_->OnMoreData(
BoundedDelay(delay), delay_timestamp,
glitch_info_accumulator.GetAndReset(), audio_bus_.get());
uint32_t num_filled_bytes = frames_filled * format_.Format.nBlockAlign;
DCHECK_LE(num_filled_bytes, packet_size_bytes_);
audio_bus_->Scale(volume_);
if (enable_audio_offload_) {
audio_bus_->ToInterleaved<SignedInt16SampleTypeTraits>(
frames_filled, reinterpret_cast<short*>(audio_data));
} else {
// We skip clipping since that occurs at the shared memory boundary.
audio_bus_->ToInterleaved<Float32SampleTypeTraitsNoClip>(
frames_filled, reinterpret_cast<float*>(audio_data));
}
peak_detector_->FindPeak(audio_bus_.get());
// Release the buffer space acquired in the GetBuffer() call.
// Render silence if we were not able to fill up the buffer totally.
DWORD flags = (num_filled_bytes < packet_size_bytes_)
? AUDCLNT_BUFFERFLAGS_SILENT
: 0;
audio_render_client_->ReleaseBuffer(packet_size_frames_, flags);
num_written_frames_ += packet_size_frames_;
}
return true;
}
HRESULT WASAPIAudioOutputStream::ExclusiveModeInitialization(
IAudioClient* client,
HANDLE event_handle,
uint32_t* endpoint_buffer_size) {
DCHECK_EQ(share_mode_, AUDCLNT_SHAREMODE_EXCLUSIVE);
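  // Convert the packet size from audio frames to a REFERENCE_TIME duration
  // in 100 ns units: frames -> milliseconds, then x10000 with rounding.
  // Worked example (assuming 480-frame packets at 48 kHz):
  //   f = 1000.0 * 480 / 48000 = 10 ms
  //   requested_buffer_duration = 10 * 10000 + 0.5 -> 100000 (i.e. 10 ms).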
float f = (1000.0 * packet_size_frames_) / format_.Format.nSamplesPerSec;
REFERENCE_TIME requested_buffer_duration =
static_cast<REFERENCE_TIME>(f * 10000.0 + 0.5);
DWORD stream_flags = AUDCLNT_STREAMFLAGS_NOPERSIST;
bool use_event =
(event_handle != nullptr && event_handle != INVALID_HANDLE_VALUE);
if (use_event)
stream_flags |= AUDCLNT_STREAMFLAGS_EVENTCALLBACK;
DVLOG(2) << "stream_flags: 0x" << std::hex << stream_flags;
// Initialize the audio stream between the client and the device.
// For an exclusive-mode stream that uses event-driven buffering, the
// caller must specify nonzero values for hnsPeriodicity and
// hnsBufferDuration, and the values of these two parameters must be equal.
// The Initialize method allocates two buffers for the stream. Each buffer
// is equal in duration to the value of the hnsBufferDuration parameter.
// Following the Initialize call for a rendering stream, the caller should
// fill the first of the two buffers before starting the stream.
HRESULT hr = S_FALSE;
hr = client->Initialize(AUDCLNT_SHAREMODE_EXCLUSIVE, stream_flags,
requested_buffer_duration, requested_buffer_duration,
reinterpret_cast<WAVEFORMATEX*>(&format_), nullptr);
if (FAILED(hr)) {
if (hr == AUDCLNT_E_BUFFER_SIZE_NOT_ALIGNED) {
LOG(ERROR) << "AUDCLNT_E_BUFFER_SIZE_NOT_ALIGNED";
UINT32 aligned_buffer_size = 0;
client->GetBufferSize(&aligned_buffer_size);
DVLOG(1) << "Use aligned buffer size instead: " << aligned_buffer_size;
// Calculate new aligned periodicity. Each unit of reference time
// is 100 nanoseconds.
REFERENCE_TIME aligned_buffer_duration = static_cast<REFERENCE_TIME>(
(10000000.0 * aligned_buffer_size / format_.Format.nSamplesPerSec) +
0.5);
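      // E.g., an aligned size of 441 frames at 44100 Hz maps to
      // 10000000 * 441 / 44100 = 100000 units, i.e. 10 ms.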
      // It is possible to re-activate and re-initialize the audio client at
      // this stage, but we bail out with an error code instead, combined
      // with a log message informing about the suggested aligned buffer
      // size that should be used.
DVLOG(1) << "aligned_buffer_duration: "
<< static_cast<double>(aligned_buffer_duration / 10000.0)
<< " [ms]";
} else if (hr == AUDCLNT_E_INVALID_DEVICE_PERIOD) {
// We will get this error if we try to use a smaller buffer size than
// the minimum supported size (usually ~3ms on Windows 7).
LOG(ERROR) << "AUDCLNT_E_INVALID_DEVICE_PERIOD";
}
return hr;
}
if (use_event) {
hr = client->SetEventHandle(event_handle);
if (FAILED(hr)) {
DVLOG(1) << "IAudioClient::SetEventHandle: " << std::hex << hr;
return hr;
}
}
UINT32 buffer_size_in_frames = 0;
hr = client->GetBufferSize(&buffer_size_in_frames);
if (FAILED(hr)) {
DVLOG(1) << "IAudioClient::GetBufferSize: " << std::hex << hr;
return hr;
}
*endpoint_buffer_size = buffer_size_in_frames;
DVLOG(2) << "endpoint buffer size: " << buffer_size_in_frames;
return hr;
}
void WASAPIAudioOutputStream::StopThread() {
if (render_thread_) {
if (render_thread_->HasBeenStarted()) {
// Wait until the thread completes and perform cleanup.
SetEvent(stop_render_event_.Get());
render_thread_->Join();
}
render_thread_.reset();
peak_detector_.reset();
// Ensure that we don't quit the main thread loop immediately next
// time Start() is called.
ResetEvent(stop_render_event_.Get());
}
source_ = nullptr;
}
void WASAPIAudioOutputStream::ReportAndResetStats() {
SystemGlitchReporter::Stats stats =
glitch_reporter_.GetLongTermStatsAndReset();
SendLogMessage(
"%s => (num_glitches_detected=[%d], cumulative_audio_lost=[%llu ms], "
"largest_glitch=[%llu ms])",
__func__, stats.glitches_detected,
stats.total_glitch_duration.InMilliseconds(),
stats.largest_glitch_duration.InMilliseconds());
}
void WASAPIAudioOutputStream::StartAudioSessionEventListener() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
if (session_listener_) {
// Already started listening!
return;
}
HRESULT hr = audio_client_->GetService(IID_PPV_ARGS(&audio_session_control_));
if (FAILED(hr)) {
DLOG(ERROR) << "Failed to get IAudioSessionControl service: " << std::hex
<< hr;
return;
}
session_listener_ = Microsoft::WRL::Make<AudioSessionEventListener>(
base::BindPostTaskToCurrentDefault(
base::BindOnce(&WASAPIAudioOutputStream::OnDeviceChanged,
weak_factory_.GetWeakPtr())));
hr = audio_session_control_->RegisterAudioSessionNotification(
session_listener_.Get());
DLOG_IF(ERROR, FAILED(hr))
<< "IAudioSessionControl::RegisterAudioSessionNotification() failed: "
<< std::hex << hr;
}
void WASAPIAudioOutputStream::StopAudioSessionEventListener() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
if (!session_listener_) {
// Already stopped listening!
return;
}
HRESULT hr = audio_session_control_->UnregisterAudioSessionNotification(
session_listener_.Get());
DLOG_IF(ERROR, FAILED(hr))
<< "IAudioSessionControl::UnregisterAudioSessionNotification() failed: "
<< std::hex << hr;
audio_session_control_.Reset();
session_listener_.Reset();
}
void WASAPIAudioOutputStream::OnDeviceChanged() {
DCHECK_EQ(GetCurrentThreadId(), creating_thread_id_);
device_changed_ = true;
if (source_)
source_->OnError(AudioSourceCallback::ErrorType::kDeviceChange);
}
void WASAPIAudioOutputStream::SetupWaveFormat() {
  // We use the WAVE_FORMAT_EXTENSIBLE structure to ensure that multiple
  // channel ordering and high precision data can be supported.
// Begin with the WAVEFORMATEX structure that specifies the basic format.
WAVEFORMATEX* format = &format_.Format;
// Override for audio offload.
if (enable_audio_offload_) {
format_.SubFormat = KSDATAFORMAT_SUBTYPE_PCM;
format->wBitsPerSample = 16;
packet_size_bytes_ = params_.GetBytesPerBuffer(kSampleFormatS16);
} else {
format->wBitsPerSample = sizeof(float) * 8;
format_.SubFormat = KSDATAFORMAT_SUBTYPE_IEEE_FLOAT;
packet_size_bytes_ = params_.GetBytesPerBuffer(kSampleFormatF32);
}
format->wFormatTag = WAVE_FORMAT_EXTENSIBLE;
format->nChannels = params_.channels();
format->nSamplesPerSec = params_.sample_rate();
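  // E.g., for 2-channel 32-bit float at 48 kHz: nBlockAlign = (32 / 8) * 2
  // = 8 bytes per frame and nAvgBytesPerSec = 48000 * 8 = 384000 bytes/s.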
format->nBlockAlign = (format->wBitsPerSample / 8) * format->nChannels;
format->nAvgBytesPerSec = format->nSamplesPerSec * format->nBlockAlign;
format->cbSize = sizeof(WAVEFORMATEXTENSIBLE) - sizeof(WAVEFORMATEX);
// Add the parts which are unique to WAVE_FORMAT_EXTENSIBLE.
format_.Samples.wValidBitsPerSample = format->wBitsPerSample;
format_.dwChannelMask = CoreAudioUtil::GetChannelConfig(device_id_, eRender);
  // Store the size (in different units) of the audio packets which we
  // expect to get from the audio endpoint device in each render event.
packet_size_frames_ = params_.frames_per_buffer();
#if BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
if (params_.format() == AudioParameters::AUDIO_BITSTREAM_DTS) {
format_.SubFormat = KSDATAFORMAT_SUBTYPE_IEC61937_DTS;
format->wBitsPerSample = 16;
format->nChannels = 2;
format_.dwChannelMask = KSAUDIO_SPEAKER_STEREO;
format_.Samples.wValidBitsPerSample = format->wBitsPerSample;
format->nBlockAlign = (format->wBitsPerSample / 8) * format->nChannels;
format->nAvgBytesPerSec = format->nSamplesPerSec * format->nBlockAlign;
packet_size_frames_ = 512;
packet_size_bytes_ = params_.GetBytesPerBuffer(kSampleFormatS16);
}
#endif // BUILDFLAG(ENABLE_PLATFORM_DTS_AUDIO)
SendLogMessage("%s => (audio engine format=[%s])", __func__,
CoreAudioUtil::WaveFormatToString(&format_).c_str());
SendLogMessage("%s => (packet size=[%zu bytes/%zu audio frames/%.3f ms])",
__func__, packet_size_bytes_, packet_size_frames_,
params_.GetBufferDuration().InMillisecondsF());
}
} // namespace media