// Copyright 2016 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "media/gpu/windows/media_foundation_video_encode_accelerator_win.h"
#include <codecapi.h>
#include <d3d11_1.h>
#include <mferror.h>
#include <mftransform.h>
#include <objbase.h>
#include <algorithm>
#include <iterator>
#include <memory>
#include <utility>
#include <vector>
#include "base/features.h"
#include "base/memory/shared_memory_mapping.h"
#include "base/memory/unsafe_shared_memory_region.h"
#include "base/task/sequenced_task_runner.h"
#include "base/task/thread_pool.h"
#include "base/time/time.h"
#include "base/trace_event/trace_event.h"
#include "base/win/scoped_co_mem.h"
#include "base/win/scoped_variant.h"
#include "build/build_config.h"
#include "gpu/ipc/common/dxgi_helpers.h"
#include "media/base/bitstream_buffer.h"
#include "media/base/media_log.h"
#include "media/base/media_switches.h"
#include "media/base/video_frame.h"
#include "media/base/video_util.h"
#include "media/base/win/color_space_util_win.h"
#include "media/base/win/mf_helpers.h"
#include "media/base/win/mf_initializer.h"
#include "media/filters/win/media_foundation_utils.h"
#include "media/gpu/gpu_video_encode_accelerator_helpers.h"
#include "media/gpu/windows/vp9_video_rate_control_wrapper.h"
#include "third_party/libvpx/source/libvpx/vp9/ratectrl_rtc.h"
#include "third_party/libyuv/include/libyuv.h"
#include "ui/gfx/color_space_win.h"
#include "ui/gfx/gpu_memory_buffer.h"
#if BUILDFLAG(ENABLE_LIBAOM)
#include "media/gpu/windows/av1_video_rate_control_wrapper.h"
#include "third_party/libaom/source/libaom/av1/ratectrl_rtc.h"
#endif
namespace media {
namespace {
constexpr uint32_t kDefaultGOPLength = 3000;
constexpr uint32_t kDefaultTargetBitrate = 5000000u;
constexpr size_t kMaxFrameRateNumerator = 30;
constexpr size_t kMaxFrameRateDenominator = 1;
constexpr size_t kNumInputBuffers = 3;
// Media Foundation uses 100 nanosecond units for time, see
// https://msdn.microsoft.com/en-us/library/windows/desktop/ms697282(v=vs.85).aspx.
constexpr size_t kOneMicrosecondInMFSampleTimeUnits = 10;
constexpr size_t kPrefixNALLocatedBytePos = 3;
constexpr uint64_t kH264MaxQp = 51;
constexpr uint64_t kVP9MaxQp = 63;
constexpr uint64_t kAV1MaxQp = 63;
// Quantizer parameter used in the libvpx VP9 rate control, whose range is
// 0-63. These are based on WebRTC's defaults, cited from
// third_party/webrtc/media/engine/webrtc_video_engine.h.
constexpr uint8_t kVP9MinQuantizer = 2;
constexpr uint8_t kVP9MaxQuantizer = 56;
// Default value from
// //third_party/webrtc/modules/video_coding/codecs/av1/libaom_av1_encoder.cc.
constexpr uint8_t kAV1MinQuantizer = 10;
// Default value from
// //third_party/webrtc/media/engine/webrtc_video_engine.h.
constexpr uint8_t kAV1MaxQuantizer = 56;
constexpr CLSID kIntelAV1HybridEncoderCLSID = {
0x62c053ce,
0x5357,
0x4794,
{0x8c, 0x5a, 0xfb, 0xef, 0xfe, 0xff, 0xb8, 0x2d}};
#ifndef ARCH_CPU_X86
// Temporal layers are reported to be supported by the Intel driver but cause
// initialization errors.
BASE_FEATURE(kMediaFoundationIntelVP9TemporalLayerSupport,
"MediaFoundationIntelVP9TemporalLayerSupport",
base::FEATURE_DISABLED_BY_DEFAULT);
#endif // !defined(ARCH_CPU_X86)
eAVEncH264VProfile GetH264VProfile(VideoCodecProfile profile,
bool is_constrained_h264) {
switch (profile) {
case H264PROFILE_BASELINE:
return is_constrained_h264 ? eAVEncH264VProfile_ConstrainedBase
: eAVEncH264VProfile_Base;
case H264PROFILE_MAIN:
return eAVEncH264VProfile_Main;
case H264PROFILE_HIGH:
return eAVEncH264VProfile_High;
default:
return eAVEncH264VProfile_unknown;
}
}
// Convert AV1/VP9 qindex (0-255) to the quantizer parameter input in MF
// AVEncVideoEncodeQP. AVEncVideoEncodeQP maps it to libvpx qp tuning parameter
// and thus the range is 0-63.
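// For illustration, per the mapping below: q_index 0 maps to QP 0, q_index
// 100 maps to QP 25, and q_index 255 maps to QP 63.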
uint8_t QindextoAVEncQP(uint8_t q_index) {
// The following computation is based on the table in
// //third_party/libvpx/source/libvpx/vp9/encoder/vp9_quantize.c.
// //third_party/libaom/source/libaom/av1/encoder/av1_quantize.c
// {
// 0, 4, 8, 12, 16, 20, 24, 28, 32, 36, 40, 44, 48,
// 52, 56, 60, 64, 68, 72, 76, 80, 84, 88, 92, 96, 100,
// 104, 108, 112, 116, 120, 124, 128, 132, 136, 140, 144, 148, 152,
// 156, 160, 164, 168, 172, 176, 180, 184, 188, 192, 196, 200, 204,
// 208, 212, 216, 220, 224, 228, 232, 236, 240, 244, 249, 255,
// };
if (q_index <= 244)
return (q_index + 3) / 4;
if (q_index <= 249)
return 62;
return 63;
}
bool IsValidQp(VideoCodec codec, uint64_t qp) {
switch (codec) {
case VideoCodec::kH264:
return qp <= kH264MaxQp;
case VideoCodec::kVP9:
return qp <= kVP9MaxQp;
case VideoCodec::kAV1:
return qp <= kAV1MaxQp;
default:
return false;
}
}
// Only eAVEncVP9VProfile_420_8 is supported on Intel graphics.
eAVEncVP9VProfile GetVP9VProfile(VideoCodecProfile profile) {
switch (profile) {
case VP9PROFILE_PROFILE0:
return eAVEncVP9VProfile_420_8;
default:
return eAVEncVP9VProfile_unknown;
}
}
// Only eAVEncH265VProfile_Main_420_8 is supported.
eAVEncH265VProfile GetHEVCProfile(VideoCodecProfile profile) {
switch (profile) {
case HEVCPROFILE_MAIN:
return eAVEncH265VProfile_Main_420_8;
default:
return eAVEncH265VProfile_unknown;
}
}
MediaFoundationVideoEncodeAccelerator::DriverVendor GetDriverVendor(
IMFActivate* encoder) {
using DriverVendor = MediaFoundationVideoEncodeAccelerator::DriverVendor;
base::win::ScopedCoMem<WCHAR> vendor_id;
UINT32 id_length;
encoder->GetAllocatedString(MFT_ENUM_HARDWARE_VENDOR_ID_Attribute, &vendor_id,
&id_length);
if (id_length != 8) { // Normal vendor ids have length 8.
return DriverVendor::kOther;
}
if (!_wcsnicmp(vendor_id.get(), L"VEN_10DE", id_length)) {
return DriverVendor::kNvidia;
}
if (!_wcsnicmp(vendor_id.get(), L"VEN_1002", id_length)) {
return DriverVendor::kAMD;
}
if (!_wcsnicmp(vendor_id.get(), L"VEN_8086", id_length)) {
return DriverVendor::kIntel;
}
return DriverVendor::kOther;
}
bool IsSvcSupported(IMFActivate* activate, VideoCodec codec) {
#if defined(ARCH_CPU_X86)
// x86 systems sometimes crash in video drivers here.
// More info: https://crbug.com/1253748
return false;
#else
using DriverVendor = MediaFoundationVideoEncodeAccelerator::DriverVendor;
// crbug.com/1373780: The Nvidia HEVC encoder reports supporting 3 temporal
// layers, but will fail initialization if configured to encode with more
// than one temporal layer, so we block the Nvidia HEVC encoder for temporal
// SVC encoding.
// crbug.com/1425117: The Intel VP9 HW encoder reports supporting 3 temporal
// layers, but will fail initialization if configured with more than one
// temporal layer.
auto vendor = GetDriverVendor(activate);
if ((codec == VideoCodec::kHEVC && vendor == DriverVendor::kNvidia) ||
(!base::FeatureList::IsEnabled(
kMediaFoundationIntelVP9TemporalLayerSupport) &&
codec == VideoCodec::kVP9 && vendor == DriverVendor::kIntel)) {
return false;
}
Microsoft::WRL::ComPtr<IMFTransform> encoder;
Microsoft::WRL::ComPtr<ICodecAPI> codec_api;
HRESULT hr = activate->ActivateObject(IID_PPV_ARGS(&encoder));
if (FAILED(hr)) {
// Log to VLOG since errors are expected as part of GetSupportedProfiles().
DVLOG(2) << "Failed to activate encoder: " << PrintHr(hr);
return false;
}
hr = encoder.As(&codec_api);
if (FAILED(hr)) {
// Log to VLOG since errors are expected as part of GetSupportedProfiles().
DVLOG(2) << "Failed to get encoder as CodecAPI: " << PrintHr(hr);
return false;
}
if (codec_api->IsSupported(&CODECAPI_AVEncVideoTemporalLayerCount) != S_OK) {
return false;
}
base::win::ScopedVariant min, max, step;
if (FAILED(codec_api->GetParameterRange(
&CODECAPI_AVEncVideoTemporalLayerCount, min.AsInput(), max.AsInput(),
step.AsInput()))) {
return false;
}
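// Require that the encoder supports at least the range of 1 to 3 temporal
// layers.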
return V_UI4(min.ptr()) <= 1u && V_UI4(max.ptr()) >= 3u;
#endif // defined(ARCH_CPU_X86)
}
uint32_t EnumerateHardwareEncoders(VideoCodec codec, IMFActivate*** activates) {
if (!InitializeMediaFoundation()) {
return 0;
}
uint32_t flags = MFT_ENUM_FLAG_HARDWARE | MFT_ENUM_FLAG_SORTANDFILTER;
MFT_REGISTER_TYPE_INFO input_info;
input_info.guidMajorType = MFMediaType_Video;
input_info.guidSubtype = MFVideoFormat_NV12;
MFT_REGISTER_TYPE_INFO output_info;
output_info.guidMajorType = MFMediaType_Video;
output_info.guidSubtype = VideoCodecToMFSubtype(codec);
uint32_t count = 0;
auto hr = MFTEnumEx(MFT_CATEGORY_VIDEO_ENCODER, flags, &input_info,
&output_info, activates, &count);
if (FAILED(hr)) {
// Log to VLOG since errors are expected as part of GetSupportedProfiles().
DVLOG(2) << "Failed to enumerate hardware encoders for "
<< GetCodecName(codec) << ": " << PrintHr(hr);
return 0;
}
return count;
}
bool IsCodecSupportedForEncoding(VideoCodec codec, bool* svc_supported) {
base::win::ScopedCoMem<IMFActivate*> activates;
const auto encoder_count = EnumerateHardwareEncoders(codec, &activates);
if (encoder_count == 0 || !activates) {
DVLOG(1) << "Hardware encode acceleration is not available for "
<< GetCodecName(codec);
return false;
}
*svc_supported = false;
for (UINT32 i = 0; i < encoder_count; i++) {
if (!*svc_supported && IsSvcSupported(activates[i], codec)) {
*svc_supported = true;
}
activates[i]->Release();
}
return true;
}
// Per
// https://learn.microsoft.com/en-us/windows/win32/medfound/handling-stream-changes,
// encoders should only accept an input type that matches the currently
// configured output type. If we want to change the frame rate, a
// stream restart flow is needed, which in turn generates a key-frame on the
// stream restart. This is not friendly for WebRTC encoding, which adjusts the
// encoding frame rate frequently.
// To mitigate this, we only configure the frame rate during HMFT
// initialization. On a subsequent frame rate update request, if the new frame
// rate is larger than the currently configured frame rate and the bitrate is
// kept unchanged, the average encoded frame size should decrease
// proportionally. Since we don't actually configure the new frame rate into
// the HMFT (to avoid a stream restart), we emulate this average frame size
// decrease by proportionally decreasing the target/peak bitrate (which does
// not require a stream restart). Similarly, for a frame rate update request
// that is lower than the currently configured rate, we increase the bitrate
// to emulate an average frame size increase.
// See https://crbug.com/1295815 for more details.
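// For example, with a 1,000,000 bps target configured at 30 fps, a request to
// run at 60 fps yields 1,000,000 * 30 / 60 = 500,000 bps, which keeps the
// per-frame byte budget computed by the HMFT roughly constant.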
uint32_t AdjustBitrateToFrameRate(uint32_t bitrate,
uint32_t configured_framerate,
uint32_t requested_framerate) {
if (requested_framerate == 0u) {
return 0u;
}
return bitrate * configured_framerate / requested_framerate;
}
VideoRateControlWrapper::RateControlConfig CreateRateControllerConfig(
const VideoBitrateAllocation& bitrate_allocation,
gfx::Size size,
uint32_t frame_rate,
int num_temporal_layers,
VideoCodec codec) {
// Fill rate control config variables.
VideoRateControlWrapper::RateControlConfig config;
config.width = size.width();
config.height = size.height();
config.target_bandwidth = bitrate_allocation.GetSumBps() / 1000;
config.framerate = frame_rate;
config.ss_number_layers = 1;
config.ts_number_layers = num_temporal_layers;
switch (codec) {
case VideoCodec::kVP9: {
config.max_quantizer = kVP9MaxQuantizer;
config.min_quantizer = kVP9MinQuantizer;
break;
}
case VideoCodec::kAV1: {
config.max_quantizer = kAV1MaxQuantizer;
config.min_quantizer = kAV1MinQuantizer;
break;
}
default:
NOTREACHED();
break;
}
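// The per-layer targets below are cumulative (each layer includes all lower
// layers) and expressed in kbps; the rate decimators halve the frame rate per
// step down, e.g. 4, 2, 1 for three temporal layers.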
int bitrate_sum = 0;
for (int tid = 0; tid < num_temporal_layers; ++tid) {
bitrate_sum += bitrate_allocation.GetBitrateBps(0, tid);
config.layer_target_bitrate[tid] = bitrate_sum / 1000;
config.ts_rate_decimator[tid] = 1u << (num_temporal_layers - tid - 1);
config.min_quantizers[tid] = config.min_quantizer;
config.max_quantizers[tid] = config.max_quantizer;
}
return config;
}
VideoEncoder::PendingEncode MakeInput(scoped_refptr<media::VideoFrame> frame,
bool keyframe) {
VideoEncoder::PendingEncode result;
result.frame = std::move(frame);
result.options.key_frame = keyframe;
return result;
}
} // namespace
class MediaFoundationVideoEncodeAccelerator::EncodeOutput {
public:
EncodeOutput(uint32_t size,
bool key_frame,
base::TimeDelta timestamp,
int temporal_id,
absl::optional<gfx::ColorSpace> color_space)
: keyframe(key_frame),
capture_timestamp(timestamp),
temporal_layer_id(temporal_id),
color_space(color_space),
data_(size) {}
EncodeOutput(const EncodeOutput&) = delete;
EncodeOutput& operator=(const EncodeOutput&) = delete;
uint8_t* memory() { return data_.data(); }
int size() const { return static_cast<int>(data_.size()); }
void SetQp(int32_t qp_val) { frame_qp.emplace(qp_val); }
const bool keyframe;
const base::TimeDelta capture_timestamp;
const int temporal_layer_id;
absl::optional<int32_t> frame_qp;
const absl::optional<gfx::ColorSpace> color_space;
private:
std::vector<uint8_t> data_;
};
struct MediaFoundationVideoEncodeAccelerator::BitstreamBufferRef {
BitstreamBufferRef() = delete;
BitstreamBufferRef(int32_t id,
base::WritableSharedMemoryMapping mapping,
size_t size)
: id(id), mapping(std::move(mapping)), size(size) {}
BitstreamBufferRef(const BitstreamBufferRef&) = delete;
BitstreamBufferRef& operator=(const BitstreamBufferRef&) = delete;
const int32_t id;
const base::WritableSharedMemoryMapping mapping;
const size_t size;
};
MediaFoundationVideoEncodeAccelerator::MediaFoundationVideoEncodeAccelerator(
const gpu::GpuPreferences& gpu_preferences,
const gpu::GpuDriverBugWorkarounds& gpu_workarounds,
CHROME_LUID luid)
: task_runner_(base::SingleThreadTaskRunner::GetCurrentDefault()),
luid_(luid) {
weak_ptr_ = weak_factory_.GetWeakPtr();
bitrate_allocation_.SetBitrate(0, 0, kDefaultTargetBitrate);
}
MediaFoundationVideoEncodeAccelerator::
~MediaFoundationVideoEncodeAccelerator() {
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK(async_callback_ref_.IsOne());
}
VideoEncodeAccelerator::SupportedProfiles
MediaFoundationVideoEncodeAccelerator::GetSupportedProfiles() {
TRACE_EVENT0("gpu,startup",
"MediaFoundationVideoEncodeAccelerator::GetSupportedProfiles");
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
std::vector<VideoCodec> supported_codecs(
{VideoCodec::kH264, VideoCodec::kVP9, VideoCodec::kAV1});
#if BUILDFLAG(ENABLE_PLATFORM_HEVC)
if (base::FeatureList::IsEnabled(kPlatformHEVCEncoderSupport)) {
supported_codecs.emplace_back(VideoCodec::kHEVC);
}
#endif
// There's no easy way to enumerate the supported resolution bounds, so we
// just choose reasonable default values.
const SupportedProfile kDefaultProfile = []() {
SupportedProfile profile(VIDEO_CODEC_PROFILE_UNKNOWN,
/*max_resolution=*/gfx::Size(1920, 1088),
kMaxFrameRateNumerator, kMaxFrameRateDenominator,
VideoEncodeAccelerator::kConstantMode |
VideoEncodeAccelerator::kVariableMode,
{SVCScalabilityMode::kL1T1});
profile.min_resolution = gfx::Size(32, 32);
return profile;
}();
SupportedProfiles profiles;
for (auto codec : supported_codecs) {
bool svc_supported = false;
if (!IsCodecSupportedForEncoding(codec, &svc_supported)) {
continue;
}
SupportedProfile profile(kDefaultProfile);
if (svc_supported) {
profile.scalability_modes.push_back(SVCScalabilityMode::kL1T2);
profile.scalability_modes.push_back(SVCScalabilityMode::kL1T3);
}
SupportedProfile portrait_profile(profile);
portrait_profile.max_resolution.Transpose();
portrait_profile.min_resolution.Transpose();
std::vector<VideoCodecProfile> codec_profiles;
if (codec == VideoCodec::kH264) {
codec_profiles = {H264PROFILE_BASELINE, H264PROFILE_MAIN,
H264PROFILE_HIGH};
} else if (codec == VideoCodec::kVP9) {
codec_profiles = {VP9PROFILE_PROFILE0};
} else if (codec == VideoCodec::kAV1) {
codec_profiles = {AV1PROFILE_PROFILE_MAIN};
} else if (codec == VideoCodec::kHEVC) {
codec_profiles = {HEVCPROFILE_MAIN};
}
for (const auto codec_profile : codec_profiles) {
profile.profile = portrait_profile.profile = codec_profile;
profiles.push_back(profile);
profiles.push_back(portrait_profile);
}
}
return profiles;
}
bool MediaFoundationVideoEncodeAccelerator::Initialize(
const Config& config,
Client* client,
std::unique_ptr<MediaLog> media_log) {
DVLOG(3) << __func__ << ": " << config.AsHumanReadableString();
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
media_log_ = std::move(media_log);
if (PIXEL_FORMAT_I420 != config.input_format &&
PIXEL_FORMAT_NV12 != config.input_format) {
MEDIA_LOG(ERROR, media_log_)
<< "Input format not supported= "
<< VideoPixelFormatToString(config.input_format);
return false;
}
if (config.output_profile >= H264PROFILE_MIN &&
config.output_profile <= H264PROFILE_MAX) {
if (GetH264VProfile(config.output_profile, config.is_constrained_h264) ==
eAVEncH264VProfile_unknown) {
MEDIA_LOG(ERROR, media_log_)
<< "Output profile not supported = " << config.output_profile;
return false;
}
codec_ = VideoCodec::kH264;
} else if (config.output_profile >= VP9PROFILE_MIN &&
config.output_profile <= VP9PROFILE_MAX) {
if (GetVP9VProfile(config.output_profile) == eAVEncVP9VProfile_unknown) {
MEDIA_LOG(ERROR, media_log_)
<< "Output profile not supported = " << config.output_profile;
return false;
}
codec_ = VideoCodec::kVP9;
} else if (config.output_profile == AV1PROFILE_PROFILE_MAIN) {
codec_ = VideoCodec::kAV1;
} else if (config.output_profile == HEVCPROFILE_MAIN) {
#if BUILDFLAG(ENABLE_PLATFORM_HEVC)
if (base::FeatureList::IsEnabled(kPlatformHEVCEncoderSupport)) {
codec_ = VideoCodec::kHEVC;
}
#endif
}
if (codec_ == VideoCodec::kUnknown) {
MEDIA_LOG(ERROR, media_log_)
<< "Output profile not supported = " << config.output_profile;
return false;
}
if (config.HasSpatialLayer()) {
MEDIA_LOG(ERROR, media_log_) << "MediaFoundation does not support "
"spatial layer encoding.";
return false;
}
client_ = client;
input_visible_size_ = config.input_visible_size;
if (config.initial_framerate.has_value() && config.initial_framerate.value())
frame_rate_ = config.initial_framerate.value();
else
frame_rate_ = kMaxFrameRateNumerator / kMaxFrameRateDenominator;
bitrate_allocation_ = AllocateBitrateForDefaultEncoding(config);
bitstream_buffer_size_ = config.input_visible_size.GetArea();
gop_length_ = config.gop_length.value_or(kDefaultGOPLength);
low_latency_mode_ = config.require_low_delay;
if (config.HasTemporalLayer())
num_temporal_layers_ = config.spatial_layers.front().num_of_temporal_layers;
// Use the SW BRC only in the case of CBR, non-layered encoding.
const bool use_sw_brc =
bitrate_allocation_.GetMode() == Bitrate::Mode::kConstant &&
base::FeatureList::IsEnabled(kMediaFoundationUseSoftwareRateCtrl) &&
!config.HasTemporalLayer();
if (use_sw_brc && (codec_ == VideoCodec::kVP9
#if BUILDFLAG(ENABLE_LIBAOM)
|| codec_ == VideoCodec::kAV1
#endif
)) {
VideoRateControlWrapper::RateControlConfig rate_config =
CreateRateControllerConfig(bitrate_allocation_, input_visible_size_,
frame_rate_, /*num_temporal_layers=*/1,
codec_);
if (codec_ == VideoCodec::kVP9) {
rate_ctrl_ = VP9RateControl::Create(rate_config);
} else if (codec_ == VideoCodec::kAV1) {
#if BUILDFLAG(ENABLE_LIBAOM)
// If libaom is not enabled, |rate_ctrl_| will not be initialized.
rate_ctrl_ = AV1RateControl::Create(rate_config);
#endif
}
}
SetState(kInitializing);
IMFActivate** pp_activates = nullptr;
uint32_t encoder_count = EnumerateHardwareEncoders(codec_, &pp_activates);
if (encoder_count == 0) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Failed finding a hardware encoder MFT"});
return false;
}
bool activated = ActivateAsyncEncoder(pp_activates, encoder_count,
config.is_constrained_h264);
if (pp_activates) {
// Release the enumerated instances if any.
// According to Windows Dev Center,
// https://docs.microsoft.com/en-us/windows/win32/api/mfapi/nf-mfapi-mftenumex
// The caller must release the pointers.
for (UINT32 i = 0; i < encoder_count; i++) {
if (pp_activates[i]) {
pp_activates[i]->Release();
pp_activates[i] = nullptr;
}
}
CoTaskMemFree(pp_activates);
}
if (!activated) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Failed activating an async hardware encoder MFT"});
return false;
}
if (!SetEncoderModes()) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Failed to set encoder modes"});
return false;
}
if (!InitializeInputOutputParameters(config.output_profile,
config.is_constrained_h264)) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Failed to set input/output param."});
return false;
}
auto hr = MFCreateSample(&input_sample_);
if (FAILED(hr)) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Failed to create sample"});
return false;
}
if (IsMediaFoundationD3D11VideoCaptureEnabled()) {
MEDIA_LOG(INFO, media_log_)
<< "Preferred DXGI device " << luid_.HighPart << ":" << luid_.LowPart;
dxgi_device_manager_ = DXGIDeviceManager::Create(luid_);
if (!dxgi_device_manager_) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Failed to create DXGIDeviceManager"});
return false;
}
auto mf_dxgi_device_manager =
dxgi_device_manager_->GetMFDXGIDeviceManager();
hr = encoder_->ProcessMessage(
MFT_MESSAGE_SET_D3D_MANAGER,
reinterpret_cast<ULONG_PTR>(mf_dxgi_device_manager.Get()));
// If the HMFT rejects setting the D3D manager, fall back to non-D3D11
// encoding.
if (FAILED(hr)) {
dxgi_resource_mapping_required_ = true;
MEDIA_LOG(INFO, media_log_)
<< "Couldn't set DXGIDeviceManager, fallback to non-D3D11 encoding";
}
}
hr = encoder_->QueryInterface(IID_PPV_ARGS(&event_generator_));
if (FAILED(hr)) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderInitializationError,
"Couldn't get event generator"});
return false;
}
event_generator_->BeginGetEvent(this, nullptr);
// Start the asynchronous processing model
hr = encoder_->ProcessMessage(MFT_MESSAGE_COMMAND_FLUSH, 0);
if (FAILED(hr)) {
NotifyErrorStatus(
{EncoderStatus::Codes::kEncoderInitializationError,
"Couldn't set ProcessMessage MFT_MESSAGE_COMMAND_FLUSH"});
return false;
}
hr = encoder_->ProcessMessage(MFT_MESSAGE_NOTIFY_BEGIN_STREAMING, 0);
if (FAILED(hr)) {
NotifyErrorStatus(
{EncoderStatus::Codes::kEncoderInitializationError,
"Couldn't set ProcessMessage MFT_MESSAGE_NOTIFY_BEGIN_STREAMING"});
return false;
}
hr = encoder_->ProcessMessage(MFT_MESSAGE_NOTIFY_START_OF_STREAM, 0);
if (FAILED(hr)) {
NotifyErrorStatus(
{EncoderStatus::Codes::kEncoderInitializationError,
"Couldn't set ProcessMessage MFT_MESSAGE_NOTIFY_START_OF_STREAM"});
return false;
}
encoder_info_.implementation_name = "MediaFoundationVideoEncodeAccelerator";
// Currently, MFVEA does not handle odd resolutions well. The implementation
// here reports a resolution alignment of 2 in the EncoderInfo and applies the
// alignment to all simulcast layers.
// See https://crbug.com/1275453 for more details.
encoder_info_.requested_resolution_alignment = 2;
encoder_info_.apply_alignment_to_all_simulcast_layers = true;
encoder_info_.has_trusted_rate_controller = false;
DCHECK(encoder_info_.is_hardware_accelerated);
DCHECK(encoder_info_.supports_native_handle);
DCHECK(encoder_info_.reports_average_qp);
DCHECK(!encoder_info_.supports_simulcast);
if (config.HasSpatialLayer() || config.HasTemporalLayer()) {
DCHECK(!config.spatial_layers.empty());
for (size_t i = 0; i < config.spatial_layers.size(); ++i) {
encoder_info_.fps_allocation[i] =
GetFpsAllocation(config.spatial_layers[i].num_of_temporal_layers);
}
} else {
constexpr uint8_t kFullFramerate = 255;
encoder_info_.fps_allocation[0] = {kFullFramerate};
}
return true;
}
void MediaFoundationVideoEncodeAccelerator::Encode(
scoped_refptr<VideoFrame> frame,
bool force_keyframe) {
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
switch (state_) {
case kEncoding: {
pending_input_queue_.push_back(
MakeInput(std::move(frame), force_keyframe));
FeedInputs();
break;
}
case kInitializing: {
pending_input_queue_.push_back(
MakeInput(std::move(frame), force_keyframe));
break;
}
default:
NotifyErrorStatus({EncoderStatus::Codes::kEncoderFailedEncode,
"Unexpected encoder state"});
DCHECK(false) << "Abandon input frame for video encoder."
<< " State: " << static_cast<int>(state_);
}
}
void MediaFoundationVideoEncodeAccelerator::UseOutputBitstreamBuffer(
BitstreamBuffer buffer) {
DVLOG(3) << __func__ << ": buffer size=" << buffer.size();
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
if (buffer.size() < bitstream_buffer_size_) {
NotifyErrorStatus({EncoderStatus::Codes::kInvalidOutputBuffer,
"Output BitstreamBuffer isn't big enough: " +
base::NumberToString(buffer.size()) + " vs. " +
base::NumberToString(bitstream_buffer_size_)});
return;
}
// After mapping, |region| is no longer necessary and it can be destroyed.
// |mapping| will keep the shared memory region open.
auto region = buffer.TakeRegion();
auto mapping = region.Map();
if (!mapping.IsValid()) {
NotifyErrorStatus({EncoderStatus::Codes::kSystemAPICallError,
"Failed mapping shared memory"});
return;
}
auto buffer_ref = std::make_unique<BitstreamBufferRef>(
buffer.id(), std::move(mapping), buffer.size());
if (encoder_output_queue_.empty()) {
bitstream_buffer_queue_.push_back(std::move(buffer_ref));
return;
}
auto encode_output = std::move(encoder_output_queue_.front());
encoder_output_queue_.pop_front();
memcpy(buffer_ref->mapping.memory(), encode_output->memory(),
encode_output->size());
BitstreamBufferMetadata md(encode_output->size(), encode_output->keyframe,
encode_output->capture_timestamp);
if (encode_output->frame_qp) {
md.qp = *encode_output->frame_qp;
}
if (temporal_scalable_coding()) {
md.h264.emplace().temporal_idx = encode_output->temporal_layer_id;
}
if (encode_output->color_space) {
md.encoded_color_space = *encode_output->color_space;
}
client_->BitstreamBufferReady(buffer_ref->id, md);
}
void MediaFoundationVideoEncodeAccelerator::RequestEncodingParametersChange(
const Bitrate& bitrate,
uint32_t framerate) {
DVLOG(3) << __func__ << ": bitrate=" << bitrate.ToString()
<< ": framerate=" << framerate;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
VideoBitrateAllocation allocation(bitrate.mode());
allocation.SetBitrate(0, 0, bitrate.target_bps());
if (bitrate.mode() == Bitrate::Mode::kVariable) {
allocation.SetPeakBps(bitrate.peak_bps());
}
RequestEncodingParametersChange(allocation, framerate);
}
void MediaFoundationVideoEncodeAccelerator::RequestEncodingParametersChange(
const VideoBitrateAllocation& bitrate_allocation,
uint32_t framerate) {
DVLOG(3) << __func__ << ": bitrate=" << bitrate_allocation.GetSumBps()
<< ": framerate=" << framerate;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK(imf_output_media_type_);
DCHECK(imf_input_media_type_);
DCHECK(encoder_);
RETURN_ON_FAILURE(
bitrate_allocation.GetMode() == bitrate_allocation_.GetMode(),
"Invalid bitrate mode", );
framerate =
std::clamp(framerate, 1u, static_cast<uint32_t>(kMaxFrameRateNumerator));
if (framerate == frame_rate_ && bitrate_allocation == bitrate_allocation_) {
return;
}
bitrate_allocation_ = bitrate_allocation;
frame_rate_ = framerate;
// For SW BRC we don't reconfigure the encoder.
if (rate_ctrl_) {
rate_ctrl_->UpdateRateControl(CreateRateControllerConfig(
bitrate_allocation_, input_visible_size_, frame_rate_,
/*num_temporal_layers=*/1, codec_));
return;
}
VARIANT var;
var.vt = VT_UI4;
var.ulVal = AdjustBitrateToFrameRate(bitrate_allocation_.GetSumBps(),
configured_frame_rate_, framerate);
HRESULT hr = codec_api_->SetValue(&CODECAPI_AVEncCommonMeanBitRate, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't update mean bitrate", );
if (bitrate_allocation_.GetMode() == Bitrate::Mode::kVariable) {
var.ulVal = AdjustBitrateToFrameRate(bitrate_allocation_.GetPeakBps(),
configured_frame_rate_, framerate);
hr = codec_api_->SetValue(&CODECAPI_AVEncCommonMaxBitRate, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set max bitrate", );
}
}
void MediaFoundationVideoEncodeAccelerator::Destroy() {
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
if (activate_) {
activate_->ShutdownObject();
activate_->Release();
}
delete this;
}
void MediaFoundationVideoEncodeAccelerator::DrainEncoder() {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
auto hr = encoder_->ProcessMessage(MFT_MESSAGE_COMMAND_DRAIN, 0);
if (FAILED(hr)) {
std::move(flush_callback_).Run(/*success=*/false);
return;
}
SetState(kFlushing);
}
void MediaFoundationVideoEncodeAccelerator::Flush(
FlushCallback flush_callback) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK(flush_callback);
if (state_ != kEncoding || !encoder_) {
DCHECK(false) << "Called Flush() with unexpected state."
<< " State: " << static_cast<int>(state_);
std::move(flush_callback).Run(/*success=*/false);
return;
}
flush_callback_ = std::move(flush_callback);
if (pending_input_queue_.empty()) {
// There are no pending inputs, so we can just ask the MF encoder to drain
// without waiting for any more METransformNeedInput requests.
DrainEncoder();
} else {
// Otherwise METransformNeedInput will call DrainEncoder() once all the
// inputs from `pending_input_queue_` have been fed to the MF encoder.
SetState(kPreFlushing);
}
}
bool MediaFoundationVideoEncodeAccelerator::IsFlushSupported() {
return true;
}
bool MediaFoundationVideoEncodeAccelerator::IsGpuFrameResizeSupported() {
return true;
}
bool MediaFoundationVideoEncodeAccelerator::ActivateAsyncEncoder(
IMFActivate** pp_activate,
uint32_t encoder_count,
bool is_constrained_h264) {
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
// Try to create the encoder with priority according to merit value.
HRESULT hr = E_FAIL;
for (UINT32 i = 0; i < encoder_count; i++) {
auto vendor = GetDriverVendor(pp_activate[i]);
// Skip the flaky Intel hybrid AV1 encoder.
if (codec_ == VideoCodec::kAV1 && vendor == DriverVendor::kIntel) {
// Get the CLSID GUID of the HMFT.
GUID mft_guid = {0};
pp_activate[i]->GetGUID(MFT_TRANSFORM_CLSID_Attribute, &mft_guid);
if (mft_guid == kIntelAV1HybridEncoderCLSID) {
DLOG(WARNING) << "Skipped Intel hybrid AV1 encoder MFT.";
continue;
}
}
// Skip NVIDIA GPUs for constrained baseline profile H.264 encoding due to
// https://crbug.com/1088650, and go to the next instance according to merit
// value.
if (codec_ == VideoCodec::kH264 && is_constrained_h264 &&
vendor == DriverVendor::kNvidia) {
DLOG(WARNING) << "Skipped NVIDIA GPU due to https://crbug.com/1088650";
continue;
}
DCHECK(!encoder_);
DCHECK(!activate_);
hr = pp_activate[i]->ActivateObject(IID_PPV_ARGS(&encoder_));
if (encoder_.Get() != nullptr) {
DCHECK(SUCCEEDED(hr));
activate_ = pp_activate[i];
vendor_ = vendor;
pp_activate[i] = nullptr;
// Print the friendly name.
base::win::ScopedCoMem<WCHAR> friendly_name;
UINT32 name_length;
activate_->GetAllocatedString(MFT_FRIENDLY_NAME_Attribute, &friendly_name,
&name_length);
DVLOG(3) << "Selected asynchronous hardware encoder's friendly name: "
<< friendly_name;
// Encoder is successfully activated.
break;
} else {
DCHECK(FAILED(hr));
// The component that calls ActivateObject is
// responsible for calling ShutdownObject,
// https://docs.microsoft.com/en-us/windows/win32/api/mfobjects/nf-mfobjects-imfactivate-shutdownobject.
pp_activate[i]->ShutdownObject();
}
}
RETURN_ON_HR_FAILURE(hr, "Couldn't activate asynchronous hardware encoder",
false);
RETURN_ON_FAILURE((encoder_.Get() != nullptr),
"No asynchronous hardware encoder instance created", false);
Microsoft::WRL::ComPtr<IMFAttributes> all_attributes;
hr = encoder_->GetAttributes(&all_attributes);
if (SUCCEEDED(hr)) {
// An asynchronous MFT must support dynamic format changes,
// https://docs.microsoft.com/en-us/windows/win32/medfound/asynchronous-mfts#format-changes.
UINT32 dynamic = FALSE;
hr = all_attributes->GetUINT32(MFT_SUPPORT_DYNAMIC_FORMAT_CHANGE, &dynamic);
if (!dynamic) {
DLOG(ERROR) << "Couldn't support dynamic format change.";
return false;
}
// Unlock the selected asynchronous MFTs,
// https://docs.microsoft.com/en-us/windows/win32/medfound/asynchronous-mfts#unlocking-asynchronous-mfts.
UINT32 async = FALSE;
hr = all_attributes->GetUINT32(MF_TRANSFORM_ASYNC, &async);
if (!async) {
DLOG(ERROR) << "MFT encoder is not asynchronous.";
return false;
}
hr = all_attributes->SetUINT32(MF_TRANSFORM_ASYNC_UNLOCK, TRUE);
RETURN_ON_HR_FAILURE(hr, "Couldn't unlock transform async", false);
}
return true;
}
bool MediaFoundationVideoEncodeAccelerator::InitializeInputOutputParameters(
VideoCodecProfile output_profile,
bool is_constrained_h264) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK(encoder_);
DWORD input_count = 0;
DWORD output_count = 0;
HRESULT hr = encoder_->GetStreamCount(&input_count, &output_count);
RETURN_ON_HR_FAILURE(hr, "Couldn't get stream count", false);
if (input_count < 1 || output_count < 1) {
DLOG(ERROR) << "Stream count too few: input " << input_count << ", output "
<< output_count;
return false;
}
std::vector<DWORD> input_ids(input_count, 0);
std::vector<DWORD> output_ids(output_count, 0);
hr = encoder_->GetStreamIDs(input_count, input_ids.data(), output_count,
output_ids.data());
if (hr == S_OK) {
input_stream_id_ = input_ids[0];
output_stream_id_ = output_ids[0];
} else if (hr == E_NOTIMPL) {
input_stream_id_ = 0;
output_stream_id_ = 0;
} else {
DLOG(ERROR) << "Couldn't find stream ids from hardware encoder.";
return false;
}
// Initialize output parameters.
hr = MFCreateMediaType(&imf_output_media_type_);
RETURN_ON_HR_FAILURE(hr, "Couldn't create output media type", false);
hr = imf_output_media_type_->SetGUID(MF_MT_MAJOR_TYPE, MFMediaType_Video);
RETURN_ON_HR_FAILURE(hr, "Couldn't set media type", false);
hr = imf_output_media_type_->SetGUID(MF_MT_SUBTYPE,
VideoCodecToMFSubtype(codec_));
RETURN_ON_HR_FAILURE(hr, "Couldn't set video format", false);
if (!rate_ctrl_) {
hr = imf_output_media_type_->SetUINT32(
MF_MT_AVG_BITRATE,
AdjustBitrateToFrameRate(bitrate_allocation_.GetSumBps(), frame_rate_,
frame_rate_));
RETURN_ON_HR_FAILURE(hr, "Couldn't set bitrate", false);
}
configured_frame_rate_ = frame_rate_;
hr = MFSetAttributeRatio(imf_output_media_type_.Get(), MF_MT_FRAME_RATE,
configured_frame_rate_, 1);
RETURN_ON_HR_FAILURE(hr, "Couldn't set frame rate", false);
hr = MFSetAttributeSize(imf_output_media_type_.Get(), MF_MT_FRAME_SIZE,
input_visible_size_.width(),
input_visible_size_.height());
RETURN_ON_HR_FAILURE(hr, "Couldn't set frame size", false);
hr = imf_output_media_type_->SetUINT32(MF_MT_INTERLACE_MODE,
MFVideoInterlace_Progressive);
RETURN_ON_HR_FAILURE(hr, "Couldn't set interlace mode", false);
if (codec_ == VideoCodec::kH264) {
hr = imf_output_media_type_->SetUINT32(
MF_MT_MPEG2_PROFILE,
GetH264VProfile(output_profile, is_constrained_h264));
} else if (codec_ == VideoCodec::kVP9) {
hr = imf_output_media_type_->SetUINT32(MF_MT_MPEG2_PROFILE,
GetVP9VProfile(output_profile));
} else if (codec_ == VideoCodec::kHEVC) {
hr = imf_output_media_type_->SetUINT32(MF_MT_MPEG2_PROFILE,
GetHEVCProfile(output_profile));
}
RETURN_ON_HR_FAILURE(hr, "Couldn't set codec profile", false);
hr = encoder_->SetOutputType(output_stream_id_, imf_output_media_type_.Get(),
0);
RETURN_ON_HR_FAILURE(hr, "Couldn't set output media type", false);
// Initialize input parameters.
hr = MFCreateMediaType(&imf_input_media_type_);
RETURN_ON_HR_FAILURE(hr, "Couldn't create input media type", false);
hr = imf_input_media_type_->SetGUID(MF_MT_MAJOR_TYPE, MFMediaType_Video);
RETURN_ON_HR_FAILURE(hr, "Couldn't set media type", false);
hr = imf_input_media_type_->SetGUID(MF_MT_SUBTYPE, MFVideoFormat_NV12);
RETURN_ON_HR_FAILURE(hr, "Couldn't set video format", false);
hr = MFSetAttributeRatio(imf_input_media_type_.Get(), MF_MT_FRAME_RATE,
configured_frame_rate_, 1);
RETURN_ON_HR_FAILURE(hr, "Couldn't set frame rate", false);
hr = MFSetAttributeSize(imf_input_media_type_.Get(), MF_MT_FRAME_SIZE,
input_visible_size_.width(),
input_visible_size_.height());
RETURN_ON_HR_FAILURE(hr, "Couldn't set frame size", false);
hr = imf_input_media_type_->SetUINT32(MF_MT_INTERLACE_MODE,
MFVideoInterlace_Progressive);
RETURN_ON_HR_FAILURE(hr, "Couldn't set interlace mode", false);
hr = encoder_->SetInputType(input_stream_id_, imf_input_media_type_.Get(), 0);
RETURN_ON_HR_FAILURE(hr, "Couldn't set input media type", false);
return true;
}
bool MediaFoundationVideoEncodeAccelerator::SetEncoderModes() {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK(encoder_);
HRESULT hr = encoder_.As(&codec_api_);
RETURN_ON_HR_FAILURE(hr, "Couldn't get ICodecAPI", false);
VARIANT var;
var.vt = VT_UI4;
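// When the software BRC is in use, run the HMFT in Quality mode so that the
// per-frame QP computed by the BRC (see ProcessInput()) takes effect;
// otherwise let the HMFT's own CBR/VBR rate control drive the bitrate.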
switch (bitrate_allocation_.GetMode()) {
case Bitrate::Mode::kConstant:
if (rate_ctrl_)
var.ulVal = eAVEncCommonRateControlMode_Quality;
else
var.ulVal = eAVEncCommonRateControlMode_CBR;
break;
case Bitrate::Mode::kVariable: {
DCHECK(!rate_ctrl_);
var.ulVal = eAVEncCommonRateControlMode_PeakConstrainedVBR;
break;
}
case Bitrate::Mode::kExternal:
// Unsupported.
return false;
}
hr = codec_api_->SetValue(&CODECAPI_AVEncCommonRateControlMode, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set CommonRateControlMode", false);
// Intel drivers want the layer count to be set explicitly for H.264/HEVC,
// even if it's one.
const bool set_svc_layer_count =
(num_temporal_layers_ > 1) ||
(vendor_ == DriverVendor::kIntel &&
(codec_ == VideoCodec::kH264 || codec_ == VideoCodec::kHEVC));
if (set_svc_layer_count) {
var.ulVal = num_temporal_layers_;
hr = codec_api_->SetValue(&CODECAPI_AVEncVideoTemporalLayerCount, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set temporal layer count", false);
}
if (!rate_ctrl_) {
var.ulVal = AdjustBitrateToFrameRate(bitrate_allocation_.GetSumBps(),
configured_frame_rate_, frame_rate_);
hr = codec_api_->SetValue(&CODECAPI_AVEncCommonMeanBitRate, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set bitrate", false);
}
if (bitrate_allocation_.GetMode() == Bitrate::Mode::kVariable) {
var.ulVal = AdjustBitrateToFrameRate(bitrate_allocation_.GetPeakBps(),
configured_frame_rate_, frame_rate_);
hr = codec_api_->SetValue(&CODECAPI_AVEncCommonMaxBitRate, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set bitrate", false);
}
if (S_OK == codec_api_->IsModifiable(&CODECAPI_AVEncAdaptiveMode)) {
var.ulVal = eAVEncAdaptiveMode_Resolution;
hr = codec_api_->SetValue(&CODECAPI_AVEncAdaptiveMode, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set adaptive mode", false);
}
var.ulVal = gop_length_;
hr = codec_api_->SetValue(&CODECAPI_AVEncMPVGOPSize, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set keyframe interval", false);
if (S_OK == codec_api_->IsModifiable(&CODECAPI_AVLowLatencyMode)) {
var.vt = VT_BOOL;
var.boolVal = low_latency_mode_ ? VARIANT_TRUE : VARIANT_FALSE;
hr = codec_api_->SetValue(&CODECAPI_AVLowLatencyMode, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set low latency mode", false);
}
return true;
}
void MediaFoundationVideoEncodeAccelerator::NotifyErrorStatus(
EncoderStatus status) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
CHECK(!status.is_ok());
CHECK(media_log_);
SetState(kError);
MEDIA_LOG(ERROR, media_log_) << status.message();
DLOG(ERROR) << "Call NotifyErrorStatus(): code="
<< static_cast<int>(status.code())
<< ", message=" << status.message();
CHECK(client_);
client_->NotifyErrorStatus(std::move(status));
}
void MediaFoundationVideoEncodeAccelerator::FeedInputs() {
if (pending_input_queue_.empty()) {
return;
}
// There's no point in trying to feed more than one input here,
// because MF encoder never accepts more than one input in a row.
auto& next_input = pending_input_queue_.front();
HRESULT hr = ProcessInput(next_input);
if (hr == MF_E_NOTACCEPTING) {
return;
}
if (FAILED(hr)) {
NotifyErrorStatus({EncoderStatus::Codes::kSystemAPICallError,
"Failed to encode pending frame. " + PrintHr(hr)});
return;
}
pending_input_queue_.pop_front();
}
HRESULT MediaFoundationVideoEncodeAccelerator::ProcessInput(
const PendingInput& input) {
DVLOG(3) << __func__;
DCHECK(input_sample_);
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
TRACE_EVENT1("media", "MediaFoundationVideoEncodeAccelerator::ProcessInput",
"timestamp", input.frame->timestamp());
if (has_prepared_input_sample_) {
if (DCHECK_IS_ON()) {
// Let's validate that prepared sample actually matches the frame
// we encode.
LONGLONG sample_ts = 0;
auto hr = input_sample_->GetSampleTime(&sample_ts);
DCHECK_EQ(hr, S_OK) << PrintHr(hr);
int64_t frame_ts = input.frame->timestamp().InMicroseconds() *
kOneMicrosecondInMFSampleTimeUnits;
DCHECK_EQ(frame_ts, sample_ts)
<< "Prepared sample timestamp doesn't match frame timestamp.";
}
} else {
const auto frame_cs = input.frame->ColorSpace();
if (encoder_color_space_.value_or(gfx::ColorSpace()) != frame_cs) {
encoder_color_space_ = frame_cs;
SetEncoderColorSpace();
}
// Prepare input sample if it hasn't been done yet.
HRESULT hr = PopulateInputSampleBuffer(input);
RETURN_ON_HR_FAILURE(hr, "Couldn't populate input sample buffer", hr);
if (rate_ctrl_) {
VideoRateControlWrapper::FrameParams frame_params{};
frame_params.frame_type =
input.options.key_frame
? VideoRateControlWrapper::FrameParams::FrameType::kKeyFrame
: VideoRateControlWrapper::FrameParams::FrameType::kInterFrame;
int qp = rate_ctrl_->ComputeQP(frame_params);
VARIANT var;
var.vt = VT_UI8;
var.ullVal = QindextoAVEncQP(static_cast<uint8_t>(qp));
hr = codec_api_->SetValue(&CODECAPI_AVEncVideoEncodeQP, &var);
RETURN_ON_HR_FAILURE(hr, "Couldn't set current layer QP", hr);
hr = input_sample_->SetUINT64(MFSampleExtension_VideoEncodeQP, var.ullVal);
RETURN_ON_HR_FAILURE(hr, "Couldn't set input sample attribute QP", hr);
}
output_color_spaces_.push_back(encoder_color_space_);
has_prepared_input_sample_ = true;
}
HRESULT hr = 0;
{
TRACE_EVENT1("media", "IMFTransform::ProcessInput", "timestamp",
input.frame->timestamp());
hr = encoder_->ProcessInput(input_stream_id_, input_sample_.Get(), 0);
}
// Check whether ProcessInput() actually accepted the sample; if it didn't,
// remember that the sample is already prepared so the next attempt can reuse
// it without re-populating it.
has_prepared_input_sample_ = (hr == MF_E_NOTACCEPTING);
return hr;
}
HRESULT MediaFoundationVideoEncodeAccelerator::PopulateInputSampleBuffer(
const PendingInput& input) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
auto frame = input.frame;
if (frame->storage_type() !=
VideoFrame::StorageType::STORAGE_GPU_MEMORY_BUFFER &&
!frame->IsMappable()) {
LOG(ERROR) << "Unsupported video frame storage type";
return MF_E_INVALID_STREAM_DATA;
}
TRACE_EVENT1(
"media",
"MediaFoundationVideoEncodeAccelerator::PopulateInputSampleBuffer",
"timestamp", frame->timestamp());
if (frame->format() != PIXEL_FORMAT_NV12 &&
frame->format() != PIXEL_FORMAT_I420) {
LOG(ERROR) << "Unsupported video frame format";
return MF_E_INVALID_STREAM_DATA;
}
auto hr = input_sample_->SetSampleTime(frame->timestamp().InMicroseconds() *
kOneMicrosecondInMFSampleTimeUnits);
RETURN_ON_HR_FAILURE(hr, "SetSampleTime() failed", hr);
UINT64 sample_duration = 0;
hr = MFFrameRateToAverageTimePerFrame(frame_rate_, 1, &sample_duration);
RETURN_ON_HR_FAILURE(hr, "Couldn't calculate sample duration", hr);
hr = input_sample_->SetSampleDuration(sample_duration);
RETURN_ON_HR_FAILURE(hr, "SetSampleDuration() failed", hr);
if (input.options.key_frame) {
VARIANT var;
var.vt = VT_UI4;
var.ulVal = 1;
hr = codec_api_->SetValue(&CODECAPI_AVEncVideoForceKeyFrame, &var);
RETURN_ON_HR_FAILURE(hr, "Set CODECAPI_AVEncVideoForceKeyFrame failed", hr);
}
if (frame->storage_type() ==
VideoFrame::StorageType::STORAGE_GPU_MEMORY_BUFFER) {
gfx::GpuMemoryBuffer* gmb = frame->GetGpuMemoryBuffer();
if (!gmb) {
LOG(ERROR) << "Failed to get GMB for input frame";
return MF_E_INVALID_STREAM_DATA;
}
if (gmb->GetType() != gfx::GpuMemoryBufferType::DXGI_SHARED_HANDLE &&
gmb->GetType() != gfx::GpuMemoryBufferType::SHARED_MEMORY_BUFFER) {
LOG(ERROR) << "Unsupported GMB type";
return MF_E_INVALID_STREAM_DATA;
}
if (gmb->GetType() == gfx::GpuMemoryBufferType::DXGI_SHARED_HANDLE &&
dxgi_device_manager_ != nullptr) {
if (!dxgi_resource_mapping_required_) {
return PopulateInputSampleBufferGpu(std::move(frame));
} else {
return CopyInputSampleBufferFromGpu(*(frame.get()));
}
}
// ConvertToMemoryMappedFrame() doesn't copy pixel data; it just maps the GPU
// buffer owned by |frame| and presents it as a mapped view in CPU memory.
// |frame| will unmap the buffer when destructed.
frame = ConvertToMemoryMappedFrame(std::move(frame));
if (!frame) {
LOG(ERROR) << "Failed to map shared memory GMB";
return E_FAIL;
}
}
const auto kTargetPixelFormat = PIXEL_FORMAT_NV12;
Microsoft::WRL::ComPtr<IMFMediaBuffer> input_buffer;
hr = input_sample_->GetBufferByIndex(0, &input_buffer);
if (FAILED(hr)) {
// Allocate a new buffer.
MFT_INPUT_STREAM_INFO input_stream_info;
hr = encoder_->GetInputStreamInfo(input_stream_id_, &input_stream_info);
RETURN_ON_HR_FAILURE(hr, "Couldn't get input stream info", hr);
hr = MFCreateAlignedMemoryBuffer(
input_stream_info.cbSize ? input_stream_info.cbSize
: VideoFrame::AllocationSize(
kTargetPixelFormat, input_visible_size_),
input_stream_info.cbAlignment == 0 ? input_stream_info.cbAlignment
: input_stream_info.cbAlignment - 1,
&input_buffer);
RETURN_ON_HR_FAILURE(hr, "Failed to create memory buffer", hr);
hr = input_sample_->AddBuffer(input_buffer.Get());
RETURN_ON_HR_FAILURE(hr, "Failed to add buffer to sample", hr);
}
// Establish plain pointers into the input buffer, where the pixel data will
// be copied.
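// NV12 layout: a full-resolution Y plane followed by a half-height
// interleaved UV plane, both using the same row stride here.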
MediaBufferScopedPointer scoped_buffer(input_buffer.Get());
DCHECK(scoped_buffer.get());
uint8_t* dst_y = scoped_buffer.get();
size_t dst_y_stride = VideoFrame::RowBytes(
VideoFrame::kYPlane, kTargetPixelFormat, input_visible_size_.width());
uint8_t* dst_uv =
scoped_buffer.get() +
dst_y_stride * VideoFrame::Rows(VideoFrame::kYPlane, kTargetPixelFormat,
input_visible_size_.height());
size_t dst_uv_stride = VideoFrame::RowBytes(
VideoFrame::kUVPlane, kTargetPixelFormat, input_visible_size_.width());
uint8_t* end = dst_uv + dst_uv_stride * frame->rows(VideoFrame::kUVPlane);
DCHECK_GE(static_cast<ptrdiff_t>(scoped_buffer.max_length()),
end - scoped_buffer.get());
// Set up a VideoFrame with the data pointing into the input buffer.
// We need it to ease copying and scaling by reusing ConvertAndScaleFrame()
auto frame_in_buffer = VideoFrame::WrapExternalYuvData(
kTargetPixelFormat, input_visible_size_, gfx::Rect(input_visible_size_),
input_visible_size_, dst_y_stride, dst_uv_stride, dst_y, dst_uv,
frame->timestamp());
auto status = ConvertAndScaleFrame(*frame, *frame_in_buffer, resize_buffer_);
if (!status.is_ok()) {
LOG(ERROR) << "ConvertAndScaleFrame failed with error code: "
<< static_cast<uint32_t>(status.code());
return E_FAIL;
}
return S_OK;
}
// Handles the case where the video frame is backed by a GPU texture but needs
// to be copied to CPU memory, because the HMFT does not accept textures from
// an adapter different from the one currently used for encoding.
HRESULT MediaFoundationVideoEncodeAccelerator::CopyInputSampleBufferFromGpu(
const VideoFrame& frame) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK_EQ(frame.storage_type(),
VideoFrame::StorageType::STORAGE_GPU_MEMORY_BUFFER);
DCHECK(frame.HasGpuMemoryBuffer());
DCHECK_EQ(frame.GetGpuMemoryBuffer()->GetType(),
gfx::GpuMemoryBufferType::DXGI_SHARED_HANDLE);
DCHECK(dxgi_device_manager_);
gfx::GpuMemoryBufferHandle buffer_handle =
frame.GetGpuMemoryBuffer()->CloneHandle();
auto d3d_device = dxgi_device_manager_->GetDevice();
if (!d3d_device) {
LOG(ERROR) << "Failed to get device from MF DXGI device manager";
return E_HANDLE;
}
Microsoft::WRL::ComPtr<ID3D11Device1> device1;
HRESULT hr = d3d_device.As(&device1);
RETURN_ON_HR_FAILURE(hr, "Failed to query ID3D11Device1", hr);
Microsoft::WRL::ComPtr<ID3D11Texture2D> input_texture;
hr = device1->OpenSharedResource1(buffer_handle.dxgi_handle.Get(),
IID_PPV_ARGS(&input_texture));
RETURN_ON_HR_FAILURE(hr, "Failed to open shared GMB D3D texture", hr);
// Check if we need to scale the input texture
D3D11_TEXTURE2D_DESC input_desc = {};
input_texture->GetDesc(&input_desc);
Microsoft::WRL::ComPtr<ID3D11Texture2D> sample_texture;
if (input_desc.Width != static_cast<uint32_t>(input_visible_size_.width()) ||
input_desc.Height !=
static_cast<uint32_t>(input_visible_size_.height())) {
hr = PerformD3DScaling(input_texture.Get());
RETURN_ON_HR_FAILURE(hr, "Failed to perform D3D video processing", hr);
sample_texture = scaled_d3d11_texture_;
} else {
sample_texture = input_texture;
}
const auto kTargetPixelFormat = PIXEL_FORMAT_NV12;
Microsoft::WRL::ComPtr<IMFMediaBuffer> input_buffer;
// Allocate a new buffer.
MFT_INPUT_STREAM_INFO input_stream_info;
hr = encoder_->GetInputStreamInfo(input_stream_id_, &input_stream_info);
RETURN_ON_HR_FAILURE(hr, "Couldn't get input stream info", hr);
hr = MFCreateAlignedMemoryBuffer(
input_stream_info.cbSize
? input_stream_info.cbSize
: VideoFrame::AllocationSize(kTargetPixelFormat, input_visible_size_),
input_stream_info.cbAlignment == 0 ? input_stream_info.cbAlignment
: input_stream_info.cbAlignment - 1,
&input_buffer);
RETURN_ON_HR_FAILURE(hr, "Failed to create memory buffer for input sample",
hr);
MediaBufferScopedPointer scoped_buffer(input_buffer.Get());
bool copy_succeeded = gpu::CopyD3D11TexToMem(
sample_texture.Get(), scoped_buffer.get(), scoped_buffer.max_length(),
d3d_device.Get(), &staging_texture_);
if (!copy_succeeded) {
LOG(ERROR) << "Failed to copy sample to memory.";
return E_FAIL;
}
size_t copied_bytes =
input_visible_size_.width() * input_visible_size_.height() * 3 / 2;
hr = input_buffer->SetCurrentLength(copied_bytes);
RETURN_ON_HR_FAILURE(hr, "Failed to set current buffer length", hr);
hr = input_sample_->RemoveAllBuffers();
RETURN_ON_HR_FAILURE(hr, "Failed to remove buffers from sample", hr);
hr = input_sample_->AddBuffer(input_buffer.Get());
RETURN_ON_HR_FAILURE(hr, "Failed to add buffer to sample", hr);
return S_OK;
}
// Handle case where video frame is backed by a GPU texture
HRESULT MediaFoundationVideoEncodeAccelerator::PopulateInputSampleBufferGpu(
scoped_refptr<VideoFrame> frame) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK_EQ(frame->storage_type(),
VideoFrame::StorageType::STORAGE_GPU_MEMORY_BUFFER);
DCHECK(frame->HasGpuMemoryBuffer());
DCHECK_EQ(frame->GetGpuMemoryBuffer()->GetType(),
gfx::GpuMemoryBufferType::DXGI_SHARED_HANDLE);
DCHECK(dxgi_device_manager_);
gfx::GpuMemoryBufferHandle buffer_handle =
frame->GetGpuMemoryBuffer()->CloneHandle();
auto d3d_device = dxgi_device_manager_->GetDevice();
if (!d3d_device) {
LOG(ERROR) << "Failed to get device from MF DXGI device manager";
return E_HANDLE;
}
Microsoft::WRL::ComPtr<ID3D11Device1> device1;
HRESULT hr = d3d_device.As(&device1);
RETURN_ON_HR_FAILURE(hr, "Failed to query ID3D11Device1", hr);
Microsoft::WRL::ComPtr<ID3D11Texture2D> input_texture;
hr = device1->OpenSharedResource1(buffer_handle.dxgi_handle.Get(),
IID_PPV_ARGS(&input_texture));
RETURN_ON_HR_FAILURE(hr, "Failed to open shared GMB D3D texture", hr);
// Check if we need to scale the input texture
D3D11_TEXTURE2D_DESC input_desc = {};
input_texture->GetDesc(&input_desc);
Microsoft::WRL::ComPtr<ID3D11Texture2D> sample_texture;
if (input_desc.Width != static_cast<uint32_t>(input_visible_size_.width()) ||
input_desc.Height !=
static_cast<uint32_t>(input_visible_size_.height())) {
hr = PerformD3DScaling(input_texture.Get());
RETURN_ON_HR_FAILURE(hr, "Failed to perform D3D video processing", hr);
sample_texture = scaled_d3d11_texture_;
} else {
sample_texture = input_texture;
}
Microsoft::WRL::ComPtr<IMFMediaBuffer> input_buffer;
hr = MFCreateDXGISurfaceBuffer(__uuidof(ID3D11Texture2D),
sample_texture.Get(), 0, FALSE, &input_buffer);
RETURN_ON_HR_FAILURE(hr, "Failed to create MF DXGI surface buffer", hr);
// Some encoder MFTs (e.g. Qualcomm) depend on the sample buffer having a
// valid current length. Call GetMaxLength() to compute the plane size.
DWORD buffer_length = 0;
hr = input_buffer->GetMaxLength(&buffer_length);
RETURN_ON_HR_FAILURE(hr, "Failed to get max buffer length", hr);
hr = input_buffer->SetCurrentLength(buffer_length);
RETURN_ON_HR_FAILURE(hr, "Failed to set current buffer length", hr);
hr = input_sample_->RemoveAllBuffers();
RETURN_ON_HR_FAILURE(hr, "Failed to remove buffers from sample", hr);
hr = input_sample_->AddBuffer(input_buffer.Get());
RETURN_ON_HR_FAILURE(hr, "Failed to add buffer to sample", hr);
return S_OK;
}
int MediaFoundationVideoEncodeAccelerator::AssignTemporalIdBySvcSpec(
bool keyframe) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
int result = 0;
if (keyframe) {
outputs_since_keyframe_count_ = 0;
}
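// Fixed temporal layer patterns, restarting at each keyframe: L1T2 alternates
// 0, 1 and L1T3 cycles 0, 2, 1, 2.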
switch (num_temporal_layers_) {
case 1:
return 0;
case 2: {
const static std::array<int, 2> kTwoTemporalLayers = {0, 1};
result = kTwoTemporalLayers[outputs_since_keyframe_count_ %
kTwoTemporalLayers.size()];
break;
}
case 3: {
const static std::array<int, 4> kThreeTemporalLayers = {0, 2, 1, 2};
result = kThreeTemporalLayers[outputs_since_keyframe_count_ %
kThreeTemporalLayers.size()];
break;
}
}
outputs_since_keyframe_count_++;
return result;
}
bool MediaFoundationVideoEncodeAccelerator::AssignTemporalId(
Microsoft::WRL::ComPtr<IMFMediaBuffer> output_buffer,
size_t size,
int* temporal_id,
bool keyframe) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
*temporal_id = 0;
// H.264, HEVC, VP9 and AV1 all have hardware SVC support on Windows. For
// H.264 the temporal ID can be parsed from the prefix NALU (7.3.1 NAL unit
// syntax); for AV1 it could be parsed from the OBU extension header (5.3.3),
// which is left as future work. Unfortunately, the VP9 bitstream doesn't
// carry the temporal information, so we can only assign it based on the SVC
// spec.
if (codec_ == VideoCodec::kH264) {
// See the 7.3.1 NAL unit syntax in H264 spec.
// https://www.itu.int/rec/T-REC-H.264
MediaBufferScopedPointer scoped_buffer(output_buffer.Get());
h264_parser_.SetStream(scoped_buffer.get(), size);
H264NALU nalu;
H264Parser::Result result;
while ((result = h264_parser_.AdvanceToNextNALU(&nalu)) !=
H264Parser::kEOStream) {
// Fallback to software when the stream is invalid.
if (result == H264Parser::Result::kInvalidStream) {
return false;
}
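// In the SVC prefix NAL unit (H.264 Annex G), the temporal ID is carried in
// the top three bits of the byte at offset kPrefixNALLocatedBytePos from the
// start of the NAL unit.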
if (nalu.nal_unit_type == H264NALU::kPrefix) {
*temporal_id = (nalu.data[kPrefixNALLocatedBytePos] & 0b1110'0000) >> 5;
return true;
}
}
}
#if BUILDFLAG(ENABLE_PLATFORM_HEVC)
else if (codec_ == VideoCodec::kHEVC) {
// See section 7.3.1.1, NAL unit syntax in H265 spec.
// https://www.itu.int/rec/T-REC-H.265
// Unlike AVC, HEVC stores the temporal ID information in VCL NAL unit
// header instead of using prefix NAL unit.
MediaBufferScopedPointer scoped_buffer(output_buffer.Get());
h265_nalu_parser_.SetStream(scoped_buffer.get(), size);
H265NALU nalu;
H265NaluParser::Result result;
while ((result = h265_nalu_parser_.AdvanceToNextNALU(&nalu)) !=
H265NaluParser::kEOStream) {
if (result == H265NaluParser::Result::kInvalidStream) {
return false;
}
// We only check VCL NAL units
if (nalu.nal_unit_type <= H265NALU::RSV_VCL31) {
*temporal_id = nalu.nuh_temporal_id_plus1 - 1;
return true;
}
}
}
#endif
// If we reach this point, the temporal ID was not assigned by parsing the
// stream (we return true above as soon as a temporal ID is parsed out).
// Assign the ID based on the SVC spec instead.
*temporal_id = AssignTemporalIdBySvcSpec(keyframe);
return true;
}
void MediaFoundationVideoEncodeAccelerator::ProcessOutput() {
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
TRACE_EVENT0("media", "MediaFoundationVideoEncodeAccelerator::ProcessOutput");
MFT_OUTPUT_DATA_BUFFER output_data_buffer = {0};
output_data_buffer.dwStreamID = output_stream_id_;
output_data_buffer.dwStatus = 0;
output_data_buffer.pEvents = nullptr;
output_data_buffer.pSample = nullptr;
DWORD status = 0;
HRESULT hr = encoder_->ProcessOutput(0, 1, &output_data_buffer, &status);
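// MF_E_TRANSFORM_STREAM_CHANGE means the output media type must be
// renegotiated: pick the first available output type and set it again before
// more output can be retrieved.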
if (hr == MF_E_TRANSFORM_STREAM_CHANGE) {
hr = S_OK;
Microsoft::WRL::ComPtr<IMFMediaType> media_type;
for (DWORD type_index = 0; SUCCEEDED(hr); ++type_index) {
hr = encoder_->GetOutputAvailableType(output_stream_id_, type_index,
&media_type);
if (SUCCEEDED(hr)) {
break;
}
}
hr = encoder_->SetOutputType(output_stream_id_, media_type.Get(), 0);
return;
}
RETURN_ON_HR_FAILURE(hr, "Couldn't get encoded data", );
DVLOG(3) << "Got encoded data " << hr;
Microsoft::WRL::ComPtr<IMFMediaBuffer> output_buffer;
hr = output_data_buffer.pSample->GetBufferByIndex(0, &output_buffer);
RETURN_ON_HR_FAILURE(hr, "Couldn't get buffer by index", );
base::TimeDelta timestamp;
LONGLONG sample_time;
hr = output_data_buffer.pSample->GetSampleTime(&sample_time);
if (SUCCEEDED(hr)) {
timestamp =
base::Microseconds(sample_time / kOneMicrosecondInMFSampleTimeUnits);
}
// If `frame_qp` is set here, it will be plumbed down to WebRTC.
// If not set, the QP may be parsed by WebRTC from the bitstream but only if
// the QP is trusted (`encoder_info_.reports_average_qp` is true, which it is
// by default).
absl::optional<int32_t> frame_qp;
bool should_notify_encoder_info_change = false;
// In the case of VP9, `frame_qp_from_sample` is always 0 here
// (https://crbug.com/1434633) so we prefer WebRTC to parse the bitstream for
// us by leaving `frame_qp` unset.
if (codec_ != VideoCodec::kVP9) {
// For HMFTs that continuously report a valid QP, update the encoder info so
// that WebRTC will not use the bandwidth quality scaler for resolution
// adaptation.
uint64_t frame_qp_from_sample = 0xfffful;
hr = output_data_buffer.pSample->GetUINT64(MFSampleExtension_VideoEncodeQP,
&frame_qp_from_sample);
if (vendor_ == DriverVendor::kIntel) {
if (codec_ == VideoCodec::kH264) {
if ((FAILED(hr) || !IsValidQp(codec_, frame_qp_from_sample)) &&
encoder_info_.reports_average_qp) {
should_notify_encoder_info_change = true;
encoder_info_.reports_average_qp = false;
}
} else if (codec_ == VideoCodec::kAV1) {
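// Without the software rate controller there is no trusted per-frame QP
// for the Intel AV1 HMFT, so stop advertising average QP.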
if (!rate_ctrl_) {
encoder_info_.reports_average_qp = false;
}
}
}
// Bits 0-15: Default QP.
if (SUCCEEDED(hr)) {
frame_qp = frame_qp_from_sample & 0xfffful;
}
}
if (!encoder_info_sent_ || should_notify_encoder_info_change) {
client_->NotifyEncoderInfoChange(encoder_info_);
encoder_info_sent_ = true;
}
const bool keyframe = MFGetAttributeUINT32(
output_data_buffer.pSample, MFSampleExtension_CleanPoint, false);
DWORD size = 0;
hr = output_buffer->GetCurrentLength(&size);
RETURN_ON_HR_FAILURE(hr, "Couldn't get buffer length", );
DCHECK_NE(size, 0u);
int temporal_id = 0;
if (!AssignTemporalId(output_buffer, size, &temporal_id, keyframe)) {
NotifyErrorStatus({EncoderStatus::Codes::kEncoderHardwareDriverError,
"Parse temporalId failed"});
return;
}
if (rate_ctrl_) {
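// When software bitrate control is in use, feed the encoded frame size back
// so the controller can adapt the QP of subsequent frames.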
VideoRateControlWrapper::FrameParams frame_params{};
frame_params.frame_type =
keyframe ? VideoRateControlWrapper::FrameParams::FrameType::kKeyFrame
: VideoRateControlWrapper::FrameParams::FrameType::kInterFrame;
frame_params.temporal_layer_id = temporal_id;
// Notify SW BRC about recent encoded frame size.
rate_ctrl_->PostEncodeUpdate(size, frame_params);
}
DVLOG(3) << "Encoded data with size:" << size << " keyframe " << keyframe;
DCHECK(!output_color_spaces_.empty());
auto output_cs = output_color_spaces_.front();
output_color_spaces_.pop_front();
// If no bitstream buffer is available yet, queue the encoded output.
if (bitstream_buffer_queue_.empty()) {
DVLOG(3) << "No bitstream buffers.";
// We need to copy the output so that encoding can continue.
auto encode_output = std::make_unique<EncodeOutput>(
size, keyframe, timestamp, temporal_id, output_cs);
{
MediaBufferScopedPointer scoped_buffer(output_buffer.Get());
memcpy(encode_output->memory(), scoped_buffer.get(), size);
if (frame_qp.has_value() && IsValidQp(codec_, *frame_qp)) {
encode_output->SetQp(*frame_qp);
}
}
encoder_output_queue_.push_back(std::move(encode_output));
output_data_buffer.pSample->Release();
output_data_buffer.pSample = nullptr;
return;
}
// Immediately return encoded buffer with BitstreamBuffer to client.
auto buffer_ref = std::move(bitstream_buffer_queue_.back());
bitstream_buffer_queue_.pop_back();
{
MediaBufferScopedPointer scoped_buffer(output_buffer.Get());
if (!buffer_ref->mapping.IsValid() || !scoped_buffer.get()) {
DLOG(ERROR) << "Failed to copy bitstream media buffer.";
return;
}
memcpy(buffer_ref->mapping.memory(), scoped_buffer.get(), size);
}
output_data_buffer.pSample->Release();
output_data_buffer.pSample = nullptr;
BitstreamBufferMetadata md(size, keyframe, timestamp);
if (frame_qp.has_value() && IsValidQp(codec_, *frame_qp)) {
md.qp = *frame_qp;
}
if (temporal_scalable_coding()) {
if (codec_ == VideoCodec::kH264) {
md.h264.emplace().temporal_idx = temporal_id;
} else if (codec_ == VideoCodec::kHEVC) {
md.h265.emplace().temporal_idx = temporal_id;
}
}
if (output_cs) {
md.encoded_color_space = *output_cs;
}
client_->BitstreamBufferReady(buffer_ref->id, md);
}
void MediaFoundationVideoEncodeAccelerator::MediaEventHandler(
MediaEventType event_type,
HRESULT status) {
DVLOG(3) << __func__;
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK(event_generator_);
if (FAILED(status)) {
NotifyErrorStatus({EncoderStatus::Codes::kSystemAPICallError,
"Media Foundation async error: " + PrintHr(status)});
return;
}
switch (event_type) {
case METransformNeedInput: {
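// An asynchronous MFT only accepts input in response to
// METransformNeedInput, so this is also the earliest point at which the
// encoder is known to be ready.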
if (state_ == kInitializing) {
// The HMFT is not ready to receive inputs until it publishes the first
// METransformNeedInput event.
client_->RequireBitstreamBuffers(kNumInputBuffers, input_visible_size_,
bitstream_buffer_size_);
SetState(kEncoding);
} else if (state_ == kEncoding) {
FeedInputs();
} else if (state_ == kPreFlushing) {
FeedInputs();
if (pending_input_queue_.empty()) {
// All pending inputs have been sent to the MF encoder; tell it to drain
// and produce the remaining outputs.
DrainEncoder();
}
}
break;
}
case METransformHaveOutput: {
ProcessOutput();
break;
}
case METransformDrainComplete: {
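// The encoder has emitted all outputs for the drained inputs. Restart the
// stream so encoding can continue, then report the flush result.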
DCHECK(pending_input_queue_.empty());
DCHECK(encoder_output_queue_.empty());
DCHECK(output_color_spaces_.empty());
DCHECK_EQ(state_, kFlushing);
auto hr = encoder_->ProcessMessage(MFT_MESSAGE_NOTIFY_START_OF_STREAM, 0);
if (FAILED(hr)) {
SetState(kError);
std::move(flush_callback_).Run(false);
return;
}
SetState(kEncoding);
std::move(flush_callback_).Run(true);
break;
}
default:
break;
}
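// BeginGetEvent() delivers a single event, so re-arm it after handling each
// one.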
event_generator_->BeginGetEvent(this, nullptr);
}
void MediaFoundationVideoEncodeAccelerator::SetState(State state) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DVLOG(3) << "Setting state to: " << state;
state_ = state;
}
HRESULT MediaFoundationVideoEncodeAccelerator::InitializeD3DVideoProcessing(
ID3D11Texture2D* input_texture) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
D3D11_TEXTURE2D_DESC input_desc = {};
input_texture->GetDesc(&input_desc);
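// The video processor only depends on the input dimensions (the output size
// is fixed to |input_visible_size_|), so recreate it only when they change.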
if (vp_desc_.InputWidth == input_desc.Width &&
vp_desc_.InputHeight == input_desc.Height) {
return S_OK;
}
// Input/output framerates are dummy values for passthrough.
D3D11_VIDEO_PROCESSOR_CONTENT_DESC vp_desc = {
.InputFrameFormat = D3D11_VIDEO_FRAME_FORMAT_PROGRESSIVE,
.InputFrameRate = {60, 1},
.InputWidth = input_desc.Width,
.InputHeight = input_desc.Height,
.OutputFrameRate = {60, 1},
.OutputWidth = static_cast<UINT>(input_visible_size_.width()),
.OutputHeight = static_cast<UINT>(input_visible_size_.height()),
.Usage = D3D11_VIDEO_USAGE_PLAYBACK_NORMAL};
Microsoft::WRL::ComPtr<ID3D11Device> texture_device;
input_texture->GetDevice(&texture_device);
Microsoft::WRL::ComPtr<ID3D11VideoDevice> video_device;
HRESULT hr = texture_device.As(&video_device);
RETURN_ON_HR_FAILURE(hr, "Failed to query for ID3D11VideoDevice", hr);
Microsoft::WRL::ComPtr<ID3D11VideoProcessorEnumerator>
video_processor_enumerator;
hr = video_device->CreateVideoProcessorEnumerator(
&vp_desc, &video_processor_enumerator);
RETURN_ON_HR_FAILURE(hr, "CreateVideoProcessorEnumerator failed", hr);
Microsoft::WRL::ComPtr<ID3D11VideoProcessor> video_processor;
hr = video_device->CreateVideoProcessor(video_processor_enumerator.Get(), 0,
&video_processor);
RETURN_ON_HR_FAILURE(hr, "CreateVideoProcessor failed", hr);
Microsoft::WRL::ComPtr<ID3D11DeviceContext> device_context;
texture_device->GetImmediateContext(&device_context);
Microsoft::WRL::ComPtr<ID3D11VideoContext> video_context;
hr = device_context.As(&video_context);
RETURN_ON_HR_FAILURE(hr, "Failed to query for ID3D11VideoContext", hr);
// Auto stream processing (the default) can hurt power consumption.
video_context->VideoProcessorSetStreamAutoProcessingMode(
video_processor.Get(), 0, FALSE);
D3D11_TEXTURE2D_DESC scaled_desc = {
.Width = static_cast<UINT>(input_visible_size_.width()),
.Height = static_cast<UINT>(input_visible_size_.height()),
.MipLevels = 1,
.ArraySize = 1,
.Format = DXGI_FORMAT_NV12,
.SampleDesc = {1, 0},
.Usage = D3D11_USAGE_DEFAULT,
.BindFlags = D3D11_BIND_SHADER_RESOURCE | D3D11_BIND_RENDER_TARGET,
.CPUAccessFlags = 0,
.MiscFlags = 0};
Microsoft::WRL::ComPtr<ID3D11Texture2D> scaled_d3d11_texture;
hr = texture_device->CreateTexture2D(&scaled_desc, nullptr,
&scaled_d3d11_texture);
RETURN_ON_HR_FAILURE(hr, "Failed to create texture", hr);
hr = SetDebugName(scaled_d3d11_texture.Get(),
"MFVideoEncodeAccelerator_ScaledTexture");
RETURN_ON_HR_FAILURE(hr, "Failed to set debug name", hr);
D3D11_VIDEO_PROCESSOR_OUTPUT_VIEW_DESC output_desc = {};
output_desc.ViewDimension = D3D11_VPOV_DIMENSION_TEXTURE2D;
output_desc.Texture2D.MipSlice = 0;
Microsoft::WRL::ComPtr<ID3D11VideoProcessorOutputView> vp_output_view;
hr = video_device->CreateVideoProcessorOutputView(
scaled_d3d11_texture.Get(), video_processor_enumerator.Get(),
&output_desc, &vp_output_view);
RETURN_ON_HR_FAILURE(hr, "CreateVideoProcessorOutputView failed", hr);
video_device_ = std::move(video_device);
video_processor_enumerator_ = std::move(video_processor_enumerator);
video_processor_ = std::move(video_processor);
video_context_ = std::move(video_context);
vp_desc_ = std::move(vp_desc);
scaled_d3d11_texture_ = std::move(scaled_d3d11_texture);
vp_output_view_ = std::move(vp_output_view);
return S_OK;
}
HRESULT MediaFoundationVideoEncodeAccelerator::PerformD3DScaling(
ID3D11Texture2D* input_texture) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
HRESULT hr = InitializeD3DVideoProcessing(input_texture);
RETURN_ON_HR_FAILURE(hr, "Couldn't initialize D3D video processing", hr);
// Set the color space for passthrough.
auto src_color_space = gfx::ColorSpace::CreateSRGB();
auto output_color_space = gfx::ColorSpace::CreateSRGB();
D3D11_VIDEO_PROCESSOR_COLOR_SPACE src_d3d11_color_space =
gfx::ColorSpaceWin::GetD3D11ColorSpace(src_color_space);
video_context_->VideoProcessorSetStreamColorSpace(video_processor_.Get(), 0,
&src_d3d11_color_space);
D3D11_VIDEO_PROCESSOR_COLOR_SPACE output_d3d11_color_space =
gfx::ColorSpaceWin::GetD3D11ColorSpace(output_color_space);
video_context_->VideoProcessorSetOutputColorSpace(video_processor_.Get(),
&output_d3d11_color_space);
{
absl::optional<gpu::DXGIScopedReleaseKeyedMutex> release_keyed_mutex;
Microsoft::WRL::ComPtr<IDXGIKeyedMutex> keyed_mutex;
hr = input_texture->QueryInterface(IID_PPV_ARGS(&keyed_mutex));
if (SUCCEEDED(hr)) {
// The producer may still be using this texture for a short period of
// time, so wait long enough to hopefully avoid glitches. For example,
// all levels of the texture share the same keyed mutex, so if the
// hardware decoder acquired the mutex to decode into a different array
// level then it still may block here temporarily.
constexpr int kMaxSyncTimeMs = 100;
hr = keyed_mutex->AcquireSync(0, kMaxSyncTimeMs);
RETURN_ON_HR_FAILURE(hr, "Failed to acquire keyed mutex", hr);
release_keyed_mutex.emplace(std::move(keyed_mutex), 0);
}
// Set up |video_context_| for the VideoProcessorBlt operation.
D3D11_VIDEO_PROCESSOR_INPUT_VIEW_DESC input_desc = {};
input_desc.ViewDimension = D3D11_VPIV_DIMENSION_TEXTURE2D;
input_desc.Texture2D.ArraySlice = 0;
Microsoft::WRL::ComPtr<ID3D11VideoProcessorInputView> input_view;
hr = video_device_->CreateVideoProcessorInputView(
input_texture, video_processor_enumerator_.Get(), &input_desc,
&input_view);
RETURN_ON_HR_FAILURE(hr, "CreateVideoProcessorInputView failed", hr);
D3D11_VIDEO_PROCESSOR_STREAM stream = {.Enable = true,
.OutputIndex = 0,
.InputFrameOrField = 0,
.PastFrames = 0,
.FutureFrames = 0,
.pInputSurface = input_view.Get()};
D3D11_TEXTURE2D_DESC input_texture_desc = {};
input_texture->GetDesc(&input_texture_desc);
RECT source_rect = {0, 0, static_cast<LONG>(input_texture_desc.Width),
static_cast<LONG>(input_texture_desc.Height)};
video_context_->VideoProcessorSetStreamSourceRect(video_processor_.Get(), 0,
TRUE, &source_rect);
D3D11_TEXTURE2D_DESC output_texture_desc = {};
scaled_d3d11_texture_->GetDesc(&output_texture_desc);
RECT dest_rect = {0, 0, static_cast<LONG>(output_texture_desc.Width),
static_cast<LONG>(output_texture_desc.Height)};
video_context_->VideoProcessorSetOutputTargetRect(video_processor_.Get(),
TRUE, &dest_rect);
video_context_->VideoProcessorSetStreamDestRect(video_processor_.Get(), 0,
TRUE, &dest_rect);
hr = video_context_->VideoProcessorBlt(
video_processor_.Get(), vp_output_view_.Get(), 0, 1, &stream);
RETURN_ON_HR_FAILURE(hr, "VideoProcessorBlt failed", hr);
}
return hr;
}
HRESULT MediaFoundationVideoEncodeAccelerator::GetParameters(DWORD* pdwFlags,
DWORD* pdwQueue) {
// The heavy lifting is posted to |task_runner_| from Invoke(), so the
// callback itself is cheap and can run on the standard MF work queue.
*pdwFlags = MFASYNC_FAST_IO_PROCESSING_CALLBACK;
*pdwQueue = MFASYNC_CALLBACK_QUEUE_STANDARD;
return S_OK;
}
HRESULT MediaFoundationVideoEncodeAccelerator::Invoke(
IMFAsyncResult* pAsyncResult) {
Microsoft::WRL::ComPtr<IMFMediaEvent> media_event;
RETURN_IF_FAILED(event_generator_->EndGetEvent(pAsyncResult, &media_event));
MediaEventType event_type = MEUnknown;
RETURN_IF_FAILED(media_event->GetType(&event_type));
HRESULT status = S_OK;
media_event->GetStatus(&status);
// Invoke() is called on some random OS thread, so we must post to our event
// handler since MediaFoundationVideoEncodeAccelerator is single threaded.
task_runner_->PostTask(
FROM_HERE,
base::BindOnce(&MediaFoundationVideoEncodeAccelerator::MediaEventHandler,
weak_ptr_, event_type, status));
return status;
}
ULONG MediaFoundationVideoEncodeAccelerator::AddRef() {
return async_callback_ref_.Increment();
}
ULONG MediaFoundationVideoEncodeAccelerator::Release() {
DCHECK(!async_callback_ref_.IsOne());
return async_callback_ref_.Decrement() ? 1 : 0;
}
HRESULT MediaFoundationVideoEncodeAccelerator::QueryInterface(REFIID riid,
void** ppv) {
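// QISearch() requires a zero-terminated table; the trailing {0} entry
// provides the terminator.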
static const QITAB kQI[] = {
QITABENT(MediaFoundationVideoEncodeAccelerator, IMFAsyncCallback), {0}};
return QISearch(this, kQI, riid, ppv);
}
void MediaFoundationVideoEncodeAccelerator::SetEncoderColorSpace() {
DCHECK(encoder_color_space_);
if (!encoder_color_space_->IsValid()) {
return;
}
MFVideoPrimaries primary;
MFVideoTransferFunction transfer;
MFVideoTransferMatrix matrix;
MFNominalRange range;
GetMediaTypeColorValues(*encoder_color_space_, &primary, &transfer, &matrix,
&range);
// Set appropriate color space keys. Note: This may do nothing depending on
// the hardware MFT. If the MFT does not support color space info, it is
// expected to either write no color info into the bitstream or write the
// values for UNSPECIFIED (see VideoColorSpace).
auto set_color_space = [&](IMFMediaType* type) {
auto hr = type->SetUINT32(MF_MT_VIDEO_PRIMARIES, primary);
RETURN_ON_HR_FAILURE(hr, "Couldn't set primaries", hr);
hr = type->SetUINT32(MF_MT_TRANSFER_FUNCTION, transfer);
RETURN_ON_HR_FAILURE(hr, "Couldn't set transfer", hr);
hr = type->SetUINT32(MF_MT_YUV_MATRIX, matrix);
RETURN_ON_HR_FAILURE(hr, "Couldn't set matrix", hr);
hr = type->SetUINT32(MF_MT_VIDEO_NOMINAL_RANGE, range);
RETURN_ON_HR_FAILURE(hr, "Couldn't set range", hr);
return hr;
};
// Set input and output color spaces to the same value so we don't
// inadvertently enable any kind of color space conversion.
RETURN_ON_HR_FAILURE(set_color_space(imf_output_media_type_.Get()),
"Couldn't set output color space", );
RETURN_ON_HR_FAILURE(encoder_->SetOutputType(output_stream_id_,
imf_output_media_type_.Get(), 0),
"Couldn't change output media type", );
RETURN_ON_HR_FAILURE(set_color_space(imf_input_media_type_.Get()),
"Couldn't set input color space", );
RETURN_ON_HR_FAILURE(
encoder_->SetInputType(input_stream_id_, imf_input_media_type_.Get(), 0),
"Couldn't change input media type", );
DVLOG(1) << "Set encoder color space to: "
<< encoder_color_space_->ToString();
}
} // namespace media