 // media/gpu/v4l2/v4l2_video_encode_accelerator.cc - chromium/src - Git at Google

 // Copyright 2014 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "media/gpu/v4l2/v4l2_video_encode_accelerator.h"

 #include <fcntl.h>
 #include <linux/videodev2.h>
 #include <poll.h>
 #include <string.h>
 #include <sys/eventfd.h>
 #include <sys/ioctl.h>
 #include <sys/mman.h>

 #include <numeric>
 #include <utility>

 #include "base/bind.h"
 #include "base/bits.h"
 #include "base/callback.h"
 #include "base/callback_helpers.h"
 #include "base/command_line.h"
 #include "base/numerics/safe_conversions.h"
 #include "base/single_thread_task_runner.h"
 #include "base/stl_util.h"
 #include "base/threading/thread_task_runner_handle.h"
 #include "base/trace_event/trace_event.h"
 #include "media/base/bind_to_current_loop.h"
 #include "media/base/bitstream_buffer.h"
 #include "media/base/color_plane_layout.h"
 #include "media/base/scopedfd_helper.h"
 #include "media/base/unaligned_shared_memory.h"
 #include "media/base/video_frame_layout.h"
 #include "media/base/video_types.h"
 #include "media/gpu/chromeos/fourcc.h"
 #include "media/gpu/gpu_video_encode_accelerator_helpers.h"
 #include "media/gpu/image_processor_factory.h"
 #include "media/gpu/linux/platform_video_frame_utils.h"
 #include "media/gpu/macros.h"
 #include "media/video/h264_level_limits.h"
 #include "media/video/h264_parser.h"

 // Logs the error code |x| and passes it to SetErrorState(). Only usable where
 // SetErrorState() is in scope.
 #define NOTIFY_ERROR(x)                      \
   do {                                       \
     VLOGF(1) << "Setting error state:" << x; \
     SetErrorState(x);                        \
   } while (0)

 // Issues device_->Ioctl(type, arg). On a non-zero result it logs |type_str|
 // (VPLOGF is presumably the errno-appending variant of VLOGF -- confirm in
 // media/gpu/macros.h), reports kPlatformFailureError through NOTIFY_ERROR and
 // returns |value| from the *enclosing* function.
 #define IOCTL_OR_ERROR_RETURN_VALUE(type, arg, value, type_str) \
   do {                                                          \
     if (device_->Ioctl(type, arg) != 0) {                       \
       VPLOGF(1) << "ioctl() failed: " << type_str;              \
       NOTIFY_ERROR(kPlatformFailureError);                      \
       return value;                                             \
     }                                                           \
   } while (0)

 // Variant for functions returning void: "return ((void)0);" is a plain return.
 #define IOCTL_OR_ERROR_RETURN(type, arg) \
   IOCTL_OR_ERROR_RETURN_VALUE(type, arg, ((void)0), #type)

 // Variant for functions returning bool: returns false when the ioctl fails.
 #define IOCTL_OR_ERROR_RETURN_FALSE(type, arg) \
   IOCTL_OR_ERROR_RETURN_VALUE(type, arg, false, #type)

 // Best-effort variant: a failing ioctl is only logged; no error state is set
 // and the enclosing function keeps running.
 #define IOCTL_OR_LOG_ERROR(type, arg)              \
   do {                                             \
     if (device_->Ioctl(type, arg) != 0)            \
       VPLOGF(1) << "ioctl() failed: " << #type;    \
   } while (0)

 namespace {
 // Four-byte H.264 start code written in front of every NALU copied below.
 const uint8_t kH264StartCode[] = {0, 0, 0, 1};
 const size_t kH264StartCodeSize = sizeof(kH264StartCode);

 // Writes a H.264 start code followed by the |src_size| bytes of the NALU at
 // |src| (which carries no start code itself) to |*dst|. |*dst_size| is the
 // space available at |*dst|.
 // On success |*dst| is advanced past the written bytes and |*dst_size| is
 // reduced by the same amount. If start code plus NALU do not fit, nothing is
 // written and both out-parameters are left untouched.
 static void CopyNALUPrependingStartCode(const uint8_t* src,
                                         size_t src_size,
                                         uint8_t** dst,
                                         size_t* dst_size) {
   const size_t bytes_needed = kH264StartCodeSize + src_size;
   if (*dst_size < bytes_needed) {
     VLOGF(1) << "Could not copy a NALU, not enough space in destination buffer";
     return;
   }

   uint8_t* write_ptr = *dst;
   memcpy(write_ptr, kH264StartCode, kH264StartCodeSize);
   write_ptr += kH264StartCodeSize;
   memcpy(write_ptr, src, src_size);
   write_ptr += src_size;

   // Publish the new cursor and the remaining capacity to the caller.
   *dst = write_ptr;
   *dst_size -= bytes_needed;
 }
 }  // namespace

 namespace media {

 // Pairs the id of a client-provided bitstream buffer with the shared memory
 // object backing it. Both members are const, so a BitstreamBufferRef is fixed
 // at construction time.
 struct V4L2VideoEncodeAccelerator::BitstreamBufferRef {
   // Takes ownership of |shm|.
   BitstreamBufferRef(int32_t id, std::unique_ptr<UnalignedSharedMemory> shm)
       : id(id), shm(std::move(shm)) {}
   // Id of the BitstreamBuffer this object was created from.
   const int32_t id;
   // Shared memory the encoded data is copied into (see
   // CopyIntoOutputBuffer()).
   const std::unique_ptr<UnalignedSharedMemory> shm;
 };

 // InputRecord's special members are compiler-generated but defined
 // out-of-line in this file.
 V4L2VideoEncodeAccelerator::InputRecord::InputRecord() = default;

 // Member-wise copy.
 V4L2VideoEncodeAccelerator::InputRecord::InputRecord(const InputRecord&) =
     default;

 V4L2VideoEncodeAccelerator::InputRecord::~InputRecord() = default;

 // Creates an entry with no frame and no keyframe request. A null |frame| is
 // what the encoder queues treat as a flush marker (see FlushTask()).
 V4L2VideoEncodeAccelerator::InputFrameInfo::InputFrameInfo()
     : InputFrameInfo(nullptr, false) {}

 // Creates an entry for |frame| that does not reference an image processor
 // output buffer. |frame| is taken by value, so it is moved into the member
 // rather than copied to avoid a redundant reference count round trip.
 V4L2VideoEncodeAccelerator::InputFrameInfo::InputFrameInfo(
     scoped_refptr<VideoFrame> frame,
     bool force_keyframe)
     : frame(std::move(frame)), force_keyframe(force_keyframe) {}

 // Creates an entry for a |frame| produced by the image processor; |index| is
 // the image processor output buffer the frame occupies.
 V4L2VideoEncodeAccelerator::InputFrameInfo::InputFrameInfo(
     scoped_refptr<VideoFrame> frame,
     bool force_keyframe,
     size_t index)
     : frame(std::move(frame)),
       force_keyframe(force_keyframe),
       ip_output_buffer_index(index) {}

 // Member-wise copy.
 V4L2VideoEncodeAccelerator::InputFrameInfo::InputFrameInfo(
     const InputFrameInfo&) = default;

 V4L2VideoEncodeAccelerator::InputFrameInfo::~InputFrameInfo() = default;

 // Binds the accelerator to |device| and to the task runner of the constructing
 // thread (|child_task_runner_|). No device access happens here; the encoder
 // starts in kUninitialized state with USERPTR input memory as the initial
 // assumption (InitInputMemoryType() picks the real value later).
 V4L2VideoEncodeAccelerator::V4L2VideoEncodeAccelerator(
     const scoped_refptr<V4L2Device>& device)
     : child_task_runner_(base::ThreadTaskRunnerHandle::Get()),
       output_buffer_byte_size_(0),
       output_format_fourcc_(0),
       encoder_state_(kUninitialized),
       device_(device),
       input_memory_type_(V4L2_MEMORY_USERPTR),
       is_flush_supported_(false),
       encoder_thread_("V4L2EncoderThread"),
       device_poll_thread_("V4L2EncoderDevicePollThread"),
       weak_this_ptr_factory_(this) {
   // Cache a weak pointer to |this| for later use.
   weak_this_ = weak_this_ptr_factory_.GetWeakPtr();
 }

 // Both worker threads must already be stopped when the object is destroyed;
 // Destroy() stops the encoder thread before executing "delete this".
 V4L2VideoEncodeAccelerator::~V4L2VideoEncodeAccelerator() {
   DCHECK(!encoder_thread_.IsRunning());
   DCHECK(!device_poll_thread_.IsRunning());
   VLOGF(2);
 }

 // Opens the encoder device for |config.output_profile|, checks its
 // capabilities, starts the encoder thread and then blocks until
 // InitializeTask() has run on that thread.
 // Returns false if the profile has no V4L2 pixel format, the device cannot be
 // opened, the capability query fails or lacks a required capability, or the
 // encoder thread cannot be started; otherwise returns the result written by
 // InitializeTask().
 bool V4L2VideoEncodeAccelerator::Initialize(const Config& config,
                                             Client* client) {
   TRACE_EVENT0("media,gpu", "V4L2VEA::Initialize");
   VLOGF(2) << ": " << config.AsHumanReadableString();

   visible_size_ = config.input_visible_size;

   // |client_| is a weak pointer; Destroy() resets the factory to cancel any
   // callbacks still addressed to the client.
   client_ptr_factory_.reset(new base::WeakPtrFactory<Client>(client));
   client_ = client_ptr_factory_->GetWeakPtr();

   DCHECK(child_task_runner_->BelongsToCurrentThread());
   DCHECK_EQ(encoder_state_, kUninitialized);

   // A zero fourcc means the profile has no corresponding V4L2 pixel format.
   output_format_fourcc_ =
       V4L2Device::VideoCodecProfileToV4L2PixFmt(config.output_profile, false);
   if (!output_format_fourcc_) {
     VLOGF(1) << "invalid output_profile="
              << GetProfileName(config.output_profile);
     return false;
   }

   if (!device_->Open(V4L2Device::Type::kEncoder, output_format_fourcc_)) {
     VLOGF(1) << "Failed to open device for profile="
              << GetProfileName(config.output_profile)
              << ", fourcc=" << FourccToString(output_format_fourcc_);
     return false;
   }

   // Ask if V4L2_ENC_CMD_STOP (Flush) is supported.
   struct v4l2_encoder_cmd cmd = {};
   cmd.cmd = V4L2_ENC_CMD_STOP;
   is_flush_supported_ = (device_->Ioctl(VIDIOC_TRY_ENCODER_CMD, &cmd) == 0);
   if (!is_flush_supported_)
     VLOGF(2) << "V4L2_ENC_CMD_STOP is not supported.";

   // The device must be a multi-planar memory-to-memory device that supports
   // streaming I/O. A failing VIDIOC_QUERYCAP also raises kPlatformFailureError
   // through the macro.
   struct v4l2_capability caps {};
   const __u32 kCapsRequired = V4L2_CAP_VIDEO_M2M_MPLANE | V4L2_CAP_STREAMING;
   IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYCAP, &caps);
   if ((caps.capabilities & kCapsRequired) != kCapsRequired) {
     VLOGF(1) << "caps check failed: 0x" << std::hex << caps.capabilities;
     return false;
   }

   if (!encoder_thread_.Start()) {
     VLOGF(1) << "encoder thread failed to start";
     return false;
   }

   // Run the remaining initialization on the encoder thread. |result| and
   // |done| live on this stack frame, which is safe because we block on |done|
   // until InitializeTask() has signalled it.
   bool result = false;
   base::WaitableEvent done;
   encoder_thread_.task_runner()->PostTask(
       FROM_HERE,
       base::BindOnce(&V4L2VideoEncodeAccelerator::InitializeTask,
                      base::Unretained(this), config, &result, &done));
   done.Wait();
   return result;
 }

 // Encoder-thread half of Initialize(): acquires the V4L2 queues, negotiates
 // formats, creates an image processor when the client's input format differs
 // from the device's, sets up controls and output buffers, and finally asks the
 // client for bitstream buffers.
 // |*result| is set to true only when every step succeeded. |done| is signalled
 // on every exit path so that Initialize() can stop waiting.
 void V4L2VideoEncodeAccelerator::InitializeTask(const Config& config,
                                                 bool* result,
                                                 base::WaitableEvent* done) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   // Signal the event when leaving the method.
   base::ScopedClosureRunner signal_event(
       base::BindOnce(&base::WaitableEvent::Signal, base::Unretained(done)));
   *result = false;

   // V4L2 memory-to-memory naming: the OUTPUT queue carries the raw frames fed
   // to the encoder, the CAPTURE queue carries the encoded bitstream.
   input_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE);
   output_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE);
   if (!input_queue_ || !output_queue_) {
     VLOGF(1) << "Failed to get V4L2Queue.";
     NOTIFY_ERROR(kPlatformFailureError);
     return;
   }

   if (!SetFormats(config.input_format, config.output_profile)) {
     VLOGF(1) << "Failed setting up formats";
     return;
   }

   // The device settled on a different input format than the client delivers:
   // insert an image processor that converts between the two.
   if (config.input_format != device_input_layout_->format()) {
     VLOGF(2) << "Input format: " << config.input_format << " is not supported "
              << "by the HW. Will try to convert to "
              << device_input_layout_->format();

     // TODO(hiroh): Decide the appropriate planar in some way.
     auto input_layout = VideoFrameLayout::CreateMultiPlanar(
         config.input_format, visible_size_,
         std::vector<ColorPlaneLayout>(
             VideoFrame::NumPlanes(config.input_format)));
     if (!input_layout) {
       VLOGF(1) << "Invalid image processor input layout";
       return;
     }

     if (!CreateImageProcessor(*input_layout, *device_input_layout_,
                               visible_size_)) {
       VLOGF(1) << "Failed to create image processor";
       return;
     }
   }

   if (!InitInputMemoryType(config))
     return;
   if (!InitControls(config))
     return;
   if (!CreateOutputBuffers())
     return;

   encoder_state_ = kInitialized;
   // Apply the initial bitrate/framerate directly; we are already on the
   // encoder thread.
   RequestEncodingParametersChangeTask(
       config.initial_bitrate, config.initial_framerate.value_or(
                                   VideoEncodeAccelerator::kDefaultFramerate));
   // Tell the client how many input frames to provide, their coded size and the
   // required bitstream buffer size. With an image processor the client feeds
   // the processor, so its input coded size is the one that matters.
   child_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(
           &Client::RequireBitstreamBuffers, client_, kInputBufferCount,
           image_processor_.get() ? image_processor_->input_layout().coded_size()
                                  : input_allocated_size_,
           output_buffer_byte_size_));

   // Finish initialization.
   *result = true;
 }

 // Creates |image_processor_| converting frames from |input_layout| to
 // |output_layout| (the encoder's input layout), validates the coded size the
 // processor will output, resets the list of free processor output buffers and
 // allocates those buffers when required.
 // Returns false if the processor cannot be created, its output coded size is
 // incompatible with |output_layout|, or buffer allocation fails.
 bool V4L2VideoEncodeAccelerator::CreateImageProcessor(
     const VideoFrameLayout& input_layout,
     const VideoFrameLayout& output_layout,
     const gfx::Size& visible_size) {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK_NE(input_layout.format(), output_layout.format());

   // Convert from |config.input_format| to |device_input_layout_->format()|,
   // keeping the size at |visible_size| and requiring the output buffers to
   // be of at least |device_input_layout_->coded_size()|.
   // |input_storage_type| can be STORAGE_SHMEM and STORAGE_MOJO_SHARED_BUFFER.
   // However, it doesn't matter VideoFrame::STORAGE_OWNED_MEMORY is specified
   // for |input_storage_type| here, as long as VideoFrame on Process()'s data
   // can be accessed by VideoFrame::data().
   image_processor_ = ImageProcessorFactory::Create(
       ImageProcessor::PortConfig(input_layout, visible_size,
                                  {VideoFrame::STORAGE_OWNED_MEMORY}),
       ImageProcessor::PortConfig(
           output_layout, visible_size,
           {VideoFrame::STORAGE_DMABUFS, VideoFrame::STORAGE_OWNED_MEMORY}),
       // Try OutputMode::ALLOCATE first because we want v4l2IP chooses
       // ALLOCATE mode. For libyuvIP, it accepts only IMPORT.
       {ImageProcessor::OutputMode::ALLOCATE,
        ImageProcessor::OutputMode::IMPORT},
       kImageProcBufferCount,
       // Unretained(this) is safe here, because image_processor is destroyed
       // before video_encoder_thread stops.
       BindToCurrentLoop(
           base::BindRepeating(&V4L2VideoEncodeAccelerator::ImageProcessorError,
                               base::Unretained(this))));
   if (!image_processor_) {
     VLOGF(1) << "Failed initializing image processor";
     return false;
   }

   // The output of image processor is the input of encoder. Output coded
   // width of processor must be the same as input coded width of encoder.
   // Output coded height of processor can be larger but not smaller than the
   // input coded height of encoder. For example, suppose input size of encoder
   // is 320x193. It is OK if the output of processor is 320x208.
   const auto& ip_output_size = image_processor_->output_layout().coded_size();
   if (ip_output_size.width() != output_layout.coded_size().width() ||
       ip_output_size.height() < output_layout.coded_size().height()) {
     VLOGF(1) << "Invalid image processor output coded size "
              << ip_output_size.ToString() << ", expected output coded size is "
              << output_layout.coded_size().ToString();
     return false;
   }

   // Initialize |free_image_processor_output_buffer_indices_|.
   // All indices 0..kImageProcBufferCount-1 start out free.
   free_image_processor_output_buffer_indices_.resize(kImageProcBufferCount);
   std::iota(free_image_processor_output_buffer_indices_.begin(),
             free_image_processor_output_buffer_indices_.end(), 0);
   return AllocateImageProcessorOutputBuffers(kImageProcBufferCount,
                                              visible_size);
 }

 // Allocates |count| output frames for |image_processor_| when it works in
 // IMPORT mode, i.e. when the frames it writes into are supplied by us. In any
 // other mode there is nothing to allocate and the call succeeds immediately.
 // Frames use |device_input_layout_| with a visible area of |visible_size|.
 // Returns false if a frame cannot be created or the image processor's output
 // storage type is not supported.
 bool V4L2VideoEncodeAccelerator::AllocateImageProcessorOutputBuffers(
     size_t count,
     const gfx::Size& visible_size) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(image_processor_);
   // Allocate VideoFrames for image processor output if its mode is IMPORT.
   if (image_processor_->output_mode() != ImageProcessor::OutputMode::IMPORT) {
     return true;
   }

   image_processor_output_buffers_.resize(count);
   const auto output_storage_type = image_processor_->output_storage_type();
   // After the resize above the container holds exactly |count| slots.
   for (auto& output_buffer : image_processor_output_buffers_) {
     switch (output_storage_type) {
       case VideoFrame::STORAGE_OWNED_MEMORY:
         output_buffer = VideoFrame::CreateFrameWithLayout(
             *device_input_layout_, gfx::Rect(visible_size), visible_size,
             base::TimeDelta(), true);
         if (!output_buffer) {
           VLOGF(1) << "Failed to create VideoFrame";
           return false;
         }
         break;
       // TODO(crbug.com/910590): Support VideoFrame::STORAGE_DMABUFS.
       default:
         VLOGF(1) << "Unsupported output storage type of image processor: "
                  << output_storage_type;
         return false;
     }
   }
   return true;
 }

 // Chooses the V4L2 memory type of the encoder's input queue. Without an image
 // processor the choice follows the client's |config.storage_type| (shared
 // memory when unspecified); with one it follows the storage type of the frames
 // the image processor outputs.
 // Returns false only when the image processor outputs frames that are neither
 // DMABUF-backed nor mappable.
 bool V4L2VideoEncodeAccelerator::InitInputMemoryType(const Config& config) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   if (!image_processor_) {
     // Frames arrive straight from the client.
     const auto client_storage =
         config.storage_type.value_or(Config::StorageType::kShmem);
     if (client_storage == Config::StorageType::kShmem)
       input_memory_type_ = V4L2_MEMORY_USERPTR;
     else if (client_storage == Config::StorageType::kDmabuf)
       input_memory_type_ = V4L2_MEMORY_DMABUF;
     return true;
   }

   // Frames arrive from the image processor.
   const auto ip_storage = image_processor_->output_storage_type();
   if (ip_storage == VideoFrame::STORAGE_DMABUFS) {
     input_memory_type_ = V4L2_MEMORY_DMABUF;
     return true;
   }
   if (VideoFrame::IsStorageTypeMappable(ip_storage)) {
     input_memory_type_ = V4L2_MEMORY_USERPTR;
     return true;
   }

   VLOGF(1) << "Unsupported image processor's output StorageType: "
            << ip_storage;
   return false;
 }

 // Error callback handed to the image processor in CreateImageProcessor().
 // Any image processor failure is reported as a platform failure.
 void V4L2VideoEncodeAccelerator::ImageProcessorError() {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   VLOGF(1) << "Image processor error";
   NOTIFY_ERROR(kPlatformFailureError);
 }

 // Client entry point (child thread): queues |frame| for encoding by
 // forwarding it, together with |force_keyframe|, to EncodeTask() on the
 // encoder thread.
 void V4L2VideoEncodeAccelerator::Encode(scoped_refptr<VideoFrame> frame,
                                         bool force_keyframe) {
   DVLOGF(4) << "force_keyframe=" << force_keyframe;
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   auto encode_closure =
       base::BindOnce(&V4L2VideoEncodeAccelerator::EncodeTask,
                      base::Unretained(this), std::move(frame), force_keyframe);
   encoder_thread_.task_runner()->PostTask(FROM_HERE,
                                           std::move(encode_closure));
 }

 // Client entry point (child thread): hands |buffer| over to
 // UseOutputBitstreamBufferTask() on the encoder thread.
 void V4L2VideoEncodeAccelerator::UseOutputBitstreamBuffer(
     BitstreamBuffer buffer) {
   DVLOGF(4) << "id=" << buffer.id();
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   auto use_buffer_closure =
       base::BindOnce(&V4L2VideoEncodeAccelerator::UseOutputBitstreamBufferTask,
                      base::Unretained(this), std::move(buffer));
   encoder_thread_.task_runner()->PostTask(FROM_HERE,
                                           std::move(use_buffer_closure));
 }

 // Client entry point (child thread): forwards the requested |bitrate| and
 // |framerate| to RequestEncodingParametersChangeTask() on the encoder thread.
 void V4L2VideoEncodeAccelerator::RequestEncodingParametersChange(
     uint32_t bitrate,
     uint32_t framerate) {
   VLOGF(2) << "bitrate=" << bitrate << ", framerate=" << framerate;
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   auto change_closure = base::BindOnce(
       &V4L2VideoEncodeAccelerator::RequestEncodingParametersChangeTask,
       base::Unretained(this), bitrate, framerate);
   encoder_thread_.task_runner()->PostTask(FROM_HERE,
                                           std::move(change_closure));
 }

 // Tears the accelerator down and deletes it. Must be called on the child
 // thread; the object must not be touched after this returns.
 // Order matters: pending callbacks are cancelled first, DestroyTask() then
 // runs (on the encoder thread when that thread is running), the encoder thread
 // is joined, a pending flush is failed, and finally the object is deleted.
 void V4L2VideoEncodeAccelerator::Destroy() {
   VLOGF(2);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   // We're destroying; cancel all callbacks.
   client_ptr_factory_.reset();
   weak_this_ptr_factory_.InvalidateWeakPtrs();

   // If the encoder thread is running, destroy using posted task.
   if (encoder_thread_.IsRunning()) {
     encoder_thread_.task_runner()->PostTask(
         FROM_HERE, base::BindOnce(&V4L2VideoEncodeAccelerator::DestroyTask,
                                   base::Unretained(this)));
     // DestroyTask() will put the encoder into kError state and cause all tasks
     // to no-op.
     encoder_thread_.Stop();
   } else {
     // Otherwise, call the destroy task directly.
     DestroyTask();
   }

   // If a flush is pending, notify client that it did not finish.
   // This runs after the encoder thread has been stopped (or was never
   // running), so nothing else accesses |flush_callback_| concurrently.
   if (flush_callback_)
     std::move(flush_callback_).Run(false);

   // Set to kError state just in case.
   encoder_state_ = kError;

   delete this;
 }

 // Client entry point (child thread): requests a flush by forwarding
 // |flush_callback| to FlushTask() on the encoder thread.
 void V4L2VideoEncodeAccelerator::Flush(FlushCallback flush_callback) {
   VLOGF(2);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   auto flush_closure =
       base::BindOnce(&V4L2VideoEncodeAccelerator::FlushTask,
                      base::Unretained(this), std::move(flush_callback));
   encoder_thread_.task_runner()->PostTask(FROM_HERE,
                                           std::move(flush_closure));
 }

 // Encoder-thread half of Flush(). A flush is accepted only while encoding and
 // only when no other flush is outstanding; otherwise the encoder enters the
 // illegal-state error and |flush_callback| is posted to the child thread with
 // |false|. An accepted flush is recorded in |flush_callback_| and signalled to
 // the pipeline as a null frame.
 void V4L2VideoEncodeAccelerator::FlushTask(FlushCallback flush_callback) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   const bool flush_allowed = !flush_callback_ && encoder_state_ == kEncoding;
   if (!flush_allowed) {
     VLOGF(1) << "Flush failed: there is a pending flush, "
              << "or VideoEncodeAccelerator is not in kEncoding state";
     NOTIFY_ERROR(kIllegalStateError);
     auto report_failure = base::BindOnce(std::move(flush_callback), false);
     child_task_runner_->PostTask(FROM_HERE, std::move(report_failure));
     return;
   }

   flush_callback_ = std::move(flush_callback);
   // A null frame travelling through the input queues marks the flush point.
   EncodeTask(nullptr, false);
 }

 // Returns whether the device accepted V4L2_ENC_CMD_STOP when probed with
 // VIDIOC_TRY_ENCODER_CMD in Initialize(); false before Initialize() has run.
 bool V4L2VideoEncodeAccelerator::IsFlushSupported() {
   return is_flush_supported_;
 }

 // Returns the encode profiles reported by a freshly created V4L2Device, or an
 // empty list when no device can be created.
 VideoEncodeAccelerator::SupportedProfiles
 V4L2VideoEncodeAccelerator::GetSupportedProfiles() {
   scoped_refptr<V4L2Device> probe_device = V4L2Device::Create();
   if (probe_device)
     return probe_device->GetSupportedEncodeProfiles();

   return SupportedProfiles();
 }

 // Completion callback of the image processor (bound in
 // InputImageProcessorTask()). Queues the converted |frame| for the encoder,
 // remembering which image processor output buffer it occupies, and schedules
 // Enqueue() on the encoder thread.
 // NOTE(review): |timestamp| is bound by the caller but not used here.
 void V4L2VideoEncodeAccelerator::FrameProcessed(
     bool force_keyframe,
     base::TimeDelta timestamp,
     size_t output_buffer_index,
     scoped_refptr<VideoFrame> frame) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DVLOGF(4) << "force_keyframe=" << force_keyframe
             << ", output_buffer_index=" << output_buffer_index;
   // NOTE(review): |output_buffer_index| is a size_t, so this check can never
   // fail.
   DCHECK_GE(output_buffer_index, 0u);

   encoder_input_queue_.emplace(std::move(frame), force_keyframe,
                                output_buffer_index);
   encoder_thread_.task_runner()->PostTask(
       FROM_HERE, base::BindOnce(&V4L2VideoEncodeAccelerator::Enqueue,
                                 base::Unretained(this)));
 }

 // Marks image processor output buffer |output_buffer_index| as free again and
 // immediately tries to feed the next waiting frame to the image processor.
 void V4L2VideoEncodeAccelerator::ReuseImageProcessorOutputBuffer(
     size_t output_buffer_index) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DVLOGF(4) << "output_buffer_index=" << output_buffer_index;
   free_image_processor_output_buffer_indices_.push_back(output_buffer_index);
   InputImageProcessorTask();
 }

 // Copies |bitstream_size| bytes of encoded data at |bitstream_data| into the
 // shared memory of |buffer_ref| and returns the number of bytes written.
 //
 // When |inject_sps_and_pps_| is false the data is copied verbatim; if it does
 // not fit, nothing is copied and 0 is returned.
 //
 // Otherwise the data is parsed as H.264: every NALU is rewritten with a
 // start code in front, the most recent SPS and PPS are cached, and the cached
 // pair is additionally emitted in front of each IDR slice. Copying stops at
 // the first NALU that does not fit, so the output may be truncated.
 //
 // |buffer_ref| is taken by value and is therefore destroyed when this function
 // returns.
 size_t V4L2VideoEncodeAccelerator::CopyIntoOutputBuffer(
     const uint8_t* bitstream_data,
     size_t bitstream_size,
     std::unique_ptr<BitstreamBufferRef> buffer_ref) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   // Write cursor and remaining capacity; both are advanced by
   // CopyNALUPrependingStartCode().
   uint8_t* dst_ptr = static_cast<uint8_t*>(buffer_ref->shm->memory());
   size_t remaining_dst_size = buffer_ref->shm->size();

   if (!inject_sps_and_pps_) {
     if (bitstream_size <= remaining_dst_size) {
       memcpy(dst_ptr, bitstream_data, bitstream_size);
       return bitstream_size;
     } else {
       VLOGF(1) << "Output data did not fit in the BitstreamBuffer";
       return 0;
     }
   }

   // Cache the newest SPS and PPS found in the stream, and inject them before
   // each IDR found.
   H264Parser parser;
   parser.SetStream(bitstream_data, bitstream_size);
   H264NALU nalu;

   while (parser.AdvanceToNextNALU(&nalu) == H264Parser::kOk) {
     // nalu.size is always without the start code, regardless of the NALU type.
     if (nalu.size + kH264StartCodeSize > remaining_dst_size) {
       VLOGF(1) << "Output data did not fit in the BitstreamBuffer";
       break;
     }

     switch (nalu.nal_unit_type) {
       case H264NALU::kSPS:
         cached_sps_.resize(nalu.size);
         memcpy(cached_sps_.data(), nalu.data, nalu.size);
         // Size of SPS + PPS as they would be injected, start codes included.
         cached_h264_header_size_ =
             cached_sps_.size() + cached_pps_.size() + 2 * kH264StartCodeSize;
         break;

       case H264NALU::kPPS:
         cached_pps_.resize(nalu.size);
         memcpy(cached_pps_.data(), nalu.data, nalu.size);
         cached_h264_header_size_ =
             cached_sps_.size() + cached_pps_.size() + 2 * kH264StartCodeSize;
         break;

       case H264NALU::kIDRSlice:
         // Only inject if we have both headers cached, and enough space for both
         // the headers and the NALU itself.
         // NOTE(review): the message below is also logged when a header is
         // simply not cached yet, not only when space is short.
         if (cached_sps_.empty() || cached_pps_.empty() ||
             cached_h264_header_size_ + nalu.size + kH264StartCodeSize >
                 remaining_dst_size) {
           VLOGF(1) << "Not enough space to inject a stream header before IDR";
           break;
         }

         CopyNALUPrependingStartCode(cached_sps_.data(), cached_sps_.size(),
                                     &dst_ptr, &remaining_dst_size);
         CopyNALUPrependingStartCode(cached_pps_.data(), cached_pps_.size(),
                                     &dst_ptr, &remaining_dst_size);
         VLOGF(2) << "Stream header injected before IDR";
         break;
     }

     // Every NALU, including SPS/PPS/IDR handled above, is copied to the output.
     CopyNALUPrependingStartCode(nalu.data, nalu.size, &dst_ptr,
                                 &remaining_dst_size);
   }

   // Bytes written = total capacity minus what is left.
   return buffer_ref->shm->size() - remaining_dst_size;
 }

 // Encoder-thread half of Encode(). Also called by FlushTask() with a null
 // |frame|, which marks a flush request.
 // Reconfigures the input format if |frame|'s size requires it, lazily creates
 // the input buffers on the first real frame, and then queues the frame either
 // for the image processor or directly for the encoder.
 void V4L2VideoEncodeAccelerator::EncodeTask(scoped_refptr<VideoFrame> frame,
                                             bool force_keyframe) {
   DVLOGF(4) << "force_keyframe=" << force_keyframe;
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK_NE(encoder_state_, kUninitialized);

   if (encoder_state_ == kError) {
     DVLOGF(1) << "early out: kError state";
     return;
   }

   // Skipped for the null (flush) frame, which has no format or size.
   if (frame &&
       !ReconfigureFormatIfNeeded(frame->format(), frame->coded_size())) {
     NOTIFY_ERROR(kInvalidArgumentError);
     encoder_state_ = kError;
     return;
   }

   // If a video frame to be encoded is fed, then call VIDIOC_REQBUFS if it has
   // not been called yet.
   if (frame && input_buffer_map_.empty() && !CreateInputBuffers())
     return;

   if (image_processor_) {
     // The frame must be converted first; FrameProcessed() moves the result to
     // |encoder_input_queue_|.
     image_processor_input_queue_.emplace(std::move(frame), force_keyframe);
     InputImageProcessorTask();
   } else {
     encoder_input_queue_.emplace(std::move(frame), force_keyframe);
     Enqueue();
   }
 }

 // Checks whether an incoming frame of |format| and coded size |new_frame_size|
 // matches the currently configured input and, if not, reconfigures the input
 // side: the image processor is recreated when one is in use, otherwise the
 // device input format is renegotiated.
 // Reconfiguration is only possible before input buffers exist
 // (|input_buffer_map_| empty). Returns true when no change was needed or the
 // change succeeded; false otherwise, in which case an error has usually been
 // reported through NOTIFY_ERROR already.
 bool V4L2VideoEncodeAccelerator::ReconfigureFormatIfNeeded(
     VideoPixelFormat format,
     const gfx::Size& new_frame_size) {
   // We should apply the frame size change to ImageProcessor if there is.
   if (image_processor_) {
     // Stride is the same. There is no need of executing S_FMT again.
     if (image_processor_->input_layout().coded_size() == new_frame_size) {
       return true;
     }

     // NOTE(review): the "previous size" logged here is the device input size,
     // while the comparison above is against the image processor input size.
     VLOGF(2) << "Call S_FMT with a new size=" << new_frame_size.ToString()
              << ", the previous size ="
              << device_input_layout_->coded_size().ToString();
     if (!input_buffer_map_.empty()) {
       VLOGF(1) << "Input frame size is changed during encoding";
       NOTIFY_ERROR(kInvalidArgumentError);
       return false;
     }

     // TODO(hiroh): Decide the appropriate planar in some way.
     auto input_layout = VideoFrameLayout::CreateMultiPlanar(
         format, new_frame_size,
         std::vector<ColorPlaneLayout>(VideoFrame::NumPlanes(format)));
     if (!input_layout) {
       VLOGF(1) << "Invalid image processor input layout";
       return false;
     }

     // Replace the image processor with one accepting the new input size; the
     // encoder-facing output layout stays the same.
     if (!CreateImageProcessor(*input_layout, *device_input_layout_,
                               visible_size_)) {
       NOTIFY_ERROR(kPlatformFailureError);
       return false;
     }
     // The new processor must accept exactly the frame width the client uses.
     if (image_processor_->input_layout().coded_size().width() !=
         new_frame_size.width()) {
       NOTIFY_ERROR(kPlatformFailureError);
       return false;
     }

     return true;
   }

   // Here we should compare |device_input_layout_->coded_size()|. However, VEA
   // requests a client |input_allocated_size_|, which might be a larger size
   // than |device_input_layout_->coded_size()|. The size is larger if there is
   // an extra data in planes, that happens on MediaTek.
   // This comparison will work because VEAClient within Chrome gives the buffer
   // whose frame size as |input_allocated_size_|. VEAClient for ARC++ might give
   // a different frame size but |input_allocated_size_| is always the same as
   // |device_input_layout_->coded_size()|.
   if (new_frame_size != input_allocated_size_) {
     VLOGF(2) << "Call S_FMT with a new size=" << new_frame_size.ToString()
              << ", the previous size ="
              << device_input_layout_->coded_size().ToString()
              << " (the size requested to client="
              << input_allocated_size_.ToString();
     if (!input_buffer_map_.empty()) {
       VLOGF(1) << "Input frame size is changed during encoding";
       NOTIFY_ERROR(kInvalidArgumentError);
       return false;
     }
     // Keep the pixel format and renegotiate only the size with the device.
     if (!NegotiateInputFormat(device_input_layout_->format(), new_frame_size)) {
       NOTIFY_ERROR(kPlatformFailureError);
       return false;
     }
     // The device must have accepted exactly the requested width.
     if (device_input_layout_->coded_size().width() != new_frame_size.width()) {
       NOTIFY_ERROR(kPlatformFailureError);
       return false;
     }
   }

   return true;
 }

 void V4L2VideoEncodeAccelerator::InputImageProcessorTask() {
   if (free_image_processor_output_buffer_indices_.empty())
     return;
   if (image_processor_input_queue_.empty())
     return;
   const size_t output_buffer_index =
       free_image_processor_output_buffer_indices_.back();
   free_image_processor_output_buffer_indices_.pop_back();

   InputFrameInfo frame_info = std::move(image_processor_input_queue_.front());
   image_processor_input_queue_.pop();
   auto frame = std::move(frame_info.frame);
   const bool force_keyframe = frame_info.force_keyframe;
   auto timestamp = frame->timestamp();
   if (image_processor_->output_mode() == ImageProcessor::OutputMode::IMPORT) {
     const auto& buf = image_processor_output_buffers_[output_buffer_index];
     auto output_frame = VideoFrame::WrapVideoFrame(
         buf, buf->format(), buf->visible_rect(), buf->natural_size());

     // Unretained(this) is safe here, because image_processor is destroyed
     // before video_encoder_thread stops.
     if (!image_processor_->Process(
             std::move(frame), std::move(output_frame),
             BindToCurrentLoop(
                 base::BindOnce(&V4L2VideoEncodeAccelerator::FrameProcessed,
                                base::Unretained(this), force_keyframe,
                                timestamp, output_buffer_index)))) {
       NOTIFY_ERROR(kPlatformFailureError);
     }
   } else {
     if (!image_processor_->Process(
             std::move(frame),
             BindToCurrentLoop(base::BindOnce(
                 &V4L2VideoEncodeAccelerator::FrameProcessed,
                 base::Unretained(this), force_keyframe, timestamp)))) {
       NOTIFY_ERROR(kPlatformFailureError);
     }
   }
 }

 // Encoder-thread half of UseOutputBitstreamBuffer(). Validates and maps
 // |buffer|, adds it to |bitstream_buffer_pool_| and, when this happens in
 // kInitialized state, starts device polling and switches to kEncoding.
 void V4L2VideoEncodeAccelerator::UseOutputBitstreamBufferTask(
     BitstreamBuffer buffer) {
   DVLOGF(4) << "id=" << buffer.id();
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   // The buffer must be able to hold a full encoder output buffer.
   if (buffer.size() < output_buffer_byte_size_) {
     NOTIFY_ERROR(kInvalidArgumentError);
     return;
   }
   auto shm = std::make_unique<UnalignedSharedMemory>(buffer.TakeRegion(),
                                                      buffer.size(), false);
   if (!shm->MapAt(buffer.offset(), buffer.size())) {
     NOTIFY_ERROR(kPlatformFailureError);
     return;
   }

   bitstream_buffer_pool_.push_back(
       std::make_unique<BitstreamBufferRef>(buffer.id(), std::move(shm)));
   PumpBitstreamBuffers();

   // Device polling is started once, while still in kInitialized state.
   if (encoder_state_ == kInitialized) {
     if (!StartDevicePoll())
       return;
     encoder_state_ = kEncoding;
   }
 }

 // Stops device polling, puts the encoder into kError state and, when running
 // on the encoder thread, releases the buffers, queues and image processor.
 // Destroy() calls this directly on the child thread when the encoder thread is
 // not running; in that case the encoder-thread resources are left untouched.
 void V4L2VideoEncodeAccelerator::DestroyTask() {
   VLOGF(2);

   // DestroyTask() should run regardless of encoder_state_.

   // Stop streaming and the device_poll_thread_.
   StopDevicePoll();

   // Set our state to kError, and early-out all tasks.
   encoder_state_ = kError;

   if (encoder_thread_.task_runner() &&
       encoder_thread_.task_runner()->BelongsToCurrentThread()) {
     DestroyInputBuffers();
     DestroyOutputBuffers();
     input_queue_ = nullptr;
     output_queue_ = nullptr;
     image_processor_ = nullptr;
   }
 }

 // One iteration of the device service loop, run on the encoder thread:
 // dequeues what the device has finished, enqueues what is waiting, clears the
 // poll interrupt and schedules the next DevicePollTask() on the poll thread.
 // Does nothing once the encoder is in kError state.
 void V4L2VideoEncodeAccelerator::ServiceDeviceTask() {
   DVLOGF(3);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK_NE(encoder_state_, kUninitialized);
   DCHECK_NE(encoder_state_, kInitialized);

   if (encoder_state_ == kError) {
     DVLOGF(1) << "early out: kError state";
     return;
   }

   Dequeue();
   Enqueue();

   // Clear the interrupt fd.
   if (!device_->ClearDevicePollInterrupt())
     return;

   // Device can be polled as soon as either input or output buffers are queued.
   bool poll_device = (input_queue_->QueuedBuffersCount() +
                           output_queue_->QueuedBuffersCount() >
                       0);

   // ServiceDeviceTask() should only ever be scheduled from DevicePollTask(),
   // so either:
   // * device_poll_thread_ is running normally
   // * device_poll_thread_ scheduled us, but then a DestroyTask() shut it down,
   //   in which case we're in kError state, and we should have early-outed
   //   already.
   DCHECK(device_poll_thread_.task_runner());
   // Queue the DevicePollTask() now.
   device_poll_thread_.task_runner()->PostTask(
       FROM_HERE, base::BindOnce(&V4L2VideoEncodeAccelerator::DevicePollTask,
                                 base::Unretained(this), poll_device));

   // Pipeline snapshot:
   //   ENC[pending frames] => DEVICE[input free+queued/total ->
   //   output free+queued/total] => OUT[available bitstream buffers].
   DVLOGF(3) << "buffer counts: ENC[" << encoder_input_queue_.size()
             << "] => DEVICE[" << input_queue_->FreeBuffersCount() << "+"
             << input_queue_->QueuedBuffersCount() << "/"
             << input_buffer_map_.size() << "->"
             << output_queue_->FreeBuffersCount() << "+"
             << output_queue_->QueuedBuffersCount() << "/"
             << output_queue_->AllocatedBuffersCount() << "] => OUT["
             << bitstream_buffer_pool_.size() << "]";
 }

 void V4L2VideoEncodeAccelerator::Enqueue() {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   TRACE_EVENT0("media,gpu", "V4L2VEA::Enqueue");

   DVLOGF(4) << "free_input_buffers: " << input_queue_->FreeBuffersCount()
             << "input_queue: " << encoder_input_queue_.size();

   bool do_streamon = false;
   // Enqueue all the inputs we can.
   const size_t old_inputs_queued = input_queue_->QueuedBuffersCount();
   while (!encoder_input_queue_.empty() &&
          input_queue_->FreeBuffersCount() > 0) {
     // A null frame indicates a flush.
     if (encoder_input_queue_.front().frame == nullptr) {
       DVLOGF(3) << "All input frames needed to be flushed are enqueued.";
       encoder_input_queue_.pop();

       // If we are not streaming, the device is not running and there is no need
       // to call V4L2_ENC_CMD_STOP to request a flush. This also means there is
       // nothing left to process, so we can return flush success back to the
       // client.
       if (!input_queue_->IsStreaming()) {
         child_task_runner_->PostTask(
             FROM_HERE, base::BindOnce(std::move(flush_callback_), true));
         return;
       }
       struct v4l2_encoder_cmd cmd{};
       cmd.cmd = V4L2_ENC_CMD_STOP;
       if (device_->Ioctl(VIDIOC_ENCODER_CMD, &cmd) != 0) {
         VPLOGF(1) << "ioctl() failed: VIDIOC_ENCODER_CMD";
         NOTIFY_ERROR(kPlatformFailureError);
         child_task_runner_->PostTask(
             FROM_HERE, base::BindOnce(std::move(flush_callback_), false));
         return;
       }
       encoder_state_ = kFlushing;
       break;
     }
     if (!EnqueueInputRecord())
       return;
   }
   if (old_inputs_queued == 0 && input_queue_->QueuedBuffersCount() != 0) {
     // We just started up a previously empty queue.
     // Queue state changed; signal interrupt.
     if (!device_->SetDevicePollInterrupt())
       return;
     // Shall call VIDIOC_STREAMON if we haven't yet.
     do_streamon = !input_queue_->IsStreaming();
   }

   if (!input_queue_->IsStreaming() && !do_streamon) {
     // We don't have to enqueue any buffers in the output queue until we enqueue
     // buffers in the input queue. This enables to call S_FMT in Encode() on
     // the first frame.
     return;
   }

   // Enqueue all the outputs we can.
   const size_t old_outputs_queued = output_queue_->QueuedBuffersCount();
   while (output_queue_->FreeBuffersCount() > 0) {
     if (!EnqueueOutputRecord())
       return;
   }
   if (old_outputs_queued == 0 && output_queue_->QueuedBuffersCount() != 0) {
     // We just started up a previously empty queue.
     // Queue state changed; signal interrupt.
     if (!device_->SetDevicePollInterrupt())
       return;
   }

   // STREAMON in CAPTURE queue first and then OUTPUT queue.
   // This is a workaround of a tegra driver bug that STREAMON in CAPTURE queue
   // will never return (i.e. blocks |encoder_thread_| forever) if the STREAMON
   // in CAPTURE queue is called after STREAMON in OUTPUT queue.
   // Once nyan_kitty, which uses tegra driver, reaches EOL, crrev.com/c/1753982
   // should be reverted.
   if (do_streamon) {
     DCHECK(!output_queue_->IsStreaming() && !input_queue_->IsStreaming());
     // When VIDIOC_STREAMON can be executed in OUTPUT queue, it is fine to call
     // STREAMON in CAPTURE queue.
     output_queue_->Streamon();
     input_queue_->Streamon();
   }
 }

 void V4L2VideoEncodeAccelerator::Dequeue() {
   DVLOGF(4);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   TRACE_EVENT0("media,gpu", "V4L2VEA::Dequeue");

   // Dequeue completed input (VIDEO_OUTPUT) buffers, and recycle to the free
   // list.
   while (input_queue_->QueuedBuffersCount() > 0) {
     DVLOGF(4) << "inputs queued: " << input_queue_->QueuedBuffersCount();
     DCHECK(input_queue_->IsStreaming());

     auto ret = input_queue_->DequeueBuffer();
     if (!ret.first) {
       NOTIFY_ERROR(kPlatformFailureError);
       return;
     }
     if (!ret.second) {
       // We're just out of buffers to dequeue.
       break;
     }

     InputRecord& input_record = input_buffer_map_[ret.second->BufferId()];
     input_record.frame = nullptr;
     if (input_record.ip_output_buffer_index)
       ReuseImageProcessorOutputBuffer(*input_record.ip_output_buffer_index);
   }

   // Dequeue completed output (VIDEO_CAPTURE) buffers, and recycle to the
   // free list.  Notify the client that an output buffer is complete.
   bool buffer_dequeued = false;
   while (output_queue_->QueuedBuffersCount() > 0) {
     DCHECK(output_queue_->IsStreaming());

     auto ret = output_queue_->DequeueBuffer();
     if (!ret.first) {
       NOTIFY_ERROR(kPlatformFailureError);
       return;
     }
     if (!ret.second) {
       // We're just out of buffers to dequeue.
       break;
     }

     output_buffer_queue_.push_back(std::move(ret.second));
     buffer_dequeued = true;
   }

   if (buffer_dequeued)
     PumpBitstreamBuffers();
 }

 void V4L2VideoEncodeAccelerator::PumpBitstreamBuffers() {
   DVLOGF(4);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   while (!output_buffer_queue_.empty()) {
     auto output_buf = std::move(output_buffer_queue_.front());
     output_buffer_queue_.pop_front();

     size_t bitstream_size = base::checked_cast<size_t>(
         output_buf->GetPlaneBytesUsed(0) - output_buf->GetPlaneDataOffset(0));
     if (bitstream_size > 0) {
       if (bitstream_buffer_pool_.empty()) {
         DVLOGF(4) << "No free bitstream buffer, skip.";
         output_buffer_queue_.push_front(std::move(output_buf));
         return;
       }

       auto buffer_ref = std::move(bitstream_buffer_pool_.back());
       auto buffer_id = buffer_ref->id;
       bitstream_buffer_pool_.pop_back();

       size_t output_data_size = CopyIntoOutputBuffer(
           static_cast<const uint8_t*>(output_buf->GetPlaneMapping(0)) +
               output_buf->GetPlaneDataOffset(0),
           bitstream_size, std::move(buffer_ref));

       DVLOGF(4) << "returning buffer_id=" << buffer_id
                 << ", size=" << output_data_size
                 << ", key_frame=" << output_buf->IsKeyframe();
       child_task_runner_->PostTask(
           FROM_HERE,
           base::BindOnce(&Client::BitstreamBufferReady, client_, buffer_id,
                          BitstreamBufferMetadata(
                              output_data_size, output_buf->IsKeyframe(),
                              base::TimeDelta::FromMicroseconds(
                                  output_buf->GetTimeStamp().tv_usec +
                                  output_buf->GetTimeStamp().tv_sec *
                                      base::Time::kMicrosecondsPerSecond))));
     }

     if ((encoder_state_ == kFlushing) && output_buf->IsLast()) {
       // Notify client that flush has finished successfully. The flush callback
       // should be called after notifying the last buffer is ready.
       DVLOGF(3) << "Flush completed. Start the encoder again.";
       encoder_state_ = kEncoding;
       child_task_runner_->PostTask(
           FROM_HERE, base::BindOnce(std::move(flush_callback_), true));
       // Start the encoder again.
       struct v4l2_encoder_cmd cmd{};
       cmd.cmd = V4L2_ENC_CMD_START;
       IOCTL_OR_ERROR_RETURN(VIDIOC_ENCODER_CMD, &cmd);
     }
   }
 }

 // Queues the frame at the front of |encoder_input_queue_| on a free device
 // input (VIDEO_OUTPUT) buffer. Must run on |encoder_thread_| with a non-empty
 // |encoder_input_queue_| and at least one free input buffer.
 //
 // Requests a key frame first when the frame asks for one, fills in the
 // per-plane size/offset/bytesused fields for the buffer's memory type, and
 // queues the buffer. On success the frame is remembered in
 // |input_buffer_map_|, popped from |encoder_input_queue_| and true is
 // returned. On failure the frame stays in |encoder_input_queue_| and false is
 // returned; every failure except the NOTREACHED() memory-type branches also
 // puts the encoder into the error state.
 bool V4L2VideoEncodeAccelerator::EnqueueInputRecord() {
   DVLOGF(4);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK_GT(input_queue_->FreeBuffersCount(), 0u);
   DCHECK(!encoder_input_queue_.empty());
   TRACE_EVENT0("media,gpu", "V4L2VEA::EnqueueInputRecord");

   // Enqueue an input (VIDEO_OUTPUT) buffer.
   InputFrameInfo frame_info = encoder_input_queue_.front();
   if (frame_info.force_keyframe) {
     std::vector<struct v4l2_ext_control> ctrls;
     struct v4l2_ext_control ctrl{};
     ctrl.id = V4L2_CID_MPEG_VIDEO_FORCE_KEY_FRAME;
     ctrls.push_back(ctrl);
     if (!SetExtCtrls(ctrls)) {
       VLOGF(1) << "Failed requesting keyframe";
       NOTIFY_ERROR(kPlatformFailureError);
       return false;
     }
   }

   scoped_refptr<VideoFrame> frame = frame_info.frame;

   V4L2WritableBufferRef input_buf = input_queue_->GetFreeBuffer();
   DCHECK(input_buf.IsValid());
   // Remember the id now: |input_buf| is consumed when it is queued below.
   size_t buffer_id = input_buf.BufferId();

   // Split the frame timestamp into whole seconds plus remaining microseconds.
   struct timeval timestamp;
   timestamp.tv_sec = static_cast<time_t>(frame->timestamp().InSeconds());
   timestamp.tv_usec =
       frame->timestamp().InMicroseconds() -
       frame->timestamp().InSeconds() * base::Time::kMicrosecondsPerSecond;
   input_buf.SetTimeStamp(timestamp);

   DCHECK_EQ(device_input_layout_->format(), frame->format());
   size_t num_planes = V4L2Device::GetNumPlanesOfV4L2PixFmt(
       V4L2Device::VideoFrameLayoutToV4L2PixFmt(*device_input_layout_));

   // Create GpuMemoryBufferHandle for native_input_mode.
   gfx::GpuMemoryBufferHandle gmb_handle;
   if (input_buf.Memory() == V4L2_MEMORY_DMABUF) {
     gmb_handle = CreateGpuMemoryBufferHandle(frame.get());
     if (gmb_handle.is_null() || gmb_handle.type != gfx::NATIVE_PIXMAP) {
       VLOGF(1) << "Failed to create native GpuMemoryBufferHandle";
       NOTIFY_ERROR(kPlatformFailureError);
       return false;
     }
   }

   for (size_t i = 0; i < num_planes; ++i) {
     // Single-buffer input format may have multiple color planes, so bytesused
     // of the single buffer should be sum of each color planes' size.
     size_t bytesused = 0;
     if (num_planes == 1) {
       bytesused = VideoFrame::AllocationSize(
           frame->format(), device_input_layout_->coded_size());
     } else {
       bytesused = base::checked_cast<size_t>(
           VideoFrame::PlaneSize(frame->format(), i,
                                 device_input_layout_->coded_size())
               .GetArea());
     }

     switch (input_buf.Memory()) {
       case V4L2_MEMORY_USERPTR:
         // Use buffer_size VideoEncodeAccelerator HW requested by S_FMT.
         input_buf.SetPlaneSize(i, device_input_layout_->planes()[i].size);
         break;

       case V4L2_MEMORY_DMABUF: {
         const std::vector<gfx::NativePixmapPlane>& planes =
             gmb_handle.native_pixmap_handle.planes;
         // TODO(crbug.com/901264): The way to pass an offset within a DMA-buf is
         // not defined in V4L2 specification, so we abuse data_offset for now.
         // Fix it when we have the right interface, including any necessary
         // validation and potential alignment
         input_buf.SetPlaneDataOffset(i, planes[i].offset);
         bytesused += planes[i].offset;
         // Workaround: filling length should not be needed. This is a bug of
         // videobuf2 library.
         input_buf.SetPlaneSize(
             i, device_input_layout_->planes()[i].size + planes[i].offset);
         break;
       }
       default:
         NOTREACHED();
         return false;
     }

     input_buf.SetPlaneBytesUsed(i, bytesused);
   }

   // Queue the buffer. A buffer the device rejected must not be recorded as
   // in flight, so a queueing failure is reported instead of being ignored.
   switch (input_buf.Memory()) {
     case V4L2_MEMORY_USERPTR: {
       std::vector<void*> user_ptrs;
       for (size_t i = 0; i < num_planes; ++i)
         user_ptrs.push_back(frame->data(i));
       if (!std::move(input_buf).QueueUserPtr(std::move(user_ptrs))) {
         VLOGF(1) << "Failed to queue a USERPTR buffer to input queue";
         NOTIFY_ERROR(kPlatformFailureError);
         return false;
       }
       break;
     }
     case V4L2_MEMORY_DMABUF: {
       if (!std::move(input_buf).QueueDMABuf(
               gmb_handle.native_pixmap_handle.planes)) {
         VLOGF(1) << "Failed to queue a DMABUF buffer to input queue";
         NOTIFY_ERROR(kPlatformFailureError);
         return false;
       }
       break;
     }
     default:
       NOTREACHED() << "Unknown input memory type: "
                    << static_cast<int>(input_buf.Memory());
       return false;
   }

   // Keep |gmb_handle| alive as long as |frame| is alive so that fds passed
   // to the driver are valid during encoding.
   frame->AddDestructionObserver(
       base::BindOnce([](gfx::GpuMemoryBufferHandle) {}, std::move(gmb_handle)));

   InputRecord& input_record = input_buffer_map_[buffer_id];
   input_record.frame = frame;
   input_record.ip_output_buffer_index = frame_info.ip_output_buffer_index;
   encoder_input_queue_.pop();
   return true;
 }

 bool V4L2VideoEncodeAccelerator::EnqueueOutputRecord() {
   DVLOGF(4);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK_GT(output_queue_->FreeBuffersCount(), 0u);
   TRACE_EVENT0("media,gpu", "V4L2VEA::EnqueueOutputRecord");

   // Enqueue an output (VIDEO_CAPTURE) buffer.
   V4L2WritableBufferRef output_buf = output_queue_->GetFreeBuffer();
   DCHECK(output_buf.IsValid());
   if (!std::move(output_buf).QueueMMap()) {
     VLOGF(1) << "Failed to QueueMMap.";
     return false;
   }
   return true;
 }

 // Starts |device_poll_thread_| and posts its first DevicePollTask(). Must run
 // on |encoder_thread_| while the poll thread is not running. Returns false,
 // after putting the encoder into the error state, if the thread cannot be
 // started.
 bool V4L2VideoEncodeAccelerator::StartDevicePoll() {
   DVLOGF(3);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(!device_poll_thread_.IsRunning());

   const bool poll_thread_started = device_poll_thread_.Start();
   if (!poll_thread_started) {
     VLOGF(1) << "StartDevicePoll(): Device thread failed to start";
     NOTIFY_ERROR(kPlatformFailureError);
     return false;
   }

   // The first poll task gets no device to poll on, so it waits only on the
   // interrupt fd.
   constexpr bool kPollDevice = false;
   device_poll_thread_.task_runner()->PostTask(
       FROM_HERE, base::BindOnce(&V4L2VideoEncodeAccelerator::DevicePollTask,
                                 base::Unretained(this), kPollDevice));
   return true;
 }

 bool V4L2VideoEncodeAccelerator::StopDevicePoll() {
   DVLOGF(3);

   // Signal the DevicePollTask() to stop, and stop the device poll thread.
   if (!device_->SetDevicePollInterrupt())
     return false;
   device_poll_thread_.Stop();
   // Clear the interrupt now, to be sure.
   if (!device_->ClearDevicePollInterrupt())
     return false;

   // Tegra driver cannot call Streamoff() when the stream is off, so we check
   // IsStreaming() first.
   if (input_queue_ && input_queue_->IsStreaming() && !input_queue_->Streamoff())
     return false;

   if (output_queue_ && output_queue_->IsStreaming() &&
       !output_queue_->Streamoff())
     return false;

   // Reset all our accounting info.
   while (!encoder_input_queue_.empty())
     encoder_input_queue_.pop();
   for (size_t i = 0; i < input_buffer_map_.size(); ++i) {
     InputRecord& input_record = input_buffer_map_[i];
     input_record.frame = nullptr;
   }

   bitstream_buffer_pool_.clear();

   DVLOGF(3) << "device poll stopped";
   return true;
 }

 // Runs on |device_poll_thread_|: waits in V4L2Device::Poll() and then posts
 // ServiceDeviceTask() to |encoder_thread_|. |poll_device| is forwarded to
 // Poll(). A poll failure puts the encoder into the error state and no service
 // task is posted.
 void V4L2VideoEncodeAccelerator::DevicePollTask(bool poll_device) {
   DVLOGF(4);
   DCHECK(device_poll_thread_.task_runner()->BelongsToCurrentThread());

   // Filled in by Poll(); the value is not used here.
   bool event_pending = false;
   const bool poll_succeeded = device_->Poll(poll_device, &event_pending);
   if (!poll_succeeded) {
     NOTIFY_ERROR(kPlatformFailureError);
     return;
   }

   // Encoder state must not be touched from this thread, so all processing is
   // deferred to ServiceDeviceTask() on the encoder thread.
   auto service_task = base::BindOnce(
       &V4L2VideoEncodeAccelerator::ServiceDeviceTask, base::Unretained(this));
   encoder_thread_.task_runner()->PostTask(FROM_HERE, std::move(service_task));
 }

 // Reports |error| to the client. When called off the child thread the call
 // re-posts itself to |child_task_runner_| through |weak_this_|. After the
 // client has been notified, |client_ptr_factory_| is reset.
 void V4L2VideoEncodeAccelerator::NotifyError(Error error) {
   VLOGF(1) << "error=" << error;

   if (child_task_runner_->BelongsToCurrentThread()) {
     if (!client_)
       return;
     client_->NotifyError(error);
     client_ptr_factory_.reset();
     return;
   }

   // Wrong thread: bounce the notification over to the child thread.
   child_task_runner_->PostTask(
       FROM_HERE, base::BindOnce(&V4L2VideoEncodeAccelerator::NotifyError,
                                 weak_this_, error));
 }

 // Moves the encoder into kError and, if it was already initialized and not
 // yet in kError, forwards |error| to NotifyError(). When the encoder thread
 // has a task runner and this is called from another thread, the call is
 // re-posted to the encoder thread.
 void V4L2VideoEncodeAccelerator::SetErrorState(Error error) {
   // We can touch encoder_state_ only if this is the encoder thread or the
   // encoder thread isn't running.
   scoped_refptr<base::SingleThreadTaskRunner> encoder_runner =
       encoder_thread_.task_runner();
   const bool must_hop_to_encoder_thread =
       encoder_runner && !encoder_runner->BelongsToCurrentThread();
   if (must_hop_to_encoder_thread) {
     encoder_runner->PostTask(
         FROM_HERE, base::BindOnce(&V4L2VideoEncodeAccelerator::SetErrorState,
                                   base::Unretained(this), error));
     return;
   }

   // Post NotifyError only if we are already initialized, as the API does
   // not allow doing so before that. An encoder already in kError is not
   // notified again.
   const bool should_notify_client =
       encoder_state_ != kError && encoder_state_ != kUninitialized;
   if (should_notify_client)
     NotifyError(error);

   encoder_state_ = kError;
 }

 void V4L2VideoEncodeAccelerator::RequestEncodingParametersChangeTask(
     uint32_t bitrate,
     uint32_t framerate) {
   VLOGF(2) << "bitrate=" << bitrate << ", framerate=" << framerate;
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   TRACE_EVENT2("media,gpu", "V4L2VEA::RequestEncodingParametersChangeTask",
                "bitrate", bitrate, "framerate", framerate);

   DCHECK_GT(bitrate, 0u);
   DCHECK_GT(framerate, 0u);

   std::vector<struct v4l2_ext_control> ctrls;
   struct v4l2_ext_control ctrl{};
   ctrl.id = V4L2_CID_MPEG_VIDEO_BITRATE;
   ctrl.value = bitrate;
   ctrls.push_back(ctrl);
   if (!SetExtCtrls(ctrls)) {
     VLOGF(1) << "Failed changing bitrate";
     NOTIFY_ERROR(kPlatformFailureError);
     return;
   }

   struct v4l2_streamparm parms{};
   parms.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
   // Note that we are provided "frames per second" but V4L2 expects "time per
   // frame"; hence we provide the reciprocal of the framerate here.
   parms.parm.output.timeperframe.numerator = 1;
   parms.parm.output.timeperframe.denominator = framerate;
   IOCTL_OR_ERROR_RETURN(VIDIOC_S_PARM, &parms);
 }

 // Configures the CAPTURE (encoded bitstream) queue format from
 // |visible_size_| and |output_format_fourcc_| and stores the buffer size the
 // driver settled on in |output_buffer_byte_size_|. |output_profile| is not
 // used here. Must run on |encoder_thread_| while neither queue is streaming.
 // Returns false if VIDIOC_S_FMT fails.
 bool V4L2VideoEncodeAccelerator::SetOutputFormat(
     VideoCodecProfile output_profile) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(!input_queue_->IsStreaming());
   DCHECK(!output_queue_->IsStreaming());

   DCHECK(!visible_size_.IsEmpty());
   output_buffer_byte_size_ = GetEncodeBitstreamBufferSize(visible_size_);

   struct v4l2_format format{};
   format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;

   auto& pix_mp = format.fmt.pix_mp;
   pix_mp.width = visible_size_.width();
   pix_mp.height = visible_size_.height();
   pix_mp.pixelformat = output_format_fourcc_;
   pix_mp.num_planes = 1;
   pix_mp.plane_fmt[0].sizeimage =
       base::checked_cast<__u32>(output_buffer_byte_size_);

   IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format);
   DCHECK_EQ(format.fmt.pix_mp.pixelformat, output_format_fourcc_);

   // Device might have adjusted the required output size.
   output_buffer_byte_size_ =
       base::checked_cast<size_t>(pix_mp.plane_fmt[0].sizeimage);
   return true;
 }

 // Finds an input pixel format the device accepts for frames of |size|. The
 // V4L2 format derived from |input_format| is tried first, followed by the
 // device's preferred encoder input formats. The first format accepted by
 // VIDIOC_S_FMT decides the outcome: on success |device_input_layout_| and
 // |input_allocated_size_| are updated and true is returned; false is returned
 // if its layout is invalid, if its coded size cannot contain |size|, or if no
 // candidate is accepted at all.
 bool V4L2VideoEncodeAccelerator::NegotiateInputFormat(
     VideoPixelFormat input_format,
     const gfx::Size& size) {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(!input_queue_->IsStreaming());
   DCHECK(!output_queue_->IsStreaming());

   std::vector<uint32_t> candidates;

   // First see if the device can use the provided format directly.
   const uint32_t requested_pix_fmt =
       Fourcc::FromVideoPixelFormat(input_format, false).ToV4L2PixFmt();
   if (requested_pix_fmt)
     candidates.push_back(requested_pix_fmt);

   // Second try preferred input formats for both single-planar and
   // multi-planar.
   for (auto preferred_pix_fmt :
        device_->PreferredInputFormat(V4L2Device::Type::kEncoder)) {
     candidates.push_back(preferred_pix_fmt);
   }

   for (const auto candidate : candidates) {
     size_t planes_count = V4L2Device::GetNumPlanesOfV4L2PixFmt(candidate);
     DCHECK_GT(planes_count, 0u);
     DCHECK_LE(planes_count, static_cast<size_t>(VIDEO_MAX_PLANES));
     DVLOGF(3) << "Trying S_FMT with " << FourccToString(candidate);

     struct v4l2_format format{};
     format.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
     format.fmt.pix_mp.width = size.width();
     format.fmt.pix_mp.height = size.height();
     format.fmt.pix_mp.pixelformat = candidate;
     format.fmt.pix_mp.num_planes = planes_count;

     // Move on to the next candidate if the ioctl fails or the driver
     // substituted a different pixel format.
     if (device_->Ioctl(VIDIOC_S_FMT, &format) != 0 ||
         format.fmt.pix_mp.pixelformat != candidate) {
       continue;
     }

     DVLOGF(3) << "Success: S_FMT with " << FourccToString(candidate);
     device_input_layout_ = V4L2Device::V4L2FormatToVideoFrameLayout(format);
     if (!device_input_layout_) {
       VLOGF(1) << "Invalid device_input_layout_";
       return false;
     }
     DVLOG(3) << "Negotiated device_input_layout_: " << *device_input_layout_;

     const gfx::Rect coded_rect(device_input_layout_->coded_size());
     if (!coded_rect.Contains(gfx::Rect(size))) {
       VLOGF(1) << "Input size " << size.ToString()
                << " exceeds encoder capability. Size encoder can handle: "
                << device_input_layout_->coded_size().ToString();
       return false;
     }

     // TODO(crbug.com/914700): Remove this once
     // Client::RequireBitstreamBuffers uses input's VideoFrameLayout to
     // allocate input buffer.
     input_allocated_size_ = V4L2Device::AllocatedSizeFromV4L2Format(format);
     return true;
   }

   return false;
 }

 // Sets up the output and input formats and then the crop rectangle. The crop
 // is applied with VIDIOC_S_SELECTION, falling back to VIDIOC_S_CROP /
 // VIDIOC_G_CROP when that ioctl fails. |visible_size_| is updated with the
 // rectangle the driver reports back. Must run on |encoder_thread_| while
 // neither queue is streaming. Returns false if any format step or the crop
 // fallback fails.
 bool V4L2VideoEncodeAccelerator::SetFormats(VideoPixelFormat input_format,
                                             VideoCodecProfile output_profile) {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(!input_queue_->IsStreaming());
   DCHECK(!output_queue_->IsStreaming());

   // The output format has to be set before the input format is negotiated.
   const bool formats_set = SetOutputFormat(output_profile) &&
                            NegotiateInputFormat(input_format, visible_size_);
   if (!formats_set)
     return false;

   // Requested crop: the whole visible area, anchored at the origin.
   struct v4l2_rect requested_rect{};
   requested_rect.left = 0;
   requested_rect.top = 0;
   requested_rect.width = visible_size_.width();
   requested_rect.height = visible_size_.height();

   struct v4l2_selection selection_arg{};
   selection_arg.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
   selection_arg.target = V4L2_SEL_TGT_CROP;
   selection_arg.r = requested_rect;

   // The width and height might be adjusted by driver.
   // Need to read it back and set to visible_size_.
   struct v4l2_rect adjusted_rect{};
   const bool selection_supported =
       device_->Ioctl(VIDIOC_S_SELECTION, &selection_arg) == 0;
   if (selection_supported) {
     DVLOGF(2) << "VIDIOC_S_SELECTION is supported";
     adjusted_rect = selection_arg.r;
   } else {
     VLOGF(2) << "Fallback to VIDIOC_S/G_CROP";
     struct v4l2_crop crop{};
     crop.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
     crop.c = requested_rect;
     IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_CROP, &crop);
     IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_G_CROP, &crop);
     adjusted_rect = crop.c;
   }

   visible_size_.SetSize(adjusted_rect.width, adjusted_rect.height);
   VLOGF(2) << "After adjusted by driver, visible_size_="
            << visible_size_.ToString();

   return true;
 }

 bool V4L2VideoEncodeAccelerator::IsCtrlExposed(uint32_t ctrl_id) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   struct v4l2_queryctrl query_ctrl{};
   query_ctrl.id = ctrl_id;

   return device_->Ioctl(VIDIOC_QUERYCTRL, &query_ctrl) == 0;
 }

 // Applies |ctrls| to the device in one VIDIOC_S_EXT_CTRLS call using the MPEG
 // control class. Must run on |encoder_thread_|. Returns true if the ioctl
 // succeeds.
 bool V4L2VideoEncodeAccelerator::SetExtCtrls(
     std::vector<struct v4l2_ext_control> ctrls) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   struct v4l2_ext_controls ext_ctrls{};
   ext_ctrls.ctrl_class = V4L2_CTRL_CLASS_MPEG;
   ext_ctrls.count = ctrls.size();
   // data() is well defined for an empty vector, whereas &ctrls[0] is not.
   ext_ctrls.controls = ctrls.data();
   return device_->Ioctl(VIDIOC_S_EXT_CTRLS, &ext_ctrls) == 0;
 }

 bool V4L2VideoEncodeAccelerator::InitControls(const Config& config) {
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   std::vector<struct v4l2_ext_control> ctrls;
   struct v4l2_ext_control ctrl{};

   // Enable frame-level bitrate control. This is the only mandatory control.
   ctrl.id = V4L2_CID_MPEG_VIDEO_FRAME_RC_ENABLE;
   ctrl.value = 1;
   ctrls.push_back(ctrl);
   if (!SetExtCtrls(ctrls)) {
     VLOGF(1) << "Failed enabling bitrate control";
     NOTIFY_ERROR(kPlatformFailureError);
     return false;
   }

   ctrls.clear();
   if (output_format_fourcc_ == V4L2_PIX_FMT_H264) {
 #ifndef V4L2_CID_MPEG_VIDEO_H264_SPS_PPS_BEFORE_IDR
 #define V4L2_CID_MPEG_VIDEO_H264_SPS_PPS_BEFORE_IDR (V4L2_CID_MPEG_BASE + 388)
 #endif
     // Request to inject SPS and PPS before each IDR, if the device supports
     // that feature. Otherwise we'll have to cache and inject ourselves.
     if (IsCtrlExposed(V4L2_CID_MPEG_VIDEO_H264_SPS_PPS_BEFORE_IDR)) {
       memset(&ctrl, 0, sizeof(ctrl));
       ctrl.id = V4L2_CID_MPEG_VIDEO_H264_SPS_PPS_BEFORE_IDR;
       ctrl.value = 1;
       ctrls.push_back(ctrl);
       if (!SetExtCtrls(ctrls)) {
         NOTIFY_ERROR(kPlatformFailureError);
         return false;
       }
       ctrls.clear();
       inject_sps_and_pps_ = false;
       DVLOGF(2) << "Device supports injecting SPS+PPS before each IDR";
     } else {
       inject_sps_and_pps_ = true;
       DVLOGF(2) << "Will inject SPS+PPS before each IDR, unsupported by device";
     }

     // Optional controls.
     // No B-frames, for lowest decoding latency.
     memset(&ctrl, 0, sizeof(ctrl));
     ctrl.id = V4L2_CID_MPEG_VIDEO_B_FRAMES;
     ctrl.value = 0;
     ctrls.push_back(ctrl);

     // Quantization parameter maximum value (for variable bitrate control).
     memset(&ctrl, 0, sizeof(ctrl));
     ctrl.id = V4L2_CID_MPEG_VIDEO_H264_MAX_QP;
     ctrl.value = 51;
     ctrls.push_back(ctrl);

     // Set H.264 profile.
     int32_t profile_value =
         V4L2Device::VideoCodecProfileToV4L2H264Profile(config.output_profile);
     if (profile_value < 0) {
       NOTIFY_ERROR(kInvalidArgumentError);
       return false;
     }
     memset(&ctrl, 0, sizeof(ctrl));
     ctrl.id = V4L2_CID_MPEG_VIDEO_H264_PROFILE;
     ctrl.value = profile_value;
     ctrls.push_back(ctrl);

     // Set H.264 output level from config. Use Level 4.0 as fallback default.
     uint8_t h264_level =
         config.h264_output_level.value_or(H264SPS::kLevelIDC4p0);
     constexpr size_t kH264MacroblockSizeInPixels = 16;
     const uint32_t framerate = config.initial_framerate.value_or(
         VideoEncodeAccelerator::kDefaultFramerate);
     const uint32_t mb_width =
         base::bits::Align(config.input_visible_size.width(),
                           kH264MacroblockSizeInPixels) /
         kH264MacroblockSizeInPixels;
     const uint32_t mb_height =
         base::bits::Align(config.input_visible_size.height(),
                           kH264MacroblockSizeInPixels) /
         kH264MacroblockSizeInPixels;
     const uint32_t framesize_in_mbs = mb_width * mb_height;

     // Check whether the h264 level is valid.
     if (!CheckH264LevelLimits(config.output_profile, h264_level,
                               config.initial_bitrate, framerate,
                               framesize_in_mbs)) {
       base::Optional<uint8_t> valid_level =
           FindValidH264Level(config.output_profile, config.initial_bitrate,
                              framerate, framesize_in_mbs);
       if (!valid_level) {
         VLOGF(1) << "Could not find a valid h264 level for"
                  << " profile=" << config.output_profile
                  << " bitrate=" << config.initial_bitrate
                  << " framerate=" << framerate
                  << " size=" << config.input_visible_size.ToString();
         NOTIFY_ERROR(kInvalidArgumentError);
         return false;
       }

       h264_level = *valid_level;
     }

     int32_t level_value = V4L2Device::H264LevelIdcToV4L2H264Level(h264_level);
     memset(&ctrl, 0, sizeof(ctrl));
     ctrl.id = V4L2_CID_MPEG_VIDEO_H264_LEVEL;
     ctrl.value = level_value;
     ctrls.push_back(ctrl);

     // Ask not to put SPS and PPS into separate bitstream buffers.
     memset(&ctrl, 0, sizeof(ctrl));
     ctrl.id = V4L2_CID_MPEG_VIDEO_HEADER_MODE;
     ctrl.value = V4L2_MPEG_VIDEO_HEADER_MODE_JOINED_WITH_1ST_FRAME;
     ctrls.push_back(ctrl);
   }

   // Enable macroblock-level bitrate control.
   memset(&ctrl, 0, sizeof(ctrl));
   ctrl.id = V4L2_CID_MPEG_VIDEO_MB_RC_ENABLE;
   ctrl.value = 1;
   ctrls.push_back(ctrl);

   // Set GOP length, or default 0 to disable periodic key frames.
   memset(&ctrl, 0, sizeof(ctrl));
   ctrl.id = V4L2_CID_MPEG_VIDEO_GOP_SIZE;
   ctrl.value = config.gop_length.value_or(0);
   ctrls.push_back(ctrl);

   // Ignore return value as these controls are optional.
   SetExtCtrls(ctrls);

   // Optional Exynos specific controls.
   ctrls.clear();
   // Enable "tight" bitrate mode. For this to work properly, frame- and mb-level
   // bitrate controls have to be enabled as well.
   memset(&ctrl, 0, sizeof(ctrl));
   ctrl.id = V4L2_CID_MPEG_MFC51_VIDEO_RC_REACTION_COEFF;
   ctrl.value = 1;
   ctrls.push_back(ctrl);

   // Force bitrate control to average over a GOP (for tight bitrate
   // tolerance).
   memset(&ctrl, 0, sizeof(ctrl));
   ctrl.id = V4L2_CID_MPEG_MFC51_VIDEO_RC_FIXED_TARGET_BIT;
   ctrl.value = 1;
   ctrls.push_back(ctrl);

   // Ignore return value as these controls are optional.
   SetExtCtrls(ctrls);

   return true;
 }

 // Allocates kInputBufferCount input buffers of |input_memory_type_| and
 // sizes |input_buffer_map_| to the number of buffers actually allocated.
 // Must run on |encoder_thread_| while the input queue is not streaming.
 // Returns false if fewer buffers than requested were allocated.
 bool V4L2VideoEncodeAccelerator::CreateInputBuffers() {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(!input_queue_->IsStreaming());

   const auto allocated_count =
       input_queue_->AllocateBuffers(kInputBufferCount, input_memory_type_);
   if (allocated_count < kInputBufferCount) {
     VLOGF(1) << "Failed to allocate V4L2 input buffers.";
     return false;
   }

   // One bookkeeping record per allocated device buffer.
   DCHECK(input_buffer_map_.empty());
   input_buffer_map_.resize(input_queue_->AllocatedBuffersCount());
   return true;
 }

 // Allocates kOutputBufferCount MMAP output buffers. Must run on
 // |encoder_thread_| while the output queue is not streaming. Returns false if
 // fewer buffers than requested were allocated.
 bool V4L2VideoEncodeAccelerator::CreateOutputBuffers() {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());
   DCHECK(!output_queue_->IsStreaming());

   const auto allocated_count =
       output_queue_->AllocateBuffers(kOutputBufferCount, V4L2_MEMORY_MMAP);
   const bool enough_buffers = !(allocated_count < kOutputBufferCount);
   if (!enough_buffers) {
     VLOGF(1) << "Failed to allocate V4L2 output buffers.";
     return false;
   }
   return true;
 }

 // Releases the device input buffers and clears |input_buffer_map_|. Does
 // nothing when there is no input queue or it has no allocated buffers. Must
 // run on |encoder_thread_|; the queue is expected not to be streaming.
 void V4L2VideoEncodeAccelerator::DestroyInputBuffers() {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   const bool has_allocated_buffers =
       input_queue_ && input_queue_->AllocatedBuffersCount() != 0;
   if (!has_allocated_buffers)
     return;

   DCHECK(!input_queue_->IsStreaming());
   input_queue_->DeallocateBuffers();
   input_buffer_map_.clear();
 }

 // Releases the device output buffers. Does nothing when there is no output
 // queue or it has no allocated buffers. Must run on |encoder_thread_|; the
 // queue is expected not to be streaming.
 void V4L2VideoEncodeAccelerator::DestroyOutputBuffers() {
   VLOGF(2);
   DCHECK(encoder_thread_.task_runner()->BelongsToCurrentThread());

   const bool has_allocated_buffers =
       output_queue_ && output_queue_->AllocatedBuffersCount() != 0;
   if (!has_allocated_buffers)
     return;

   DCHECK(!output_queue_->IsStreaming());
   output_queue_->DeallocateBuffers();
 }

 }  // namespace media