media/gpu/v4l2/v4l2_slice_video_decode_accelerator.cc - chromium/src.git - Git at Google

 // Copyright 2015 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "media/gpu/v4l2/v4l2_slice_video_decode_accelerator.h"

 #include <errno.h>
 #include <fcntl.h>
 #include <linux/media.h>
 #include <linux/videodev2.h>
 #include <poll.h>
 #include <string.h>
 #include <sys/eventfd.h>
 #include <sys/ioctl.h>
 #include <sys/mman.h>

 #include <memory>

 #include "base/bind.h"
 #include "base/bind_helpers.h"
 #include "base/callback.h"
 #include "base/callback_helpers.h"
 #include "base/command_line.h"
 #include "base/memory/ptr_util.h"
 #include "base/numerics/safe_conversions.h"
 #include "base/single_thread_task_runner.h"
 #include "base/stl_util.h"
 #include "base/strings/stringprintf.h"
 #include "base/threading/thread_task_runner_handle.h"
 #include "base/time/time.h"
 #include "base/trace_event/memory_dump_manager.h"
 #include "base/trace_event/trace_event.h"
 #include "media/base/bind_to_current_loop.h"
 #include "media/base/media_switches.h"
 #include "media/base/unaligned_shared_memory.h"
 #include "media/base/video_types.h"
 #include "media/gpu/macros.h"
 #include "media/gpu/v4l2/v4l2_decode_surface.h"
 #include "media/gpu/v4l2/v4l2_h264_accelerator.h"
 #include "media/gpu/v4l2/v4l2_h264_accelerator_legacy.h"
 #include "media/gpu/v4l2/v4l2_vp8_accelerator.h"
 #include "media/gpu/v4l2/v4l2_vp9_accelerator.h"
 #include "ui/gl/gl_context.h"
 #include "ui/gl/gl_image.h"
 #include "ui/gl/scoped_binders.h"

 // Logs |x| and then calls SetErrorState(x). Only usable where SetErrorState()
 // is callable unqualified, i.e. inside member functions of this class.
 #define NOTIFY_ERROR(x)                       \
   do {                                        \
     VLOGF(1) << "Setting error state: " << x; \
     SetErrorState(x);                         \
   } while (0)

 // Issues ioctl |type| with |arg| on |device_|. If the call returns non-zero,
 // logs |type_str| and returns |value| from the enclosing function.
 #define IOCTL_OR_ERROR_RETURN_VALUE(type, arg, value, type_str) \
   do {                                                          \
     if (device_->Ioctl(type, arg) != 0) {                       \
       VPLOGF(1) << "ioctl() failed: " << type_str;              \
       return value;                                             \
     }                                                           \
   } while (0)

 // Variant for functions returning void: returns (with no value) on failure.
 #define IOCTL_OR_ERROR_RETURN(type, arg) \
   IOCTL_OR_ERROR_RETURN_VALUE(type, arg, ((void)0), #type)

 // Variant for functions returning bool: returns false on failure.
 #define IOCTL_OR_ERROR_RETURN_FALSE(type, arg) \
   IOCTL_OR_ERROR_RETURN_VALUE(type, arg, false, #type)

 // Issues ioctl |type| with |arg| on |device_| and only logs on failure;
 // control flow of the enclosing function is not affected.
 #define IOCTL_OR_LOG_ERROR(type, arg)           \
   do {                                          \
     if (device_->Ioctl(type, arg) != 0)         \
       VPLOGF(1) << "ioctl() failed: " << #type; \
   } while (0)

 namespace media {

 // static
 // V4L2 pixel formats (fourccs) of the compressed input streams listed as
 // supported by this accelerator: H.264 slices, VP8 frames and VP9 frames.
 const uint32_t V4L2SliceVideoDecodeAccelerator::supported_input_fourccs_[] = {
     V4L2_PIX_FMT_H264_SLICE, V4L2_PIX_FMT_VP8_FRAME, V4L2_PIX_FMT_VP9_FRAME,
 };

 // Creates an output record that is not yet associated with a client picture:
 // |picture_id| is -1, |texture_id| is 0, and the record has never been sent to
 // the client nor cleared.
 V4L2SliceVideoDecodeAccelerator::OutputRecord::OutputRecord()
     : num_times_sent_to_client(0),
       picture_id(-1),
       texture_id(0),
       cleared(false) {}

 // Output records are movable; the compiler-generated member-wise move is used.
 V4L2SliceVideoDecodeAccelerator::OutputRecord::OutputRecord(OutputRecord&&) =
     default;

 V4L2SliceVideoDecodeAccelerator::OutputRecord::~OutputRecord() = default;

 // Bookkeeping for one input bitstream buffer handed to the decoder. When the
 // record is destroyed and |input_id| is non-negative, the destructor posts
 // NotifyEndOfBitstreamBuffer(input_id) for |client| on |client_task_runner|.
 struct V4L2SliceVideoDecodeAccelerator::BitstreamBufferRef {
   BitstreamBufferRef(
       base::WeakPtr<VideoDecodeAccelerator::Client>& client,
       const scoped_refptr<base::SingleThreadTaskRunner>& client_task_runner,
       scoped_refptr<DecoderBuffer> buffer,
       int32_t input_id);
   ~BitstreamBufferRef();

   // Client to notify once this buffer is released.
   const base::WeakPtr<VideoDecodeAccelerator::Client> client;
   // Task runner on which the client notification is posted.
   const scoped_refptr<base::SingleThreadTaskRunner> client_task_runner;
   // The bitstream data itself; may be null (see DecodeTask()).
   scoped_refptr<DecoderBuffer> buffer;
   // Initialized to 0 by the constructor.
   // NOTE(review): presumably the number of bytes of |buffer| consumed so far
   // -- confirm against the users of this field.
   off_t bytes_used;
   // Identifier reported back to the client; negative ids are never reported.
   const int32_t input_id;
 };

 // Stores the client, its task runner, the buffer (taking over the passed-in
 // reference) and the id; |bytes_used| starts at 0.
 V4L2SliceVideoDecodeAccelerator::BitstreamBufferRef::BitstreamBufferRef(
     base::WeakPtr<VideoDecodeAccelerator::Client>& client,
     const scoped_refptr<base::SingleThreadTaskRunner>& client_task_runner,
     scoped_refptr<DecoderBuffer> buffer,
     int32_t input_id)
     : client(client),
       client_task_runner(client_task_runner),
       buffer(std::move(buffer)),
       bytes_used(0),
       input_id(input_id) {}

 // Tells the client that the bitstream buffer identified by |input_id| has been
 // released. Records carrying a negative id are dropped silently.
 V4L2SliceVideoDecodeAccelerator::BitstreamBufferRef::~BitstreamBufferRef() {
   if (input_id < 0)
     return;

   DVLOGF(5) << "returning input_id: " << input_id;
   // The notification is bound to the weak |client| pointer and posted to the
   // client's own task runner rather than invoked directly.
   client_task_runner->PostTask(
       FROM_HERE,
       base::BindOnce(
           &VideoDecodeAccelerator::Client::NotifyEndOfBitstreamBuffer, client,
           input_id));
 }

 // Pairs a Picture with a flag recording whether it has been cleared.
 V4L2SliceVideoDecodeAccelerator::PictureRecord::PictureRecord(
     bool cleared,
     const Picture& picture)
     : cleared(cleared), picture(picture) {}

 V4L2SliceVideoDecodeAccelerator::PictureRecord::~PictureRecord() {}

 // Constructs an uninitialized accelerator on top of |device|. The thread
 // calling the constructor becomes the child thread (|child_task_runner_|).
 // No device access happens here; see Initialize().
 //
 // |egl_display|, |bind_image_cb| and |make_context_current_cb| are stored for
 // later use. Initialize() runs without GL support when
 // |make_context_current_cb| is null.
 V4L2SliceVideoDecodeAccelerator::V4L2SliceVideoDecodeAccelerator(
     const scoped_refptr<V4L2Device>& device,
     EGLDisplay egl_display,
     const BindGLImageCallback& bind_image_cb,
     const MakeGLContextCurrentCallback& make_context_current_cb)
     : input_planes_count_(0),
       output_planes_count_(0),
       child_task_runner_(base::ThreadTaskRunnerHandle::Get()),
       device_(device),
       decoder_thread_("V4L2SliceVideoDecodeAcceleratorThread"),
       device_poll_thread_("V4L2SliceVideoDecodeAcceleratorDevicePollThread"),
       video_profile_(VIDEO_CODEC_PROFILE_UNKNOWN),
       input_format_fourcc_(0),
       output_format_fourcc_(0),
       state_(kUninitialized),
       output_mode_(Config::OutputMode::ALLOCATE),
       decoder_flushing_(false),
       decoder_resetting_(false),
       surface_set_change_pending_(false),
       picture_clearing_count_(0),
       egl_display_(egl_display),
       bind_image_cb_(bind_image_cb),
       make_context_current_cb_(make_context_current_cb),
       gl_image_format_fourcc_(0),
       gl_image_planes_count_(0),
       weak_this_factory_(this) {
   // Cache a weak pointer to this object; NotifyError() binds it when it
   // re-posts itself to the child thread.
   weak_this_ = weak_this_factory_.GetWeakPtr();
 }

 // Must run on the child thread. The DCHECKs below assert that both worker
 // threads have already been stopped and that requests and output buffers
 // have already been released by the time the object is destroyed.
 V4L2SliceVideoDecodeAccelerator::~V4L2SliceVideoDecodeAccelerator() {
   DVLOGF(2);

   DCHECK(child_task_runner_->BelongsToCurrentThread());
   DCHECK(!decoder_thread_.IsRunning());
   DCHECK(!device_poll_thread_.IsRunning());

   DCHECK(requests_.empty());
   DCHECK(output_buffer_map_.empty());
 }

 // Reports |error| to the client. May be called from any thread: when invoked
 // off the child thread, the call re-posts itself to the child thread (bound
 // to |weak_this_|) and returns.
 void V4L2SliceVideoDecodeAccelerator::NotifyError(Error error) {
   const bool on_child_thread = child_task_runner_->BelongsToCurrentThread();
   if (on_child_thread) {
     // Nothing to do if the client is already gone.
     if (!client_)
       return;

     // Deliver the error, then invalidate the client weak pointers by dropping
     // the factory that produced them.
     client_->NotifyError(error);
     client_ptr_factory_.reset();
     return;
   }

   // The client must only ever be notified from its own thread.
   child_task_runner_->PostTask(
       FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::NotifyError,
                                 weak_this_, error));
 }

 bool V4L2SliceVideoDecodeAccelerator::Initialize(const Config& config,
                                                  Client* client) {
   VLOGF(2) << "profile: " << config.profile;
   DCHECK(child_task_runner_->BelongsToCurrentThread());
   DCHECK_EQ(state_, kUninitialized);

   if (config.is_encrypted()) {
     NOTREACHED() << "Encrypted streams are not supported for this VDA";
     return false;
   }

   if (config.output_mode != Config::OutputMode::ALLOCATE &&
       config.output_mode != Config::OutputMode::IMPORT) {
     NOTREACHED() << "Only ALLOCATE and IMPORT OutputModes are supported";
     return false;
   }

   client_ptr_factory_.reset(
       new base::WeakPtrFactory<VideoDecodeAccelerator::Client>(client));
   client_ = client_ptr_factory_->GetWeakPtr();
   // If we haven't been set up to decode on separate thread via
   // TryToSetupDecodeOnSeparateThread(), use the main thread/client for
   // decode tasks.
   if (!decode_task_runner_) {
     decode_task_runner_ = child_task_runner_;
     DCHECK(!decode_client_);
     decode_client_ = client_;
   }

   // We need the context to be initialized to query extensions.
   if (make_context_current_cb_) {
     if (egl_display_ == EGL_NO_DISPLAY) {
       VLOGF(1) << "could not get EGLDisplay";
       return false;
     }

     if (!make_context_current_cb_.Run()) {
       VLOGF(1) << "could not make context current";
       return false;
     }

     if (!gl::g_driver_egl.ext.b_EGL_KHR_fence_sync) {
       VLOGF(1) << "context does not have EGL_KHR_fence_sync";
       return false;
     }
   } else {
     DVLOGF(2) << "No GL callbacks provided, initializing without GL support";
   }

   video_profile_ = config.profile;

   input_planes_count_ = 1;

   input_format_fourcc_ =
       V4L2Device::VideoCodecProfileToV4L2PixFmt(video_profile_, true);

   if (!device_->Open(V4L2Device::Type::kDecoder, input_format_fourcc_)) {
     VLOGF(1) << "Failed to open device for profile: " << config.profile
              << " fourcc: " << FourccToString(input_format_fourcc_);
     return false;
   }

   struct v4l2_requestbuffers reqbufs;
   memset(&reqbufs, 0, sizeof(reqbufs));
   reqbufs.count = 0;
   reqbufs.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
   reqbufs.memory = V4L2_MEMORY_MMAP;
   IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_REQBUFS, &reqbufs);
   if (reqbufs.capabilities & V4L2_BUF_CAP_SUPPORTS_REQUESTS) {
     supports_requests_ = true;
     VLOGF(1) << "Using request API";
     DCHECK(!media_fd_.is_valid());
     // Let's try to open the media device
     // TODO(crbug.com/985230): remove this hardcoding, replace with V4L2Device
     // integration.
     int media_fd = open("/dev/media-dec0", O_RDWR, 0);
     if (media_fd < 0) {
       VPLOGF(1) << "Failed to open media device: ";
       NOTIFY_ERROR(PLATFORM_FAILURE);
     }
     media_fd_ = base::ScopedFD(media_fd);
   } else {
     VLOGF(1) << "Using config store";
   }

   if (video_profile_ >= H264PROFILE_MIN && video_profile_ <= H264PROFILE_MAX) {
     if (supports_requests_) {
       decoder_.reset(new H264Decoder(
           std::make_unique<V4L2H264Accelerator>(this, device_.get())));
     } else {
       decoder_.reset(new H264Decoder(
           std::make_unique<V4L2LegacyH264Accelerator>(this, device_.get())));
     }
   } else if (video_profile_ >= VP8PROFILE_MIN &&
              video_profile_ <= VP8PROFILE_MAX) {
     decoder_.reset(new VP8Decoder(
         std::make_unique<V4L2VP8Accelerator>(this, device_.get())));
   } else if (video_profile_ >= VP9PROFILE_MIN &&
              video_profile_ <= VP9PROFILE_MAX) {
     decoder_.reset(new VP9Decoder(
         std::make_unique<V4L2VP9Accelerator>(this, device_.get())));
   } else {
     NOTREACHED() << "Unsupported profile " << GetProfileName(video_profile_);
     return false;
   }

   // Capabilities check.
   struct v4l2_capability caps;
   const __u32 kCapsRequired = V4L2_CAP_VIDEO_M2M_MPLANE | V4L2_CAP_STREAMING;
   IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYCAP, &caps);
   if ((caps.capabilities & kCapsRequired) != kCapsRequired) {
     VLOGF(1) << "ioctl() failed: VIDIOC_QUERYCAP"
              << ", caps check failed: 0x" << std::hex << caps.capabilities;
     return false;
   }

   if (!SetupFormats())
     return false;

   if (!decoder_thread_.Start()) {
     VLOGF(1) << "device thread failed to start";
     return false;
   }
   decoder_thread_task_runner_ = decoder_thread_.task_runner();
   base::trace_event::MemoryDumpManager::GetInstance()->RegisterDumpProvider(
       this, "media::V4l2SliceVideoDecodeAccelerator",
       decoder_thread_task_runner_);

   state_ = kInitialized;
   output_mode_ = config.output_mode;

   // InitializeTask will NOTIFY_ERROR on failure.
   decoder_thread_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::InitializeTask,
                      base::Unretained(this)));

   VLOGF(2) << "V4L2SliceVideoDecodeAccelerator initialized";
   return true;
 }

 // Decoder-thread half of initialization: acquires the V4L2 input (OUTPUT)
 // and output (CAPTURE) queues and allocates the input buffers. On success
 // the state becomes kDecoding. On failure the error is raised through
 // NOTIFY_ERROR and the state is not moved to kDecoding.
 void V4L2SliceVideoDecodeAccelerator::InitializeTask() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK_EQ(state_, kInitialized);
   TRACE_EVENT0("media,gpu", "V4L2SVDA::InitializeTask");

   if (IsDestroyPending())
     return;

   input_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE);
   output_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE);
   if (!input_queue_ || !output_queue_) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   if (!CreateInputBuffers()) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     // Stop here so the assignment below cannot overwrite whatever state
     // SetErrorState() established with kDecoding.
     return;
   }

   // Output buffers will be created once decoder gives us information
   // about their size and required count.
   state_ = kDecoding;
 }

 // Tears the accelerator down and deletes it. Must be called on the child
 // thread. If the decoder thread is running, DestroyTask() is posted to it and
 // the thread is stopped before the object is deleted.
 void V4L2SliceVideoDecodeAccelerator::Destroy() {
   VLOGF(2);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   // Signal any waiting/sleeping tasks to early exit as soon as possible to
   // avoid waiting too long for the decoder_thread_ to Stop().
   destroy_pending_.Signal();

   if (decoder_thread_.IsRunning()) {
     // base::Unretained is used because |this| is only deleted below, after
     // the decoder thread has been stopped.
     decoder_thread_task_runner_->PostTask(
         FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DestroyTask,
                                   base::Unretained(this)));

     // Wait for tasks to finish/early-exit.
     decoder_thread_.Stop();
   }

   // The object is gone after this line; nothing below may touch members.
   delete this;
   VLOGF(2) << "Destroyed";
 }

 // Decoder-thread half of destruction: moves to kDestroying, resets the
 // decoder, drops all pending input, stops device polling and streaming, and
 // releases input/output buffers, the media device fd and both queues.
 void V4L2SliceVideoDecodeAccelerator::DestroyTask() {
   DVLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   TRACE_EVENT0("media,gpu", "V4L2SVDA::DestroyTask");

   state_ = kDestroying;

   decoder_->Reset();

   // Release the bitstream buffer currently being decoded and every buffer
   // still waiting in the input queue.
   decoder_current_bitstream_buffer_.reset();
   while (!decoder_input_queue_.empty())
     decoder_input_queue_.pop_front();

   // Stop streaming and the device_poll_thread_.
   StopDevicePoll();

   DestroyInputBuffers();
   DestroyOutputs(false);

   media_fd_.reset();

   input_queue_ = nullptr;
   output_queue_ = nullptr;

   base::trace_event::MemoryDumpManager::GetInstance()->UnregisterDumpProvider(
       this);

   // Everything that referenced a surface must be empty by now.
   DCHECK(surfaces_at_device_.empty());
   DCHECK(surfaces_at_display_.empty());
   DCHECK(decoder_display_queue_.empty());
 }

 // Configures the formats of both V4L2 queues before streaming starts.
 //
 // For the input (OUTPUT) queue, verifies that the device enumerates
 // |input_format_fourcc_| and sets it together with the input buffer size.
 // For the output (CAPTURE) queue, selects the first enumerated format that
 // an EGLImage can be created from and sets its fourcc and plane count.
 //
 // Returns false if the input format is not enumerated by the device, no
 // usable output format is found, or a VIDIOC_S_FMT call fails.
 bool V4L2SliceVideoDecodeAccelerator::SetupFormats() {
   DCHECK_EQ(state_, kUninitialized);

   // Choose the input buffer size from the largest resolution the device
   // reports for this codec.
   gfx::Size min_resolution;
   gfx::Size max_resolution;
   device_->GetSupportedResolution(input_format_fourcc_, &min_resolution,
                                   &max_resolution);
   size_t input_size;
   if (max_resolution.width() > 1920 && max_resolution.height() > 1088) {
     input_size = kInputBufferMaxSizeFor4k;
   } else {
     input_size = kInputBufferMaxSizeFor1080p;
   }

   // Walk the formats of the input queue looking for our fourcc.
   struct v4l2_fmtdesc fmtdesc;
   memset(&fmtdesc, 0, sizeof(fmtdesc));
   fmtdesc.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
   bool is_format_supported = false;
   for (; device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0; ++fmtdesc.index) {
     if (fmtdesc.pixelformat == input_format_fourcc_) {
       is_format_supported = true;
       break;
     }
   }

   if (!is_format_supported) {
     DVLOGF(1) << "Input fourcc " << input_format_fourcc_
               << " not supported by device.";
     return false;
   }

   struct v4l2_format format;
   memset(&format, 0, sizeof(format));
   format.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
   format.fmt.pix_mp.pixelformat = input_format_fourcc_;
   format.fmt.pix_mp.plane_fmt[0].sizeimage = input_size;
   format.fmt.pix_mp.num_planes = input_planes_count_;
   IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format);
   DCHECK_EQ(format.fmt.pix_mp.pixelformat, input_format_fourcc_);

   // We have to set up the format for output, because the driver may not allow
   // changing it once we start streaming; whether it can support our chosen
   // output format or not may depend on the input format.
   memset(&fmtdesc, 0, sizeof(fmtdesc));
   fmtdesc.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
   output_format_fourcc_ = 0;
   for (; device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0; ++fmtdesc.index) {
     if (device_->CanCreateEGLImageFrom(fmtdesc.pixelformat)) {
       output_format_fourcc_ = fmtdesc.pixelformat;
       break;
     }
   }

   if (output_format_fourcc_ == 0) {
     VLOGF(1) << "Could not find a usable output format";
     return false;
   }

   // GL images are created from the decoder device using the output format.
   gl_image_format_fourcc_ = output_format_fourcc_;
   gl_image_device_ = device_;

   // Only set fourcc for output; resolution, etc., will come from the
   // driver once it extracts it from the stream.
   memset(&format, 0, sizeof(format));
   format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
   format.fmt.pix_mp.pixelformat = output_format_fourcc_;
   format.fmt.pix_mp.num_planes =
       V4L2Device::GetNumPlanesOfV4L2PixFmt(output_format_fourcc_);
   IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format);
   DCHECK_EQ(format.fmt.pix_mp.pixelformat, output_format_fourcc_);

   DCHECK_EQ(V4L2Device::GetNumPlanesOfV4L2PixFmt(output_format_fourcc_),
             static_cast<size_t>(format.fmt.pix_mp.num_planes));
   output_planes_count_ = format.fmt.pix_mp.num_planes;
   gl_image_planes_count_ = output_planes_count_;

   return true;
 }

 bool V4L2SliceVideoDecodeAccelerator::CreateInputBuffers() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK(!input_queue_->IsStreaming());

   if (input_queue_->AllocateBuffers(kNumInputBuffers, V4L2_MEMORY_MMAP) <
       kNumInputBuffers) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // The remainder of this method only applies if requests are used.
   if (!supports_requests_)
     return true;

   DCHECK(requests_.empty());

   DCHECK(media_fd_.is_valid());
   for (size_t i = 0; i < input_queue_->AllocatedBuffersCount(); i++) {
     int request_fd;

     int ret = HANDLE_EINTR(
         ioctl(media_fd_.get(), MEDIA_IOC_REQUEST_ALLOC, &request_fd));
     if (ret < 0) {
       VPLOGF(1) << "Failed to create request: ";
       return false;
     }

     requests_.push(base::ScopedFD(request_fd));
   }
   DCHECK_EQ(requests_.size(), input_queue_->AllocatedBuffersCount());

   return true;
 }

 // Starts output buffer creation for the picture size currently reported by
 // the decoder: sets that size on the OUTPUT queue format, reads the
 // resulting coded size from the CAPTURE queue, asks the client (on the child
 // thread) to provide picture buffers, and enters kAwaitingPictureBuffers.
 //
 // Returns false on ioctl failure (after raising PLATFORM_FAILURE) or if the
 // coded size read back from the driver does not contain the picture size.
 bool V4L2SliceVideoDecodeAccelerator::CreateOutputBuffers() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK(!output_queue_->IsStreaming());
   DCHECK(output_buffer_map_.empty());
   DCHECK(surfaces_at_display_.empty());
   DCHECK(surfaces_at_device_.empty());

   gfx::Size pic_size = decoder_->GetPicSize();
   size_t num_pictures = decoder_->GetRequiredNumOfPictures();

   DCHECK_GT(num_pictures, 0u);
   DCHECK(!pic_size.IsEmpty());

   // Since VdaVideoDecoder doesn't allocate PictureBuffer with size adjusted by
   // itself, we have to adjust here.
   struct v4l2_format format;
   memset(&format, 0, sizeof(format));
   format.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;

   if (device_->Ioctl(VIDIOC_G_FMT, &format) != 0) {
     VPLOGF(1) << "Failed getting OUTPUT format";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // Keep the current OUTPUT format and only update its resolution.
   format.fmt.pix_mp.width = pic_size.width();
   format.fmt.pix_mp.height = pic_size.height();

   if (device_->Ioctl(VIDIOC_S_FMT, &format) != 0) {
     VPLOGF(1) << "Failed setting OUTPUT format to: " << input_format_fourcc_;
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // Get the coded size from the CAPTURE queue
   memset(&format, 0, sizeof(format));
   format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
   if (device_->Ioctl(VIDIOC_G_FMT, &format) != 0) {
     VPLOGF(1) << "Failed getting CAPTURE format";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   coded_size_.SetSize(base::checked_cast<int>(format.fmt.pix_mp.width),
                       base::checked_cast<int>(format.fmt.pix_mp.height));
   DCHECK_EQ(coded_size_.width() % 16, 0);
   DCHECK_EQ(coded_size_.height() % 16, 0);

   gl_image_size_ = coded_size_;

   // The coded size must be at least as large as the picture size.
   // NOTE(review): unlike the ioctl failures above, this path returns false
   // without NOTIFY_ERROR -- confirm callers raise the error themselves.
   if (!gfx::Rect(coded_size_).Contains(gfx::Rect(pic_size))) {
     VLOGF(1) << "Got invalid adjusted coded size: " << coded_size_.ToString();
     return false;
   }

   DVLOGF(3) << "buffer_count=" << num_pictures
             << ", pic size=" << pic_size.ToString()
             << ", coded size=" << coded_size_.ToString();

   // Ask the client, on the child thread, for |num_pictures| picture buffers
   // of the coded size.
   VideoPixelFormat pixel_format =
       V4L2Device::V4L2PixFmtToVideoPixelFormat(gl_image_format_fourcc_);
   child_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(
           &VideoDecodeAccelerator::Client::ProvidePictureBuffersWithVisibleRect,
           client_, num_pictures, pixel_format, 1, coded_size_,
           decoder_->GetVisibleRect(), device_->GetTextureTarget()));

   // Go into kAwaitingPictureBuffers to prevent us from doing any more decoding
   // or event handling while we are waiting for AssignPictureBuffers(). Not
   // having Pictures available would not have prevented us from making decoding
   // progress entirely e.g. in the case of H.264 where we could further decode
   // non-slice NALUs and could even get another resolution change before we were
   // done with this one. After we get the buffers, we'll go back into kIdle and
   // kick off further event processing, and eventually go back into kDecoding
   // once no more events are pending (if any).
   state_ = kAwaitingPictureBuffers;
   return true;
 }

 // Frees the input queue buffers and, when the request API is in use, all
 // allocated requests. Does nothing if the input queue was never acquired.
 void V4L2SliceVideoDecodeAccelerator::DestroyInputBuffers() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread() ||
          !decoder_thread_.IsRunning());

   if (input_queue_) {
     // Streaming is expected to be off before buffers are freed.
     DCHECK(!input_queue_->IsStreaming());

     input_queue_->DeallocateBuffers();

     if (supports_requests_) {
       // Replacing the container with an empty one drops every request fd.
       requests_ = {};
     }
   }
 }

 // Runs on the child thread. Asks the client to dismiss every picture buffer
 // in |picture_buffer_ids| and then signals |done|.
 //
 // |client_| is a weak pointer that NotifyError() invalidates on this same
 // thread, so its validity is checked before each call. |done| is signalled
 // even if the client is gone, so that whoever waits on it is released.
 void V4L2SliceVideoDecodeAccelerator::DismissPictures(
     const std::vector<int32_t>& picture_buffer_ids,
     base::WaitableEvent* done) {
   DVLOGF(3);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   for (auto picture_buffer_id : picture_buffer_ids) {
     DVLOGF(4) << "dismissing PictureBuffer id=" << picture_buffer_id;
     // Re-check on every iteration: the client callback runs on this thread
     // and may lead to the weak pointer being invalidated.
     if (client_)
       client_->DismissPictureBuffer(picture_buffer_id);
   }

   done->Signal();
 }

 // Runs on the device poll thread. Polls the device and, on success, posts
 // ServiceDeviceTask() to the decoder thread. A poll failure raises
 // PLATFORM_FAILURE and nothing is posted.
 void V4L2SliceVideoDecodeAccelerator::DevicePollTask(bool poll_device) {
   DVLOGF(3);
   DCHECK(device_poll_thread_.task_runner()->BelongsToCurrentThread());
   TRACE_EVENT0("media,gpu", "V4L2SVDA::DevicePollTask");
   // Filled in by Poll() but not consulted afterwards.
   bool event_pending;
   if (!device_->Poll(poll_device, &event_pending)) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   // All processing should happen on ServiceDeviceTask(), since we shouldn't
   // touch decoder state from this thread.
   decoder_thread_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ServiceDeviceTask,
                      base::Unretained(this)));
 }

 // Decoder-thread reaction to a completed device poll: dequeues finished
 // buffers and schedules another poll if needed. Skipped entirely once
 // destruction is pending.
 void V4L2SliceVideoDecodeAccelerator::ServiceDeviceTask() {
   DVLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   // ServiceDeviceTask() should only ever be scheduled from DevicePollTask().
   if (!IsDestroyPending()) {
     Dequeue();
     SchedulePollIfNeeded();
   }
 }

 // Posts a DevicePollTask() to the device poll thread, provided that thread is
 // running and at least one buffer is currently queued on either V4L2 queue.
 void V4L2SliceVideoDecodeAccelerator::SchedulePollIfNeeded() {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (!device_poll_thread_.IsRunning()) {
     DVLOGF(4) << "Device poll thread stopped, will not schedule poll";
     return;
   }

   DCHECK(input_queue_->IsStreaming() || output_queue_->IsStreaming());

   // With nothing queued on either side there is nothing to wait for.
   const auto total_queued =
       input_queue_->QueuedBuffersCount() + output_queue_->QueuedBuffersCount();
   if (total_queued == 0) {
     DVLOGF(4) << "No buffers queued, will not schedule poll";
     return;
   }

   DVLOGF(4) << "Scheduling device poll task";

   auto poll_task =
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DevicePollTask,
                      base::Unretained(this), true);
   device_poll_thread_.task_runner()->PostTask(FROM_HERE, std::move(poll_task));

   // Snapshot of where buffers currently sit in the pipeline.
   DVLOGF(3) << "buffer counts: "
             << "INPUT[" << decoder_input_queue_.size() << "]"
             << " => DEVICE[" << input_queue_->FreeBuffersCount() << "+"
             << input_queue_->QueuedBuffersCount() << "/"
             << input_queue_->AllocatedBuffersCount() << "]->["
             << output_queue_->FreeBuffersCount() << "+"
             << output_queue_->QueuedBuffersCount() << "/"
             << output_buffer_map_.size() << "]"
             << " => DISPLAYQ[" << decoder_display_queue_.size() << "]"
             << " => CLIENT[" << surfaces_at_display_.size() << "]";
 }

 void V4L2SliceVideoDecodeAccelerator::Enqueue(
     const scoped_refptr<V4L2DecodeSurface>& dec_surface) {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   const int old_inputs_queued = input_queue_->QueuedBuffersCount();
   const int old_outputs_queued = output_queue_->QueuedBuffersCount();

   if (!EnqueueInputRecord(dec_surface.get())) {
     VLOGF(1) << "Failed queueing an input buffer";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   if (!EnqueueOutputRecord(dec_surface.get())) {
     VLOGF(1) << "Failed queueing an output buffer";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   surfaces_at_device_.push(dec_surface);

   if (old_inputs_queued == 0 && old_outputs_queued == 0)
     SchedulePollIfNeeded();
 }

 void V4L2SliceVideoDecodeAccelerator::Dequeue() {
   DVLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   while (input_queue_->QueuedBuffersCount() > 0) {
     DCHECK(input_queue_->IsStreaming());
     auto ret = input_queue_->DequeueBuffer();

     if (ret.first == false) {
       NOTIFY_ERROR(PLATFORM_FAILURE);
       return;
     } else if (!ret.second) {
       // we're just out of buffers to dequeue.
       break;
     }

     DVLOGF(4) << "Dequeued input=" << ret.second->BufferId()
               << " count: " << input_queue_->QueuedBuffersCount();
   }

   while (output_queue_->QueuedBuffersCount() > 0) {
     DCHECK(output_queue_->IsStreaming());
     auto ret = output_queue_->DequeueBuffer();
     if (ret.first == false) {
       NOTIFY_ERROR(PLATFORM_FAILURE);
       return;
     } else if (!ret.second) {
       // we're just out of buffers to dequeue.
       break;
     }

     DVLOGF(4) << "Dequeued output=" << ret.second->BufferId() << " count "
               << output_queue_->QueuedBuffersCount();

     DCHECK(!surfaces_at_device_.empty());
     scoped_refptr<V4L2DecodeSurface> surface = surfaces_at_device_.front();
     surfaces_at_device_.pop();
     DCHECK_EQ(static_cast<size_t>(surface->output_record()),
               ret.second->BufferId());
     surface->SetDecoded();

     surface->SetReleaseCallback(
         base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ReuseOutputBuffer,
                        base::Unretained(this), std::move(ret.second)));
   }

   // A frame was decoded, see if we can output it.
   TryOutputSurfaces();

   ProcessPendingEventsIfNeeded();
   ScheduleDecodeBufferTaskIfNeeded();
 }

 // Called when a new event has been flagged as pending. Leaves kDecoding for
 // kIdle (if currently decoding) and then tries to process pending events.
 void V4L2SliceVideoDecodeAccelerator::NewEventPending() {
   // Switch to event processing mode if we are decoding. Otherwise we are either
   // already in it, or we will potentially switch to it later, after finishing
   // other tasks.
   if (state_ == kDecoding)
     state_ = kIdle;

   ProcessPendingEventsIfNeeded();
 }

 // Last step of event processing (see ProcessPendingEventsIfNeeded()):
 // switches from kIdle back to kDecoding and schedules decoding of further
 // input. Always returns true.
 bool V4L2SliceVideoDecodeAccelerator::FinishEventProcessing() {
   DCHECK_EQ(state_, kIdle);

   state_ = kDecoding;
   ScheduleDecodeBufferTaskIfNeeded();

   return true;
 }

 void V4L2SliceVideoDecodeAccelerator::ProcessPendingEventsIfNeeded() {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   // Process pending events, if any, in the correct order.
   // We always first process the surface set change, as it is an internal
   // event from the decoder and interleaving it with external requests would
   // put the decoder in an undefined state.
   using ProcessFunc = bool (V4L2SliceVideoDecodeAccelerator::*)();
   const ProcessFunc process_functions[] = {
       &V4L2SliceVideoDecodeAccelerator::FinishSurfaceSetChange,
       &V4L2SliceVideoDecodeAccelerator::FinishFlush,
       &V4L2SliceVideoDecodeAccelerator::FinishReset,
       &V4L2SliceVideoDecodeAccelerator::FinishEventProcessing,
   };

   for (const auto& fn : process_functions) {
     if (state_ != kIdle)
       return;

     if (!(this->*fn)())
       return;
   }
 }

 // Release callback bound to a decoded surface in Dequeue(). |buffer| is the
 // reference to the dequeued output buffer; it is dropped when this function
 // returns. Decoding is then rescheduled.
 void V4L2SliceVideoDecodeAccelerator::ReuseOutputBuffer(
     V4L2ReadableBufferRef buffer) {
   DVLOGF(4) << "Reusing output buffer, index=" << buffer->BufferId();
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   ScheduleDecodeBufferTaskIfNeeded();
 }

 // Takes the input buffer out of |dec_surface| and queues it to the device as
 // an MMAP buffer. Returns false, after raising PLATFORM_FAILURE, if queueing
 // fails.
 bool V4L2SliceVideoDecodeAccelerator::EnqueueInputRecord(
     V4L2DecodeSurface* dec_surface) {
   DVLOGF(4);
   DCHECK_NE(dec_surface, nullptr);

   // Enqueue an input (VIDEO_OUTPUT) buffer for an input video frame.
   V4L2WritableBufferRef input_buffer = std::move(dec_surface->input_buffer());
   DCHECK(input_buffer.IsValid());
   // Save the id for logging; |input_buffer| is moved from below.
   const int index = input_buffer.BufferId();
   input_buffer.PrepareQueueBuffer(*dec_surface);
   if (!std::move(input_buffer).QueueMMap()) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   DVLOGF(4) << "Enqueued input=" << index
             << " count: " << input_queue_->QueuedBuffersCount();

   return true;
 }

 // Takes the output buffer out of |dec_surface| and queues it to the device:
 // as an MMAP buffer in ALLOCATE mode, otherwise as a DMABUF using the fds
 // stored in the matching output record. Returns false, after raising
 // PLATFORM_FAILURE, if queueing fails.
 bool V4L2SliceVideoDecodeAccelerator::EnqueueOutputRecord(
     V4L2DecodeSurface* dec_surface) {
   DVLOGF(4);

   // Enqueue an output (VIDEO_CAPTURE) buffer.
   V4L2WritableBufferRef capture_buffer =
       std::move(dec_surface->output_buffer());
   DCHECK(capture_buffer.IsValid());
   // Save the id now; |capture_buffer| is moved from when it is queued.
   const size_t buffer_index = capture_buffer.BufferId();
   OutputRecord& record = output_buffer_map_[buffer_index];
   DCHECK_NE(record.picture_id, -1);

   const bool queued =
       (output_mode_ == Config::OutputMode::ALLOCATE)
           ? std::move(capture_buffer).QueueMMap()
           : std::move(capture_buffer).QueueDMABuf(record.dmabuf_fds);
   if (!queued) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   DVLOGF(4) << "Enqueued output=" << buffer_index
             << " count: " << output_queue_->QueuedBuffersCount();

   return true;
 }

 // Starts the device poll thread, turns streaming on for the input queue and
 // then the output queue, and posts the first DevicePollTask(). Returns false
 // if the thread cannot be started (PLATFORM_FAILURE is raised) or if either
 // queue fails to start streaming.
 bool V4L2SliceVideoDecodeAccelerator::StartDevicePoll() {
   DVLOGF(3) << "Starting device poll";
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK(!device_poll_thread_.IsRunning());

   // Start up the device poll thread and schedule its first DevicePollTask().
   const bool thread_started = device_poll_thread_.Start();
   if (!thread_started) {
     VLOGF(1) << "Device thread failed to start";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // Input first; the output queue is only touched if the input succeeded.
   if (!input_queue_->Streamon() || !output_queue_->Streamon())
     return false;

   auto first_poll =
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DevicePollTask,
                      base::Unretained(this), true);
   device_poll_thread_.task_runner()->PostTask(FROM_HERE,
                                               std::move(first_poll));

   return true;
 }

 // Interrupts and stops the device poll thread, turns streaming off on both
 // queues (if they have been acquired) and drops every surface that was at
 // the device or waiting to be displayed. Returns false as soon as any step
 // fails; the remaining steps are then skipped.
 bool V4L2SliceVideoDecodeAccelerator::StopDevicePoll() {
   DVLOGF(3) << "Stopping device poll";
   if (decoder_thread_.IsRunning())
     DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   // Signal the DevicePollTask() to stop, and stop the device poll thread.
   if (!device_->SetDevicePollInterrupt()) {
     VPLOGF(1) << "SetDevicePollInterrupt(): failed";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }
   device_poll_thread_.Stop();
   DVLOGF(3) << "Device poll thread stopped";

   // Clear the interrupt now, to be sure.
   if (!device_->ClearDevicePollInterrupt()) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // We may be called before the queue is acquired.
   if (input_queue_) {
     if (!input_queue_->Streamoff())
       return false;

     DCHECK_EQ(input_queue_->QueuedBuffersCount(), 0u);
   }

   // We may be called before the queue is acquired.
   if (output_queue_) {
     if (!output_queue_->Streamoff())
       return false;

     DCHECK_EQ(output_queue_->QueuedBuffersCount(), 0u);
   }

   // Drop our references to all surfaces that were queued to the device.
   while (!surfaces_at_device_.empty())
     surfaces_at_device_.pop();

   // Drop all surfaces that were awaiting decode before being displayed,
   // since we've just cancelled all outstanding decodes.
   while (!decoder_display_queue_.empty())
     decoder_display_queue_.pop();

   DVLOGF(3) << "Device poll stopped";
   return true;
 }

 // Convenience overload: converts |bitstream_buffer| to a DecoderBuffer and
 // forwards it, together with its id, to the DecoderBuffer overload.
 void V4L2SliceVideoDecodeAccelerator::Decode(BitstreamBuffer bitstream_buffer) {
   Decode(bitstream_buffer.ToDecoderBuffer(), bitstream_buffer.id());
 }

 // Validates |bitstream_id| and forwards |buffer| to DecodeTask() on the
 // decoder thread. A negative id is reported as INVALID_ARGUMENT and the
 // buffer is not queued.
 void V4L2SliceVideoDecodeAccelerator::Decode(
     scoped_refptr<DecoderBuffer> buffer,
     int32_t bitstream_id) {
   DVLOGF(4) << "input_id=" << bitstream_id
             << ", size=" << (buffer ? buffer->data_size() : 0);
   DCHECK(decode_task_runner_->BelongsToCurrentThread());

   const bool id_is_valid = bitstream_id >= 0;
   if (!id_is_valid) {
     VLOGF(1) << "Invalid bitstream buffer, id: " << bitstream_id;
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   base::OnceClosure decode_task =
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DecodeTask,
                      base::Unretained(this), std::move(buffer), bitstream_id);
   decoder_thread_task_runner_->PostTask(FROM_HERE, std::move(decode_task));
 }

 // Decoder-thread half of Decode(): wraps |buffer| in a BitstreamBufferRef,
 // appends it to decoder_input_queue_ and schedules decoding. Does nothing if
 // destruction is pending; a null |buffer| is wrapped and then dropped without
 // being queued.
 void V4L2SliceVideoDecodeAccelerator::DecodeTask(
     scoped_refptr<DecoderBuffer> buffer,
     int32_t bitstream_id) {
   DVLOGF(4) << "input_id=" << bitstream_id
             << " size=" << (buffer ? buffer->data_size() : 0);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (IsDestroyPending())
     return;

   // Built with std::make_unique, the same way FlushTask() builds its marker.
   auto bitstream_record = std::make_unique<BitstreamBufferRef>(
       decode_client_, decode_task_runner_, std::move(buffer), bitstream_id);

   // Skip empty buffer. The record is still created first and destroyed here.
   // NOTE(review): presumably its destructor is what tells the client the
   // buffer is done - confirm against BitstreamBufferRef.
   if (!bitstream_record->buffer)
     return;

   decoder_input_queue_.push_back(std::move(bitstream_record));

   TRACE_COUNTER_ID1("media,gpu", "V4L2SVDA decoder input BitstreamBuffers",
                     this, decoder_input_queue_.size());

   ScheduleDecodeBufferTaskIfNeeded();
 }

 // Pops the next entry of decoder_input_queue_ into
 // decoder_current_bitstream_buffer_. Returns true if it was handed to the
 // decoder as new stream data; returns false if the queue was empty or the
 // entry was the flush marker (in which case the flush is initiated).
 bool V4L2SliceVideoDecodeAccelerator::TrySetNewBistreamBuffer() {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK(!decoder_current_bitstream_buffer_);

   if (decoder_input_queue_.empty())
     return false;

   decoder_current_bitstream_buffer_ = std::move(decoder_input_queue_.front());
   decoder_input_queue_.pop_front();

   const bool is_flush_marker =
       decoder_current_bitstream_buffer_->input_id == kFlushBufferId;
   if (!is_flush_marker) {
     decoder_->SetStream(decoder_current_bitstream_buffer_->input_id,
                         *decoder_current_bitstream_buffer_->buffer);
     return true;
   }

   // We queued this entry ourselves (see FlushTask()) so that the flush starts
   // exactly once all earlier input has been consumed.
   InitiateFlush();
   return false;
 }

 void V4L2SliceVideoDecodeAccelerator::ScheduleDecodeBufferTaskIfNeeded() {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   if (state_ == kDecoding) {
     decoder_thread_task_runner_->PostTask(
         FROM_HERE,
         base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DecodeBufferTask,
                        base::Unretained(this)));
   }
 }

 void V4L2SliceVideoDecodeAccelerator::DecodeBufferTask() {
   DVLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   TRACE_EVENT0("media,gpu", "V4L2SVDA::DecodeBufferTask");

   if (IsDestroyPending())
     return;

   if (state_ != kDecoding) {
     DVLOGF(3) << "Early exit, not in kDecoding";
     return;
   }

   while (true) {
     TRACE_EVENT_BEGIN0("media,gpu", "V4L2SVDA::DecodeBufferTask AVD::Decode");
     const AcceleratedVideoDecoder::DecodeResult res = decoder_->Decode();
     TRACE_EVENT_END0("media,gpu", "V4L2SVDA::DecodeBufferTask AVD::Decode");
     switch (res) {
       case AcceleratedVideoDecoder::kAllocateNewSurfaces:
         VLOGF(2) << "Decoder requesting a new set of surfaces";
         InitiateSurfaceSetChange();
         return;

       case AcceleratedVideoDecoder::kRanOutOfStreamData:
         decoder_current_bitstream_buffer_.reset();
         if (!TrySetNewBistreamBuffer())
           return;

         break;

       case AcceleratedVideoDecoder::kRanOutOfSurfaces:
         // No more surfaces for the decoder, we'll come back once we have more.
         DVLOGF(4) << "Ran out of surfaces";
         return;

       case AcceleratedVideoDecoder::kNeedContextUpdate:
         DVLOGF(4) << "Awaiting context update";
         return;

       case AcceleratedVideoDecoder::kDecodeError:
         VLOGF(1) << "Error decoding stream";
         NOTIFY_ERROR(PLATFORM_FAILURE);
         return;

       case AcceleratedVideoDecoder::kTryAgain:
         NOTREACHED() << "Should not reach here unless this class accepts "
                         "encrypted streams.";
         DVLOGF(4) << "No key for decoding stream.";
         NOTIFY_ERROR(PLATFORM_FAILURE);
         return;
     }
   }
 }

 // Marks a surface set change as pending and signals a new pending event; the
 // change itself is carried out in FinishSurfaceSetChange(). Must be called in
 // kDecoding with no surface set change already pending.
 void V4L2SliceVideoDecodeAccelerator::InitiateSurfaceSetChange() {
   VLOGF(2);
   // Preconditions.
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK(!surface_set_change_pending_);
   DCHECK_EQ(state_, kDecoding);

   // The matching async END event is emitted by FinishSurfaceSetChange().
   TRACE_EVENT_ASYNC_BEGIN0("media,gpu", "V4L2SVDA Resolution Change", this);

   surface_set_change_pending_ = true;
   NewEventPending();
 }

 // Completes a surface set change started by InitiateSurfaceSetChange().
 // Returns true when no change is pending or the change was carried out, and
 // false when it cannot finish yet (surfaces are still at the device) or a
 // step failed (PLATFORM_FAILURE is raised in that case).
 // The steps below run in a fixed order: stop polling/streaming, flush pending
 // PictureReady notifications, destroy the old outputs, create the new ones.
 bool V4L2SliceVideoDecodeAccelerator::FinishSurfaceSetChange() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   // Nothing to finish.
   if (!surface_set_change_pending_)
     return true;

   // Not done yet: some surfaces are still queued at the device.
   if (!surfaces_at_device_.empty())
     return false;

   DCHECK_EQ(state_, kIdle);
   DCHECK(decoder_display_queue_.empty());
   // All output buffers should've been returned from decoder and device by now.
   // The only remaining owner of surfaces may be display (client), and we will
   // dismiss them when destroying output buffers below.
   DCHECK_EQ(output_queue_->FreeBuffersCount() + surfaces_at_display_.size(),
             output_buffer_map_.size());

   if (!StopDevicePoll()) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // Dequeued decoded surfaces may be held in pending_picture_ready_ if they
   // are waiting for some pictures to be cleared. We should post them right away
   // because they are about to be dismissed and destroyed for the surface set
   // change.
   SendPictureReady();

   // This will return only once all buffers are dismissed and destroyed.
   // This does not wait until they are displayed however, as display retains
   // references to the buffers bound to textures and will release them
   // after displaying.
   if (!DestroyOutputs(true)) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   if (!CreateOutputBuffers()) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return false;
   }

   // Only clear the pending flag (and close the async trace opened in
   // InitiateSurfaceSetChange()) once every step above has succeeded.
   surface_set_change_pending_ = false;
   VLOGF(2) << "Surface set change finished";
   TRACE_EVENT_ASYNC_END0("media,gpu", "V4L2SVDA Resolution Change", this);
   return true;
 }

 // Destroys the current set of output buffers. When |dismiss| is true, first
 // posts DismissPictures() for every picture id in output_buffer_map_ to the
 // child thread and blocks until that task signals completion.
 // Returns true if there was nothing to destroy, otherwise the result of
 // DestroyOutputBuffers().
 bool V4L2SliceVideoDecodeAccelerator::DestroyOutputs(bool dismiss) {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (output_buffer_map_.empty())
     return true;

   if (dismiss) {
     // The id list is only needed for dismissal, so it is built here, sized up
     // front, and moved into the posted task instead of being copied.
     std::vector<int32_t> picture_buffers_to_dismiss;
     picture_buffers_to_dismiss.reserve(output_buffer_map_.size());
     for (const auto& output_record : output_buffer_map_)
       picture_buffers_to_dismiss.push_back(output_record.picture_id);

     VLOGF(2) << "Scheduling picture dismissal";
     base::WaitableEvent done(base::WaitableEvent::ResetPolicy::AUTOMATIC,
                              base::WaitableEvent::InitialState::NOT_SIGNALED);
     child_task_runner_->PostTask(
         FROM_HERE,
         base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DismissPictures,
                        weak_this_, std::move(picture_buffers_to_dismiss),
                        &done));
     // NOTE(review): the task is bound to weak_this_; if that pointer were
     // invalidated before the task runs, |done| would presumably never be
     // signaled and this wait would not return - confirm this cannot happen.
     done.Wait();
   }

   // At this point client can't call ReusePictureBuffer on any of the pictures
   // anymore, so it's safe to destroy.
   return DestroyOutputBuffers();
 }

 // Releases every reference this class holds to output buffers and then
 // deallocates them on the output queue. Expects that no surface is at the
 // device or in the display queue and that the output queue is not streaming.
 // Always returns true; it is a no-op when there is no output queue or no
 // output buffers.
 bool V4L2SliceVideoDecodeAccelerator::DestroyOutputBuffers() {
   VLOGF(2);
   // May run on the decoder thread, or on any thread once that thread is gone.
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread() ||
          !decoder_thread_.IsRunning());
   DCHECK(surfaces_at_device_.empty());
   DCHECK(decoder_display_queue_.empty());

   if (!output_queue_ || output_buffer_map_.empty())
     return true;

   DCHECK(!output_queue_->IsStreaming());
   DCHECK_EQ(output_queue_->QueuedBuffersCount(), 0u);

   // Release all buffers waiting for an import buffer event.
   output_wait_map_.clear();

   // Release all buffers awaiting a fence since we are about to destroy them.
   surfaces_awaiting_fence_ = {};

   // It's ok to do this, client will retain references to textures, but we are
   // not interested in reusing the surfaces anymore.
   // This will prevent us from reusing old surfaces in case we have some
   // ReusePictureBuffer() pending on ChildThread already. It's ok to ignore
   // them, because we have already dismissed them (in DestroyOutputs()).
   surfaces_at_display_.clear();
   // With all three holders above emptied, every buffer is expected to be back
   // on the queue's free list.
   DCHECK_EQ(output_queue_->FreeBuffersCount(), output_buffer_map_.size());

   output_buffer_map_.clear();

   output_queue_->DeallocateBuffers();

   return true;
 }

 void V4L2SliceVideoDecodeAccelerator::AssignPictureBuffers(
     const std::vector<PictureBuffer>& buffers) {
   VLOGF(2);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   decoder_thread_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::AssignPictureBuffersTask,
                      base::Unretained(this), buffers));
 }

 // Decoder-thread half of AssignPictureBuffers(). Validates the picture
 // buffers supplied by the client, renegotiates the capture format if the
 // client chose a different frame size, allocates the V4L2 output buffers,
 // fills in output_buffer_map_, parks every buffer in output_wait_map_ until
 // it is imported, restarts device polling and finally moves to kIdle.
 // Any failure raises an error via NOTIFY_ERROR and returns early.
 void V4L2SliceVideoDecodeAccelerator::AssignPictureBuffersTask(
     const std::vector<PictureBuffer>& buffers) {
   VLOGF(2);
   DCHECK(!output_queue_->IsStreaming());
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK_EQ(state_, kAwaitingPictureBuffers);
   TRACE_EVENT1("media,gpu", "V4L2SVDA::AssignPictureBuffersTask",
                "buffers_size", buffers.size());

   if (IsDestroyPending())
     return;

   const uint32_t req_buffer_count = decoder_->GetRequiredNumOfPictures();

   // The client may provide more buffers than requested, but never fewer.
   if (buffers.size() < req_buffer_count) {
     VLOGF(1) << "Failed to provide requested picture buffers. "
              << "(Got " << buffers.size() << ", requested " << req_buffer_count
              << ")";
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   // If the client allocated a different frame size, S_FMT must be called with
   // that size.
   // NOTE(review): buffers[0] assumes |buffers| is non-empty, which the check
   // above only guarantees when req_buffer_count > 0 - confirm.
   if (coded_size_ != buffers[0].size()) {
     const auto& new_frame_size = buffers[0].size();
     v4l2_format format = {};
     format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
     format.fmt.pix_mp.width = new_frame_size.width();
     format.fmt.pix_mp.height = new_frame_size.height();
     format.fmt.pix_mp.pixelformat = output_format_fourcc_;
     format.fmt.pix_mp.num_planes = output_planes_count_;
     if (device_->Ioctl(VIDIOC_S_FMT, &format) != 0) {
       VPLOGF(1) << "Failed with frame size adjusted by client: "
                 << new_frame_size.ToString();
       NOTIFY_ERROR(PLATFORM_FAILURE);
       return;
     }

     // Adopt whatever size the ioctl left in |format|.
     coded_size_.SetSize(format.fmt.pix_mp.width, format.fmt.pix_mp.height);
     // If size specified by ProvidePictureBuffers() is adjusted by the client,
     // the size must not be adjusted by a v4l2 driver again.
     if (coded_size_ != new_frame_size) {
       VLOGF(1) << "The size of PictureBuffer is invalid."
                << " size adjusted by the client = " << new_frame_size.ToString()
                << " size adjusted by a driver = " << coded_size_.ToString();
       NOTIFY_ERROR(INVALID_ARGUMENT);
       return;
     }

     // The coded size must still be large enough to hold the decoder's picture
     // size.
     if (!gfx::Rect(coded_size_).Contains(gfx::Rect(decoder_->GetPicSize()))) {
       VLOGF(1) << "Got invalid adjusted coded size: " << coded_size_.ToString();
       NOTIFY_ERROR(INVALID_ARGUMENT);
       return;
     }
   }

   gl_image_size_ = coded_size_;

   // ALLOCATE mode uses MMAP buffers; otherwise buffers are DMABUF-backed.
   const v4l2_memory memory =
       (output_mode_ == Config::OutputMode::ALLOCATE ? V4L2_MEMORY_MMAP
                                                     : V4L2_MEMORY_DMABUF);
   if (output_queue_->AllocateBuffers(buffers.size(), memory) !=
       buffers.size()) {
     VLOGF(1) << "Could not allocate enough output buffers";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   DCHECK(output_buffer_map_.empty());
   DCHECK(output_wait_map_.empty());
   output_buffer_map_.resize(buffers.size());
   // Reserve all buffers until ImportBufferForPictureTask() is called
   while (output_queue_->FreeBuffersCount() > 0) {
     V4L2WritableBufferRef buffer = output_queue_->GetFreeBuffer();
     DCHECK(buffer.IsValid());
     // The V4L2 buffer id doubles as the index into |buffers|.
     int i = buffer.BufferId();

     DCHECK_EQ(output_wait_map_.count(buffers[i].id()), 0u);
     // The buffer will remain here until ImportBufferForPicture is called,
     // either by the client, or by ourselves, if we are allocating.
     output_wait_map_.emplace(buffers[i].id(), std::move(buffer));
   }
   // All available buffers should be in the wait map now.
   DCHECK_EQ(output_buffer_map_.size(), output_wait_map_.size());

   for (size_t i = 0; i < buffers.size(); i++) {
     OutputRecord& output_record = output_buffer_map_[i];
     // Freshly resized records are expected to be in their default state.
     DCHECK_EQ(output_record.picture_id, -1);
     DCHECK(output_record.dmabuf_fds.empty());
     DCHECK_EQ(output_record.cleared, false);

     output_record.picture_id = buffers[i].id();
     // A texture id of 0 means "no texture"; only the first id is used.
     output_record.texture_id = buffers[i].service_texture_ids().empty()
                                    ? 0
                                    : buffers[i].service_texture_ids()[0];

     output_record.client_texture_id = buffers[i].client_texture_ids().empty()
                                           ? 0
                                           : buffers[i].client_texture_ids()[0];

     if (output_mode_ == Config::OutputMode::ALLOCATE) {
       // In ALLOCATE mode we fetch the dmabufs for the V4L2 buffer ourselves
       // and trigger the import right away.
       std::vector<base::ScopedFD> passed_dmabuf_fds =
           gl_image_device_->GetDmabufsForV4L2Buffer(
               i, gl_image_planes_count_, V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE);
       if (passed_dmabuf_fds.empty()) {
         NOTIFY_ERROR(PLATFORM_FAILURE);
         return;
       }

       ImportBufferForPictureTask(output_record.picture_id,
                                  std::move(passed_dmabuf_fds));
     }  // else we'll get triggered via ImportBufferForPicture() from client.
     DVLOGF(3) << "buffer[" << i << "]: picture_id=" << output_record.picture_id;
   }

   if (!StartDevicePoll()) {
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   // Put us in kIdle to allow further event processing.
   // ProcessPendingEventsIfNeeded() will put us back into kDecoding after all
   // other pending events are processed successfully.
   state_ = kIdle;
   ProcessPendingEventsIfNeeded();
 }

 // Child-thread task: creates a GLImage of |size|/|fourcc| from
 // |passed_dmabuf_fds|, binds it to |texture_id|, reports the binding through
 // bind_image_cb_ and then posts AssignDmaBufs() to the decoder thread with
 // the same fds. Raises an error and returns early if the GL context cannot
 // be made current or the image cannot be created.
 void V4L2SliceVideoDecodeAccelerator::CreateGLImageFor(
     size_t buffer_index,
     int32_t picture_buffer_id,
     std::vector<base::ScopedFD> passed_dmabuf_fds,
     GLuint client_texture_id,
     GLuint texture_id,
     const gfx::Size& size,
     uint32_t fourcc) {
   DVLOGF(3) << "index=" << buffer_index;
   DCHECK(child_task_runner_->BelongsToCurrentThread());
   DCHECK_NE(texture_id, 0u);
   TRACE_EVENT1("media,gpu", "V4L2SVDA::CreateGLImageFor", "picture_buffer_id",
                picture_buffer_id);

   // A callback must exist, and running it must succeed.
   if (!make_context_current_cb_) {
     VLOGF(1) << "GL callbacks required for binding to GLImages";
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }
   if (!make_context_current_cb_.Run()) {
     VLOGF(1) << "No GL context";
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   const scoped_refptr<gl::GLImage> gl_image =
       gl_image_device_->CreateGLImage(size, fourcc, passed_dmabuf_fds);
   if (!gl_image) {
     VLOGF(1) << "Could not create GLImage,"
              << " index=" << buffer_index << " texture_id=" << texture_id;
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   // Bind the image while |texture_id| is bound; the binder's name indicates
   // the previous binding is put back when it goes out of scope.
   const auto texture_target = gl_image_device_->GetTextureTarget();
   gl::ScopedTextureBinder bind_restore(texture_target, texture_id);
   const bool bound = gl_image->BindTexImage(texture_target);
   DCHECK(bound);
   bind_image_cb_.Run(client_texture_id, texture_target, gl_image, true);

   // Hand the fds back to the decoder thread, where the buffer is marked as
   // ready for use.
   base::OnceClosure assign_task = base::BindOnce(
       &V4L2SliceVideoDecodeAccelerator::AssignDmaBufs, base::Unretained(this),
       buffer_index, picture_buffer_id, std::move(passed_dmabuf_fds));
   decoder_thread_task_runner_->PostTask(FROM_HERE, std::move(assign_task));
 }

 void V4L2SliceVideoDecodeAccelerator::AssignDmaBufs(
     size_t buffer_index,
     int32_t picture_buffer_id,
     std::vector<base::ScopedFD> passed_dmabuf_fds) {
   DVLOGF(3) << "index=" << buffer_index;
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (IsDestroyPending())
     return;

   // It's possible that while waiting for the EGLImages to be allocated and
   // assigned, we have already decoded more of the stream and saw another
   // resolution change. This is a normal situation, in such a case either there
   // is no output record with this index awaiting an EGLImage to be assigned to
   // it, or the record is already updated to use a newer PictureBuffer and is
   // awaiting an EGLImage associated with a different picture_buffer_id. If so,
   // just discard this image, we will get the one we are waiting for later.
   if (buffer_index >= output_buffer_map_.size() ||
       output_buffer_map_[buffer_index].picture_id != picture_buffer_id) {
     DVLOGF(4) << "Picture set already changed, dropping EGLImage";
     return;
   }

   OutputRecord& output_record = output_buffer_map_[buffer_index];
   DCHECK_EQ(output_wait_map_.count(picture_buffer_id), 1u);

   if (output_mode_ == Config::OutputMode::IMPORT) {
     DCHECK(output_record.dmabuf_fds.empty());
     output_record.dmabuf_fds = std::move(passed_dmabuf_fds);
   }

   // Buffer is ready to be used.
   output_wait_map_.erase(picture_buffer_id);
   ScheduleDecodeBufferTaskIfNeeded();
 }

 // Child-thread entry point for importing a client-provided buffer for
 // |picture_buffer_id|. Extracts the dmabuf fds from |gpu_memory_buffer_handle|
 // (only when built with USE_OZONE), validates the output mode and
 // |pixel_format|, and posts ImportBufferForPictureTask() to the decoder
 // thread. Raises INVALID_ARGUMENT and returns on any validation failure.
 void V4L2SliceVideoDecodeAccelerator::ImportBufferForPicture(
     int32_t picture_buffer_id,
     VideoPixelFormat pixel_format,
     gfx::GpuMemoryBufferHandle gpu_memory_buffer_handle) {
   DVLOGF(3) << "picture_buffer_id=" << picture_buffer_id;
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   std::vector<base::ScopedFD> dmabuf_fds;
 #if defined(USE_OZONE)
   // If the driver does not accept as many fds as we received from the client,
   // we have to check if the additional fds are actually duplicated fds pointing
   // to previous planes; if so, we can close the duplicates and keep only the
   // original fd(s).
   // Assume that an fd is a duplicate of a previous plane's fd if offset != 0.
   // Otherwise, if offset == 0, return error as it may be pointing to a new
   // plane.
   auto& planes = gpu_memory_buffer_handle.native_pixmap_handle.planes;
   dmabuf_fds.reserve(planes.size());
   for (auto& plane : planes)
     dmabuf_fds.push_back(std::move(plane.fd));

   // Trim surplus fds from the back. The loop is driven by the vector size
   // rather than by a down-counting unsigned index, so it cannot wrap around
   // when the handle carries no planes or when gl_image_planes_count_ is 0.
   while (dmabuf_fds.size() > gl_image_planes_count_) {
     const size_t last = dmabuf_fds.size() - 1;
     if (planes[last].offset == 0) {
       VLOGF(1) << "The dmabuf fd points to a new buffer, ";
       NOTIFY_ERROR(INVALID_ARGUMENT);
       return;
     }
     // Drop safely, because this fd is duplicate dmabuf fd pointing to previous
     // buffer and the appropriate address can be accessed by associated offset.
     dmabuf_fds.pop_back();
   }
 #endif

   if (output_mode_ != Config::OutputMode::IMPORT) {
     VLOGF(1) << "Cannot import in non-import mode";
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   // The client's format must match the one GLImages are created with.
   if (pixel_format !=
       V4L2Device::V4L2PixFmtToVideoPixelFormat(gl_image_format_fourcc_)) {
     VLOGF(1) << "Unsupported import format: "
              << VideoPixelFormatToString(pixel_format);
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   decoder_thread_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(
           &V4L2SliceVideoDecodeAccelerator::ImportBufferForPictureTask,
           base::Unretained(this), picture_buffer_id, std::move(dmabuf_fds)));
 }

 // Decoder-thread half of the import. Looks up the output record for
 // |picture_buffer_id|; if the record has a texture, posts CreateGLImageFor()
 // to the child thread, otherwise stores the fds on the record and makes the
 // buffer usable immediately. Unknown picture ids are silently ignored; a
 // picture that is not waiting for import raises INVALID_ARGUMENT.
 void V4L2SliceVideoDecodeAccelerator::ImportBufferForPictureTask(
     int32_t picture_buffer_id,
     std::vector<base::ScopedFD> passed_dmabuf_fds) {
   DVLOGF(3) << "picture_buffer_id=" << picture_buffer_id;
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (IsDestroyPending())
     return;

   const auto record_it = std::find_if(
       output_buffer_map_.begin(), output_buffer_map_.end(),
       [picture_buffer_id](const OutputRecord& candidate) {
         return candidate.picture_id == picture_buffer_id;
       });
   if (record_it == output_buffer_map_.end()) {
     // A DismissPictureBuffer for this picture may already have been posted by
     // us without having run yet when the client posted this import. The
     // picture is already dismissed and accounted for, so just ignore it.
     DVLOGF(3) << "got picture id=" << picture_buffer_id
               << " not in use (anymore?).";
     return;
   }

   if (output_wait_map_.count(picture_buffer_id) == 0) {
     VLOGF(1) << "Passed buffer is not waiting to be imported";
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   if (record_it->texture_id == 0) {
     // No texture means no GLImage is needed: take the fds and release the
     // buffer for use right away.
     DCHECK_EQ(gl_image_planes_count_, passed_dmabuf_fds.size());
     record_it->dmabuf_fds = std::move(passed_dmabuf_fds);

     DCHECK_EQ(output_wait_map_.count(picture_buffer_id), 1u);
     output_wait_map_.erase(picture_buffer_id);
     ScheduleDecodeBufferTaskIfNeeded();
     return;
   }

   // A texture is attached: the GLImage has to be created on the child thread,
   // which reports back through AssignDmaBufs().
   const size_t index = record_it - output_buffer_map_.begin();
   child_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::CreateGLImageFor,
                      weak_this_, index, picture_buffer_id,
                      std::move(passed_dmabuf_fds),
                      record_it->client_texture_id, record_it->texture_id,
                      gl_image_size_, gl_image_format_fourcc_));
 }

 void V4L2SliceVideoDecodeAccelerator::ReusePictureBuffer(
     int32_t picture_buffer_id) {
   DCHECK(child_task_runner_->BelongsToCurrentThread());
   DVLOGF(4) << "picture_buffer_id=" << picture_buffer_id;

   std::unique_ptr<gl::GLFenceEGL> egl_fence;

   if (make_context_current_cb_) {
     if (!make_context_current_cb_.Run()) {
       VLOGF(1) << "could not make context current";
       NOTIFY_ERROR(PLATFORM_FAILURE);
       return;
     }

     egl_fence = gl::GLFenceEGL::Create();
     if (!egl_fence) {
       VLOGF(1) << "gl::GLFenceEGL::Create() failed";
       NOTIFY_ERROR(PLATFORM_FAILURE);
       return;
     }
   }

   decoder_thread_task_runner_->PostTask(
       FROM_HERE,
       base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ReusePictureBufferTask,
                      base::Unretained(this), picture_buffer_id,
                      std::move(egl_fence)));
 }

 void V4L2SliceVideoDecodeAccelerator::ReusePictureBufferTask(
     int32_t picture_buffer_id,
     std::unique_ptr<gl::GLFenceEGL> egl_fence) {
   DVLOGF(4) << "picture_buffer_id=" << picture_buffer_id;
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (IsDestroyPending())
     return;

   V4L2DecodeSurfaceByPictureBufferId::iterator it =
       surfaces_at_display_.find(picture_buffer_id);
   if (it == surfaces_at_display_.end()) {
     // It's possible that we've already posted a DismissPictureBuffer for this
     // picture, but it has not yet executed when this ReusePictureBuffer was
     // posted to us by the client. In that case just ignore this (we've already
     // dismissed it and accounted for that) and let the fence object get
     // destroyed.
     DVLOGF(3) << "got picture id=" << picture_buffer_id
               << " not in use (anymore?).";
     return;
   }

   OutputRecord& output_record = output_buffer_map_[it->second->output_record()];
   if (!output_record.at_client()) {
     VLOGF(1) << "picture_buffer_id not reusable";
     NOTIFY_ERROR(INVALID_ARGUMENT);
     return;
   }

   --output_record.num_times_sent_to_client;
   // A output buffer might be sent multiple times. We only use the last fence.
   // When the last fence is signaled, all the previous fences must be executed.
   if (!output_record.at_client()) {
     // Take ownership of the EGL fence.
     if (egl_fence)
       surfaces_awaiting_fence_.push(
           std::make_pair(std::move(egl_fence), std::move(it->second)));

     surfaces_at_display_.erase(it);
   }
 }

 void V4L2SliceVideoDecodeAccelerator::Flush() {
   VLOGF(2);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   decoder_thread_task_runner_->PostTask(
       FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::FlushTask,
                                 base::Unretained(this)));
 }

 // Decoder-thread half of Flush(): appends a marker entry (null buffer, id
 // kFlushBufferId) to decoder_input_queue_ and schedules decoding. The flush
 // itself starts when TrySetNewBistreamBuffer() reaches that marker.
 void V4L2SliceVideoDecodeAccelerator::FlushTask() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (IsDestroyPending())
     return;

   auto flush_marker = std::make_unique<BitstreamBufferRef>(
       decode_client_, decode_task_runner_, nullptr, kFlushBufferId);
   decoder_input_queue_.push_back(std::move(flush_marker));

   ScheduleDecodeBufferTaskIfNeeded();
 }

 void V4L2SliceVideoDecodeAccelerator::InitiateFlush() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   TRACE_EVENT_ASYNC_BEGIN0("media,gpu", "V4L2SVDA Flush", this);

   // This will trigger output for all remaining surfaces in the decoder.
   // However, not all of them may be decoded yet (they would be queued
   // in hardware then).
   if (!decoder_->Flush()) {
     DVLOGF(1) << "Failed flushing the decoder.";
     NOTIFY_ERROR(PLATFORM_FAILURE);
     return;
   }

   // Put the decoder in an idle state, ready to resume.
   decoder_->Reset();

   DCHECK(!decoder_flushing_);
   decoder_flushing_ = true;
   NewEventPending();
 }

 bool V4L2SliceVideoDecodeAccelerator::FinishFlush() {
   VLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (!decoder_flushing_)
     return true;

   if (!surfaces_at_device_.empty())
     return false;

   // Even if all output buffers have been returned, the decoder may still
   // be holding on an input device. Wait until the queue is actually drained.
   if (input_queue_->QueuedBuffersCount() != 0)
     return false;

   DCHECK_EQ(state_, kIdle);

   // At this point, all remaining surfaces are decoded and dequeued, and since
   // we have already scheduled output for them in InitiateFlush(), their
   // respective PictureReady calls have been posted (or they have been queued on
   // pending_picture_ready_). So at this time, once we SendPictureReady(),
   // we will have all remaining PictureReady() posted to the client and we
   // can post NotifyFlushDone().
   DCHECK(decoder_display_queue_.empty());

   // Decoder should have already returned all surfaces and all surfaces are
   // out of hardware. There can be no other owners of input buffers.
   DCHECK_EQ(input_queue_->FreeBuffersCount(),
             input_queue_->AllocatedBuffersCount());

   SendPictureReady();

   decoder_flushing_ = false;
   VLOGF(2) << "Flush finished";

   child_task_runner_->PostTask(
       FROM_HERE, base::BindOnce(&Client::NotifyFlushDone, client_));

   TRACE_EVENT_ASYNC_END0("media,gpu", "V4L2SVDA Flush", this);
   return true;
 }

 void V4L2SliceVideoDecodeAccelerator::Reset() {
   VLOGF(2);
   DCHECK(child_task_runner_->BelongsToCurrentThread());

   decoder_thread_task_runner_->PostTask(
       FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ResetTask,
                                 base::Unretained(this)));
 }

 // Decoder-thread half of Reset(): resets the decoder, discards the current
 // and all queued input, marks the reset as in progress and signals a new
 // pending event. Completion is handled by FinishReset().
 void V4L2SliceVideoDecodeAccelerator::ResetTask() {
   VLOGF(2);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   TRACE_EVENT_ASYNC_BEGIN0("media,gpu", "V4L2SVDA Reset", this);

   if (IsDestroyPending())
     return;

   if (decoder_resetting_) {
     // Client bug: a second Reset() is not allowed until NotifyResetDone() has
     // been delivered for the first one.
     NOTREACHED() << "Client should not be requesting multiple Reset()s";
     return;
   }

   // Leave the decoder idle so that it can resume afterwards.
   decoder_->Reset();

   // Throw away the input in flight and everything still queued behind it.
   decoder_current_bitstream_buffer_.reset();
   for (; !decoder_input_queue_.empty(); decoder_input_queue_.pop_front()) {
   }

   decoder_resetting_ = true;
   NewEventPending();
 }

 bool V4L2SliceVideoDecodeAccelerator::FinishReset() {
   VLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   if (!decoder_resetting_)
     return true;

   if (!surfaces_at_device_.empty())
     return false;

   DCHECK_EQ(state_, kIdle);
   DCHECK(!decoder_flushing_);
   SendPictureReady();

   // Drop any pending outputs.
   while (!decoder_display_queue_.empty())
     decoder_display_queue_.pop();

   // At this point we can have no input buffers in the decoder, because we
   // Reset()ed it in ResetTask(), and have not scheduled any new Decode()s
   // having been in kIdle since. We don't have any surfaces in the HW either -
   // we just checked that surfaces_at_device_.empty(), and inputs are tied
   // to surfaces. Since there can be no other owners of input buffers, we can
   // simply mark them all as available.
   DCHECK_EQ(input_queue_->QueuedBuffersCount(), 0u);

   decoder_resetting_ = false;
   VLOGF(2) << "Reset finished";

   child_task_runner_->PostTask(
       FROM_HERE, base::BindOnce(&Client::NotifyResetDone, client_));

   TRACE_EVENT_ASYNC_END0("media,gpu", "V4L2SVDA Reset", this);
   return true;
 }

 // Returns whether the destroy_pending_ event has been signaled.
 bool V4L2SliceVideoDecodeAccelerator::IsDestroyPending() {
   const bool destroy_requested = destroy_pending_.IsSignaled();
   return destroy_requested;
 }

 // Moves the accelerator into kError and, if appropriate, reports |error| to
 // the client. When called off the decoder thread while that thread is
 // running, the call is re-posted to the decoder thread instead.
 void V4L2SliceVideoDecodeAccelerator::SetErrorState(Error error) {
   // state_ may only be touched on the decoder thread, or from any thread when
   // the decoder thread is not running.
   const bool must_hop_to_decoder_thread =
       decoder_thread_.IsRunning() &&
       !decoder_thread_task_runner_->BelongsToCurrentThread();
   if (must_hop_to_decoder_thread) {
     base::OnceClosure set_error_task =
         base::BindOnce(&V4L2SliceVideoDecodeAccelerator::SetErrorState,
                        base::Unretained(this), error);
     decoder_thread_task_runner_->PostTask(FROM_HERE,
                                           std::move(set_error_task));
     return;
   }

   // The client is only told about an error once we are initialized, because
   // the API does not allow it earlier. Repeated errors and errors raised
   // while destroying are not reported.
   switch (state_) {
     case kError:
     case kUninitialized:
     case kDestroying:
       break;
     default:
       NotifyError(error);
       break;
   }

   state_ = kError;
 }

 // Appends |size| bytes starting at |data| to plane 0 of |dec_surface|'s
 // input buffer and updates the plane's bytes-used count accordingly.
 // Returns false, leaving the buffer untouched, if the data does not fit into
 // the plane or the plane has no mapping; returns true otherwise.
 bool V4L2SliceVideoDecodeAccelerator::SubmitSlice(
     const scoped_refptr<V4L2DecodeSurface>& dec_surface,
     const uint8_t* data,
     size_t size) {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   V4L2WritableBufferRef& input_buffer = dec_surface->input_buffer();
   DCHECK(input_buffer.IsValid());

   const size_t plane_size = input_buffer.GetPlaneSize(0);
   const size_t bytes_used = input_buffer.GetPlaneBytesUsed(0);

   // Compare against the remaining space instead of computing
   // |bytes_used + size|: that sum can wrap around for a huge |size| and would
   // then slip past the bounds check.
   if (bytes_used > plane_size || size > plane_size - bytes_used) {
     VLOGF(1) << "Input buffer too small";
     return false;
   }

   uint8_t* mapping = static_cast<uint8_t*>(input_buffer.GetPlaneMapping(0));
   // Fail gracefully rather than copy to a null destination when the plane
   // could not be mapped.
   if (!mapping) {
     VLOGF(1) << "Input buffer is not mapped";
     return false;
   }

   memcpy(mapping + bytes_used, data, size);
   input_buffer.SetPlaneBytesUsed(0, bytes_used + size);

   return true;
 }

 // Enqueues |dec_surface| and then submits it for decoding. A failed Submit()
 // raises PLATFORM_FAILURE.
 void V4L2SliceVideoDecodeAccelerator::DecodeSurface(
     const scoped_refptr<V4L2DecodeSurface>& dec_surface) {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   DVLOGF(3) << "Submitting decode for surface: " << dec_surface->ToString();
   Enqueue(dec_surface);

   const bool submitted = dec_surface->Submit();
   if (submitted)
     return;

   VLOGF(1) << "Error while submitting frame for decoding!";
   NOTIFY_ERROR(PLATFORM_FAILURE);
 }

 // Records |visible_rect| on |dec_surface|, appends the surface with its
 // |bitstream_id| to the display queue and outputs whatever is ready at the
 // head of that queue. The color space argument is unused.
 void V4L2SliceVideoDecodeAccelerator::SurfaceReady(
     const scoped_refptr<V4L2DecodeSurface>& dec_surface,
     int32_t bitstream_id,
     const gfx::Rect& visible_rect,
     const VideoColorSpace& /* color_space */) {
   DVLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   dec_surface->SetVisibleRect(visible_rect);

   decoder_display_queue_.emplace(bitstream_id, dec_surface);
   TryOutputSurfaces();
 }

 // Outputs surfaces from the front of the display queue, in queue order,
 // stopping at the first surface that has not been decoded yet.
 void V4L2SliceVideoDecodeAccelerator::TryOutputSurfaces() {
   while (!decoder_display_queue_.empty()) {
     const auto& head = decoder_display_queue_.front();
     if (!head.second->decoded())
       return;

     // Copy both fields out of the queue entry before popping it, since
     // |head| refers to storage owned by the queue.
     const int32_t bitstream_id = head.first;
     scoped_refptr<V4L2DecodeSurface> dec_surface = head.second;
     decoder_display_queue_.pop();

     OutputSurface(bitstream_id, dec_surface);
   }
 }

 void V4L2SliceVideoDecodeAccelerator::OutputSurface(
     int32_t bitstream_id,
     const scoped_refptr<V4L2DecodeSurface>& dec_surface) {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   OutputRecord& output_record =
       output_buffer_map_[dec_surface->output_record()];

   if (!output_record.at_client()) {
     bool inserted =
         surfaces_at_display_
             .insert(std::make_pair(output_record.picture_id, dec_surface))
             .second;
     DCHECK(inserted);
   } else {
     // The surface is already sent to client, and not returned back yet.
     DCHECK(surfaces_at_display_.find(output_record.picture_id) !=
            surfaces_at_display_.end());
     CHECK(surfaces_at_display_[output_record.picture_id].get() ==
           dec_surface.get());
   }

   DCHECK_NE(output_record.picture_id, -1);
   ++output_record.num_times_sent_to_client;

   // TODO(hubbe): Insert correct color space. http://crbug.com/647725
   Picture picture(output_record.picture_id, bitstream_id,
                   dec_surface->visible_rect(), gfx::ColorSpace(),
                   true /* allow_overlay */);
   DVLOGF(4) << dec_surface->ToString()
             << ", bitstream_id: " << picture.bitstream_buffer_id()
             << ", picture_id: " << picture.picture_buffer_id()
             << ", visible_rect: " << picture.visible_rect().ToString();
   pending_picture_ready_.push(PictureRecord(output_record.cleared, picture));
   SendPictureReady();
   output_record.cleared = true;
 }

 void V4L2SliceVideoDecodeAccelerator::CheckGLFences() {
   DVLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   while (!surfaces_awaiting_fence_.empty() &&
          surfaces_awaiting_fence_.front().first->HasCompleted()) {
     // Buffer at the front of the queue goes back to V4L2Queue's free list
     // and can be reused.
     surfaces_awaiting_fence_.pop();
   }

   // If we have no free buffers available, then preemptively schedule a
   // call to DecodeBufferTask() in a short time, otherwise we may starve out
   // of buffers because fences will not call back into us once they are
   // signaled. The delay chosen roughly corresponds to the time a frame is
   // displayed, which should be optimal in most cases.
   if (output_queue_->FreeBuffersCount() == 0) {
     constexpr int64_t kRescheduleDelayMs = 17;

     decoder_thread_.task_runner()->PostDelayedTask(
         FROM_HERE,
         base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DecodeBufferTask,
                        base::Unretained(this)),
         base::TimeDelta::FromMilliseconds(kRescheduleDelayMs));
   }
 }

 // Creates a decode surface backed by one free input buffer and one free
 // output buffer.
 //
 // Returns nullptr when either queue has no free buffer. Also returns nullptr,
 // after putting the decoder into the PLATFORM_FAILURE error state, when a
 // request-backed surface cannot be created.
 scoped_refptr<V4L2DecodeSurface>
 V4L2SliceVideoDecodeAccelerator::CreateSurface() {
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK_EQ(state_, kDecoding);
   TRACE_COUNTER_ID2(
       "media,gpu", "V4L2 input buffers", this, "free",
       input_queue_->FreeBuffersCount(), "in use",
       input_queue_->AllocatedBuffersCount() - input_queue_->FreeBuffersCount());
   // "in use" is the number of allocated buffers that are not free, mirroring
   // the input queue counter above.
   TRACE_COUNTER_ID2("media,gpu", "V4L2 output buffers", this, "free",
                     output_queue_->FreeBuffersCount(), "in use",
                     output_queue_->AllocatedBuffersCount() -
                         output_queue_->FreeBuffersCount());
   TRACE_COUNTER_ID2("media,gpu", "V4L2 output buffers", this, "at client",
                     GetNumOfOutputRecordsAtClient(), "at device",
                     GetNumOfOutputRecordsAtDevice());

   // Release some output buffers if their fence has been signaled.
   CheckGLFences();

   if (input_queue_->FreeBuffersCount() == 0 ||
       output_queue_->FreeBuffersCount() == 0)
     return nullptr;

   V4L2WritableBufferRef input_buffer = input_queue_->GetFreeBuffer();
   DCHECK(input_buffer.IsValid());
   // All buffers that are returned to the output free queue have their GL
   // fence signaled, so we can use them directly.
   V4L2WritableBufferRef output_buffer = output_queue_->GetFreeBuffer();
   DCHECK(output_buffer.IsValid());

   // Remember the buffer ids now: the buffer references are moved into the
   // surface below and must not be used afterwards.
   int input = input_buffer.BufferId();
   int output = output_buffer.BufferId();

   scoped_refptr<V4L2DecodeSurface> dec_surface;

   if (supports_requests_) {
     DCHECK(!requests_.empty());
     // Here we just borrow the older request to use it, before
     // immediately putting it back at the back of the queue.
     base::ScopedFD request = std::move(requests_.front());
     requests_.pop();
     auto ret = V4L2RequestDecodeSurface::Create(std::move(input_buffer),
                                                 std::move(output_buffer),
                                                 nullptr, request.get());
     requests_.push(std::move(request));

     // Not being able to create the decode surface at this stage is a
     // fatal error.
     if (!ret) {
       NOTIFY_ERROR(PLATFORM_FAILURE);
       return nullptr;
     }

     dec_surface = std::move(ret).value();
   } else {
     dec_surface = new V4L2ConfigStoreDecodeSurface(
         std::move(input_buffer), std::move(output_buffer), nullptr);
   }

   DVLOGF(4) << "Created surface " << input << " -> " << output;
   return dec_surface;
 }

 // Drains |pending_picture_ready_| in order for as long as the picture at the
 // front can be delivered without reordering. Cleared pictures go to the
 // decode task runner when no clearing is in flight; pictures that are not
 // yet cleared, or any picture while resetting, flushing or changing the
 // surface set, go to the child task runner.
 void V4L2SliceVideoDecodeAccelerator::SendPictureReady() {
   DVLOGF(4);
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());

   const bool must_send_all =
       decoder_resetting_ || decoder_flushing_ || surface_set_change_pending_;

   while (!pending_picture_ready_.empty()) {
     const auto& head = pending_picture_ready_.front();
     const bool already_cleared = head.cleared;
     const Picture& picture = head.picture;

     if (already_cleared && picture_clearing_count_ == 0) {
       DVLOGF(4) << "Posting picture ready to decode task runner for: "
                 << picture.picture_buffer_id();
       // This picture is cleared. It can be posted to a thread different than
       // the main GPU thread to reduce latency. This should be the case after
       // all pictures are cleared at the beginning.
       decode_task_runner_->PostTask(
           FROM_HERE,
           base::BindOnce(&Client::PictureReady, decode_client_, picture));
       pending_picture_ready_.pop();
       continue;
     }

     if (already_cleared && !must_send_all) {
       // This picture is cleared. But some pictures are about to be cleared on
       // the child thread. To preserve the order, do not send this until those
       // pictures are cleared.
       break;
     }

     DVLOGF(4) << "cleared=" << already_cleared
               << ", decoder_resetting_=" << decoder_resetting_
               << ", decoder_flushing_=" << decoder_flushing_
               << ", surface_set_change_pending_="
               << surface_set_change_pending_
               << ", picture_clearing_count_=" << picture_clearing_count_;
     DVLOGF(4) << "Posting picture ready to GPU for: "
               << picture.picture_buffer_id();
     // If the picture is not cleared, post it to the child thread because it
     // has to be cleared in the child thread. A picture only needs to be
     // cleared once. If the decoder is resetting or flushing or changing
     // resolution, send all pictures to ensure PictureReady arrive before
     // reset done, flush done, or picture dismissed.
     child_task_runner_->PostTaskAndReply(
         FROM_HERE, base::BindOnce(&Client::PictureReady, client_, picture),
         // Unretained is safe. If Client::PictureReady gets to run, |this| is
         // alive. Destroy() will wait the decode thread to finish.
         base::BindOnce(&V4L2SliceVideoDecodeAccelerator::PictureCleared,
                        base::Unretained(this)));
     ++picture_clearing_count_;
     pending_picture_ready_.pop();
   }
 }

 // Reply half of the PostTaskAndReply() issued by SendPictureReady(): accounts
 // for one picture having been handed to the client on the child thread, then
 // retries sending whatever is still pending.
 void V4L2SliceVideoDecodeAccelerator::PictureCleared() {
   DVLOGF(4) << "clearing count=" << picture_clearing_count_;
   DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread());
   DCHECK_GT(picture_clearing_count_, 0);

   --picture_clearing_count_;
   SendPictureReady();
 }

 // Stores the client and task runner that SendPictureReady() uses to deliver
 // already-cleared pictures. Always returns true.
 bool V4L2SliceVideoDecodeAccelerator::TryToSetupDecodeOnSeparateThread(
     const base::WeakPtr<Client>& decode_client,
     const scoped_refptr<base::SingleThreadTaskRunner>& decode_task_runner) {
   decode_task_runner_ = decode_task_runner;
   decode_client_ = decode_client;

   return true;
 }

 // static
 // Returns the decode profiles that a newly created V4L2 device reports for
 // |supported_input_fourccs_|, or an empty list if no device could be created.
 VideoDecodeAccelerator::SupportedProfiles
 V4L2SliceVideoDecodeAccelerator::GetSupportedProfiles() {
   scoped_refptr<V4L2Device> device = V4L2Device::Create();
   if (device) {
     return device->GetSupportedDecodeProfiles(
         base::size(supported_input_fourccs_), supported_input_fourccs_);
   }

   return SupportedProfiles();
 }

 // Returns the number of buffers the output queue reports as queued. Must be
 // called on the decoder thread.
 size_t V4L2SliceVideoDecodeAccelerator::GetNumOfOutputRecordsAtDevice() const {
   DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread());

   const size_t queued_count = output_queue_->QueuedBuffersCount();
   return queued_count;
 }

 // Returns how many entries of |output_buffer_map_| report at_client(). Must
 // be called on the decoder thread.
 size_t V4L2SliceVideoDecodeAccelerator::GetNumOfOutputRecordsAtClient() const {
   DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread());

   size_t at_client_count = 0;
   for (const auto& record : output_buffer_map_) {
     if (record.at_client())
       ++at_client_count;
   }
   return at_client_count;
 }

 // base::trace_event::MemoryDumpProvider implementation.
 //
 // Adds one allocator dump for this decoder to |pmd|, reporting the buffer
 // count, memory type and memory usage of the input and output queues as well
 // as their combined size. Output buffer sizes are only accounted for in
 // ALLOCATE output mode, where they are queried from the device.
 //
 // Returns true on success, or false if querying an output buffer fails.
 bool V4L2SliceVideoDecodeAccelerator::OnMemoryDump(
     const base::trace_event::MemoryDumpArgs& args,
     base::trace_event::ProcessMemoryDump* pmd) {
   // OnMemoryDump() must be performed on |decoder_thread_|.
   DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread());

   // VIDEO_OUTPUT queue's memory usage.
   const size_t input_queue_buffers_count =
       input_queue_->AllocatedBuffersCount();
   const size_t input_queue_memory_usage = input_queue_->GetMemoryUsage();
   std::string input_queue_buffers_memory_type =
       V4L2Device::V4L2MemoryToString(V4L2_MEMORY_MMAP);

   // VIDEO_CAPTURE queue's memory usage.
   const size_t output_queue_buffers_count = output_buffer_map_.size();
   size_t output_queue_memory_usage = 0;
   std::string output_queue_buffers_memory_type =
       output_mode_ == Config::OutputMode::ALLOCATE
           ? V4L2Device::V4L2MemoryToString(V4L2_MEMORY_MMAP)
           : V4L2Device::V4L2MemoryToString(V4L2_MEMORY_DMABUF);
   if (output_mode_ == Config::OutputMode::ALLOCATE) {
     // Call VIDIOC_QUERYBUF here because the lengths of the buffers on the
     // VIDEO_CAPTURE queue are not recorded anywhere in this class.
     for (uint32_t index = 0; index < output_buffer_map_.size(); ++index) {
       struct v4l2_buffer v4l2_buffer = {};
       // Zero-initialized so that no indeterminate stack data is handed to
       // the ioctl.
       struct v4l2_plane v4l2_planes[VIDEO_MAX_PLANES] = {};
       // A plane count equal to the array size still fits in the array.
       DCHECK_LE(output_planes_count_, base::size(v4l2_planes));
       // Never describe, or later read, more planes than the array holds.
       const size_t planes_count =
           std::min(output_planes_count_, base::size(v4l2_planes));
       v4l2_buffer.m.planes = v4l2_planes;
       v4l2_buffer.length = planes_count;
       v4l2_buffer.index = index;
       v4l2_buffer.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
       v4l2_buffer.memory = V4L2_MEMORY_MMAP;
       IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYBUF, &v4l2_buffer);
       for (size_t i = 0; i < planes_count; ++i)
         output_queue_memory_usage += v4l2_planes[i].length;
     }
   }

   const size_t total_usage =
       input_queue_memory_usage + output_queue_memory_usage;

   using ::base::trace_event::MemoryAllocatorDump;

   // The dump name embeds the address of this instance.
   auto dump_name = base::StringPrintf("gpu/v4l2/slice_decoder/0x%" PRIxPTR,
                                       reinterpret_cast<uintptr_t>(this));

   MemoryAllocatorDump* dump = pmd->CreateAllocatorDump(dump_name);
   dump->AddScalar(MemoryAllocatorDump::kNameSize,
                   MemoryAllocatorDump::kUnitsBytes,
                   static_cast<uint64_t>(total_usage));
   dump->AddScalar("input_queue_memory_usage", MemoryAllocatorDump::kUnitsBytes,
                   static_cast<uint64_t>(input_queue_memory_usage));
   dump->AddScalar("input_queue_buffers_count",
                   MemoryAllocatorDump::kUnitsObjects,
                   static_cast<uint64_t>(input_queue_buffers_count));
   dump->AddString("input_queue_buffers_memory_type", "",
                   input_queue_buffers_memory_type);
   dump->AddScalar("output_queue_memory_usage", MemoryAllocatorDump::kUnitsBytes,
                   static_cast<uint64_t>(output_queue_memory_usage));
   dump->AddScalar("output_queue_buffers_count",
                   MemoryAllocatorDump::kUnitsObjects,
                   static_cast<uint64_t>(output_queue_buffers_count));
   dump->AddString("output_queue_buffers_memory_type", "",
                   output_queue_buffers_memory_type);
   return true;
 }

 }  // namespace media