| // Copyright 2015 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "media/gpu/v4l2/v4l2_slice_video_decode_accelerator.h" |
| |
| #include <errno.h> |
| #include <fcntl.h> |
| #include <linux/media.h> |
| #include <linux/videodev2.h> |
| #include <poll.h> |
| #include <string.h> |
| #include <sys/eventfd.h> |
| #include <sys/ioctl.h> |
| #include <sys/mman.h> |
| |
| #include <memory> |
| |
| #include "base/bind.h" |
| #include "base/bind_helpers.h" |
| #include "base/callback.h" |
| #include "base/callback_helpers.h" |
| #include "base/command_line.h" |
| #include "base/memory/ptr_util.h" |
| #include "base/numerics/safe_conversions.h" |
| #include "base/single_thread_task_runner.h" |
| #include "base/stl_util.h" |
| #include "base/strings/stringprintf.h" |
| #include "base/threading/thread_task_runner_handle.h" |
| #include "base/time/time.h" |
| #include "base/trace_event/memory_dump_manager.h" |
| #include "base/trace_event/trace_event.h" |
| #include "media/base/bind_to_current_loop.h" |
| #include "media/base/media_switches.h" |
| #include "media/base/unaligned_shared_memory.h" |
| #include "media/base/video_types.h" |
| #include "media/gpu/macros.h" |
| #include "media/gpu/v4l2/v4l2_decode_surface.h" |
| #include "media/gpu/v4l2/v4l2_h264_accelerator.h" |
| #include "media/gpu/v4l2/v4l2_vp8_accelerator.h" |
| #include "media/gpu/v4l2/v4l2_vp9_accelerator.h" |
| #include "ui/gl/gl_context.h" |
| #include "ui/gl/gl_image.h" |
| #include "ui/gl/scoped_binders.h" |
| |
| #define NOTIFY_ERROR(x) \ |
| do { \ |
| VLOGF(1) << "Setting error state: " << x; \ |
| SetErrorState(x); \ |
| } while (0) |
| |
| #define IOCTL_OR_ERROR_RETURN_VALUE(type, arg, value, type_str) \ |
| do { \ |
| if (device_->Ioctl(type, arg) != 0) { \ |
| VPLOGF(1) << "ioctl() failed: " << type_str; \ |
| return value; \ |
| } \ |
| } while (0) |
| |
| #define IOCTL_OR_ERROR_RETURN(type, arg) \ |
| IOCTL_OR_ERROR_RETURN_VALUE(type, arg, ((void)0), #type) |
| |
| #define IOCTL_OR_ERROR_RETURN_FALSE(type, arg) \ |
| IOCTL_OR_ERROR_RETURN_VALUE(type, arg, false, #type) |
| |
| #define IOCTL_OR_LOG_ERROR(type, arg) \ |
| do { \ |
| if (device_->Ioctl(type, arg) != 0) \ |
| VPLOGF(1) << "ioctl() failed: " << #type; \ |
| } while (0) |
| |
| namespace media { |
| |
| // static |
| const uint32_t V4L2SliceVideoDecodeAccelerator::supported_input_fourccs_[] = { |
| V4L2_PIX_FMT_H264_SLICE, V4L2_PIX_FMT_VP8_FRAME, V4L2_PIX_FMT_VP9_FRAME, |
| }; |
| |
| V4L2SliceVideoDecodeAccelerator::OutputRecord::OutputRecord() |
| : at_client(false), |
| num_times_sent_to_client(0), |
| picture_id(-1), |
| texture_id(0), |
| cleared(false) {} |
| |
| V4L2SliceVideoDecodeAccelerator::OutputRecord::OutputRecord(OutputRecord&&) = |
| default; |
| |
| V4L2SliceVideoDecodeAccelerator::OutputRecord::~OutputRecord() = default; |
| |
| struct V4L2SliceVideoDecodeAccelerator::BitstreamBufferRef { |
| BitstreamBufferRef( |
| base::WeakPtr<VideoDecodeAccelerator::Client>& client, |
| const scoped_refptr<base::SingleThreadTaskRunner>& client_task_runner, |
| scoped_refptr<DecoderBuffer> buffer, |
| int32_t input_id); |
| ~BitstreamBufferRef(); |
| |
| const base::WeakPtr<VideoDecodeAccelerator::Client> client; |
| const scoped_refptr<base::SingleThreadTaskRunner> client_task_runner; |
| scoped_refptr<DecoderBuffer> buffer; |
| off_t bytes_used; |
| const int32_t input_id; |
| }; |
| |
| V4L2SliceVideoDecodeAccelerator::BitstreamBufferRef::BitstreamBufferRef( |
| base::WeakPtr<VideoDecodeAccelerator::Client>& client, |
| const scoped_refptr<base::SingleThreadTaskRunner>& client_task_runner, |
| scoped_refptr<DecoderBuffer> buffer, |
| int32_t input_id) |
| : client(client), |
| client_task_runner(client_task_runner), |
| buffer(std::move(buffer)), |
| bytes_used(0), |
| input_id(input_id) {} |
| |
| V4L2SliceVideoDecodeAccelerator::BitstreamBufferRef::~BitstreamBufferRef() { |
| if (input_id >= 0) { |
| DVLOGF(5) << "returning input_id: " << input_id; |
| client_task_runner->PostTask( |
| FROM_HERE, |
| base::BindOnce( |
| &VideoDecodeAccelerator::Client::NotifyEndOfBitstreamBuffer, client, |
| input_id)); |
| } |
| } |
| |
| V4L2SliceVideoDecodeAccelerator::PictureRecord::PictureRecord( |
| bool cleared, |
| const Picture& picture) |
| : cleared(cleared), picture(picture) {} |
| |
| V4L2SliceVideoDecodeAccelerator::PictureRecord::~PictureRecord() {} |
| |
| V4L2SliceVideoDecodeAccelerator::V4L2SliceVideoDecodeAccelerator( |
| const scoped_refptr<V4L2Device>& device, |
| EGLDisplay egl_display, |
| const BindGLImageCallback& bind_image_cb, |
| const MakeGLContextCurrentCallback& make_context_current_cb) |
| : input_planes_count_(0), |
| output_planes_count_(0), |
| child_task_runner_(base::ThreadTaskRunnerHandle::Get()), |
| device_(device), |
| decoder_thread_("V4L2SliceVideoDecodeAcceleratorThread"), |
| device_poll_thread_("V4L2SliceVideoDecodeAcceleratorDevicePollThread"), |
| video_profile_(VIDEO_CODEC_PROFILE_UNKNOWN), |
| input_format_fourcc_(0), |
| output_format_fourcc_(0), |
| state_(kUninitialized), |
| output_mode_(Config::OutputMode::ALLOCATE), |
| decoder_flushing_(false), |
| decoder_resetting_(false), |
| surface_set_change_pending_(false), |
| picture_clearing_count_(0), |
| egl_display_(egl_display), |
| bind_image_cb_(bind_image_cb), |
| make_context_current_cb_(make_context_current_cb), |
| weak_this_factory_(this) { |
| weak_this_ = weak_this_factory_.GetWeakPtr(); |
| } |
| |
| V4L2SliceVideoDecodeAccelerator::~V4L2SliceVideoDecodeAccelerator() { |
| DVLOGF(2); |
| |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| DCHECK(!decoder_thread_.IsRunning()); |
| DCHECK(!device_poll_thread_.IsRunning()); |
| |
| DCHECK(requests_.empty()); |
| DCHECK(output_buffer_map_.empty()); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::NotifyError(Error error) { |
| // Notifying the client should only happen from the client's thread. |
| if (!child_task_runner_->BelongsToCurrentThread()) { |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::NotifyError, |
| weak_this_, error)); |
| return; |
| } |
| |
| // Notify the decoder's client an error has occurred. |
| if (client_) { |
| client_->NotifyError(error); |
| client_ptr_factory_.reset(); |
| } |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::Initialize(const Config& config, |
| Client* client) { |
| VLOGF(2) << "profile: " << config.profile; |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| DCHECK_EQ(state_, kUninitialized); |
| |
| if (config.is_encrypted()) { |
| NOTREACHED() << "Encrypted streams are not supported for this VDA"; |
| return false; |
| } |
| |
| if (config.output_mode != Config::OutputMode::ALLOCATE && |
| config.output_mode != Config::OutputMode::IMPORT) { |
| NOTREACHED() << "Only ALLOCATE and IMPORT OutputModes are supported"; |
| return false; |
| } |
| |
| client_ptr_factory_.reset( |
| new base::WeakPtrFactory<VideoDecodeAccelerator::Client>(client)); |
| client_ = client_ptr_factory_->GetWeakPtr(); |
| // If we haven't been set up to decode on separate thread via |
| // TryToSetupDecodeOnSeparateThread(), use the main thread/client for |
| // decode tasks. |
| if (!decode_task_runner_) { |
| decode_task_runner_ = child_task_runner_; |
| DCHECK(!decode_client_); |
| decode_client_ = client_; |
| } |
| |
| // We need the context to be initialized to query extensions. |
| if (make_context_current_cb_) { |
| if (egl_display_ == EGL_NO_DISPLAY) { |
| VLOGF(1) << "could not get EGLDisplay"; |
| return false; |
| } |
| |
| if (!make_context_current_cb_.Run()) { |
| VLOGF(1) << "could not make context current"; |
| return false; |
| } |
| |
| if (!gl::g_driver_egl.ext.b_EGL_KHR_fence_sync) { |
| VLOGF(1) << "context does not have EGL_KHR_fence_sync"; |
| return false; |
| } |
| } else { |
| DVLOGF(2) << "No GL callbacks provided, initializing without GL support"; |
| } |
| |
| video_profile_ = config.profile; |
| |
| input_planes_count_ = 1; |
| |
| input_format_fourcc_ = |
| V4L2Device::VideoCodecProfileToV4L2PixFmt(video_profile_, true); |
| |
| if (!device_->Open(V4L2Device::Type::kDecoder, input_format_fourcc_)) { |
| VLOGF(1) << "Failed to open device for profile: " << config.profile |
| << " fourcc: " << FourccToString(input_format_fourcc_); |
| return false; |
| } |
| |
| struct v4l2_requestbuffers reqbufs; |
| memset(&reqbufs, 0, sizeof(reqbufs)); |
| reqbufs.count = 0; |
| reqbufs.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE; |
| reqbufs.memory = V4L2_MEMORY_MMAP; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_REQBUFS, &reqbufs); |
| if (reqbufs.capabilities & V4L2_BUF_CAP_SUPPORTS_REQUESTS) { |
| supports_requests_ = true; |
| VLOGF(1) << "Using request API"; |
| DCHECK(!media_fd_.is_valid()); |
| // Let's try to open the media device |
| // TODO(crbug.com/985230): remove this hardcoding, replace with V4L2Device |
| // integration. |
| int media_fd = open("/dev/media-dec0", O_RDWR, 0); |
| if (media_fd < 0) { |
| VPLOGF(1) << "Failed to open media device: "; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| } |
| media_fd_ = base::ScopedFD(media_fd); |
| } else { |
| VLOGF(1) << "Using config store"; |
| } |
| |
| if (video_profile_ >= H264PROFILE_MIN && video_profile_ <= H264PROFILE_MAX) { |
| decoder_.reset(new H264Decoder( |
| std::make_unique<V4L2H264Accelerator>(this, device_.get()))); |
| } else if (video_profile_ >= VP8PROFILE_MIN && |
| video_profile_ <= VP8PROFILE_MAX) { |
| decoder_.reset(new VP8Decoder( |
| std::make_unique<V4L2VP8Accelerator>(this, device_.get()))); |
| } else if (video_profile_ >= VP9PROFILE_MIN && |
| video_profile_ <= VP9PROFILE_MAX) { |
| decoder_.reset(new VP9Decoder( |
| std::make_unique<V4L2VP9Accelerator>(this, device_.get()))); |
| } else { |
| NOTREACHED() << "Unsupported profile " << GetProfileName(video_profile_); |
| return false; |
| } |
| |
| // Capabilities check. |
| struct v4l2_capability caps; |
| const __u32 kCapsRequired = V4L2_CAP_VIDEO_M2M_MPLANE | V4L2_CAP_STREAMING; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYCAP, &caps); |
| if ((caps.capabilities & kCapsRequired) != kCapsRequired) { |
| VLOGF(1) << "ioctl() failed: VIDIOC_QUERYCAP" |
| << ", caps check failed: 0x" << std::hex << caps.capabilities; |
| return false; |
| } |
| |
| if (!SetupFormats()) |
| return false; |
| |
| if (!decoder_thread_.Start()) { |
| VLOGF(1) << "device thread failed to start"; |
| return false; |
| } |
| decoder_thread_task_runner_ = decoder_thread_.task_runner(); |
| base::trace_event::MemoryDumpManager::GetInstance()->RegisterDumpProvider( |
| this, "media::V4l2SliceVideoDecodeAccelerator", |
| decoder_thread_task_runner_); |
| |
| state_ = kInitialized; |
| output_mode_ = config.output_mode; |
| |
| // InitializeTask will NOTIFY_ERROR on failure. |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::InitializeTask, |
| base::Unretained(this))); |
| |
| VLOGF(2) << "V4L2SliceVideoDecodeAccelerator initialized"; |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::InitializeTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK_EQ(state_, kInitialized); |
| TRACE_EVENT0("media,gpu", "V4L2SVDA::InitializeTask"); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| input_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE); |
| output_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE); |
| if (!input_queue_ || !output_queue_) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| if (!CreateInputBuffers()) |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| |
| // Output buffers will be created once decoder gives us information |
| // about their size and required count. |
| state_ = kDecoding; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Destroy() { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| // Signal any waiting/sleeping tasks to early exit as soon as possible to |
| // avoid waiting too long for the decoder_thread_ to Stop(). |
| destroy_pending_.Signal(); |
| |
| if (decoder_thread_.IsRunning()) { |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DestroyTask, |
| base::Unretained(this))); |
| |
| // Wait for tasks to finish/early-exit. |
| decoder_thread_.Stop(); |
| } |
| |
| delete this; |
| VLOGF(2) << "Destroyed"; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DestroyTask() { |
| DVLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| TRACE_EVENT0("media,gpu", "V4L2SVDA::DestroyTask"); |
| |
| state_ = kDestroying; |
| |
| decoder_->Reset(); |
| |
| decoder_current_bitstream_buffer_.reset(); |
| while (!decoder_input_queue_.empty()) |
| decoder_input_queue_.pop_front(); |
| |
| // Stop streaming and the device_poll_thread_. |
| StopDevicePoll(); |
| |
| DestroyInputBuffers(); |
| DestroyOutputs(false); |
| |
| media_fd_.reset(); |
| |
| input_queue_ = nullptr; |
| output_queue_ = nullptr; |
| |
| base::trace_event::MemoryDumpManager::GetInstance()->UnregisterDumpProvider( |
| this); |
| |
| DCHECK(surfaces_at_device_.empty()); |
| DCHECK(surfaces_at_display_.empty()); |
| DCHECK(decoder_display_queue_.empty()); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::SetupFormats() { |
| DCHECK_EQ(state_, kUninitialized); |
| |
| size_t input_size; |
| gfx::Size max_resolution, min_resolution; |
| device_->GetSupportedResolution(input_format_fourcc_, &min_resolution, |
| &max_resolution); |
| if (max_resolution.width() > 1920 && max_resolution.height() > 1088) |
| input_size = kInputBufferMaxSizeFor4k; |
| else |
| input_size = kInputBufferMaxSizeFor1080p; |
| |
| struct v4l2_fmtdesc fmtdesc; |
| memset(&fmtdesc, 0, sizeof(fmtdesc)); |
| fmtdesc.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE; |
| bool is_format_supported = false; |
| while (device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0) { |
| if (fmtdesc.pixelformat == input_format_fourcc_) { |
| is_format_supported = true; |
| break; |
| } |
| ++fmtdesc.index; |
| } |
| |
| if (!is_format_supported) { |
| DVLOGF(1) << "Input fourcc " << input_format_fourcc_ |
| << " not supported by device."; |
| return false; |
| } |
| |
| struct v4l2_format format; |
| memset(&format, 0, sizeof(format)); |
| format.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE; |
| format.fmt.pix_mp.pixelformat = input_format_fourcc_; |
| format.fmt.pix_mp.plane_fmt[0].sizeimage = input_size; |
| format.fmt.pix_mp.num_planes = input_planes_count_; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format); |
| DCHECK_EQ(format.fmt.pix_mp.pixelformat, input_format_fourcc_); |
| |
| // We have to set up the format for output, because the driver may not allow |
| // changing it once we start streaming; whether it can support our chosen |
| // output format or not may depend on the input format. |
| memset(&fmtdesc, 0, sizeof(fmtdesc)); |
| fmtdesc.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| output_format_fourcc_ = 0; |
| while (device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0) { |
| if (device_->CanCreateEGLImageFrom(fmtdesc.pixelformat)) { |
| output_format_fourcc_ = fmtdesc.pixelformat; |
| break; |
| } |
| ++fmtdesc.index; |
| } |
| |
| if (output_format_fourcc_ == 0) { |
| VLOGF(1) << "Could not find a usable output format"; |
| return false; |
| } |
| |
| // Only set fourcc for output; resolution, etc., will come from the |
| // driver once it extracts it from the stream. |
| memset(&format, 0, sizeof(format)); |
| format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| format.fmt.pix_mp.pixelformat = output_format_fourcc_; |
| format.fmt.pix_mp.num_planes = V4L2Device::GetNumPlanesOfV4L2PixFmt(output_format_fourcc_); |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format); |
| DCHECK_EQ(format.fmt.pix_mp.pixelformat, output_format_fourcc_); |
| |
| DCHECK_EQ(V4L2Device::GetNumPlanesOfV4L2PixFmt(output_format_fourcc_), static_cast<size_t>(format.fmt.pix_mp.num_planes)); |
| output_planes_count_ = format.fmt.pix_mp.num_planes; |
| |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::CreateInputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK(!input_queue_->IsStreaming()); |
| |
| if (input_queue_->AllocateBuffers(kNumInputBuffers, V4L2_MEMORY_MMAP) < |
| kNumInputBuffers) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| // The remainder of this method only applies if requests are used. |
| if (!supports_requests_) |
| return true; |
| |
| DCHECK(requests_.empty()); |
| |
| DCHECK(media_fd_.is_valid()); |
| for (size_t i = 0; i < input_queue_->AllocatedBuffersCount(); i++) { |
| int request_fd; |
| |
| int ret = HANDLE_EINTR( |
| ioctl(media_fd_.get(), MEDIA_IOC_REQUEST_ALLOC, &request_fd)); |
| if (ret < 0) { |
| VPLOGF(1) << "Failed to create request: "; |
| return false; |
| } |
| |
| requests_.push(base::ScopedFD(request_fd)); |
| } |
| DCHECK_EQ(requests_.size(), input_queue_->AllocatedBuffersCount()); |
| |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::CreateOutputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK(!output_queue_->IsStreaming()); |
| DCHECK(output_buffer_map_.empty()); |
| DCHECK(surfaces_at_display_.empty()); |
| DCHECK(surfaces_at_device_.empty()); |
| |
| gfx::Size pic_size = decoder_->GetPicSize(); |
| size_t num_pictures = decoder_->GetRequiredNumOfPictures(); |
| |
| DCHECK_GT(num_pictures, 0u); |
| DCHECK(!pic_size.IsEmpty()); |
| |
| // Since VdaVideoDeecoder doesn't allocate PictureBuffer with size adjusted by |
| // itself, we have to adjust here. |
| struct v4l2_format format; |
| memset(&format, 0, sizeof(format)); |
| format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| format.fmt.pix_mp.pixelformat = output_format_fourcc_; |
| format.fmt.pix_mp.width = pic_size.width(); |
| format.fmt.pix_mp.height = pic_size.height(); |
| format.fmt.pix_mp.num_planes = output_planes_count_; |
| |
| if (device_->Ioctl(VIDIOC_S_FMT, &format) != 0) { |
| VPLOGF(1) << "Failed setting format to: " << output_format_fourcc_; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| coded_size_.SetSize(base::checked_cast<int>(format.fmt.pix_mp.width), |
| base::checked_cast<int>(format.fmt.pix_mp.height)); |
| DCHECK_EQ(coded_size_.width() % 16, 0); |
| DCHECK_EQ(coded_size_.height() % 16, 0); |
| |
| if (!gfx::Rect(coded_size_).Contains(gfx::Rect(pic_size))) { |
| VLOGF(1) << "Got invalid adjusted coded size: " << coded_size_.ToString(); |
| return false; |
| } |
| |
| DVLOGF(3) << "buffer_count=" << num_pictures |
| << ", pic size=" << pic_size.ToString() |
| << ", coded size=" << coded_size_.ToString(); |
| |
| VideoPixelFormat pixel_format = |
| V4L2Device::V4L2PixFmtToVideoPixelFormat(output_format_fourcc_); |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce( |
| &VideoDecodeAccelerator::Client::ProvidePictureBuffersWithVisibleRect, |
| client_, num_pictures, pixel_format, 1, coded_size_, |
| decoder_->GetVisibleRect(), device_->GetTextureTarget())); |
| |
| // Go into kAwaitingPictureBuffers to prevent us from doing any more decoding |
| // or event handling while we are waiting for AssignPictureBuffers(). Not |
| // having Pictures available would not have prevented us from making decoding |
| // progress entirely e.g. in the case of H.264 where we could further decode |
| // non-slice NALUs and could even get another resolution change before we were |
| // done with this one. After we get the buffers, we'll go back into kIdle and |
| // kick off further event processing, and eventually go back into kDecoding |
| // once no more events are pending (if any). |
| state_ = kAwaitingPictureBuffers; |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DestroyInputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread() || |
| !decoder_thread_.IsRunning()); |
| |
| if (!input_queue_) |
| return; |
| |
| DCHECK(!input_queue_->IsStreaming()); |
| |
| input_queue_->DeallocateBuffers(); |
| |
| if (supports_requests_) |
| requests_ = {}; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DismissPictures( |
| const std::vector<int32_t>& picture_buffer_ids, |
| base::WaitableEvent* done) { |
| DVLOGF(3); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| for (auto picture_buffer_id : picture_buffer_ids) { |
| DVLOGF(4) << "dismissing PictureBuffer id=" << picture_buffer_id; |
| client_->DismissPictureBuffer(picture_buffer_id); |
| } |
| |
| done->Signal(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DevicePollTask(bool poll_device) { |
| DVLOGF(3); |
| DCHECK(device_poll_thread_.task_runner()->BelongsToCurrentThread()); |
| TRACE_EVENT0("media,gpu", "V4L2SVDA::DevicePollTask"); |
| bool event_pending; |
| if (!device_->Poll(poll_device, &event_pending)) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| // All processing should happen on ServiceDeviceTask(), since we shouldn't |
| // touch encoder state from this thread. |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ServiceDeviceTask, |
| base::Unretained(this))); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ServiceDeviceTask() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| // ServiceDeviceTask() should only ever be scheduled from DevicePollTask(). |
| |
| Dequeue(); |
| SchedulePollIfNeeded(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::SchedulePollIfNeeded() { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (!device_poll_thread_.IsRunning()) { |
| DVLOGF(4) << "Device poll thread stopped, will not schedule poll"; |
| return; |
| } |
| |
| DCHECK(input_queue_->IsStreaming() || output_queue_->IsStreaming()); |
| |
| if (input_queue_->QueuedBuffersCount() + |
| output_queue_->QueuedBuffersCount() == |
| 0) { |
| DVLOGF(4) << "No buffers queued, will not schedule poll"; |
| return; |
| } |
| |
| DVLOGF(4) << "Scheduling device poll task"; |
| |
| device_poll_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DevicePollTask, |
| base::Unretained(this), true)); |
| |
| DVLOGF(3) << "buffer counts: " |
| << "INPUT[" << decoder_input_queue_.size() << "]" |
| << " => DEVICE[" << input_queue_->FreeBuffersCount() << "+" |
| << input_queue_->QueuedBuffersCount() << "/" |
| << input_queue_->AllocatedBuffersCount() << "]->[" |
| << output_queue_->FreeBuffersCount() << "+" |
| << output_queue_->QueuedBuffersCount() << "/" |
| << output_buffer_map_.size() << "]" |
| << " => DISPLAYQ[" << decoder_display_queue_.size() << "]" |
| << " => CLIENT[" << surfaces_at_display_.size() << "]"; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Enqueue( |
| const scoped_refptr<V4L2DecodeSurface>& dec_surface) { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| const int old_inputs_queued = input_queue_->QueuedBuffersCount(); |
| const int old_outputs_queued = output_queue_->QueuedBuffersCount(); |
| |
| if (!EnqueueInputRecord(dec_surface.get())) { |
| VLOGF(1) << "Failed queueing an input buffer"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| if (!EnqueueOutputRecord(dec_surface.get())) { |
| VLOGF(1) << "Failed queueing an output buffer"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| surfaces_at_device_.push(dec_surface); |
| |
| if (old_inputs_queued == 0 && old_outputs_queued == 0) |
| SchedulePollIfNeeded(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Dequeue() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| while (input_queue_->QueuedBuffersCount() > 0) { |
| DCHECK(input_queue_->IsStreaming()); |
| auto ret = input_queue_->DequeueBuffer(); |
| |
| if (ret.first == false) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } else if (!ret.second) { |
| // we're just out of buffers to dequeue. |
| break; |
| } |
| |
| DVLOGF(4) << "Dequeued input=" << ret.second->BufferId() |
| << " count: " << input_queue_->QueuedBuffersCount(); |
| } |
| |
| while (output_queue_->QueuedBuffersCount() > 0) { |
| DCHECK(output_queue_->IsStreaming()); |
| auto ret = output_queue_->DequeueBuffer(); |
| if (ret.first == false) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } else if (!ret.second) { |
| // we're just out of buffers to dequeue. |
| break; |
| } |
| |
| DVLOGF(4) << "Dequeued output=" << ret.second->BufferId() << " count " |
| << output_queue_->QueuedBuffersCount(); |
| |
| DCHECK(!surfaces_at_device_.empty()); |
| scoped_refptr<V4L2DecodeSurface> surface = surfaces_at_device_.front(); |
| surfaces_at_device_.pop(); |
| DCHECK_EQ(static_cast<size_t>(surface->output_record()), |
| ret.second->BufferId()); |
| surface->SetDecoded(); |
| |
| surface->SetReleaseCallback( |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ReuseOutputBuffer, |
| base::Unretained(this), std::move(ret.second))); |
| } |
| |
| // A frame was decoded, see if we can output it. |
| TryOutputSurfaces(); |
| |
| ProcessPendingEventsIfNeeded(); |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::NewEventPending() { |
| // Switch to event processing mode if we are decoding. Otherwise we are either |
| // already in it, or we will potentially switch to it later, after finishing |
| // other tasks. |
| if (state_ == kDecoding) |
| state_ = kIdle; |
| |
| ProcessPendingEventsIfNeeded(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::FinishEventProcessing() { |
| DCHECK_EQ(state_, kIdle); |
| |
| state_ = kDecoding; |
| ScheduleDecodeBufferTaskIfNeeded(); |
| |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ProcessPendingEventsIfNeeded() { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| // Process pending events, if any, in the correct order. |
| // We always first process the surface set change, as it is an internal |
| // event from the decoder and interleaving it with external requests would |
| // put the decoder in an undefined state. |
| using ProcessFunc = bool (V4L2SliceVideoDecodeAccelerator::*)(); |
| const ProcessFunc process_functions[] = { |
| &V4L2SliceVideoDecodeAccelerator::FinishSurfaceSetChange, |
| &V4L2SliceVideoDecodeAccelerator::FinishFlush, |
| &V4L2SliceVideoDecodeAccelerator::FinishReset, |
| &V4L2SliceVideoDecodeAccelerator::FinishEventProcessing, |
| }; |
| |
| for (const auto& fn : process_functions) { |
| if (state_ != kIdle) |
| return; |
| |
| if (!(this->*fn)()) |
| return; |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ReuseOutputBuffer( |
| V4L2ReadableBufferRef buffer) { |
| DVLOGF(4) << "Reusing output buffer, index=" << buffer->BufferId(); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::EnqueueInputRecord( |
| V4L2DecodeSurface* dec_surface) { |
| DVLOGF(4); |
| DCHECK_NE(dec_surface, nullptr); |
| |
| // Enqueue an input (VIDEO_OUTPUT) buffer for an input video frame. |
| V4L2WritableBufferRef input_buffer = std::move(dec_surface->input_buffer()); |
| DCHECK(input_buffer.IsValid()); |
| const int index = input_buffer.BufferId(); |
| input_buffer.PrepareQueueBuffer(*dec_surface); |
| if (!std::move(input_buffer).QueueMMap()) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| DVLOGF(4) << "Enqueued input=" << index |
| << " count: " << input_queue_->QueuedBuffersCount(); |
| |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::EnqueueOutputRecord( |
| V4L2DecodeSurface* dec_surface) { |
| DVLOGF(4); |
| |
| // Enqueue an output (VIDEO_CAPTURE) buffer. |
| V4L2WritableBufferRef output_buffer = std::move(dec_surface->output_buffer()); |
| DCHECK(output_buffer.IsValid()); |
| size_t index = output_buffer.BufferId(); |
| OutputRecord& output_record = output_buffer_map_[index]; |
| DCHECK_NE(output_record.picture_id, -1); |
| |
| if (output_record.egl_fence) { |
| TRACE_EVENT0("media,gpu", |
| "V4L2SVDA::EnqueueOutputRecord: " |
| "GLFenceEGL::ClientWaitWithTimeoutNanos"); |
| |
| // If we have to wait for completion, wait. Note that free_output_buffers_ |
| // is a FIFO queue, so we always wait on the buffer that has been in the |
| // queue the longest. Every 100ms we check whether the decoder is shutting |
| // down, or we might get stuck waiting on a fence that will never come: |
| // https://crbug.com/845645 |
| while (!IsDestroyPending()) { |
| const EGLTimeKHR wait_ns = |
| base::TimeDelta::FromMilliseconds(100).InNanoseconds(); |
| EGLint result = |
| output_record.egl_fence->ClientWaitWithTimeoutNanos(wait_ns); |
| if (result == EGL_CONDITION_SATISFIED_KHR) { |
| break; |
| } else if (result == EGL_FALSE) { |
| // This will cause tearing, but is safe otherwise. |
| DVLOGF(1) << "GLFenceEGL::ClientWaitWithTimeoutNanos failed!"; |
| break; |
| } |
| DCHECK_EQ(result, EGL_TIMEOUT_EXPIRED_KHR); |
| } |
| |
| if (IsDestroyPending()) |
| return false; |
| |
| output_record.egl_fence.reset(); |
| } |
| |
| bool ret; |
| if (output_mode_ == Config::OutputMode::ALLOCATE) |
| ret = std::move(output_buffer).QueueMMap(); |
| else |
| ret = std::move(output_buffer).QueueDMABuf(output_record.dmabuf_fds); |
| |
| if (!ret) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| DVLOGF(4) << "Enqueued output=" << index |
| << " count: " << output_queue_->QueuedBuffersCount(); |
| |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::StartDevicePoll() { |
| DVLOGF(3) << "Starting device poll"; |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK(!device_poll_thread_.IsRunning()); |
| |
| // Start up the device poll thread and schedule its first DevicePollTask(). |
| if (!device_poll_thread_.Start()) { |
| VLOGF(1) << "Device thread failed to start"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| if (!input_queue_->Streamon()) |
| return false; |
| |
| if (!output_queue_->Streamon()) |
| return false; |
| |
| device_poll_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DevicePollTask, |
| base::Unretained(this), true)); |
| |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::StopDevicePoll() { |
| DVLOGF(3) << "Stopping device poll"; |
| if (decoder_thread_.IsRunning()) |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| // Signal the DevicePollTask() to stop, and stop the device poll thread. |
| if (!device_->SetDevicePollInterrupt()) { |
| VPLOGF(1) << "SetDevicePollInterrupt(): failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| device_poll_thread_.Stop(); |
| DVLOGF(3) << "Device poll thread stopped"; |
| |
| // Clear the interrupt now, to be sure. |
| if (!device_->ClearDevicePollInterrupt()) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| // We may be called before the queue is acquired. |
| if (input_queue_) { |
| if (!input_queue_->Streamoff()) |
| return false; |
| |
| DCHECK_EQ(input_queue_->QueuedBuffersCount(), 0u); |
| } |
| |
| // We may be called before the queue is acquired. |
| if (output_queue_) { |
| if (!output_queue_->Streamoff()) |
| return false; |
| |
| DCHECK_EQ(output_queue_->QueuedBuffersCount(), 0u); |
| } |
| |
| // Mark as decoded to allow reuse. |
| while (!surfaces_at_device_.empty()) |
| surfaces_at_device_.pop(); |
| |
| // Drop all surfaces that were awaiting decode before being displayed, |
| // since we've just cancelled all outstanding decodes. |
| while (!decoder_display_queue_.empty()) |
| decoder_display_queue_.pop(); |
| |
| DVLOGF(3) << "Device poll stopped"; |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Decode(BitstreamBuffer bitstream_buffer) { |
| Decode(bitstream_buffer.ToDecoderBuffer(), bitstream_buffer.id()); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Decode( |
| scoped_refptr<DecoderBuffer> buffer, |
| int32_t bitstream_id) { |
| DVLOGF(4) << "input_id=" << bitstream_id |
| << ", size=" << (buffer ? buffer->data_size() : 0); |
| DCHECK(decode_task_runner_->BelongsToCurrentThread()); |
| |
| if (bitstream_id < 0) { |
| VLOGF(1) << "Invalid bitstream buffer, id: " << bitstream_id; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DecodeTask, |
| base::Unretained(this), std::move(buffer), bitstream_id)); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DecodeTask( |
| scoped_refptr<DecoderBuffer> buffer, |
| int32_t bitstream_id) { |
| DVLOGF(4) << "input_id=" << bitstream_id |
| << " size=" << (buffer ? buffer->data_size() : 0); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| std::unique_ptr<BitstreamBufferRef> bitstream_record(new BitstreamBufferRef( |
| decode_client_, decode_task_runner_, std::move(buffer), bitstream_id)); |
| |
| // Skip empty buffer. |
| if (!bitstream_record->buffer) |
| return; |
| |
| decoder_input_queue_.push_back(std::move(bitstream_record)); |
| |
| TRACE_COUNTER_ID1("media,gpu", "V4L2SVDA decoder input BitstreamBuffers", |
| this, decoder_input_queue_.size()); |
| |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::TrySetNewBistreamBuffer() { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK(!decoder_current_bitstream_buffer_); |
| |
| if (decoder_input_queue_.empty()) |
| return false; |
| |
| decoder_current_bitstream_buffer_ = std::move(decoder_input_queue_.front()); |
| decoder_input_queue_.pop_front(); |
| |
| if (decoder_current_bitstream_buffer_->input_id == kFlushBufferId) { |
| // This is a buffer we queued for ourselves to trigger flush at this time. |
| InitiateFlush(); |
| return false; |
| } |
| |
| decoder_->SetStream(decoder_current_bitstream_buffer_->input_id, |
| *decoder_current_bitstream_buffer_->buffer); |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ScheduleDecodeBufferTaskIfNeeded() { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| if (state_ == kDecoding) { |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DecodeBufferTask, |
| base::Unretained(this))); |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DecodeBufferTask() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| TRACE_EVENT0("media,gpu", "V4L2SVDA::DecodeBufferTask"); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| if (state_ != kDecoding) { |
| DVLOGF(3) << "Early exit, not in kDecoding"; |
| return; |
| } |
| |
| while (true) { |
| TRACE_EVENT_BEGIN0("media,gpu", "V4L2SVDA::DecodeBufferTask AVD::Decode"); |
| const AcceleratedVideoDecoder::DecodeResult res = decoder_->Decode(); |
| TRACE_EVENT_END0("media,gpu", "V4L2SVDA::DecodeBufferTask AVD::Decode"); |
| switch (res) { |
| case AcceleratedVideoDecoder::kAllocateNewSurfaces: |
| VLOGF(2) << "Decoder requesting a new set of surfaces"; |
| InitiateSurfaceSetChange(); |
| return; |
| |
| case AcceleratedVideoDecoder::kRanOutOfStreamData: |
| decoder_current_bitstream_buffer_.reset(); |
| if (!TrySetNewBistreamBuffer()) |
| return; |
| |
| break; |
| |
| case AcceleratedVideoDecoder::kRanOutOfSurfaces: |
| // No more surfaces for the decoder, we'll come back once we have more. |
| DVLOGF(4) << "Ran out of surfaces"; |
| return; |
| |
| case AcceleratedVideoDecoder::kNeedContextUpdate: |
| DVLOGF(4) << "Awaiting context update"; |
| return; |
| |
| case AcceleratedVideoDecoder::kDecodeError: |
| VLOGF(1) << "Error decoding stream"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| |
| case AcceleratedVideoDecoder::kTryAgain: |
| NOTREACHED() << "Should not reach here unless this class accepts " |
| "encrypted streams."; |
| DVLOGF(4) << "No key for decoding stream."; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::InitiateSurfaceSetChange() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK_EQ(state_, kDecoding); |
| TRACE_EVENT_ASYNC_BEGIN0("media,gpu", "V4L2SVDA Resolution Change", this); |
| DCHECK(!surface_set_change_pending_); |
| surface_set_change_pending_ = true; |
| NewEventPending(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::FinishSurfaceSetChange() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (!surface_set_change_pending_) |
| return true; |
| |
| if (!surfaces_at_device_.empty()) |
| return false; |
| |
| DCHECK_EQ(state_, kIdle); |
| DCHECK(decoder_display_queue_.empty()); |
| // All output buffers should've been returned from decoder and device by now. |
| // The only remaining owner of surfaces may be display (client), and we will |
| // dismiss them when destroying output buffers below. |
| DCHECK_EQ(output_queue_->FreeBuffersCount() + surfaces_at_display_.size(), |
| output_buffer_map_.size()); |
| |
| if (!StopDevicePoll()) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| // Dequeued decoded surfaces may be pended in pending_picture_ready_ if they |
| // are waiting for some pictures to be cleared. We should post them right away |
| // because they are about to be dismissed and destroyed for surface set |
| // change. |
| SendPictureReady(); |
| |
| // This will return only once all buffers are dismissed and destroyed. |
| // This does not wait until they are displayed however, as display retains |
| // references to the buffers bound to textures and will release them |
| // after displaying. |
| if (!DestroyOutputs(true)) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| if (!CreateOutputBuffers()) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| surface_set_change_pending_ = false; |
| VLOGF(2) << "Surface set change finished"; |
| TRACE_EVENT_ASYNC_END0("media,gpu", "V4L2SVDA Resolution Change", this); |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::DestroyOutputs(bool dismiss) { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| std::vector<int32_t> picture_buffers_to_dismiss; |
| |
| if (output_buffer_map_.empty()) |
| return true; |
| |
| for (auto& output_record : output_buffer_map_) { |
| output_record.egl_fence.reset(); |
| |
| picture_buffers_to_dismiss.push_back(output_record.picture_id); |
| } |
| |
| if (dismiss) { |
| VLOGF(2) << "Scheduling picture dismissal"; |
| base::WaitableEvent done(base::WaitableEvent::ResetPolicy::AUTOMATIC, |
| base::WaitableEvent::InitialState::NOT_SIGNALED); |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::DismissPictures, |
| weak_this_, picture_buffers_to_dismiss, &done)); |
| done.Wait(); |
| } |
| |
| // At this point client can't call ReusePictureBuffer on any of the pictures |
| // anymore, so it's safe to destroy. |
| return DestroyOutputBuffers(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::DestroyOutputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread() || |
| !decoder_thread_.IsRunning()); |
| DCHECK(surfaces_at_device_.empty()); |
| DCHECK(decoder_display_queue_.empty()); |
| |
| if (!output_queue_ || output_buffer_map_.empty()) |
| return true; |
| |
| DCHECK(!output_queue_->IsStreaming()); |
| DCHECK_EQ(output_queue_->QueuedBuffersCount(), 0u); |
| |
| // Release all buffers waiting for an import buffer event. |
| output_wait_map_.clear(); |
| |
| // It's ok to do this, client will retain references to textures, but we are |
| // not interested in reusing the surfaces anymore. |
| // This will prevent us from reusing old surfaces in case we have some |
| // ReusePictureBuffer() pending on ChildThread already. It's ok to ignore |
| // them, because we have already dismissed them (in DestroyOutputs()). |
| for (const auto& surface_at_display : surfaces_at_display_) { |
| size_t index = surface_at_display.second->output_record(); |
| DCHECK_LT(index, output_buffer_map_.size()); |
| OutputRecord& output_record = output_buffer_map_[index]; |
| DCHECK(output_record.at_client); |
| output_record.at_client = false; |
| output_record.num_times_sent_to_client = 0; |
| } |
| surfaces_at_display_.clear(); |
| DCHECK_EQ(output_queue_->FreeBuffersCount(), output_buffer_map_.size()); |
| |
| output_buffer_map_.clear(); |
| |
| output_queue_->DeallocateBuffers(); |
| |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::AssignPictureBuffers( |
| const std::vector<PictureBuffer>& buffers) { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::AssignPictureBuffersTask, |
| base::Unretained(this), buffers)); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::AssignPictureBuffersTask( |
| const std::vector<PictureBuffer>& buffers) { |
| VLOGF(2); |
| DCHECK(!output_queue_->IsStreaming()); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK_EQ(state_, kAwaitingPictureBuffers); |
| TRACE_EVENT1("media,gpu", "V4L2SVDA::AssignPictureBuffersTask", |
| "buffers_size", buffers.size()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| const uint32_t req_buffer_count = decoder_->GetRequiredNumOfPictures(); |
| |
| if (buffers.size() < req_buffer_count) { |
| VLOGF(1) << "Failed to provide requested picture buffers. " |
| << "(Got " << buffers.size() << ", requested " << req_buffer_count |
| << ")"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| // If a client allocate a different frame size, S_FMT should be called with |
| // the size. |
| if (coded_size_ != buffers[0].size()) { |
| const auto& new_frame_size = buffers[0].size(); |
| v4l2_format format = {}; |
| format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| format.fmt.pix_mp.width = new_frame_size.width(); |
| format.fmt.pix_mp.height = new_frame_size.height(); |
| format.fmt.pix_mp.pixelformat = output_format_fourcc_; |
| format.fmt.pix_mp.num_planes = output_planes_count_; |
| if (device_->Ioctl(VIDIOC_S_FMT, &format) != 0) { |
| VPLOGF(1) << "Failed with frame size adjusted by client: " |
| << new_frame_size.ToString(); |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| coded_size_.SetSize(format.fmt.pix_mp.width, format.fmt.pix_mp.height); |
| // If size specified by ProvidePictureBuffers() is adjusted by the client, |
| // the size must not be adjusted by a v4l2 driver again. |
| if (coded_size_ != new_frame_size) { |
| VLOGF(1) << "The size of PictureBuffer is invalid." |
| << " size adjusted by the client = " << new_frame_size.ToString() |
| << " size adjusted by a driver = " << coded_size_.ToString(); |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| if (!gfx::Rect(coded_size_).Contains(gfx::Rect(decoder_->GetPicSize()))) { |
| VLOGF(1) << "Got invalid adjusted coded size: " << coded_size_.ToString(); |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| } |
| |
| const v4l2_memory memory = |
| (output_mode_ == Config::OutputMode::ALLOCATE ? V4L2_MEMORY_MMAP |
| : V4L2_MEMORY_DMABUF); |
| if (output_queue_->AllocateBuffers(buffers.size(), memory) != |
| buffers.size()) { |
| VLOGF(1) << "Could not allocate enough output buffers"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| DCHECK(output_buffer_map_.empty()); |
| DCHECK(output_wait_map_.empty()); |
| output_buffer_map_.resize(buffers.size()); |
| // Reserve all buffers until ImportBufferForPictureTask() is called |
| while (output_queue_->FreeBuffersCount() > 0) { |
| V4L2WritableBufferRef buffer = output_queue_->GetFreeBuffer(); |
| DCHECK(buffer.IsValid()); |
| int i = buffer.BufferId(); |
| |
| DCHECK_EQ(output_wait_map_.count(buffers[i].id()), 0u); |
| // The buffer will remain here until ImportBufferForPicture is called, |
| // either by the client, or by ourselves, if we are allocating. |
| output_wait_map_.emplace(buffers[i].id(), std::move(buffer)); |
| } |
| // All available buffers should be in the wait map now. |
| DCHECK_EQ(output_buffer_map_.size(), output_wait_map_.size()); |
| |
| for (size_t i = 0; i < buffers.size(); i++) { |
| OutputRecord& output_record = output_buffer_map_[i]; |
| DCHECK(!output_record.egl_fence); |
| DCHECK_EQ(output_record.picture_id, -1); |
| DCHECK(output_record.dmabuf_fds.empty()); |
| DCHECK_EQ(output_record.cleared, false); |
| |
| output_record.picture_id = buffers[i].id(); |
| output_record.texture_id = buffers[i].service_texture_ids().empty() |
| ? 0 |
| : buffers[i].service_texture_ids()[0]; |
| |
| output_record.client_texture_id = buffers[i].client_texture_ids().empty() |
| ? 0 |
| : buffers[i].client_texture_ids()[0]; |
| |
| if (output_mode_ == Config::OutputMode::ALLOCATE) { |
| std::vector<base::ScopedFD> passed_dmabuf_fds = |
| device_->GetDmabufsForV4L2Buffer(i, output_planes_count_, |
| V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE); |
| if (passed_dmabuf_fds.empty()) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| ImportBufferForPictureTask(output_record.picture_id, |
| std::move(passed_dmabuf_fds)); |
| } // else we'll get triggered via ImportBufferForPicture() from client. |
| DVLOGF(3) << "buffer[" << i << "]: picture_id=" << output_record.picture_id; |
| } |
| |
| if (!StartDevicePoll()) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| // Put us in kIdle to allow further event processing. |
| // ProcessPendingEventsIfNeeded() will put us back into kDecoding after all |
| // other pending events are processed successfully. |
| state_ = kIdle; |
| ProcessPendingEventsIfNeeded(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::CreateGLImageFor( |
| size_t buffer_index, |
| int32_t picture_buffer_id, |
| std::vector<base::ScopedFD> passed_dmabuf_fds, |
| GLuint client_texture_id, |
| GLuint texture_id, |
| const gfx::Size& size, |
| uint32_t fourcc) { |
| DVLOGF(3) << "index=" << buffer_index; |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| DCHECK_NE(texture_id, 0u); |
| TRACE_EVENT1("media,gpu", "V4L2SVDA::CreateGLImageFor", "picture_buffer_id", |
| picture_buffer_id); |
| |
| if (!make_context_current_cb_) { |
| VLOGF(1) << "GL callbacks required for binding to GLImages"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| if (!make_context_current_cb_.Run()) { |
| VLOGF(1) << "No GL context"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| scoped_refptr<gl::GLImage> gl_image = |
| device_->CreateGLImage(size, fourcc, passed_dmabuf_fds); |
| if (!gl_image) { |
| VLOGF(1) << "Could not create GLImage," |
| << " index=" << buffer_index << " texture_id=" << texture_id; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| gl::ScopedTextureBinder bind_restore(device_->GetTextureTarget(), texture_id); |
| bool ret = gl_image->BindTexImage(device_->GetTextureTarget()); |
| DCHECK(ret); |
| bind_image_cb_.Run(client_texture_id, device_->GetTextureTarget(), gl_image, |
| true); |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::AssignDmaBufs, |
| base::Unretained(this), buffer_index, picture_buffer_id, |
| std::move(passed_dmabuf_fds))); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::AssignDmaBufs( |
| size_t buffer_index, |
| int32_t picture_buffer_id, |
| std::vector<base::ScopedFD> passed_dmabuf_fds) { |
| DVLOGF(3) << "index=" << buffer_index; |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| // It's possible that while waiting for the EGLImages to be allocated and |
| // assigned, we have already decoded more of the stream and saw another |
| // resolution change. This is a normal situation, in such a case either there |
| // is no output record with this index awaiting an EGLImage to be assigned to |
| // it, or the record is already updated to use a newer PictureBuffer and is |
| // awaiting an EGLImage associated with a different picture_buffer_id. If so, |
| // just discard this image, we will get the one we are waiting for later. |
| if (buffer_index >= output_buffer_map_.size() || |
| output_buffer_map_[buffer_index].picture_id != picture_buffer_id) { |
| DVLOGF(4) << "Picture set already changed, dropping EGLImage"; |
| return; |
| } |
| |
| OutputRecord& output_record = output_buffer_map_[buffer_index]; |
| DCHECK(!output_record.egl_fence); |
| DCHECK_EQ(output_wait_map_.count(picture_buffer_id), 1u); |
| |
| if (output_mode_ == Config::OutputMode::IMPORT) { |
| DCHECK(output_record.dmabuf_fds.empty()); |
| output_record.dmabuf_fds = std::move(passed_dmabuf_fds); |
| } |
| |
| // Buffer is ready to be used. |
| output_wait_map_.erase(picture_buffer_id); |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ImportBufferForPicture( |
| int32_t picture_buffer_id, |
| VideoPixelFormat pixel_format, |
| gfx::GpuMemoryBufferHandle gpu_memory_buffer_handle) { |
| DVLOGF(3) << "picture_buffer_id=" << picture_buffer_id; |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| std::vector<base::ScopedFD> dmabuf_fds; |
| #if defined(USE_OZONE) |
| // If the driver does not accept as many fds as we received from the client, |
| // we have to check if the additional fds are actually duplicated fds pointing |
| // to previous planes; if so, we can close the duplicates and keep only the |
| // original fd(s). |
| // Assume that an fd is a duplicate of a previous plane's fd if offset != 0. |
| // Otherwise, if offset == 0, return error as it may be pointing to a new |
| // plane. |
| for (auto& plane : gpu_memory_buffer_handle.native_pixmap_handle.planes) { |
| dmabuf_fds.push_back(std::move(plane.fd)); |
| } |
| for (size_t i = dmabuf_fds.size() - 1; i >= output_planes_count_; i--) { |
| if (gpu_memory_buffer_handle.native_pixmap_handle.planes[i].offset == 0) { |
| VLOGF(1) << "The dmabuf fd points to a new buffer, "; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| // Drop safely, because this fd is duplicate dmabuf fd pointing to previous |
| // buffer and the appropriate address can be accessed by associated offset. |
| dmabuf_fds.pop_back(); |
| } |
| #endif |
| |
| if (output_mode_ != Config::OutputMode::IMPORT) { |
| VLOGF(1) << "Cannot import in non-import mode"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| if (pixel_format != |
| V4L2Device::V4L2PixFmtToVideoPixelFormat(output_format_fourcc_)) { |
| VLOGF(1) << "Unsupported import format: " |
| << VideoPixelFormatToString(pixel_format); |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce( |
| &V4L2SliceVideoDecodeAccelerator::ImportBufferForPictureTask, |
| base::Unretained(this), picture_buffer_id, std::move(dmabuf_fds))); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ImportBufferForPictureTask( |
| int32_t picture_buffer_id, |
| std::vector<base::ScopedFD> passed_dmabuf_fds) { |
| DVLOGF(3) << "picture_buffer_id=" << picture_buffer_id; |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| const auto iter = |
| std::find_if(output_buffer_map_.begin(), output_buffer_map_.end(), |
| [picture_buffer_id](const OutputRecord& output_record) { |
| return output_record.picture_id == picture_buffer_id; |
| }); |
| if (iter == output_buffer_map_.end()) { |
| // It's possible that we've already posted a DismissPictureBuffer for this |
| // picture, but it has not yet executed when this ImportBufferForPicture was |
| // posted to us by the client. In that case just ignore this (we've already |
| // dismissed it and accounted for that). |
| DVLOGF(3) << "got picture id=" << picture_buffer_id |
| << " not in use (anymore?)."; |
| return; |
| } |
| |
| if (!output_wait_map_.count(iter->picture_id)) { |
| VLOGF(1) << "Passed buffer is not waiting to be imported"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| size_t index = iter - output_buffer_map_.begin(); |
| |
| if (iter->texture_id != 0) { |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::CreateGLImageFor, |
| weak_this_, index, picture_buffer_id, |
| std::move(passed_dmabuf_fds), iter->client_texture_id, |
| iter->texture_id, coded_size_, output_format_fourcc_)); |
| } else { |
| // No need for a GLImage, start using this buffer now. |
| DCHECK_EQ(output_planes_count_, passed_dmabuf_fds.size()); |
| iter->dmabuf_fds = std::move(passed_dmabuf_fds); |
| |
| // Buffer is now ready to be used. |
| DCHECK_EQ(output_wait_map_.count(picture_buffer_id), 1u); |
| output_wait_map_.erase(picture_buffer_id); |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ReusePictureBuffer( |
| int32_t picture_buffer_id) { |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| DVLOGF(4) << "picture_buffer_id=" << picture_buffer_id; |
| |
| std::unique_ptr<gl::GLFenceEGL> egl_fence; |
| |
| if (make_context_current_cb_) { |
| if (!make_context_current_cb_.Run()) { |
| VLOGF(1) << "could not make context current"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| egl_fence = gl::GLFenceEGL::Create(); |
| if (!egl_fence) { |
| VLOGF(1) << "gl::GLFenceEGL::Create() failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| } |
| |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ReusePictureBufferTask, |
| base::Unretained(this), picture_buffer_id, |
| std::move(egl_fence))); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ReusePictureBufferTask( |
| int32_t picture_buffer_id, |
| std::unique_ptr<gl::GLFenceEGL> egl_fence) { |
| DVLOGF(4) << "picture_buffer_id=" << picture_buffer_id; |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| V4L2DecodeSurfaceByPictureBufferId::iterator it = |
| surfaces_at_display_.find(picture_buffer_id); |
| if (it == surfaces_at_display_.end()) { |
| // It's possible that we've already posted a DismissPictureBuffer for this |
| // picture, but it has not yet executed when this ReusePictureBuffer was |
| // posted to us by the client. In that case just ignore this (we've already |
| // dismissed it and accounted for that) and let the fence object get |
| // destroyed. |
| DVLOGF(3) << "got picture id=" << picture_buffer_id |
| << " not in use (anymore?)."; |
| return; |
| } |
| |
| OutputRecord& output_record = output_buffer_map_[it->second->output_record()]; |
| if (!output_record.at_client) { |
| VLOGF(1) << "picture_buffer_id not reusable"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| --output_record.num_times_sent_to_client; |
| // A output buffer might be sent multiple times. We only use the last fence. |
| // When the last fence is signaled, all the previous fences must be executed. |
| if (output_record.num_times_sent_to_client == 0) { |
| output_record.at_client = false; |
| // Take ownership of the EGL fence. |
| output_record.egl_fence = std::move(egl_fence); |
| |
| surfaces_at_display_.erase(it); |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Flush() { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::FlushTask, |
| base::Unretained(this))); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::FlushTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| // Queue an empty buffer which - when reached - will trigger flush sequence. |
| decoder_input_queue_.push_back(std::make_unique<BitstreamBufferRef>( |
| decode_client_, decode_task_runner_, nullptr, kFlushBufferId)); |
| |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::InitiateFlush() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| TRACE_EVENT_ASYNC_BEGIN0("media,gpu", "V4L2SVDA Flush", this); |
| |
| // This will trigger output for all remaining surfaces in the decoder. |
| // However, not all of them may be decoded yet (they would be queued |
| // in hardware then). |
| if (!decoder_->Flush()) { |
| DVLOGF(1) << "Failed flushing the decoder."; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| // Put the decoder in an idle state, ready to resume. |
| decoder_->Reset(); |
| |
| DCHECK(!decoder_flushing_); |
| decoder_flushing_ = true; |
| NewEventPending(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::FinishFlush() { |
| VLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (!decoder_flushing_) |
| return true; |
| |
| if (!surfaces_at_device_.empty()) |
| return false; |
| |
| // Even if all output buffers have been returned, the decoder may still |
| // be holding on an input device. Wait until the queue is actually drained. |
| if (input_queue_->QueuedBuffersCount() != 0) |
| return false; |
| |
| DCHECK_EQ(state_, kIdle); |
| |
| // At this point, all remaining surfaces are decoded and dequeued, and since |
| // we have already scheduled output for them in InitiateFlush(), their |
| // respective PictureReady calls have been posted (or they have been queued on |
| // pending_picture_ready_). So at this time, once we SendPictureReady(), |
| // we will have all remaining PictureReady() posted to the client and we |
| // can post NotifyFlushDone(). |
| DCHECK(decoder_display_queue_.empty()); |
| |
| // Decoder should have already returned all surfaces and all surfaces are |
| // out of hardware. There can be no other owners of input buffers. |
| DCHECK_EQ(input_queue_->FreeBuffersCount(), |
| input_queue_->AllocatedBuffersCount()); |
| |
| SendPictureReady(); |
| |
| decoder_flushing_ = false; |
| VLOGF(2) << "Flush finished"; |
| |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&Client::NotifyFlushDone, client_)); |
| |
| TRACE_EVENT_ASYNC_END0("media,gpu", "V4L2SVDA Flush", this); |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::Reset() { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2SliceVideoDecodeAccelerator::ResetTask, |
| base::Unretained(this))); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::ResetTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| TRACE_EVENT_ASYNC_BEGIN0("media,gpu", "V4L2SVDA Reset", this); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| if (decoder_resetting_) { |
| // This is a bug in the client, multiple Reset()s before NotifyResetDone() |
| // are not allowed. |
| NOTREACHED() << "Client should not be requesting multiple Reset()s"; |
| return; |
| } |
| |
| // Put the decoder in an idle state, ready to resume. |
| decoder_->Reset(); |
| |
| // Drop all remaining inputs. |
| decoder_current_bitstream_buffer_.reset(); |
| while (!decoder_input_queue_.empty()) |
| decoder_input_queue_.pop_front(); |
| |
| decoder_resetting_ = true; |
| NewEventPending(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::FinishReset() { |
| VLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| if (!decoder_resetting_) |
| return true; |
| |
| if (!surfaces_at_device_.empty()) |
| return false; |
| |
| DCHECK_EQ(state_, kIdle); |
| DCHECK(!decoder_flushing_); |
| SendPictureReady(); |
| |
| // Drop any pending outputs. |
| while (!decoder_display_queue_.empty()) |
| decoder_display_queue_.pop(); |
| |
| // At this point we can have no input buffers in the decoder, because we |
| // Reset()ed it in ResetTask(), and have not scheduled any new Decode()s |
| // having been in kIdle since. We don't have any surfaces in the HW either - |
| // we just checked that surfaces_at_device_.empty(), and inputs are tied |
| // to surfaces. Since there can be no other owners of input buffers, we can |
| // simply mark them all as available. |
| DCHECK_EQ(input_queue_->QueuedBuffersCount(), 0u); |
| |
| decoder_resetting_ = false; |
| VLOGF(2) << "Reset finished"; |
| |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&Client::NotifyResetDone, client_)); |
| |
| TRACE_EVENT_ASYNC_END0("media,gpu", "V4L2SVDA Reset", this); |
| return true; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::IsDestroyPending() { |
| return destroy_pending_.IsSignaled(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::SetErrorState(Error error) { |
| // We can touch decoder_state_ only if this is the decoder thread or the |
| // decoder thread isn't running. |
| if (decoder_thread_.IsRunning() && |
| !decoder_thread_task_runner_->BelongsToCurrentThread()) { |
| decoder_thread_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::SetErrorState, |
| base::Unretained(this), error)); |
| return; |
| } |
| |
| // Notifying the client of an error will only happen if we are already |
| // initialized, as the API does not allow doing so before that. Subsequent |
| // errors and errors while destroying will be suppressed. |
| if (state_ != kError && state_ != kUninitialized && state_ != kDestroying) |
| NotifyError(error); |
| |
| state_ = kError; |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::SubmitSlice( |
| const scoped_refptr<V4L2DecodeSurface>& dec_surface, |
| const uint8_t* data, |
| size_t size) { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| V4L2WritableBufferRef& input_buffer = dec_surface->input_buffer(); |
| DCHECK(input_buffer.IsValid()); |
| |
| const size_t plane_size = input_buffer.GetPlaneSize(0); |
| const size_t bytes_used = input_buffer.GetPlaneBytesUsed(0); |
| |
| if (bytes_used + size > plane_size) { |
| VLOGF(1) << "Input buffer too small"; |
| return false; |
| } |
| |
| uint8_t* mapping = static_cast<uint8_t*>(input_buffer.GetPlaneMapping(0)); |
| DCHECK_NE(mapping, nullptr); |
| memcpy(mapping + bytes_used, data, size); |
| input_buffer.SetPlaneBytesUsed(0, bytes_used + size); |
| |
| return true; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::DecodeSurface( |
| const scoped_refptr<V4L2DecodeSurface>& dec_surface) { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| DVLOGF(3) << "Submitting decode for surface: " << dec_surface->ToString(); |
| Enqueue(dec_surface); |
| |
| if (!dec_surface->Submit()) { |
| VLOGF(1) << "Error while submitting frame for decoding!"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::SurfaceReady( |
| const scoped_refptr<V4L2DecodeSurface>& dec_surface, |
| int32_t bitstream_id, |
| const gfx::Rect& visible_rect, |
| const VideoColorSpace& /* color_space */) { |
| DVLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| dec_surface->SetVisibleRect(visible_rect); |
| decoder_display_queue_.push(std::make_pair(bitstream_id, dec_surface)); |
| TryOutputSurfaces(); |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::TryOutputSurfaces() { |
| while (!decoder_display_queue_.empty()) { |
| scoped_refptr<V4L2DecodeSurface> dec_surface = |
| decoder_display_queue_.front().second; |
| |
| if (!dec_surface->decoded()) |
| break; |
| |
| int32_t bitstream_id = decoder_display_queue_.front().first; |
| decoder_display_queue_.pop(); |
| OutputSurface(bitstream_id, dec_surface); |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::OutputSurface( |
| int32_t bitstream_id, |
| const scoped_refptr<V4L2DecodeSurface>& dec_surface) { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| |
| OutputRecord& output_record = |
| output_buffer_map_[dec_surface->output_record()]; |
| |
| if (output_record.num_times_sent_to_client == 0) { |
| DCHECK(!output_record.at_client); |
| output_record.at_client = true; |
| bool inserted = |
| surfaces_at_display_ |
| .insert(std::make_pair(output_record.picture_id, dec_surface)) |
| .second; |
| DCHECK(inserted); |
| } else { |
| // The surface is already sent to client, and not returned back yet. |
| DCHECK(output_record.at_client); |
| DCHECK(surfaces_at_display_.find(output_record.picture_id) != |
| surfaces_at_display_.end()); |
| CHECK(surfaces_at_display_[output_record.picture_id].get() == |
| dec_surface.get()); |
| } |
| |
| DCHECK_NE(output_record.picture_id, -1); |
| ++output_record.num_times_sent_to_client; |
| |
| // TODO(hubbe): Insert correct color space. http://crbug.com/647725 |
| Picture picture(output_record.picture_id, bitstream_id, |
| dec_surface->visible_rect(), gfx::ColorSpace(), |
| true /* allow_overlay */); |
| DVLOGF(4) << dec_surface->ToString() |
| << ", bitstream_id: " << picture.bitstream_buffer_id() |
| << ", picture_id: " << picture.picture_buffer_id() |
| << ", visible_rect: " << picture.visible_rect().ToString(); |
| pending_picture_ready_.push(PictureRecord(output_record.cleared, picture)); |
| SendPictureReady(); |
| output_record.cleared = true; |
| } |
| |
| scoped_refptr<V4L2DecodeSurface> |
| V4L2SliceVideoDecodeAccelerator::CreateSurface() { |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK_EQ(state_, kDecoding); |
| TRACE_COUNTER_ID2( |
| "media,gpu", "V4L2 input buffers", this, "free", |
| input_queue_->FreeBuffersCount(), "in use", |
| input_queue_->AllocatedBuffersCount() - input_queue_->FreeBuffersCount()); |
| TRACE_COUNTER_ID2("media,gpu", "V4L2 output buffers", this, "free", |
| output_queue_->FreeBuffersCount(), "in use", |
| output_queue_->AllocatedBuffersCount() - |
| output_queue_->AllocatedBuffersCount()); |
| TRACE_COUNTER_ID2("media,gpu", "V4L2 output buffers", this, "at client", |
| GetNumOfOutputRecordsAtClient(), "at device", |
| GetNumOfOutputRecordsAtDevice()); |
| |
| if (input_queue_->FreeBuffersCount() == 0 || |
| output_queue_->FreeBuffersCount() == 0) |
| return nullptr; |
| |
| V4L2WritableBufferRef input_buffer = input_queue_->GetFreeBuffer(); |
| DCHECK(input_buffer.IsValid()); |
| V4L2WritableBufferRef output_buffer = output_queue_->GetFreeBuffer(); |
| DCHECK(output_buffer.IsValid()); |
| |
| int input = input_buffer.BufferId(); |
| int output = output_buffer.BufferId(); |
| |
| scoped_refptr<V4L2DecodeSurface> dec_surface; |
| |
| if (supports_requests_) { |
| // Here we just borrow the older request to use it, before |
| // immediately putting it back at the back of the queue. |
| base::ScopedFD request = std::move(requests_.front()); |
| requests_.pop(); |
| auto ret = V4L2RequestDecodeSurface::Create(std::move(input_buffer), |
| std::move(output_buffer), |
| nullptr, request.get()); |
| requests_.push(std::move(request)); |
| |
| // Not being able to create the decode surface at this stage is a |
| // fatal error. |
| if (!ret) { |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return nullptr; |
| } |
| |
| dec_surface = std::move(ret).value(); |
| } else { |
| dec_surface = new V4L2ConfigStoreDecodeSurface( |
| std::move(input_buffer), std::move(output_buffer), nullptr); |
| } |
| |
| DVLOGF(4) << "Created surface " << input << " -> " << output; |
| return dec_surface; |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::SendPictureReady() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| bool send_now = |
| (decoder_resetting_ || decoder_flushing_ || surface_set_change_pending_); |
| while (!pending_picture_ready_.empty()) { |
| bool cleared = pending_picture_ready_.front().cleared; |
| const Picture& picture = pending_picture_ready_.front().picture; |
| if (cleared && picture_clearing_count_ == 0) { |
| DVLOGF(4) << "Posting picture ready to decode task runner for: " |
| << picture.picture_buffer_id(); |
| // This picture is cleared. It can be posted to a thread different than |
| // the main GPU thread to reduce latency. This should be the case after |
| // all pictures are cleared at the beginning. |
| decode_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&Client::PictureReady, decode_client_, picture)); |
| pending_picture_ready_.pop(); |
| } else if (!cleared || send_now) { |
| DVLOGF(4) << "cleared=" << pending_picture_ready_.front().cleared |
| << ", decoder_resetting_=" << decoder_resetting_ |
| << ", decoder_flushing_=" << decoder_flushing_ |
| << ", surface_set_change_pending_=" |
| << surface_set_change_pending_ |
| << ", picture_clearing_count_=" << picture_clearing_count_; |
| DVLOGF(4) << "Posting picture ready to GPU for: " |
| << picture.picture_buffer_id(); |
| // If the picture is not cleared, post it to the child thread because it |
| // has to be cleared in the child thread. A picture only needs to be |
| // cleared once. If the decoder is resetting or flushing or changing |
| // resolution, send all pictures to ensure PictureReady arrive before |
| // reset done, flush done, or picture dismissed. |
| child_task_runner_->PostTaskAndReply( |
| FROM_HERE, base::BindOnce(&Client::PictureReady, client_, picture), |
| // Unretained is safe. If Client::PictureReady gets to run, |this| is |
| // alive. Destroy() will wait the decode thread to finish. |
| base::BindOnce(&V4L2SliceVideoDecodeAccelerator::PictureCleared, |
| base::Unretained(this))); |
| picture_clearing_count_++; |
| pending_picture_ready_.pop(); |
| } else { |
| // This picture is cleared. But some pictures are about to be cleared on |
| // the child thread. To preserve the order, do not send this until those |
| // pictures are cleared. |
| break; |
| } |
| } |
| } |
| |
| void V4L2SliceVideoDecodeAccelerator::PictureCleared() { |
| DVLOGF(4) << "clearing count=" << picture_clearing_count_; |
| DCHECK(decoder_thread_task_runner_->BelongsToCurrentThread()); |
| DCHECK_GT(picture_clearing_count_, 0); |
| picture_clearing_count_--; |
| SendPictureReady(); |
| } |
| |
| bool V4L2SliceVideoDecodeAccelerator::TryToSetupDecodeOnSeparateThread( |
| const base::WeakPtr<Client>& decode_client, |
| const scoped_refptr<base::SingleThreadTaskRunner>& decode_task_runner) { |
| decode_client_ = decode_client; |
| decode_task_runner_ = decode_task_runner; |
| return true; |
| } |
| |
| // static |
| VideoDecodeAccelerator::SupportedProfiles |
| V4L2SliceVideoDecodeAccelerator::GetSupportedProfiles() { |
| scoped_refptr<V4L2Device> device = V4L2Device::Create(); |
| if (!device) |
| return SupportedProfiles(); |
| |
| return device->GetSupportedDecodeProfiles( |
| base::size(supported_input_fourccs_), supported_input_fourccs_); |
| } |
| |
| size_t V4L2SliceVideoDecodeAccelerator::GetNumOfOutputRecordsAtDevice() const { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| return output_queue_->QueuedBuffersCount(); |
| } |
| |
| size_t V4L2SliceVideoDecodeAccelerator::GetNumOfOutputRecordsAtClient() const { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| return std::count_if(output_buffer_map_.begin(), output_buffer_map_.end(), |
| [](const auto& r) { return r.at_client; }); |
| } |
| |
| // base::trace_event::MemoryDumpProvider implementation. |
| bool V4L2SliceVideoDecodeAccelerator::OnMemoryDump( |
| const base::trace_event::MemoryDumpArgs& args, |
| base::trace_event::ProcessMemoryDump* pmd) { |
| // OnMemoryDump() must be performed on |decoder_thread_|. |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| // VIDEO_OUTPUT queue's memory usage. |
| const size_t input_queue_buffers_count = |
| input_queue_->AllocatedBuffersCount(); |
| size_t input_queue_memory_usage = 0; |
| std::string input_queue_buffers_memory_type = |
| V4L2Device::V4L2MemoryToString(V4L2_MEMORY_MMAP); |
| input_queue_memory_usage += input_queue_->GetMemoryUsage(); |
| |
| // VIDEO_CAPTURE queue's memory usage. |
| const size_t output_queue_buffers_count = output_buffer_map_.size(); |
| size_t output_queue_memory_usage = 0; |
| std::string output_queue_buffers_memory_type = |
| output_mode_ == Config::OutputMode::ALLOCATE |
| ? V4L2Device::V4L2MemoryToString(V4L2_MEMORY_MMAP) |
| : V4L2Device::V4L2MemoryToString(V4L2_MEMORY_DMABUF); |
| if (output_mode_ == Config::OutputMode::ALLOCATE) { |
| // Call QUERY_BUF here because the length of buffers on VIDIOC_CATURE queue |
| // are not recorded nowhere in V4L2VideoDecodeAccelerator. |
| for (uint32_t index = 0; index < output_buffer_map_.size(); ++index) { |
| struct v4l2_buffer v4l2_buffer = {}; |
| struct v4l2_plane v4l2_planes[VIDEO_MAX_PLANES]; |
| DCHECK_LT(output_planes_count_, base::size(v4l2_planes)); |
| v4l2_buffer.m.planes = v4l2_planes; |
| v4l2_buffer.length = |
| std::min(output_planes_count_, base::size(v4l2_planes)); |
| v4l2_buffer.index = index; |
| v4l2_buffer.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| v4l2_buffer.memory = V4L2_MEMORY_MMAP; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYBUF, &v4l2_buffer); |
| for (size_t i = 0; i < output_planes_count_; ++i) |
| output_queue_memory_usage += v4l2_buffer.m.planes[i].length; |
| } |
| } |
| |
| const size_t total_usage = |
| input_queue_memory_usage + output_queue_memory_usage; |
| |
| using ::base::trace_event::MemoryAllocatorDump; |
| |
| auto dump_name = base::StringPrintf("gpu/v4l2/slice_decoder/0x%" PRIxPTR, |
| reinterpret_cast<uintptr_t>(this)); |
| |
| MemoryAllocatorDump* dump = pmd->CreateAllocatorDump(dump_name); |
| dump->AddScalar(MemoryAllocatorDump::kNameSize, |
| MemoryAllocatorDump::kUnitsBytes, |
| static_cast<uint64_t>(total_usage)); |
| dump->AddScalar("input_queue_memory_usage", MemoryAllocatorDump::kUnitsBytes, |
| static_cast<uint64_t>(input_queue_memory_usage)); |
| dump->AddScalar("input_queue_buffers_count", |
| MemoryAllocatorDump::kUnitsObjects, |
| static_cast<uint64_t>(input_queue_buffers_count)); |
| dump->AddString("input_queue_buffers_memory_type", "", |
| input_queue_buffers_memory_type); |
| dump->AddScalar("output_queue_memory_usage", MemoryAllocatorDump::kUnitsBytes, |
| static_cast<uint64_t>(output_queue_memory_usage)); |
| dump->AddScalar("output_queue_buffers_count", |
| MemoryAllocatorDump::kUnitsObjects, |
| static_cast<uint64_t>(output_queue_buffers_count)); |
| dump->AddString("output_queue_buffers_memory_type", "", |
| output_queue_buffers_memory_type); |
| return true; |
| } |
| |
| } // namespace media |