blob: b3109191e150e665911354e8fd7965368a789eb9 [file] [log] [blame]
// Copyright 2015 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "media/gpu/v4l2_jpeg_decode_accelerator.h"
#include <errno.h>
#include <linux/videodev2.h>
#include <string.h>
#include <sys/mman.h>
#include <memory>
#include "base/big_endian.h"
#include "base/bind.h"
#include "base/threading/thread_task_runner_handle.h"
#include "media/filters/jpeg_parser.h"
#include "media/gpu/v4l2_jpeg_decode_accelerator.h"
#include "third_party/libyuv/include/libyuv.h"
#define IOCTL_OR_ERROR_RETURN_VALUE(type, arg, value, type_name) \
do { \
if (device_->Ioctl(type, arg) != 0) { \
PLOG(ERROR) << __func__ << "(): ioctl() failed: " << type_name; \
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE); \
return value; \
} \
} while (0)
#define IOCTL_OR_ERROR_RETURN(type, arg) \
IOCTL_OR_ERROR_RETURN_VALUE(type, arg, ((void)0), #type)
#define IOCTL_OR_ERROR_RETURN_FALSE(type, arg) \
IOCTL_OR_ERROR_RETURN_VALUE(type, arg, false, #type)
#define IOCTL_OR_LOG_ERROR(type, arg) \
do { \
if (device_->Ioctl(type, arg) != 0) { \
PLOG(ERROR) << __func__ << "(): ioctl() failed: " << #type; \
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE); \
} \
} while (0)
#define READ_U8_OR_RETURN_FALSE(reader, out) \
do { \
uint8_t _out; \
if (!reader.ReadU8(&_out)) { \
DVLOG(1) \
<< "Error in stream: unexpected EOS while trying to read " #out; \
return false; \
} \
*(out) = _out; \
} while (0)
#define READ_U16_OR_RETURN_FALSE(reader, out) \
do { \
uint16_t _out; \
if (!reader.ReadU16(&_out)) { \
DVLOG(1) \
<< "Error in stream: unexpected EOS while trying to read " #out; \
return false; \
} \
*(out) = _out; \
} while (0)
namespace media {
// This is default huffman segment for 8-bit precision luminance and
// chrominance. The default huffman segment is constructed with the tables from
// JPEG standard section K.3. Actually there are no default tables. They are
// typical tables. These tables are useful for many applications. Lots of
// softwares use them as standard tables such as ffmpeg.
const uint8_t kDefaultDhtSeg[] = {
0xFF, 0xC4, 0x01, 0xA2, 0x00, 0x00, 0x01, 0x05, 0x01, 0x01, 0x01, 0x01,
0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x01, 0x02,
0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0A, 0x0B, 0x01, 0x00, 0x03,
0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x00, 0x00, 0x00,
0x00, 0x00, 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09,
0x0A, 0x0B, 0x10, 0x00, 0x02, 0x01, 0x03, 0x03, 0x02, 0x04, 0x03, 0x05,
0x05, 0x04, 0x04, 0x00, 0x00, 0x01, 0x7D, 0x01, 0x02, 0x03, 0x00, 0x04,
0x11, 0x05, 0x12, 0x21, 0x31, 0x41, 0x06, 0x13, 0x51, 0x61, 0x07, 0x22,
0x71, 0x14, 0x32, 0x81, 0x91, 0xA1, 0x08, 0x23, 0x42, 0xB1, 0xC1, 0x15,
0x52, 0xD1, 0xF0, 0x24, 0x33, 0x62, 0x72, 0x82, 0x09, 0x0A, 0x16, 0x17,
0x18, 0x19, 0x1A, 0x25, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x34, 0x35, 0x36,
0x37, 0x38, 0x39, 0x3A, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x49, 0x4A,
0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, 0x5A, 0x63, 0x64, 0x65, 0x66,
0x67, 0x68, 0x69, 0x6A, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79, 0x7A,
0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89, 0x8A, 0x92, 0x93, 0x94, 0x95,
0x96, 0x97, 0x98, 0x99, 0x9A, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6, 0xA7, 0xA8,
0xA9, 0xAA, 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7, 0xB8, 0xB9, 0xBA, 0xC2,
0xC3, 0xC4, 0xC5, 0xC6, 0xC7, 0xC8, 0xC9, 0xCA, 0xD2, 0xD3, 0xD4, 0xD5,
0xD6, 0xD7, 0xD8, 0xD9, 0xDA, 0xE1, 0xE2, 0xE3, 0xE4, 0xE5, 0xE6, 0xE7,
0xE8, 0xE9, 0xEA, 0xF1, 0xF2, 0xF3, 0xF4, 0xF5, 0xF6, 0xF7, 0xF8, 0xF9,
0xFA, 0x11, 0x00, 0x02, 0x01, 0x02, 0x04, 0x04, 0x03, 0x04, 0x07, 0x05,
0x04, 0x04, 0x00, 0x01, 0x02, 0x77, 0x00, 0x01, 0x02, 0x03, 0x11, 0x04,
0x05, 0x21, 0x31, 0x06, 0x12, 0x41, 0x51, 0x07, 0x61, 0x71, 0x13, 0x22,
0x32, 0x81, 0x08, 0x14, 0x42, 0x91, 0xA1, 0xB1, 0xC1, 0x09, 0x23, 0x33,
0x52, 0xF0, 0x15, 0x62, 0x72, 0xD1, 0x0A, 0x16, 0x24, 0x34, 0xE1, 0x25,
0xF1, 0x17, 0x18, 0x19, 0x1A, 0x26, 0x27, 0x28, 0x29, 0x2A, 0x35, 0x36,
0x37, 0x38, 0x39, 0x3A, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x49, 0x4A,
0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, 0x5A, 0x63, 0x64, 0x65, 0x66,
0x67, 0x68, 0x69, 0x6A, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79, 0x7A,
0x82, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89, 0x8A, 0x92, 0x93, 0x94,
0x95, 0x96, 0x97, 0x98, 0x99, 0x9A, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6, 0xA7,
0xA8, 0xA9, 0xAA, 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7, 0xB8, 0xB9, 0xBA,
0xC2, 0xC3, 0xC4, 0xC5, 0xC6, 0xC7, 0xC8, 0xC9, 0xCA, 0xD2, 0xD3, 0xD4,
0xD5, 0xD6, 0xD7, 0xD8, 0xD9, 0xDA, 0xE2, 0xE3, 0xE4, 0xE5, 0xE6, 0xE7,
0xE8, 0xE9, 0xEA, 0xF2, 0xF3, 0xF4, 0xF5, 0xF6, 0xF7, 0xF8, 0xF9, 0xFA};
V4L2JpegDecodeAccelerator::BufferRecord::BufferRecord()
: address(nullptr), length(0), at_device(false) {}
V4L2JpegDecodeAccelerator::BufferRecord::~BufferRecord() {}
V4L2JpegDecodeAccelerator::JobRecord::JobRecord(
const BitstreamBuffer& bitstream_buffer,
scoped_refptr<VideoFrame> video_frame)
: bitstream_buffer_id(bitstream_buffer.id()),
shm(bitstream_buffer, true),
out_frame(video_frame) {}
V4L2JpegDecodeAccelerator::JobRecord::~JobRecord() {}
V4L2JpegDecodeAccelerator::V4L2JpegDecodeAccelerator(
const scoped_refptr<V4L2Device>& device,
const scoped_refptr<base::SingleThreadTaskRunner>& io_task_runner)
: output_buffer_pixelformat_(0),
child_task_runner_(base::ThreadTaskRunnerHandle::Get()),
io_task_runner_(io_task_runner),
client_(nullptr),
device_(device),
decoder_thread_("V4L2JpegDecodeThread"),
device_poll_thread_("V4L2JpegDecodeDevicePollThread"),
input_streamon_(false),
output_streamon_(false),
weak_factory_(this) {
weak_ptr_ = weak_factory_.GetWeakPtr();
}
V4L2JpegDecodeAccelerator::~V4L2JpegDecodeAccelerator() {
DCHECK(child_task_runner_->BelongsToCurrentThread());
if (decoder_thread_.IsRunning()) {
decoder_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::DestroyTask,
base::Unretained(this)));
decoder_thread_.Stop();
}
weak_factory_.InvalidateWeakPtrs();
DCHECK(!device_poll_thread_.IsRunning());
}
void V4L2JpegDecodeAccelerator::DestroyTask() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
while (!input_jobs_.empty())
input_jobs_.pop();
while (!running_jobs_.empty())
running_jobs_.pop();
// Stop streaming and the device_poll_thread_.
StopDevicePoll();
DestroyInputBuffers();
DestroyOutputBuffers();
}
void V4L2JpegDecodeAccelerator::VideoFrameReady(int32_t bitstream_buffer_id) {
DCHECK(child_task_runner_->BelongsToCurrentThread());
client_->VideoFrameReady(bitstream_buffer_id);
}
void V4L2JpegDecodeAccelerator::NotifyError(int32_t bitstream_buffer_id,
Error error) {
DCHECK(child_task_runner_->BelongsToCurrentThread());
LOG(ERROR) << "Notifying of error " << error << " for buffer id "
<< bitstream_buffer_id;
client_->NotifyError(bitstream_buffer_id, error);
}
void V4L2JpegDecodeAccelerator::PostNotifyError(int32_t bitstream_buffer_id,
Error error) {
child_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::NotifyError, weak_ptr_,
bitstream_buffer_id, error));
}
bool V4L2JpegDecodeAccelerator::Initialize(Client* client) {
DCHECK(child_task_runner_->BelongsToCurrentThread());
// Capabilities check.
struct v4l2_capability caps;
const __u32 kCapsRequired = V4L2_CAP_STREAMING | V4L2_CAP_VIDEO_M2M;
memset(&caps, 0, sizeof(caps));
if (device_->Ioctl(VIDIOC_QUERYCAP, &caps) != 0) {
PLOG(ERROR) << __func__ << ": ioctl() failed: VIDIOC_QUERYCAP";
return false;
}
if ((caps.capabilities & kCapsRequired) != kCapsRequired) {
LOG(ERROR) << __func__ << ": VIDIOC_QUERYCAP, caps check failed: 0x"
<< std::hex << caps.capabilities;
return false;
}
// Subscribe to the source change event.
struct v4l2_event_subscription sub;
memset(&sub, 0, sizeof(sub));
sub.type = V4L2_EVENT_SOURCE_CHANGE;
if (device_->Ioctl(VIDIOC_SUBSCRIBE_EVENT, &sub) != 0) {
PLOG(ERROR) << __func__ << ": ioctl() failed: VIDIOC_SUBSCRIBE_EVENT";
return false;
}
if (!decoder_thread_.Start()) {
LOG(ERROR) << __func__ << ": decoder thread failed to start";
return false;
}
client_ = client;
decoder_task_runner_ = decoder_thread_.task_runner();
decoder_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::StartDevicePoll,
base::Unretained(this)));
DVLOG(1) << "V4L2JpegDecodeAccelerator initialized.";
return true;
}
void V4L2JpegDecodeAccelerator::Decode(
const BitstreamBuffer& bitstream_buffer,
const scoped_refptr<VideoFrame>& video_frame) {
DVLOG(1) << "Decode(): input_id=" << bitstream_buffer.id()
<< ", size=" << bitstream_buffer.size();
DCHECK(io_task_runner_->BelongsToCurrentThread());
if (bitstream_buffer.id() < 0) {
LOG(ERROR) << "Invalid bitstream_buffer, id: " << bitstream_buffer.id();
if (base::SharedMemory::IsHandleValid(bitstream_buffer.handle()))
base::SharedMemory::CloseHandle(bitstream_buffer.handle());
PostNotifyError(bitstream_buffer.id(), INVALID_ARGUMENT);
return;
}
if (video_frame->format() != PIXEL_FORMAT_I420) {
PostNotifyError(bitstream_buffer.id(), UNSUPPORTED_JPEG);
return;
}
std::unique_ptr<JobRecord> job_record(
new JobRecord(bitstream_buffer, video_frame));
decoder_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::DecodeTask,
base::Unretained(this), base::Passed(&job_record)));
}
bool V4L2JpegDecodeAccelerator::IsSupported() {
v4l2_fmtdesc fmtdesc;
memset(&fmtdesc, 0, sizeof(fmtdesc));
fmtdesc.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
for (; device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0; ++fmtdesc.index) {
if (fmtdesc.pixelformat == V4L2_PIX_FMT_JPEG)
return true;
}
return false;
}
void V4L2JpegDecodeAccelerator::DecodeTask(
std::unique_ptr<JobRecord> job_record) {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
if (!job_record->shm.Map()) {
PLOG(ERROR) << __func__ << ": could not map bitstream_buffer";
PostNotifyError(job_record->bitstream_buffer_id, UNREADABLE_INPUT);
return;
}
input_jobs_.push(make_linked_ptr(job_record.release()));
ServiceDeviceTask(false);
}
size_t V4L2JpegDecodeAccelerator::InputBufferQueuedCount() {
return input_buffer_map_.size() - free_input_buffers_.size();
}
size_t V4L2JpegDecodeAccelerator::OutputBufferQueuedCount() {
return output_buffer_map_.size() - free_output_buffers_.size();
}
bool V4L2JpegDecodeAccelerator::ShouldRecreateInputBuffers() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
if (input_jobs_.empty())
return false;
linked_ptr<JobRecord> job_record = input_jobs_.front();
// Check input buffer size is enough
return (input_buffer_map_.empty() ||
(job_record->shm.size() + sizeof(kDefaultDhtSeg)) >
input_buffer_map_.front().length);
}
bool V4L2JpegDecodeAccelerator::RecreateInputBuffers() {
DVLOG(3) << __func__;
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
// If running queue is not empty, we should wait until pending frames finish.
if (!running_jobs_.empty())
return true;
DestroyInputBuffers();
if (!CreateInputBuffers()) {
LOG(ERROR) << "Create input buffers failed.";
return false;
}
return true;
}
bool V4L2JpegDecodeAccelerator::RecreateOutputBuffers() {
DVLOG(3) << __func__;
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
DestroyOutputBuffers();
if (!CreateOutputBuffers()) {
LOG(ERROR) << "Create output buffers failed.";
return false;
}
return true;
}
bool V4L2JpegDecodeAccelerator::CreateInputBuffers() {
DVLOG(3) << __func__;
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
DCHECK(!input_streamon_);
DCHECK(!input_jobs_.empty());
linked_ptr<JobRecord> job_record = input_jobs_.front();
// The input image may miss huffman table. We didn't parse the image before,
// so we create more to avoid the situation of not enough memory.
// Reserve twice size to avoid recreating input buffer frequently.
size_t reserve_size = (job_record->shm.size() + sizeof(kDefaultDhtSeg)) * 2;
struct v4l2_format format;
memset(&format, 0, sizeof(format));
format.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
format.fmt.pix.pixelformat = V4L2_PIX_FMT_JPEG;
format.fmt.pix.sizeimage = reserve_size;
format.fmt.pix.field = V4L2_FIELD_ANY;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format);
struct v4l2_requestbuffers reqbufs;
memset(&reqbufs, 0, sizeof(reqbufs));
reqbufs.count = kBufferCount;
reqbufs.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
reqbufs.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_REQBUFS, &reqbufs);
DCHECK(input_buffer_map_.empty());
input_buffer_map_.resize(reqbufs.count);
for (size_t i = 0; i < input_buffer_map_.size(); ++i) {
free_input_buffers_.push_back(i);
struct v4l2_buffer buffer;
memset(&buffer, 0, sizeof(buffer));
buffer.index = i;
buffer.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
buffer.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYBUF, &buffer);
void* address = device_->Mmap(NULL, buffer.length, PROT_READ | PROT_WRITE,
MAP_SHARED, buffer.m.offset);
if (address == MAP_FAILED) {
PLOG(ERROR) << __func__ << ": mmap() failed";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return false;
}
input_buffer_map_[i].address = address;
input_buffer_map_[i].length = buffer.length;
}
return true;
}
bool V4L2JpegDecodeAccelerator::CreateOutputBuffers() {
DVLOG(3) << __func__;
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
DCHECK(!output_streamon_);
DCHECK(!running_jobs_.empty());
linked_ptr<JobRecord> job_record = running_jobs_.front();
size_t frame_size = VideoFrame::AllocationSize(
PIXEL_FORMAT_I420, job_record->out_frame->coded_size());
struct v4l2_format format;
memset(&format, 0, sizeof(format));
format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
format.fmt.pix.width = job_record->out_frame->coded_size().width();
format.fmt.pix.height = job_record->out_frame->coded_size().height();
format.fmt.pix.sizeimage = frame_size;
format.fmt.pix.pixelformat = V4L2_PIX_FMT_YUV420;
format.fmt.pix.field = V4L2_FIELD_ANY;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format);
output_buffer_pixelformat_ = format.fmt.pix.pixelformat;
output_buffer_coded_size_.SetSize(format.fmt.pix.width,
format.fmt.pix.height);
struct v4l2_requestbuffers reqbufs;
memset(&reqbufs, 0, sizeof(reqbufs));
reqbufs.count = kBufferCount;
reqbufs.type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
reqbufs.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_REQBUFS, &reqbufs);
DCHECK(output_buffer_map_.empty());
output_buffer_map_.resize(reqbufs.count);
VideoPixelFormat output_format =
V4L2Device::V4L2PixFmtToVideoPixelFormat(output_buffer_pixelformat_);
for (size_t i = 0; i < output_buffer_map_.size(); ++i) {
free_output_buffers_.push_back(i);
struct v4l2_buffer buffer;
memset(&buffer, 0, sizeof(buffer));
buffer.index = i;
buffer.type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
buffer.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYBUF, &buffer);
DCHECK_GE(buffer.length,
VideoFrame::AllocationSize(
output_format,
gfx::Size(format.fmt.pix.width, format.fmt.pix.height)));
void* address = device_->Mmap(NULL, buffer.length, PROT_READ | PROT_WRITE,
MAP_SHARED, buffer.m.offset);
if (address == MAP_FAILED) {
PLOG(ERROR) << __func__ << ": mmap() failed";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return false;
}
output_buffer_map_[i].address = address;
output_buffer_map_[i].length = buffer.length;
}
return true;
}
void V4L2JpegDecodeAccelerator::DestroyInputBuffers() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
DCHECK(!input_streamon_);
if (input_streamon_) {
__u32 type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
IOCTL_OR_ERROR_RETURN(VIDIOC_STREAMOFF, &type);
input_streamon_ = false;
}
for (size_t i = 0; i < input_buffer_map_.size(); ++i) {
BufferRecord& input_record = input_buffer_map_[i];
device_->Munmap(input_record.address, input_record.length);
}
struct v4l2_requestbuffers reqbufs;
memset(&reqbufs, 0, sizeof(reqbufs));
reqbufs.count = 0;
reqbufs.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
reqbufs.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_LOG_ERROR(VIDIOC_REQBUFS, &reqbufs);
input_buffer_map_.clear();
free_input_buffers_.clear();
}
void V4L2JpegDecodeAccelerator::DestroyOutputBuffers() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
DCHECK(!output_streamon_);
if (output_streamon_) {
__u32 type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
IOCTL_OR_ERROR_RETURN(VIDIOC_STREAMOFF, &type);
output_streamon_ = false;
}
for (size_t i = 0; i < output_buffer_map_.size(); ++i) {
BufferRecord& output_record = output_buffer_map_[i];
device_->Munmap(output_record.address, output_record.length);
}
struct v4l2_requestbuffers reqbufs;
memset(&reqbufs, 0, sizeof(reqbufs));
reqbufs.count = 0;
reqbufs.type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
reqbufs.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_LOG_ERROR(VIDIOC_REQBUFS, &reqbufs);
output_buffer_map_.clear();
free_output_buffers_.clear();
}
void V4L2JpegDecodeAccelerator::DevicePollTask() {
DCHECK(device_poll_task_runner_->BelongsToCurrentThread());
bool event_pending;
if (!device_->Poll(true, &event_pending)) {
PLOG(ERROR) << __func__ << ": Poll device error.";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return;
}
// All processing should happen on ServiceDeviceTask(), since we shouldn't
// touch decoder state from this thread.
decoder_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::ServiceDeviceTask,
base::Unretained(this), event_pending));
}
bool V4L2JpegDecodeAccelerator::DequeueSourceChangeEvent() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
struct v4l2_event ev;
memset(&ev, 0, sizeof(ev));
if (device_->Ioctl(VIDIOC_DQEVENT, &ev) == 0) {
if (ev.type == V4L2_EVENT_SOURCE_CHANGE) {
DVLOG(3) << __func__
<< ": got source change event: " << ev.u.src_change.changes;
if (ev.u.src_change.changes &
(V4L2_EVENT_SRC_CH_RESOLUTION | V4L2_EVENT_SRC_CH_PIXELFORMAT)) {
return true;
}
LOG(ERROR) << __func__ << ": unexpected source change event.";
} else {
LOG(ERROR) << __func__ << ": got an event (" << ev.type
<< ") we haven't subscribed to.";
}
} else {
LOG(ERROR) << __func__ << ": dequeue event failed.";
}
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return false;
}
void V4L2JpegDecodeAccelerator::ServiceDeviceTask(bool event_pending) {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
// If DestroyTask() shuts |device_poll_thread_| down, we should early-out.
if (!device_poll_thread_.IsRunning())
return;
if (!running_jobs_.empty())
Dequeue();
if (ShouldRecreateInputBuffers() && !RecreateInputBuffers())
return;
if (event_pending) {
if (!DequeueSourceChangeEvent())
return;
if (!RecreateOutputBuffers())
return;
}
EnqueueInput();
EnqueueOutput();
if (!running_jobs_.empty()) {
device_poll_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::DevicePollTask,
base::Unretained(this)));
}
DVLOG(2) << __func__ << ": buffer counts: INPUT["
<< input_jobs_.size() << "] => DEVICE["
<< free_input_buffers_.size() << "/"
<< input_buffer_map_.size() << "->"
<< free_output_buffers_.size() << "/"
<< output_buffer_map_.size() << "]";
}
void V4L2JpegDecodeAccelerator::EnqueueInput() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
while (!input_jobs_.empty() && !free_input_buffers_.empty()) {
// If input buffers are required to re-create, do not enqueue input record
// until all pending frames are handled by device.
if (ShouldRecreateInputBuffers())
break;
if (!EnqueueInputRecord())
return;
}
// Check here because we cannot STREAMON before QBUF in earlier kernel.
// (kernel version < 3.14)
if (!input_streamon_ && InputBufferQueuedCount()) {
__u32 type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
IOCTL_OR_ERROR_RETURN(VIDIOC_STREAMON, &type);
input_streamon_ = true;
}
}
void V4L2JpegDecodeAccelerator::EnqueueOutput() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
// Output record can be enqueued because the output coded sizes of the frames
// currently in the pipeline are all the same.
while (running_jobs_.size() > OutputBufferQueuedCount() &&
!free_output_buffers_.empty()) {
if (!EnqueueOutputRecord())
return;
}
// Check here because we cannot STREAMON before QBUF in earlier kernel.
// (kernel version < 3.14)
if (!output_streamon_ && OutputBufferQueuedCount()) {
__u32 type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
IOCTL_OR_ERROR_RETURN(VIDIOC_STREAMON, &type);
output_streamon_ = true;
}
}
static bool CopyOutputImage(const uint32_t src_pixelformat,
const void* src_addr,
const gfx::Size& src_coded_size,
const scoped_refptr<VideoFrame>& dst_frame) {
VideoPixelFormat format =
V4L2Device::V4L2PixFmtToVideoPixelFormat(src_pixelformat);
size_t src_size = VideoFrame::AllocationSize(format, src_coded_size);
uint8_t* dst_y = dst_frame->data(VideoFrame::kYPlane);
uint8_t* dst_u = dst_frame->data(VideoFrame::kUPlane);
uint8_t* dst_v = dst_frame->data(VideoFrame::kVPlane);
size_t dst_y_stride = dst_frame->stride(VideoFrame::kYPlane);
size_t dst_u_stride = dst_frame->stride(VideoFrame::kUPlane);
size_t dst_v_stride = dst_frame->stride(VideoFrame::kVPlane);
// If the source format is I420, ConvertToI420 will simply copy the frame.
if (libyuv::ConvertToI420(static_cast<uint8_t*>(const_cast<void*>(src_addr)),
src_size,
dst_y, dst_y_stride,
dst_u, dst_u_stride,
dst_v, dst_v_stride,
0, 0,
src_coded_size.width(),
src_coded_size.height(),
dst_frame->coded_size().width(),
dst_frame->coded_size().height(),
libyuv::kRotate0,
src_pixelformat)) {
LOG(ERROR) << "ConvertToI420 failed. Source format: " << src_pixelformat;
return false;
}
return true;
}
void V4L2JpegDecodeAccelerator::Dequeue() {
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
// Dequeue completed input (VIDEO_OUTPUT) buffers,
// and recycle to the free list.
struct v4l2_buffer dqbuf;
while (InputBufferQueuedCount() > 0) {
DCHECK(input_streamon_);
memset(&dqbuf, 0, sizeof(dqbuf));
dqbuf.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
dqbuf.memory = V4L2_MEMORY_MMAP;
if (device_->Ioctl(VIDIOC_DQBUF, &dqbuf) != 0) {
if (errno == EAGAIN) {
// EAGAIN if we're just out of buffers to dequeue.
break;
}
PLOG(ERROR) << "ioctl() failed: input buffer VIDIOC_DQBUF failed.";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return;
}
BufferRecord& input_record = input_buffer_map_[dqbuf.index];
DCHECK(input_record.at_device);
input_record.at_device = false;
free_input_buffers_.push_back(dqbuf.index);
if (dqbuf.flags & V4L2_BUF_FLAG_ERROR) {
DVLOG(1) << "Dequeue input buffer error.";
PostNotifyError(kInvalidBitstreamBufferId, UNSUPPORTED_JPEG);
running_jobs_.pop();
}
}
// Dequeue completed output (VIDEO_CAPTURE) buffers, recycle to the free list.
// Return the finished buffer to the client via the job ready callback.
// If dequeued input buffer has an error, the error frame has removed from
// |running_jobs_|. We only have to dequeue output buffer when we actually
// have pending frames in |running_jobs_| and also enqueued output buffers.
while (!running_jobs_.empty() && OutputBufferQueuedCount() > 0) {
DCHECK(output_streamon_);
memset(&dqbuf, 0, sizeof(dqbuf));
dqbuf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
// From experiments, using MMAP and memory copy is still faster than
// USERPTR. Also, client doesn't need to consider the buffer alignment and
// JpegDecodeAccelerator API will be simpler.
dqbuf.memory = V4L2_MEMORY_MMAP;
if (device_->Ioctl(VIDIOC_DQBUF, &dqbuf) != 0) {
if (errno == EAGAIN) {
// EAGAIN if we're just out of buffers to dequeue.
break;
}
PLOG(ERROR) << "ioctl() failed: output buffer VIDIOC_DQBUF failed.";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return;
}
BufferRecord& output_record = output_buffer_map_[dqbuf.index];
DCHECK(output_record.at_device);
output_record.at_device = false;
free_output_buffers_.push_back(dqbuf.index);
// Jobs are always processed in FIFO order.
linked_ptr<JobRecord> job_record = running_jobs_.front();
running_jobs_.pop();
if (dqbuf.flags & V4L2_BUF_FLAG_ERROR) {
DVLOG(1) << "Dequeue output buffer error.";
PostNotifyError(kInvalidBitstreamBufferId, UNSUPPORTED_JPEG);
} else {
// Copy the decoded data from output buffer to the buffer provided by the
// client. Do format conversion when output format is not
// V4L2_PIX_FMT_YUV420.
if (!CopyOutputImage(output_buffer_pixelformat_, output_record.address,
output_buffer_coded_size_, job_record->out_frame)) {
PostNotifyError(job_record->bitstream_buffer_id, PLATFORM_FAILURE);
return;
}
DVLOG(3) << "Decoding finished, returning bitstream buffer, id="
<< job_record->bitstream_buffer_id;
child_task_runner_->PostTask(
FROM_HERE, base::Bind(&V4L2JpegDecodeAccelerator::VideoFrameReady,
weak_ptr_, job_record->bitstream_buffer_id));
}
}
}
static bool AddHuffmanTable(const void* input_ptr,
size_t input_size,
void* output_ptr,
size_t output_size) {
DCHECK(input_ptr);
DCHECK(output_ptr);
DCHECK_LE((input_size + sizeof(kDefaultDhtSeg)), output_size);
base::BigEndianReader reader(static_cast<const char*>(input_ptr), input_size);
bool has_marker_dht = false;
bool has_marker_sos = false;
uint8_t marker1, marker2;
READ_U8_OR_RETURN_FALSE(reader, &marker1);
READ_U8_OR_RETURN_FALSE(reader, &marker2);
if (marker1 != JPEG_MARKER_PREFIX || marker2 != JPEG_SOI) {
DLOG(ERROR) << __func__ << ": The input is not a Jpeg";
return false;
}
// copy SOI marker (0xFF, 0xD8)
memcpy(output_ptr, input_ptr, 2);
size_t current_offset = 2;
while (!has_marker_sos && !has_marker_dht) {
const char* start_addr = reader.ptr();
READ_U8_OR_RETURN_FALSE(reader, &marker1);
if (marker1 != JPEG_MARKER_PREFIX) {
DLOG(ERROR) << __func__ << ": marker1 != 0xFF";
return false;
}
do {
READ_U8_OR_RETURN_FALSE(reader, &marker2);
} while (marker2 == JPEG_MARKER_PREFIX); // skip fill bytes
uint16_t size;
READ_U16_OR_RETURN_FALSE(reader, &size);
// The size includes the size field itself.
if (size < sizeof(size)) {
DLOG(ERROR) << __func__ << ": Ill-formed JPEG. Segment size (" << size
<< ") is smaller than size field (" << sizeof(size) << ")";
return false;
}
size -= sizeof(size);
switch (marker2) {
case JPEG_DHT: {
has_marker_dht = true;
break;
}
case JPEG_SOS: {
if (!has_marker_dht) {
memcpy(static_cast<uint8_t*>(output_ptr) + current_offset,
kDefaultDhtSeg, sizeof(kDefaultDhtSeg));
current_offset += sizeof(kDefaultDhtSeg);
}
has_marker_sos = true;
break;
}
default:
break;
}
if (!reader.Skip(size)) {
DLOG(ERROR) << __func__ << ": Ill-formed JPEG. Remaining size ("
<< reader.remaining()
<< ") is smaller than header specified (" << size << ")";
return false;
}
size_t segment_size = static_cast<size_t>(reader.ptr() - start_addr);
memcpy(static_cast<uint8_t*>(output_ptr) + current_offset, start_addr,
segment_size);
current_offset += segment_size;
}
if (reader.remaining()) {
memcpy(static_cast<uint8_t*>(output_ptr) + current_offset, reader.ptr(),
reader.remaining());
}
return true;
}
bool V4L2JpegDecodeAccelerator::EnqueueInputRecord() {
DCHECK(!input_jobs_.empty());
DCHECK(!free_input_buffers_.empty());
// Enqueue an input (VIDEO_OUTPUT) buffer for an input video frame.
linked_ptr<JobRecord> job_record = input_jobs_.front();
input_jobs_.pop();
const int index = free_input_buffers_.back();
BufferRecord& input_record = input_buffer_map_[index];
DCHECK(!input_record.at_device);
// It will add default huffman segment if it's missing.
if (!AddHuffmanTable(job_record->shm.memory(), job_record->shm.size(),
input_record.address, input_record.length)) {
PostNotifyError(job_record->bitstream_buffer_id, PARSE_JPEG_FAILED);
return false;
}
struct v4l2_buffer qbuf;
memset(&qbuf, 0, sizeof(qbuf));
qbuf.index = index;
qbuf.type = V4L2_BUF_TYPE_VIDEO_OUTPUT;
qbuf.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QBUF, &qbuf);
input_record.at_device = true;
running_jobs_.push(job_record);
free_input_buffers_.pop_back();
DVLOG(3) << __func__
<< ": enqueued frame id=" << job_record->bitstream_buffer_id
<< " to device.";
return true;
}
bool V4L2JpegDecodeAccelerator::EnqueueOutputRecord() {
DCHECK(!free_output_buffers_.empty());
// Enqueue an output (VIDEO_CAPTURE) buffer.
const int index = free_output_buffers_.back();
BufferRecord& output_record = output_buffer_map_[index];
DCHECK(!output_record.at_device);
struct v4l2_buffer qbuf;
memset(&qbuf, 0, sizeof(qbuf));
qbuf.index = index;
qbuf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE;
qbuf.memory = V4L2_MEMORY_MMAP;
IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QBUF, &qbuf);
output_record.at_device = true;
free_output_buffers_.pop_back();
return true;
}
void V4L2JpegDecodeAccelerator::StartDevicePoll() {
DVLOG(3) << __func__ << ": starting device poll";
DCHECK(decoder_task_runner_->BelongsToCurrentThread());
DCHECK(!device_poll_thread_.IsRunning());
if (!device_poll_thread_.Start()) {
LOG(ERROR) << __func__ << ": Device thread failed to start";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return;
}
device_poll_task_runner_ = device_poll_thread_.task_runner();
}
bool V4L2JpegDecodeAccelerator::StopDevicePoll() {
DVLOG(3) << __func__ << ": stopping device poll";
// Signal the DevicePollTask() to stop, and stop the device poll thread.
if (!device_->SetDevicePollInterrupt()) {
LOG(ERROR) << __func__ << ": SetDevicePollInterrupt failed.";
PostNotifyError(kInvalidBitstreamBufferId, PLATFORM_FAILURE);
return false;
}
device_poll_thread_.Stop();
// Clear the interrupt now, to be sure.
if (!device_->ClearDevicePollInterrupt())
return false;
return true;
}
} // namespace media