blob: 64c02744f2758f0fcb6494968243dbd8b87e2033 [file] [log] [blame]
// Copyright 2017 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "remoting/codec/webrtc_video_encoder_gpu.h"
#include <memory>
#include <utility>
#include "base/bind.h"
#include "base/bind_helpers.h"
#include "base/logging.h"
#include "base/memory/ptr_util.h"
#include "base/memory/unsafe_shared_memory_region.h"
#include "build/build_config.h"
#include "gpu/config/gpu_preferences.h"
#include "media/gpu/gpu_video_encode_accelerator_factory.h"
#include "remoting/base/constants.h"
#include "third_party/libyuv/include/libyuv/convert_from_argb.h"
#include "third_party/webrtc/modules/desktop_capture/desktop_frame.h"
#include "third_party/webrtc/modules/desktop_capture/desktop_geometry.h"
namespace {
// Currently, the frame scheduler only encodes a single frame at a time. Thus,
// there's no reason to have this set to anything greater than one.
const int kWebrtcVideoEncoderGpuOutputBufferCount = 1;
constexpr media::VideoCodecProfile kH264Profile =
media::VideoCodecProfile::H264PROFILE_MAIN;
constexpr int kH264MinimumTargetBitrateKbpsPerMegapixel = 1800;
void ArgbToI420(const webrtc::DesktopFrame& frame,
scoped_refptr<media::VideoFrame> video_frame) {
const uint8_t* rgb_data = frame.data();
const int rgb_stride = frame.stride();
const int y_stride = video_frame->stride(0);
DCHECK_EQ(video_frame->stride(1), video_frame->stride(2));
const int uv_stride = video_frame->stride(1);
uint8_t* y_data = video_frame->data(0);
uint8_t* u_data = video_frame->data(1);
uint8_t* v_data = video_frame->data(2);
libyuv::ARGBToI420(rgb_data, rgb_stride, y_data, y_stride, u_data, uv_stride,
v_data, uv_stride, video_frame->visible_rect().width(),
video_frame->visible_rect().height());
}
gpu::GpuPreferences CreateGpuPreferences() {
gpu::GpuPreferences gpu_preferences;
#if defined(OS_WIN)
gpu_preferences.enable_media_foundation_vea_on_windows7 = true;
#endif
return gpu_preferences;
}
} // namespace
namespace remoting {
WebrtcVideoEncoderGpu::WebrtcVideoEncoderGpu(
media::VideoCodecProfile codec_profile)
: state_(UNINITIALIZED),
codec_profile_(codec_profile),
bitrate_filter_(kH264MinimumTargetBitrateKbpsPerMegapixel) {}
WebrtcVideoEncoderGpu::~WebrtcVideoEncoderGpu() = default;
// TODO(gusss): Implement either a software fallback or some sort of delay if
// the hardware encoder crashes.
// Bug: crbug.com/751870
void WebrtcVideoEncoderGpu::Encode(std::unique_ptr<webrtc::DesktopFrame> frame,
const FrameParams& params,
WebrtcVideoEncoder::EncodeCallback done) {
DCHECK(frame);
DCHECK(done);
DCHECK_GT(params.duration, base::TimeDelta::FromMilliseconds(0));
bitrate_filter_.SetFrameSize(frame->size().width(), frame->size().height());
if (state_ == INITIALIZATION_ERROR) {
// TODO(zijiehe): The screen resolution limitation of H264 encoder is much
// smaller (3840x2176) than VP8 (16k x 16k) or VP9 (65k x 65k). It's more
// likely the initialization may fail by using H264 encoder. We should
// provide a way to tell the WebrtcVideoStream to stop the video stream.
DLOG(ERROR) << "Encoder failed to initialize; dropping encode request";
// Initialization fails only when the input frame size exceeds the
// limitation.
std::move(done).Run(EncodeResult::FRAME_SIZE_EXCEEDS_CAPABILITY, nullptr);
return;
}
DVLOG(3) << __func__ << " bitrate = " << params.bitrate_kbps << ", "
<< "duration = " << params.duration << ", "
<< "key_frame = " << params.key_frame;
if (state_ == UNINITIALIZED ||
input_visible_size_.width() != frame->size().width() ||
input_visible_size_.height() != frame->size().height()) {
DVLOG(3) << __func__ << " Currently not initialized for frame size "
<< frame->size().width() << "x" << frame->size().height()
<< ". Initializing.";
input_visible_size_ =
gfx::Size(frame->size().width(), frame->size().height());
pending_encode_ = base::BindOnce(&WebrtcVideoEncoderGpu::Encode,
weak_factory_.GetWeakPtr(),
std::move(frame), params, std::move(done));
BeginInitialization();
return;
}
// If we get to this point and state_ != INITIALIZED, we may be attempting to
// have multiple outstanding encode requests, which is not currently
// supported. The current assumption is that the FrameScheduler will wait for
// an Encode to finish before attempting another.
DCHECK_EQ(state_, INITIALIZED);
scoped_refptr<media::VideoFrame> video_frame = media::VideoFrame::CreateFrame(
media::VideoPixelFormat::PIXEL_FORMAT_I420, input_coded_size_,
gfx::Rect(input_visible_size_), input_visible_size_, base::TimeDelta());
base::TimeDelta new_timestamp = previous_timestamp_ + params.duration;
video_frame->set_timestamp(new_timestamp);
previous_timestamp_ = new_timestamp;
// H264 encoder on Windows supports only I420.
ArgbToI420(*frame, video_frame);
callbacks_[video_frame->timestamp()] = std::move(done);
if (params.bitrate_kbps > 0 && params.fps > 0) {
// TODO(zijiehe): Forward frame_rate from FrameParams.
bitrate_filter_.SetBandwidthEstimateKbps(params.bitrate_kbps);
video_encode_accelerator_->RequestEncodingParametersChange(
bitrate_filter_.GetTargetBitrateKbps() * 1000, params.fps);
}
video_encode_accelerator_->Encode(video_frame, params.key_frame);
}
void WebrtcVideoEncoderGpu::RequireBitstreamBuffers(
unsigned int input_count,
const gfx::Size& input_coded_size,
size_t output_buffer_size) {
DCHECK(state_ == INITIALIZING);
DVLOG(3) << __func__ << ", "
<< "input_count = " << input_count << ", "
<< "input_coded_size = " << input_coded_size.width() << "x"
<< input_coded_size.height() << ", "
<< "output_buffer_size = " << output_buffer_size;
required_input_frame_count_ = input_count;
input_coded_size_ = input_coded_size;
output_buffer_size_ = output_buffer_size;
output_buffers_.clear();
for (unsigned int i = 0; i < kWebrtcVideoEncoderGpuOutputBufferCount; ++i) {
auto output_buffer = std::make_unique<OutputBuffer>();
output_buffer->region =
base::UnsafeSharedMemoryRegion::Create(output_buffer_size_);
output_buffer->mapping = output_buffer->region.Map();
// TODO(gusss): Do we need to handle mapping failure more gracefully?
CHECK(output_buffer->IsValid());
output_buffers_.push_back(std::move(output_buffer));
}
for (size_t i = 0; i < output_buffers_.size(); ++i) {
UseOutputBitstreamBufferId(i);
}
state_ = INITIALIZED;
RunAnyPendingEncode();
}
void WebrtcVideoEncoderGpu::BitstreamBufferReady(
int32_t bitstream_buffer_id,
const media::BitstreamBufferMetadata& metadata) {
DVLOG(3) << __func__ << " bitstream_buffer_id = " << bitstream_buffer_id
<< ", "
<< "payload_size = " << metadata.payload_size_bytes << ", "
<< "key_frame = " << metadata.key_frame << ", "
<< "timestamp ms = " << metadata.timestamp.InMilliseconds();
std::unique_ptr<EncodedFrame> encoded_frame =
std::make_unique<EncodedFrame>();
OutputBuffer* output_buffer = output_buffers_[bitstream_buffer_id].get();
DCHECK(output_buffer->IsValid());
base::span<char> data_span =
output_buffer->mapping.GetMemoryAsSpan<char>(metadata.payload_size_bytes);
encoded_frame->data.assign(data_span.begin(), data_span.end());
encoded_frame->key_frame = metadata.key_frame;
encoded_frame->size = webrtc::DesktopSize(input_coded_size_.width(),
input_coded_size_.height());
encoded_frame->quantizer = 0;
encoded_frame->codec = webrtc::kVideoCodecH264;
UseOutputBitstreamBufferId(bitstream_buffer_id);
auto callback_it = callbacks_.find(metadata.timestamp);
DCHECK(callback_it != callbacks_.end())
<< "Callback not found for timestamp " << metadata.timestamp;
std::move(std::get<1>(*callback_it)).Run(
EncodeResult::SUCCEEDED, std::move(encoded_frame));
callbacks_.erase(metadata.timestamp);
}
void WebrtcVideoEncoderGpu::NotifyError(
media::VideoEncodeAccelerator::Error error) {
LOG(ERROR) << __func__ << " error: " << error;
}
bool WebrtcVideoEncoderGpu::OutputBuffer::IsValid() {
return region.IsValid() && mapping.IsValid();
}
void WebrtcVideoEncoderGpu::BeginInitialization() {
DVLOG(3) << __func__;
media::VideoPixelFormat input_format =
media::VideoPixelFormat::PIXEL_FORMAT_I420;
// TODO(zijiehe): implement some logical way to set an initial bitrate.
// Currently we set the bitrate to 8M bits / 1M bytes per frame, and 30 frames
// per second.
uint32_t initial_bitrate = kTargetFrameRate * 1024 * 1024 * 8;
const media::VideoEncodeAccelerator::Config config(
input_format, input_visible_size_, codec_profile_, initial_bitrate);
video_encode_accelerator_ =
media::GpuVideoEncodeAcceleratorFactory::CreateVEA(
config, this, CreateGpuPreferences());
if (!video_encode_accelerator_) {
LOG(ERROR) << "Could not create VideoEncodeAccelerator";
state_ = INITIALIZATION_ERROR;
RunAnyPendingEncode();
return;
}
state_ = INITIALIZING;
}
void WebrtcVideoEncoderGpu::UseOutputBitstreamBufferId(
int32_t bitstream_buffer_id) {
DVLOG(3) << __func__ << " id=" << bitstream_buffer_id;
video_encode_accelerator_->UseOutputBitstreamBuffer(media::BitstreamBuffer(
bitstream_buffer_id,
output_buffers_[bitstream_buffer_id]->region.Duplicate(),
output_buffers_[bitstream_buffer_id]->region.GetSize()));
}
void WebrtcVideoEncoderGpu::RunAnyPendingEncode() {
if (pending_encode_)
std::move(pending_encode_).Run();
}
// static
std::unique_ptr<WebrtcVideoEncoder> WebrtcVideoEncoderGpu::CreateForH264() {
DVLOG(3) << __func__;
LOG(WARNING) << "H264 video encoder is created.";
// HIGH profile requires Windows 8 or upper. Considering encoding latency,
// frame size and image quality, MAIN should be fine for us.
return base::WrapUnique(new WebrtcVideoEncoderGpu(kH264Profile));
}
// static
bool WebrtcVideoEncoderGpu::IsSupportedByH264(
const WebrtcVideoEncoderSelector::Profile& profile) {
media::VideoEncodeAccelerator::SupportedProfiles profiles =
media::GpuVideoEncodeAcceleratorFactory::GetSupportedProfiles(
CreateGpuPreferences());
for (const auto& supported_profile : profiles) {
if (supported_profile.profile != kH264Profile) {
continue;
}
double supported_framerate = supported_profile.max_framerate_numerator;
supported_framerate /= supported_profile.max_framerate_denominator;
if (profile.frame_rate > supported_framerate) {
continue;
}
if (profile.resolution.GetArea() >
supported_profile.max_resolution.GetArea()) {
continue;
}
return true;
}
return false;
}
} // namespace remoting