blob: b0bac85137412b355c4f462a3ddc0ffb86467672 [file] [log] [blame]
// Copyright 2018 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "media/gpu/gpu_video_encode_accelerator_helpers.h"
#include <algorithm>
#include <ostream>
#include "base/check_op.h"
#include "base/notreached.h"
#include "base/numerics/safe_conversions.h"
#include "media/base/bitrate.h"
namespace media {
namespace {
// The maximum number of supported spatial layers and temporal layers. These
// come from the maximum number of layers currently supported by
// VideoEncodeAccelerator implementation.
constexpr size_t kMaxSpatialLayers = 3;
constexpr size_t kMaxTemporalLayers = 3;
// The maximum size for output buffer, which is chosen empirically for
// 1080p video.
constexpr size_t kMaxBitstreamBufferSizeInBytes = 2 * 1024 * 1024; // 2MB
// The frame size for 1080p (FHD) video in pixels.
constexpr int k1080PSizeInPixels = 1920 * 1080;
// The frame size for 1440p (QHD) video in pixels.
constexpr int k1440PSizeInPixels = 2560 * 1440;
// The mapping from resolution, bitrate, framerate to the bitstream buffer size.
struct BitstreamBufferSizeInfo {
int coded_size_area;
uint32_t bitrate_in_bps;
uint32_t framerate;
uint32_t buffer_size_in_bytes;
};
// The bitstream buffer size for each resolution. The table must be sorted in
// increasing order by the resolution. The value is decided by measuring the
// biggest buffer size, and then double the size as margin. (crbug.com/889739)
constexpr BitstreamBufferSizeInfo kBitstreamBufferSizeTable[] = {
{320 * 180, 100000, 30, 15000},
{640 * 360, 500000, 30, 52000},
{1280 * 720, 1200000, 30, 110000},
{1920 * 1080, 4000000, 30, 380000},
{3840 * 2160, 20000000, 30, 970000},
};
// Use quadruple size of kMaxBitstreamBufferSizeInBytes when the input frame
// size is larger than 1440p, double if larger than 1080p. This is chosen
// empirically for some 4k encoding use cases and Android CTS VideoEncoderTest
// (crbug.com/927284).
size_t GetMaxEncodeBitstreamBufferSize(const gfx::Size& size) {
if (size.GetArea() > k1440PSizeInPixels)
return kMaxBitstreamBufferSizeInBytes * 4;
if (size.GetArea() > k1080PSizeInPixels)
return kMaxBitstreamBufferSizeInBytes * 2;
return kMaxBitstreamBufferSizeInBytes;
}
} // namespace
// This function sets the peak equal to the target. The peak can then be
// updated by callers.
VideoBitrateAllocation AllocateBitrateForDefaultEncodingWithBitrates(
const std::vector<uint32_t>& sl_bitrates,
const size_t num_temporal_layers,
const bool uses_vbr) {
CHECK(!sl_bitrates.empty());
CHECK_LE(sl_bitrates.size(), kMaxSpatialLayers);
// The same bitrate factors as the software encoder.
// https://source.chromium.org/chromium/chromium/src/+/main:media/video/vpx_video_encoder.cc;l=131;drc=d383d0b3e4f76789a6de2a221c61d3531f4c59da
constexpr double kTemporalLayersBitrateScaleFactors[][kMaxTemporalLayers] = {
{1.00, 0.00, 0.00}, // For one temporal layer.
{0.60, 0.40, 0.00}, // For two temporal layers.
{0.50, 0.20, 0.30}, // For three temporal layers.
};
CHECK_GT(num_temporal_layers, 0u);
CHECK_LE(num_temporal_layers, std::size(kTemporalLayersBitrateScaleFactors));
DCHECK_EQ(std::size(kTemporalLayersBitrateScaleFactors), kMaxTemporalLayers);
VideoBitrateAllocation bitrate_allocation;
bitrate_allocation = VideoBitrateAllocation(
uses_vbr ? Bitrate::Mode::kVariable : Bitrate::Mode::kConstant);
for (size_t spatial_id = 0; spatial_id < sl_bitrates.size(); ++spatial_id) {
const uint32_t bitrate_bps = sl_bitrates[spatial_id];
for (size_t temporal_id = 0; temporal_id < num_temporal_layers;
++temporal_id) {
const double factor =
kTemporalLayersBitrateScaleFactors[num_temporal_layers - 1]
[temporal_id];
bitrate_allocation.SetBitrate(
spatial_id, temporal_id,
base::saturated_cast<uint32_t>(bitrate_bps * factor));
}
}
return bitrate_allocation;
}
size_t GetEncodeBitstreamBufferSize(const gfx::Size& size,
uint32_t bitrate,
uint32_t framerate) {
DCHECK_NE(framerate, 0u);
for (auto& data : kBitstreamBufferSizeTable) {
if (size.GetArea() <= data.coded_size_area) {
// The buffer size is proportional to (bitrate / framerate), but linear
// interpolation for smaller ratio is not enough. Therefore we only use
// linear extrapolation for larger ratio.
double ratio = std::max(
1.0f * (bitrate / framerate) / (data.bitrate_in_bps / data.framerate),
1.0f);
return std::min(static_cast<size_t>(data.buffer_size_in_bytes * ratio),
GetMaxEncodeBitstreamBufferSize(size));
}
}
return GetMaxEncodeBitstreamBufferSize(size);
}
// Get the maximum output bitstream buffer size. Since we don't change the
// buffer size when we update bitrate and framerate, we have to calculate the
// buffer size for the maximum bitrate.
// However, the maximum bitrate for intel chipset is 40Mbps. The buffer size
// calculated with this bitrate is always larger than 2MB. Therefore we just
// return the value.
// TODO(crbug.com/889739): Deprecate this function after we can update the
// buffer size while requesting new bitrate and framerate.
size_t GetEncodeBitstreamBufferSize(const gfx::Size& size) {
return GetMaxEncodeBitstreamBufferSize(size);
}
std::vector<uint8_t> GetFpsAllocation(size_t num_temporal_layers) {
DCHECK_LT(num_temporal_layers, 4u);
constexpr uint8_t kFullAllocation = 255;
// The frame rate fraction is given as an 8 bit unsigned integer where 0 = 0%
// and 255 = 100%. Each layer's allocated fps refers to the previous one, so
// e.g. your camera is opened at 30fps, and you want to have decode targets at
// 15fps and 7.5fps as well:
// TL0 then gets an allocation of 7.5/30 = 1/4. TL1 adds another 7.5fps to end
// up at (7.5 + 7.5)/30 = 15/30 = 1/2 of the total allocation. TL2 adds the
// final 15fps to end up at (15 + 15)/30, which is the full allocation.
// Therefor, fps_allocation values are as follows,
// fps_allocation[0][0] = kFullAllocation / 4;
// fps_allocation[0][1] = kFullAllocation / 2;
// fps_allocation[0][2] = kFullAllocation;
// For more information, see webrtc::VideoEncoderInfo::fps_allocation.
switch (num_temporal_layers) {
case 1:
// In this case, the number of spatial layers must great than 1.
return {kFullAllocation};
case 2:
return {kFullAllocation / 2, kFullAllocation};
case 3:
return {kFullAllocation / 4, kFullAllocation / 2, kFullAllocation};
default:
NOTREACHED() << "Unsupported temporal layers";
return {};
}
}
VideoBitrateAllocation AllocateBitrateForDefaultEncoding(
const VideoEncodeAccelerator::Config& config) {
if (config.bitrate.mode() == Bitrate::Mode::kExternal) {
return VideoBitrateAllocation(Bitrate::Mode::kExternal);
}
VideoBitrateAllocation allocation;
const bool use_vbr = config.bitrate.mode() == Bitrate::Mode::kVariable;
if (config.spatial_layers.empty()) {
allocation = AllocateBitrateForDefaultEncodingWithBitrates(
{config.bitrate.target_bps()},
/*num_temporal_layers=*/1u, use_vbr);
if (use_vbr) {
allocation.SetPeakBps(config.bitrate.peak_bps());
}
return allocation;
}
const size_t num_temporal_layers =
config.spatial_layers[0].num_of_temporal_layers;
std::vector<uint32_t> bitrates;
bitrates.reserve(config.spatial_layers.size());
for (const auto& spatial_layer : config.spatial_layers) {
DCHECK_EQ(spatial_layer.num_of_temporal_layers, num_temporal_layers);
bitrates.push_back(spatial_layer.bitrate_bps);
}
allocation = AllocateBitrateForDefaultEncodingWithBitrates(
bitrates, num_temporal_layers, use_vbr);
if (use_vbr) {
allocation.SetPeakBps(config.bitrate.peak_bps());
}
return allocation;
}
VideoBitrateAllocation AllocateDefaultBitrateForTesting(
const size_t num_spatial_layers,
const size_t num_temporal_layers,
const Bitrate& bitrate) {
// Higher spatial layers (those to the right) get more bitrate.
constexpr double kSpatialLayersBitrateScaleFactors[][kMaxSpatialLayers] = {
{1.00, 0.00, 0.00}, // For one spatial layer.
{0.30, 0.70, 0.00}, // For two spatial layers.
{0.07, 0.23, 0.70}, // For three spatial layers.
};
CHECK_GT(num_spatial_layers, 0u);
CHECK_LE(num_spatial_layers, std::size(kSpatialLayersBitrateScaleFactors));
DCHECK_EQ(std::size(kSpatialLayersBitrateScaleFactors), kMaxSpatialLayers);
std::vector<uint32_t> bitrates(num_spatial_layers);
for (size_t sid = 0; sid < num_spatial_layers; ++sid) {
const double bitrate_factor =
kSpatialLayersBitrateScaleFactors[num_spatial_layers - 1][sid];
bitrates[sid] = bitrate.target_bps() * bitrate_factor;
}
const bool use_vbr = bitrate.mode() == Bitrate::Mode::kVariable;
auto allocation = AllocateBitrateForDefaultEncodingWithBitrates(
bitrates, num_temporal_layers, use_vbr);
if (use_vbr)
allocation.SetPeakBps(bitrate.peak_bps());
return allocation;
}
} // namespace media