blob: 38efdf7b116db99dc197fbd8a0efb6a1cc7ca41b [file] [log] [blame]
// Copyright 2015 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "media/muxers/webm_muxer.h"
#include <algorithm>
#include <cstdint>
#include <cstring>
#include <memory>
#include <numbers>
#include <optional>
#include <string>
#include <variant>
#include "base/check.h"
#include "base/compiler_specific.h"
#include "base/containers/circular_deque.h"
#include "base/containers/span.h"
#include "base/containers/span_writer.h"
#include "base/logging.h"
#include "base/memory/scoped_refptr.h"
#include "base/metrics/histogram_functions.h"
#include "base/numerics/safe_math.h"
#include "base/sequence_checker.h"
#include "base/time/time.h"
#include "base/timer/elapsed_timer.h"
#include "base/trace_event/trace_event.h"
#include "media/base/audio_codecs.h"
#include "media/base/audio_parameters.h"
#include "media/base/limits.h"
#include "media/base/video_codecs.h"
#include "media/base/video_frame.h"
#include "media/formats/common/opus_constants.h"
#include "media/muxers/muxer.h"
#include "third_party/libwebm/source/mkvmuxer.hpp"
#include "ui/gfx/color_space.h"
#include "ui/gfx/geometry/size.h"
namespace media {
namespace {
namespace av1 {
// CodecPrivate for AV1. See
// https://github.com/ietf-wg-cellar/matroska-specification/blob/master/codec/av1.md.
constexpr int marker = 1;
constexpr int version = 1;
constexpr int high_bitdepth = 0;
constexpr int twelve_bit = 0;
constexpr int monochrome = 0;
constexpr int initial_presentation_delay_present = 0;
constexpr int initial_presentation_delay_minus_one = 0;
constexpr int chroma_sample_position = 0;
constexpr int seq_profile = 0; // Main
constexpr int seq_level_idx_0 = 9; // level 4.1 ~1920x1080@60fps
constexpr int seq_tier_0 = 0;
constexpr int chroma_subsampling_x = 1;
constexpr int chroma_subsampling_y = 1;
constexpr uint8_t codec_private[4] = {
(marker << 7) | version, //
(seq_profile << 5) | seq_level_idx_0, //
(seq_tier_0 << 7) | //
(high_bitdepth << 6) | //
(twelve_bit << 5) | //
(monochrome << 4) | //
(chroma_subsampling_x << 3) | //
(chroma_subsampling_y << 2) | //
chroma_sample_position, //
(initial_presentation_delay_present << 4) | //
initial_presentation_delay_minus_one //
};
} // namespace av1
void WriteOpusHeader(const AudioParameters& params,
base::span<uint8_t> header) {
// See https://wiki.xiph.org/OggOpus#ID_Header.
// Set magic signature.
static constexpr char label[] = "OpusHead";
base::SpanWriter writer(header);
writer.Write(base::byte_span_from_cstring(label));
// Set Opus version.
writer.WriteU8LittleEndian(1);
// Set channel count.
DCHECK_LE(params.channels(), 2);
writer.WriteU8LittleEndian(params.channels());
// Set pre-skip
uint16_t skip = 0;
writer.WriteU16LittleEndian(skip);
// Set original input sample rate in Hz.
writer.WriteU32LittleEndian(params.sample_rate());
// Set output gain in dB.
uint16_t gain = 0;
writer.WriteU16LittleEndian(gain);
// Set channel mapping family (Mono or L/R Stereo).
writer.WriteU8LittleEndian(0);
}
static double GetFrameRate(const Muxer::VideoParameters& params) {
const double kZeroFrameRate = 0.0;
const double kDefaultFrameRate = 30.0;
double frame_rate = params.frame_rate;
if (frame_rate <= kZeroFrameRate ||
frame_rate > limits::kMaxFramesPerSecond) {
frame_rate = kDefaultFrameRate;
}
return frame_rate;
}
static const char kH264CodecId[] = "V_MPEG4/ISO/AVC";
#if BUILDFLAG(ENABLE_HEVC_PARSER_AND_HW_DECODER)
static const char kHevcCodecId[] = "V_MPEGH/ISO/HEVC";
#endif
static const char kPcmCodecId[] = "A_PCM/FLOAT/IEEE";
static const char* MkvCodeIcForMediaVideoCodecId(VideoCodec video_codec) {
switch (video_codec) {
case VideoCodec::kVP8:
return mkvmuxer::Tracks::kVp8CodecId;
case VideoCodec::kVP9:
return mkvmuxer::Tracks::kVp9CodecId;
case VideoCodec::kAV1:
return mkvmuxer::Tracks::kAv1CodecId;
case VideoCodec::kH264:
return kH264CodecId;
#if BUILDFLAG(ENABLE_HEVC_PARSER_AND_HW_DECODER)
case VideoCodec::kHEVC:
return kHevcCodecId;
#endif
default:
NOTREACHED() << "Unsupported codec " << GetCodecName(video_codec);
}
}
std::optional<mkvmuxer::Colour> ColorFromColorSpace(
const gfx::ColorSpace& color) {
using mkvmuxer::Colour;
using MatrixID = gfx::ColorSpace::MatrixID;
using RangeID = gfx::ColorSpace::RangeID;
using TransferID = gfx::ColorSpace::TransferID;
using PrimaryID = gfx::ColorSpace::PrimaryID;
Colour colour;
int matrix_coefficients;
switch (color.GetMatrixID()) {
case MatrixID::BT709:
matrix_coefficients = Colour::kBt709;
break;
case MatrixID::BT2020_NCL:
matrix_coefficients = Colour::kBt2020NonConstantLuminance;
break;
default:
return std::nullopt;
}
colour.set_matrix_coefficients(matrix_coefficients);
int range;
switch (color.GetRangeID()) {
case RangeID::LIMITED:
range = Colour::kBroadcastRange;
break;
case RangeID::FULL:
range = Colour::kFullRange;
break;
default:
return std::nullopt;
}
colour.set_range(range);
int transfer_characteristics;
switch (color.GetTransferID()) {
case TransferID::BT709:
transfer_characteristics = Colour::kIturBt709Tc;
break;
case TransferID::SRGB:
transfer_characteristics = Colour::kIec6196621;
break;
case TransferID::PQ:
transfer_characteristics = Colour::kSmpteSt2084;
break;
default:
return std::nullopt;
}
colour.set_transfer_characteristics(transfer_characteristics);
int primaries;
switch (color.GetPrimaryID()) {
case PrimaryID::BT709:
primaries = Colour::kIturBt709P;
break;
case PrimaryID::BT2020:
primaries = Colour::kIturBt2020;
break;
default:
return std::nullopt;
}
colour.set_primaries(primaries);
return colour;
}
void SetProjection(mkvmuxer::VideoTrack* video_track,
VideoTransformation transformation) {
mkvmuxer::Projection proj = mkvmuxer::Projection();
// This is based off ffmpeg matroska encoding code. The following is to
// determine the roll and yaw (mirroring) of the Projection (mirroring).
const int roll = [transformation]() {
switch (transformation.rotation) {
case VIDEO_ROTATION_0:
return 0;
case VIDEO_ROTATION_90:
return transformation.mirrored ? 90 : -90;
case VIDEO_ROTATION_180:
return 180;
case VIDEO_ROTATION_270:
return transformation.mirrored ? -90 : 90;
}
}();
proj.set_pose_pitch(0);
proj.set_pose_roll(roll);
proj.set_pose_yaw(transformation.mirrored ? 180 : 0);
video_track->SetProjection(proj);
}
} // anonymous namespace
// -----------------------------------------------------------------------------
// WebmMuxer::Delegate:
WebmMuxer::Delegate::Delegate() {
// Creation can be done on a different sequence than main activities.
DETACH_FROM_SEQUENCE(sequence_checker_);
}
WebmMuxer::Delegate::~Delegate() = default;
mkvmuxer::int32 WebmMuxer::Delegate::Write(const void* buf,
mkvmuxer::uint32 len) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DVLOG(2) << __func__ << " len " << len;
DCHECK(buf);
const auto result = DoWrite(
// SAFETY: Caller is explicitly calling us with a `buf` of size `len` from
// a 3rd party library that we can't change to use spans.
UNSAFE_BUFFERS(base::span(static_cast<const uint8_t*>(buf), len)));
position_ += len;
return result;
}
// -----------------------------------------------------------------------------
// WebmMuxer:
WebmMuxer::WebmMuxer(AudioCodec audio_codec,
bool has_video,
bool has_audio,
std::unique_ptr<Delegate> delegate,
std::optional<base::TimeDelta> max_data_output_interval)
: audio_codec_(audio_codec),
has_video_(has_video),
has_audio_(has_audio),
max_data_output_interval_(
std::max(max_data_output_interval.value_or(base::TimeDelta()),
kMinimumForcedOutputDuration)),
delegate_(std::move(delegate)) {
DCHECK(has_video_ || has_audio_);
DCHECK(delegate_);
DCHECK(audio_codec == AudioCodec::kOpus || audio_codec == AudioCodec::kPCM)
<< " Unsupported audio codec: " << GetCodecName(audio_codec);
delegate_->InitSegment(&segment_);
mkvmuxer::SegmentInfo* const info = segment_.GetSegmentInfo();
info->set_writing_app("Chrome");
info->set_muxing_app("Chrome");
// Creation can be done on a different sequence than main activities.
DETACH_FROM_SEQUENCE(sequence_checker_);
}
WebmMuxer::~WebmMuxer() = default;
bool WebmMuxer::Flush() {
// Depending on the |delegate_|, it can be either non-seekable (i.e. a live
// stream), or seekable (file mode). So calling |segment_.Finalize()| here is
// needed.
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
return segment_.Finalize();
}
void WebmMuxer::AddVideoTrack(
const gfx::Size& frame_size,
double frame_rate,
std::optional<gfx::ColorSpace> color_space,
std::optional<VideoTransformation> transformation) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK_EQ(0u, video_track_index_)
<< "WebmMuxer can only be initialized once.";
video_track_index_ =
segment_.AddVideoTrack(frame_size.width(), frame_size.height(), 0);
if (video_track_index_ <= 0) { // See https://crbug.com/616391.
NOTREACHED() << "Error adding video track";
}
mkvmuxer::VideoTrack* const video_track =
reinterpret_cast<mkvmuxer::VideoTrack*>(
segment_.GetTrackByNumber(video_track_index_));
if (color_space) {
auto colour = ColorFromColorSpace(*color_space);
if (colour) {
video_track->SetColour(*colour);
}
}
if (transformation) {
SetProjection(video_track, transformation.value());
}
DCHECK(video_track);
video_track->set_codec_id(MkvCodeIcForMediaVideoCodecId(video_codec_));
DCHECK_EQ(0ull, video_track->crop_right());
DCHECK_EQ(0ull, video_track->crop_left());
DCHECK_EQ(0ull, video_track->crop_top());
DCHECK_EQ(0ull, video_track->crop_bottom());
DCHECK_EQ(0.0f, video_track->frame_rate());
// Segment's timestamps should be in milliseconds, DCHECK it. See
// http://www.webmproject.org/docs/container/#muxer-guidelines
DCHECK_EQ(1000000ull, segment_.GetSegmentInfo()->timecode_scale());
// Set alpha channel parameters for only VPX (crbug.com/711825).
if (video_codec_ == VideoCodec::kH264 || video_codec_ == VideoCodec::kHEVC) {
return;
}
video_track->SetAlphaMode(mkvmuxer::VideoTrack::kAlpha);
// Alpha channel, if present, is stored in a BlockAdditional next to the
// associated opaque Block, see
// https://matroska.org/technical/specs/index.html#BlockAdditional.
// This follows Method 1 for VP8 encoding of A-channel described on
// http://wiki.webmproject.org/alpha-channel.
video_track->set_max_block_additional_id(1);
}
void WebmMuxer::AddAudioTrack(const AudioParameters& params) {
DVLOG(1) << __func__ << " " << params.AsHumanReadableString();
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
DCHECK_EQ(0u, audio_track_index_)
<< "WebmMuxer audio can only be initialised once.";
audio_track_index_ =
segment_.AddAudioTrack(params.sample_rate(), params.channels(), 0);
if (audio_track_index_ <= 0) { // See https://crbug.com/616391.
NOTREACHED() << "Error adding audio track";
}
mkvmuxer::AudioTrack* const audio_track =
reinterpret_cast<mkvmuxer::AudioTrack*>(
segment_.GetTrackByNumber(audio_track_index_));
DCHECK(audio_track);
DCHECK_EQ(params.sample_rate(), audio_track->sample_rate());
DCHECK_EQ(params.channels(), static_cast<int>(audio_track->channels()));
DCHECK_LE(params.channels(), 2)
<< "Only 1 or 2 channels supported, requested " << params.channels();
// Audio data is always pcm_f32le.
audio_track->set_bit_depth(32u);
if (audio_codec_ == AudioCodec::kOpus) {
audio_track->set_codec_id(mkvmuxer::Tracks::kOpusCodecId);
uint8_t opus_header[OPUS_EXTRADATA_SIZE];
WriteOpusHeader(params, opus_header);
if (!audio_track->SetCodecPrivate(opus_header, OPUS_EXTRADATA_SIZE)) {
LOG(ERROR) << __func__ << ": failed to set opus header.";
}
// Segment's timestamps should be in milliseconds, DCHECK it. See
// http://www.webmproject.org/docs/container/#muxer-guidelines
DCHECK_EQ(1000000ull, segment_.GetSegmentInfo()->timecode_scale());
} else if (audio_codec_ == AudioCodec::kPCM) {
audio_track->set_codec_id(kPcmCodecId);
}
}
bool WebmMuxer::PutFrame(EncodedFrame frame,
base::TimeDelta relative_timestamp) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
AudioParameters* audio_params = std::get_if<AudioParameters>(&frame.params);
TRACE_EVENT2("media", __func__, "timestamp", relative_timestamp,
"is_keyframe", frame.data->is_key_frame());
DVLOG(2) << __func__ << " - " << (audio_params ? "A " : "V ")
<< frame.data->size() << "B ts " << relative_timestamp;
if (audio_params) {
MaybeForceNewCluster(relative_timestamp);
if (!audio_track_index_) {
AddAudioTrack(*audio_params);
}
} else {
// Clusterfuzz: mkvmuxer suffers from use-after-free on receiving zero-sized
// video data inputs - ignore these.
if (frame.data->empty()) {
return true;
}
auto* video_params = std::get_if<VideoParameters>(&frame.params);
CHECK(video_params);
DCHECK(video_params->codec == VideoCodec::kVP8 ||
video_params->codec == VideoCodec::kVP9 ||
video_params->codec == VideoCodec::kH264 ||
video_params->codec == VideoCodec::kAV1
#if BUILDFLAG(ENABLE_HEVC_PARSER_AND_HW_DECODER)
|| video_params->codec == VideoCodec::kHEVC
#endif
)
<< " Unsupported video codec: " << GetCodecName(video_params->codec);
DCHECK(video_codec_ == VideoCodec::kUnknown ||
video_codec_ == video_params->codec)
<< "Unsupported: codec switched, to: "
<< GetCodecName(video_params->codec);
if (!video_track_index_) {
CHECK(frame.data->is_key_frame());
// |track_index_|, cannot be zero (!), initialize WebmMuxer in that case.
// http://www.matroska.org/technical/specs/index.html#Tracks
video_codec_ = video_params->codec;
AddVideoTrack(video_params->visible_rect_size,
GetFrameRate(*video_params), video_params->color_space,
video_params->transformation);
// Add codec private for AV1.
if (video_params->codec == VideoCodec::kAV1 &&
!segment_.GetTrackByNumber(video_track_index_)
->SetCodecPrivate(av1::codec_private,
sizeof(av1::codec_private))) {
LOG(ERROR) << __func__ << " failed to set CodecPrivate for AV1.";
}
}
}
buffered_frames_.emplace_back(std::move(frame), relative_timestamp);
// Do not emit frames before we've emitted track headers to the muxer.
if ((has_video_ && !video_track_index_) ||
(has_audio_ && !audio_track_index_)) {
return true;
}
bool result = true;
for (auto& [buffered_frame, timestamp] : buffered_frames_) {
result &= WriteWebmFrame(std::move(buffered_frame), timestamp);
}
buffered_frames_.clear();
return result;
}
bool WebmMuxer::WriteWebmFrame(EncodedFrame frame,
base::TimeDelta relative_timestamp) {
if (force_one_libwebm_error_) {
DVLOG(1) << "Forcing a libwebm error";
force_one_libwebm_error_ = false;
return false;
}
auto recorded_timestamp = relative_timestamp.InNanoseconds();
uint8_t track_index = std::get_if<AudioParameters>(&frame.params)
? audio_track_index_
: video_track_index_;
auto frame_data_span = base::span(*frame.data);
return frame.data->side_data() && !frame.data->side_data()->alpha_data.empty()
? segment_.AddFrameWithAdditional(
frame_data_span.data(), frame_data_span.size(),
frame.data->side_data()->alpha_data.data(),
frame.data->side_data()->alpha_data.size(), /*add_id=*/1,
track_index, recorded_timestamp, frame.data->is_key_frame())
: segment_.AddFrame(frame_data_span.data(), frame_data_span.size(),
track_index, recorded_timestamp,
frame.data->is_key_frame());
}
void WebmMuxer::MaybeForceNewCluster(base::TimeDelta media_relative_timestamp) {
DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_);
// Forces a new cluster on the next frame if the time since the last flush
// exceeds the max data output interval. This ensures that data is output
// periodically.
if (cluster_origin_.has_value()) {
if (media_relative_timestamp - *cluster_origin_ >=
max_data_output_interval_) {
TRACE_EVENT0("media", "ForceNewClusterOnNextFrame");
segment_.ForceNewClusterOnNextFrame();
cluster_origin_ = media_relative_timestamp;
}
} else {
cluster_origin_ = media_relative_timestamp;
}
}
} // namespace media