| // Copyright 2014 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include <stddef.h> |
| #include <stdint.h> |
| |
| #include <algorithm> |
| #include <cmath> |
| #include <cstring> |
| #include <iterator> |
| #include <map> |
| #include <memory> |
| #include <vector> |
| |
| #include "base/base64.h" |
| #include "base/command_line.h" |
| #include "base/files/file_path.h" |
| #include "base/files/file_util.h" |
| #include "base/strings/strcat.h" |
| #include "base/strings/stringprintf.h" |
| #include "base/test/trace_event_analyzer.h" |
| #include "base/time/default_tick_clock.h" |
| #include "base/values.h" |
| #include "build/build_config.h" |
| #include "chrome/browser/extensions/api/tab_capture/tab_capture_performance_test_base.h" |
| #include "chrome/browser/ui/browser.h" |
| #include "chrome/common/chrome_paths.h" |
| #include "chrome/common/chrome_switches.h" |
| #include "chrome/test/base/tracing.h" |
| #include "content/public/common/content_switches.h" |
| #include "content/public/test/browser_test_utils.h" |
| #include "media/base/audio_bus.h" |
| #include "media/base/video_frame.h" |
| #include "media/cast/test/skewed_tick_clock.h" |
| #include "media/cast/test/utility/audio_utility.h" |
| #include "media/cast/test/utility/barcode.h" |
| #include "media/cast/test/utility/default_config.h" |
| #include "media/cast/test/utility/in_process_receiver.h" |
| #include "media/cast/test/utility/net_utility.h" |
| #include "media/cast/test/utility/standalone_cast_environment.h" |
| #include "media/cast/test/utility/udp_proxy.h" |
| #include "net/base/ip_address.h" |
| #include "net/base/ip_endpoint.h" |
| #include "net/base/net_errors.h" |
| #include "net/base/rand_callback.h" |
| #include "net/log/net_log_source.h" |
| #include "net/socket/udp_server_socket.h" |
| #include "testing/perf/perf_test.h" |
| |
| namespace { |
| |
| // Number of events to trim from the begining and end. These events don't |
| // contribute anything toward stable measurements: A brief moment of startup |
| // "jank" is acceptable, and shutdown may result in missing events (e.g., if |
| // streaming stops a few frames before capture stops). |
| constexpr int kTrimEvents = 24; // 1 sec at 24fps, or 0.4 sec at 60 fps. |
| |
| // Minimum number of events required for a reasonable analysis. |
| constexpr int kMinDataPointsForFullRun = 100; // 1s of audio, ~5s at 24fps. |
| |
| // Minimum number of events required for data analysis in a non-performance run. |
| constexpr int kMinDataPointsForQuickRun = 3; |
| |
| // A convenience macro to run a gtest expectation in the "full performance run" |
| // setting, or else a warning that something is not being entirely tested in the |
| // "CQ run" setting. This is required because the test runs in the CQ may not be |
| // long enough to collect sufficient tracing data; and, unfortunately, there's |
| // nothing we can do about that. |
| #define EXPECT_FOR_PERFORMANCE_RUN(expr) \ |
| if (!(expr)) { \ |
| const char *_out = #expr; \ |
| if (is_full_performance_run()) { \ |
| LOG(ERROR) << "Failure: " << _out; \ |
| } else { \ |
| LOG(WARNING) << "Allowing failure: " << _out; \ |
| } \ |
| } |
| |
| enum TestFlags { |
| kSmallWindow = 1 << 2, // Window size: 1 = 800x600, 0 = 2000x1000 |
| k24fps = 1 << 3, // Use 24 fps video. |
| k30fps = 1 << 4, // Use 30 fps video. |
| k60fps = 1 << 5, // Use 60 fps video (captured at 30 fps). |
| kProxyWifi = 1 << 6, // Run UDP through UDPProxy wifi profile. |
| kProxySlow = 1 << 7, // Run UDP through UDPProxy slow profile. |
| kProxyBad = 1 << 8, // Run UDP through UDPProxy bad profile. |
| kSlowClock = 1 << 9, // Receiver clock is 10 seconds slow. |
| kFastClock = 1 << 10, // Receiver clock is 10 seconds fast. |
| kAutoThrottling = 1 << 11, // Use auto-resolution/framerate throttling. |
| }; |
| |
| // These are just for testing! Use cryptographically-secure random keys in |
| // production code! |
| static constexpr char kAesKey[16] = {0, 1, 2, 3, 4, 5, 6, 7, |
| 8, 9, 10, 11, 12, 13, 14, 15}; |
| static constexpr char kAesIvMask[16] = {15, 14, 13, 12, 11, 10, 9, 8, |
| 7, 6, 5, 4, 3, 2, 1, 0}; |
| |
| media::cast::FrameReceiverConfig WithAesKeyAndIvSet( |
| const media::cast::FrameReceiverConfig& config) { |
| media::cast::FrameReceiverConfig result = config; |
| result.aes_key = std::string(kAesKey, kAesKey + sizeof(kAesKey)); |
| result.aes_iv_mask = std::string(kAesIvMask, kAesIvMask + sizeof(kAesIvMask)); |
| return result; |
| } |
| |
| class SkewedCastEnvironment : public media::cast::StandaloneCastEnvironment { |
| public: |
| explicit SkewedCastEnvironment(const base::TimeDelta& delta) |
| : StandaloneCastEnvironment(), |
| skewed_clock_(base::DefaultTickClock::GetInstance()) { |
| // If testing with a receiver clock that is ahead or behind the sender |
| // clock, fake a clock that is offset and also ticks at a rate of 50 parts |
| // per million faster or slower than the local sender's clock. This is the |
| // worst-case scenario for skew in-the-wild. |
| if (!delta.is_zero()) { |
| const double skew = delta < base::TimeDelta() ? 0.999950 : 1.000050; |
| skewed_clock_.SetSkew(skew, delta); |
| } |
| clock_ = &skewed_clock_; |
| } |
| |
| protected: |
| ~SkewedCastEnvironment() override {} |
| |
| private: |
| media::cast::test::SkewedTickClock skewed_clock_; |
| }; |
| |
| // We log one of these for each call to OnAudioFrame/OnVideoFrame. |
| struct TimeData { |
| TimeData(uint16_t frame_no_, base::TimeTicks playout_time_) |
| : frame_no(frame_no_), playout_time(playout_time_) {} |
| // The unit here is video frames, for audio data there can be duplicates. |
| // This was decoded from the actual audio/video data. |
| uint16_t frame_no; |
| // This is when we should play this data, according to the sender. |
| base::TimeTicks playout_time; |
| }; |
| |
| // TODO(hubbe): Move to media/cast to use for offline log analysis. |
| class MeanAndError { |
| public: |
| explicit MeanAndError(const std::vector<double>& values) { |
| double sum = 0.0; |
| double sqr_sum = 0.0; |
| num_values_ = values.size(); |
| if (num_values_ > 0) { |
| for (size_t i = 0; i < num_values_; i++) { |
| sum += values[i]; |
| sqr_sum += values[i] * values[i]; |
| } |
| mean_ = sum / num_values_; |
| std_dev_ = |
| sqrt(std::max(0.0, num_values_ * sqr_sum - sum * sum)) / num_values_; |
| } else { |
| mean_ = NAN; |
| std_dev_ = NAN; |
| } |
| } |
| |
| void SetMeanAsAbsoluteValue() { mean_ = std::abs(mean_); } |
| |
| std::string AsString() const { |
| return base::StringPrintf("%f,%f", mean_, std_dev_); |
| } |
| |
| void Print(const std::string& measurement, |
| const std::string& modifier, |
| const std::string& trace, |
| const std::string& unit) { |
| if (num_values_ > 0) { |
| perf_test::PrintResultMeanAndError(measurement, |
| modifier, |
| trace, |
| AsString(), |
| unit, |
| true); |
| } else { |
| LOG(ERROR) << "No events for " << measurement << modifier << " " << trace; |
| } |
| } |
| |
| private: |
| size_t num_values_; |
| double mean_; |
| double std_dev_; |
| }; |
| |
| // This function checks how smooth the data in |data| is. |
| // It computes the average error of deltas and the average delta. |
| // If data[x] == x * A + B, then this function returns zero. |
| // The unit is milliseconds. |
| static MeanAndError AnalyzeJitter(const std::vector<TimeData>& data) { |
| VLOG(0) << "Jitter analysis on " << data.size() << " values."; |
| std::vector<double> deltas; |
| double sum = 0.0; |
| for (size_t i = 1; i < data.size(); i++) { |
| double delta = |
| (data[i].playout_time - data[i - 1].playout_time).InMillisecondsF(); |
| deltas.push_back(delta); |
| sum += delta; |
| } |
| if (deltas.empty()) { |
| // Not enough data. Don't do the following calculation, to avoid a |
| // divide-by-zero. |
| } else { |
| double mean = sum / deltas.size(); |
| for (size_t i = 0; i < deltas.size(); i++) { |
| deltas[i] = fabs(mean - deltas[i]); |
| } |
| } |
| |
| return MeanAndError(deltas); |
| } |
| |
| // An in-process Cast receiver that examines the audio/video frames being |
| // received and logs some data about each received audio/video frame. |
| class TestPatternReceiver : public media::cast::InProcessReceiver { |
| public: |
| explicit TestPatternReceiver( |
| const scoped_refptr<media::cast::CastEnvironment>& cast_environment, |
| const net::IPEndPoint& local_end_point, |
| bool is_full_performance_run) |
| : InProcessReceiver( |
| cast_environment, |
| local_end_point, |
| net::IPEndPoint(), |
| WithAesKeyAndIvSet(media::cast::GetDefaultAudioReceiverConfig()), |
| WithAesKeyAndIvSet(media::cast::GetDefaultVideoReceiverConfig())), |
| is_full_performance_run_(is_full_performance_run) {} |
| |
| typedef std::map<uint16_t, base::TimeTicks> TimeMap; |
| |
| bool is_full_performance_run() const { return is_full_performance_run_; } |
| |
| // Build a map from frame ID (as encoded in the audio and video data) |
| // to the rtp timestamp for that frame. Note that there will be multiple |
| // audio frames which all have the same frame ID. When that happens we |
| // want the minimum rtp timestamp, because that audio frame is supposed |
| // to play at the same time that the corresponding image is presented. |
| void MapFrameTimes(const std::vector<TimeData>& events, TimeMap* map) { |
| const int trim_count = is_full_performance_run_ ? kTrimEvents : 0; |
| for (int i = trim_count; i < static_cast<int>(events.size()) - trim_count; |
| i++) { |
| base::TimeTicks& frame_tick = (*map)[events[i].frame_no]; |
| if (frame_tick.is_null()) { |
| frame_tick = events[i].playout_time; |
| } else { |
| frame_tick = std::min(events[i].playout_time, frame_tick); |
| } |
| } |
| } |
| |
| void Analyze(const std::string& name, const std::string& modifier) { |
| // First, find the minimum rtp timestamp for each audio and video frame. |
| // Note that the data encoded in the audio stream contains video frame |
| // numbers. So in a 30-fps video stream, there will be 1/30s of "1", then |
| // 1/30s of "2", etc. |
| TimeMap audio_frame_times, video_frame_times; |
| MapFrameTimes(audio_events_, &audio_frame_times); |
| const int min_data_points = is_full_performance_run_ |
| ? kMinDataPointsForFullRun |
| : kMinDataPointsForQuickRun; |
| EXPECT_FOR_PERFORMANCE_RUN(min_data_points <= |
| static_cast<int>(audio_frame_times.size())); |
| MapFrameTimes(video_events_, &video_frame_times); |
| EXPECT_FOR_PERFORMANCE_RUN(min_data_points <= |
| static_cast<int>(video_frame_times.size())); |
| std::vector<double> deltas; |
| for (TimeMap::const_iterator i = audio_frame_times.begin(); |
| i != audio_frame_times.end(); |
| ++i) { |
| TimeMap::const_iterator j = video_frame_times.find(i->first); |
| if (j != video_frame_times.end()) { |
| deltas.push_back((i->second - j->second).InMillisecondsF()); |
| } |
| } |
| EXPECT_FOR_PERFORMANCE_RUN(min_data_points <= |
| static_cast<int>(deltas.size())); |
| |
| MeanAndError av_sync(deltas); |
| av_sync.Print(name, modifier, "av_sync", "ms"); |
| // Close to zero is better (av_sync can be negative). |
| av_sync.SetMeanAsAbsoluteValue(); |
| av_sync.Print(name, modifier, "abs_av_sync", "ms"); |
| // lower is better. |
| AnalyzeJitter(audio_events_).Print(name, modifier, "audio_jitter", "ms"); |
| // lower is better. |
| AnalyzeJitter(video_events_).Print(name, modifier, "video_jitter", "ms"); |
| |
| // Mean resolution of video at receiver. Lower stddev is better, while the |
| // mean should be something reasonable given the network constraints |
| // (usually 480 lines or more). Note that this is the video resolution at |
| // the receiver, but changes originate on the sender side. |
| std::vector<double> slice_for_analysis; |
| const int trim_count = is_full_performance_run_ ? kTrimEvents : 0; |
| if (static_cast<int>(video_frame_lines_.size()) > trim_count * 2) { |
| slice_for_analysis.reserve(video_frame_lines_.size() - trim_count * 2); |
| EXPECT_FOR_PERFORMANCE_RUN( |
| min_data_points <= static_cast<int>(slice_for_analysis.capacity())); |
| std::transform(video_frame_lines_.begin() + trim_count, |
| video_frame_lines_.end() - trim_count, |
| std::back_inserter(slice_for_analysis), |
| [](int lines) { return static_cast<double>(lines); }); |
| } |
| MeanAndError(slice_for_analysis) |
| .Print(name, modifier, "playout_resolution", "lines"); |
| |
| // Number of resolution changes. Lower is better (and 1 is ideal). Zero |
| // indicates a lack of data. |
| int last_lines = -1; |
| int change_count = 0; |
| for (int i = trim_count; |
| i < static_cast<int>(video_frame_lines_.size()) - trim_count; ++i) { |
| if (video_frame_lines_[i] != last_lines) { |
| ++change_count; |
| last_lines = video_frame_lines_[i]; |
| } |
| } |
| EXPECT_FOR_PERFORMANCE_RUN(change_count > 0); |
| perf_test::PrintResult(name, modifier, "resolution_changes", |
| base::NumberToString(change_count), "count", true); |
| } |
| |
| private: |
| // Invoked by InProcessReceiver for each received audio frame. |
| void OnAudioFrame(std::unique_ptr<media::AudioBus> audio_frame, |
| base::TimeTicks playout_time, |
| bool is_continuous) override { |
| CHECK(cast_env()->CurrentlyOn(media::cast::CastEnvironment::MAIN)); |
| |
| if (audio_frame->frames() <= 0) { |
| NOTREACHED() << "OnAudioFrame called with no samples?!?"; |
| return; |
| } |
| |
| TRACE_EVENT_INSTANT1("cast_perf_test", "AudioFramePlayout", |
| TRACE_EVENT_SCOPE_THREAD, "playout_time", |
| (playout_time - base::TimeTicks()).InMicroseconds()); |
| |
| // Note: This is the number of the video frame that this audio belongs to. |
| uint16_t frame_no; |
| if (media::cast::DecodeTimestamp(audio_frame->channel(0), |
| audio_frame->frames(), |
| &frame_no)) { |
| audio_events_.push_back(TimeData(frame_no, playout_time)); |
| } else { |
| DVLOG(2) << "Failed to decode audio timestamp!"; |
| } |
| } |
| |
| void OnVideoFrame(scoped_refptr<media::VideoFrame> video_frame, |
| base::TimeTicks playout_time, |
| bool is_continuous) override { |
| CHECK(cast_env()->CurrentlyOn(media::cast::CastEnvironment::MAIN)); |
| |
| TRACE_EVENT_INSTANT1("cast_perf_test", "VideoFramePlayout", |
| TRACE_EVENT_SCOPE_THREAD, "playout_time", |
| (playout_time - base::TimeTicks()).InMicroseconds()); |
| |
| uint16_t frame_no; |
| if (media::cast::test::DecodeBarcode(*video_frame, &frame_no)) { |
| video_events_.push_back(TimeData(frame_no, playout_time)); |
| } else { |
| DVLOG(2) << "Failed to decode barcode!"; |
| } |
| |
| video_frame_lines_.push_back(video_frame->visible_rect().height()); |
| } |
| |
| const bool is_full_performance_run_; |
| |
| std::vector<TimeData> audio_events_; |
| std::vector<TimeData> video_events_; |
| |
| // The height (number of lines) of each video frame received. |
| std::vector<int> video_frame_lines_; |
| |
| DISALLOW_COPY_AND_ASSIGN(TestPatternReceiver); |
| }; |
| |
| class CastV2PerformanceTest : public TabCapturePerformanceTestBase, |
| public testing::WithParamInterface<int> { |
| public: |
| CastV2PerformanceTest() = default; |
| ~CastV2PerformanceTest() override = default; |
| |
| bool HasFlag(TestFlags flag) const { |
| return (GetParam() & flag) == flag; |
| } |
| |
| std::string GetSuffixForTestFlags() const { |
| std::string suffix; |
| // Note: Add "_gpu" tag for backwards-compatibility with existing |
| // Performance Dashboard timeseries data. |
| suffix += "_gpu"; |
| if (HasFlag(kSmallWindow)) |
| suffix += "_small"; |
| if (HasFlag(k24fps)) |
| suffix += "_24fps"; |
| if (HasFlag(k30fps)) |
| suffix += "_30fps"; |
| if (HasFlag(k60fps)) |
| suffix += "_60fps"; |
| if (HasFlag(kProxyWifi)) |
| suffix += "_wifi"; |
| if (HasFlag(kProxySlow)) |
| suffix += "_slowwifi"; |
| if (HasFlag(kProxyBad)) |
| suffix += "_bad"; |
| if (HasFlag(kSlowClock)) |
| suffix += "_slow"; |
| if (HasFlag(kFastClock)) |
| suffix += "_fast"; |
| if (HasFlag(kAutoThrottling)) |
| suffix += "_autothrottling"; |
| return suffix; |
| } |
| |
| int get_fps() const { |
| if (HasFlag(k24fps)) |
| return 24; |
| if (HasFlag(k30fps)) |
| return 30; |
| if (HasFlag(k60fps)) |
| return 60; |
| NOTREACHED(); |
| return 0; |
| } |
| |
| void SetUp() override { |
| // Produce the full HTML test page with the barcode video embedded within |
| // (as a data URI). |
| const base::FilePath video_file = |
| GetApiTestDataDir() |
| .AppendASCII("cast_streaming") |
| .AppendASCII( |
| base::StringPrintf("test_video_%dfps.webm", get_fps())); |
| std::string file_contents; |
| const bool success = base::ReadFileToString(video_file, &file_contents); |
| CHECK(success) << "Failed to load video at: " << video_file.AsUTF8Unsafe(); |
| std::string video_in_base64; |
| base::Base64Encode(file_contents, &video_in_base64); |
| test_page_html_ = |
| base::StrCat({"<html><body>\n" |
| "<video width='100%' height='100%'>\n" |
| " <source src='data:video/webm;base64,", |
| video_in_base64, |
| "'>\n" |
| "</video>\n" |
| "</body></html>"}); |
| |
| TabCapturePerformanceTestBase::SetUp(); |
| } |
| |
| void SetUpCommandLine(base::CommandLine* command_line) override { |
| if (HasFlag(kSmallWindow)) { |
| command_line->AppendSwitchASCII(switches::kWindowSize, "800,600"); |
| } else { |
| command_line->AppendSwitchASCII(switches::kWindowSize, "2000,1500"); |
| } |
| |
| TabCapturePerformanceTestBase::SetUpCommandLine(command_line); |
| } |
| |
| // The key contains the name of the argument and the argument. |
| typedef std::pair<std::string, double> EventMapKey; |
| typedef std::map<EventMapKey, const trace_analyzer::TraceEvent*> EventMap; |
| |
| // Make events findable by their arguments, for instance, if an |
| // event has a "timestamp": 238724 argument, the map will contain |
| // pair<"timestamp", 238724> -> &event. All arguments are indexed. |
| void IndexEvents(trace_analyzer::TraceAnalyzer* analyzer, |
| const std::string& event_name, |
| EventMap* event_map) { |
| trace_analyzer::TraceEventVector events; |
| QueryTraceEvents(analyzer, event_name, &events); |
| for (size_t i = 0; i < events.size(); i++) { |
| std::map<std::string, double>::const_iterator j; |
| for (j = events[i]->arg_numbers.begin(); |
| j != events[i]->arg_numbers.end(); |
| ++j) { |
| (*event_map)[*j] = events[i]; |
| } |
| } |
| } |
| |
| // Look up an event in |event_map|. The return event will have the same |
| // value for the argument |key_name| as |prev_event|. |
| const trace_analyzer::TraceEvent* FindNextEvent( |
| const EventMap& event_map, |
| const trace_analyzer::TraceEvent* prev_event, |
| std::string key_name) { |
| const auto arg_it = prev_event->arg_numbers.find(key_name); |
| if (arg_it == prev_event->arg_numbers.end()) |
| return nullptr; |
| const EventMapKey& key = *arg_it; |
| const auto event_it = event_map.find(key); |
| if (event_it == event_map.end()) |
| return nullptr; |
| return event_it->second; |
| } |
| |
| // Given a vector of vector of data, extract the difference between |
| // two columns (|col_a| and |col_b|) and output the result as a |
| // performance metric. |
| void OutputMeasurement(const std::string& test_name, |
| const std::vector<std::vector<double>>& data, |
| const std::string& measurement_name, |
| int col_a, |
| int col_b) { |
| std::vector<double> tmp; |
| for (size_t i = 0; i < data.size(); i++) { |
| tmp.push_back((data[i][col_b] - data[i][col_a]) / 1000.0); |
| } |
| return MeanAndError(tmp).Print(test_name, |
| GetSuffixForTestFlags(), |
| measurement_name, |
| "ms"); |
| } |
| |
| // Analyze the latency of each frame as it goes from capture to playout. The |
| // event tracing system is used to track the frames. |
| void AnalyzeLatency(const std::string& test_name, |
| trace_analyzer::TraceAnalyzer* analyzer) { |
| // Retrieve and index all "checkpoint" events related to frames progressing |
| // from start to finish. |
| trace_analyzer::TraceEventVector capture_events; |
| // Sender side: |
| QueryTraceEvents(analyzer, "Capture", &capture_events); |
| EventMap onbuffer, sink, inserted, encoded, transmitted, decoded, done; |
| IndexEvents(analyzer, "OnBufferReceived", &onbuffer); |
| IndexEvents(analyzer, "ConsumeVideoFrame", &sink); |
| IndexEvents(analyzer, "InsertRawVideoFrame", &inserted); |
| IndexEvents(analyzer, "VideoFrameEncoded", &encoded); |
| // Receiver side: |
| IndexEvents(analyzer, "PullEncodedVideoFrame", &transmitted); |
| IndexEvents(analyzer, "VideoFrameDecoded", &decoded); |
| IndexEvents(analyzer, "VideoFramePlayout", &done); |
| |
| // Analyzing latency is non-trivial, because only the frame timestamps |
| // uniquely identify frames AND the timestamps take varying forms throughout |
| // the pipeline (TimeTicks, TimeDelta, RtpTimestamp, etc.). Luckily, each |
| // neighboring stage in the pipeline knows about the timestamp from the |
| // prior stage, in whatever form it had, and so it's possible to track |
| // specific frames all the way from capture until playout at the receiver. |
| std::vector<std::pair<EventMap*, std::string>> event_maps; |
| event_maps.push_back(std::make_pair(&onbuffer, "time_delta")); |
| event_maps.push_back(std::make_pair(&sink, "time_delta")); |
| event_maps.push_back(std::make_pair(&inserted, "timestamp")); |
| event_maps.push_back(std::make_pair(&encoded, "rtp_timestamp")); |
| event_maps.push_back(std::make_pair(&transmitted, "rtp_timestamp")); |
| event_maps.push_back(std::make_pair(&decoded, "rtp_timestamp")); |
| event_maps.push_back(std::make_pair(&done, "playout_time")); |
| |
| // For each "begin capture" event, search for all the events following it, |
| // producing a matrix of when each frame reached each pipeline checkpoint. |
| // See the "cheat sheet" below for a description of each pipeline |
| // checkpoint. |
| const int trim_count = is_full_performance_run() ? kTrimEvents : 0; |
| EXPECT_FOR_PERFORMANCE_RUN((trim_count * 2) <= |
| static_cast<int>(capture_events.size())); |
| std::vector<std::vector<double>> traced_frames; |
| for (int i = trim_count; |
| i < static_cast<int>(capture_events.size()) - trim_count; i++) { |
| std::vector<double> times; |
| const trace_analyzer::TraceEvent* event = capture_events[i]; |
| if (!event->other_event) |
| continue; // Begin capture event without a corresponding end event. |
| times.push_back(event->timestamp); // begin capture |
| event = event->other_event; |
| times.push_back(event->timestamp); // end capture |
| const trace_analyzer::TraceEvent* prev_event = event; |
| for (size_t j = 0; j < event_maps.size(); j++) { |
| event = FindNextEvent(*event_maps[j].first, prev_event, |
| event_maps[j].second); |
| if (!event) |
| break; // Missing an event: The frame was dropped along the way. |
| prev_event = event; |
| times.push_back(event->timestamp); |
| } |
| if (event) { |
| // Successfully traced frame from beginning to end. |
| traced_frames.push_back(std::move(times)); |
| } |
| } |
| |
| // Report the fraction of captured frames that were dropped somewhere along |
| // the way (i.e., before playout at the receiver). |
| const int capture_event_count = capture_events.size() - 2 * trim_count; |
| EXPECT_FOR_PERFORMANCE_RUN((is_full_performance_run() |
| ? kMinDataPointsForFullRun |
| : kMinDataPointsForQuickRun) <= |
| capture_event_count); |
| const double success_percent = |
| (capture_event_count == 0) |
| ? NAN |
| : (100.0 * traced_frames.size() / capture_event_count); |
| perf_test::PrintResult( |
| test_name, GetSuffixForTestFlags(), "frame_drop_rate", |
| base::StringPrintf("%f", 100 - success_percent), "percent", true); |
| |
| // Report the latency between various pairs of checkpoints in the pipeline. |
| // Lower latency is better for all of these measurements. |
| // |
| // Cheat sheet: |
| // 0 = Sender: capture begin |
| // 1 = Sender: capture end |
| // 2 = Sender: memory buffer reached the render process |
| // 3 = Sender: frame routed to Cast RTP consumer |
| // 4 = Sender: frame reached VideoSender::InsertRawVideoFrame() |
| // 5 = Sender: frame encoding complete, queueing for transmission |
| // 6 = Receiver: frame fully received from network |
| // 7 = Receiver: frame decoded |
| // 8 = Receiver: frame played out |
| OutputMeasurement(test_name, traced_frames, "total_latency", 0, 8); |
| OutputMeasurement(test_name, traced_frames, "capture_duration", 0, 1); |
| OutputMeasurement(test_name, traced_frames, "send_to_renderer", 1, 3); |
| OutputMeasurement(test_name, traced_frames, "encode", 3, 5); |
| OutputMeasurement(test_name, traced_frames, "transmit", 5, 6); |
| OutputMeasurement(test_name, traced_frames, "decode", 6, 7); |
| OutputMeasurement(test_name, traced_frames, "cast_latency", 3, 8); |
| } |
| |
| MeanAndError AnalyzeTraceDistance(trace_analyzer::TraceAnalyzer* analyzer, |
| const std::string& event_name) { |
| trace_analyzer::TraceEventVector events; |
| QueryTraceEvents(analyzer, event_name, &events); |
| |
| const int trim_count = is_full_performance_run() ? kTrimEvents : 0; |
| std::vector<double> deltas; |
| for (int i = trim_count + 1; |
| i < static_cast<int>(events.size()) - trim_count; ++i) { |
| double delta_micros = events[i]->timestamp - events[i - 1]->timestamp; |
| deltas.push_back(delta_micros / 1000.0); |
| } |
| return MeanAndError(deltas); |
| } |
| |
| protected: |
| // The complete HTML test web page without any external dependencies, |
| // including the entire barcode video as an embedded data URI. Populated in |
| // SetUp(). |
| std::string test_page_html_; |
| |
| // While the source video frame rate may vary (24, 30, or 60 FPS), the maximum |
| // capture frame rate is always fixed at 30 FPS. This allows testing of the |
| // entire system when it is forced to perform a 60→30 frame rate conversion. |
| static constexpr int kMaxCaptureFrameRate = 30; |
| |
| // Naming of performance measurement written to stdout. |
| static const char kTestName[]; |
| }; |
| |
| // static |
| const char CastV2PerformanceTest::kTestName[] = "CastV2Performance"; |
| |
| } // namespace |
| |
| IN_PROC_BROWSER_TEST_P(CastV2PerformanceTest, Performance) { |
| net::IPEndPoint receiver_end_point = media::cast::test::GetFreeLocalPort(); |
| VLOG(1) << "Got local UDP port for testing: " |
| << receiver_end_point.ToString(); |
| |
| // Start the in-process receiver that examines audio/video for the expected |
| // test patterns. |
| base::TimeDelta delta = base::TimeDelta::FromSeconds(0); |
| if (HasFlag(kFastClock)) { |
| delta = base::TimeDelta::FromSeconds(10); |
| } |
| if (HasFlag(kSlowClock)) { |
| delta = base::TimeDelta::FromSeconds(-10); |
| } |
| scoped_refptr<media::cast::StandaloneCastEnvironment> cast_environment( |
| new SkewedCastEnvironment(delta)); |
| auto receiver = std::make_unique<TestPatternReceiver>( |
| cast_environment, receiver_end_point, is_full_performance_run()); |
| receiver->Start(); |
| |
| // Create a proxy for the UDP packets that simulates certain network |
| // environments. |
| std::unique_ptr<media::cast::test::UDPProxy> udp_proxy; |
| if (HasFlag(kProxyWifi) || HasFlag(kProxySlow) || HasFlag(kProxyBad)) { |
| net::IPEndPoint proxy_end_point = media::cast::test::GetFreeLocalPort(); |
| if (HasFlag(kProxyWifi)) { |
| udp_proxy = media::cast::test::UDPProxy::Create( |
| proxy_end_point, receiver_end_point, media::cast::test::WifiNetwork(), |
| media::cast::test::WifiNetwork(), nullptr); |
| } else if (HasFlag(kProxySlow)) { |
| udp_proxy = media::cast::test::UDPProxy::Create( |
| proxy_end_point, receiver_end_point, media::cast::test::SlowNetwork(), |
| media::cast::test::SlowNetwork(), nullptr); |
| } else if (HasFlag(kProxyBad)) { |
| udp_proxy = media::cast::test::UDPProxy::Create( |
| proxy_end_point, receiver_end_point, media::cast::test::BadNetwork(), |
| media::cast::test::BadNetwork(), nullptr); |
| } |
| receiver_end_point = proxy_end_point; |
| } |
| |
| // Load the extension and test page, and tell the extension to start tab |
| // capture + Cast Streaming. |
| LoadExtension(GetApiTestDataDir() |
| .AppendASCII("cast_streaming") |
| .AppendASCII("perftest_extension")); |
| NavigateToTestPage(test_page_html_); |
| const base::Value response = SendMessageToExtension(base::StringPrintf( |
| "{start:true, enableAutoThrottling:%s, maxFrameRate:%d, recvPort:%d," |
| " aesKey:'%s', aesIvMask:'%s'}", |
| HasFlag(kAutoThrottling) ? "true" : "false", kMaxCaptureFrameRate, |
| receiver_end_point.port(), |
| base::HexEncode(kAesKey, sizeof(kAesKey)).c_str(), |
| base::HexEncode(kAesIvMask, sizeof(kAesIvMask)).c_str())); |
| const std::string* reason = response.FindStringKey("reason"); |
| ASSERT_TRUE(response.FindBoolKey("success").value_or(false)) |
| << (reason ? *reason : std::string("<MISSING REASON>")); |
| |
| // Now that capture has started, start playing the barcode video in the test |
| // page. |
| const std::string javascript_to_play_video( |
| "new Promise((resolve) => {\n" |
| " const video = document.getElementsByTagName('video')[0];\n" |
| " video.addEventListener('playing', () => { resolve(true); });\n" |
| " video.play();\n" |
| "})"); |
| LOG(INFO) << "Starting playback of barcode video..."; |
| ASSERT_EQ(true, content::EvalJs( |
| browser()->tab_strip_model()->GetActiveWebContents(), |
| javascript_to_play_video)); |
| |
| // Observe the running browser for a while, collecting a trace. |
| TraceAnalyzerUniquePtr analyzer = TraceAndObserve( |
| "gpu.capture,cast_perf_test", |
| std::vector<base::StringPiece>{ |
| // From the Compositor/Capture pipeline... |
| "Capture", "OnBufferReceived", "ConsumeVideoFrame", |
| // From the Cast Sender's pipeline... |
| "InsertRawVideoFrame", "VideoFrameEncoded", |
| // From the Cast Receiver's pipeline... |
| "PullEncodedVideoFrame", "VideoFrameDecoded", |
| // From the TestPatternReceiver (see class above!)... |
| "VideoFramePlayout", "AudioFramePlayout"}, |
| // In a full performance run, events will be trimmed from both ends of |
| // trace. Otherwise, just require the bare-minimum to verify the stats |
| // calculations will work. |
| is_full_performance_run() ? (2 * kTrimEvents + kMinDataPointsForFullRun) |
| : kMinDataPointsForQuickRun); |
| |
| // Shut down the receiver and all the CastEnvironment threads. |
| VLOG(1) << "Shutting-down receiver and CastEnvironment..."; |
| receiver->Stop(); |
| cast_environment->Shutdown(); |
| |
| VLOG(1) << "Analyzing trace events..."; |
| |
| // This prints out the average time between capture events. |
| // Depending on the test, the capture frame rate is capped (e.g., at 30fps, |
| // this score cannot get any better than 33.33 ms). However, the measurement |
| // is important since it provides a valuable check that capture can keep up |
| // with the content's framerate. |
| MeanAndError capture_data = AnalyzeTraceDistance(analyzer.get(), "Capture"); |
| // Lower is better. |
| capture_data.Print(kTestName, GetSuffixForTestFlags(), |
| "time_between_captures", "ms"); |
| |
| receiver->Analyze(kTestName, GetSuffixForTestFlags()); |
| |
| AnalyzeLatency(kTestName, analyzer.get()); |
| } |
| |
| #if !defined(OS_CHROMEOS) || !defined(MEMORY_SANITIZER) |
| INSTANTIATE_TEST_SUITE_P(, |
| CastV2PerformanceTest, |
| testing::Values(k24fps, |
| k30fps, |
| k60fps, |
| k30fps | kProxyWifi, |
| k30fps | kProxyBad, |
| k30fps | kSlowClock, |
| k30fps | kFastClock, |
| k30fps | kProxyWifi | kAutoThrottling, |
| k30fps | kProxySlow | kAutoThrottling, |
| k30fps | kProxyBad | kAutoThrottling)); |
| #endif |