kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 1 | /* |
pwestin@webrtc.org | ce33035 | 2012-04-12 06:59:14 +0000 | [diff] [blame] | 2 | * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
kjellander@webrtc.org | 5b97b12 | 2011-12-08 07:42:18 +0000 | [diff] [blame] | 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #include "modules/video_coding/codecs/test/videoprocessor.h" |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 12 | |
Yves Gerey | 3e70781 | 2018-11-28 16:47:49 +0100 | [diff] [blame] | 13 | #include <string.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 14 | |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 15 | #include <algorithm> |
Yves Gerey | 3e70781 | 2018-11-28 16:47:49 +0100 | [diff] [blame] | 16 | #include <cstddef> |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 17 | #include <limits> |
Mirko Bonadei | 317a1f0 | 2019-09-17 17:06:18 +0200 | [diff] [blame] | 18 | #include <memory> |
Erik Språng | 08127a9 | 2016-11-16 16:41:30 +0100 | [diff] [blame] | 19 | #include <utility> |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 20 | |
Mirko Bonadei | d970807 | 2019-01-25 20:26:48 +0100 | [diff] [blame] | 21 | #include "api/scoped_refptr.h" |
Jiawei Ou | c2ebe21 | 2018-11-08 10:02:56 -0800 | [diff] [blame] | 22 | #include "api/video/builtin_video_bitrate_allocator_factory.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 23 | #include "api/video/i420_buffer.h" |
Yves Gerey | 3e70781 | 2018-11-28 16:47:49 +0100 | [diff] [blame] | 24 | #include "api/video/video_bitrate_allocator_factory.h" |
| 25 | #include "api/video/video_frame_buffer.h" |
| 26 | #include "api/video/video_rotation.h" |
| 27 | #include "api/video_codecs/video_codec.h" |
Elad Alon | 370f93a | 2019-06-11 14:57:57 +0200 | [diff] [blame] | 28 | #include "api/video_codecs/video_encoder.h" |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 29 | #include "common_video/h264/h264_common.h" |
Rasmus Brandt | 5f7a891 | 2018-02-28 17:17:15 +0100 | [diff] [blame] | 30 | #include "common_video/libyuv/include/webrtc_libyuv.h" |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 31 | #include "modules/rtp_rtcp/include/rtp_rtcp_defines.h" |
Yves Gerey | 3e70781 | 2018-11-28 16:47:49 +0100 | [diff] [blame] | 32 | #include "modules/video_coding/codecs/interface/common_constants.h" |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 33 | #include "modules/video_coding/include/video_error_codes.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 34 | #include "rtc_base/checks.h" |
Danil Chapovalov | ad89528 | 2019-03-11 10:28:05 +0000 | [diff] [blame] | 35 | #include "rtc_base/task_utils/to_queued_task.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 36 | #include "rtc_base/time_utils.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 37 | #include "test/gtest.h" |
Sergey Silkin | 8d3758e | 2018-03-14 11:28:15 +0100 | [diff] [blame] | 38 | #include "third_party/libyuv/include/libyuv/compare.h" |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 39 | #include "third_party/libyuv/include/libyuv/scale.h" |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 40 | |
| 41 | namespace webrtc { |
| 42 | namespace test { |
| 43 | |
Kári Tristan Helgason | 169005d | 2018-05-22 13:34:14 +0200 | [diff] [blame] | 44 | namespace { |
Åsa Persson | 91af24a | 2018-01-24 17:20:18 +0100 | [diff] [blame] | 45 | const int kMsToRtpTimestamp = kVideoPayloadTypeFrequency / 1000; |
Sami Kalliomäki | c75a5e8 | 2018-07-09 13:27:42 +0200 | [diff] [blame] | 46 | const int kMaxBufferedInputFrames = 20; |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 47 | |
Elad Alon | 370f93a | 2019-06-11 14:57:57 +0200 | [diff] [blame] | 48 | const VideoEncoder::Capabilities kCapabilities(false); |
| 49 | |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 50 | size_t GetMaxNaluSizeBytes(const EncodedImage& encoded_frame, |
Kári Tristan Helgason | 169005d | 2018-05-22 13:34:14 +0200 | [diff] [blame] | 51 | const VideoCodecTestFixture::Config& config) { |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 52 | if (config.codec_settings.codecType != kVideoCodecH264) |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 53 | return 0; |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 54 | |
| 55 | std::vector<webrtc::H264::NaluIndex> nalu_indices = |
Niels Möller | 77536a2 | 2019-01-15 08:50:01 +0100 | [diff] [blame] | 56 | webrtc::H264::FindNaluIndices(encoded_frame.data(), encoded_frame.size()); |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 57 | |
| 58 | RTC_CHECK(!nalu_indices.empty()); |
| 59 | |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 60 | size_t max_size = 0; |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 61 | for (const webrtc::H264::NaluIndex& index : nalu_indices) |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 62 | max_size = std::max(max_size, index.payload_size); |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 63 | |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 64 | return max_size; |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 65 | } |
| 66 | |
Niels Möller | d3b8c63 | 2018-08-27 15:33:42 +0200 | [diff] [blame] | 67 | size_t GetTemporalLayerIndex(const CodecSpecificInfo& codec_specific) { |
| 68 | size_t temporal_idx = 0; |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 69 | if (codec_specific.codecType == kVideoCodecVP8) { |
Niels Möller | d3b8c63 | 2018-08-27 15:33:42 +0200 | [diff] [blame] | 70 | temporal_idx = codec_specific.codecSpecific.VP8.temporalIdx; |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 71 | } else if (codec_specific.codecType == kVideoCodecVP9) { |
Niels Möller | d3b8c63 | 2018-08-27 15:33:42 +0200 | [diff] [blame] | 72 | temporal_idx = codec_specific.codecSpecific.VP9.temporal_idx; |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 73 | } |
Niels Möller | d3b8c63 | 2018-08-27 15:33:42 +0200 | [diff] [blame] | 74 | if (temporal_idx == kNoTemporalIdx) { |
| 75 | temporal_idx = 0; |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 76 | } |
Niels Möller | d3b8c63 | 2018-08-27 15:33:42 +0200 | [diff] [blame] | 77 | return temporal_idx; |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 78 | } |
| 79 | |
asapersson | ae9ba04 | 2017-03-07 00:25:38 -0800 | [diff] [blame] | 80 | int GetElapsedTimeMicroseconds(int64_t start_ns, int64_t stop_ns) { |
| 81 | int64_t diff_us = (stop_ns - start_ns) / rtc::kNumNanosecsPerMicrosec; |
| 82 | RTC_DCHECK_GE(diff_us, std::numeric_limits<int>::min()); |
| 83 | RTC_DCHECK_LE(diff_us, std::numeric_limits<int>::max()); |
| 84 | return static_cast<int>(diff_us); |
| 85 | } |
| 86 | |
Sergey Silkin | 8d3758e | 2018-03-14 11:28:15 +0100 | [diff] [blame] | 87 | void CalculateFrameQuality(const I420BufferInterface& ref_buffer, |
| 88 | const I420BufferInterface& dec_buffer, |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 89 | VideoCodecTestStats::FrameStatistics* frame_stat, |
Sergey Silkin | 6e1402b | 2019-02-13 09:33:00 +0100 | [diff] [blame] | 90 | bool calc_ssim) { |
Sergey Silkin | 8d3758e | 2018-03-14 11:28:15 +0100 | [diff] [blame] | 91 | if (ref_buffer.width() != dec_buffer.width() || |
| 92 | ref_buffer.height() != dec_buffer.height()) { |
| 93 | RTC_CHECK_GE(ref_buffer.width(), dec_buffer.width()); |
| 94 | RTC_CHECK_GE(ref_buffer.height(), dec_buffer.height()); |
| 95 | // Downscale reference frame. |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 96 | rtc::scoped_refptr<I420Buffer> scaled_buffer = |
Sergey Silkin | 8d3758e | 2018-03-14 11:28:15 +0100 | [diff] [blame] | 97 | I420Buffer::Create(dec_buffer.width(), dec_buffer.height()); |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 98 | I420Scale(ref_buffer.DataY(), ref_buffer.StrideY(), ref_buffer.DataU(), |
| 99 | ref_buffer.StrideU(), ref_buffer.DataV(), ref_buffer.StrideV(), |
| 100 | ref_buffer.width(), ref_buffer.height(), |
| 101 | scaled_buffer->MutableDataY(), scaled_buffer->StrideY(), |
| 102 | scaled_buffer->MutableDataU(), scaled_buffer->StrideU(), |
| 103 | scaled_buffer->MutableDataV(), scaled_buffer->StrideV(), |
| 104 | scaled_buffer->width(), scaled_buffer->height(), |
| 105 | libyuv::kFilterBox); |
Sergey Silkin | 8d3758e | 2018-03-14 11:28:15 +0100 | [diff] [blame] | 106 | |
Sergey Silkin | 6e1402b | 2019-02-13 09:33:00 +0100 | [diff] [blame] | 107 | CalculateFrameQuality(*scaled_buffer, dec_buffer, frame_stat, calc_ssim); |
Sergey Silkin | 8d3758e | 2018-03-14 11:28:15 +0100 | [diff] [blame] | 108 | } else { |
| 109 | const uint64_t sse_y = libyuv::ComputeSumSquareErrorPlane( |
| 110 | dec_buffer.DataY(), dec_buffer.StrideY(), ref_buffer.DataY(), |
| 111 | ref_buffer.StrideY(), dec_buffer.width(), dec_buffer.height()); |
| 112 | |
| 113 | const uint64_t sse_u = libyuv::ComputeSumSquareErrorPlane( |
| 114 | dec_buffer.DataU(), dec_buffer.StrideU(), ref_buffer.DataU(), |
| 115 | ref_buffer.StrideU(), dec_buffer.width() / 2, dec_buffer.height() / 2); |
| 116 | |
| 117 | const uint64_t sse_v = libyuv::ComputeSumSquareErrorPlane( |
| 118 | dec_buffer.DataV(), dec_buffer.StrideV(), ref_buffer.DataV(), |
| 119 | ref_buffer.StrideV(), dec_buffer.width() / 2, dec_buffer.height() / 2); |
| 120 | |
| 121 | const size_t num_y_samples = dec_buffer.width() * dec_buffer.height(); |
| 122 | const size_t num_u_samples = |
| 123 | dec_buffer.width() / 2 * dec_buffer.height() / 2; |
| 124 | |
| 125 | frame_stat->psnr_y = libyuv::SumSquareErrorToPsnr(sse_y, num_y_samples); |
| 126 | frame_stat->psnr_u = libyuv::SumSquareErrorToPsnr(sse_u, num_u_samples); |
| 127 | frame_stat->psnr_v = libyuv::SumSquareErrorToPsnr(sse_v, num_u_samples); |
| 128 | frame_stat->psnr = libyuv::SumSquareErrorToPsnr( |
| 129 | sse_y + sse_u + sse_v, num_y_samples + 2 * num_u_samples); |
Sergey Silkin | 6e1402b | 2019-02-13 09:33:00 +0100 | [diff] [blame] | 130 | |
| 131 | if (calc_ssim) { |
| 132 | frame_stat->ssim = I420SSIM(ref_buffer, dec_buffer); |
| 133 | } |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 134 | } |
| 135 | } |
| 136 | |
brandtr | b78bc75 | 2017-02-22 01:26:59 -0800 | [diff] [blame] | 137 | } // namespace |
| 138 | |
brandtr | c409552 | 2017-08-07 08:12:33 -0700 | [diff] [blame] | 139 | VideoProcessor::VideoProcessor(webrtc::VideoEncoder* encoder, |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 140 | VideoDecoderList* decoders, |
| 141 | FrameReader* input_frame_reader, |
Kári Tristan Helgason | 169005d | 2018-05-22 13:34:14 +0200 | [diff] [blame] | 142 | const VideoCodecTestFixture::Config& config, |
Rasmus Brandt | 7d72d0f | 2019-03-26 16:56:14 +0100 | [diff] [blame] | 143 | VideoCodecTestStatsImpl* stats, |
Rasmus Brandt | 001c782 | 2019-03-22 13:41:48 +0100 | [diff] [blame] | 144 | IvfFileWriterMap* encoded_frame_writers, |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 145 | FrameWriterList* decoded_frame_writers) |
Åsa Persson | f0c4467 | 2017-10-24 16:03:39 +0200 | [diff] [blame] | 146 | : config_(config), |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 147 | num_simulcast_or_spatial_layers_( |
| 148 | std::max(config_.NumberOfSimulcastStreams(), |
| 149 | config_.NumberOfSpatialLayers())), |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 150 | analyze_frame_quality_(!config_.measure_cpu), |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 151 | stats_(stats), |
brandtr | 07734a5 | 2017-08-08 08:35:53 -0700 | [diff] [blame] | 152 | encoder_(encoder), |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 153 | decoders_(decoders), |
Jiawei Ou | c2ebe21 | 2018-11-08 10:02:56 -0800 | [diff] [blame] | 154 | bitrate_allocator_( |
| 155 | CreateBuiltinVideoBitrateAllocatorFactory() |
| 156 | ->CreateVideoBitrateAllocator(config_.codec_settings)), |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 157 | framerate_fps_(0), |
brandtr | bdd555c | 2017-08-21 01:34:04 -0700 | [diff] [blame] | 158 | encode_callback_(this), |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 159 | input_frame_reader_(input_frame_reader), |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 160 | merged_encoded_frames_(num_simulcast_or_spatial_layers_), |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 161 | encoded_frame_writers_(encoded_frame_writers), |
| 162 | decoded_frame_writers_(decoded_frame_writers), |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 163 | last_inputed_frame_num_(0), |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 164 | last_inputed_timestamp_(0), |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 165 | first_encoded_frame_(num_simulcast_or_spatial_layers_, true), |
| 166 | last_encoded_frame_num_(num_simulcast_or_spatial_layers_), |
| 167 | first_decoded_frame_(num_simulcast_or_spatial_layers_, true), |
Sergey Silkin | c89eed9 | 2018-04-01 23:57:51 +0200 | [diff] [blame] | 168 | last_decoded_frame_num_(num_simulcast_or_spatial_layers_), |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 169 | last_decoded_frame_buffer_(num_simulcast_or_spatial_layers_), |
| 170 | post_encode_time_ns_(0), |
| 171 | is_finalized_(false) { |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 172 | // Sanity checks. |
Danil Chapovalov | ad89528 | 2019-03-11 10:28:05 +0000 | [diff] [blame] | 173 | RTC_CHECK(TaskQueueBase::Current()) |
Rasmus Brandt | 4b381af | 2018-02-07 13:56:16 +0100 | [diff] [blame] | 174 | << "VideoProcessor must be run on a task queue."; |
Rasmus Brandt | 001c782 | 2019-03-22 13:41:48 +0100 | [diff] [blame] | 175 | RTC_CHECK(stats_); |
| 176 | RTC_CHECK(encoder_); |
| 177 | RTC_CHECK(decoders_); |
| 178 | RTC_CHECK_EQ(decoders_->size(), num_simulcast_or_spatial_layers_); |
| 179 | RTC_CHECK(input_frame_reader_); |
| 180 | RTC_CHECK(encoded_frame_writers_); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 181 | RTC_CHECK(!decoded_frame_writers || |
| 182 | decoded_frame_writers->size() == num_simulcast_or_spatial_layers_); |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 183 | |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 184 | // Setup required callbacks for the encoder and decoder and initialize them. |
brandtr | bdd555c | 2017-08-21 01:34:04 -0700 | [diff] [blame] | 185 | RTC_CHECK_EQ(encoder_->RegisterEncodeCompleteCallback(&encode_callback_), |
Åsa Persson | f0c4467 | 2017-10-24 16:03:39 +0200 | [diff] [blame] | 186 | WEBRTC_VIDEO_CODEC_OK); |
asapersson | 654d54c | 2017-02-10 00:16:07 -0800 | [diff] [blame] | 187 | |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 188 | // Initialize codecs so that they are ready to receive frames. |
Elad Alon | 370f93a | 2019-06-11 14:57:57 +0200 | [diff] [blame] | 189 | RTC_CHECK_EQ(encoder_->InitEncode( |
| 190 | &config_.codec_settings, |
| 191 | VideoEncoder::Settings( |
| 192 | kCapabilities, static_cast<int>(config_.NumberOfCores()), |
| 193 | config_.max_payload_size_bytes)), |
Sergey Silkin | 1723cf9 | 2018-01-22 15:49:55 +0100 | [diff] [blame] | 194 | WEBRTC_VIDEO_CODEC_OK); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 195 | |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 196 | for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) { |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 197 | decode_callback_.push_back( |
Mirko Bonadei | 317a1f0 | 2019-09-17 17:06:18 +0200 | [diff] [blame] | 198 | std::make_unique<VideoProcessorDecodeCompleteCallback>(this, i)); |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 199 | RTC_CHECK_EQ( |
| 200 | decoders_->at(i)->InitDecode(&config_.codec_settings, |
| 201 | static_cast<int>(config_.NumberOfCores())), |
| 202 | WEBRTC_VIDEO_CODEC_OK); |
| 203 | RTC_CHECK_EQ(decoders_->at(i)->RegisterDecodeCompleteCallback( |
| 204 | decode_callback_.at(i).get()), |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 205 | WEBRTC_VIDEO_CODEC_OK); |
| 206 | } |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 207 | } |
| 208 | |
Åsa Persson | f0c4467 | 2017-10-24 16:03:39 +0200 | [diff] [blame] | 209 | VideoProcessor::~VideoProcessor() { |
Sebastian Jansson | b55015e | 2019-04-09 13:44:04 +0200 | [diff] [blame] | 210 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
brandtr | c8c5905 | 2017-08-21 06:44:16 -0700 | [diff] [blame] | 211 | |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 212 | if (!is_finalized_) { |
| 213 | Finalize(); |
| 214 | } |
| 215 | |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 216 | // Explicitly reset codecs, in case they don't do that themselves when they |
| 217 | // go out of scope. |
brandtr | 77920a4 | 2017-08-11 07:48:15 -0700 | [diff] [blame] | 218 | RTC_CHECK_EQ(encoder_->Release(), WEBRTC_VIDEO_CODEC_OK); |
brandtr | bdd555c | 2017-08-21 01:34:04 -0700 | [diff] [blame] | 219 | encoder_->RegisterEncodeCompleteCallback(nullptr); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 220 | for (auto& decoder : *decoders_) { |
| 221 | RTC_CHECK_EQ(decoder->Release(), WEBRTC_VIDEO_CODEC_OK); |
| 222 | decoder->RegisterDecodeCompleteCallback(nullptr); |
| 223 | } |
| 224 | |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 225 | // Sanity check. |
| 226 | RTC_CHECK_LE(input_frames_.size(), kMaxBufferedInputFrames); |
brandtr | 77920a4 | 2017-08-11 07:48:15 -0700 | [diff] [blame] | 227 | } |
| 228 | |
brandtr | 8935d97 | 2017-09-06 01:53:22 -0700 | [diff] [blame] | 229 | void VideoProcessor::ProcessFrame() { |
Sebastian Jansson | b55015e | 2019-04-09 13:44:04 +0200 | [diff] [blame] | 230 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 231 | RTC_DCHECK(!is_finalized_); |
| 232 | |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 233 | const size_t frame_number = last_inputed_frame_num_++; |
asapersson | 654d54c | 2017-02-10 00:16:07 -0800 | [diff] [blame] | 234 | |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 235 | // Get input frame and store for future quality calculation. |
| 236 | rtc::scoped_refptr<I420BufferInterface> buffer = |
| 237 | input_frame_reader_->ReadFrame(); |
brandtr | bdd555c | 2017-08-21 01:34:04 -0700 | [diff] [blame] | 238 | RTC_CHECK(buffer) << "Tried to read too many frames from the file."; |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 239 | const size_t timestamp = |
Sergey Silkin | 44cec0b | 2019-07-11 14:20:38 +0200 | [diff] [blame] | 240 | last_inputed_timestamp_ + |
| 241 | static_cast<size_t>(kVideoPayloadTypeFrequency / framerate_fps_); |
Artem Titov | 1ebfb6a | 2019-01-03 23:49:37 +0100 | [diff] [blame] | 242 | VideoFrame input_frame = |
| 243 | VideoFrame::Builder() |
| 244 | .set_video_frame_buffer(buffer) |
| 245 | .set_timestamp_rtp(static_cast<uint32_t>(timestamp)) |
| 246 | .set_timestamp_ms(static_cast<int64_t>(timestamp / kMsToRtpTimestamp)) |
| 247 | .set_rotation(webrtc::kVideoRotation_0) |
| 248 | .build(); |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 249 | // Store input frame as a reference for quality calculations. |
| 250 | if (config_.decode && !config_.measure_cpu) { |
Rasmus Brandt | 7b92ceb | 2018-06-26 12:34:59 +0200 | [diff] [blame] | 251 | if (input_frames_.size() == kMaxBufferedInputFrames) { |
| 252 | input_frames_.erase(input_frames_.begin()); |
| 253 | } |
Erik Språng | ebe5acb | 2020-12-03 16:18:44 +0100 | [diff] [blame] | 254 | |
| 255 | if (config_.reference_width != -1 && config_.reference_height != -1 && |
| 256 | (input_frame.width() != config_.reference_width || |
| 257 | input_frame.height() != config_.reference_height)) { |
| 258 | rtc::scoped_refptr<I420Buffer> scaled_buffer = I420Buffer::Create( |
| 259 | config_.codec_settings.width, config_.codec_settings.height); |
| 260 | scaled_buffer->ScaleFrom(*input_frame.video_frame_buffer()->ToI420()); |
| 261 | |
| 262 | VideoFrame scaled_reference_frame = input_frame; |
| 263 | scaled_reference_frame.set_video_frame_buffer(scaled_buffer); |
| 264 | input_frames_.emplace(frame_number, scaled_reference_frame); |
| 265 | |
| 266 | if (config_.reference_width == config_.codec_settings.width && |
| 267 | config_.reference_height == config_.codec_settings.height) { |
| 268 | // Both encoding and comparison uses the same down-scale factor, reuse |
| 269 | // it for encoder below. |
| 270 | input_frame = scaled_reference_frame; |
| 271 | } |
| 272 | } else { |
| 273 | input_frames_.emplace(frame_number, input_frame); |
| 274 | } |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 275 | } |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 276 | last_inputed_timestamp_ = timestamp; |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 277 | |
Sergey Silkin | c89eed9 | 2018-04-01 23:57:51 +0200 | [diff] [blame] | 278 | post_encode_time_ns_ = 0; |
| 279 | |
Rasmus Brandt | 5f7a891 | 2018-02-28 17:17:15 +0100 | [diff] [blame] | 280 | // Create frame statistics object for all simulcast/spatial layers. |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 281 | for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) { |
Sergey Silkin | 02fed02 | 2018-09-25 13:48:19 +0200 | [diff] [blame] | 282 | FrameStatistics frame_stat(frame_number, timestamp, i); |
| 283 | stats_->AddFrame(frame_stat); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 284 | } |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 285 | |
| 286 | // For the highest measurement accuracy of the encode time, the start/stop |
| 287 | // time recordings should wrap the Encode call as tightly as possible. |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 288 | const int64_t encode_start_ns = rtc::TimeNanos(); |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 289 | for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) { |
| 290 | FrameStatistics* frame_stat = stats_->GetFrame(frame_number, i); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 291 | frame_stat->encode_start_ns = encode_start_ns; |
| 292 | } |
| 293 | |
Erik Språng | ebe5acb | 2020-12-03 16:18:44 +0100 | [diff] [blame] | 294 | if (input_frame.width() != config_.codec_settings.width || |
| 295 | input_frame.height() != config_.codec_settings.height) { |
| 296 | rtc::scoped_refptr<I420Buffer> scaled_buffer = I420Buffer::Create( |
| 297 | config_.codec_settings.width, config_.codec_settings.height); |
| 298 | scaled_buffer->ScaleFrom(*input_frame.video_frame_buffer()->ToI420()); |
| 299 | input_frame.set_video_frame_buffer(scaled_buffer); |
| 300 | } |
| 301 | |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 302 | // Encode. |
Niels Möller | 87e2d78 | 2019-03-07 10:18:23 +0100 | [diff] [blame] | 303 | const std::vector<VideoFrameType> frame_types = |
Niels Möller | 8f7ce22 | 2019-03-21 15:43:58 +0100 | [diff] [blame] | 304 | (frame_number == 0) |
| 305 | ? std::vector<VideoFrameType>{VideoFrameType::kVideoFrameKey} |
| 306 | : std::vector<VideoFrameType>{VideoFrameType::kVideoFrameDelta}; |
Niels Möller | c8d2e73 | 2019-03-06 12:00:33 +0100 | [diff] [blame] | 307 | const int encode_return_code = encoder_->Encode(input_frame, &frame_types); |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 308 | for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) { |
| 309 | FrameStatistics* frame_stat = stats_->GetFrame(frame_number, i); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 310 | frame_stat->encode_return_code = encode_return_code; |
| 311 | } |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 312 | } |
| 313 | |
Sergey Silkin | 44cec0b | 2019-07-11 14:20:38 +0200 | [diff] [blame] | 314 | void VideoProcessor::SetRates(size_t bitrate_kbps, double framerate_fps) { |
Sebastian Jansson | b55015e | 2019-04-09 13:44:04 +0200 | [diff] [blame] | 315 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 316 | RTC_DCHECK(!is_finalized_); |
| 317 | |
Sergey Silkin | 44cec0b | 2019-07-11 14:20:38 +0200 | [diff] [blame] | 318 | framerate_fps_ = framerate_fps; |
Florent Castelli | 8bbdb5b | 2019-08-02 15:16:28 +0200 | [diff] [blame] | 319 | bitrate_allocation_ = |
| 320 | bitrate_allocator_->Allocate(VideoBitrateAllocationParameters( |
| 321 | static_cast<uint32_t>(bitrate_kbps * 1000), framerate_fps_)); |
Sergey Silkin | 44cec0b | 2019-07-11 14:20:38 +0200 | [diff] [blame] | 322 | encoder_->SetRates( |
| 323 | VideoEncoder::RateControlParameters(bitrate_allocation_, framerate_fps_)); |
brandtr | bea36fd | 2017-08-07 03:36:54 -0700 | [diff] [blame] | 324 | } |
| 325 | |
Sami Kalliomäki | 451b29c | 2018-07-04 14:33:51 +0200 | [diff] [blame] | 326 | int32_t VideoProcessor::VideoProcessorDecodeCompleteCallback::Decoded( |
| 327 | VideoFrame& image) { |
| 328 | // Post the callback to the right task queue, if needed. |
| 329 | if (!task_queue_->IsCurrent()) { |
| 330 | // There might be a limited amount of output buffers, make a copy to make |
| 331 | // sure we don't block the decoder. |
Artem Titov | 1ebfb6a | 2019-01-03 23:49:37 +0100 | [diff] [blame] | 332 | VideoFrame copy = VideoFrame::Builder() |
| 333 | .set_video_frame_buffer(I420Buffer::Copy( |
| 334 | *image.video_frame_buffer()->ToI420())) |
| 335 | .set_rotation(image.rotation()) |
| 336 | .set_timestamp_us(image.timestamp_us()) |
| 337 | .set_id(image.id()) |
| 338 | .build(); |
Sami Kalliomäki | 451b29c | 2018-07-04 14:33:51 +0200 | [diff] [blame] | 339 | copy.set_timestamp(image.timestamp()); |
| 340 | |
Danil Chapovalov | ad89528 | 2019-03-11 10:28:05 +0000 | [diff] [blame] | 341 | task_queue_->PostTask(ToQueuedTask([this, copy]() { |
Sami Kalliomäki | 451b29c | 2018-07-04 14:33:51 +0200 | [diff] [blame] | 342 | video_processor_->FrameDecoded(copy, simulcast_svc_idx_); |
Danil Chapovalov | ad89528 | 2019-03-11 10:28:05 +0000 | [diff] [blame] | 343 | })); |
Sami Kalliomäki | 451b29c | 2018-07-04 14:33:51 +0200 | [diff] [blame] | 344 | return 0; |
| 345 | } |
| 346 | video_processor_->FrameDecoded(image, simulcast_svc_idx_); |
| 347 | return 0; |
| 348 | } |
| 349 | |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 350 | void VideoProcessor::FrameEncoded( |
| 351 | const webrtc::EncodedImage& encoded_image, |
| 352 | const webrtc::CodecSpecificInfo& codec_specific) { |
Sebastian Jansson | b55015e | 2019-04-09 13:44:04 +0200 | [diff] [blame] | 353 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
brandtr | c8c5905 | 2017-08-21 06:44:16 -0700 | [diff] [blame] | 354 | |
brandtr | 32e0d26 | 2017-02-15 05:29:38 -0800 | [diff] [blame] | 355 | // For the highest measurement accuracy of the encode time, the start/stop |
| 356 | // time recordings should wrap the Encode call as tightly as possible. |
Rasmus Brandt | 5f7a891 | 2018-02-28 17:17:15 +0100 | [diff] [blame] | 357 | const int64_t encode_stop_ns = rtc::TimeNanos(); |
brandtr | 32e0d26 | 2017-02-15 05:29:38 -0800 | [diff] [blame] | 358 | |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 359 | const VideoCodecType codec_type = codec_specific.codecType; |
Rasmus Brandt | f7a3558 | 2017-10-24 10:16:33 +0200 | [diff] [blame] | 360 | if (config_.encoded_frame_checker) { |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 361 | config_.encoded_frame_checker->CheckEncodedFrame(codec_type, encoded_image); |
Rasmus Brandt | f7a3558 | 2017-10-24 10:16:33 +0200 | [diff] [blame] | 362 | } |
brandtr | b78bc75 | 2017-02-22 01:26:59 -0800 | [diff] [blame] | 363 | |
Rasmus Brandt | d062a3c | 2018-03-08 16:45:54 +0100 | [diff] [blame] | 364 | // Layer metadata. |
Niels Möller | d3b8c63 | 2018-08-27 15:33:42 +0200 | [diff] [blame] | 365 | size_t spatial_idx = encoded_image.SpatialIndex().value_or(0); |
| 366 | size_t temporal_idx = GetTemporalLayerIndex(codec_specific); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 367 | |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 368 | FrameStatistics* frame_stat = |
Niels Möller | 2377588 | 2018-08-16 10:24:12 +0200 | [diff] [blame] | 369 | stats_->GetFrameWithTimestamp(encoded_image.Timestamp(), spatial_idx); |
Åsa Persson | a6e7b88 | 2018-01-19 14:57:10 +0100 | [diff] [blame] | 370 | const size_t frame_number = frame_stat->frame_number; |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 371 | |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 372 | // Ensure that the encode order is monotonically increasing, within this |
| 373 | // simulcast/spatial layer. |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 374 | RTC_CHECK(first_encoded_frame_[spatial_idx] || |
| 375 | last_encoded_frame_num_[spatial_idx] < frame_number); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 376 | |
| 377 | // Ensure SVC spatial layers are delivered in ascending order. |
Rasmus Brandt | 001c782 | 2019-03-22 13:41:48 +0100 | [diff] [blame] | 378 | const size_t num_spatial_layers = config_.NumberOfSpatialLayers(); |
| 379 | if (!first_encoded_frame_[spatial_idx] && num_spatial_layers > 1) { |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 380 | for (size_t i = 0; i < spatial_idx; ++i) { |
Sergey Silkin | 122ba6c | 2018-03-27 14:32:21 +0200 | [diff] [blame] | 381 | RTC_CHECK_LE(last_encoded_frame_num_[i], frame_number); |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 382 | } |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 383 | for (size_t i = spatial_idx + 1; i < num_simulcast_or_spatial_layers_; |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 384 | ++i) { |
| 385 | RTC_CHECK_GT(frame_number, last_encoded_frame_num_[i]); |
| 386 | } |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 387 | } |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 388 | first_encoded_frame_[spatial_idx] = false; |
| 389 | last_encoded_frame_num_[spatial_idx] = frame_number; |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 390 | |
brandtr | 8935d97 | 2017-09-06 01:53:22 -0700 | [diff] [blame] | 391 | // Update frame statistics. |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 392 | frame_stat->encoding_successful = true; |
Sergey Silkin | c89eed9 | 2018-04-01 23:57:51 +0200 | [diff] [blame] | 393 | frame_stat->encode_time_us = GetElapsedTimeMicroseconds( |
| 394 | frame_stat->encode_start_ns, encode_stop_ns - post_encode_time_ns_); |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 395 | frame_stat->target_bitrate_kbps = |
Sergey Silkin | bfd54ef | 2018-04-13 23:41:11 +0200 | [diff] [blame] | 396 | bitrate_allocation_.GetTemporalLayerSum(spatial_idx, temporal_idx) / 1000; |
Sergey Silkin | 44cec0b | 2019-07-11 14:20:38 +0200 | [diff] [blame] | 397 | frame_stat->target_framerate_fps = framerate_fps_; |
Niels Möller | 77536a2 | 2019-01-15 08:50:01 +0100 | [diff] [blame] | 398 | frame_stat->length_bytes = encoded_image.size(); |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 399 | frame_stat->frame_type = encoded_image._frameType; |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 400 | frame_stat->temporal_idx = temporal_idx; |
Sergey Silkin | 3be2a55 | 2018-01-17 15:11:44 +0100 | [diff] [blame] | 401 | frame_stat->max_nalu_size_bytes = GetMaxNaluSizeBytes(encoded_image, config_); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 402 | frame_stat->qp = encoded_image.qp_; |
ssilkin | 612f858 | 2017-09-28 09:23:17 -0700 | [diff] [blame] | 403 | |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 404 | if (codec_type == kVideoCodecVP9) { |
| 405 | const CodecSpecificInfoVP9& vp9_info = codec_specific.codecSpecific.VP9; |
| 406 | frame_stat->inter_layer_predicted = vp9_info.inter_layer_predicted; |
Sergey Silkin | 3c30c9c | 2018-05-02 09:18:48 +0200 | [diff] [blame] | 407 | frame_stat->non_ref_for_inter_layer_pred = |
| 408 | vp9_info.non_ref_for_inter_layer_pred; |
Sergey Silkin | 3c30c9c | 2018-05-02 09:18:48 +0200 | [diff] [blame] | 409 | } else { |
| 410 | frame_stat->inter_layer_predicted = false; |
| 411 | frame_stat->non_ref_for_inter_layer_pred = true; |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 412 | } |
| 413 | |
Sergey Silkin | 122ba6c | 2018-03-27 14:32:21 +0200 | [diff] [blame] | 414 | const webrtc::EncodedImage* encoded_image_for_decode = &encoded_image; |
Rasmus Brandt | 001c782 | 2019-03-22 13:41:48 +0100 | [diff] [blame] | 415 | if (config_.decode || !encoded_frame_writers_->empty()) { |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 416 | if (num_spatial_layers > 1) { |
| 417 | encoded_image_for_decode = BuildAndStoreSuperframe( |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 418 | encoded_image, codec_type, frame_number, spatial_idx, |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 419 | frame_stat->inter_layer_predicted); |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 420 | } |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 421 | } |
| 422 | |
| 423 | if (config_.decode) { |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 424 | DecodeFrame(*encoded_image_for_decode, spatial_idx); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 425 | |
Danil Chapovalov | 06bbeb3 | 2020-11-11 12:42:56 +0100 | [diff] [blame] | 426 | if (codec_specific.end_of_picture && num_spatial_layers > 1) { |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 427 | // If inter-layer prediction is enabled and upper layer was dropped then |
| 428 | // base layer should be passed to upper layer decoder. Otherwise decoder |
| 429 | // won't be able to decode next superframe. |
| 430 | const EncodedImage* base_image = nullptr; |
Sergey Silkin | 3c30c9c | 2018-05-02 09:18:48 +0200 | [diff] [blame] | 431 | const FrameStatistics* base_stat = nullptr; |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 432 | for (size_t i = 0; i < num_spatial_layers; ++i) { |
Sergey Silkin | 3c30c9c | 2018-05-02 09:18:48 +0200 | [diff] [blame] | 433 | const bool layer_dropped = (first_decoded_frame_[i] || |
| 434 | last_decoded_frame_num_[i] < frame_number); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 435 | |
| 436 | // Ensure current layer was decoded. |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 437 | RTC_CHECK(layer_dropped == false || i != spatial_idx); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 438 | |
| 439 | if (!layer_dropped) { |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 440 | base_image = &merged_encoded_frames_[i]; |
Sergey Silkin | 3c30c9c | 2018-05-02 09:18:48 +0200 | [diff] [blame] | 441 | base_stat = |
Niels Möller | 2377588 | 2018-08-16 10:24:12 +0200 | [diff] [blame] | 442 | stats_->GetFrameWithTimestamp(encoded_image.Timestamp(), i); |
Sergey Silkin | 3c30c9c | 2018-05-02 09:18:48 +0200 | [diff] [blame] | 443 | } else if (base_image && !base_stat->non_ref_for_inter_layer_pred) { |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 444 | DecodeFrame(*base_image, i); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 445 | } |
| 446 | } |
| 447 | } |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 448 | } else { |
| 449 | frame_stat->decode_return_code = WEBRTC_VIDEO_CODEC_NO_OUTPUT; |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 450 | } |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 451 | |
Rasmus Brandt | 001c782 | 2019-03-22 13:41:48 +0100 | [diff] [blame] | 452 | // Since frames in higher TLs typically depend on frames in lower TLs, |
| 453 | // write out frames in lower TLs to bitstream dumps of higher TLs. |
| 454 | for (size_t write_temporal_idx = temporal_idx; |
| 455 | write_temporal_idx < config_.NumberOfTemporalLayers(); |
| 456 | ++write_temporal_idx) { |
| 457 | const VideoProcessor::LayerKey layer_key(spatial_idx, write_temporal_idx); |
| 458 | auto it = encoded_frame_writers_->find(layer_key); |
| 459 | if (it != encoded_frame_writers_->cend()) { |
| 460 | RTC_CHECK(it->second->WriteFrame(*encoded_image_for_decode, |
| 461 | config_.codec_settings.codecType)); |
| 462 | } |
brandtr | 8935d97 | 2017-09-06 01:53:22 -0700 | [diff] [blame] | 463 | } |
Sergey Silkin | c89eed9 | 2018-04-01 23:57:51 +0200 | [diff] [blame] | 464 | |
Kári Tristan Helgason | f167762 | 2018-08-24 13:21:26 +0200 | [diff] [blame] | 465 | if (!config_.encode_in_real_time) { |
Sergey Silkin | c89eed9 | 2018-04-01 23:57:51 +0200 | [diff] [blame] | 466 | // To get pure encode time for next layers, measure time spent in encode |
| 467 | // callback and subtract it from encode time of next layers. |
| 468 | post_encode_time_ns_ += rtc::TimeNanos() - encode_stop_ns; |
| 469 | } |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 470 | } |
| 471 | |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 472 | void VideoProcessor::CalcFrameQuality(const I420BufferInterface& decoded_frame, |
| 473 | FrameStatistics* frame_stat) { |
| 474 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
| 475 | |
| 476 | const auto reference_frame = input_frames_.find(frame_stat->frame_number); |
| 477 | RTC_CHECK(reference_frame != input_frames_.cend()) |
| 478 | << "The codecs are either buffering too much, dropping too much, or " |
| 479 | "being too slow relative to the input frame rate."; |
| 480 | |
| 481 | // SSIM calculation is not optimized. Skip it in real-time mode. |
| 482 | const bool calc_ssim = !config_.encode_in_real_time; |
| 483 | CalculateFrameQuality(*reference_frame->second.video_frame_buffer()->ToI420(), |
| 484 | decoded_frame, frame_stat, calc_ssim); |
| 485 | |
| 486 | frame_stat->quality_analysis_successful = true; |
| 487 | } |
| 488 | |
| 489 | void VideoProcessor::WriteDecodedFrame(const I420BufferInterface& decoded_frame, |
| 490 | FrameWriter& frame_writer) { |
| 491 | int input_video_width = config_.codec_settings.width; |
| 492 | int input_video_height = config_.codec_settings.height; |
| 493 | |
| 494 | rtc::scoped_refptr<I420Buffer> scaled_buffer; |
| 495 | const I420BufferInterface* scaled_frame; |
| 496 | |
| 497 | if (decoded_frame.width() == input_video_width && |
| 498 | decoded_frame.height() == input_video_height) { |
| 499 | scaled_frame = &decoded_frame; |
| 500 | } else { |
| 501 | EXPECT_DOUBLE_EQ( |
| 502 | static_cast<double>(input_video_width) / input_video_height, |
| 503 | static_cast<double>(decoded_frame.width()) / decoded_frame.height()); |
| 504 | |
| 505 | scaled_buffer = I420Buffer::Create(input_video_width, input_video_height); |
| 506 | scaled_buffer->ScaleFrom(decoded_frame); |
| 507 | |
| 508 | scaled_frame = scaled_buffer; |
| 509 | } |
| 510 | |
| 511 | // Ensure there is no padding. |
| 512 | RTC_CHECK_EQ(scaled_frame->StrideY(), input_video_width); |
| 513 | RTC_CHECK_EQ(scaled_frame->StrideU(), input_video_width / 2); |
| 514 | RTC_CHECK_EQ(scaled_frame->StrideV(), input_video_width / 2); |
| 515 | |
| 516 | RTC_CHECK_EQ(3 * input_video_width * input_video_height / 2, |
| 517 | frame_writer.FrameLength()); |
| 518 | |
| 519 | RTC_CHECK(frame_writer.WriteFrame(scaled_frame->DataY())); |
| 520 | } |
| 521 | |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 522 | void VideoProcessor::FrameDecoded(const VideoFrame& decoded_frame, |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 523 | size_t spatial_idx) { |
Sebastian Jansson | b55015e | 2019-04-09 13:44:04 +0200 | [diff] [blame] | 524 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
brandtr | c8c5905 | 2017-08-21 06:44:16 -0700 | [diff] [blame] | 525 | |
brandtr | 32e0d26 | 2017-02-15 05:29:38 -0800 | [diff] [blame] | 526 | // For the highest measurement accuracy of the decode time, the start/stop |
| 527 | // time recordings should wrap the Decode call as tightly as possible. |
Rasmus Brandt | 5f7a891 | 2018-02-28 17:17:15 +0100 | [diff] [blame] | 528 | const int64_t decode_stop_ns = rtc::TimeNanos(); |
brandtr | 8bc9385 | 2017-02-15 05:19:51 -0800 | [diff] [blame] | 529 | |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 530 | FrameStatistics* frame_stat = |
| 531 | stats_->GetFrameWithTimestamp(decoded_frame.timestamp(), spatial_idx); |
Åsa Persson | a6e7b88 | 2018-01-19 14:57:10 +0100 | [diff] [blame] | 532 | const size_t frame_number = frame_stat->frame_number; |
Sergey Silkin | 64eaa99 | 2017-11-17 14:47:32 +0100 | [diff] [blame] | 533 | |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 534 | if (!first_decoded_frame_[spatial_idx]) { |
| 535 | for (size_t dropped_frame_number = last_decoded_frame_num_[spatial_idx] + 1; |
| 536 | dropped_frame_number < frame_number; ++dropped_frame_number) { |
| 537 | FrameStatistics* dropped_frame_stat = |
| 538 | stats_->GetFrame(dropped_frame_number, spatial_idx); |
| 539 | |
| 540 | if (analyze_frame_quality_ && config_.analyze_quality_of_dropped_frames) { |
| 541 | // Calculate frame quality comparing input frame with last decoded one. |
| 542 | CalcFrameQuality(*last_decoded_frame_buffer_[spatial_idx], |
| 543 | dropped_frame_stat); |
| 544 | } |
| 545 | |
| 546 | if (decoded_frame_writers_ != nullptr) { |
| 547 | // Fill drops with last decoded frame to make them look like freeze at |
| 548 | // playback and to keep decoded layers in sync. |
| 549 | WriteDecodedFrame(*last_decoded_frame_buffer_[spatial_idx], |
| 550 | *decoded_frame_writers_->at(spatial_idx)); |
| 551 | } |
Sergey Silkin | 5613879 | 2018-05-02 10:50:55 +0200 | [diff] [blame] | 552 | } |
| 553 | } |
| 554 | |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 555 | // Ensure that the decode order is monotonically increasing, within this |
| 556 | // simulcast/spatial layer. |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 557 | RTC_CHECK(first_decoded_frame_[spatial_idx] || |
| 558 | last_decoded_frame_num_[spatial_idx] < frame_number); |
| 559 | first_decoded_frame_[spatial_idx] = false; |
| 560 | last_decoded_frame_num_[spatial_idx] = frame_number; |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 561 | |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 562 | // Update frame statistics. |
| 563 | frame_stat->decoding_successful = true; |
| 564 | frame_stat->decode_time_us = |
| 565 | GetElapsedTimeMicroseconds(frame_stat->decode_start_ns, decode_stop_ns); |
| 566 | frame_stat->decoded_width = decoded_frame.width(); |
| 567 | frame_stat->decoded_height = decoded_frame.height(); |
| 568 | |
Sergey Silkin | 64eaa99 | 2017-11-17 14:47:32 +0100 | [diff] [blame] | 569 | // Skip quality metrics calculation to not affect CPU usage. |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 570 | if (analyze_frame_quality_ || decoded_frame_writers_) { |
| 571 | // Save last decoded frame to handle possible future drops. |
| 572 | rtc::scoped_refptr<I420BufferInterface> i420buffer = |
| 573 | decoded_frame.video_frame_buffer()->ToI420(); |
Sergey Silkin | 6e1402b | 2019-02-13 09:33:00 +0100 | [diff] [blame] | 574 | |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 575 | // Copy decoded frame to a buffer without padding/stride such that we can |
| 576 | // dump Y, U and V planes into a file in one shot. |
| 577 | last_decoded_frame_buffer_[spatial_idx] = I420Buffer::Copy( |
| 578 | i420buffer->width(), i420buffer->height(), i420buffer->DataY(), |
| 579 | i420buffer->StrideY(), i420buffer->DataU(), i420buffer->StrideU(), |
| 580 | i420buffer->DataV(), i420buffer->StrideV()); |
Rasmus Brandt | d00c895 | 2018-03-14 12:29:57 +0100 | [diff] [blame] | 581 | } |
Sergey Silkin | 64eaa99 | 2017-11-17 14:47:32 +0100 | [diff] [blame] | 582 | |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 583 | if (analyze_frame_quality_) { |
| 584 | CalcFrameQuality(*decoded_frame.video_frame_buffer()->ToI420(), frame_stat); |
Sergey Silkin | 64eaa99 | 2017-11-17 14:47:32 +0100 | [diff] [blame] | 585 | } |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 586 | |
| 587 | if (decoded_frame_writers_ != nullptr) { |
| 588 | WriteDecodedFrame(*last_decoded_frame_buffer_[spatial_idx], |
| 589 | *decoded_frame_writers_->at(spatial_idx)); |
| 590 | } |
| 591 | |
| 592 | // Erase all buffered input frames that we have moved past for all |
| 593 | // simulcast/spatial layers. Never buffer more than |
| 594 | // |kMaxBufferedInputFrames| frames, to protect against long runs of |
| 595 | // consecutive frame drops for a particular layer. |
| 596 | const auto min_last_decoded_frame_num = std::min_element( |
| 597 | last_decoded_frame_num_.cbegin(), last_decoded_frame_num_.cend()); |
| 598 | const size_t min_buffered_frame_num = |
| 599 | std::max(0, static_cast<int>(frame_number) - kMaxBufferedInputFrames + 1); |
| 600 | RTC_CHECK(min_last_decoded_frame_num != last_decoded_frame_num_.cend()); |
| 601 | const auto input_frames_erase_before = input_frames_.lower_bound( |
| 602 | std::max(*min_last_decoded_frame_num, min_buffered_frame_num)); |
| 603 | input_frames_.erase(input_frames_.cbegin(), input_frames_erase_before); |
Åsa Persson | f0c4467 | 2017-10-24 16:03:39 +0200 | [diff] [blame] | 604 | } |
brandtr | 17b958c | 2017-03-07 01:41:43 -0800 | [diff] [blame] | 605 | |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 606 | void VideoProcessor::DecodeFrame(const EncodedImage& encoded_image, |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 607 | size_t spatial_idx) { |
Sebastian Jansson | b55015e | 2019-04-09 13:44:04 +0200 | [diff] [blame] | 608 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 609 | FrameStatistics* frame_stat = |
Niels Möller | 2377588 | 2018-08-16 10:24:12 +0200 | [diff] [blame] | 610 | stats_->GetFrameWithTimestamp(encoded_image.Timestamp(), spatial_idx); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 611 | |
| 612 | frame_stat->decode_start_ns = rtc::TimeNanos(); |
| 613 | frame_stat->decode_return_code = |
Niels Möller | 7aacdd9 | 2019-03-25 09:11:40 +0100 | [diff] [blame] | 614 | decoders_->at(spatial_idx)->Decode(encoded_image, false, 0); |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 615 | } |
| 616 | |
| 617 | const webrtc::EncodedImage* VideoProcessor::BuildAndStoreSuperframe( |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 618 | const EncodedImage& encoded_image, |
| 619 | const VideoCodecType codec, |
| 620 | size_t frame_number, |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 621 | size_t spatial_idx, |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 622 | bool inter_layer_predicted) { |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 623 | // Should only be called for SVC. |
| 624 | RTC_CHECK_GT(config_.NumberOfSpatialLayers(), 1); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 625 | |
| 626 | EncodedImage base_image; |
Niels Möller | 77536a2 | 2019-01-15 08:50:01 +0100 | [diff] [blame] | 627 | RTC_CHECK_EQ(base_image.size(), 0); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 628 | |
Sergey Silkin | 122ba6c | 2018-03-27 14:32:21 +0200 | [diff] [blame] | 629 | // Each SVC layer is decoded with dedicated decoder. Find the nearest |
| 630 | // non-dropped base frame and merge it and current frame into superframe. |
Sergey Silkin | 645e2e0 | 2018-04-06 09:42:13 +0200 | [diff] [blame] | 631 | if (inter_layer_predicted) { |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 632 | for (int base_idx = static_cast<int>(spatial_idx) - 1; base_idx >= 0; |
Sergey Silkin | 122ba6c | 2018-03-27 14:32:21 +0200 | [diff] [blame] | 633 | --base_idx) { |
| 634 | EncodedImage lower_layer = merged_encoded_frames_.at(base_idx); |
Niels Möller | 2377588 | 2018-08-16 10:24:12 +0200 | [diff] [blame] | 635 | if (lower_layer.Timestamp() == encoded_image.Timestamp()) { |
Sergey Silkin | 122ba6c | 2018-03-27 14:32:21 +0200 | [diff] [blame] | 636 | base_image = lower_layer; |
| 637 | break; |
| 638 | } |
| 639 | } |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 640 | } |
Niels Möller | 77536a2 | 2019-01-15 08:50:01 +0100 | [diff] [blame] | 641 | const size_t payload_size_bytes = base_image.size() + encoded_image.size(); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 642 | |
Niels Möller | 08ae7ce | 2020-09-23 15:58:12 +0200 | [diff] [blame] | 643 | auto buffer = EncodedImageBuffer::Create(payload_size_bytes); |
Niels Möller | 77536a2 | 2019-01-15 08:50:01 +0100 | [diff] [blame] | 644 | if (base_image.size()) { |
Niels Möller | 24871e4 | 2019-01-17 11:31:13 +0100 | [diff] [blame] | 645 | RTC_CHECK(base_image.data()); |
Niels Möller | 08ae7ce | 2020-09-23 15:58:12 +0200 | [diff] [blame] | 646 | memcpy(buffer->data(), base_image.data(), base_image.size()); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 647 | } |
Niels Möller | 08ae7ce | 2020-09-23 15:58:12 +0200 | [diff] [blame] | 648 | memcpy(buffer->data() + base_image.size(), encoded_image.data(), |
Niels Möller | 77536a2 | 2019-01-15 08:50:01 +0100 | [diff] [blame] | 649 | encoded_image.size()); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 650 | |
Niels Möller | 08ae7ce | 2020-09-23 15:58:12 +0200 | [diff] [blame] | 651 | EncodedImage copied_image = encoded_image; |
| 652 | copied_image.SetEncodedData(buffer); |
Zhaoliang Ma | 074edf6 | 2021-05-11 16:04:46 +0800 | [diff] [blame] | 653 | if (base_image.size()) |
| 654 | copied_image._frameType = base_image._frameType; |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 655 | |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 656 | // Replace previous EncodedImage for this spatial layer. |
Niels Möller | 663844d | 2019-02-14 16:15:54 +0100 | [diff] [blame] | 657 | merged_encoded_frames_.at(spatial_idx) = std::move(copied_image); |
Rasmus Brandt | 0f1c0bd | 2018-03-12 10:01:16 +0100 | [diff] [blame] | 658 | |
Sergey Silkin | bc20fe1 | 2018-04-15 21:06:16 +0200 | [diff] [blame] | 659 | return &merged_encoded_frames_.at(spatial_idx); |
Sergey Silkin | 10d9d59 | 2018-02-01 13:25:17 +0100 | [diff] [blame] | 660 | } |
| 661 | |
Sergey Silkin | b72cc6d | 2020-10-29 08:29:26 +0100 | [diff] [blame] | 662 | void VideoProcessor::Finalize() { |
| 663 | RTC_DCHECK_RUN_ON(&sequence_checker_); |
| 664 | RTC_DCHECK(!is_finalized_); |
| 665 | is_finalized_ = true; |
| 666 | |
| 667 | if (!(analyze_frame_quality_ && config_.analyze_quality_of_dropped_frames) && |
| 668 | decoded_frame_writers_ == nullptr) { |
| 669 | return; |
| 670 | } |
| 671 | |
| 672 | for (size_t spatial_idx = 0; spatial_idx < num_simulcast_or_spatial_layers_; |
| 673 | ++spatial_idx) { |
| 674 | if (first_decoded_frame_[spatial_idx]) { |
| 675 | continue; // No decoded frames on this spatial layer. |
| 676 | } |
| 677 | |
| 678 | for (size_t dropped_frame_number = last_decoded_frame_num_[spatial_idx] + 1; |
| 679 | dropped_frame_number < last_inputed_frame_num_; |
| 680 | ++dropped_frame_number) { |
| 681 | FrameStatistics* frame_stat = |
| 682 | stats_->GetFrame(dropped_frame_number, spatial_idx); |
| 683 | |
| 684 | RTC_DCHECK(!frame_stat->decoding_successful); |
| 685 | |
| 686 | if (analyze_frame_quality_ && config_.analyze_quality_of_dropped_frames) { |
| 687 | CalcFrameQuality(*last_decoded_frame_buffer_[spatial_idx], frame_stat); |
| 688 | } |
| 689 | |
| 690 | if (decoded_frame_writers_ != nullptr) { |
| 691 | WriteDecodedFrame(*last_decoded_frame_buffer_[spatial_idx], |
| 692 | *decoded_frame_writers_->at(spatial_idx)); |
| 693 | } |
| 694 | } |
| 695 | } |
| 696 | } |
| 697 | |
kjellander@webrtc.org | 35a1756 | 2011-10-06 06:44:54 +0000 | [diff] [blame] | 698 | } // namespace test |
| 699 | } // namespace webrtc |