blob: f73e06fc26c5d09ab04c59b87ef1971a30319a25 [file] [log] [blame]
kjellander@webrtc.org35a17562011-10-06 06:44:54 +00001/*
pwestin@webrtc.orgce330352012-04-12 06:59:14 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
kjellander@webrtc.org35a17562011-10-06 06:44:54 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
kjellander@webrtc.org5b97b122011-12-08 07:42:18 +000010
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/video_coding/codecs/test/videoprocessor.h"
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000012
Yves Gerey3e707812018-11-28 16:47:49 +010013#include <string.h>
ssilkin612f8582017-09-28 09:23:17 -070014#include <algorithm>
Yves Gerey3e707812018-11-28 16:47:49 +010015#include <cstddef>
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000016#include <limits>
Erik Språng08127a92016-11-16 16:41:30 +010017#include <utility>
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000018
Yves Gerey3e707812018-11-28 16:47:49 +010019#include "absl/memory/memory.h"
Mirko Bonadeid9708072019-01-25 20:26:48 +010020#include "api/scoped_refptr.h"
Jiawei Ouc2ebe212018-11-08 10:02:56 -080021#include "api/video/builtin_video_bitrate_allocator_factory.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020022#include "api/video/i420_buffer.h"
Yves Gerey3e707812018-11-28 16:47:49 +010023#include "api/video/video_bitrate_allocator_factory.h"
24#include "api/video/video_frame_buffer.h"
25#include "api/video/video_rotation.h"
26#include "api/video_codecs/video_codec.h"
Mirko Bonadei71207422017-09-15 13:58:09 +020027#include "common_types.h" // NOLINT(build/include)
ssilkin612f8582017-09-28 09:23:17 -070028#include "common_video/h264/h264_common.h"
Rasmus Brandt5f7a8912018-02-28 17:17:15 +010029#include "common_video/libyuv/include/webrtc_libyuv.h"
Sergey Silkin3be2a552018-01-17 15:11:44 +010030#include "modules/rtp_rtcp/include/rtp_rtcp_defines.h"
Yves Gerey3e707812018-11-28 16:47:49 +010031#include "modules/video_coding/codecs/interface/common_constants.h"
Rasmus Brandtd00c8952018-03-14 12:29:57 +010032#include "modules/video_coding/include/video_error_codes.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020033#include "rtc_base/checks.h"
Danil Chapovalovad895282019-03-11 10:28:05 +000034#include "rtc_base/task_utils/to_queued_task.h"
Steve Anton10542f22019-01-11 09:11:00 -080035#include "rtc_base/time_utils.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020036#include "test/gtest.h"
Sergey Silkin8d3758e2018-03-14 11:28:15 +010037#include "third_party/libyuv/include/libyuv/compare.h"
Sergey Silkin10d9d592018-02-01 13:25:17 +010038#include "third_party/libyuv/include/libyuv/scale.h"
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000039
40namespace webrtc {
41namespace test {
42
Kári Tristan Helgason169005d2018-05-22 13:34:14 +020043using FrameStatistics = VideoCodecTestStats::FrameStatistics;
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +010044
Kári Tristan Helgason169005d2018-05-22 13:34:14 +020045namespace {
Åsa Persson91af24a2018-01-24 17:20:18 +010046const int kMsToRtpTimestamp = kVideoPayloadTypeFrequency / 1000;
Sami Kalliomäkic75a5e82018-07-09 13:27:42 +020047const int kMaxBufferedInputFrames = 20;
brandtr17b958c2017-03-07 01:41:43 -080048
Sergey Silkin3be2a552018-01-17 15:11:44 +010049size_t GetMaxNaluSizeBytes(const EncodedImage& encoded_frame,
Kári Tristan Helgason169005d2018-05-22 13:34:14 +020050 const VideoCodecTestFixture::Config& config) {
ssilkin612f8582017-09-28 09:23:17 -070051 if (config.codec_settings.codecType != kVideoCodecH264)
Sergey Silkin3be2a552018-01-17 15:11:44 +010052 return 0;
ssilkin612f8582017-09-28 09:23:17 -070053
54 std::vector<webrtc::H264::NaluIndex> nalu_indices =
Niels Möller77536a22019-01-15 08:50:01 +010055 webrtc::H264::FindNaluIndices(encoded_frame.data(), encoded_frame.size());
ssilkin612f8582017-09-28 09:23:17 -070056
57 RTC_CHECK(!nalu_indices.empty());
58
Sergey Silkin3be2a552018-01-17 15:11:44 +010059 size_t max_size = 0;
ssilkin612f8582017-09-28 09:23:17 -070060 for (const webrtc::H264::NaluIndex& index : nalu_indices)
Sergey Silkin3be2a552018-01-17 15:11:44 +010061 max_size = std::max(max_size, index.payload_size);
ssilkin612f8582017-09-28 09:23:17 -070062
Sergey Silkin3be2a552018-01-17 15:11:44 +010063 return max_size;
ssilkin612f8582017-09-28 09:23:17 -070064}
65
Niels Möllerd3b8c632018-08-27 15:33:42 +020066size_t GetTemporalLayerIndex(const CodecSpecificInfo& codec_specific) {
67 size_t temporal_idx = 0;
Rasmus Brandtd062a3c2018-03-08 16:45:54 +010068 if (codec_specific.codecType == kVideoCodecVP8) {
Niels Möllerd3b8c632018-08-27 15:33:42 +020069 temporal_idx = codec_specific.codecSpecific.VP8.temporalIdx;
Rasmus Brandtd062a3c2018-03-08 16:45:54 +010070 } else if (codec_specific.codecType == kVideoCodecVP9) {
Niels Möllerd3b8c632018-08-27 15:33:42 +020071 temporal_idx = codec_specific.codecSpecific.VP9.temporal_idx;
Rasmus Brandtd062a3c2018-03-08 16:45:54 +010072 }
Niels Möllerd3b8c632018-08-27 15:33:42 +020073 if (temporal_idx == kNoTemporalIdx) {
74 temporal_idx = 0;
Rasmus Brandtd062a3c2018-03-08 16:45:54 +010075 }
Niels Möllerd3b8c632018-08-27 15:33:42 +020076 return temporal_idx;
Rasmus Brandtd062a3c2018-03-08 16:45:54 +010077}
78
asaperssonae9ba042017-03-07 00:25:38 -080079int GetElapsedTimeMicroseconds(int64_t start_ns, int64_t stop_ns) {
80 int64_t diff_us = (stop_ns - start_ns) / rtc::kNumNanosecsPerMicrosec;
81 RTC_DCHECK_GE(diff_us, std::numeric_limits<int>::min());
82 RTC_DCHECK_LE(diff_us, std::numeric_limits<int>::max());
83 return static_cast<int>(diff_us);
84}
85
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +010086void ExtractI420BufferWithSize(const VideoFrame& image,
87 int width,
88 int height,
89 rtc::Buffer* buffer) {
Åsa Perssonf0c44672017-10-24 16:03:39 +020090 if (image.width() != width || image.height() != height) {
91 EXPECT_DOUBLE_EQ(static_cast<double>(width) / height,
92 static_cast<double>(image.width()) / image.height());
93 // Same aspect ratio, no cropping needed.
94 rtc::scoped_refptr<I420Buffer> scaled(I420Buffer::Create(width, height));
95 scaled->ScaleFrom(*image.video_frame_buffer()->ToI420());
96
97 size_t length =
98 CalcBufferSize(VideoType::kI420, scaled->width(), scaled->height());
99 buffer->SetSize(length);
100 RTC_CHECK_NE(ExtractBuffer(scaled, length, buffer->data()), -1);
101 return;
102 }
103
104 // No resize.
105 size_t length =
106 CalcBufferSize(VideoType::kI420, image.width(), image.height());
107 buffer->SetSize(length);
108 RTC_CHECK_NE(ExtractBuffer(image, length, buffer->data()), -1);
109}
110
Sergey Silkin8d3758e2018-03-14 11:28:15 +0100111void CalculateFrameQuality(const I420BufferInterface& ref_buffer,
112 const I420BufferInterface& dec_buffer,
Sergey Silkin6e1402b2019-02-13 09:33:00 +0100113 FrameStatistics* frame_stat,
114 bool calc_ssim) {
Sergey Silkin8d3758e2018-03-14 11:28:15 +0100115 if (ref_buffer.width() != dec_buffer.width() ||
116 ref_buffer.height() != dec_buffer.height()) {
117 RTC_CHECK_GE(ref_buffer.width(), dec_buffer.width());
118 RTC_CHECK_GE(ref_buffer.height(), dec_buffer.height());
119 // Downscale reference frame.
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100120 rtc::scoped_refptr<I420Buffer> scaled_buffer =
Sergey Silkin8d3758e2018-03-14 11:28:15 +0100121 I420Buffer::Create(dec_buffer.width(), dec_buffer.height());
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100122 I420Scale(ref_buffer.DataY(), ref_buffer.StrideY(), ref_buffer.DataU(),
123 ref_buffer.StrideU(), ref_buffer.DataV(), ref_buffer.StrideV(),
124 ref_buffer.width(), ref_buffer.height(),
125 scaled_buffer->MutableDataY(), scaled_buffer->StrideY(),
126 scaled_buffer->MutableDataU(), scaled_buffer->StrideU(),
127 scaled_buffer->MutableDataV(), scaled_buffer->StrideV(),
128 scaled_buffer->width(), scaled_buffer->height(),
129 libyuv::kFilterBox);
Sergey Silkin8d3758e2018-03-14 11:28:15 +0100130
Sergey Silkin6e1402b2019-02-13 09:33:00 +0100131 CalculateFrameQuality(*scaled_buffer, dec_buffer, frame_stat, calc_ssim);
Sergey Silkin8d3758e2018-03-14 11:28:15 +0100132 } else {
133 const uint64_t sse_y = libyuv::ComputeSumSquareErrorPlane(
134 dec_buffer.DataY(), dec_buffer.StrideY(), ref_buffer.DataY(),
135 ref_buffer.StrideY(), dec_buffer.width(), dec_buffer.height());
136
137 const uint64_t sse_u = libyuv::ComputeSumSquareErrorPlane(
138 dec_buffer.DataU(), dec_buffer.StrideU(), ref_buffer.DataU(),
139 ref_buffer.StrideU(), dec_buffer.width() / 2, dec_buffer.height() / 2);
140
141 const uint64_t sse_v = libyuv::ComputeSumSquareErrorPlane(
142 dec_buffer.DataV(), dec_buffer.StrideV(), ref_buffer.DataV(),
143 ref_buffer.StrideV(), dec_buffer.width() / 2, dec_buffer.height() / 2);
144
145 const size_t num_y_samples = dec_buffer.width() * dec_buffer.height();
146 const size_t num_u_samples =
147 dec_buffer.width() / 2 * dec_buffer.height() / 2;
148
149 frame_stat->psnr_y = libyuv::SumSquareErrorToPsnr(sse_y, num_y_samples);
150 frame_stat->psnr_u = libyuv::SumSquareErrorToPsnr(sse_u, num_u_samples);
151 frame_stat->psnr_v = libyuv::SumSquareErrorToPsnr(sse_v, num_u_samples);
152 frame_stat->psnr = libyuv::SumSquareErrorToPsnr(
153 sse_y + sse_u + sse_v, num_y_samples + 2 * num_u_samples);
Sergey Silkin6e1402b2019-02-13 09:33:00 +0100154
155 if (calc_ssim) {
156 frame_stat->ssim = I420SSIM(ref_buffer, dec_buffer);
157 }
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100158 }
159}
160
brandtrb78bc752017-02-22 01:26:59 -0800161} // namespace
162
brandtrc4095522017-08-07 08:12:33 -0700163VideoProcessor::VideoProcessor(webrtc::VideoEncoder* encoder,
Sergey Silkin10d9d592018-02-01 13:25:17 +0100164 VideoDecoderList* decoders,
165 FrameReader* input_frame_reader,
Kári Tristan Helgason169005d2018-05-22 13:34:14 +0200166 const VideoCodecTestFixture::Config& config,
167 VideoCodecTestStats* stats,
Sergey Silkin10d9d592018-02-01 13:25:17 +0100168 IvfFileWriterList* encoded_frame_writers,
169 FrameWriterList* decoded_frame_writers)
Åsa Perssonf0c44672017-10-24 16:03:39 +0200170 : config_(config),
Sergey Silkin10d9d592018-02-01 13:25:17 +0100171 num_simulcast_or_spatial_layers_(
172 std::max(config_.NumberOfSimulcastStreams(),
173 config_.NumberOfSpatialLayers())),
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100174 stats_(stats),
brandtr07734a52017-08-08 08:35:53 -0700175 encoder_(encoder),
Sergey Silkin10d9d592018-02-01 13:25:17 +0100176 decoders_(decoders),
Jiawei Ouc2ebe212018-11-08 10:02:56 -0800177 bitrate_allocator_(
178 CreateBuiltinVideoBitrateAllocatorFactory()
179 ->CreateVideoBitrateAllocator(config_.codec_settings)),
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100180 framerate_fps_(0),
brandtrbdd555c2017-08-21 01:34:04 -0700181 encode_callback_(this),
Sergey Silkin10d9d592018-02-01 13:25:17 +0100182 input_frame_reader_(input_frame_reader),
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100183 merged_encoded_frames_(num_simulcast_or_spatial_layers_),
Sergey Silkin10d9d592018-02-01 13:25:17 +0100184 encoded_frame_writers_(encoded_frame_writers),
185 decoded_frame_writers_(decoded_frame_writers),
Sergey Silkin3be2a552018-01-17 15:11:44 +0100186 last_inputed_frame_num_(0),
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100187 last_inputed_timestamp_(0),
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100188 first_encoded_frame_(num_simulcast_or_spatial_layers_, true),
189 last_encoded_frame_num_(num_simulcast_or_spatial_layers_),
190 first_decoded_frame_(num_simulcast_or_spatial_layers_, true),
Sergey Silkinc89eed92018-04-01 23:57:51 +0200191 last_decoded_frame_num_(num_simulcast_or_spatial_layers_),
Sergey Silkin56138792018-05-02 10:50:55 +0200192 decoded_frame_buffer_(num_simulcast_or_spatial_layers_),
Sergey Silkinc89eed92018-04-01 23:57:51 +0200193 post_encode_time_ns_(0) {
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100194 // Sanity checks.
Danil Chapovalovad895282019-03-11 10:28:05 +0000195 RTC_CHECK(TaskQueueBase::Current())
Rasmus Brandt4b381af2018-02-07 13:56:16 +0100196 << "VideoProcessor must be run on a task queue.";
Sergey Silkin10d9d592018-02-01 13:25:17 +0100197 RTC_CHECK(encoder);
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100198 RTC_CHECK(decoders);
199 RTC_CHECK_EQ(decoders->size(), num_simulcast_or_spatial_layers_);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100200 RTC_CHECK(input_frame_reader);
201 RTC_CHECK(stats);
202 RTC_CHECK(!encoded_frame_writers ||
203 encoded_frame_writers->size() == num_simulcast_or_spatial_layers_);
204 RTC_CHECK(!decoded_frame_writers ||
205 decoded_frame_writers->size() == num_simulcast_or_spatial_layers_);
brandtr17b958c2017-03-07 01:41:43 -0800206
Sergey Silkin10d9d592018-02-01 13:25:17 +0100207 // Setup required callbacks for the encoder and decoder and initialize them.
brandtrbdd555c2017-08-21 01:34:04 -0700208 RTC_CHECK_EQ(encoder_->RegisterEncodeCompleteCallback(&encode_callback_),
Åsa Perssonf0c44672017-10-24 16:03:39 +0200209 WEBRTC_VIDEO_CODEC_OK);
asapersson654d54c2017-02-10 00:16:07 -0800210
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100211 // Initialize codecs so that they are ready to receive frames.
Sergey Silkin1723cf92018-01-22 15:49:55 +0100212 RTC_CHECK_EQ(encoder_->InitEncode(&config_.codec_settings,
213 static_cast<int>(config_.NumberOfCores()),
214 config_.max_payload_size_bytes),
215 WEBRTC_VIDEO_CODEC_OK);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200216
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200217 for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) {
Sergey Silkin645e2e02018-04-06 09:42:13 +0200218 decode_callback_.push_back(
Karl Wiberg918f50c2018-07-05 11:40:33 +0200219 absl::make_unique<VideoProcessorDecodeCompleteCallback>(this, i));
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200220 RTC_CHECK_EQ(
221 decoders_->at(i)->InitDecode(&config_.codec_settings,
222 static_cast<int>(config_.NumberOfCores())),
223 WEBRTC_VIDEO_CODEC_OK);
224 RTC_CHECK_EQ(decoders_->at(i)->RegisterDecodeCompleteCallback(
225 decode_callback_.at(i).get()),
Sergey Silkin10d9d592018-02-01 13:25:17 +0100226 WEBRTC_VIDEO_CODEC_OK);
227 }
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000228}
229
Åsa Perssonf0c44672017-10-24 16:03:39 +0200230VideoProcessor::~VideoProcessor() {
brandtrc8c59052017-08-21 06:44:16 -0700231 RTC_DCHECK_CALLED_SEQUENTIALLY(&sequence_checker_);
232
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100233 // Explicitly reset codecs, in case they don't do that themselves when they
234 // go out of scope.
brandtr77920a42017-08-11 07:48:15 -0700235 RTC_CHECK_EQ(encoder_->Release(), WEBRTC_VIDEO_CODEC_OK);
brandtrbdd555c2017-08-21 01:34:04 -0700236 encoder_->RegisterEncodeCompleteCallback(nullptr);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100237 for (auto& decoder : *decoders_) {
238 RTC_CHECK_EQ(decoder->Release(), WEBRTC_VIDEO_CODEC_OK);
239 decoder->RegisterDecodeCompleteCallback(nullptr);
240 }
241
Rasmus Brandtd00c8952018-03-14 12:29:57 +0100242 // Sanity check.
243 RTC_CHECK_LE(input_frames_.size(), kMaxBufferedInputFrames);
brandtr77920a42017-08-11 07:48:15 -0700244}
245
brandtr8935d972017-09-06 01:53:22 -0700246void VideoProcessor::ProcessFrame() {
brandtrc8c59052017-08-21 06:44:16 -0700247 RTC_DCHECK_CALLED_SEQUENTIALLY(&sequence_checker_);
Sergey Silkin3be2a552018-01-17 15:11:44 +0100248 const size_t frame_number = last_inputed_frame_num_++;
asapersson654d54c2017-02-10 00:16:07 -0800249
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100250 // Get input frame and store for future quality calculation.
251 rtc::scoped_refptr<I420BufferInterface> buffer =
252 input_frame_reader_->ReadFrame();
brandtrbdd555c2017-08-21 01:34:04 -0700253 RTC_CHECK(buffer) << "Tried to read too many frames from the file.";
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100254 const size_t timestamp =
255 last_inputed_timestamp_ + kVideoPayloadTypeFrequency / framerate_fps_;
Artem Titov1ebfb6a2019-01-03 23:49:37 +0100256 VideoFrame input_frame =
257 VideoFrame::Builder()
258 .set_video_frame_buffer(buffer)
259 .set_timestamp_rtp(static_cast<uint32_t>(timestamp))
260 .set_timestamp_ms(static_cast<int64_t>(timestamp / kMsToRtpTimestamp))
261 .set_rotation(webrtc::kVideoRotation_0)
262 .build();
Rasmus Brandtd00c8952018-03-14 12:29:57 +0100263 // Store input frame as a reference for quality calculations.
264 if (config_.decode && !config_.measure_cpu) {
Rasmus Brandt7b92ceb2018-06-26 12:34:59 +0200265 if (input_frames_.size() == kMaxBufferedInputFrames) {
266 input_frames_.erase(input_frames_.begin());
267 }
Rasmus Brandtd00c8952018-03-14 12:29:57 +0100268 input_frames_.emplace(frame_number, input_frame);
269 }
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100270 last_inputed_timestamp_ = timestamp;
brandtr17b958c2017-03-07 01:41:43 -0800271
Sergey Silkinc89eed92018-04-01 23:57:51 +0200272 post_encode_time_ns_ = 0;
273
Rasmus Brandt5f7a8912018-02-28 17:17:15 +0100274 // Create frame statistics object for all simulcast/spatial layers.
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200275 for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) {
Sergey Silkin02fed022018-09-25 13:48:19 +0200276 FrameStatistics frame_stat(frame_number, timestamp, i);
277 stats_->AddFrame(frame_stat);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100278 }
brandtr17b958c2017-03-07 01:41:43 -0800279
280 // For the highest measurement accuracy of the encode time, the start/stop
281 // time recordings should wrap the Encode call as tightly as possible.
Sergey Silkin10d9d592018-02-01 13:25:17 +0100282 const int64_t encode_start_ns = rtc::TimeNanos();
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200283 for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) {
284 FrameStatistics* frame_stat = stats_->GetFrame(frame_number, i);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100285 frame_stat->encode_start_ns = encode_start_ns;
286 }
287
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100288 // Encode.
Niels Möller87e2d782019-03-07 10:18:23 +0100289 const std::vector<VideoFrameType> frame_types =
Niels Möller8f7ce222019-03-21 15:43:58 +0100290 (frame_number == 0)
291 ? std::vector<VideoFrameType>{VideoFrameType::kVideoFrameKey}
292 : std::vector<VideoFrameType>{VideoFrameType::kVideoFrameDelta};
Niels Möllerc8d2e732019-03-06 12:00:33 +0100293 const int encode_return_code = encoder_->Encode(input_frame, &frame_types);
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200294 for (size_t i = 0; i < num_simulcast_or_spatial_layers_; ++i) {
295 FrameStatistics* frame_stat = stats_->GetFrame(frame_number, i);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100296 frame_stat->encode_return_code = encode_return_code;
297 }
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000298}
299
Sergey Silkin3be2a552018-01-17 15:11:44 +0100300void VideoProcessor::SetRates(size_t bitrate_kbps, size_t framerate_fps) {
brandtrc8c59052017-08-21 06:44:16 -0700301 RTC_DCHECK_CALLED_SEQUENTIALLY(&sequence_checker_);
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100302 framerate_fps_ = static_cast<uint32_t>(framerate_fps);
Sergey Silkin3be2a552018-01-17 15:11:44 +0100303 bitrate_allocation_ = bitrate_allocator_->GetAllocation(
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100304 static_cast<uint32_t>(bitrate_kbps * 1000), framerate_fps_);
305 const int set_rates_result =
306 encoder_->SetRateAllocation(bitrate_allocation_, framerate_fps_);
brandtrbea36fd2017-08-07 03:36:54 -0700307 RTC_DCHECK_GE(set_rates_result, 0)
brandtrbdd555c2017-08-21 01:34:04 -0700308 << "Failed to update encoder with new rate " << bitrate_kbps << ".";
brandtrbea36fd2017-08-07 03:36:54 -0700309}
310
Sami Kalliomäki451b29c2018-07-04 14:33:51 +0200311int32_t VideoProcessor::VideoProcessorDecodeCompleteCallback::Decoded(
312 VideoFrame& image) {
313 // Post the callback to the right task queue, if needed.
314 if (!task_queue_->IsCurrent()) {
315 // There might be a limited amount of output buffers, make a copy to make
316 // sure we don't block the decoder.
Artem Titov1ebfb6a2019-01-03 23:49:37 +0100317 VideoFrame copy = VideoFrame::Builder()
318 .set_video_frame_buffer(I420Buffer::Copy(
319 *image.video_frame_buffer()->ToI420()))
320 .set_rotation(image.rotation())
321 .set_timestamp_us(image.timestamp_us())
322 .set_id(image.id())
323 .build();
Sami Kalliomäki451b29c2018-07-04 14:33:51 +0200324 copy.set_timestamp(image.timestamp());
325
Danil Chapovalovad895282019-03-11 10:28:05 +0000326 task_queue_->PostTask(ToQueuedTask([this, copy]() {
Sami Kalliomäki451b29c2018-07-04 14:33:51 +0200327 video_processor_->FrameDecoded(copy, simulcast_svc_idx_);
Danil Chapovalovad895282019-03-11 10:28:05 +0000328 }));
Sami Kalliomäki451b29c2018-07-04 14:33:51 +0200329 return 0;
330 }
331 video_processor_->FrameDecoded(image, simulcast_svc_idx_);
332 return 0;
333}
334
Sergey Silkin10d9d592018-02-01 13:25:17 +0100335void VideoProcessor::FrameEncoded(
336 const webrtc::EncodedImage& encoded_image,
337 const webrtc::CodecSpecificInfo& codec_specific) {
brandtrc8c59052017-08-21 06:44:16 -0700338 RTC_DCHECK_CALLED_SEQUENTIALLY(&sequence_checker_);
339
brandtr32e0d262017-02-15 05:29:38 -0800340 // For the highest measurement accuracy of the encode time, the start/stop
341 // time recordings should wrap the Encode call as tightly as possible.
Rasmus Brandt5f7a8912018-02-28 17:17:15 +0100342 const int64_t encode_stop_ns = rtc::TimeNanos();
brandtr32e0d262017-02-15 05:29:38 -0800343
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100344 const VideoCodecType codec_type = codec_specific.codecType;
Rasmus Brandtf7a35582017-10-24 10:16:33 +0200345 if (config_.encoded_frame_checker) {
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100346 config_.encoded_frame_checker->CheckEncodedFrame(codec_type, encoded_image);
Rasmus Brandtf7a35582017-10-24 10:16:33 +0200347 }
brandtrb78bc752017-02-22 01:26:59 -0800348
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100349 // Layer metadata.
Niels Möllerd3b8c632018-08-27 15:33:42 +0200350 size_t spatial_idx = encoded_image.SpatialIndex().value_or(0);
351 size_t temporal_idx = GetTemporalLayerIndex(codec_specific);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100352
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200353 FrameStatistics* frame_stat =
Niels Möller23775882018-08-16 10:24:12 +0200354 stats_->GetFrameWithTimestamp(encoded_image.Timestamp(), spatial_idx);
Åsa Perssona6e7b882018-01-19 14:57:10 +0100355 const size_t frame_number = frame_stat->frame_number;
Sergey Silkin10d9d592018-02-01 13:25:17 +0100356
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100357 // Ensure that the encode order is monotonically increasing, within this
358 // simulcast/spatial layer.
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200359 RTC_CHECK(first_encoded_frame_[spatial_idx] ||
360 last_encoded_frame_num_[spatial_idx] < frame_number);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100361
362 // Ensure SVC spatial layers are delivered in ascending order.
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200363 if (!first_encoded_frame_[spatial_idx] &&
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100364 config_.NumberOfSpatialLayers() > 1) {
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200365 for (size_t i = 0; i < spatial_idx; ++i) {
Sergey Silkin122ba6c2018-03-27 14:32:21 +0200366 RTC_CHECK_LE(last_encoded_frame_num_[i], frame_number);
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100367 }
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200368 for (size_t i = spatial_idx + 1; i < num_simulcast_or_spatial_layers_;
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100369 ++i) {
370 RTC_CHECK_GT(frame_number, last_encoded_frame_num_[i]);
371 }
Sergey Silkin3be2a552018-01-17 15:11:44 +0100372 }
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200373 first_encoded_frame_[spatial_idx] = false;
374 last_encoded_frame_num_[spatial_idx] = frame_number;
brandtr17b958c2017-03-07 01:41:43 -0800375
brandtr8935d972017-09-06 01:53:22 -0700376 // Update frame statistics.
Sergey Silkin10d9d592018-02-01 13:25:17 +0100377 frame_stat->encoding_successful = true;
Sergey Silkinc89eed92018-04-01 23:57:51 +0200378 frame_stat->encode_time_us = GetElapsedTimeMicroseconds(
379 frame_stat->encode_start_ns, encode_stop_ns - post_encode_time_ns_);
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200380 frame_stat->target_bitrate_kbps =
Sergey Silkinbfd54ef2018-04-13 23:41:11 +0200381 bitrate_allocation_.GetTemporalLayerSum(spatial_idx, temporal_idx) / 1000;
Niels Möller77536a22019-01-15 08:50:01 +0100382 frame_stat->length_bytes = encoded_image.size();
brandtr17b958c2017-03-07 01:41:43 -0800383 frame_stat->frame_type = encoded_image._frameType;
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200384 frame_stat->temporal_idx = temporal_idx;
Sergey Silkin3be2a552018-01-17 15:11:44 +0100385 frame_stat->max_nalu_size_bytes = GetMaxNaluSizeBytes(encoded_image, config_);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100386 frame_stat->qp = encoded_image.qp_;
ssilkin612f8582017-09-28 09:23:17 -0700387
Sergey Silkin645e2e02018-04-06 09:42:13 +0200388 const size_t num_spatial_layers = config_.NumberOfSpatialLayers();
Sergey Silkinbc0f0d32018-04-24 21:29:14 +0200389 bool end_of_picture = false;
Sergey Silkin645e2e02018-04-06 09:42:13 +0200390 if (codec_type == kVideoCodecVP9) {
391 const CodecSpecificInfoVP9& vp9_info = codec_specific.codecSpecific.VP9;
392 frame_stat->inter_layer_predicted = vp9_info.inter_layer_predicted;
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200393 frame_stat->non_ref_for_inter_layer_pred =
394 vp9_info.non_ref_for_inter_layer_pred;
Sergey Silkinbc0f0d32018-04-24 21:29:14 +0200395 end_of_picture = vp9_info.end_of_picture;
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200396 } else {
397 frame_stat->inter_layer_predicted = false;
398 frame_stat->non_ref_for_inter_layer_pred = true;
Sergey Silkin645e2e02018-04-06 09:42:13 +0200399 }
400
Sergey Silkin122ba6c2018-03-27 14:32:21 +0200401 const webrtc::EncodedImage* encoded_image_for_decode = &encoded_image;
Sergey Silkin645e2e02018-04-06 09:42:13 +0200402 if (config_.decode || encoded_frame_writers_) {
403 if (num_spatial_layers > 1) {
404 encoded_image_for_decode = BuildAndStoreSuperframe(
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200405 encoded_image, codec_type, frame_number, spatial_idx,
Sergey Silkin645e2e02018-04-06 09:42:13 +0200406 frame_stat->inter_layer_predicted);
Rasmus Brandtd00c8952018-03-14 12:29:57 +0100407 }
Sergey Silkin645e2e02018-04-06 09:42:13 +0200408 }
409
410 if (config_.decode) {
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200411 DecodeFrame(*encoded_image_for_decode, spatial_idx);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200412
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200413 if (end_of_picture && num_spatial_layers > 1) {
Sergey Silkin645e2e02018-04-06 09:42:13 +0200414 // If inter-layer prediction is enabled and upper layer was dropped then
415 // base layer should be passed to upper layer decoder. Otherwise decoder
416 // won't be able to decode next superframe.
417 const EncodedImage* base_image = nullptr;
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200418 const FrameStatistics* base_stat = nullptr;
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200419 for (size_t i = 0; i < num_spatial_layers; ++i) {
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200420 const bool layer_dropped = (first_decoded_frame_[i] ||
421 last_decoded_frame_num_[i] < frame_number);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200422
423 // Ensure current layer was decoded.
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200424 RTC_CHECK(layer_dropped == false || i != spatial_idx);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200425
426 if (!layer_dropped) {
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200427 base_image = &merged_encoded_frames_[i];
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200428 base_stat =
Niels Möller23775882018-08-16 10:24:12 +0200429 stats_->GetFrameWithTimestamp(encoded_image.Timestamp(), i);
Sergey Silkin3c30c9c2018-05-02 09:18:48 +0200430 } else if (base_image && !base_stat->non_ref_for_inter_layer_pred) {
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200431 DecodeFrame(*base_image, i);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200432 }
433 }
434 }
Rasmus Brandtd00c8952018-03-14 12:29:57 +0100435 } else {
436 frame_stat->decode_return_code = WEBRTC_VIDEO_CODEC_NO_OUTPUT;
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100437 }
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100438
439 if (encoded_frame_writers_) {
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200440 RTC_CHECK(encoded_frame_writers_->at(spatial_idx)
Sergey Silkin122ba6c2018-03-27 14:32:21 +0200441 ->WriteFrame(*encoded_image_for_decode,
442 config_.codec_settings.codecType));
brandtr8935d972017-09-06 01:53:22 -0700443 }
Sergey Silkinc89eed92018-04-01 23:57:51 +0200444
Kári Tristan Helgasonf1677622018-08-24 13:21:26 +0200445 if (!config_.encode_in_real_time) {
Sergey Silkinc89eed92018-04-01 23:57:51 +0200446 // To get pure encode time for next layers, measure time spent in encode
447 // callback and subtract it from encode time of next layers.
448 post_encode_time_ns_ += rtc::TimeNanos() - encode_stop_ns;
449 }
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000450}
451
Sergey Silkin645e2e02018-04-06 09:42:13 +0200452void VideoProcessor::FrameDecoded(const VideoFrame& decoded_frame,
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200453 size_t spatial_idx) {
brandtrc8c59052017-08-21 06:44:16 -0700454 RTC_DCHECK_CALLED_SEQUENTIALLY(&sequence_checker_);
455
brandtr32e0d262017-02-15 05:29:38 -0800456 // For the highest measurement accuracy of the decode time, the start/stop
457 // time recordings should wrap the Decode call as tightly as possible.
Rasmus Brandt5f7a8912018-02-28 17:17:15 +0100458 const int64_t decode_stop_ns = rtc::TimeNanos();
brandtr8bc93852017-02-15 05:19:51 -0800459
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200460 FrameStatistics* frame_stat =
461 stats_->GetFrameWithTimestamp(decoded_frame.timestamp(), spatial_idx);
Åsa Perssona6e7b882018-01-19 14:57:10 +0100462 const size_t frame_number = frame_stat->frame_number;
Sergey Silkin64eaa992017-11-17 14:47:32 +0100463
Sergey Silkin56138792018-05-02 10:50:55 +0200464 if (decoded_frame_writers_ && !first_decoded_frame_[spatial_idx]) {
465 // Fill drops with last decoded frame to make them look like freeze at
466 // playback and to keep decoded layers in sync.
467 for (size_t i = last_decoded_frame_num_[spatial_idx] + 1; i < frame_number;
468 ++i) {
469 RTC_CHECK(decoded_frame_writers_->at(spatial_idx)
470 ->WriteFrame(decoded_frame_buffer_[spatial_idx].data()));
471 }
472 }
473
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100474 // Ensure that the decode order is monotonically increasing, within this
475 // simulcast/spatial layer.
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200476 RTC_CHECK(first_decoded_frame_[spatial_idx] ||
477 last_decoded_frame_num_[spatial_idx] < frame_number);
478 first_decoded_frame_[spatial_idx] = false;
479 last_decoded_frame_num_[spatial_idx] = frame_number;
brandtr17b958c2017-03-07 01:41:43 -0800480
Sergey Silkin10d9d592018-02-01 13:25:17 +0100481 // Update frame statistics.
482 frame_stat->decoding_successful = true;
483 frame_stat->decode_time_us =
484 GetElapsedTimeMicroseconds(frame_stat->decode_start_ns, decode_stop_ns);
485 frame_stat->decoded_width = decoded_frame.width();
486 frame_stat->decoded_height = decoded_frame.height();
487
Sergey Silkin64eaa992017-11-17 14:47:32 +0100488 // Skip quality metrics calculation to not affect CPU usage.
489 if (!config_.measure_cpu) {
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100490 const auto reference_frame = input_frames_.find(frame_number);
491 RTC_CHECK(reference_frame != input_frames_.cend())
492 << "The codecs are either buffering too much, dropping too much, or "
493 "being too slow relative the input frame rate.";
Sergey Silkin6e1402b2019-02-13 09:33:00 +0100494
495 // SSIM calculation is not optimized. Skip it in real-time mode.
496 const bool calc_ssim = !config_.encode_in_real_time;
Sergey Silkin8d3758e2018-03-14 11:28:15 +0100497 CalculateFrameQuality(
498 *reference_frame->second.video_frame_buffer()->ToI420(),
Sergey Silkin6e1402b2019-02-13 09:33:00 +0100499 *decoded_frame.video_frame_buffer()->ToI420(), frame_stat, calc_ssim);
Niels Möller718a7632016-06-13 13:06:01 +0200500
Rasmus Brandtd00c8952018-03-14 12:29:57 +0100501 // Erase all buffered input frames that we have moved past for all
502 // simulcast/spatial layers. Never buffer more than
503 // |kMaxBufferedInputFrames| frames, to protect against long runs of
504 // consecutive frame drops for a particular layer.
505 const auto min_last_decoded_frame_num = std::min_element(
506 last_decoded_frame_num_.cbegin(), last_decoded_frame_num_.cend());
507 const size_t min_buffered_frame_num = std::max(
508 0, static_cast<int>(frame_number) - kMaxBufferedInputFrames + 1);
509 RTC_CHECK(min_last_decoded_frame_num != last_decoded_frame_num_.cend());
510 const auto input_frames_erase_before = input_frames_.lower_bound(
511 std::max(*min_last_decoded_frame_num, min_buffered_frame_num));
512 input_frames_.erase(input_frames_.cbegin(), input_frames_erase_before);
513 }
Sergey Silkin64eaa992017-11-17 14:47:32 +0100514
Sergey Silkin10d9d592018-02-01 13:25:17 +0100515 if (decoded_frame_writers_) {
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100516 ExtractI420BufferWithSize(decoded_frame, config_.codec_settings.width,
Sergey Silkin56138792018-05-02 10:50:55 +0200517 config_.codec_settings.height,
518 &decoded_frame_buffer_[spatial_idx]);
519 RTC_CHECK_EQ(decoded_frame_buffer_[spatial_idx].size(),
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200520 decoded_frame_writers_->at(spatial_idx)->FrameLength());
521 RTC_CHECK(decoded_frame_writers_->at(spatial_idx)
Sergey Silkin56138792018-05-02 10:50:55 +0200522 ->WriteFrame(decoded_frame_buffer_[spatial_idx].data()));
Sergey Silkin64eaa992017-11-17 14:47:32 +0100523 }
Åsa Perssonf0c44672017-10-24 16:03:39 +0200524}
brandtr17b958c2017-03-07 01:41:43 -0800525
Sergey Silkin645e2e02018-04-06 09:42:13 +0200526void VideoProcessor::DecodeFrame(const EncodedImage& encoded_image,
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200527 size_t spatial_idx) {
Sergey Silkin645e2e02018-04-06 09:42:13 +0200528 RTC_DCHECK_CALLED_SEQUENTIALLY(&sequence_checker_);
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200529 FrameStatistics* frame_stat =
Niels Möller23775882018-08-16 10:24:12 +0200530 stats_->GetFrameWithTimestamp(encoded_image.Timestamp(), spatial_idx);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200531
532 frame_stat->decode_start_ns = rtc::TimeNanos();
533 frame_stat->decode_return_code =
Jeroen de Borst2c7b9822019-03-07 19:40:07 +0000534 decoders_->at(spatial_idx)->Decode(encoded_image, false, nullptr, 0);
Sergey Silkin645e2e02018-04-06 09:42:13 +0200535}
536
537const webrtc::EncodedImage* VideoProcessor::BuildAndStoreSuperframe(
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100538 const EncodedImage& encoded_image,
539 const VideoCodecType codec,
540 size_t frame_number,
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200541 size_t spatial_idx,
Sergey Silkin645e2e02018-04-06 09:42:13 +0200542 bool inter_layer_predicted) {
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100543 // Should only be called for SVC.
544 RTC_CHECK_GT(config_.NumberOfSpatialLayers(), 1);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100545
546 EncodedImage base_image;
Niels Möller77536a22019-01-15 08:50:01 +0100547 RTC_CHECK_EQ(base_image.size(), 0);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100548
Sergey Silkin122ba6c2018-03-27 14:32:21 +0200549 // Each SVC layer is decoded with dedicated decoder. Find the nearest
550 // non-dropped base frame and merge it and current frame into superframe.
Sergey Silkin645e2e02018-04-06 09:42:13 +0200551 if (inter_layer_predicted) {
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200552 for (int base_idx = static_cast<int>(spatial_idx) - 1; base_idx >= 0;
Sergey Silkin122ba6c2018-03-27 14:32:21 +0200553 --base_idx) {
554 EncodedImage lower_layer = merged_encoded_frames_.at(base_idx);
Niels Möller23775882018-08-16 10:24:12 +0200555 if (lower_layer.Timestamp() == encoded_image.Timestamp()) {
Sergey Silkin122ba6c2018-03-27 14:32:21 +0200556 base_image = lower_layer;
557 break;
558 }
559 }
Sergey Silkin10d9d592018-02-01 13:25:17 +0100560 }
Niels Möller77536a22019-01-15 08:50:01 +0100561 const size_t payload_size_bytes = base_image.size() + encoded_image.size();
Sergey Silkin10d9d592018-02-01 13:25:17 +0100562
Niels Möller663844d2019-02-14 16:15:54 +0100563 EncodedImage copied_image = encoded_image;
Niels Möller009ab3c2019-03-08 11:26:58 +0100564 copied_image.Allocate(payload_size_bytes);
Niels Möller77536a22019-01-15 08:50:01 +0100565 if (base_image.size()) {
Niels Möller24871e42019-01-17 11:31:13 +0100566 RTC_CHECK(base_image.data());
Niels Möller663844d2019-02-14 16:15:54 +0100567 memcpy(copied_image.data(), base_image.data(), base_image.size());
Sergey Silkin10d9d592018-02-01 13:25:17 +0100568 }
Niels Möller663844d2019-02-14 16:15:54 +0100569 memcpy(copied_image.data() + base_image.size(), encoded_image.data(),
Niels Möller77536a22019-01-15 08:50:01 +0100570 encoded_image.size());
Sergey Silkin10d9d592018-02-01 13:25:17 +0100571
Niels Möller77536a22019-01-15 08:50:01 +0100572 copied_image.set_size(payload_size_bytes);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100573
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100574 // Replace previous EncodedImage for this spatial layer.
Niels Möller663844d2019-02-14 16:15:54 +0100575 merged_encoded_frames_.at(spatial_idx) = std::move(copied_image);
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100576
Sergey Silkinbc20fe12018-04-15 21:06:16 +0200577 return &merged_encoded_frames_.at(spatial_idx);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100578}
579
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000580} // namespace test
581} // namespace webrtc