blob: 64f9c5c878467bb04d35a251c72f278389bce45f [file] [log] [blame]
kjellander@webrtc.org35a17562011-10-06 06:44:54 +00001/*
marpan@webrtc.orgf4c2de92012-06-05 21:07:28 +00002 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
kjellander@webrtc.org35a17562011-10-06 06:44:54 +00003 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
kjellander@webrtc.org5b97b122011-12-08 07:42:18 +000010
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_
12#define MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000013
Yves Gerey3e707812018-11-28 16:47:49 +010014#include <stddef.h>
15#include <stdint.h>
brandtrb57f4262017-08-30 06:29:51 -070016#include <map>
Erik Språng08127a92016-11-16 16:41:30 +010017#include <memory>
Rasmus Brandt001c7822019-03-22 13:41:48 +010018#include <utility>
brandtr17b958c2017-03-07 01:41:43 -080019#include <vector>
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000020
Danil Chapovalov471783f2019-03-11 14:26:02 +010021#include "absl/memory/memory.h"
Yves Gerey3e707812018-11-28 16:47:49 +010022#include "absl/types/optional.h"
Danil Chapovalov471783f2019-03-11 14:26:02 +010023#include "api/task_queue/queued_task.h"
Danil Chapovalovad895282019-03-11 10:28:05 +000024#include "api/task_queue/task_queue_base.h"
Kári Tristan Helgason169005d2018-05-22 13:34:14 +020025#include "api/test/videocodec_test_fixture.h"
Yves Gerey3e707812018-11-28 16:47:49 +010026#include "api/video/encoded_image.h"
27#include "api/video/video_bitrate_allocation.h"
Jiawei Ou4206a0a2018-07-20 15:49:43 -070028#include "api/video/video_bitrate_allocator.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020029#include "api/video/video_frame.h"
Yves Gerey3e707812018-11-28 16:47:49 +010030#include "api/video_codecs/video_decoder.h"
31#include "api/video_codecs/video_encoder.h"
Yves Gerey3e707812018-11-28 16:47:49 +010032#include "modules/include/module_common_types.h"
Rasmus Brandt7d72d0f2019-03-26 16:56:14 +010033#include "modules/video_coding/codecs/test/videocodec_test_stats_impl.h"
Kári Tristan Helgason169005d2018-05-22 13:34:14 +020034#include "modules/video_coding/include/video_codec_interface.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020035#include "modules/video_coding/utility/ivf_file_writer.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020036#include "rtc_base/buffer.h"
Yves Gerey3e707812018-11-28 16:47:49 +010037#include "rtc_base/checks.h"
Steve Anton10542f22019-01-11 09:11:00 -080038#include "rtc_base/constructor_magic.h"
Sebastian Janssonb55015e2019-04-09 13:44:04 +020039#include "rtc_base/synchronization/sequence_checker.h"
Yves Gerey3e707812018-11-28 16:47:49 +010040#include "rtc_base/thread_annotations.h"
41#include "rtc_base/thread_checker.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020042#include "test/testsupport/frame_reader.h"
43#include "test/testsupport/frame_writer.h"
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000044
45namespace webrtc {
46namespace test {
47
// Handles encoding/decoding of video using the VideoEncoder/VideoDecoder
// interfaces. This is done in a sequential manner in order to be able to
// measure times properly.
// The class processes one frame at a time from the configured input file and
// keeps track of how far into the source input file the processing has come.
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000053class VideoProcessor {
54 public:
Sergey Silkin10d9d592018-02-01 13:25:17 +010055 using VideoDecoderList = std::vector<std::unique_ptr<VideoDecoder>>;
Rasmus Brandt001c7822019-03-22 13:41:48 +010056 using LayerKey = std::pair<int /* spatial_idx */, int /* temporal_idx */>;
57 using IvfFileWriterMap = std::map<LayerKey, std::unique_ptr<IvfFileWriter>>;
58 // TODO(brandtr): Consider changing FrameWriterList to be a FrameWriterMap,
59 // to be able to save different TLs separately.
Sergey Silkin10d9d592018-02-01 13:25:17 +010060 using FrameWriterList = std::vector<std::unique_ptr<FrameWriter>>;
61
brandtrc4095522017-08-07 08:12:33 -070062 VideoProcessor(webrtc::VideoEncoder* encoder,
Sergey Silkin10d9d592018-02-01 13:25:17 +010063 VideoDecoderList* decoders,
64 FrameReader* input_frame_reader,
Kári Tristan Helgason169005d2018-05-22 13:34:14 +020065 const VideoCodecTestFixture::Config& config,
Rasmus Brandt7d72d0f2019-03-26 16:56:14 +010066 VideoCodecTestStatsImpl* stats,
Rasmus Brandt001c7822019-03-22 13:41:48 +010067 IvfFileWriterMap* encoded_frame_writers,
Sergey Silkin10d9d592018-02-01 13:25:17 +010068 FrameWriterList* decoded_frame_writers);
brandtrc4095522017-08-07 08:12:33 -070069 ~VideoProcessor();
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000070
Sergey Silkin10d9d592018-02-01 13:25:17 +010071 // Reads a frame and sends it to the encoder. When the encode callback
72 // is received, the encoded frame is buffered. After encoding is finished
73 // buffered frame is sent to decoder. Quality evaluation is done in
74 // the decode callback.
brandtr8935d972017-09-06 01:53:22 -070075 void ProcessFrame();
marpan@webrtc.orgf4c2de92012-06-05 21:07:28 +000076
brandtrbdd555c2017-08-21 01:34:04 -070077 // Updates the encoder with target rates. Must be called at least once.
Sergey Silkin3be2a552018-01-17 15:11:44 +010078 void SetRates(size_t bitrate_kbps, size_t framerate_fps);
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000079
80 private:
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000081 class VideoProcessorEncodeCompleteCallback
pbos@webrtc.org7f7162a2013-07-30 15:18:31 +000082 : public webrtc::EncodedImageCallback {
kjellander@webrtc.org35a17562011-10-06 06:44:54 +000083 public:
brandtrc4095522017-08-07 08:12:33 -070084 explicit VideoProcessorEncodeCompleteCallback(
85 VideoProcessor* video_processor)
brandtrc8c59052017-08-21 06:44:16 -070086 : video_processor_(video_processor),
Danil Chapovalovad895282019-03-11 10:28:05 +000087 task_queue_(TaskQueueBase::Current()) {
Rasmus Brandt5f7a8912018-02-28 17:17:15 +010088 RTC_DCHECK(video_processor_);
Rasmus Brandt4b381af2018-02-07 13:56:16 +010089 RTC_DCHECK(task_queue_);
90 }
brandtrc8c59052017-08-21 06:44:16 -070091
Sergey Ulanov525df3f2016-08-02 17:46:41 -070092 Result OnEncodedImage(
pbos@webrtc.org273a4142014-12-01 15:23:21 +000093 const webrtc::EncodedImage& encoded_image,
94 const webrtc::CodecSpecificInfo* codec_specific_info,
brandtr8bc93852017-02-15 05:19:51 -080095 const webrtc::RTPFragmentationHeader* fragmentation) override {
brandtr8bc93852017-02-15 05:19:51 -080096 RTC_CHECK(codec_specific_info);
brandtrc8c59052017-08-21 06:44:16 -070097
Rasmus Brandt4b381af2018-02-07 13:56:16 +010098 // Post the callback to the right task queue, if needed.
99 if (!task_queue_->IsCurrent()) {
Danil Chapovalov471783f2019-03-11 14:26:02 +0100100 task_queue_->PostTask(absl::make_unique<EncodeCallbackTask>(
101 video_processor_, encoded_image, codec_specific_info));
brandtrc8c59052017-08-21 06:44:16 -0700102 return Result(Result::OK, 0);
103 }
104
Sergey Silkin10d9d592018-02-01 13:25:17 +0100105 video_processor_->FrameEncoded(encoded_image, *codec_specific_info);
brandtr8bc93852017-02-15 05:19:51 -0800106 return Result(Result::OK, 0);
107 }
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000108
109 private:
Danil Chapovalov471783f2019-03-11 14:26:02 +0100110 class EncodeCallbackTask : public QueuedTask {
brandtrc8c59052017-08-21 06:44:16 -0700111 public:
112 EncodeCallbackTask(VideoProcessor* video_processor,
113 const webrtc::EncodedImage& encoded_image,
brandtr45535622017-08-22 03:33:11 -0700114 const webrtc::CodecSpecificInfo* codec_specific_info)
brandtrc8c59052017-08-21 06:44:16 -0700115 : video_processor_(video_processor),
brandtrc8c59052017-08-21 06:44:16 -0700116 encoded_image_(encoded_image),
117 codec_specific_info_(*codec_specific_info) {
Niels Möller663844d2019-02-14 16:15:54 +0100118 encoded_image_.Retain();
brandtrc8c59052017-08-21 06:44:16 -0700119 }
120
121 bool Run() override {
Sergey Silkin10d9d592018-02-01 13:25:17 +0100122 video_processor_->FrameEncoded(encoded_image_, codec_specific_info_);
brandtrc8c59052017-08-21 06:44:16 -0700123 return true;
124 }
125
126 private:
127 VideoProcessor* const video_processor_;
brandtrc8c59052017-08-21 06:44:16 -0700128 webrtc::EncodedImage encoded_image_;
129 const webrtc::CodecSpecificInfo codec_specific_info_;
brandtrc8c59052017-08-21 06:44:16 -0700130 };
131
brandtrc4095522017-08-07 08:12:33 -0700132 VideoProcessor* const video_processor_;
Danil Chapovalovad895282019-03-11 10:28:05 +0000133 TaskQueueBase* const task_queue_;
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000134 };
135
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000136 class VideoProcessorDecodeCompleteCallback
philipelcce46fc2015-12-21 03:04:49 -0800137 : public webrtc::DecodedImageCallback {
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000138 public:
brandtrc4095522017-08-07 08:12:33 -0700139 explicit VideoProcessorDecodeCompleteCallback(
Sergey Silkin645e2e02018-04-06 09:42:13 +0200140 VideoProcessor* video_processor,
141 size_t simulcast_svc_idx)
brandtrc8c59052017-08-21 06:44:16 -0700142 : video_processor_(video_processor),
Sergey Silkin645e2e02018-04-06 09:42:13 +0200143 simulcast_svc_idx_(simulcast_svc_idx),
Danil Chapovalovad895282019-03-11 10:28:05 +0000144 task_queue_(TaskQueueBase::Current()) {
Rasmus Brandt5f7a8912018-02-28 17:17:15 +0100145 RTC_DCHECK(video_processor_);
Rasmus Brandt4b381af2018-02-07 13:56:16 +0100146 RTC_DCHECK(task_queue_);
147 }
brandtrc8c59052017-08-21 06:44:16 -0700148
Sami Kalliomäki451b29c2018-07-04 14:33:51 +0200149 int32_t Decoded(webrtc::VideoFrame& image) override;
brandtrc8c59052017-08-21 06:44:16 -0700150
philipelcce46fc2015-12-21 03:04:49 -0800151 int32_t Decoded(webrtc::VideoFrame& image,
152 int64_t decode_time_ms) override {
brandtr6bb8e0e2017-02-20 04:35:52 -0800153 return Decoded(image);
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000154 }
brandtrc8c59052017-08-21 06:44:16 -0700155
brandtr6bb8e0e2017-02-20 04:35:52 -0800156 void Decoded(webrtc::VideoFrame& image,
Danil Chapovalov0040b662018-06-18 10:48:16 +0200157 absl::optional<int32_t> decode_time_ms,
158 absl::optional<uint8_t> qp) override {
brandtrbea36fd2017-08-07 03:36:54 -0700159 Decoded(image);
sakalcc452e12017-02-09 04:53:45 -0800160 }
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000161
162 private:
brandtrc4095522017-08-07 08:12:33 -0700163 VideoProcessor* const video_processor_;
Sergey Silkin645e2e02018-04-06 09:42:13 +0200164 const size_t simulcast_svc_idx_;
Danil Chapovalovad895282019-03-11 10:28:05 +0000165 TaskQueueBase* const task_queue_;
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000166 };
brandtr8bc93852017-02-15 05:19:51 -0800167
brandtrbdd555c2017-08-21 01:34:04 -0700168 // Invoked by the callback adapter when a frame has completed encoding.
Sergey Silkin10d9d592018-02-01 13:25:17 +0100169 void FrameEncoded(const webrtc::EncodedImage& encoded_image,
170 const webrtc::CodecSpecificInfo& codec_specific);
brandtr8bc93852017-02-15 05:19:51 -0800171
brandtrbdd555c2017-08-21 01:34:04 -0700172 // Invoked by the callback adapter when a frame has completed decoding.
Sergey Silkin645e2e02018-04-06 09:42:13 +0200173 void FrameDecoded(const webrtc::VideoFrame& image, size_t simulcast_svc_idx);
174
175 void DecodeFrame(const EncodedImage& encoded_image, size_t simulcast_svc_idx);
brandtr8bc93852017-02-15 05:19:51 -0800176
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100177 // In order to supply the SVC decoders with super frames containing all
178 // lower layer frames, we merge and store the layer frames in this method.
Sergey Silkin645e2e02018-04-06 09:42:13 +0200179 const webrtc::EncodedImage* BuildAndStoreSuperframe(
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100180 const EncodedImage& encoded_image,
181 const VideoCodecType codec,
182 size_t frame_number,
Sergey Silkin645e2e02018-04-06 09:42:13 +0200183 size_t simulcast_svc_idx,
184 bool inter_layer_predicted) RTC_RUN_ON(sequence_checker_);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100185
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100186 // Test input/output.
Kári Tristan Helgason169005d2018-05-22 13:34:14 +0200187 VideoCodecTestFixture::Config config_ RTC_GUARDED_BY(sequence_checker_);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100188 const size_t num_simulcast_or_spatial_layers_;
Rasmus Brandt7d72d0f2019-03-26 16:56:14 +0100189 VideoCodecTestStatsImpl* const stats_;
Sergey Silkin10d9d592018-02-01 13:25:17 +0100190
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100191 // Codecs.
brandtr8bc93852017-02-15 05:19:51 -0800192 webrtc::VideoEncoder* const encoder_;
Sergey Silkin10d9d592018-02-01 13:25:17 +0100193 VideoDecoderList* const decoders_;
brandtraebc61e2017-02-28 07:13:47 -0800194 const std::unique_ptr<VideoBitrateAllocator> bitrate_allocator_;
Erik Språng566124a2018-04-23 12:32:22 +0200195 VideoBitrateAllocation bitrate_allocation_ RTC_GUARDED_BY(sequence_checker_);
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100196 uint32_t framerate_fps_ RTC_GUARDED_BY(sequence_checker_);
brandtraebc61e2017-02-28 07:13:47 -0800197
198 // Adapters for the codec callbacks.
brandtrbdd555c2017-08-21 01:34:04 -0700199 VideoProcessorEncodeCompleteCallback encode_callback_;
Sergey Silkin645e2e02018-04-06 09:42:13 +0200200 // Assign separate callback object to each decoder. This allows us to identify
201 // decoded layer in frame decode callback.
202 // simulcast_svc_idx -> decode callback.
203 std::vector<std::unique_ptr<VideoProcessorDecodeCompleteCallback>>
204 decode_callback_;
brandtraebc61e2017-02-28 07:13:47 -0800205
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100206 // Each call to ProcessFrame() will read one frame from |input_frame_reader_|.
207 FrameReader* const input_frame_reader_;
208
209 // Input frames are used as reference for frame quality evaluations.
Sergey Silkin64eaa992017-11-17 14:47:32 +0100210 // Async codecs might queue frames. To handle that we keep input frame
211 // and release it after corresponding coded frame is decoded and quality
212 // measurement is done.
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100213 // frame_number -> frame.
214 std::map<size_t, VideoFrame> input_frames_ RTC_GUARDED_BY(sequence_checker_);
Sergey Silkin10d9d592018-02-01 13:25:17 +0100215
216 // Encoder delivers coded frame layer-by-layer. We store coded frames and
217 // then, after all layers are encoded, decode them. Such separation of
218 // frame processing on superframe level simplifies encoding/decoding time
219 // measurement.
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100220 // simulcast_svc_idx -> merged SVC encoded frame.
221 std::vector<EncodedImage> merged_encoded_frames_
Sergey Silkin10d9d592018-02-01 13:25:17 +0100222 RTC_GUARDED_BY(sequence_checker_);
223
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100224 // These (optional) file writers are used to persistently store the encoded
225 // and decoded bitstreams. Each frame writer is enabled by being non-null.
Rasmus Brandt001c7822019-03-22 13:41:48 +0100226 IvfFileWriterMap* const encoded_frame_writers_;
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100227 FrameWriterList* const decoded_frame_writers_;
brandtr8bc93852017-02-15 05:19:51 -0800228
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100229 // Metadata for inputed/encoded/decoded frames. Used for frame identification,
230 // frame drop detection, etc. We assume that encoded/decoded frames are
231 // ordered within each simulcast/spatial layer, but we do not make any
232 // assumptions of frame ordering between layers.
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100233 size_t last_inputed_frame_num_ RTC_GUARDED_BY(sequence_checker_);
234 size_t last_inputed_timestamp_ RTC_GUARDED_BY(sequence_checker_);
Rasmus Brandt0f1c0bd2018-03-12 10:01:16 +0100235 // simulcast_svc_idx -> encode status.
236 std::vector<bool> first_encoded_frame_ RTC_GUARDED_BY(sequence_checker_);
237 // simulcast_svc_idx -> frame_number.
238 std::vector<size_t> last_encoded_frame_num_ RTC_GUARDED_BY(sequence_checker_);
239 // simulcast_svc_idx -> decode status.
240 std::vector<bool> first_decoded_frame_ RTC_GUARDED_BY(sequence_checker_);
241 // simulcast_svc_idx -> frame_number.
242 std::vector<size_t> last_decoded_frame_num_ RTC_GUARDED_BY(sequence_checker_);
Sergey Silkin56138792018-05-02 10:50:55 +0200243 // simulcast_svc_idx -> buffer.
244 std::vector<rtc::Buffer> decoded_frame_buffer_
245 RTC_GUARDED_BY(sequence_checker_);
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100246
Sergey Silkinc89eed92018-04-01 23:57:51 +0200247 // Time spent in frame encode callback. It is accumulated for layers and
248 // reset when frame encode starts. When next layer is encoded post-encode time
249 // is substracted from measured encode time. Thus we get pure encode time.
250 int64_t post_encode_time_ns_ RTC_GUARDED_BY(sequence_checker_);
251
Rasmus Brandtd062a3c2018-03-08 16:45:54 +0100252 // This class must be operated on a TaskQueue.
Sebastian Janssonb55015e2019-04-09 13:44:04 +0200253 SequenceChecker sequence_checker_;
brandtrbdd555c2017-08-21 01:34:04 -0700254
255 RTC_DISALLOW_COPY_AND_ASSIGN(VideoProcessor);
kjellander@webrtc.org35a17562011-10-06 06:44:54 +0000256};
257
258} // namespace test
259} // namespace webrtc
260
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200261#endif // MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_