/*
 * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/video_coding/include/video_codec_initializer.h"
Erik Språng08127a92016-11-16 16:41:30 +010012
Yves Gerey3e707812018-11-28 16:47:49 +010013#include <stdint.h>
14#include <string.h>
Jonas Olssona4d87372019-07-05 19:08:33 +020015
Yves Gerey3e707812018-11-28 16:47:49 +010016#include <algorithm>
17
18#include "absl/types/optional.h"
Mirko Bonadeid9708072019-01-25 20:26:48 +010019#include "api/scoped_refptr.h"
Elad Alonc67a4d62019-10-11 16:54:18 +020020#include "api/units/data_rate.h"
Yves Gerey3e707812018-11-28 16:47:49 +010021#include "api/video/video_bitrate_allocation.h"
Anders Carlssondd8c1652018-01-30 10:32:13 +010022#include "api/video_codecs/video_encoder.h"
Danil Chapovalov4005e5a2020-11-25 17:01:22 +010023#include "modules/video_coding/codecs/av1/av1_svc_config.h"
Niels Möller05954892022-05-13 13:34:37 +020024#include "modules/video_coding/codecs/vp8/vp8_scalability.h"
Sergey Silkin86684962018-03-28 19:32:37 +020025#include "modules/video_coding/codecs/vp9/svc_config.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020026#include "modules/video_coding/include/video_coding_defines.h"
Niels Möller05954892022-05-13 13:34:37 +020027#include "modules/video_coding/svc/scalability_mode_util.h"
Yves Gerey3e707812018-11-28 16:47:49 +010028#include "rtc_base/checks.h"
Elad Alonc67a4d62019-10-11 16:54:18 +020029#include "rtc_base/experiments/min_video_bitrate_experiment.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020030#include "rtc_base/logging.h"
Elad Alonc67a4d62019-10-11 16:54:18 +020031#include "rtc_base/numerics/safe_conversions.h"
Erik Språng08127a92016-11-16 16:41:30 +010032
33namespace webrtc {
34
Jiawei Ouc2ebe212018-11-08 10:02:56 -080035bool VideoCodecInitializer::SetupCodec(const VideoEncoderConfig& config,
36 const std::vector<VideoStream>& streams,
37 VideoCodec* codec) {
Niels Möller259a4972018-04-05 15:36:51 +020038 if (config.codec_type == kVideoCodecMultiplex) {
Niels Möller24a842a2018-03-22 08:52:50 +010039 VideoEncoderConfig associated_config = config.Copy();
40 associated_config.codec_type = kVideoCodecVP9;
Jiawei Ouc2ebe212018-11-08 10:02:56 -080041 if (!SetupCodec(associated_config, streams, codec)) {
Emircan Uysaler0a375472017-12-11 12:21:02 +053042 RTC_LOG(LS_ERROR) << "Failed to create stereo encoder configuration.";
43 return false;
44 }
Emircan Uysalerd7ae3c32018-01-25 13:01:09 -080045 codec->codecType = kVideoCodecMultiplex;
Emircan Uysaler0a375472017-12-11 12:21:02 +053046 return true;
47 }
48
Yves Gerey665174f2018-06-19 15:03:05 +020049 *codec = VideoEncoderConfigToVideoCodec(config, streams);
Erik Språng08127a92016-11-16 16:41:30 +010050 return true;
51}
52
Erik Språng08127a92016-11-16 16:41:30 +010053// TODO(sprang): Split this up and separate the codec specific parts.
54VideoCodec VideoCodecInitializer::VideoEncoderConfigToVideoCodec(
55 const VideoEncoderConfig& config,
Niels Möllerf1338562018-04-26 09:51:47 +020056 const std::vector<VideoStream>& streams) {
Erik Språng08127a92016-11-16 16:41:30 +010057 static const int kEncoderMinBitrateKbps = 30;
58 RTC_DCHECK(!streams.empty());
59 RTC_DCHECK_GE(config.min_transmit_bitrate_bps, 0);
60
61 VideoCodec video_codec;
Niels Möller259a4972018-04-05 15:36:51 +020062 video_codec.codecType = config.codec_type;
Erik Språng08127a92016-11-16 16:41:30 +010063
64 switch (config.content_type) {
65 case VideoEncoderConfig::ContentType::kRealtimeVideo:
Niels Möllere3cf3d02018-06-13 11:52:16 +020066 video_codec.mode = VideoCodecMode::kRealtimeVideo;
Erik Språng08127a92016-11-16 16:41:30 +010067 break;
68 case VideoEncoderConfig::ContentType::kScreen:
Niels Möllere3cf3d02018-06-13 11:52:16 +020069 video_codec.mode = VideoCodecMode::kScreensharing;
Erik Språng08127a92016-11-16 16:41:30 +010070 break;
71 }
72
Florent Castellid3511012020-08-04 11:40:23 +020073 video_codec.legacy_conference_mode =
74 config.content_type == VideoEncoderConfig::ContentType::kScreen &&
75 config.legacy_conference_mode;
76
Niels Möller807328f2022-05-12 16:16:39 +020077 video_codec.SetFrameDropEnabled(config.frame_drop_enabled);
Erik Språng08127a92016-11-16 16:41:30 +010078 video_codec.numberOfSimulcastStreams =
79 static_cast<unsigned char>(streams.size());
80 video_codec.minBitrate = streams[0].min_bitrate_bps / 1000;
Seth Hampson46e31ba2018-01-18 10:39:54 -080081 bool codec_active = false;
Artem Titovdcd7fc72021-08-09 13:02:57 +020082 // Active configuration might not be fully copied to `streams` for SVC yet.
83 // Therefore the `config` is checked here.
Ilya Nikolaevskiy7a824672020-06-18 19:16:53 +020084 for (const VideoStream& stream : config.simulcast_layers) {
Seth Hampson46e31ba2018-01-18 10:39:54 -080085 if (stream.active) {
86 codec_active = true;
87 break;
88 }
89 }
90 // Set active for the entire video codec for the non simulcast case.
91 video_codec.active = codec_active;
Erik Språng08127a92016-11-16 16:41:30 +010092 if (video_codec.minBitrate < kEncoderMinBitrateKbps)
93 video_codec.minBitrate = kEncoderMinBitrateKbps;
ilnik04f4d122017-06-19 07:18:55 -070094 video_codec.timing_frame_thresholds = {kDefaultTimingFramesDelayMs,
95 kDefaultOutlierFrameSizePercent};
kwiberg352444f2016-11-28 15:58:53 -080096 RTC_DCHECK_LE(streams.size(), kMaxSimulcastStreams);
Sergey Silkin86684962018-03-28 19:32:37 +020097
Florent Castelli907dc802019-12-06 15:03:19 +010098 int max_framerate = 0;
99
Niels Möller79d566b2022-04-29 11:03:13 +0200100 absl::optional<ScalabilityMode> scalability_mode =
101 streams[0].scalability_mode;
Erik Språng08127a92016-11-16 16:41:30 +0100102 for (size_t i = 0; i < streams.size(); ++i) {
Niels Möllerc0a9f352022-05-20 13:38:49 +0200103 SimulcastStream* sim_stream = &video_codec.simulcastStream[i];
kwibergaf476c72016-11-28 15:21:39 -0800104 RTC_DCHECK_GT(streams[i].width, 0);
105 RTC_DCHECK_GT(streams[i].height, 0);
Erik Språng08127a92016-11-16 16:41:30 +0100106 RTC_DCHECK_GT(streams[i].max_framerate, 0);
Erik Språng08127a92016-11-16 16:41:30 +0100107 RTC_DCHECK_GE(streams[i].min_bitrate_bps, 0);
108 RTC_DCHECK_GE(streams[i].target_bitrate_bps, streams[i].min_bitrate_bps);
109 RTC_DCHECK_GE(streams[i].max_bitrate_bps, streams[i].target_bitrate_bps);
110 RTC_DCHECK_GE(streams[i].max_qp, 0);
111
112 sim_stream->width = static_cast<uint16_t>(streams[i].width);
113 sim_stream->height = static_cast<uint16_t>(streams[i].height);
Sergey Silkin1946a3f2018-08-22 11:42:16 +0200114 sim_stream->maxFramerate = streams[i].max_framerate;
Erik Språng08127a92016-11-16 16:41:30 +0100115 sim_stream->minBitrate = streams[i].min_bitrate_bps / 1000;
116 sim_stream->targetBitrate = streams[i].target_bitrate_bps / 1000;
117 sim_stream->maxBitrate = streams[i].max_bitrate_bps / 1000;
118 sim_stream->qpMax = streams[i].max_qp;
Niels Möller05954892022-05-13 13:34:37 +0200119
120 int num_temporal_layers =
121 streams[i].scalability_mode.has_value()
122 ? ScalabilityModeToNumTemporalLayers(*streams[i].scalability_mode)
123 : streams[i].num_temporal_layers.value_or(1);
124
Sergey Silkina796a7e2018-03-01 15:11:29 +0100125 sim_stream->numberOfTemporalLayers =
Niels Möller05954892022-05-13 13:34:37 +0200126 static_cast<unsigned char>(num_temporal_layers);
Seth Hampson46e31ba2018-01-18 10:39:54 -0800127 sim_stream->active = streams[i].active;
Erik Språng08127a92016-11-16 16:41:30 +0100128
129 video_codec.width =
Danil Chapovalov350531e2018-06-08 11:04:04 +0000130 std::max(video_codec.width, static_cast<uint16_t>(streams[i].width));
Erik Språng08127a92016-11-16 16:41:30 +0100131 video_codec.height =
Danil Chapovalov350531e2018-06-08 11:04:04 +0000132 std::max(video_codec.height, static_cast<uint16_t>(streams[i].height));
Erik Språng08127a92016-11-16 16:41:30 +0100133 video_codec.minBitrate =
134 std::min(static_cast<uint16_t>(video_codec.minBitrate),
135 static_cast<uint16_t>(streams[i].min_bitrate_bps / 1000));
136 video_codec.maxBitrate += streams[i].max_bitrate_bps / 1000;
137 video_codec.qpMax = std::max(video_codec.qpMax,
138 static_cast<unsigned int>(streams[i].max_qp));
Florent Castelli907dc802019-12-06 15:03:19 +0100139 max_framerate = std::max(max_framerate, streams[i].max_framerate);
philipel87e99092020-11-18 11:52:04 +0100140
Niels Möller05954892022-05-13 13:34:37 +0200141 // TODO(bugs.webrtc.org/11607): Since scalability mode is a top-level
142 // setting on VideoCodec, setting it makes sense only if it is the same for
143 // all simulcast streams.
philipel87e99092020-11-18 11:52:04 +0100144 if (streams[0].scalability_mode != streams[i].scalability_mode) {
philipel87e99092020-11-18 11:52:04 +0100145 scalability_mode.reset();
Niels Möller05954892022-05-13 13:34:37 +0200146 // For VP8, top-level scalability mode doesn't matter, since configuration
147 // is based on the per-simulcast stream configuration of temporal layers.
148 if (video_codec.codecType != kVideoCodecVP8) {
149 RTC_LOG(LS_WARNING) << "Inconsistent scalability modes configured.";
150 }
philipel87e99092020-11-18 11:52:04 +0100151 }
152 }
153
154 if (scalability_mode.has_value()) {
155 video_codec.SetScalabilityMode(*scalability_mode);
Erik Språng08127a92016-11-16 16:41:30 +0100156 }
157
158 if (video_codec.maxBitrate == 0) {
159 // Unset max bitrate -> cap to one bit per pixel.
160 video_codec.maxBitrate =
161 (video_codec.width * video_codec.height * video_codec.maxFramerate) /
162 1000;
163 }
164 if (video_codec.maxBitrate < kEncoderMinBitrateKbps)
165 video_codec.maxBitrate = kEncoderMinBitrateKbps;
166
Florent Castelli907dc802019-12-06 15:03:19 +0100167 video_codec.maxFramerate = max_framerate;
Per Kjellanderf86cf4c2020-12-30 15:27:35 +0100168 video_codec.spatialLayers[0] = {0};
169 video_codec.spatialLayers[0].width = video_codec.width;
170 video_codec.spatialLayers[0].height = video_codec.height;
171 video_codec.spatialLayers[0].maxFramerate = max_framerate;
172 video_codec.spatialLayers[0].numberOfTemporalLayers =
173 streams[0].num_temporal_layers.value_or(1);
Sergey Silkin86684962018-03-28 19:32:37 +0200174
175 // Set codec specific options
176 if (config.encoder_specific_settings)
177 config.encoder_specific_settings->FillEncoderSpecificSettings(&video_codec);
178
179 switch (video_codec.codecType) {
180 case kVideoCodecVP8: {
181 if (!config.encoder_specific_settings) {
182 *video_codec.VP8() = VideoEncoder::GetDefaultVp8Settings();
183 }
184
Niels Möller05954892022-05-13 13:34:37 +0200185 // Validate specified scalability modes. If some layer has an unsupported
186 // mode, store it as the top-level scalability mode, which will make
187 // InitEncode fail with an appropriate error.
188 for (const auto& stream : streams) {
189 if (stream.scalability_mode.has_value() &&
190 !VP8SupportsScalabilityMode(*stream.scalability_mode)) {
191 RTC_LOG(LS_WARNING)
192 << "Invalid scalability mode for VP8: "
193 << ScalabilityModeToString(*stream.scalability_mode);
194 video_codec.SetScalabilityMode(*stream.scalability_mode);
195 break;
196 }
197 }
198 video_codec.VP8()->numberOfTemporalLayers =
199 streams.back().scalability_mode.has_value()
200 ? ScalabilityModeToNumTemporalLayers(
201 *streams.back().scalability_mode)
202 : streams.back().num_temporal_layers.value_or(
203 video_codec.VP8()->numberOfTemporalLayers);
204
Sergey Silkin86684962018-03-28 19:32:37 +0200205 RTC_DCHECK_GE(video_codec.VP8()->numberOfTemporalLayers, 1);
206 RTC_DCHECK_LE(video_codec.VP8()->numberOfTemporalLayers,
207 kMaxTemporalStreams);
208
Sergey Silkin86684962018-03-28 19:32:37 +0200209 break;
210 }
211 case kVideoCodecVP9: {
Ilya Nikolaevskiy72859e52020-02-05 17:31:00 +0100212 // Force the first stream to always be active.
213 video_codec.simulcastStream[0].active = codec_active;
214
Sergey Silkin86684962018-03-28 19:32:37 +0200215 if (!config.encoder_specific_settings) {
216 *video_codec.VP9() = VideoEncoder::GetDefaultVp9Settings();
217 }
218
219 video_codec.VP9()->numberOfTemporalLayers = static_cast<unsigned char>(
220 streams.back().num_temporal_layers.value_or(
221 video_codec.VP9()->numberOfTemporalLayers));
222 RTC_DCHECK_GE(video_codec.VP9()->numberOfTemporalLayers, 1);
223 RTC_DCHECK_LE(video_codec.VP9()->numberOfTemporalLayers,
224 kMaxTemporalStreams);
225
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200226 RTC_DCHECK(config.spatial_layers.empty() ||
227 config.spatial_layers.size() ==
228 video_codec.VP9()->numberOfSpatialLayers);
229
230 std::vector<SpatialLayer> spatial_layers;
231 if (!config.spatial_layers.empty()) {
232 // Layering is set explicitly.
233 spatial_layers = config.spatial_layers;
Asa Perssoncde992d2022-05-16 22:37:34 +0200234 } else if (scalability_mode.has_value()) {
235 // Layering is set via scalability mode.
236 spatial_layers = GetVp9SvcConfig(video_codec);
237 if (spatial_layers.empty())
238 break;
Sergey Silkin86684962018-03-28 19:32:37 +0200239 } else {
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200240 size_t first_active_layer = 0;
Ilya Nikolaevskiy03d90962020-02-11 12:50:38 +0100241 for (size_t spatial_idx = 0;
242 spatial_idx < config.simulcast_layers.size(); ++spatial_idx) {
243 if (config.simulcast_layers[spatial_idx].active) {
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200244 first_active_layer = spatial_idx;
Ilya Nikolaevskiy03d90962020-02-11 12:50:38 +0100245 break;
246 }
247 }
248
Sergey Silkin1946a3f2018-08-22 11:42:16 +0200249 spatial_layers = GetSvcConfig(
250 video_codec.width, video_codec.height, video_codec.maxFramerate,
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200251 first_active_layer, video_codec.VP9()->numberOfSpatialLayers,
Sergey Silkin1946a3f2018-08-22 11:42:16 +0200252 video_codec.VP9()->numberOfTemporalLayers,
253 video_codec.mode == VideoCodecMode::kScreensharing);
Sergey Silkin86684962018-03-28 19:32:37 +0200254
Sergey Silkin33120922018-11-28 13:32:13 +0100255 // If there was no request for spatial layering, don't limit bitrate
256 // of single spatial layer.
257 const bool no_spatial_layering =
258 video_codec.VP9()->numberOfSpatialLayers <= 1;
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200259 if (no_spatial_layering) {
260 // Use codec's bitrate limits.
261 spatial_layers.back().minBitrate = video_codec.minBitrate;
Ilya Nikolaevskiy9ef5e052019-03-05 10:08:35 +0100262 spatial_layers.back().targetBitrate = video_codec.maxBitrate;
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200263 spatial_layers.back().maxBitrate = video_codec.maxBitrate;
Sergey Silkin86684962018-03-28 19:32:37 +0200264 }
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100265
Ilya Nikolaevskiy7a824672020-06-18 19:16:53 +0200266 for (size_t spatial_idx = first_active_layer;
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100267 spatial_idx < config.simulcast_layers.size() &&
Ilya Nikolaevskiya945cda2020-09-22 15:55:23 +0200268 spatial_idx < spatial_layers.size() + first_active_layer;
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100269 ++spatial_idx) {
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200270 spatial_layers[spatial_idx - first_active_layer].active =
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100271 config.simulcast_layers[spatial_idx].active;
272 }
Sergey Silkin86684962018-03-28 19:32:37 +0200273 }
274
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200275 RTC_DCHECK(!spatial_layers.empty());
276 for (size_t i = 0; i < spatial_layers.size(); ++i) {
277 video_codec.spatialLayers[i] = spatial_layers[i];
278 }
279
Ilya Nikolaevskiy09eb6e22020-06-05 12:36:32 +0200280 // The top spatial layer dimensions may not be equal to the input
281 // resolution because of the rounding or explicit configuration.
282 // This difference must be propagated to the stream configuration.
283 video_codec.width = spatial_layers.back().width;
284 video_codec.height = spatial_layers.back().height;
285 video_codec.simulcastStream[0].width = spatial_layers.back().width;
286 video_codec.simulcastStream[0].height = spatial_layers.back().height;
287
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200288 // Update layering settings.
289 video_codec.VP9()->numberOfSpatialLayers =
290 static_cast<unsigned char>(spatial_layers.size());
291 RTC_DCHECK_GE(video_codec.VP9()->numberOfSpatialLayers, 1);
292 RTC_DCHECK_LE(video_codec.VP9()->numberOfSpatialLayers,
293 kMaxSpatialLayers);
294
295 video_codec.VP9()->numberOfTemporalLayers = static_cast<unsigned char>(
296 spatial_layers.back().numberOfTemporalLayers);
297 RTC_DCHECK_GE(video_codec.VP9()->numberOfTemporalLayers, 1);
298 RTC_DCHECK_LE(video_codec.VP9()->numberOfTemporalLayers,
299 kMaxTemporalStreams);
300
Sergey Silkin86684962018-03-28 19:32:37 +0200301 break;
302 }
Danil Chapovalov4005e5a2020-11-25 17:01:22 +0100303 case kVideoCodecAV1:
philipel94375292022-05-13 13:16:44 +0200304 if (SetAv1SvcConfig(video_codec,
305 /*num_temporal_layers=*/
306 streams.back().num_temporal_layers.value_or(1),
307 /*num_spatial_layers=*/
308 std::max<int>(config.spatial_layers.size(), 1))) {
Erik Språngf8654442021-06-01 16:52:24 +0200309 for (size_t i = 0; i < config.spatial_layers.size(); ++i) {
310 video_codec.spatialLayers[i].active = config.spatial_layers[i].active;
311 }
312 } else {
Danil Chapovalov4005e5a2020-11-25 17:01:22 +0100313 RTC_LOG(LS_WARNING) << "Failed to configure svc bitrates for av1.";
314 }
315 break;
Sergey Silkin86684962018-03-28 19:32:37 +0200316 case kVideoCodecH264: {
Niels Möllercf2c8912022-05-18 10:45:46 +0200317 RTC_CHECK(!config.encoder_specific_settings);
318
319 *video_codec.H264() = VideoEncoder::GetDefaultH264Settings();
Johnny Lee1a1c52b2019-02-08 14:25:40 -0500320 video_codec.H264()->numberOfTemporalLayers = static_cast<unsigned char>(
321 streams.back().num_temporal_layers.value_or(
322 video_codec.H264()->numberOfTemporalLayers));
323 RTC_DCHECK_GE(video_codec.H264()->numberOfTemporalLayers, 1);
324 RTC_DCHECK_LE(video_codec.H264()->numberOfTemporalLayers,
325 kMaxTemporalStreams);
Sergey Silkin86684962018-03-28 19:32:37 +0200326 break;
327 }
328 default:
329 // TODO(pbos): Support encoder_settings codec-agnostically.
330 RTC_DCHECK(!config.encoder_specific_settings)
331 << "Encoder-specific settings for codec type not wired up.";
332 break;
333 }
334
Elad Alonc67a4d62019-10-11 16:54:18 +0200335 const absl::optional<DataRate> experimental_min_bitrate =
336 GetExperimentalMinVideoBitrate(video_codec.codecType);
337 if (experimental_min_bitrate) {
338 const int experimental_min_bitrate_kbps =
339 rtc::saturated_cast<int>(experimental_min_bitrate->kbps());
340 video_codec.minBitrate = experimental_min_bitrate_kbps;
341 video_codec.simulcastStream[0].minBitrate = experimental_min_bitrate_kbps;
342 if (video_codec.codecType == kVideoCodecVP9) {
343 video_codec.spatialLayers[0].minBitrate = experimental_min_bitrate_kbps;
344 }
345 }
346
Erik Språng08127a92016-11-16 16:41:30 +0100347 return video_codec;
348}
349
350} // namespace webrtc