blob: 1cec6d2aeaaccd7c8f431e14c4e809157beb3cad [file] [log] [blame]
Erik Språng08127a92016-11-16 16:41:30 +01001/*
2 * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/video_coding/include/video_codec_initializer.h"
Erik Språng08127a92016-11-16 16:41:30 +010012
Yves Gerey3e707812018-11-28 16:47:49 +010013#include <stdint.h>
14#include <string.h>
Jonas Olssona4d87372019-07-05 19:08:33 +020015
Yves Gerey3e707812018-11-28 16:47:49 +010016#include <algorithm>
17
18#include "absl/types/optional.h"
Mirko Bonadeid9708072019-01-25 20:26:48 +010019#include "api/scoped_refptr.h"
Elad Alonc67a4d62019-10-11 16:54:18 +020020#include "api/units/data_rate.h"
Yves Gerey3e707812018-11-28 16:47:49 +010021#include "api/video/video_bitrate_allocation.h"
Anders Carlssondd8c1652018-01-30 10:32:13 +010022#include "api/video_codecs/video_encoder.h"
Danil Chapovalov4005e5a2020-11-25 17:01:22 +010023#include "modules/video_coding/codecs/av1/av1_svc_config.h"
Sergey Silkin86684962018-03-28 19:32:37 +020024#include "modules/video_coding/codecs/vp9/svc_config.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "modules/video_coding/include/video_coding_defines.h"
Yves Gerey3e707812018-11-28 16:47:49 +010026#include "rtc_base/checks.h"
Elad Alonc67a4d62019-10-11 16:54:18 +020027#include "rtc_base/experiments/min_video_bitrate_experiment.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020028#include "rtc_base/logging.h"
Elad Alonc67a4d62019-10-11 16:54:18 +020029#include "rtc_base/numerics/safe_conversions.h"
Erik Språng08127a92016-11-16 16:41:30 +010030
31namespace webrtc {
32
Jiawei Ouc2ebe212018-11-08 10:02:56 -080033bool VideoCodecInitializer::SetupCodec(const VideoEncoderConfig& config,
34 const std::vector<VideoStream>& streams,
35 VideoCodec* codec) {
Niels Möller259a4972018-04-05 15:36:51 +020036 if (config.codec_type == kVideoCodecMultiplex) {
Niels Möller24a842a2018-03-22 08:52:50 +010037 VideoEncoderConfig associated_config = config.Copy();
38 associated_config.codec_type = kVideoCodecVP9;
Jiawei Ouc2ebe212018-11-08 10:02:56 -080039 if (!SetupCodec(associated_config, streams, codec)) {
Emircan Uysaler0a375472017-12-11 12:21:02 +053040 RTC_LOG(LS_ERROR) << "Failed to create stereo encoder configuration.";
41 return false;
42 }
Emircan Uysalerd7ae3c32018-01-25 13:01:09 -080043 codec->codecType = kVideoCodecMultiplex;
Emircan Uysaler0a375472017-12-11 12:21:02 +053044 return true;
45 }
46
Yves Gerey665174f2018-06-19 15:03:05 +020047 *codec = VideoEncoderConfigToVideoCodec(config, streams);
Erik Språng08127a92016-11-16 16:41:30 +010048 return true;
49}
50
Erik Språng08127a92016-11-16 16:41:30 +010051// TODO(sprang): Split this up and separate the codec specific parts.
52VideoCodec VideoCodecInitializer::VideoEncoderConfigToVideoCodec(
53 const VideoEncoderConfig& config,
Niels Möllerf1338562018-04-26 09:51:47 +020054 const std::vector<VideoStream>& streams) {
Erik Språng08127a92016-11-16 16:41:30 +010055 static const int kEncoderMinBitrateKbps = 30;
56 RTC_DCHECK(!streams.empty());
57 RTC_DCHECK_GE(config.min_transmit_bitrate_bps, 0);
58
59 VideoCodec video_codec;
Niels Möller259a4972018-04-05 15:36:51 +020060 video_codec.codecType = config.codec_type;
Erik Språng08127a92016-11-16 16:41:30 +010061
62 switch (config.content_type) {
63 case VideoEncoderConfig::ContentType::kRealtimeVideo:
Niels Möllere3cf3d02018-06-13 11:52:16 +020064 video_codec.mode = VideoCodecMode::kRealtimeVideo;
Erik Språng08127a92016-11-16 16:41:30 +010065 break;
66 case VideoEncoderConfig::ContentType::kScreen:
Niels Möllere3cf3d02018-06-13 11:52:16 +020067 video_codec.mode = VideoCodecMode::kScreensharing;
Erik Språng08127a92016-11-16 16:41:30 +010068 break;
69 }
70
Florent Castellid3511012020-08-04 11:40:23 +020071 video_codec.legacy_conference_mode =
72 config.content_type == VideoEncoderConfig::ContentType::kScreen &&
73 config.legacy_conference_mode;
74
Erik Språng08127a92016-11-16 16:41:30 +010075 video_codec.numberOfSimulcastStreams =
76 static_cast<unsigned char>(streams.size());
77 video_codec.minBitrate = streams[0].min_bitrate_bps / 1000;
Seth Hampson46e31ba2018-01-18 10:39:54 -080078 bool codec_active = false;
Artem Titovdcd7fc72021-08-09 13:02:57 +020079 // Active configuration might not be fully copied to `streams` for SVC yet.
80 // Therefore the `config` is checked here.
Ilya Nikolaevskiy7a824672020-06-18 19:16:53 +020081 for (const VideoStream& stream : config.simulcast_layers) {
Seth Hampson46e31ba2018-01-18 10:39:54 -080082 if (stream.active) {
83 codec_active = true;
84 break;
85 }
86 }
87 // Set active for the entire video codec for the non simulcast case.
88 video_codec.active = codec_active;
Erik Språng08127a92016-11-16 16:41:30 +010089 if (video_codec.minBitrate < kEncoderMinBitrateKbps)
90 video_codec.minBitrate = kEncoderMinBitrateKbps;
ilnik04f4d122017-06-19 07:18:55 -070091 video_codec.timing_frame_thresholds = {kDefaultTimingFramesDelayMs,
92 kDefaultOutlierFrameSizePercent};
kwiberg352444f2016-11-28 15:58:53 -080093 RTC_DCHECK_LE(streams.size(), kMaxSimulcastStreams);
Sergey Silkin86684962018-03-28 19:32:37 +020094
Florent Castelli907dc802019-12-06 15:03:19 +010095 int max_framerate = 0;
96
Niels Möller79d566b2022-04-29 11:03:13 +020097 absl::optional<ScalabilityMode> scalability_mode =
98 streams[0].scalability_mode;
Erik Språng08127a92016-11-16 16:41:30 +010099 for (size_t i = 0; i < streams.size(); ++i) {
Niels Möller5b69aa62020-08-14 15:32:14 +0200100 SpatialLayer* sim_stream = &video_codec.simulcastStream[i];
kwibergaf476c72016-11-28 15:21:39 -0800101 RTC_DCHECK_GT(streams[i].width, 0);
102 RTC_DCHECK_GT(streams[i].height, 0);
Erik Språng08127a92016-11-16 16:41:30 +0100103 RTC_DCHECK_GT(streams[i].max_framerate, 0);
Erik Språng08127a92016-11-16 16:41:30 +0100104 RTC_DCHECK_GE(streams[i].min_bitrate_bps, 0);
105 RTC_DCHECK_GE(streams[i].target_bitrate_bps, streams[i].min_bitrate_bps);
106 RTC_DCHECK_GE(streams[i].max_bitrate_bps, streams[i].target_bitrate_bps);
107 RTC_DCHECK_GE(streams[i].max_qp, 0);
108
109 sim_stream->width = static_cast<uint16_t>(streams[i].width);
110 sim_stream->height = static_cast<uint16_t>(streams[i].height);
Sergey Silkin1946a3f2018-08-22 11:42:16 +0200111 sim_stream->maxFramerate = streams[i].max_framerate;
Erik Språng08127a92016-11-16 16:41:30 +0100112 sim_stream->minBitrate = streams[i].min_bitrate_bps / 1000;
113 sim_stream->targetBitrate = streams[i].target_bitrate_bps / 1000;
114 sim_stream->maxBitrate = streams[i].max_bitrate_bps / 1000;
115 sim_stream->qpMax = streams[i].max_qp;
Sergey Silkina796a7e2018-03-01 15:11:29 +0100116 sim_stream->numberOfTemporalLayers =
117 static_cast<unsigned char>(streams[i].num_temporal_layers.value_or(1));
Seth Hampson46e31ba2018-01-18 10:39:54 -0800118 sim_stream->active = streams[i].active;
Erik Språng08127a92016-11-16 16:41:30 +0100119
120 video_codec.width =
Danil Chapovalov350531e2018-06-08 11:04:04 +0000121 std::max(video_codec.width, static_cast<uint16_t>(streams[i].width));
Erik Språng08127a92016-11-16 16:41:30 +0100122 video_codec.height =
Danil Chapovalov350531e2018-06-08 11:04:04 +0000123 std::max(video_codec.height, static_cast<uint16_t>(streams[i].height));
Erik Språng08127a92016-11-16 16:41:30 +0100124 video_codec.minBitrate =
125 std::min(static_cast<uint16_t>(video_codec.minBitrate),
126 static_cast<uint16_t>(streams[i].min_bitrate_bps / 1000));
127 video_codec.maxBitrate += streams[i].max_bitrate_bps / 1000;
128 video_codec.qpMax = std::max(video_codec.qpMax,
129 static_cast<unsigned int>(streams[i].max_qp));
Florent Castelli907dc802019-12-06 15:03:19 +0100130 max_framerate = std::max(max_framerate, streams[i].max_framerate);
philipel87e99092020-11-18 11:52:04 +0100131
132 if (streams[0].scalability_mode != streams[i].scalability_mode) {
133 RTC_LOG(LS_WARNING) << "Inconsistent scalability modes configured.";
134 scalability_mode.reset();
135 }
136 }
137
138 if (scalability_mode.has_value()) {
139 video_codec.SetScalabilityMode(*scalability_mode);
Erik Språng08127a92016-11-16 16:41:30 +0100140 }
141
142 if (video_codec.maxBitrate == 0) {
143 // Unset max bitrate -> cap to one bit per pixel.
144 video_codec.maxBitrate =
145 (video_codec.width * video_codec.height * video_codec.maxFramerate) /
146 1000;
147 }
148 if (video_codec.maxBitrate < kEncoderMinBitrateKbps)
149 video_codec.maxBitrate = kEncoderMinBitrateKbps;
150
Florent Castelli907dc802019-12-06 15:03:19 +0100151 video_codec.maxFramerate = max_framerate;
Per Kjellanderf86cf4c2020-12-30 15:27:35 +0100152 video_codec.spatialLayers[0] = {0};
153 video_codec.spatialLayers[0].width = video_codec.width;
154 video_codec.spatialLayers[0].height = video_codec.height;
155 video_codec.spatialLayers[0].maxFramerate = max_framerate;
156 video_codec.spatialLayers[0].numberOfTemporalLayers =
157 streams[0].num_temporal_layers.value_or(1);
Sergey Silkin86684962018-03-28 19:32:37 +0200158
159 // Set codec specific options
160 if (config.encoder_specific_settings)
161 config.encoder_specific_settings->FillEncoderSpecificSettings(&video_codec);
162
163 switch (video_codec.codecType) {
164 case kVideoCodecVP8: {
165 if (!config.encoder_specific_settings) {
166 *video_codec.VP8() = VideoEncoder::GetDefaultVp8Settings();
167 }
168
169 video_codec.VP8()->numberOfTemporalLayers = static_cast<unsigned char>(
170 streams.back().num_temporal_layers.value_or(
171 video_codec.VP8()->numberOfTemporalLayers));
172 RTC_DCHECK_GE(video_codec.VP8()->numberOfTemporalLayers, 1);
173 RTC_DCHECK_LE(video_codec.VP8()->numberOfTemporalLayers,
174 kMaxTemporalStreams);
175
Sergey Silkin86684962018-03-28 19:32:37 +0200176 break;
177 }
178 case kVideoCodecVP9: {
Ilya Nikolaevskiy72859e52020-02-05 17:31:00 +0100179 // Force the first stream to always be active.
180 video_codec.simulcastStream[0].active = codec_active;
181
Sergey Silkin86684962018-03-28 19:32:37 +0200182 if (!config.encoder_specific_settings) {
183 *video_codec.VP9() = VideoEncoder::GetDefaultVp9Settings();
184 }
185
186 video_codec.VP9()->numberOfTemporalLayers = static_cast<unsigned char>(
187 streams.back().num_temporal_layers.value_or(
188 video_codec.VP9()->numberOfTemporalLayers));
189 RTC_DCHECK_GE(video_codec.VP9()->numberOfTemporalLayers, 1);
190 RTC_DCHECK_LE(video_codec.VP9()->numberOfTemporalLayers,
191 kMaxTemporalStreams);
192
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200193 RTC_DCHECK(config.spatial_layers.empty() ||
194 config.spatial_layers.size() ==
195 video_codec.VP9()->numberOfSpatialLayers);
196
197 std::vector<SpatialLayer> spatial_layers;
198 if (!config.spatial_layers.empty()) {
199 // Layering is set explicitly.
200 spatial_layers = config.spatial_layers;
Sergey Silkin86684962018-03-28 19:32:37 +0200201 } else {
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200202 size_t first_active_layer = 0;
Ilya Nikolaevskiy03d90962020-02-11 12:50:38 +0100203 for (size_t spatial_idx = 0;
204 spatial_idx < config.simulcast_layers.size(); ++spatial_idx) {
205 if (config.simulcast_layers[spatial_idx].active) {
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200206 first_active_layer = spatial_idx;
Ilya Nikolaevskiy03d90962020-02-11 12:50:38 +0100207 break;
208 }
209 }
210
Sergey Silkin1946a3f2018-08-22 11:42:16 +0200211 spatial_layers = GetSvcConfig(
212 video_codec.width, video_codec.height, video_codec.maxFramerate,
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200213 first_active_layer, video_codec.VP9()->numberOfSpatialLayers,
Sergey Silkin1946a3f2018-08-22 11:42:16 +0200214 video_codec.VP9()->numberOfTemporalLayers,
215 video_codec.mode == VideoCodecMode::kScreensharing);
Sergey Silkin86684962018-03-28 19:32:37 +0200216
Sergey Silkin33120922018-11-28 13:32:13 +0100217 // If there was no request for spatial layering, don't limit bitrate
218 // of single spatial layer.
219 const bool no_spatial_layering =
220 video_codec.VP9()->numberOfSpatialLayers <= 1;
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200221 if (no_spatial_layering) {
222 // Use codec's bitrate limits.
223 spatial_layers.back().minBitrate = video_codec.minBitrate;
Ilya Nikolaevskiy9ef5e052019-03-05 10:08:35 +0100224 spatial_layers.back().targetBitrate = video_codec.maxBitrate;
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200225 spatial_layers.back().maxBitrate = video_codec.maxBitrate;
Sergey Silkin86684962018-03-28 19:32:37 +0200226 }
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100227
Ilya Nikolaevskiy7a824672020-06-18 19:16:53 +0200228 for (size_t spatial_idx = first_active_layer;
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100229 spatial_idx < config.simulcast_layers.size() &&
Ilya Nikolaevskiya945cda2020-09-22 15:55:23 +0200230 spatial_idx < spatial_layers.size() + first_active_layer;
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100231 ++spatial_idx) {
Ilya Nikolaevskiy39fb8172020-04-14 10:28:19 +0200232 spatial_layers[spatial_idx - first_active_layer].active =
Sergey Silkin8b9b5f92018-12-10 09:28:53 +0100233 config.simulcast_layers[spatial_idx].active;
234 }
Sergey Silkin86684962018-03-28 19:32:37 +0200235 }
236
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200237 RTC_DCHECK(!spatial_layers.empty());
238 for (size_t i = 0; i < spatial_layers.size(); ++i) {
239 video_codec.spatialLayers[i] = spatial_layers[i];
240 }
241
Ilya Nikolaevskiy09eb6e22020-06-05 12:36:32 +0200242 // The top spatial layer dimensions may not be equal to the input
243 // resolution because of the rounding or explicit configuration.
244 // This difference must be propagated to the stream configuration.
245 video_codec.width = spatial_layers.back().width;
246 video_codec.height = spatial_layers.back().height;
247 video_codec.simulcastStream[0].width = spatial_layers.back().width;
248 video_codec.simulcastStream[0].height = spatial_layers.back().height;
249
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200250 // Update layering settings.
251 video_codec.VP9()->numberOfSpatialLayers =
252 static_cast<unsigned char>(spatial_layers.size());
253 RTC_DCHECK_GE(video_codec.VP9()->numberOfSpatialLayers, 1);
254 RTC_DCHECK_LE(video_codec.VP9()->numberOfSpatialLayers,
255 kMaxSpatialLayers);
256
257 video_codec.VP9()->numberOfTemporalLayers = static_cast<unsigned char>(
258 spatial_layers.back().numberOfTemporalLayers);
259 RTC_DCHECK_GE(video_codec.VP9()->numberOfTemporalLayers, 1);
260 RTC_DCHECK_LE(video_codec.VP9()->numberOfTemporalLayers,
261 kMaxTemporalStreams);
262
Sergey Silkin86684962018-03-28 19:32:37 +0200263 break;
264 }
Danil Chapovalov4005e5a2020-11-25 17:01:22 +0100265 case kVideoCodecAV1:
philipel94375292022-05-13 13:16:44 +0200266 if (SetAv1SvcConfig(video_codec,
267 /*num_temporal_layers=*/
268 streams.back().num_temporal_layers.value_or(1),
269 /*num_spatial_layers=*/
270 std::max<int>(config.spatial_layers.size(), 1))) {
Erik Språngf8654442021-06-01 16:52:24 +0200271 for (size_t i = 0; i < config.spatial_layers.size(); ++i) {
272 video_codec.spatialLayers[i].active = config.spatial_layers[i].active;
273 }
274 } else {
Danil Chapovalov4005e5a2020-11-25 17:01:22 +0100275 RTC_LOG(LS_WARNING) << "Failed to configure svc bitrates for av1.";
276 }
277 break;
Sergey Silkin86684962018-03-28 19:32:37 +0200278 case kVideoCodecH264: {
279 if (!config.encoder_specific_settings)
280 *video_codec.H264() = VideoEncoder::GetDefaultH264Settings();
Johnny Lee1a1c52b2019-02-08 14:25:40 -0500281 video_codec.H264()->numberOfTemporalLayers = static_cast<unsigned char>(
282 streams.back().num_temporal_layers.value_or(
283 video_codec.H264()->numberOfTemporalLayers));
284 RTC_DCHECK_GE(video_codec.H264()->numberOfTemporalLayers, 1);
285 RTC_DCHECK_LE(video_codec.H264()->numberOfTemporalLayers,
286 kMaxTemporalStreams);
Sergey Silkin86684962018-03-28 19:32:37 +0200287 break;
288 }
289 default:
290 // TODO(pbos): Support encoder_settings codec-agnostically.
291 RTC_DCHECK(!config.encoder_specific_settings)
292 << "Encoder-specific settings for codec type not wired up.";
293 break;
294 }
295
Elad Alonc67a4d62019-10-11 16:54:18 +0200296 const absl::optional<DataRate> experimental_min_bitrate =
297 GetExperimentalMinVideoBitrate(video_codec.codecType);
298 if (experimental_min_bitrate) {
299 const int experimental_min_bitrate_kbps =
300 rtc::saturated_cast<int>(experimental_min_bitrate->kbps());
301 video_codec.minBitrate = experimental_min_bitrate_kbps;
302 video_codec.simulcastStream[0].minBitrate = experimental_min_bitrate_kbps;
303 if (video_codec.codecType == kVideoCodecVP9) {
304 video_codec.spatialLayers[0].minBitrate = experimental_min_bitrate_kbps;
305 }
306 }
307
Erik Språng08127a92016-11-16 16:41:30 +0100308 return video_codec;
309}
310
311} // namespace webrtc