/*
 *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10
11#ifndef API_VIDEO_CODECS_VIDEO_CODEC_H_
12#define API_VIDEO_CODECS_VIDEO_CODEC_H_
13
#include <stddef.h>
#include <stdint.h>

#include <string>

#include "absl/strings/string_view.h"
#include "absl/types/optional.h"
#include "api/video/video_bitrate_allocation.h"
#include "api/video/video_codec_type.h"
#include "api/video_codecs/scalability_mode.h"
#include "api/video_codecs/simulcast_stream.h"
#include "api/video_codecs/spatial_layer.h"
#include "rtc_base/system/rtc_export.h"

Niels Möller802506c2018-05-31 10:44:51 +020026
Niels Möllera46bd4b2018-06-08 14:03:44 +020027namespace webrtc {
28
// The VideoCodec class represents an old de facto API, which we're slowly
// migrating away from.
31
// Video codec complexity levels.
// The enumerators carry explicit numeric values; kComplexityNormal is 0 and
// kComplexityLow is the only negative value.
enum class VideoCodecComplexity {
  kComplexityLow = -1,
  kComplexityNormal = 0,
  kComplexityHigh = 1,
  kComplexityHigher = 2,
  kComplexityMax = 3
};
40
// VP8 specific.
// Plain settings struct. None of the data members has a default member
// initializer, so value-initialize the struct (e.g. `VideoCodecVP8{}`) or
// assign every field before reading it.
struct VideoCodecVP8 {
  // Equality is declared here and defined out of line.
  bool operator==(const VideoCodecVP8& other) const;
  // Inequality is the negation of operator==.
  bool operator!=(const VideoCodecVP8& other) const {
    return !(*this == other);
  }
  // Temporary utility method for the transition towards deleting the
  // numberOfTemporalLayers setting (replaced by ScalabilityMode).
  // Stores `n` in numberOfTemporalLayers without any validation.
  void SetNumberOfTemporalLayers(unsigned char n) {
    numberOfTemporalLayers = n;
  }
  unsigned char numberOfTemporalLayers;
  bool denoisingOn;
  bool automaticResizeOn;
  int keyFrameInterval;
};
57
// Inter-layer prediction mode, with an explicit `int` underlying type.
enum class InterLayerPredMode : int {
  kOff = 0,      // Inter-layer prediction is disabled.
  kOn = 1,       // Inter-layer prediction is enabled.
  kOnKeyPic = 2  // Inter-layer prediction is enabled but limited to key frames.
};
63
64// VP9 specific.
65struct VideoCodecVP9 {
66 bool operator==(const VideoCodecVP9& other) const;
67 bool operator!=(const VideoCodecVP9& other) const {
68 return !(*this == other);
69 }
Niels Möller79924572022-07-05 14:22:27 +020070 // Temporary utility method for transition deleting numberOfTemporalLayers
71 // setting (replaced by ScalabilityMode).
72 void SetNumberOfTemporalLayers(unsigned char n) {
73 numberOfTemporalLayers = n;
74 }
Niels Möllera46bd4b2018-06-08 14:03:44 +020075 unsigned char numberOfTemporalLayers;
76 bool denoisingOn;
Niels Möllera46bd4b2018-06-08 14:03:44 +020077 int keyFrameInterval;
78 bool adaptiveQpMode;
79 bool automaticResizeOn;
80 unsigned char numberOfSpatialLayers;
81 bool flexibleMode;
82 InterLayerPredMode interLayerPred;
83};
84
// H264 specific.
// Plain settings struct. None of the data members has a default member
// initializer, so value-initialize the struct (e.g. `VideoCodecH264{}`) or
// assign every field before reading it.
struct VideoCodecH264 {
  // Equality is declared here and defined out of line.
  bool operator==(const VideoCodecH264& other) const;
  // Inequality is the negation of operator==.
  bool operator!=(const VideoCodecH264& other) const {
    return !(*this == other);
  }
  // Temporary utility method for the transition towards deleting the
  // numberOfTemporalLayers setting (replaced by ScalabilityMode).
  // Stores `n` in numberOfTemporalLayers without any validation.
  void SetNumberOfTemporalLayers(unsigned char n) {
    numberOfTemporalLayers = n;
  }
  int keyFrameInterval;
  uint8_t numberOfTemporalLayers;
};
99
100// Translates from name of codec to codec type and vice versa.
Mirko Bonadeiac194142018-10-22 17:08:37 +0200101RTC_EXPORT const char* CodecTypeToPayloadString(VideoCodecType type);
102RTC_EXPORT VideoCodecType PayloadStringToCodecType(const std::string& name);
Niels Möllera46bd4b2018-06-08 14:03:44 +0200103
104union VideoCodecUnion {
105 VideoCodecVP8 VP8;
106 VideoCodecVP9 VP9;
107 VideoCodecH264 H264;
108};
109
// Codec operating mode: regular realtime video or screen sharing.
enum class VideoCodecMode { kRealtimeVideo, kScreensharing };
Niels Möllera46bd4b2018-06-08 14:03:44 +0200111
112// Common video codec properties
Mirko Bonadei276827c2018-10-16 14:13:50 +0200113class RTC_EXPORT VideoCodec {
Niels Möllera46bd4b2018-06-08 14:03:44 +0200114 public:
115 VideoCodec();
116
Danil Chapovalov9f4859e2020-10-16 17:45:41 +0200117 // Scalability mode as described in
118 // https://www.w3.org/TR/webrtc-svc/#scalabilitymodes*
Niels Möller79d566b2022-04-29 11:03:13 +0200119 absl::optional<ScalabilityMode> GetScalabilityMode() const {
120 return scalability_mode_;
Danil Chapovalov9f4859e2020-10-16 17:45:41 +0200121 }
Niels Möller79d566b2022-04-29 11:03:13 +0200122 void SetScalabilityMode(ScalabilityMode scalability_mode) {
123 scalability_mode_ = scalability_mode;
124 }
125 void UnsetScalabilityMode() { scalability_mode_ = absl::nullopt; }
Danil Chapovalov9f4859e2020-10-16 17:45:41 +0200126
“Michael3147e292022-02-19 16:48:50 -0600127 VideoCodecComplexity GetVideoEncoderComplexity() const;
128 void SetVideoEncoderComplexity(VideoCodecComplexity complexity_setting);
129
Niels Möller807328f2022-05-12 16:16:39 +0200130 bool GetFrameDropEnabled() const;
131 void SetFrameDropEnabled(bool enabled);
132
Niels Möllera46bd4b2018-06-08 14:03:44 +0200133 // Public variables. TODO(hta): Make them private with accessors.
134 VideoCodecType codecType;
Niels Möllera46bd4b2018-06-08 14:03:44 +0200135
136 // TODO(nisse): Change to int, for consistency.
137 uint16_t width;
138 uint16_t height;
139
Jonas Olssona4d87372019-07-05 19:08:33 +0200140 unsigned int startBitrate; // kilobits/sec.
141 unsigned int maxBitrate; // kilobits/sec.
142 unsigned int minBitrate; // kilobits/sec.
Niels Möllera46bd4b2018-06-08 14:03:44 +0200143
144 uint32_t maxFramerate;
145
146 // This enables/disables encoding and sending when there aren't multiple
147 // simulcast streams,by allocating 0 bitrate if inactive.
148 bool active;
149
150 unsigned int qpMax;
151 unsigned char numberOfSimulcastStreams;
Niels Möllerc0a9f352022-05-20 13:38:49 +0200152 SimulcastStream simulcastStream[kMaxSimulcastStreams];
Niels Möllera46bd4b2018-06-08 14:03:44 +0200153 SpatialLayer spatialLayers[kMaxSpatialLayers];
154
155 VideoCodecMode mode;
156 bool expect_encode_from_texture;
157
158 // Timing frames configuration. There is delay of delay_ms between two
159 // consequent timing frames, excluding outliers. Frame is always made a
160 // timing frame if it's at least outlier_ratio in percent of "ideal" average
161 // frame given bitrate and framerate, i.e. if it's bigger than
162 // |outlier_ratio / 100.0 * bitrate_bps / fps| in bits. This way, timing
163 // frames will not be sent too often usually. Yet large frames will always
164 // have timing information for debug purposes because they are more likely to
165 // cause extra delays.
166 struct TimingFrameTriggerThresholds {
167 int64_t delay_ms;
168 uint16_t outlier_ratio_percent;
169 } timing_frame_thresholds;
170
Florent Castellid3511012020-08-04 11:40:23 +0200171 // Legacy Google conference mode flag for simulcast screenshare
172 bool legacy_conference_mode;
173
Niels Möllera46bd4b2018-06-08 14:03:44 +0200174 bool operator==(const VideoCodec& other) const = delete;
175 bool operator!=(const VideoCodec& other) const = delete;
176
177 // Accessors for codec specific information.
178 // There is a const version of each that returns a reference,
179 // and a non-const version that returns a pointer, in order
180 // to allow modification of the parameters.
181 VideoCodecVP8* VP8();
182 const VideoCodecVP8& VP8() const;
183 VideoCodecVP9* VP9();
184 const VideoCodecVP9& VP9() const;
185 VideoCodecH264* H264();
186 const VideoCodecH264& H264() const;
187
188 private:
189 // TODO(hta): Consider replacing the union with a pointer type.
190 // This will allow removing the VideoCodec* types from this file.
191 VideoCodecUnion codec_specific_;
Niels Möller79d566b2022-04-29 11:03:13 +0200192 absl::optional<ScalabilityMode> scalability_mode_;
“Michael3147e292022-02-19 16:48:50 -0600193 // 'complexity_' indicates the CPU capability of the client. It's used to
194 // determine encoder CPU complexity (e.g., cpu_used for VP8, VP9. and AV1).
Erik Språng4da317f2022-05-17 13:51:01 +0200195 VideoCodecComplexity complexity_;
Niels Möllerbe2fb412022-05-17 15:39:41 +0200196 bool frame_drop_enabled_ = false;
Niels Möllera46bd4b2018-06-08 14:03:44 +0200197};
198
199} // namespace webrtc
Niels Möller802506c2018-05-31 10:44:51 +0200200#endif // API_VIDEO_CODECS_VIDEO_CODEC_H_