/*
 *  Copyright 2012 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

// This file contains interfaces for MediaStream, MediaTrack and MediaSource.
// These interfaces are used for implementing MediaStream and MediaTrack as
// defined in http://dev.w3.org/2011/webrtc/editor/webrtc.html#stream-api. These
// interfaces must be used only with PeerConnection.

#ifndef API_MEDIA_STREAM_INTERFACE_H_
#define API_MEDIA_STREAM_INTERFACE_H_

#include <stddef.h>
#include <stdint.h>

#include <string>
#include <vector>

#include "absl/types/optional.h"
#include "api/audio_options.h"
#include "api/scoped_refptr.h"
#include "api/video/recordable_encoded_frame.h"
#include "api/video/video_frame.h"
#include "api/video/video_sink_interface.h"
#include "api/video/video_source_interface.h"
#include "api/video_track_source_constraints.h"
#include "modules/audio_processing/include/audio_processing_statistics.h"
#include "rtc_base/ref_count.h"
#include "rtc_base/system/rtc_export.h"

namespace webrtc {

// Generic observer interface.
class ObserverInterface {
 public:
  // Callback that every concrete observer must implement.
  virtual void OnChanged() = 0;

 protected:
  // Protected so that an observer cannot be deleted through a pointer to this
  // interface.
  virtual ~ObserverInterface() = default;
};

47class NotifierInterface {
48 public:
49 virtual void RegisterObserver(ObserverInterface* observer) = 0;
50 virtual void UnregisterObserver(ObserverInterface* observer) = 0;
51
52 virtual ~NotifierInterface() {}
53};
54
deadbeefb10f32f2017-02-08 01:38:21 -080055// Base class for sources. A MediaStreamTrack has an underlying source that
56// provides media. A source can be shared by multiple tracks.
Mirko Bonadei66e76792019-04-02 11:33:59 +020057class RTC_EXPORT MediaSourceInterface : public rtc::RefCountInterface,
58 public NotifierInterface {
henrike@webrtc.org28e20752013-07-10 00:45:36 +000059 public:
Yves Gerey665174f2018-06-19 15:03:05 +020060 enum SourceState { kInitializing, kLive, kEnded, kMuted };
henrike@webrtc.org28e20752013-07-10 00:45:36 +000061
62 virtual SourceState state() const = 0;
63
tommi6eca7e32015-12-15 04:27:11 -080064 virtual bool remote() const = 0;
65
henrike@webrtc.org28e20752013-07-10 00:45:36 +000066 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +010067 ~MediaSourceInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36 +000068};
69
deadbeefb10f32f2017-02-08 01:38:21 -080070// C++ version of MediaStreamTrack.
71// See: https://www.w3.org/TR/mediacapture-streams/#mediastreamtrack
Mirko Bonadei66e76792019-04-02 11:33:59 +020072class RTC_EXPORT MediaStreamTrackInterface : public rtc::RefCountInterface,
73 public NotifierInterface {
henrike@webrtc.org28e20752013-07-10 00:45:36 +000074 public:
75 enum TrackState {
perkjc8f952d2016-03-23 00:33:56 -070076 kLive,
77 kEnded,
henrike@webrtc.org28e20752013-07-10 00:45:36 +000078 };
79
Niels Möller6dcd4dc2019-08-26 10:45:28 +020080 static const char* const kAudioKind;
81 static const char* const kVideoKind;
deadbeeffac06552015-11-25 11:26:01 -080082
nissefcc640f2016-04-01 01:10:42 -070083 // The kind() method must return kAudioKind only if the object is a
84 // subclass of AudioTrackInterface, and kVideoKind only if the
85 // object is a subclass of VideoTrackInterface. It is typically used
86 // to protect a static_cast<> to the corresponding subclass.
henrike@webrtc.org28e20752013-07-10 00:45:36 +000087 virtual std::string kind() const = 0;
deadbeefb10f32f2017-02-08 01:38:21 -080088
89 // Track identifier.
henrike@webrtc.org28e20752013-07-10 00:45:36 +000090 virtual std::string id() const = 0;
deadbeefb10f32f2017-02-08 01:38:21 -080091
92 // A disabled track will produce silence (if audio) or black frames (if
93 // video). Can be disabled and re-enabled.
henrike@webrtc.org28e20752013-07-10 00:45:36 +000094 virtual bool enabled() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +000095 virtual bool set_enabled(bool enable) = 0;
fischman@webrtc.org32001ef2013-08-12 23:26:21 +000096
deadbeefb10f32f2017-02-08 01:38:21 -080097 // Live or ended. A track will never be live again after becoming ended.
98 virtual TrackState state() const = 0;
99
fischman@webrtc.org32001ef2013-08-12 23:26:21 +0000100 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100101 ~MediaStreamTrackInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000102};
103
deadbeefb10f32f2017-02-08 01:38:21 -0800104// VideoTrackSourceInterface is a reference counted source used for
105// VideoTracks. The same source can be used by multiple VideoTracks.
perkj773be362017-07-31 23:22:01 -0700106// VideoTrackSourceInterface is designed to be invoked on the signaling thread
107// except for rtc::VideoSourceInterface<VideoFrame> methods that will be invoked
108// on the worker thread via a VideoTrack. A custom implementation of a source
109// can inherit AdaptedVideoTrackSource instead of directly implementing this
110// interface.
Yves Gerey665174f2018-06-19 15:03:05 +0200111class VideoTrackSourceInterface : public MediaSourceInterface,
112 public rtc::VideoSourceInterface<VideoFrame> {
perkja3ede6c2016-03-08 01:27:48 +0100113 public:
nissefcc640f2016-04-01 01:10:42 -0700114 struct Stats {
115 // Original size of captured frame, before video adaptation.
116 int input_width;
117 int input_height;
118 };
perkja3ede6c2016-03-08 01:27:48 +0100119
perkj0d3eef22016-03-09 02:39:17 +0100120 // Indicates that parameters suitable for screencasts should be automatically
121 // applied to RtpSenders.
122 // TODO(perkj): Remove these once all known applications have moved to
deadbeefb10f32f2017-02-08 01:38:21 -0800123 // explicitly setting suitable parameters for screencasts and don't need this
perkj0d3eef22016-03-09 02:39:17 +0100124 // implicit behavior.
125 virtual bool is_screencast() const = 0;
126
Perc0d31e92016-03-31 17:23:39 +0200127 // Indicates that the encoder should denoise video before encoding it.
128 // If it is not set, the default configuration is used which is different
129 // depending on video codec.
perkj0d3eef22016-03-09 02:39:17 +0100130 // TODO(perkj): Remove this once denoising is done by the source, and not by
131 // the encoder.
Danil Chapovalov0bc58cf2018-06-21 13:32:56 +0200132 virtual absl::optional<bool> needs_denoising() const = 0;
perkja3ede6c2016-03-08 01:27:48 +0100133
deadbeefb10f32f2017-02-08 01:38:21 -0800134 // Returns false if no stats are available, e.g, for a remote source, or a
135 // source which has not seen its first frame yet.
136 //
137 // Implementation should avoid blocking.
nissefcc640f2016-04-01 01:10:42 -0700138 virtual bool GetStats(Stats* stats) = 0;
139
Markus Handell9982efa2019-11-21 11:56:50 +0100140 // Returns true if encoded output can be enabled in the source.
Markus Handell6efc14b2020-05-05 20:11:13 +0200141 virtual bool SupportsEncodedOutput() const = 0;
Markus Handell9982efa2019-11-21 11:56:50 +0100142
143 // Reliably cause a key frame to be generated in encoded output.
144 // TODO(bugs.webrtc.org/11115): find optimal naming.
Markus Handell6efc14b2020-05-05 20:11:13 +0200145 virtual void GenerateKeyFrame() = 0;
Markus Handell9982efa2019-11-21 11:56:50 +0100146
147 // Add an encoded video sink to the source and additionally cause
148 // a key frame to be generated from the source. The sink will be
149 // invoked from a decoder queue.
Markus Handell9982efa2019-11-21 11:56:50 +0100150 virtual void AddEncodedSink(
Markus Handell6efc14b2020-05-05 20:11:13 +0200151 rtc::VideoSinkInterface<RecordableEncodedFrame>* sink) = 0;
Markus Handell9982efa2019-11-21 11:56:50 +0100152
153 // Removes an encoded video sink from the source.
Markus Handell9982efa2019-11-21 11:56:50 +0100154 virtual void RemoveEncodedSink(
Markus Handell6efc14b2020-05-05 20:11:13 +0200155 rtc::VideoSinkInterface<RecordableEncodedFrame>* sink) = 0;
Markus Handell9982efa2019-11-21 11:56:50 +0100156
Markus Handell6fa9e682021-10-13 22:50:53 +0200157 // Notify about constraints set on the source. The information eventually gets
158 // routed to attached sinks via VideoSinkInterface<>::OnConstraintsChanged.
159 // The call is expected to happen on the network thread.
160 // TODO(crbug/1255737): make pure virtual once downstream project adapts.
161 virtual void ProcessConstraints(
162 const webrtc::VideoTrackSourceConstraints& constraints) {}
163
perkja3ede6c2016-03-08 01:27:48 +0100164 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100165 ~VideoTrackSourceInterface() override = default;
perkja3ede6c2016-03-08 01:27:48 +0100166};
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000167
perkj773be362017-07-31 23:22:01 -0700168// VideoTrackInterface is designed to be invoked on the signaling thread except
169// for rtc::VideoSourceInterface<VideoFrame> methods that must be invoked
170// on the worker thread.
171// PeerConnectionFactory::CreateVideoTrack can be used for creating a VideoTrack
172// that ensures thread safety and that all methods are called on the right
173// thread.
Mirko Bonadei35214fc2019-09-23 14:54:28 +0200174class RTC_EXPORT VideoTrackInterface
175 : public MediaStreamTrackInterface,
176 public rtc::VideoSourceInterface<VideoFrame> {
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000177 public:
pbos5214a0a2016-12-16 15:39:11 -0800178 // Video track content hint, used to override the source is_screencast
179 // property.
Harald Alvestrandc19ab072018-06-18 08:53:10 +0200180 // See https://crbug.com/653531 and https://w3c.github.io/mst-content-hint.
181 enum class ContentHint { kNone, kFluid, kDetailed, kText };
pbos5214a0a2016-12-16 15:39:11 -0800182
mbonadei539d1042017-07-10 02:40:49 -0700183 // Register a video sink for this track. Used to connect the track to the
184 // underlying video engine.
185 void AddOrUpdateSink(rtc::VideoSinkInterface<VideoFrame>* sink,
186 const rtc::VideoSinkWants& wants) override {}
187 void RemoveSink(rtc::VideoSinkInterface<VideoFrame>* sink) override {}
188
perkja3ede6c2016-03-08 01:27:48 +0100189 virtual VideoTrackSourceInterface* GetSource() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000190
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100191 virtual ContentHint content_hint() const;
pbos5214a0a2016-12-16 15:39:11 -0800192 virtual void set_content_hint(ContentHint hint) {}
193
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000194 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100195 ~VideoTrackInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000196};
197
tommi6eca7e32015-12-15 04:27:11 -0800198// Interface for receiving audio data from a AudioTrack.
199class AudioTrackSinkInterface {
200 public:
201 virtual void OnData(const void* audio_data,
202 int bits_per_sample,
203 int sample_rate,
Peter Kasting69558702016-01-12 16:26:35 -0800204 size_t number_of_channels,
Minyue Li99d6d812020-01-29 10:25:12 +0100205 size_t number_of_frames) {
Artem Titovd3251962021-11-15 16:57:07 +0100206 RTC_DCHECK_NOTREACHED() << "This method must be overridden, or not used.";
Minyue Li99d6d812020-01-29 10:25:12 +0100207 }
208
Artem Titov0e61fdd2021-07-25 21:50:14 +0200209 // In this method, `absolute_capture_timestamp_ms`, when available, is
Minyue Li99d6d812020-01-29 10:25:12 +0100210 // supposed to deliver the timestamp when this audio frame was originally
211 // captured. This timestamp MUST be based on the same clock as
212 // rtc::TimeMillis().
213 virtual void OnData(const void* audio_data,
214 int bits_per_sample,
215 int sample_rate,
216 size_t number_of_channels,
217 size_t number_of_frames,
218 absl::optional<int64_t> absolute_capture_timestamp_ms) {
219 // TODO(bugs.webrtc.org/10739): Deprecate the old OnData and make this one
220 // pure virtual.
221 return OnData(audio_data, bits_per_sample, sample_rate, number_of_channels,
222 number_of_frames);
223 }
tommi6eca7e32015-12-15 04:27:11 -0800224
Gustaf Ullberg46ea5d72020-12-15 15:12:16 +0100225 // Returns the number of channels encoded by the sink. This can be less than
226 // the number_of_channels if down-mixing occur. A value of -1 means an unknown
227 // number.
228 virtual int NumPreferredChannels() const { return -1; }
229
tommi6eca7e32015-12-15 04:27:11 -0800230 protected:
231 virtual ~AudioTrackSinkInterface() {}
232};
233
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000234// AudioSourceInterface is a reference counted source used for AudioTracks.
deadbeefb10f32f2017-02-08 01:38:21 -0800235// The same source can be used by multiple AudioTracks.
Mirko Bonadei66e76792019-04-02 11:33:59 +0200236class RTC_EXPORT AudioSourceInterface : public MediaSourceInterface {
wu@webrtc.orgb9a088b2014-02-13 23:18:49 +0000237 public:
238 class AudioObserver {
239 public:
240 virtual void OnSetVolume(double volume) = 0;
241
242 protected:
243 virtual ~AudioObserver() {}
244 };
245
deadbeefb10f32f2017-02-08 01:38:21 -0800246 // TODO(deadbeef): Makes all the interfaces pure virtual after they're
247 // implemented in chromium.
248
Artem Titov0e61fdd2021-07-25 21:50:14 +0200249 // Sets the volume of the source. `volume` is in the range of [0, 10].
Tommif888bb52015-12-12 01:37:01 +0100250 // TODO(tommi): This method should be on the track and ideally volume should
251 // be applied in the track in a way that does not affect clones of the track.
wu@webrtc.orgb9a088b2014-02-13 23:18:49 +0000252 virtual void SetVolume(double volume) {}
253
deadbeefb10f32f2017-02-08 01:38:21 -0800254 // Registers/unregisters observers to the audio source.
wu@webrtc.orgb9a088b2014-02-13 23:18:49 +0000255 virtual void RegisterAudioObserver(AudioObserver* observer) {}
256 virtual void UnregisterAudioObserver(AudioObserver* observer) {}
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000257
tommi6eca7e32015-12-15 04:27:11 -0800258 // TODO(tommi): Make pure virtual.
259 virtual void AddSink(AudioTrackSinkInterface* sink) {}
260 virtual void RemoveSink(AudioTrackSinkInterface* sink) {}
Piotr (Peter) Slatala95ca6e12018-11-13 07:57:07 -0800261
262 // Returns options for the AudioSource.
263 // (for some of the settings this approach is broken, e.g. setting
264 // audio network adaptation on the source is the wrong layer of abstraction).
265 virtual const cricket::AudioOptions options() const;
mallinath@webrtc.org67ee6b92014-02-03 16:57:16 +0000266};
267
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000268// Interface of the audio processor used by the audio track to collect
269// statistics.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000270class AudioProcessorInterface : public rtc::RefCountInterface {
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000271 public:
Ivo Creusenae026092017-11-20 13:07:16 +0100272 struct AudioProcessorStatistics {
273 bool typing_noise_detected = false;
Ivo Creusen56d46092017-11-24 17:29:59 +0100274 AudioProcessingStats apm_statistics;
Ivo Creusenae026092017-11-20 13:07:16 +0100275 };
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000276
Artem Titov0e61fdd2021-07-25 21:50:14 +0200277 // Get audio processor statistics. The `has_remote_tracks` argument should be
Ivo Creusenae026092017-11-20 13:07:16 +0100278 // set if there are active remote tracks (this would usually be true during
279 // a call). If there are no remote tracks some of the stats will not be set by
280 // the AudioProcessor, because they only make sense if there is at least one
281 // remote track.
Sam Zackrisson28127632018-11-01 11:37:15 +0100282 virtual AudioProcessorStatistics GetStats(bool has_remote_tracks) = 0;
Ivo Creusenae026092017-11-20 13:07:16 +0100283
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000284 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100285 ~AudioProcessorInterface() override = default;
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000286};
287
Mirko Bonadei35214fc2019-09-23 14:54:28 +0200288class RTC_EXPORT AudioTrackInterface : public MediaStreamTrackInterface {
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000289 public:
deadbeefb10f32f2017-02-08 01:38:21 -0800290 // TODO(deadbeef): Figure out if the following interface should be const or
291 // not.
Yves Gerey665174f2018-06-19 15:03:05 +0200292 virtual AudioSourceInterface* GetSource() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000293
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000294 // Add/Remove a sink that will receive the audio data from the track.
295 virtual void AddSink(AudioTrackSinkInterface* sink) = 0;
296 virtual void RemoveSink(AudioTrackSinkInterface* sink) = 0;
mallinath@webrtc.org67ee6b92014-02-03 16:57:16 +0000297
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000298 // Get the signal level from the audio track.
299 // Return true on success, otherwise false.
deadbeefb10f32f2017-02-08 01:38:21 -0800300 // TODO(deadbeef): Change the interface to int GetSignalLevel() and pure
301 // virtual after it's implemented in chromium.
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100302 virtual bool GetSignalLevel(int* level);
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000303
deadbeef8d60a942017-02-27 14:47:33 -0800304 // Get the audio processor used by the audio track. Return null if the track
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000305 // does not have any processor.
deadbeefb10f32f2017-02-08 01:38:21 -0800306 // TODO(deadbeef): Make the interface pure virtual.
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100307 virtual rtc::scoped_refptr<AudioProcessorInterface> GetAudioProcessor();
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000308
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000309 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100310 ~AudioTrackInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000311};
312
Yves Gerey665174f2018-06-19 15:03:05 +0200313typedef std::vector<rtc::scoped_refptr<AudioTrackInterface> > AudioTrackVector;
314typedef std::vector<rtc::scoped_refptr<VideoTrackInterface> > VideoTrackVector;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000315
deadbeefb10f32f2017-02-08 01:38:21 -0800316// C++ version of https://www.w3.org/TR/mediacapture-streams/#mediastream.
317//
318// A major difference is that remote audio/video tracks (received by a
319// PeerConnection/RtpReceiver) are not synchronized simply by adding them to
320// the same stream; a session description with the correct "a=msid" attributes
321// must be pushed down.
322//
323// Thus, this interface acts as simply a container for tracks.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000324class MediaStreamInterface : public rtc::RefCountInterface,
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000325 public NotifierInterface {
326 public:
Seth Hampson13b8bad2018-03-13 16:05:28 -0700327 virtual std::string id() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000328
329 virtual AudioTrackVector GetAudioTracks() = 0;
330 virtual VideoTrackVector GetVideoTracks() = 0;
Yves Gerey665174f2018-06-19 15:03:05 +0200331 virtual rtc::scoped_refptr<AudioTrackInterface> FindAudioTrack(
332 const std::string& track_id) = 0;
333 virtual rtc::scoped_refptr<VideoTrackInterface> FindVideoTrack(
334 const std::string& track_id) = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000335
336 virtual bool AddTrack(AudioTrackInterface* track) = 0;
337 virtual bool AddTrack(VideoTrackInterface* track) = 0;
338 virtual bool RemoveTrack(AudioTrackInterface* track) = 0;
339 virtual bool RemoveTrack(VideoTrackInterface* track) = 0;
340
341 protected:
Danil Chapovalov2a5ce2b2018-02-07 09:38:31 +0100342 ~MediaStreamInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000343};
344
}  // namespace webrtc

#endif  // API_MEDIA_STREAM_INTERFACE_H_