blob: 1228861c4242d3fb3c8695da01a79de94dde0a5a [file] [log] [blame]
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +02001/*
2 * Copyright (c) 2015 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef CALL_AUDIO_RECEIVE_STREAM_H_
12#define CALL_AUDIO_RECEIVE_STREAM_H_
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +020013
Fredrik Solenberg04f49312015-06-08 13:04:56 +020014#include <map>
kwibergfffa42b2016-02-23 10:46:32 -080015#include <memory>
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +020016#include <string>
17#include <vector>
18
Danil Chapovalovb9b146c2018-06-15 12:28:07 +020019#include "absl/types/optional.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020020#include "api/audio_codecs/audio_decoder_factory.h"
21#include "api/call/transport.h"
Steve Anton10542f22019-01-11 09:11:00 -080022#include "api/crypto/crypto_options.h"
Steve Anton10542f22019-01-11 09:11:00 -080023#include "api/rtp_parameters.h"
Tommi1c1f5402021-06-14 10:54:20 +020024#include "call/receive_stream.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "call/rtp_config.h"
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +020026
27namespace webrtc {
Tommif888bb52015-12-12 01:37:01 +010028class AudioSinkInterface;
Fredrik Solenberg04f49312015-06-08 13:04:56 +020029
Tommi3176ef72022-05-22 20:47:28 +020030class AudioReceiveStreamInterface : public MediaReceiveStreamInterface {
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +020031 public:
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020032 struct Stats {
Paulina Hensman11b34f42018-04-09 14:24:52 +020033 Stats();
34 ~Stats();
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020035 uint32_t remote_ssrc = 0;
Niels Möllerac0a4cb2019-10-09 15:01:33 +020036 int64_t payload_bytes_rcvd = 0;
37 int64_t header_and_padding_bytes_rcvd = 0;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020038 uint32_t packets_rcvd = 0;
Ivo Creusen8d8ffdb2019-04-30 09:45:21 +020039 uint64_t fec_packets_received = 0;
40 uint64_t fec_packets_discarded = 0;
Philipp Hanckeaf512282022-10-14 09:32:58 +020041 int32_t packets_lost = 0;
Minyue Li28a2c632021-07-07 15:53:38 +020042 uint64_t packets_discarded = 0;
Jakob Ivarssone54914a2021-07-01 11:16:05 +020043 uint32_t nacks_sent = 0;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020044 std::string codec_name;
Danil Chapovalovb9b146c2018-06-15 12:28:07 +020045 absl::optional<int> codec_payload_type;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020046 uint32_t jitter_ms = 0;
47 uint32_t jitter_buffer_ms = 0;
48 uint32_t jitter_buffer_preferred_ms = 0;
49 uint32_t delay_estimate_ms = 0;
50 int32_t audio_level = -1;
Gustaf Ullberg9a2e9062017-09-18 09:28:20 +020051 // Stats below correspond to similarly-named fields in the WebRTC stats
52 // spec. https://w3c.github.io/webrtc-stats/#dom-rtcmediastreamtrackstats
zsteine76bd3a2017-07-14 12:17:49 -070053 double total_output_energy = 0.0;
Steve Anton2dbc69f2017-08-24 17:15:13 -070054 uint64_t total_samples_received = 0;
zsteine76bd3a2017-07-14 12:17:49 -070055 double total_output_duration = 0.0;
Steve Anton2dbc69f2017-08-24 17:15:13 -070056 uint64_t concealed_samples = 0;
Ivo Creusen8d8ffdb2019-04-30 09:45:21 +020057 uint64_t silent_concealed_samples = 0;
Gustaf Ullberg9a2e9062017-09-18 09:28:20 +020058 uint64_t concealment_events = 0;
Gustaf Ullbergb0a02072017-10-02 12:00:34 +020059 double jitter_buffer_delay_seconds = 0.0;
Chen Xing0acffb52019-01-15 15:46:29 +010060 uint64_t jitter_buffer_emitted_count = 0;
Artem Titove618cc92020-03-11 11:18:54 +010061 double jitter_buffer_target_delay_seconds = 0.0;
Ivo Creusen1a84b562022-07-19 16:33:10 +020062 double jitter_buffer_minimum_delay_seconds = 0.0;
Ivo Creusen8d8ffdb2019-04-30 09:45:21 +020063 uint64_t inserted_samples_for_deceleration = 0;
64 uint64_t removed_samples_for_acceleration = 0;
Gustaf Ullberg9a2e9062017-09-18 09:28:20 +020065 // Stats below DO NOT correspond directly to anything in the WebRTC stats
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020066 float expand_rate = 0.0f;
67 float speech_expand_rate = 0.0f;
68 float secondary_decoded_rate = 0.0f;
minyue-webrtc0e320ec2017-08-28 13:51:27 +020069 float secondary_discarded_rate = 0.0f;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020070 float accelerate_rate = 0.0f;
71 float preemptive_expand_rate = 0.0f;
Jakob Ivarsson352ce5c2018-11-27 12:52:16 +010072 uint64_t delayed_packet_outage_samples = 0;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020073 int32_t decoding_calls_to_silence_generator = 0;
74 int32_t decoding_calls_to_neteq = 0;
75 int32_t decoding_normal = 0;
Alex Narest5b5d97c2019-08-07 18:15:08 +020076 // TODO(alexnarest): Consider decoding_neteq_plc for consistency
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020077 int32_t decoding_plc = 0;
Alex Narest5b5d97c2019-08-07 18:15:08 +020078 int32_t decoding_codec_plc = 0;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020079 int32_t decoding_cng = 0;
80 int32_t decoding_plc_cng = 0;
henrik.lundin63489782016-09-20 01:47:12 -070081 int32_t decoding_muted_output = 0;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +020082 int64_t capture_start_ntp_time_ms = 0;
Henrik Boström01738c62019-04-15 17:32:00 +020083 // The timestamp at which the last packet was received, i.e. the time of the
84 // local clock when it was received - not the RTP timestamp of that packet.
85 // https://w3c.github.io/webrtc-stats/#dom-rtcinboundrtpstreamstats-lastpacketreceivedtimestamp
86 absl::optional<int64_t> last_packet_received_timestamp_ms;
Ruslan Burakov8af88962018-11-22 17:21:10 +010087 uint64_t jitter_buffer_flushes = 0;
Jakob Ivarsson232b3fd2019-03-06 09:18:40 +010088 double relative_packet_arrival_delay_seconds = 0.0;
Henrik Lundin44125fa2019-04-29 17:00:46 +020089 int32_t interruption_count = 0;
90 int32_t total_interruption_duration_ms = 0;
Åsa Perssonfcf79cc2019-10-22 15:23:44 +020091 // https://w3c.github.io/webrtc-stats/#dom-rtcinboundrtpstreamstats-estimatedplayouttimestamp
92 absl::optional<int64_t> estimated_playout_ntp_timestamp_ms;
Alessio Bazzicaf7b1b952021-03-23 17:23:04 +010093 // Remote outbound stats derived by the received RTCP sender reports.
94 // https://w3c.github.io/webrtc-stats/#remoteoutboundrtpstats-dict*
95 absl::optional<int64_t> last_sender_report_timestamp_ms;
96 absl::optional<int64_t> last_sender_report_remote_timestamp_ms;
97 uint32_t sender_reports_packets_sent = 0;
98 uint64_t sender_reports_bytes_sent = 0;
99 uint64_t sender_reports_reports_count = 0;
Ivo Creusen2562cf02021-09-03 14:51:22 +0000100 absl::optional<TimeDelta> round_trip_time;
101 TimeDelta total_round_trip_time = TimeDelta::Zero();
102 int round_trip_time_measurements;
Fredrik Solenberg4f4ec0a2015-10-22 10:49:27 +0200103 };
Fredrik Solenberg04f49312015-06-08 13:04:56 +0200104
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200105 struct Config {
Paulina Hensman11b34f42018-04-09 14:24:52 +0200106 Config();
107 ~Config();
108
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200109 std::string ToString() const;
110
111 // Receive-stream specific RTP settings.
Tommi7a15ff32022-05-09 18:54:02 +0000112 struct Rtp : public ReceiveStreamRtpConfig {
Paulina Hensman11b34f42018-04-09 14:24:52 +0200113 Rtp();
114 ~Rtp();
115
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200116 std::string ToString() const;
117
solenberg8189b022016-06-14 12:13:00 -0700118 // See NackConfig for description.
119 NackConfig nack;
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200120 } rtp;
Fredrik Solenberg04f49312015-06-08 13:04:56 +0200121
Ivo Creusen2562cf02021-09-03 14:51:22 +0000122 // Receive-side RTT.
123 bool enable_non_sender_rtt = false;
124
solenbergcf18b342015-10-01 08:13:42 -0700125 Transport* rtcp_send_transport = nullptr;
126
Fredrik Solenberg8f5787a2018-01-11 13:52:30 +0100127 // NetEq settings.
Jakob Ivarsson647d5e62019-03-15 10:37:31 +0100128 size_t jitter_buffer_max_packets = 200;
Fredrik Solenberg8f5787a2018-01-11 13:52:30 +0100129 bool jitter_buffer_fast_accelerate = false;
Jakob Ivarsson10403ae2018-11-27 15:45:20 +0100130 int jitter_buffer_min_delay_ms = 0;
Fredrik Solenberg8f5787a2018-01-11 13:52:30 +0100131
pbos8fc7fa72015-07-15 08:02:58 -0700132 // Identifier for an A/V synchronization group. Empty string to disable.
133 // TODO(pbos): Synchronize streams in a sync group, not just one video
134 // stream to one audio stream. Tracked by issue webrtc:4762.
135 std::string sync_group;
136
kwibergd32bf752017-01-19 07:03:59 -0800137 // Decoder specifications for every payload type that we can receive.
138 std::map<int, SdpAudioFormat> decoder_map;
ossu29b1a8d2016-06-13 07:34:51 -0700139
140 rtc::scoped_refptr<AudioDecoderFactory> decoder_factory;
Karl Wiberg08126342018-03-20 19:18:55 +0100141
Danil Chapovalovb9b146c2018-06-15 12:28:07 +0200142 absl::optional<AudioCodecPairId> codec_pair_id;
Benjamin Wright84583f62018-10-04 14:22:34 -0700143
Benjamin Wrightbfb444c2018-10-15 10:20:24 -0700144 // Per PeerConnection crypto options.
145 webrtc::CryptoOptions crypto_options;
146
Benjamin Wright84583f62018-10-04 14:22:34 -0700147 // An optional custom frame decryptor that allows the entire frame to be
148 // decrypted in whatever way the caller choses. This is not required by
149 // default.
Tommi6eda26c2021-06-09 13:46:28 +0200150 // TODO(tommi): Remove this member variable from the struct. It's not
Tommi3176ef72022-05-22 20:47:28 +0200151 // a part of the AudioReceiveStreamInterface state but rather a pass through
Tommi6eda26c2021-06-09 13:46:28 +0200152 // variable.
Benjamin Wright84583f62018-10-04 14:22:34 -0700153 rtc::scoped_refptr<webrtc::FrameDecryptorInterface> frame_decryptor;
Marina Ciocea3e9af7f2020-04-01 07:46:16 +0200154
155 // An optional frame transformer used by insertable streams to transform
156 // encoded frames.
Tommi6eda26c2021-06-09 13:46:28 +0200157 // TODO(tommi): Remove this member variable from the struct. It's not
Tommi3176ef72022-05-22 20:47:28 +0200158 // a part of the AudioReceiveStreamInterface state but rather a pass through
Tommi6eda26c2021-06-09 13:46:28 +0200159 // variable.
Marina Ciocea3e9af7f2020-04-01 07:46:16 +0200160 rtc::scoped_refptr<webrtc::FrameTransformerInterface> frame_transformer;
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200161 };
162
Tommi6eda26c2021-06-09 13:46:28 +0200163 // Methods that support reconfiguring the stream post initialization.
Tommi6eda26c2021-06-09 13:46:28 +0200164 virtual void SetDecoderMap(std::map<int, SdpAudioFormat> decoder_map) = 0;
Tommia136ed42022-05-30 15:08:13 +0200165 virtual void SetNackHistory(int history_ms) = 0;
Ivo Creusen2562cf02021-09-03 14:51:22 +0000166 virtual void SetNonSenderRttMeasurement(bool enabled) = 0;
167
Tomas Gunnarsson8467cf22021-01-17 14:36:44 +0100168 // Returns true if the stream has been started.
169 virtual bool IsRunning() const = 0;
170
Niels Möller6b4d9622020-09-14 10:47:50 +0200171 virtual Stats GetStats(bool get_and_clear_legacy_stats) const = 0;
172 Stats GetStats() { return GetStats(/*get_and_clear_legacy_stats=*/true); }
Tommif888bb52015-12-12 01:37:01 +0100173
174 // Sets an audio sink that receives unmixed audio from the receive stream.
Fredrik Solenberg8f5787a2018-01-11 13:52:30 +0100175 // Ownership of the sink is managed by the caller.
deadbeef884f5852016-01-15 09:20:04 -0800176 // Only one sink can be set and passing a null sink clears an existing one.
Tommif888bb52015-12-12 01:37:01 +0100177 // NOTE: Audio must still somehow be pulled through AudioTransport for audio
178 // to stream through this sink. In practice, this happens if mixed audio
179 // is being pulled+rendered and/or if audio is being pulled for the purposes
180 // of feeding to the AEC.
Fredrik Solenberg8f5787a2018-01-11 13:52:30 +0100181 virtual void SetSink(AudioSinkInterface* sink) = 0;
pbos1ba8d392016-05-01 20:18:34 -0700182
solenberg217fb662016-06-17 08:30:54 -0700183 // Sets playback gain of the stream, applied when mixing, and thus after it
184 // is potentially forwarded to any attached AudioSinkInterface implementation.
185 virtual void SetGain(float gain) = 0;
186
Ruslan Burakov3b50f9f2019-02-06 09:45:56 +0100187 // Sets a base minimum for the playout delay. Base minimum delay sets lower
188 // bound on minimum delay value determining lower bound on playout delay.
189 //
190 // Returns true if value was successfully set, false overwise.
191 virtual bool SetBaseMinimumPlayoutDelayMs(int delay_ms) = 0;
192
193 // Returns current value of base minimum delay in milliseconds.
194 virtual int GetBaseMinimumPlayoutDelayMs() const = 0;
195
Tommicb7c7362022-05-09 14:49:37 +0000196 // Synchronization source (stream identifier) to be received.
197 // This member will not change mid-stream and can be assumed to be const
198 // post initialization.
199 virtual uint32_t remote_ssrc() const = 0;
200
pbos1ba8d392016-05-01 20:18:34 -0700201 protected:
Tommi3176ef72022-05-22 20:47:28 +0200202 virtual ~AudioReceiveStreamInterface() {}
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200203};
Tommi3176ef72022-05-22 20:47:28 +0200204
Fredrik Solenberg23fba1f2015-04-29 15:24:01 +0200205} // namespace webrtc
206
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200207#endif // CALL_AUDIO_RECEIVE_STREAM_H_