Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2015 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #ifndef CALL_AUDIO_RECEIVE_STREAM_H_ |
| 12 | #define CALL_AUDIO_RECEIVE_STREAM_H_ |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 13 | |
Fredrik Solenberg | 04f4931 | 2015-06-08 13:04:56 +0200 | [diff] [blame] | 14 | #include <map> |
kwiberg | fffa42b | 2016-02-23 10:46:32 -0800 | [diff] [blame] | 15 | #include <memory> |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 16 | #include <string> |
| 17 | #include <vector> |
| 18 | |
Danil Chapovalov | b9b146c | 2018-06-15 12:28:07 +0200 | [diff] [blame] | 19 | #include "absl/types/optional.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 20 | #include "api/audio_codecs/audio_decoder_factory.h" |
| 21 | #include "api/call/transport.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 22 | #include "api/crypto/crypto_options.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 23 | #include "api/rtp_parameters.h" |
Tommi | 1c1f540 | 2021-06-14 10:54:20 +0200 | [diff] [blame] | 24 | #include "call/receive_stream.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 25 | #include "call/rtp_config.h" |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 26 | |
| 27 | namespace webrtc { |
Tommi | f888bb5 | 2015-12-12 01:37:01 +0100 | [diff] [blame] | 28 | class AudioSinkInterface; |
Fredrik Solenberg | 04f4931 | 2015-06-08 13:04:56 +0200 | [diff] [blame] | 29 | |
Tommi | 1c1f540 | 2021-06-14 10:54:20 +0200 | [diff] [blame] | 30 | class AudioReceiveStream : public MediaReceiveStream { |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 31 | public: |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 32 | struct Stats { |
Paulina Hensman | 11b34f4 | 2018-04-09 14:24:52 +0200 | [diff] [blame] | 33 | Stats(); |
| 34 | ~Stats(); |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 35 | uint32_t remote_ssrc = 0; |
Niels Möller | ac0a4cb | 2019-10-09 15:01:33 +0200 | [diff] [blame] | 36 | int64_t payload_bytes_rcvd = 0; |
| 37 | int64_t header_and_padding_bytes_rcvd = 0; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 38 | uint32_t packets_rcvd = 0; |
Ivo Creusen | 8d8ffdb | 2019-04-30 09:45:21 +0200 | [diff] [blame] | 39 | uint64_t fec_packets_received = 0; |
| 40 | uint64_t fec_packets_discarded = 0; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 41 | uint32_t packets_lost = 0; |
Minyue Li | 28a2c63 | 2021-07-07 15:53:38 +0200 | [diff] [blame] | 42 | uint64_t packets_discarded = 0; |
Jakob Ivarsson | e54914a | 2021-07-01 11:16:05 +0200 | [diff] [blame] | 43 | uint32_t nacks_sent = 0; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 44 | std::string codec_name; |
Danil Chapovalov | b9b146c | 2018-06-15 12:28:07 +0200 | [diff] [blame] | 45 | absl::optional<int> codec_payload_type; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 46 | uint32_t jitter_ms = 0; |
| 47 | uint32_t jitter_buffer_ms = 0; |
| 48 | uint32_t jitter_buffer_preferred_ms = 0; |
| 49 | uint32_t delay_estimate_ms = 0; |
| 50 | int32_t audio_level = -1; |
Gustaf Ullberg | 9a2e906 | 2017-09-18 09:28:20 +0200 | [diff] [blame] | 51 | // Stats below correspond to similarly-named fields in the WebRTC stats |
| 52 | // spec. https://w3c.github.io/webrtc-stats/#dom-rtcmediastreamtrackstats |
zstein | e76bd3a | 2017-07-14 12:17:49 -0700 | [diff] [blame] | 53 | double total_output_energy = 0.0; |
Steve Anton | 2dbc69f | 2017-08-24 17:15:13 -0700 | [diff] [blame] | 54 | uint64_t total_samples_received = 0; |
zstein | e76bd3a | 2017-07-14 12:17:49 -0700 | [diff] [blame] | 55 | double total_output_duration = 0.0; |
Steve Anton | 2dbc69f | 2017-08-24 17:15:13 -0700 | [diff] [blame] | 56 | uint64_t concealed_samples = 0; |
Ivo Creusen | 8d8ffdb | 2019-04-30 09:45:21 +0200 | [diff] [blame] | 57 | uint64_t silent_concealed_samples = 0; |
Gustaf Ullberg | 9a2e906 | 2017-09-18 09:28:20 +0200 | [diff] [blame] | 58 | uint64_t concealment_events = 0; |
Gustaf Ullberg | b0a0207 | 2017-10-02 12:00:34 +0200 | [diff] [blame] | 59 | double jitter_buffer_delay_seconds = 0.0; |
Chen Xing | 0acffb5 | 2019-01-15 15:46:29 +0100 | [diff] [blame] | 60 | uint64_t jitter_buffer_emitted_count = 0; |
Artem Titov | e618cc9 | 2020-03-11 11:18:54 +0100 | [diff] [blame] | 61 | double jitter_buffer_target_delay_seconds = 0.0; |
Ivo Creusen | 8d8ffdb | 2019-04-30 09:45:21 +0200 | [diff] [blame] | 62 | uint64_t inserted_samples_for_deceleration = 0; |
| 63 | uint64_t removed_samples_for_acceleration = 0; |
Gustaf Ullberg | 9a2e906 | 2017-09-18 09:28:20 +0200 | [diff] [blame] | 64 | // Stats below DO NOT correspond directly to anything in the WebRTC stats |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 65 | float expand_rate = 0.0f; |
| 66 | float speech_expand_rate = 0.0f; |
| 67 | float secondary_decoded_rate = 0.0f; |
minyue-webrtc | 0e320ec | 2017-08-28 13:51:27 +0200 | [diff] [blame] | 68 | float secondary_discarded_rate = 0.0f; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 69 | float accelerate_rate = 0.0f; |
| 70 | float preemptive_expand_rate = 0.0f; |
Jakob Ivarsson | 352ce5c | 2018-11-27 12:52:16 +0100 | [diff] [blame] | 71 | uint64_t delayed_packet_outage_samples = 0; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 72 | int32_t decoding_calls_to_silence_generator = 0; |
| 73 | int32_t decoding_calls_to_neteq = 0; |
| 74 | int32_t decoding_normal = 0; |
Alex Narest | 5b5d97c | 2019-08-07 18:15:08 +0200 | [diff] [blame] | 75 | // TODO(alexnarest): Consider decoding_neteq_plc for consistency |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 76 | int32_t decoding_plc = 0; |
Alex Narest | 5b5d97c | 2019-08-07 18:15:08 +0200 | [diff] [blame] | 77 | int32_t decoding_codec_plc = 0; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 78 | int32_t decoding_cng = 0; |
| 79 | int32_t decoding_plc_cng = 0; |
henrik.lundin | 6348978 | 2016-09-20 01:47:12 -0700 | [diff] [blame] | 80 | int32_t decoding_muted_output = 0; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 81 | int64_t capture_start_ntp_time_ms = 0; |
Henrik Boström | 01738c6 | 2019-04-15 17:32:00 +0200 | [diff] [blame] | 82 | // The timestamp at which the last packet was received, i.e. the time of the |
| 83 | // local clock when it was received - not the RTP timestamp of that packet. |
| 84 | // https://w3c.github.io/webrtc-stats/#dom-rtcinboundrtpstreamstats-lastpacketreceivedtimestamp |
| 85 | absl::optional<int64_t> last_packet_received_timestamp_ms; |
Ruslan Burakov | 8af8896 | 2018-11-22 17:21:10 +0100 | [diff] [blame] | 86 | uint64_t jitter_buffer_flushes = 0; |
Jakob Ivarsson | 232b3fd | 2019-03-06 09:18:40 +0100 | [diff] [blame] | 87 | double relative_packet_arrival_delay_seconds = 0.0; |
Henrik Lundin | 44125fa | 2019-04-29 17:00:46 +0200 | [diff] [blame] | 88 | int32_t interruption_count = 0; |
| 89 | int32_t total_interruption_duration_ms = 0; |
Åsa Persson | fcf79cc | 2019-10-22 15:23:44 +0200 | [diff] [blame] | 90 | // https://w3c.github.io/webrtc-stats/#dom-rtcinboundrtpstreamstats-estimatedplayouttimestamp |
| 91 | absl::optional<int64_t> estimated_playout_ntp_timestamp_ms; |
Alessio Bazzica | f7b1b95 | 2021-03-23 17:23:04 +0100 | [diff] [blame] | 92 | // Remote outbound stats derived by the received RTCP sender reports. |
| 93 | // https://w3c.github.io/webrtc-stats/#remoteoutboundrtpstats-dict* |
| 94 | absl::optional<int64_t> last_sender_report_timestamp_ms; |
| 95 | absl::optional<int64_t> last_sender_report_remote_timestamp_ms; |
| 96 | uint32_t sender_reports_packets_sent = 0; |
| 97 | uint64_t sender_reports_bytes_sent = 0; |
| 98 | uint64_t sender_reports_reports_count = 0; |
Ivo Creusen | 2562cf0 | 2021-09-03 14:51:22 +0000 | [diff] [blame] | 99 | absl::optional<TimeDelta> round_trip_time; |
| 100 | TimeDelta total_round_trip_time = TimeDelta::Zero(); |
| 101 | int round_trip_time_measurements; |
Fredrik Solenberg | 4f4ec0a | 2015-10-22 10:49:27 +0200 | [diff] [blame] | 102 | }; |
Fredrik Solenberg | 04f4931 | 2015-06-08 13:04:56 +0200 | [diff] [blame] | 103 | |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 104 | struct Config { |
Paulina Hensman | 11b34f4 | 2018-04-09 14:24:52 +0200 | [diff] [blame] | 105 | Config(); |
| 106 | ~Config(); |
| 107 | |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 108 | std::string ToString() const; |
| 109 | |
| 110 | // Receive-stream specific RTP settings. |
Tommi | 1c1f540 | 2021-06-14 10:54:20 +0200 | [diff] [blame] | 111 | struct Rtp : public RtpConfig { |
Paulina Hensman | 11b34f4 | 2018-04-09 14:24:52 +0200 | [diff] [blame] | 112 | Rtp(); |
| 113 | ~Rtp(); |
| 114 | |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 115 | std::string ToString() const; |
| 116 | |
solenberg | 8189b02 | 2016-06-14 12:13:00 -0700 | [diff] [blame] | 117 | // See NackConfig for description. |
| 118 | NackConfig nack; |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 119 | } rtp; |
Fredrik Solenberg | 04f4931 | 2015-06-08 13:04:56 +0200 | [diff] [blame] | 120 | |
Ivo Creusen | 2562cf0 | 2021-09-03 14:51:22 +0000 | [diff] [blame] | 121 | // Receive-side RTT. |
| 122 | bool enable_non_sender_rtt = false; |
| 123 | |
solenberg | cf18b34 | 2015-10-01 08:13:42 -0700 | [diff] [blame] | 124 | Transport* rtcp_send_transport = nullptr; |
| 125 | |
Fredrik Solenberg | 8f5787a | 2018-01-11 13:52:30 +0100 | [diff] [blame] | 126 | // NetEq settings. |
Jakob Ivarsson | 647d5e6 | 2019-03-15 10:37:31 +0100 | [diff] [blame] | 127 | size_t jitter_buffer_max_packets = 200; |
Fredrik Solenberg | 8f5787a | 2018-01-11 13:52:30 +0100 | [diff] [blame] | 128 | bool jitter_buffer_fast_accelerate = false; |
Jakob Ivarsson | 10403ae | 2018-11-27 15:45:20 +0100 | [diff] [blame] | 129 | int jitter_buffer_min_delay_ms = 0; |
Jakob Ivarsson | 53eae87 | 2019-01-10 15:58:36 +0100 | [diff] [blame] | 130 | bool jitter_buffer_enable_rtx_handling = false; |
Fredrik Solenberg | 8f5787a | 2018-01-11 13:52:30 +0100 | [diff] [blame] | 131 | |
pbos | 8fc7fa7 | 2015-07-15 08:02:58 -0700 | [diff] [blame] | 132 | // Identifier for an A/V synchronization group. Empty string to disable. |
| 133 | // TODO(pbos): Synchronize streams in a sync group, not just one video |
| 134 | // stream to one audio stream. Tracked by issue webrtc:4762. |
| 135 | std::string sync_group; |
| 136 | |
kwiberg | d32bf75 | 2017-01-19 07:03:59 -0800 | [diff] [blame] | 137 | // Decoder specifications for every payload type that we can receive. |
| 138 | std::map<int, SdpAudioFormat> decoder_map; |
ossu | 29b1a8d | 2016-06-13 07:34:51 -0700 | [diff] [blame] | 139 | |
| 140 | rtc::scoped_refptr<AudioDecoderFactory> decoder_factory; |
Karl Wiberg | 0812634 | 2018-03-20 19:18:55 +0100 | [diff] [blame] | 141 | |
Danil Chapovalov | b9b146c | 2018-06-15 12:28:07 +0200 | [diff] [blame] | 142 | absl::optional<AudioCodecPairId> codec_pair_id; |
Benjamin Wright | 84583f6 | 2018-10-04 14:22:34 -0700 | [diff] [blame] | 143 | |
Benjamin Wright | bfb444c | 2018-10-15 10:20:24 -0700 | [diff] [blame] | 144 | // Per PeerConnection crypto options. |
| 145 | webrtc::CryptoOptions crypto_options; |
| 146 | |
Benjamin Wright | 84583f6 | 2018-10-04 14:22:34 -0700 | [diff] [blame] | 147 | // An optional custom frame decryptor that allows the entire frame to be |
| 148 | // decrypted in whatever way the caller choses. This is not required by |
| 149 | // default. |
Tommi | 6eda26c | 2021-06-09 13:46:28 +0200 | [diff] [blame] | 150 | // TODO(tommi): Remove this member variable from the struct. It's not |
| 151 | // a part of the AudioReceiveStream state but rather a pass through |
| 152 | // variable. |
Benjamin Wright | 84583f6 | 2018-10-04 14:22:34 -0700 | [diff] [blame] | 153 | rtc::scoped_refptr<webrtc::FrameDecryptorInterface> frame_decryptor; |
Marina Ciocea | 3e9af7f | 2020-04-01 07:46:16 +0200 | [diff] [blame] | 154 | |
| 155 | // An optional frame transformer used by insertable streams to transform |
| 156 | // encoded frames. |
Tommi | 6eda26c | 2021-06-09 13:46:28 +0200 | [diff] [blame] | 157 | // TODO(tommi): Remove this member variable from the struct. It's not |
| 158 | // a part of the AudioReceiveStream state but rather a pass through |
| 159 | // variable. |
Marina Ciocea | 3e9af7f | 2020-04-01 07:46:16 +0200 | [diff] [blame] | 160 | rtc::scoped_refptr<webrtc::FrameTransformerInterface> frame_transformer; |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 161 | }; |
| 162 | |
Tommi | 6eda26c | 2021-06-09 13:46:28 +0200 | [diff] [blame] | 163 | // Methods that support reconfiguring the stream post initialization. |
Tommi | 6eda26c | 2021-06-09 13:46:28 +0200 | [diff] [blame] | 164 | virtual void SetDecoderMap(std::map<int, SdpAudioFormat> decoder_map) = 0; |
| 165 | virtual void SetUseTransportCcAndNackHistory(bool use_transport_cc, |
| 166 | int history_ms) = 0; |
Ivo Creusen | 2562cf0 | 2021-09-03 14:51:22 +0000 | [diff] [blame] | 167 | virtual void SetNonSenderRttMeasurement(bool enabled) = 0; |
| 168 | |
Tomas Gunnarsson | 8467cf2 | 2021-01-17 14:36:44 +0100 | [diff] [blame] | 169 | // Returns true if the stream has been started. |
| 170 | virtual bool IsRunning() const = 0; |
| 171 | |
Niels Möller | 6b4d962 | 2020-09-14 10:47:50 +0200 | [diff] [blame] | 172 | virtual Stats GetStats(bool get_and_clear_legacy_stats) const = 0; |
| 173 | Stats GetStats() { return GetStats(/*get_and_clear_legacy_stats=*/true); } |
Tommi | f888bb5 | 2015-12-12 01:37:01 +0100 | [diff] [blame] | 174 | |
| 175 | // Sets an audio sink that receives unmixed audio from the receive stream. |
Fredrik Solenberg | 8f5787a | 2018-01-11 13:52:30 +0100 | [diff] [blame] | 176 | // Ownership of the sink is managed by the caller. |
deadbeef | 884f585 | 2016-01-15 09:20:04 -0800 | [diff] [blame] | 177 | // Only one sink can be set and passing a null sink clears an existing one. |
Tommi | f888bb5 | 2015-12-12 01:37:01 +0100 | [diff] [blame] | 178 | // NOTE: Audio must still somehow be pulled through AudioTransport for audio |
| 179 | // to stream through this sink. In practice, this happens if mixed audio |
| 180 | // is being pulled+rendered and/or if audio is being pulled for the purposes |
| 181 | // of feeding to the AEC. |
Fredrik Solenberg | 8f5787a | 2018-01-11 13:52:30 +0100 | [diff] [blame] | 182 | virtual void SetSink(AudioSinkInterface* sink) = 0; |
pbos | 1ba8d39 | 2016-05-01 20:18:34 -0700 | [diff] [blame] | 183 | |
solenberg | 217fb66 | 2016-06-17 08:30:54 -0700 | [diff] [blame] | 184 | // Sets playback gain of the stream, applied when mixing, and thus after it |
| 185 | // is potentially forwarded to any attached AudioSinkInterface implementation. |
| 186 | virtual void SetGain(float gain) = 0; |
| 187 | |
Ruslan Burakov | 3b50f9f | 2019-02-06 09:45:56 +0100 | [diff] [blame] | 188 | // Sets a base minimum for the playout delay. Base minimum delay sets lower |
| 189 | // bound on minimum delay value determining lower bound on playout delay. |
| 190 | // |
| 191 | // Returns true if value was successfully set, false overwise. |
| 192 | virtual bool SetBaseMinimumPlayoutDelayMs(int delay_ms) = 0; |
| 193 | |
| 194 | // Returns current value of base minimum delay in milliseconds. |
| 195 | virtual int GetBaseMinimumPlayoutDelayMs() const = 0; |
| 196 | |
Tommi | cb7c736 | 2022-05-09 14:49:37 +0000 | [diff] [blame^] | 197 | // Synchronization source (stream identifier) to be received. |
| 198 | // This member will not change mid-stream and can be assumed to be const |
| 199 | // post initialization. |
| 200 | virtual uint32_t remote_ssrc() const = 0; |
| 201 | |
pbos | 1ba8d39 | 2016-05-01 20:18:34 -0700 | [diff] [blame] | 202 | protected: |
| 203 | virtual ~AudioReceiveStream() {} |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 204 | }; |
Fredrik Solenberg | 23fba1f | 2015-04-29 15:24:01 +0200 | [diff] [blame] | 205 | } // namespace webrtc |
| 206 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 207 | #endif // CALL_AUDIO_RECEIVE_STREAM_H_ |