blob: d296a57658c73fe46b3536bb7f3a53096d258f05 [file] [log] [blame]
turaj@webrtc.org7959e162013-09-12 18:30:26 +00001/*
2 * Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/audio_coding/acm2/acm_receiver.h"
turaj@webrtc.org7959e162013-09-12 18:30:26 +000012
Yves Gerey988cc082018-10-23 12:03:01 +020013#include <stdlib.h>
14#include <string.h>
15#include <cstdint>
turaj@webrtc.org7959e162013-09-12 18:30:26 +000016#include <vector>
17
Niels Möller2edab4c2018-10-22 09:48:08 +020018#include "absl/strings/match.h"
Yves Gerey988cc082018-10-23 12:03:01 +020019#include "api/audio/audio_frame.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020020#include "api/audio_codecs/audio_decoder.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "modules/audio_coding/acm2/acm_resampler.h"
22#include "modules/audio_coding/acm2/call_statistics.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020023#include "modules/audio_coding/neteq/include/neteq.h"
Fredrik Solenbergbbf21a32018-04-12 22:44:09 +020024#include "modules/include/module_common_types.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "rtc_base/checks.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020026#include "rtc_base/logging.h"
Karl Wiberge40468b2017-11-22 10:42:26 +010027#include "rtc_base/numerics/safe_conversions.h"
Jonas Olssonabbe8412018-04-03 13:40:05 +020028#include "rtc_base/strings/audio_format_to_string.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020029#include "system_wrappers/include/clock.h"
turaj@webrtc.org7959e162013-09-12 18:30:26 +000030
31namespace webrtc {
32
turaj@webrtc.org6d5d2482013-10-06 04:47:28 +000033namespace acm2 {
34
henrik.lundin@webrtc.org0bc9b5a2014-04-29 08:09:31 +000035AcmReceiver::AcmReceiver(const AudioCodingModule::Config& config)
kwiberg6f0f6162016-09-20 03:07:46 -070036 : last_audio_buffer_(new int16_t[AudioFrame::kMaxDataSizeSamples]),
ossue3525782016-05-25 07:37:43 -070037 neteq_(NetEq::Create(config.neteq_config, config.decoder_factory)),
henrik.lundin@webrtc.org0bc9b5a2014-04-29 08:09:31 +000038 clock_(config.clock),
henrik.lundin678c9032015-11-02 08:31:23 -080039 resampled_last_output_frame_(true) {
Henrik Lundin02ed2012017-06-08 09:03:55 +020040 RTC_DCHECK(clock_);
Henrik Lundin76c10672018-05-07 13:47:28 +020041 memset(last_audio_buffer_.get(), 0,
42 sizeof(int16_t) * AudioFrame::kMaxDataSizeSamples);
turaj@webrtc.org7959e162013-09-12 18:30:26 +000043}
44
Henrik Lundin6af93992017-06-14 14:13:02 +020045AcmReceiver::~AcmReceiver() = default;
turaj@webrtc.org7959e162013-09-12 18:30:26 +000046
47int AcmReceiver::SetMinimumDelay(int delay_ms) {
48 if (neteq_->SetMinimumDelay(delay_ms))
49 return 0;
Mirko Bonadei675513b2017-11-09 11:09:25 +010050 RTC_LOG(LERROR) << "AcmReceiver::SetExtraDelay " << delay_ms;
turaj@webrtc.org7959e162013-09-12 18:30:26 +000051 return -1;
52}
53
turaj@webrtc.org7959e162013-09-12 18:30:26 +000054int AcmReceiver::SetMaximumDelay(int delay_ms) {
55 if (neteq_->SetMaximumDelay(delay_ms))
56 return 0;
Mirko Bonadei675513b2017-11-09 11:09:25 +010057 RTC_LOG(LERROR) << "AcmReceiver::SetExtraDelay " << delay_ms;
turaj@webrtc.org7959e162013-09-12 18:30:26 +000058 return -1;
59}
60
Ruslan Burakov9bee67c2019-02-05 13:49:26 +010061bool AcmReceiver::SetBaseMinimumDelayMs(int delay_ms) {
62 return neteq_->SetBaseMinimumDelayMs(delay_ms);
63}
64
65int AcmReceiver::GetBaseMinimumDelayMs() const {
66 return neteq_->GetBaseMinimumDelayMs();
67}
68
Danil Chapovalovb6021232018-06-19 13:26:36 +020069absl::optional<int> AcmReceiver::last_packet_sample_rate_hz() const {
Tommi9090e0b2016-01-20 13:39:36 +010070 rtc::CritScope lock(&crit_sect_);
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +010071 if (!last_decoder_) {
72 return absl::nullopt;
73 }
74 return last_decoder_->second.clockrate_hz;
henrik.lundin057fb892015-11-23 08:19:52 -080075}
76
henrik.lundind89814b2015-11-23 06:49:25 -080077int AcmReceiver::last_output_sample_rate_hz() const {
78 return neteq_->last_output_sample_rate_hz();
turaj@webrtc.org7959e162013-09-12 18:30:26 +000079}
80
Niels Möllerafb5dbb2019-02-15 15:21:47 +010081int AcmReceiver::InsertPacket(const RTPHeader& rtp_header,
kwibergee2bac22015-11-11 10:34:00 -080082 rtc::ArrayView<const uint8_t> incoming_payload) {
henrik.lundinb8c55b12017-05-10 07:38:01 -070083 if (incoming_payload.empty()) {
Niels Möllerafb5dbb2019-02-15 15:21:47 +010084 neteq_->InsertEmptyPacket(rtp_header);
henrik.lundinb8c55b12017-05-10 07:38:01 -070085 return 0;
86 }
87
Niels Möllerafb5dbb2019-02-15 15:21:47 +010088 int payload_type = rtp_header.payloadType;
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +010089 auto format = neteq_->GetDecoderFormat(payload_type);
90 if (format && absl::EqualsIgnoreCase(format->name, "red")) {
91 // This is a RED packet. Get the format of the audio codec.
92 payload_type = incoming_payload[0] & 0x7f;
93 format = neteq_->GetDecoderFormat(payload_type);
94 }
95 if (!format) {
96 RTC_LOG_F(LS_ERROR) << "Payload-type "
97 << payload_type
98 << " is not registered.";
99 return -1;
100 }
101
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000102 {
Tommi9090e0b2016-01-20 13:39:36 +0100103 rtc::CritScope lock(&crit_sect_);
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100104 if (absl::EqualsIgnoreCase(format->name, "cn")) {
105 if (last_decoder_ && last_decoder_->second.num_channels > 1) {
kwiberg6f0f6162016-09-20 03:07:46 -0700106 // This is a CNG and the audio codec is not mono, so skip pushing in
107 // packets into NetEq.
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000108 return 0;
kwiberg6f0f6162016-09-20 03:07:46 -0700109 }
110 } else {
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100111 RTC_DCHECK(format);
112 last_decoder_ = std::make_pair(payload_type, *format);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000113 }
henrik.lundin@webrtc.orga90abde2014-06-09 18:35:11 +0000114 } // |crit_sect_| is released.
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000115
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100116 uint32_t receive_timestamp = NowInTimestamp(format->clockrate_hz);
Niels Möllerafb5dbb2019-02-15 15:21:47 +0100117 if (neteq_->InsertPacket(rtp_header, incoming_payload, receive_timestamp) <
118 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100119 RTC_LOG(LERROR) << "AcmReceiver::InsertPacket "
Niels Möllerafb5dbb2019-02-15 15:21:47 +0100120 << static_cast<int>(rtp_header.payloadType)
Mirko Bonadei675513b2017-11-09 11:09:25 +0100121 << " Failed to insert packet";
henrik.lundin@webrtc.orgeecf5e62014-06-24 13:11:22 +0000122 return -1;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000123 }
124 return 0;
125}
126
henrik.lundin834a6ea2016-05-13 03:45:24 -0700127int AcmReceiver::GetAudio(int desired_freq_hz,
128 AudioFrame* audio_frame,
129 bool* muted) {
henrik.lundin63489782016-09-20 01:47:12 -0700130 RTC_DCHECK(muted);
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000131 // Accessing members, take the lock.
Tommi9090e0b2016-01-20 13:39:36 +0100132 rtc::CritScope lock(&crit_sect_);
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000133
henrik.lundin834a6ea2016-05-13 03:45:24 -0700134 if (neteq_->GetAudio(audio_frame, muted) != NetEq::kOK) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100135 RTC_LOG(LERROR) << "AcmReceiver::GetAudio - NetEq Failed.";
henrik.lundin@webrtc.orgeecf5e62014-06-24 13:11:22 +0000136 return -1;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000137 }
138
henrik.lundind89814b2015-11-23 06:49:25 -0800139 const int current_sample_rate_hz = neteq_->last_output_sample_rate_hz();
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000140
141 // Update if resampling is required.
henrik.lundind89814b2015-11-23 06:49:25 -0800142 const bool need_resampling =
143 (desired_freq_hz != -1) && (current_sample_rate_hz != desired_freq_hz);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000144
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000145 if (need_resampling && !resampled_last_output_frame_) {
146 // Prime the resampler with the last frame.
147 int16_t temp_output[AudioFrame::kMaxDataSizeSamples];
henrik.lundind89814b2015-11-23 06:49:25 -0800148 int samples_per_channel_int = resampler_.Resample10Msec(
149 last_audio_buffer_.get(), current_sample_rate_hz, desired_freq_hz,
henrik.lundin6d8e0112016-03-04 10:34:21 -0800150 audio_frame->num_channels_, AudioFrame::kMaxDataSizeSamples,
151 temp_output);
Peter Kastingdce40cf2015-08-24 14:52:23 -0700152 if (samples_per_channel_int < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100153 RTC_LOG(LERROR) << "AcmReceiver::GetAudio - "
154 "Resampling last_audio_buffer_ failed.";
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000155 return -1;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000156 }
157 }
158
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000159 // TODO(henrik.lundin) Glitches in the output may appear if the output rate
160 // from NetEq changes. See WebRTC issue 3923.
161 if (need_resampling) {
yujo36b1a5f2017-06-12 12:45:32 -0700162 // TODO(yujo): handle this more efficiently for muted frames.
henrik.lundind89814b2015-11-23 06:49:25 -0800163 int samples_per_channel_int = resampler_.Resample10Msec(
yujo36b1a5f2017-06-12 12:45:32 -0700164 audio_frame->data(), current_sample_rate_hz, desired_freq_hz,
henrik.lundin6d8e0112016-03-04 10:34:21 -0800165 audio_frame->num_channels_, AudioFrame::kMaxDataSizeSamples,
yujo36b1a5f2017-06-12 12:45:32 -0700166 audio_frame->mutable_data());
Peter Kastingdce40cf2015-08-24 14:52:23 -0700167 if (samples_per_channel_int < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100168 RTC_LOG(LERROR)
169 << "AcmReceiver::GetAudio - Resampling audio_buffer_ failed.";
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000170 return -1;
171 }
henrik.lundin6d8e0112016-03-04 10:34:21 -0800172 audio_frame->samples_per_channel_ =
173 static_cast<size_t>(samples_per_channel_int);
174 audio_frame->sample_rate_hz_ = desired_freq_hz;
175 RTC_DCHECK_EQ(
176 audio_frame->sample_rate_hz_,
kwibergd3edd772017-03-01 18:52:48 -0800177 rtc::dchecked_cast<int>(audio_frame->samples_per_channel_ * 100));
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000178 resampled_last_output_frame_ = true;
179 } else {
180 resampled_last_output_frame_ = false;
181 // We might end up here ONLY if codec is changed.
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000182 }
183
henrik.lundin6d8e0112016-03-04 10:34:21 -0800184 // Store current audio in |last_audio_buffer_| for next time.
yujo36b1a5f2017-06-12 12:45:32 -0700185 memcpy(last_audio_buffer_.get(), audio_frame->data(),
henrik.lundin6d8e0112016-03-04 10:34:21 -0800186 sizeof(int16_t) * audio_frame->samples_per_channel_ *
187 audio_frame->num_channels_);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000188
henrik.lundin63489782016-09-20 01:47:12 -0700189 call_stats_.DecodedByNetEq(audio_frame->speech_type_, *muted);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000190 return 0;
191}
192
kwiberg1c07c702017-03-27 07:15:49 -0700193void AcmReceiver::SetCodecs(const std::map<int, SdpAudioFormat>& codecs) {
194 neteq_->SetCodecs(codecs);
195}
196
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000197void AcmReceiver::FlushBuffers() {
198 neteq_->FlushBuffers();
199}
200
kwiberg6b19b562016-09-20 04:02:25 -0700201void AcmReceiver::RemoveAllCodecs() {
Tommi9090e0b2016-01-20 13:39:36 +0100202 rtc::CritScope lock(&crit_sect_);
kwiberg6b19b562016-09-20 04:02:25 -0700203 neteq_->RemoveAllPayloadTypes();
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100204 last_decoder_ = absl::nullopt;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000205}
206
Danil Chapovalovb6021232018-06-19 13:26:36 +0200207absl::optional<uint32_t> AcmReceiver::GetPlayoutTimestamp() {
henrik.lundin9a410dd2016-04-06 01:39:22 -0700208 return neteq_->GetPlayoutTimestamp();
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000209}
210
henrik.lundinb3f1c5d2016-08-22 15:39:53 -0700211int AcmReceiver::FilteredCurrentDelayMs() const {
212 return neteq_->FilteredCurrentDelayMs();
213}
214
Henrik Lundinabbff892017-11-29 09:14:04 +0100215int AcmReceiver::TargetDelayMs() const {
216 return neteq_->TargetDelayMs();
217}
218
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100219absl::optional<std::pair<int, SdpAudioFormat>>
220 AcmReceiver::LastDecoder() const {
Tommi9090e0b2016-01-20 13:39:36 +0100221 rtc::CritScope lock(&crit_sect_);
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100222 if (!last_decoder_) {
223 return absl::nullopt;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000224 }
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100225 RTC_DCHECK_NE(-1, last_decoder_->first); // Payload type should be valid.
226 return last_decoder_;
ossue280cde2016-10-12 11:04:10 -0700227}
228
minyue@webrtc.orgc0bd7be2015-02-18 15:24:13 +0000229void AcmReceiver::GetNetworkStatistics(NetworkStatistics* acm_stat) {
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000230 NetEqNetworkStatistics neteq_stat;
231 // NetEq function always returns zero, so we don't check the return value.
232 neteq_->NetworkStatistics(&neteq_stat);
233
234 acm_stat->currentBufferSize = neteq_stat.current_buffer_size_ms;
235 acm_stat->preferredBufferSize = neteq_stat.preferred_buffer_size_ms;
turaj@webrtc.org532f3dc2013-09-19 00:12:23 +0000236 acm_stat->jitterPeaksFound = neteq_stat.jitter_peaks_found ? true : false;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000237 acm_stat->currentPacketLossRate = neteq_stat.packet_loss_rate;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000238 acm_stat->currentExpandRate = neteq_stat.expand_rate;
minyue@webrtc.orgc0bd7be2015-02-18 15:24:13 +0000239 acm_stat->currentSpeechExpandRate = neteq_stat.speech_expand_rate;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000240 acm_stat->currentPreemptiveRate = neteq_stat.preemptive_rate;
241 acm_stat->currentAccelerateRate = neteq_stat.accelerate_rate;
minyue@webrtc.orgc0bd7be2015-02-18 15:24:13 +0000242 acm_stat->currentSecondaryDecodedRate = neteq_stat.secondary_decoded_rate;
minyue-webrtc0c3ca752017-08-23 15:59:38 +0200243 acm_stat->currentSecondaryDiscardedRate = neteq_stat.secondary_discarded_rate;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000244 acm_stat->clockDriftPPM = neteq_stat.clockdrift_ppm;
henrik.lundin@webrtc.org20c71fd2014-04-22 10:11:21 +0000245 acm_stat->addedSamples = neteq_stat.added_zero_samples;
Henrik Lundin1bb8cf82015-08-25 13:08:04 +0200246 acm_stat->meanWaitingTimeMs = neteq_stat.mean_waiting_time_ms;
247 acm_stat->medianWaitingTimeMs = neteq_stat.median_waiting_time_ms;
248 acm_stat->minWaitingTimeMs = neteq_stat.min_waiting_time_ms;
249 acm_stat->maxWaitingTimeMs = neteq_stat.max_waiting_time_ms;
Steve Anton2dbc69f2017-08-24 17:15:13 -0700250
251 NetEqLifetimeStatistics neteq_lifetime_stat = neteq_->GetLifetimeStatistics();
252 acm_stat->totalSamplesReceived = neteq_lifetime_stat.total_samples_received;
253 acm_stat->concealedSamples = neteq_lifetime_stat.concealed_samples;
Gustaf Ullberg9a2e9062017-09-18 09:28:20 +0200254 acm_stat->concealmentEvents = neteq_lifetime_stat.concealment_events;
Gustaf Ullbergb0a02072017-10-02 12:00:34 +0200255 acm_stat->jitterBufferDelayMs = neteq_lifetime_stat.jitter_buffer_delay_ms;
Chen Xing0acffb52019-01-15 15:46:29 +0100256 acm_stat->jitterBufferEmittedCount =
257 neteq_lifetime_stat.jitter_buffer_emitted_count;
Jakob Ivarsson352ce5c2018-11-27 12:52:16 +0100258 acm_stat->delayedPacketOutageSamples =
259 neteq_lifetime_stat.delayed_packet_outage_samples;
Ruslan Burakov8af88962018-11-22 17:21:10 +0100260
261 NetEqOperationsAndState neteq_operations_and_state =
262 neteq_->GetOperationsAndState();
263 acm_stat->packetBufferFlushes =
264 neteq_operations_and_state.packet_buffer_flushes;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000265}
266
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000267int AcmReceiver::EnableNack(size_t max_nack_list_size) {
henrik.lundin48ed9302015-10-29 05:36:24 -0700268 neteq_->EnableNack(max_nack_list_size);
269 return 0;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000270}
271
272void AcmReceiver::DisableNack() {
henrik.lundin48ed9302015-10-29 05:36:24 -0700273 neteq_->DisableNack();
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000274}
275
276std::vector<uint16_t> AcmReceiver::GetNackList(
pkasting@chromium.org16825b12015-01-12 21:51:21 +0000277 int64_t round_trip_time_ms) const {
henrik.lundin48ed9302015-10-29 05:36:24 -0700278 return neteq_->GetNackList(round_trip_time_ms);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000279}
280
281void AcmReceiver::ResetInitialDelay() {
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000282 neteq_->SetMinimumDelay(0);
283 // TODO(turajs): Should NetEq Buffer be flushed?
284}
285
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000286uint32_t AcmReceiver::NowInTimestamp(int decoder_sampling_rate) const {
287 // Down-cast the time to (32-6)-bit since we only care about
288 // the least significant bits. (32-6) bits cover 2^(32-6) = 67108864 ms.
289 // We masked 6 most significant bits of 32-bit so there is no overflow in
290 // the conversion from milliseconds to timestamp.
Yves Gerey665174f2018-06-19 15:03:05 +0200291 const uint32_t now_in_ms =
292 static_cast<uint32_t>(clock_->TimeInMilliseconds() & 0x03ffffff);
293 return static_cast<uint32_t>((decoder_sampling_rate / 1000) * now_in_ms);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000294}
295
wu@webrtc.org24301a62013-12-13 19:17:43 +0000296void AcmReceiver::GetDecodingCallStatistics(
297 AudioDecodingCallStats* stats) const {
Tommi9090e0b2016-01-20 13:39:36 +0100298 rtc::CritScope lock(&crit_sect_);
wu@webrtc.org24301a62013-12-13 19:17:43 +0000299 *stats = call_stats_.GetDecodingStatistics();
300}
301
turaj@webrtc.org6d5d2482013-10-06 04:47:28 +0000302} // namespace acm2
303
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000304} // namespace webrtc