blob: ea84036fb5a1598198e4d26eefbbf8d657ccb47d [file] [log] [blame]
turaj@webrtc.org7959e162013-09-12 18:30:26 +00001/*
2 * Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/audio_coding/acm2/acm_receiver.h"
turaj@webrtc.org7959e162013-09-12 18:30:26 +000012
Yves Gerey988cc082018-10-23 12:03:01 +020013#include <stdlib.h>
14#include <string.h>
15#include <cstdint>
turaj@webrtc.org7959e162013-09-12 18:30:26 +000016#include <vector>
17
Niels Möller2edab4c2018-10-22 09:48:08 +020018#include "absl/strings/match.h"
Yves Gerey988cc082018-10-23 12:03:01 +020019#include "api/audio/audio_frame.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020020#include "api/audio_codecs/audio_decoder.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "modules/audio_coding/acm2/acm_resampler.h"
22#include "modules/audio_coding/acm2/call_statistics.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020023#include "modules/audio_coding/neteq/include/neteq.h"
Yves Gerey988cc082018-10-23 12:03:01 +020024#include "modules/audio_coding/neteq/neteq_decoder_enum.h"
Fredrik Solenbergbbf21a32018-04-12 22:44:09 +020025#include "modules/include/module_common_types.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020026#include "rtc_base/checks.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020027#include "rtc_base/logging.h"
Karl Wiberge40468b2017-11-22 10:42:26 +010028#include "rtc_base/numerics/safe_conversions.h"
Jonas Olssonabbe8412018-04-03 13:40:05 +020029#include "rtc_base/strings/audio_format_to_string.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020030#include "system_wrappers/include/clock.h"
turaj@webrtc.org7959e162013-09-12 18:30:26 +000031
32namespace webrtc {
33
turaj@webrtc.org6d5d2482013-10-06 04:47:28 +000034namespace acm2 {
35
henrik.lundin@webrtc.org0bc9b5a2014-04-29 08:09:31 +000036AcmReceiver::AcmReceiver(const AudioCodingModule::Config& config)
kwiberg6f0f6162016-09-20 03:07:46 -070037 : last_audio_buffer_(new int16_t[AudioFrame::kMaxDataSizeSamples]),
ossue3525782016-05-25 07:37:43 -070038 neteq_(NetEq::Create(config.neteq_config, config.decoder_factory)),
henrik.lundin@webrtc.org0bc9b5a2014-04-29 08:09:31 +000039 clock_(config.clock),
henrik.lundin678c9032015-11-02 08:31:23 -080040 resampled_last_output_frame_(true) {
Henrik Lundin02ed2012017-06-08 09:03:55 +020041 RTC_DCHECK(clock_);
Henrik Lundin76c10672018-05-07 13:47:28 +020042 memset(last_audio_buffer_.get(), 0,
43 sizeof(int16_t) * AudioFrame::kMaxDataSizeSamples);
turaj@webrtc.org7959e162013-09-12 18:30:26 +000044}
45
Henrik Lundin6af93992017-06-14 14:13:02 +020046AcmReceiver::~AcmReceiver() = default;
turaj@webrtc.org7959e162013-09-12 18:30:26 +000047
48int AcmReceiver::SetMinimumDelay(int delay_ms) {
49 if (neteq_->SetMinimumDelay(delay_ms))
50 return 0;
Mirko Bonadei675513b2017-11-09 11:09:25 +010051 RTC_LOG(LERROR) << "AcmReceiver::SetExtraDelay " << delay_ms;
turaj@webrtc.org7959e162013-09-12 18:30:26 +000052 return -1;
53}
54
turaj@webrtc.org7959e162013-09-12 18:30:26 +000055int AcmReceiver::SetMaximumDelay(int delay_ms) {
56 if (neteq_->SetMaximumDelay(delay_ms))
57 return 0;
Mirko Bonadei675513b2017-11-09 11:09:25 +010058 RTC_LOG(LERROR) << "AcmReceiver::SetExtraDelay " << delay_ms;
turaj@webrtc.org7959e162013-09-12 18:30:26 +000059 return -1;
60}
61
Danil Chapovalovb6021232018-06-19 13:26:36 +020062absl::optional<int> AcmReceiver::last_packet_sample_rate_hz() const {
Tommi9090e0b2016-01-20 13:39:36 +010063 rtc::CritScope lock(&crit_sect_);
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +010064 if (!last_decoder_) {
65 return absl::nullopt;
66 }
67 return last_decoder_->second.clockrate_hz;
henrik.lundin057fb892015-11-23 08:19:52 -080068}
69
henrik.lundind89814b2015-11-23 06:49:25 -080070int AcmReceiver::last_output_sample_rate_hz() const {
71 return neteq_->last_output_sample_rate_hz();
turaj@webrtc.org7959e162013-09-12 18:30:26 +000072}
73
turaj@webrtc.org7959e162013-09-12 18:30:26 +000074int AcmReceiver::InsertPacket(const WebRtcRTPHeader& rtp_header,
kwibergee2bac22015-11-11 10:34:00 -080075 rtc::ArrayView<const uint8_t> incoming_payload) {
henrik.lundinb8c55b12017-05-10 07:38:01 -070076 if (incoming_payload.empty()) {
77 neteq_->InsertEmptyPacket(rtp_header.header);
78 return 0;
79 }
80
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +010081 const RTPHeader& header = rtp_header.header; // Just a shorthand.
82 int payload_type = header.payloadType;
83 auto format = neteq_->GetDecoderFormat(payload_type);
84 if (format && absl::EqualsIgnoreCase(format->name, "red")) {
85 // This is a RED packet. Get the format of the audio codec.
86 payload_type = incoming_payload[0] & 0x7f;
87 format = neteq_->GetDecoderFormat(payload_type);
88 }
89 if (!format) {
90 RTC_LOG_F(LS_ERROR) << "Payload-type "
91 << payload_type
92 << " is not registered.";
93 return -1;
94 }
95
turaj@webrtc.org7959e162013-09-12 18:30:26 +000096 {
Tommi9090e0b2016-01-20 13:39:36 +010097 rtc::CritScope lock(&crit_sect_);
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +010098 if (absl::EqualsIgnoreCase(format->name, "cn")) {
99 if (last_decoder_ && last_decoder_->second.num_channels > 1) {
kwiberg6f0f6162016-09-20 03:07:46 -0700100 // This is a CNG and the audio codec is not mono, so skip pushing in
101 // packets into NetEq.
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000102 return 0;
kwiberg6f0f6162016-09-20 03:07:46 -0700103 }
104 } else {
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100105 RTC_DCHECK(format);
106 last_decoder_ = std::make_pair(payload_type, *format);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000107 }
henrik.lundin@webrtc.orga90abde2014-06-09 18:35:11 +0000108 } // |crit_sect_| is released.
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000109
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100110 uint32_t receive_timestamp = NowInTimestamp(format->clockrate_hz);
111 if (neteq_->InsertPacket(header, incoming_payload, receive_timestamp) < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100112 RTC_LOG(LERROR) << "AcmReceiver::InsertPacket "
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100113 << static_cast<int>(header.payloadType)
Mirko Bonadei675513b2017-11-09 11:09:25 +0100114 << " Failed to insert packet";
henrik.lundin@webrtc.orgeecf5e62014-06-24 13:11:22 +0000115 return -1;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000116 }
117 return 0;
118}
119
henrik.lundin834a6ea2016-05-13 03:45:24 -0700120int AcmReceiver::GetAudio(int desired_freq_hz,
121 AudioFrame* audio_frame,
122 bool* muted) {
henrik.lundin63489782016-09-20 01:47:12 -0700123 RTC_DCHECK(muted);
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000124 // Accessing members, take the lock.
Tommi9090e0b2016-01-20 13:39:36 +0100125 rtc::CritScope lock(&crit_sect_);
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000126
henrik.lundin834a6ea2016-05-13 03:45:24 -0700127 if (neteq_->GetAudio(audio_frame, muted) != NetEq::kOK) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100128 RTC_LOG(LERROR) << "AcmReceiver::GetAudio - NetEq Failed.";
henrik.lundin@webrtc.orgeecf5e62014-06-24 13:11:22 +0000129 return -1;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000130 }
131
henrik.lundind89814b2015-11-23 06:49:25 -0800132 const int current_sample_rate_hz = neteq_->last_output_sample_rate_hz();
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000133
134 // Update if resampling is required.
henrik.lundind89814b2015-11-23 06:49:25 -0800135 const bool need_resampling =
136 (desired_freq_hz != -1) && (current_sample_rate_hz != desired_freq_hz);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000137
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000138 if (need_resampling && !resampled_last_output_frame_) {
139 // Prime the resampler with the last frame.
140 int16_t temp_output[AudioFrame::kMaxDataSizeSamples];
henrik.lundind89814b2015-11-23 06:49:25 -0800141 int samples_per_channel_int = resampler_.Resample10Msec(
142 last_audio_buffer_.get(), current_sample_rate_hz, desired_freq_hz,
henrik.lundin6d8e0112016-03-04 10:34:21 -0800143 audio_frame->num_channels_, AudioFrame::kMaxDataSizeSamples,
144 temp_output);
Peter Kastingdce40cf2015-08-24 14:52:23 -0700145 if (samples_per_channel_int < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100146 RTC_LOG(LERROR) << "AcmReceiver::GetAudio - "
147 "Resampling last_audio_buffer_ failed.";
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000148 return -1;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000149 }
150 }
151
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000152 // TODO(henrik.lundin) Glitches in the output may appear if the output rate
153 // from NetEq changes. See WebRTC issue 3923.
154 if (need_resampling) {
yujo36b1a5f2017-06-12 12:45:32 -0700155 // TODO(yujo): handle this more efficiently for muted frames.
henrik.lundind89814b2015-11-23 06:49:25 -0800156 int samples_per_channel_int = resampler_.Resample10Msec(
yujo36b1a5f2017-06-12 12:45:32 -0700157 audio_frame->data(), current_sample_rate_hz, desired_freq_hz,
henrik.lundin6d8e0112016-03-04 10:34:21 -0800158 audio_frame->num_channels_, AudioFrame::kMaxDataSizeSamples,
yujo36b1a5f2017-06-12 12:45:32 -0700159 audio_frame->mutable_data());
Peter Kastingdce40cf2015-08-24 14:52:23 -0700160 if (samples_per_channel_int < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100161 RTC_LOG(LERROR)
162 << "AcmReceiver::GetAudio - Resampling audio_buffer_ failed.";
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000163 return -1;
164 }
henrik.lundin6d8e0112016-03-04 10:34:21 -0800165 audio_frame->samples_per_channel_ =
166 static_cast<size_t>(samples_per_channel_int);
167 audio_frame->sample_rate_hz_ = desired_freq_hz;
168 RTC_DCHECK_EQ(
169 audio_frame->sample_rate_hz_,
kwibergd3edd772017-03-01 18:52:48 -0800170 rtc::dchecked_cast<int>(audio_frame->samples_per_channel_ * 100));
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000171 resampled_last_output_frame_ = true;
172 } else {
173 resampled_last_output_frame_ = false;
174 // We might end up here ONLY if codec is changed.
henrik.lundin@webrtc.org913f7b82014-10-21 06:54:23 +0000175 }
176
henrik.lundin6d8e0112016-03-04 10:34:21 -0800177 // Store current audio in |last_audio_buffer_| for next time.
yujo36b1a5f2017-06-12 12:45:32 -0700178 memcpy(last_audio_buffer_.get(), audio_frame->data(),
henrik.lundin6d8e0112016-03-04 10:34:21 -0800179 sizeof(int16_t) * audio_frame->samples_per_channel_ *
180 audio_frame->num_channels_);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000181
henrik.lundin63489782016-09-20 01:47:12 -0700182 call_stats_.DecodedByNetEq(audio_frame->speech_type_, *muted);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000183 return 0;
184}
185
kwiberg1c07c702017-03-27 07:15:49 -0700186void AcmReceiver::SetCodecs(const std::map<int, SdpAudioFormat>& codecs) {
187 neteq_->SetCodecs(codecs);
188}
189
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000190void AcmReceiver::FlushBuffers() {
191 neteq_->FlushBuffers();
192}
193
kwiberg6b19b562016-09-20 04:02:25 -0700194void AcmReceiver::RemoveAllCodecs() {
Tommi9090e0b2016-01-20 13:39:36 +0100195 rtc::CritScope lock(&crit_sect_);
kwiberg6b19b562016-09-20 04:02:25 -0700196 neteq_->RemoveAllPayloadTypes();
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100197 last_decoder_ = absl::nullopt;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000198}
199
Danil Chapovalovb6021232018-06-19 13:26:36 +0200200absl::optional<uint32_t> AcmReceiver::GetPlayoutTimestamp() {
henrik.lundin9a410dd2016-04-06 01:39:22 -0700201 return neteq_->GetPlayoutTimestamp();
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000202}
203
henrik.lundinb3f1c5d2016-08-22 15:39:53 -0700204int AcmReceiver::FilteredCurrentDelayMs() const {
205 return neteq_->FilteredCurrentDelayMs();
206}
207
Henrik Lundinabbff892017-11-29 09:14:04 +0100208int AcmReceiver::TargetDelayMs() const {
209 return neteq_->TargetDelayMs();
210}
211
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100212absl::optional<std::pair<int, SdpAudioFormat>>
213 AcmReceiver::LastDecoder() const {
Tommi9090e0b2016-01-20 13:39:36 +0100214 rtc::CritScope lock(&crit_sect_);
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100215 if (!last_decoder_) {
216 return absl::nullopt;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000217 }
Fredrik Solenbergf693bfa2018-12-11 12:22:10 +0100218 RTC_DCHECK_NE(-1, last_decoder_->first); // Payload type should be valid.
219 return last_decoder_;
ossue280cde2016-10-12 11:04:10 -0700220}
221
minyue@webrtc.orgc0bd7be2015-02-18 15:24:13 +0000222void AcmReceiver::GetNetworkStatistics(NetworkStatistics* acm_stat) {
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000223 NetEqNetworkStatistics neteq_stat;
224 // NetEq function always returns zero, so we don't check the return value.
225 neteq_->NetworkStatistics(&neteq_stat);
226
227 acm_stat->currentBufferSize = neteq_stat.current_buffer_size_ms;
228 acm_stat->preferredBufferSize = neteq_stat.preferred_buffer_size_ms;
turaj@webrtc.org532f3dc2013-09-19 00:12:23 +0000229 acm_stat->jitterPeaksFound = neteq_stat.jitter_peaks_found ? true : false;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000230 acm_stat->currentPacketLossRate = neteq_stat.packet_loss_rate;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000231 acm_stat->currentExpandRate = neteq_stat.expand_rate;
minyue@webrtc.orgc0bd7be2015-02-18 15:24:13 +0000232 acm_stat->currentSpeechExpandRate = neteq_stat.speech_expand_rate;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000233 acm_stat->currentPreemptiveRate = neteq_stat.preemptive_rate;
234 acm_stat->currentAccelerateRate = neteq_stat.accelerate_rate;
minyue@webrtc.orgc0bd7be2015-02-18 15:24:13 +0000235 acm_stat->currentSecondaryDecodedRate = neteq_stat.secondary_decoded_rate;
minyue-webrtc0c3ca752017-08-23 15:59:38 +0200236 acm_stat->currentSecondaryDiscardedRate = neteq_stat.secondary_discarded_rate;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000237 acm_stat->clockDriftPPM = neteq_stat.clockdrift_ppm;
henrik.lundin@webrtc.org20c71fd2014-04-22 10:11:21 +0000238 acm_stat->addedSamples = neteq_stat.added_zero_samples;
Henrik Lundin1bb8cf82015-08-25 13:08:04 +0200239 acm_stat->meanWaitingTimeMs = neteq_stat.mean_waiting_time_ms;
240 acm_stat->medianWaitingTimeMs = neteq_stat.median_waiting_time_ms;
241 acm_stat->minWaitingTimeMs = neteq_stat.min_waiting_time_ms;
242 acm_stat->maxWaitingTimeMs = neteq_stat.max_waiting_time_ms;
Steve Anton2dbc69f2017-08-24 17:15:13 -0700243
244 NetEqLifetimeStatistics neteq_lifetime_stat = neteq_->GetLifetimeStatistics();
245 acm_stat->totalSamplesReceived = neteq_lifetime_stat.total_samples_received;
246 acm_stat->concealedSamples = neteq_lifetime_stat.concealed_samples;
Gustaf Ullberg9a2e9062017-09-18 09:28:20 +0200247 acm_stat->concealmentEvents = neteq_lifetime_stat.concealment_events;
Gustaf Ullbergb0a02072017-10-02 12:00:34 +0200248 acm_stat->jitterBufferDelayMs = neteq_lifetime_stat.jitter_buffer_delay_ms;
Jakob Ivarsson352ce5c2018-11-27 12:52:16 +0100249 acm_stat->delayedPacketOutageSamples =
250 neteq_lifetime_stat.delayed_packet_outage_samples;
Ruslan Burakov8af88962018-11-22 17:21:10 +0100251
252 NetEqOperationsAndState neteq_operations_and_state =
253 neteq_->GetOperationsAndState();
254 acm_stat->packetBufferFlushes =
255 neteq_operations_and_state.packet_buffer_flushes;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000256}
257
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000258int AcmReceiver::EnableNack(size_t max_nack_list_size) {
henrik.lundin48ed9302015-10-29 05:36:24 -0700259 neteq_->EnableNack(max_nack_list_size);
260 return 0;
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000261}
262
263void AcmReceiver::DisableNack() {
henrik.lundin48ed9302015-10-29 05:36:24 -0700264 neteq_->DisableNack();
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000265}
266
267std::vector<uint16_t> AcmReceiver::GetNackList(
pkasting@chromium.org16825b12015-01-12 21:51:21 +0000268 int64_t round_trip_time_ms) const {
henrik.lundin48ed9302015-10-29 05:36:24 -0700269 return neteq_->GetNackList(round_trip_time_ms);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000270}
271
272void AcmReceiver::ResetInitialDelay() {
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000273 neteq_->SetMinimumDelay(0);
274 // TODO(turajs): Should NetEq Buffer be flushed?
275}
276
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000277uint32_t AcmReceiver::NowInTimestamp(int decoder_sampling_rate) const {
278 // Down-cast the time to (32-6)-bit since we only care about
279 // the least significant bits. (32-6) bits cover 2^(32-6) = 67108864 ms.
280 // We masked 6 most significant bits of 32-bit so there is no overflow in
281 // the conversion from milliseconds to timestamp.
Yves Gerey665174f2018-06-19 15:03:05 +0200282 const uint32_t now_in_ms =
283 static_cast<uint32_t>(clock_->TimeInMilliseconds() & 0x03ffffff);
284 return static_cast<uint32_t>((decoder_sampling_rate / 1000) * now_in_ms);
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000285}
286
wu@webrtc.org24301a62013-12-13 19:17:43 +0000287void AcmReceiver::GetDecodingCallStatistics(
288 AudioDecodingCallStats* stats) const {
Tommi9090e0b2016-01-20 13:39:36 +0100289 rtc::CritScope lock(&crit_sect_);
wu@webrtc.org24301a62013-12-13 19:17:43 +0000290 *stats = call_stats_.GetDecodingStatistics();
291}
292
turaj@webrtc.org6d5d2482013-10-06 04:47:28 +0000293} // namespace acm2
294
turaj@webrtc.org7959e162013-09-12 18:30:26 +0000295} // namespace webrtc