Blame - modules/audio_coding/acm2/audio_coding_module.cc - webrtc.googlesource.com/src

blob: 97a204ac4f9dba18e348fa928cecb66a7333506a [file] [log] [blame]

turaj@webrtc.org	7959e16	2013-09-12 18:30:26 +0000	[diff] [blame]	1	/*
				2	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	11	#include "modules/audio_coding/include/audio_coding_module.h"
turaj@webrtc.org	7959e16	2013-09-12 18:30:26 +0000	[diff] [blame]	12
Jonathan Yu	36344a0	2017-07-30 01:55:34 -0700	[diff] [blame]	13	#include <algorithm>
Yves Gerey	988cc08	2018-10-23 12:03:01 +0200	[diff] [blame]	14	#include <cstdint>
Jonathan Yu	36344a0	2017-07-30 01:55:34 -0700	[diff] [blame]	15
Niels Möller	2edab4c	2018-10-22 09:48:08 +0200	[diff] [blame]	16	#include "absl/strings/match.h"
Ali Tofigh	714e3cb	2022-07-20 12:53:07 +0200	[diff] [blame]	17	#include "absl/strings/string_view.h"
Yves Gerey	988cc08	2018-10-23 12:03:01 +0200	[diff] [blame]	18	#include "api/array_view.h"
Per Åhgren	4dd56a3	2019-11-19 21:00:59 +0100	[diff] [blame]	19	#include "modules/audio_coding/acm2/acm_remixing.h"
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	20	#include "modules/audio_coding/acm2/acm_resampler.h"
Fredrik Solenberg	bbf21a3	2018-04-12 22:44:09 +0200	[diff] [blame]	21	#include "modules/include/module_common_types.h"
Yves Gerey	988cc08	2018-10-23 12:03:01 +0200	[diff] [blame]	22	#include "modules/include/module_common_types_public.h"
				23	#include "rtc_base/buffer.h"
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	24	#include "rtc_base/checks.h"
				25	#include "rtc_base/logging.h"
Karl Wiberg	e40468b	2017-11-22 10:42:26 +0100	[diff] [blame]	26	#include "rtc_base/numerics/safe_conversions.h"
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	27	#include "rtc_base/synchronization/mutex.h"
Yves Gerey	988cc08	2018-10-23 12:03:01 +0200	[diff] [blame]	28	#include "rtc_base/thread_annotations.h"
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	29	#include "system_wrappers/include/metrics.h"
turaj@webrtc.org	7959e16	2013-09-12 18:30:26 +0000	[diff] [blame]	30
				31	namespace webrtc {
				32
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	33	namespace {
				34
// Initial size for the remix buffer in InputData. This matches 6 channels of
// 10 ms of 48 kHz data (480 samples per channel).
constexpr size_t kInitialInputDataBufferSize = 6 * 480;

// Highest input sample rate accepted by Add10MsDataInternal(); frames that
// report a higher rate are rejected.
constexpr int32_t kMaxInputSampleRateHz = 192000;
				40
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	41	class AudioCodingModuleImpl final : public AudioCodingModule {
				42	public:
Henrik Lundin	84f7569	2023-02-01 12:07:10 +0000	[diff] [blame]	43	explicit AudioCodingModuleImpl();
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	44	~AudioCodingModuleImpl() override;
				45
				46	/////////////////////////////////////////
				47	// Sender
				48	//
				49
kwiberg	24c7c12	2016-09-28 11:57:10 -0700	[diff] [blame]	50	void ModifyEncoder(rtc::FunctionView<void(std::unique_ptr<AudioEncoder>*)>
				51	modifier) override;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	52
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	53	// Register a transport callback which will be
				54	// called to deliver the encoded buffers.
				55	int RegisterTransportCallback(AudioPacketizationCallback* transport) override;
				56
				57	// Add 10 ms of raw (PCM) audio data to the encoder.
				58	int Add10MsData(const AudioFrame& audio_frame) override;
				59
				60	/////////////////////////////////////////
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	61	// (FEC) Forward Error Correction (codec internal)
				62	//
				63
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	64	// Set target packet loss rate
				65	int SetPacketLossRate(int loss_rate) override;
				66
				67	/////////////////////////////////////////
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	68	// Statistics
				69	//
				70
ivoc	e1198e0	2017-09-08 08:13:19 -0700	[diff] [blame]	71	ANAStats GetANAStats() const override;
				72
Jakob Ivarsson	bf08745	2021-11-11 13:43:49 +0100	[diff] [blame]	73	int GetTargetBitrate() const override;
				74
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	75	private:
				76	struct InputData {
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	77	InputData() : buffer(kInitialInputDataBufferSize) {}
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	78	uint32_t input_timestamp;
				79	const int16_t* audio;
				80	size_t length_per_channel;
				81	size_t audio_channel;
				82	// If a re-mix is required (up or down), this buffer will store a re-mixed
				83	// version of the input.
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	84	std::vector<int16_t> buffer;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	85	};
				86
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	87	InputData input_data_ RTC_GUARDED_BY(acm_mutex_);
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	88
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	89	// This member class writes values to the named UMA histogram, but only if
				90	// the value has changed since the last time (and always for the first call).
				91	class ChangeLogger {
				92	public:
Ali Tofigh	714e3cb	2022-07-20 12:53:07 +0200	[diff] [blame]	93	explicit ChangeLogger(absl::string_view histogram_name)
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	94	: histogram_name_(histogram_name) {}
				95	// Logs the new value if it is different from the last logged value, or if
				96	// this is the first call.
				97	void MaybeLog(int value);
				98
				99	private:
				100	int last_value_ = 0;
				101	int first_time_ = true;
				102	const std::string histogram_name_;
				103	};
				104
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	105	int Add10MsDataInternal(const AudioFrame& audio_frame, InputData* input_data)
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	106	RTC_EXCLUSIVE_LOCKS_REQUIRED(acm_mutex_);
Minyue Li	dea73ee	2020-02-18 15:45:41 +0100	[diff] [blame]	107
Artem Titov	d00ce74	2021-07-28 20:00:17 +0200	[diff] [blame]	108	// TODO(bugs.webrtc.org/10739): change `absolute_capture_timestamp_ms` to
Minyue Li	dea73ee	2020-02-18 15:45:41 +0100	[diff] [blame]	109	// int64_t when it always receives a valid value.
				110	int Encode(const InputData& input_data,
				111	absl::optional<int64_t> absolute_capture_timestamp_ms)
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	112	RTC_EXCLUSIVE_LOCKS_REQUIRED(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	113
Ali Tofigh	714e3cb	2022-07-20 12:53:07 +0200	[diff] [blame]	114	bool HaveValidEncoder(absl::string_view caller_name) const
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	115	RTC_EXCLUSIVE_LOCKS_REQUIRED(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	116
				117	// Preprocessing of input audio, including resampling and down-mixing if
				118	// required, before pushing audio into encoder's buffer.
				119	//
				120	// in_frame: input audio-frame
				121	// ptr_out: pointer to output audio_frame. If no preprocessing is required
Artem Titov	d00ce74	2021-07-28 20:00:17 +0200	[diff] [blame]	122	// `ptr_out` will be pointing to `in_frame`, otherwise pointing to
				123	// `preprocess_frame_`.
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	124	//
				125	// Return value:
				126	// -1: if encountering an error.
				127	// 0: otherwise.
				128	int PreprocessToAddData(const AudioFrame& in_frame,
				129	const AudioFrame** ptr_out)
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	130	RTC_EXCLUSIVE_LOCKS_REQUIRED(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	131
				132	// Change required states after starting to receive the codec corresponding
Artem Titov	d00ce74	2021-07-28 20:00:17 +0200	[diff] [blame]	133	// to `index`.
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	134	int UpdateUponReceivingCodec(int index);
				135
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	136	mutable Mutex acm_mutex_;
				137	rtc::Buffer encode_buffer_ RTC_GUARDED_BY(acm_mutex_);
				138	uint32_t expected_codec_ts_ RTC_GUARDED_BY(acm_mutex_);
				139	uint32_t expected_in_ts_ RTC_GUARDED_BY(acm_mutex_);
				140	acm2::ACMResampler resampler_ RTC_GUARDED_BY(acm_mutex_);
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	141	ChangeLogger bitrate_logger_ RTC_GUARDED_BY(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	142
Karl Wiberg	49c33ce	2018-11-12 14:21:58 +0100	[diff] [blame]	143	// Current encoder stack, provided by a call to RegisterEncoder.
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	144	std::unique_ptr<AudioEncoder> encoder_stack_ RTC_GUARDED_BY(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	145
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	146	// This is to keep track of CN instances where we can send DTMFs.
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	147	uint8_t previous_pltype_ RTC_GUARDED_BY(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	148
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	149	AudioFrame preprocess_frame_ RTC_GUARDED_BY(acm_mutex_);
				150	bool first_10ms_data_ RTC_GUARDED_BY(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	151
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	152	bool first_frame_ RTC_GUARDED_BY(acm_mutex_);
				153	uint32_t last_timestamp_ RTC_GUARDED_BY(acm_mutex_);
				154	uint32_t last_rtp_timestamp_ RTC_GUARDED_BY(acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	155
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	156	Mutex callback_mutex_;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	157	AudioPacketizationCallback* packetization_callback_
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	158	RTC_GUARDED_BY(callback_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	159
				160	int codec_histogram_bins_log_[static_cast<size_t>(
				161	AudioEncoder::CodecType::kMaxLoggedAudioCodecTypes)];
				162	int number_of_consecutive_empty_packets_;
				163	};
				164
				165	// Adds a codec usage sample to the histogram.
				166	void UpdateCodecTypeHistogram(size_t codec_type) {
				167	RTC_HISTOGRAM_ENUMERATION(
				168	"WebRTC.Audio.Encoder.CodecType", static_cast<int>(codec_type),
				169	static_cast<int>(
				170	webrtc::AudioEncoder::CodecType::kMaxLoggedAudioCodecTypes));
				171	}
				172
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	173	void AudioCodingModuleImpl::ChangeLogger::MaybeLog(int value) {
				174	if (value != last_value_ \|\| first_time_) {
				175	first_time_ = false;
				176	last_value_ = value;
				177	RTC_HISTOGRAM_COUNTS_SPARSE_100(histogram_name_, value);
				178	}
				179	}
				180
Henrik Lundin	84f7569	2023-02-01 12:07:10 +0000	[diff] [blame]	181	AudioCodingModuleImpl::AudioCodingModuleImpl()
solenberg	c7b4a45	2017-09-28 07:37:11 -0700	[diff] [blame]	182	: expected_codec_ts_(0xD87F3F9F),
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	183	expected_in_ts_(0xD87F3F9F),
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	184	bitrate_logger_("WebRTC.Audio.TargetBitrateInKbps"),
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	185	encoder_stack_(nullptr),
				186	previous_pltype_(255),
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	187	first_10ms_data_(false),
				188	first_frame_(true),
				189	packetization_callback_(NULL),
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	190	codec_histogram_bins_log_(),
				191	number_of_consecutive_empty_packets_(0) {
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	192	RTC_LOG(LS_INFO) << "Created";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	193	}
				194
				195	AudioCodingModuleImpl::~AudioCodingModuleImpl() = default;
				196
Minyue Li	dea73ee	2020-02-18 15:45:41 +0100	[diff] [blame]	197	int32_t AudioCodingModuleImpl::Encode(
				198	const InputData& input_data,
				199	absl::optional<int64_t> absolute_capture_timestamp_ms) {
				200	// TODO(bugs.webrtc.org/10739): add dcheck that
Artem Titov	cfea218	2021-08-10 01:22:31 +0200	[diff] [blame]	201	// `audio_frame.absolute_capture_timestamp_ms()` always has a value.
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	202	AudioEncoder::EncodedInfo encoded_info;
				203	uint8_t previous_pltype;
				204
				205	// Check if there is an encoder before.
				206	if (!HaveValidEncoder("Process"))
				207	return -1;
				208
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame]	209	if (!first_frame_) {
deadbeef	fcada90	2016-08-24 12:45:13 -0700	[diff] [blame]	210	RTC_DCHECK(IsNewerTimestamp(input_data.input_timestamp, last_timestamp_))
ossu	63fb95a	2016-07-06 09:34:22 -0700	[diff] [blame]	211	<< "Time should not move backwards";
				212	}
				213
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	214	// Scale the timestamp to the codec's RTP timestamp rate.
				215	uint32_t rtp_timestamp =
Karl Wiberg	053c371	2019-05-16 15:24:17 +0200	[diff] [blame]	216	first_frame_
				217	? input_data.input_timestamp
				218	: last_rtp_timestamp_ +
				219	rtc::dchecked_cast<uint32_t>(rtc::CheckedDivExact(
				220	int64_t{input_data.input_timestamp - last_timestamp_} *
				221	encoder_stack_->RtpTimestampRateHz(),
				222	int64_t{encoder_stack_->SampleRateHz()}));
Minyue Li	ff0e4db	2020-01-23 13:45:50 +0100	[diff] [blame]	223
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	224	last_timestamp_ = input_data.input_timestamp;
				225	last_rtp_timestamp_ = rtp_timestamp;
				226	first_frame_ = false;
				227
				228	// Clear the buffer before reuse - encoded data will get appended.
				229	encode_buffer_.Clear();
				230	encoded_info = encoder_stack_->Encode(
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame]	231	rtp_timestamp,
				232	rtc::ArrayView<const int16_t>(
				233	input_data.audio,
				234	input_data.audio_channel * input_data.length_per_channel),
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	235	&encode_buffer_);
				236
				237	bitrate_logger_.MaybeLog(encoder_stack_->GetTargetBitrate() / 1000);
				238	if (encode_buffer_.size() == 0 && !encoded_info.send_even_if_empty) {
				239	// Not enough data.
				240	return 0;
				241	}
				242	previous_pltype = previous_pltype_; // Read it while we have the critsect.
				243
				244	// Log codec type to histogram once every 500 packets.
				245	if (encoded_info.encoded_bytes == 0) {
				246	++number_of_consecutive_empty_packets_;
				247	} else {
				248	size_t codec_type = static_cast<size_t>(encoded_info.encoder_type);
				249	codec_histogram_bins_log_[codec_type] +=
				250	number_of_consecutive_empty_packets_ + 1;
				251	number_of_consecutive_empty_packets_ = 0;
				252	if (codec_histogram_bins_log_[codec_type] >= 500) {
				253	codec_histogram_bins_log_[codec_type] -= 500;
				254	UpdateCodecTypeHistogram(codec_type);
				255	}
				256	}
				257
Niels Möller	87e2d78	2019-03-07 10:18:23 +0100	[diff] [blame]	258	AudioFrameType frame_type;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	259	if (encode_buffer_.size() == 0 && encoded_info.send_even_if_empty) {
Niels Möller	c936cb6	2019-03-19 14:10:16 +0100	[diff] [blame]	260	frame_type = AudioFrameType::kEmptyFrame;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	261	encoded_info.payload_type = previous_pltype;
				262	} else {
kwiberg	af476c7	2016-11-28 15:21:39 -0800	[diff] [blame]	263	RTC_DCHECK_GT(encode_buffer_.size(), 0);
Niels Möller	c936cb6	2019-03-19 14:10:16 +0100	[diff] [blame]	264	frame_type = encoded_info.speech ? AudioFrameType::kAudioFrameSpeech
				265	: AudioFrameType::kAudioFrameCN;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	266	}
				267
				268	{
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	269	MutexLock lock(&callback_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	270	if (packetization_callback_) {
				271	packetization_callback_->SendData(
				272	frame_type, encoded_info.payload_type, encoded_info.encoded_timestamp,
Minyue Li	ff0e4db	2020-01-23 13:45:50 +0100	[diff] [blame]	273	encode_buffer_.data(), encode_buffer_.size(),
Minyue Li	dea73ee	2020-02-18 15:45:41 +0100	[diff] [blame]	274	absolute_capture_timestamp_ms.value_or(-1));
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	275	}
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	276	}
				277	previous_pltype_ = encoded_info.payload_type;
				278	return static_cast<int32_t>(encode_buffer_.size());
				279	}
				280
				281	/////////////////////////////////////////
				282	// Sender
				283	//
				284
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	285	void AudioCodingModuleImpl::ModifyEncoder(
kwiberg	24c7c12	2016-09-28 11:57:10 -0700	[diff] [blame]	286	rtc::FunctionView<void(std::unique_ptr<AudioEncoder>*)> modifier) {
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	287	MutexLock lock(&acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	288	modifier(&encoder_stack_);
				289	}
				290
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	291	// Register a transport callback which will be called to deliver
				292	// the encoded buffers.
				293	int AudioCodingModuleImpl::RegisterTransportCallback(
				294	AudioPacketizationCallback* transport) {
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	295	MutexLock lock(&callback_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	296	packetization_callback_ = transport;
				297	return 0;
				298	}
				299
				300	// Add 10MS of raw (PCM) audio data to the encoder.
				301	int AudioCodingModuleImpl::Add10MsData(const AudioFrame& audio_frame) {
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	302	MutexLock lock(&acm_mutex_);
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	303	int r = Add10MsDataInternal(audio_frame, &input_data_);
Minyue Li	dea73ee	2020-02-18 15:45:41 +0100	[diff] [blame]	304	// TODO(bugs.webrtc.org/10739): add dcheck that
Artem Titov	cfea218	2021-08-10 01:22:31 +0200	[diff] [blame]	305	// `audio_frame.absolute_capture_timestamp_ms()` always has a value.
Minyue Li	dea73ee	2020-02-18 15:45:41 +0100	[diff] [blame]	306	return r < 0
				307	? r
				308	: Encode(input_data_, audio_frame.absolute_capture_timestamp_ms());
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	309	}
				310
				311	int AudioCodingModuleImpl::Add10MsDataInternal(const AudioFrame& audio_frame,
				312	InputData* input_data) {
				313	if (audio_frame.samples_per_channel_ == 0) {
Artem Titov	d325196	2021-11-15 16:57:07 +0100	[diff] [blame]	314	RTC_DCHECK_NOTREACHED();
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	315	RTC_LOG(LS_ERROR) << "Cannot Add 10 ms audio, payload length is zero";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	316	return -1;
				317	}
				318
Per Åhgren	d82a02c	2020-03-12 11:53:30 +0100	[diff] [blame]	319	if (audio_frame.sample_rate_hz_ > kMaxInputSampleRateHz) {
Artem Titov	d325196	2021-11-15 16:57:07 +0100	[diff] [blame]	320	RTC_DCHECK_NOTREACHED();
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	321	RTC_LOG(LS_ERROR) << "Cannot Add 10 ms audio, input frequency not valid";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	322	return -1;
				323	}
				324
				325	// If the length and frequency matches. We currently just support raw PCM.
				326	if (static_cast<size_t>(audio_frame.sample_rate_hz_ / 100) !=
				327	audio_frame.samples_per_channel_) {
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	328	RTC_LOG(LS_ERROR)
Alex Loiko	300ec8c	2017-05-30 17:23:28 +0200	[diff] [blame]	329	<< "Cannot Add 10 ms audio, input frequency and length doesn't match";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	330	return -1;
				331	}
				332
Alex Loiko	6543881	2019-02-22 10:13:44 +0100	[diff] [blame]	333	if (audio_frame.num_channels_ != 1 && audio_frame.num_channels_ != 2 &&
				334	audio_frame.num_channels_ != 4 && audio_frame.num_channels_ != 6 &&
				335	audio_frame.num_channels_ != 8) {
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	336	RTC_LOG(LS_ERROR) << "Cannot Add 10 ms audio, invalid number of channels.";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	337	return -1;
				338	}
				339
				340	// Do we have a codec registered?
				341	if (!HaveValidEncoder("Add10MsData")) {
				342	return -1;
				343	}
				344
				345	const AudioFrame* ptr_frame;
				346	// Perform a resampling, also down-mix if it is required and can be
				347	// performed before resampling (a down mix prior to resampling will take
				348	// place if both primary and secondary encoders are mono and input is in
				349	// stereo).
				350	if (PreprocessToAddData(audio_frame, &ptr_frame) < 0) {
				351	return -1;
				352	}
				353
				354	// Check whether we need an up-mix or down-mix?
				355	const size_t current_num_channels = encoder_stack_->NumChannels();
				356	const bool same_num_channels =
				357	ptr_frame->num_channels_ == current_num_channels;
				358
yujo	36b1a5f	2017-06-12 12:45:32 -0700	[diff] [blame]	359	// TODO(yujo): Skip encode of muted frames.
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	360	input_data->input_timestamp = ptr_frame->timestamp_;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	361	input_data->length_per_channel = ptr_frame->samples_per_channel_;
				362	input_data->audio_channel = current_num_channels;
				363
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	364	if (!same_num_channels) {
				365	// Remixes the input frame to the output data and in the process resize the
				366	// output data if needed.
Per Åhgren	4dd56a3	2019-11-19 21:00:59 +0100	[diff] [blame]	367	ReMixFrame(*ptr_frame, current_num_channels, &input_data->buffer);
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	368
Artem Titov	d00ce74	2021-07-28 20:00:17 +0200	[diff] [blame]	369	// For pushing data to primary, point the `ptr_audio` to correct buffer.
Per Åhgren	4f2e940	2019-10-04 11:06:15 +0200	[diff] [blame]	370	input_data->audio = input_data->buffer.data();
				371	RTC_DCHECK_GE(input_data->buffer.size(),
				372	input_data->length_per_channel * input_data->audio_channel);
				373	} else {
				374	// When adding data to encoders this pointer is pointing to an audio buffer
				375	// with correct number of channels.
				376	input_data->audio = ptr_frame->data();
				377	}
				378
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	379	return 0;
				380	}
				381
				382	// Perform a resampling and down-mix if required. We down-mix only if
				383	// encoder is mono and input is stereo. In case of dual-streaming, both
				384	// encoders has to be mono for down-mix to take place.
				385	// \|*ptr_out\| will point to the pre-processed audio-frame. If no pre-processing
Artem Titov	d00ce74	2021-07-28 20:00:17 +0200	[diff] [blame]	386	// is required, \|*ptr_out\| points to `in_frame`.
yujo	36b1a5f	2017-06-12 12:45:32 -0700	[diff] [blame]	387	// TODO(yujo): Make this more efficient for muted frames.
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	388	int AudioCodingModuleImpl::PreprocessToAddData(const AudioFrame& in_frame,
				389	const AudioFrame** ptr_out) {
				390	const bool resample =
				391	in_frame.sample_rate_hz_ != encoder_stack_->SampleRateHz();
				392
				393	// This variable is true if primary codec and secondary codec (if exists)
				394	// are both mono and input is stereo.
				395	// TODO(henrik.lundin): This condition should probably be
				396	// in_frame.num_channels_ > encoder_stack_->NumChannels()
				397	const bool down_mix =
				398	in_frame.num_channels_ == 2 && encoder_stack_->NumChannels() == 1;
				399
				400	if (!first_10ms_data_) {
				401	expected_in_ts_ = in_frame.timestamp_;
				402	expected_codec_ts_ = in_frame.timestamp_;
				403	first_10ms_data_ = true;
				404	} else if (in_frame.timestamp_ != expected_in_ts_) {
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	405	RTC_LOG(LS_WARNING) << "Unexpected input timestamp: " << in_frame.timestamp_
				406	<< ", expected: " << expected_in_ts_;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	407	expected_codec_ts_ +=
				408	(in_frame.timestamp_ - expected_in_ts_) *
				409	static_cast<uint32_t>(
				410	static_cast<double>(encoder_stack_->SampleRateHz()) /
				411	static_cast<double>(in_frame.sample_rate_hz_));
				412	expected_in_ts_ = in_frame.timestamp_;
				413	}
				414
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	415	if (!down_mix && !resample) {
				416	// No pre-processing is required.
ossu	63fb95a	2016-07-06 09:34:22 -0700	[diff] [blame]	417	if (expected_in_ts_ == expected_codec_ts_) {
				418	// If we've never resampled, we can use the input frame as-is
				419	*ptr_out = &in_frame;
				420	} else {
				421	// Otherwise we'll need to alter the timestamp. Since in_frame is const,
				422	// we'll have to make a copy of it.
				423	preprocess_frame_.CopyFrom(in_frame);
				424	preprocess_frame_.timestamp_ = expected_codec_ts_;
				425	*ptr_out = &preprocess_frame_;
				426	}
				427
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	428	expected_in_ts_ += static_cast<uint32_t>(in_frame.samples_per_channel_);
				429	expected_codec_ts_ += static_cast<uint32_t>(in_frame.samples_per_channel_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	430	return 0;
				431	}
				432
				433	*ptr_out = &preprocess_frame_;
				434	preprocess_frame_.num_channels_ = in_frame.num_channels_;
Per Åhgren	4dd56a3	2019-11-19 21:00:59 +0100	[diff] [blame]	435	preprocess_frame_.samples_per_channel_ = in_frame.samples_per_channel_;
Per Åhgren	d82a02c	2020-03-12 11:53:30 +0100	[diff] [blame]	436	std::array<int16_t, AudioFrame::kMaxDataSizeSamples> audio;
				437	const int16_t* src_ptr_audio;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	438	if (down_mix) {
Per Åhgren	d82a02c	2020-03-12 11:53:30 +0100	[diff] [blame]	439	// If a resampling is required, the output of a down-mix is written into a
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	440	// local buffer, otherwise, it will be written to the output frame.
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame]	441	int16_t* dest_ptr_audio =
Per Åhgren	4dd56a3	2019-11-19 21:00:59 +0100	[diff] [blame]	442	resample ? audio.data() : preprocess_frame_.mutable_data();
Per Åhgren	d82a02c	2020-03-12 11:53:30 +0100	[diff] [blame]	443	RTC_DCHECK_GE(audio.size(), preprocess_frame_.samples_per_channel_);
Per Åhgren	4dd56a3	2019-11-19 21:00:59 +0100	[diff] [blame]	444	RTC_DCHECK_GE(audio.size(), in_frame.samples_per_channel_);
				445	DownMixFrame(in_frame,
				446	rtc::ArrayView<int16_t>(
				447	dest_ptr_audio, preprocess_frame_.samples_per_channel_));
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	448	preprocess_frame_.num_channels_ = 1;
Per Åhgren	d82a02c	2020-03-12 11:53:30 +0100	[diff] [blame]	449
				450	// Set the input of the resampler to the down-mixed signal.
Per Åhgren	4dd56a3	2019-11-19 21:00:59 +0100	[diff] [blame]	451	src_ptr_audio = audio.data();
Per Åhgren	d82a02c	2020-03-12 11:53:30 +0100	[diff] [blame]	452	} else {
				453	// Set the input of the resampler to the original data.
				454	src_ptr_audio = in_frame.data();
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	455	}
				456
				457	preprocess_frame_.timestamp_ = expected_codec_ts_;
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	458	preprocess_frame_.sample_rate_hz_ = in_frame.sample_rate_hz_;
				459	// If it is required, we have to do a resampling.
				460	if (resample) {
				461	// The result of the resampler is written to output frame.
yujo	36b1a5f	2017-06-12 12:45:32 -0700	[diff] [blame]	462	int16_t* dest_ptr_audio = preprocess_frame_.mutable_data();
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	463
				464	int samples_per_channel = resampler_.Resample10Msec(
				465	src_ptr_audio, in_frame.sample_rate_hz_, encoder_stack_->SampleRateHz(),
				466	preprocess_frame_.num_channels_, AudioFrame::kMaxDataSizeSamples,
				467	dest_ptr_audio);
				468
				469	if (samples_per_channel < 0) {
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	470	RTC_LOG(LS_ERROR) << "Cannot add 10 ms audio, resampling failed";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	471	return -1;
				472	}
				473	preprocess_frame_.samples_per_channel_ =
				474	static_cast<size_t>(samples_per_channel);
				475	preprocess_frame_.sample_rate_hz_ = encoder_stack_->SampleRateHz();
				476	}
				477
				478	expected_codec_ts_ +=
				479	static_cast<uint32_t>(preprocess_frame_.samples_per_channel_);
				480	expected_in_ts_ += static_cast<uint32_t>(in_frame.samples_per_channel_);
				481
				482	return 0;
				483	}
				484
				485	/////////////////////////////////////////
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	486	// (FEC) Forward Error Correction (codec internal)
				487	//
				488
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	489	int AudioCodingModuleImpl::SetPacketLossRate(int loss_rate) {
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	490	MutexLock lock(&acm_mutex_);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	491	if (HaveValidEncoder("SetPacketLossRate")) {
minyue	4b9a2cb	2016-11-30 06:49:59 -0800	[diff] [blame]	492	encoder_stack_->OnReceivedUplinkPacketLossFraction(loss_rate / 100.0);
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	493	}
				494	return 0;
				495	}
				496
				497	/////////////////////////////////////////
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	498	// Statistics
				499	//
				500
Ali Tofigh	714e3cb	2022-07-20 12:53:07 +0200	[diff] [blame]	501	bool AudioCodingModuleImpl::HaveValidEncoder(
				502	absl::string_view caller_name) const {
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	503	if (!encoder_stack_) {
Mirko Bonadei	675513b	2017-11-09 11:09:25 +0100	[diff] [blame]	504	RTC_LOG(LS_ERROR) << caller_name << " failed: No send codec is registered.";
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	505	return false;
				506	}
				507	return true;
				508	}
				509
ivoc	e1198e0	2017-09-08 08:13:19 -0700	[diff] [blame]	510	ANAStats AudioCodingModuleImpl::GetANAStats() const {
Markus Handell	0df0fae	2020-07-07 15:53:34 +0200	[diff] [blame]	511	MutexLock lock(&acm_mutex_);
ivoc	e1198e0	2017-09-08 08:13:19 -0700	[diff] [blame]	512	if (encoder_stack_)
				513	return encoder_stack_->GetANAStats();
				514	// If no encoder is set, return default stats.
				515	return ANAStats();
				516	}
				517
Jakob Ivarsson	bf08745	2021-11-11 13:43:49 +0100	[diff] [blame]	518	int AudioCodingModuleImpl::GetTargetBitrate() const {
				519	MutexLock lock(&acm_mutex_);
				520	if (!encoder_stack_) {
				521	return -1;
				522	}
				523	return encoder_stack_->GetTargetBitrate();
				524	}
				525
kwiberg	c13ded5	2016-06-17 06:00:45 -0700	[diff] [blame]	526	} // namespace
				527
Henrik Lundin	84f7569	2023-02-01 12:07:10 +0000	[diff] [blame]	528	std::unique_ptr<AudioCodingModule> AudioCodingModule::Create() {
				529	return std::make_unique<AudioCodingModuleImpl>();
kwiberg	36a4388	2016-08-29 05:33:32 -0700	[diff] [blame]	530	}
				531
turaj@webrtc.org	7959e16	2013-09-12 18:30:26 +0000	[diff] [blame]	532	} // namespace webrtc