Blame - modules/audio_coding/include/audio_coding_module.h - webrtc.googlesource.com/src

blob: 31da3d46ab350f5627953e4f043c12916372046d [file] [log] [blame]

kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	1	/*
				2	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	11	#ifndef MODULES_AUDIO_CODING_INCLUDE_AUDIO_CODING_MODULE_H_
				12	#define MODULES_AUDIO_CODING_INCLUDE_AUDIO_CODING_MODULE_H_
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	13
#include <map>
#include <memory>
#include <string>
#include <utility>
#include <vector>
				18
Danil Chapovalov	b602123	2018-06-19 13:26:36 +0200	[diff] [blame]	19	#include "absl/types/optional.h"
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	20	#include "api/audio_codecs/audio_decoder_factory.h"
				21	#include "api/audio_codecs/audio_encoder.h"
Artem Titov	741daaf	2019-03-21 14:37:36 +0100	[diff] [blame]	22	#include "api/function_view.h"
Ivo Creusen	3ce44a3	2019-10-31 14:38:11 +0100	[diff] [blame]	23	#include "api/neteq/neteq.h"
Ivo Creusen	c3d1f9b	2019-11-01 11:47:51 +0100	[diff] [blame]	24	#include "api/neteq/neteq_factory.h"
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	25	#include "modules/audio_coding/include/audio_coding_module_typedefs.h"
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	26	#include "system_wrappers/include/clock.h"
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	27
				28	namespace webrtc {
				29
				30	// forward declarations
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	31	class AudioDecoder;
				32	class AudioEncoder;
				33	class AudioFrame;
Niels Möller	afb5dbb	2019-02-15 15:21:47 +0100	[diff] [blame]	34	struct RTPHeader;
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	35
				36	#define WEBRTC_10MS_PCM_AUDIO 960 // 16 bits super wideband 48 kHz
				37
				38	// Callback class used for sending data ready to be packetized
				39	class AudioPacketizationCallback {
				40	public:
				41	virtual ~AudioPacketizationCallback() {}
				42
Niels Möller	87e2d78	2019-03-07 10:18:23 +0100	[diff] [blame]	43	virtual int32_t SendData(AudioFrameType frame_type,
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	44	uint8_t payload_type,
				45	uint32_t timestamp,
				46	const uint8_t* payload_data,
Minyue Li	48655cf	2020-01-23 13:45:50 +0100	[diff] [blame^]	47	size_t payload_len_bytes,
				48	int64_t absolute_capture_timestamp_ms) {
				49	// TODO(bugs.webrtc.org/10739): Deprecate the old SendData and make this one
				50	// pure virtual.
				51	RTC_NOTREACHED() << "This method must be overridden, or not used.";
				52	return -1;
				53	}
				54	virtual int32_t SendData(AudioFrameType frame_type,
				55	uint8_t payload_type,
				56	uint32_t timestamp,
				57	const uint8_t* payload_data,
				58	size_t payload_len_bytes) {
				59	return SendData(frame_type, payload_type, timestamp, payload_data,
				60	payload_len_bytes, 0);
				61	}
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	62	};
				63
				64	// Callback class used for reporting VAD decision
				65	class ACMVADCallback {
				66	public:
				67	virtual ~ACMVADCallback() {}
				68
Niels Möller	87e2d78	2019-03-07 10:18:23 +0100	[diff] [blame]	69	virtual int32_t InFrameType(AudioFrameType frame_type) = 0;
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	70	};
				71
				72	class AudioCodingModule {
				73	protected:
				74	AudioCodingModule() {}
				75
				76	public:
				77	struct Config {
Karl Wiberg	5817d3d	2018-04-06 10:06:42 +0200	[diff] [blame]	78	explicit Config(
				79	rtc::scoped_refptr<AudioDecoderFactory> decoder_factory = nullptr);
kwiberg	36a4388	2016-08-29 05:33:32 -0700	[diff] [blame]	80	Config(const Config&);
				81	~Config();
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	82
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	83	NetEq::Config neteq_config;
				84	Clock* clock;
ossu	e352578	2016-05-25 07:37:43 -0700	[diff] [blame]	85	rtc::scoped_refptr<AudioDecoderFactory> decoder_factory;
Ivo Creusen	c3d1f9b	2019-11-01 11:47:51 +0100	[diff] [blame]	86	NetEqFactory* neteq_factory = nullptr;
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	87	};
				88
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	89	static AudioCodingModule* Create(const Config& config);
				90	virtual ~AudioCodingModule() = default;
				91
				92	///////////////////////////////////////////////////////////////////////////
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	93	// Sender
				94	//
				95
kwiberg	4cdbd57	2016-03-30 03:10:05 -0700	[diff] [blame]	96	// \|modifier\| is called exactly once with one argument: a pointer to the
				97	// unique_ptr that holds the current encoder (which is null if there is no
				98	// current encoder). For the duration of the call, \|modifier\| has exclusive
				99	// access to the unique_ptr; it may call the encoder, steal the encoder and
				100	// replace it with another encoder or with nullptr, etc.
				101	virtual void ModifyEncoder(
kwiberg	24c7c12	2016-09-28 11:57:10 -0700	[diff] [blame]	102	rtc::FunctionView<void(std::unique_ptr<AudioEncoder>*)> modifier) = 0;
kwiberg	4cdbd57	2016-03-30 03:10:05 -0700	[diff] [blame]	103
				104	// Utility method for simply replacing the existing encoder with a new one.
				105	void SetEncoder(std::unique_ptr<AudioEncoder> new_encoder) {
				106	ModifyEncoder([&](std::unique_ptr<AudioEncoder>* encoder) {
				107	*encoder = std::move(new_encoder);
				108	});
				109	}
				110
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	111	// int32_t RegisterTransportCallback()
				112	// Register a transport callback which will be called to deliver
				113	// the encoded buffers whenever Process() is called and a
				114	// bit-stream is ready.
				115	//
				116	// Input:
				117	// -transport : pointer to the callback class
				118	// transport->SendData() is called whenever
				119	// Process() is called and bit-stream is ready
				120	// to deliver.
				121	//
				122	// Return value:
				123	// -1 if the transport callback could not be registered
				124	// 0 if registration is successful.
				125	//
				126	virtual int32_t RegisterTransportCallback(
				127	AudioPacketizationCallback* transport) = 0;
				128
				129	///////////////////////////////////////////////////////////////////////////
				130	// int32_t Add10MsData()
				131	// Add 10MS of raw (PCM) audio data and encode it. If the sampling
				132	// frequency of the audio does not match the sampling frequency of the
				133	// current encoder ACM will resample the audio. If an encoded packet was
				134	// produced, it will be delivered via the callback object registered using
				135	// RegisterTransportCallback, and the return value from this function will
				136	// be the number of bytes encoded.
				137	//
				138	// Input:
				139	// -audio_frame : the input audio frame, containing raw audio
Fredrik Solenberg	bbf21a3	2018-04-12 22:44:09 +0200	[diff] [blame]	140	// sampling frequency etc.
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	141	//
				142	// Return value:
				143	// >= 0 number of bytes encoded.
				144	// -1 some error occurred.
				145	//
				146	virtual int32_t Add10MsData(const AudioFrame& audio_frame) = 0;
				147
				148	///////////////////////////////////////////////////////////////////////////
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	149	// int SetPacketLossRate()
				150	// Sets expected packet loss rate for encoding. Some encoders provide packet
				151	// loss gnostic encoding to make stream less sensitive to packet losses,
				152	// through e.g., FEC. No effects on codecs that do not provide such encoding.
				153	//
				154	// Input:
				155	// -packet_loss_rate : expected packet loss rate (0 -- 100 inclusive).
				156	//
				157	// Return value
				158	// -1 if failed to set packet loss rate,
				159	// 0 if succeeded.
				160	//
minyue	7e30432	2016-10-12 05:00:55 -0700	[diff] [blame]	161	// This is only used in test code that rely on old ACM APIs.
				162	// TODO(minyue): Remove it when possible.
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	163	virtual int SetPacketLossRate(int packet_loss_rate) = 0;
				164
				165	///////////////////////////////////////////////////////////////////////////
				166	// (VAD) Voice Activity Detection
				167	//
				168
				169	///////////////////////////////////////////////////////////////////////////
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	170	// int32_t RegisterVADCallback()
				171	// Call this method to register a callback function which is called
				172	// any time that ACM encounters an empty frame. That is a frame which is
				173	// recognized inactive. Depending on the codec WebRtc VAD or internal codec
				174	// VAD is employed to identify a frame as active/inactive.
				175	//
				176	// Input:
				177	// -vad_callback : pointer to a callback function.
				178	//
				179	// Return value:
				180	// -1 if failed to register the callback function.
				181	// 0 if the callback function is registered successfully.
				182	//
				183	virtual int32_t RegisterVADCallback(ACMVADCallback* vad_callback) = 0;
				184
				185	///////////////////////////////////////////////////////////////////////////
				186	// Receiver
				187	//
				188
				189	///////////////////////////////////////////////////////////////////////////
				190	// int32_t InitializeReceiver()
				191	// Any decoder-related state of ACM will be initialized to the
				192	// same state when ACM is created. This will not interrupt or
				193	// effect encoding functionality of ACM. ACM would lose all the
				194	// decoding-related settings by calling this function.
				195	// For instance, all registered codecs are deleted and have to be
				196	// registered again.
				197	//
				198	// Return value:
				199	// -1 if failed to initialize,
				200	// 0 if succeeded.
				201	//
				202	virtual int32_t InitializeReceiver() = 0;
				203
kwiberg	1c07c70	2017-03-27 07:15:49 -0700	[diff] [blame]	204	// Replace any existing decoders with the given payload type -> decoder map.
				205	virtual void SetReceiveCodecs(
				206	const std::map<int, SdpAudioFormat>& codecs) = 0;
				207
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	208	///////////////////////////////////////////////////////////////////////////
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	209	// int32_t IncomingPacket()
				210	// Call this function to insert a parsed RTP packet into ACM.
				211	//
				212	// Inputs:
				213	// -incoming_payload : received payload.
				214	// -payload_len_bytes : the length of payload in bytes.
				215	// -rtp_info : the relevant information retrieved from RTP
				216	// header.
				217	//
				218	// Return value:
				219	// -1 if failed to push in the payload
				220	// 0 if payload is successfully pushed in.
				221	//
				222	virtual int32_t IncomingPacket(const uint8_t* incoming_payload,
				223	const size_t payload_len_bytes,
Niels Möller	afb5dbb	2019-02-15 15:21:47 +0100	[diff] [blame]	224	const RTPHeader& rtp_header) = 0;
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	225
				226	///////////////////////////////////////////////////////////////////////////
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	227	// int32_t PlayoutData10Ms(
				228	// Get 10 milliseconds of raw audio data for playout, at the given sampling
				229	// frequency. ACM will perform a resampling if required.
				230	//
				231	// Input:
				232	// -desired_freq_hz : the desired sampling frequency, in Hertz, of the
				233	// output audio. If set to -1, the function returns
				234	// the audio at the current sampling frequency.
				235	//
				236	// Output:
				237	// -audio_frame : output audio frame which contains raw audio data
Fredrik Solenberg	bbf21a3	2018-04-12 22:44:09 +0200	[diff] [blame]	238	// and other relevant parameters.
henrik.lundin	834a6ea	2016-05-13 03:45:24 -0700	[diff] [blame]	239	// -muted : if true, the sample data in audio_frame is not
				240	// populated, and must be interpreted as all zero.
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	241	//
				242	// Return value:
				243	// -1 if the function fails,
				244	// 0 if the function succeeds.
				245	//
				246	virtual int32_t PlayoutData10Ms(int32_t desired_freq_hz,
henrik.lundin	834a6ea	2016-05-13 03:45:24 -0700	[diff] [blame]	247	AudioFrame* audio_frame,
				248	bool* muted) = 0;
				249
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	250	///////////////////////////////////////////////////////////////////////////
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	251	// statistics
				252	//
				253
				254	///////////////////////////////////////////////////////////////////////////
				255	// int32_t GetNetworkStatistics()
				256	// Get network statistics. Note that the internal statistics of NetEq are
				257	// reset by this call.
				258	//
				259	// Input:
				260	// -network_statistics : a structure that contains network statistics.
				261	//
				262	// Return value:
				263	// -1 if failed to set the network statistics,
				264	// 0 if statistics are set successfully.
				265	//
				266	virtual int32_t GetNetworkStatistics(
				267	NetworkStatistics* network_statistics) = 0;
				268
ivoc	e1198e0	2017-09-08 08:13:19 -0700	[diff] [blame]	269	virtual ANAStats GetANAStats() const = 0;
kjellander	3e6db23	2015-11-26 04:44:54 -0800	[diff] [blame]	270	};
				271
				272	} // namespace webrtc
				273
Mirko Bonadei	92ea95e	2017-09-15 06:47:31 +0200	[diff] [blame]	274	#endif // MODULES_AUDIO_CODING_INCLUDE_AUDIO_CODING_MODULE_H_